typeprof 0.14.0 → 0.15.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -73,9 +73,9 @@ module TypeProf
73
73
  else
74
74
  ty = Type::Instance.new(recv)
75
75
  end
76
- meths = scratch.get_method(recv, false, :initialize)
76
+ meths = scratch.get_method(recv, false, false, :initialize)
77
77
  meths.flat_map do |meth|
78
- meth.do_send(ty, :initialize, aargs, ep, env, scratch) do |ret_ty, ep, env|
78
+ meth.do_send(ty, :initialize, aargs, ep, env, scratch) do |_ret_ty, ep, env|
79
79
  ctn[ty, ep, env]
80
80
  end
81
81
  end
@@ -104,7 +104,7 @@ module TypeProf
104
104
  sym = get_sym("respond_to?", aargs.lead_tys[0], ep, scratch)
105
105
  if sym
106
106
  klass, singleton = recv.method_dispatch_info
107
- if scratch.get_method(klass, singleton, sym)
107
+ if scratch.get_method(klass, singleton, false, sym)
108
108
  true_val = Type::Instance.new(Type::Builtin[:true])
109
109
  ctn[true_val, ep, env]
110
110
  else
@@ -334,7 +334,7 @@ module TypeProf
334
334
  else
335
335
  aargs.lead_tys.each do |aarg|
336
336
  sym = get_sym("module_function", aarg, ep, scratch) or next
337
- meths = scratch.get_method(recv, false, sym)
337
+ meths = scratch.get_method(recv, false, false, sym)
338
338
  meths.each do |mdef|
339
339
  scratch.add_method(recv, sym, true, mdef)
340
340
  end
@@ -350,7 +350,7 @@ module TypeProf
350
350
  if recv.is_a?(Type::Class)
351
351
  aargs.lead_tys.each do |aarg|
352
352
  sym = get_sym("public", aarg, ep, scratch) or next
353
- meths = scratch.get_method(recv, false, sym)
353
+ meths = scratch.get_method(recv, false, false, sym)
354
354
  next unless meths
355
355
  meths.each do |mdef|
356
356
  mdef.pub_meth = true if mdef.respond_to?(:pub_meth=)
@@ -370,7 +370,7 @@ module TypeProf
370
370
  if recv.is_a?(Type::Class)
371
371
  aargs.lead_tys.each do |aarg|
372
372
  sym = get_sym("private", aarg, ep, scratch) or next
373
- meths = scratch.get_method(recv, false, sym)
373
+ meths = scratch.get_method(recv, false, false, sym)
374
374
  next unless meths
375
375
  meths.each do |mdef|
376
376
  mdef.pub_meth = false if mdef.respond_to?(:pub_meth=)
@@ -635,9 +635,6 @@ module TypeProf
635
635
  end
636
636
 
637
637
  def self.file_require(feature, scratch)
638
- return :done, :false if scratch.loaded_features[feature]
639
- scratch.loaded_features[feature] = true
640
-
641
638
  # XXX: dynamic RBS load is really needed?? Another idea:
642
639
  #
643
640
  # * RBS should be loaded in advance of analysis
@@ -653,7 +650,11 @@ module TypeProf
653
650
 
654
651
  begin
655
652
  filetype, path = $LOAD_PATH.resolve_feature_path(feature)
653
+
656
654
  if filetype == :rb
655
+ return :done, :false if scratch.loaded_files[path]
656
+ scratch.loaded_files[path] = true
657
+
657
658
  return :do, path if File.readable?(path)
658
659
 
659
660
  return :error, "failed to load: #{ path }"
@@ -714,13 +715,14 @@ module TypeProf
714
715
  return ctn[Type.any, ep, env]
715
716
  end
716
717
 
717
- if scratch.loaded_features[feature]
718
+ path = File.join(File.dirname(ep.ctx.iseq.absolute_path), feature) + ".rb" # XXX
719
+
720
+ if scratch.loaded_files[path]
718
721
  result = Type::Instance.new(Type::Builtin[:false])
719
722
  return ctn[result, ep, env]
720
723
  end
721
- scratch.loaded_features[feature] = true
724
+ scratch.loaded_files[path] = true
722
725
 
723
- path = File.join(File.dirname(ep.ctx.iseq.path), feature) + ".rb" # XXX
724
726
  return Builtin.file_load(path, ep, env, scratch, &ctn) if File.readable?(path)
725
727
 
726
728
  scratch.warn(ep, "failed to load: #{ path }")
@@ -811,6 +813,7 @@ module TypeProf
811
813
  Type::Builtin[:exc] = scratch.get_constant(klass_obj, :Exception)
812
814
  Type::Builtin[:encoding] = scratch.get_constant(klass_obj, :Encoding)
813
815
  Type::Builtin[:enumerator] = scratch.get_constant(klass_obj, :Enumerator)
816
+ Type::Builtin[:kernel] = scratch.get_constant(klass_obj, :Kernel)
814
817
 
815
818
  klass_vmcore = Type::Builtin[:vmcore]
816
819
  klass_ary = Type::Builtin[:ary]
@@ -823,6 +826,7 @@ module TypeProf
823
826
  scratch.set_custom_method(klass_vmcore, :"core#undef_method", Builtin.method(:vmcore_undef_method))
824
827
  scratch.set_custom_method(klass_vmcore, :"core#hash_merge_kwd", Builtin.method(:vmcore_hash_merge_kwd))
825
828
  scratch.set_custom_method(klass_vmcore, :"core#raise", Builtin.method(:vmcore_raise))
829
+
826
830
  scratch.set_custom_method(klass_vmcore, :lambda, Builtin.method(:lambda))
827
831
  scratch.set_singleton_custom_method(klass_obj, :"new", Builtin.method(:object_s_new))
828
832
  scratch.set_custom_method(klass_obj, :p, Builtin.method(:kernel_p), false)
@@ -878,6 +882,12 @@ module TypeProf
878
882
  str_ty = Type::Instance.new(Type::Builtin[:str])
879
883
  env_ty = Type.gen_hash {|h| h[str_ty] = Type.optional(str_ty) }
880
884
  scratch.add_constant(klass_obj, :ENV, env_ty, false)
885
+
886
+ scratch.search_method(Type::Builtin[:kernel], false, :sprintf) do |mdefs,|
887
+ mdefs.each do |mdef|
888
+ scratch.add_method(klass_vmcore, :"core#sprintf", false, mdef)
889
+ end
890
+ end
881
891
  end
882
892
  end
883
893
  end
data/lib/typeprof/cli.rb CHANGED
@@ -64,6 +64,7 @@ module TypeProf
64
64
  opt.separator "Advanced options:"
65
65
  opt.on("--[no-]stub-execution", "Force to call all unreachable methods with \"untyped\" arguments") {|v| options[:stub_execution] = v }
66
66
  opt.on("--type-depth-limit DEPTH", Integer, "Limit the maximum depth of nested types") {|v| options[:type_depth_limit] = v }
67
+ opt.on("--union-width-limit WIDTH", Integer, "Limit the maximum count of class instances in one union type") {|v| options[:union_width_limit] = v }
67
68
  opt.on("--debug", "Display analysis log (for debugging purpose)") { verbose = 2 }
68
69
  opt.on("--[no-]stackprof MODE", /\Acpu|wall|object\z/, "Enable stackprof (for debugging purpose)") {|v| options[:stackprof] = v.to_sym }
69
70
 
@@ -40,6 +40,7 @@ module TypeProf
40
40
  show_source_locations: false,
41
41
  stub_execution: true,
42
42
  type_depth_limit: 5,
43
+ union_width_limit: 10,
43
44
  stackprof: nil,
44
45
  }.merge(opt[:options])
45
46
  super(**opt)
@@ -98,7 +99,7 @@ module TypeProf
98
99
  if rb.is_a?(Array) # [String name, String content]
99
100
  iseq = ISeq.compile_str(*rb.reverse)
100
101
  else
101
- iseq = ISeq.compile(rb)
102
+ iseq = rb
102
103
  end
103
104
  scratch.add_entrypoint(iseq)
104
105
  end
@@ -69,14 +69,17 @@ module TypeProf
69
69
  end
70
70
 
71
71
  def show_gvars(scratch, gvars, output)
72
+ gvars = gvars.dump.filter_map do |gvar_name, entry|
73
+ if entry.type != Type.bot && !entry.rbs_declared
74
+ [gvar_name, entry]
75
+ end
76
+ end
72
77
  # A signature for global variables is not supported in RBS
73
- return if gvars.dump.empty?
78
+ return if gvars.empty?
74
79
 
75
80
  output.puts "# Global variables"
76
- gvars.dump.each do |gvar_name, entry|
77
- next if entry.type == Type.bot
78
- s = entry.rbs_declared ? "#" : ""
79
- output.puts s + "#{ gvar_name }: #{ entry.type.screen_name(scratch) }"
81
+ gvars.each do |gvar_name, entry|
82
+ output.puts "#{ gvar_name }: #{ entry.type.screen_name(scratch) }"
80
83
  end
81
84
  output.puts
82
85
  end
@@ -149,6 +152,7 @@ module TypeProf
149
152
  source_locations[key] ||= ctx.iseq.source_location(0)
150
153
  (methods[key] ||= []) << @scratch.show_method_signature(ctx)
151
154
  when AliasMethodDef
155
+ next if mdef.def_ep && Config.check_dir_filter(mdef.def_ep.source_location) == :exclude
152
156
  alias_name, orig_name = mid, mdef.orig_mid
153
157
  if singleton
154
158
  alias_name = "self.#{ alias_name }"
@@ -373,25 +373,30 @@ module TypeProf
373
373
  end
374
374
 
375
375
  def conv_block(rbs_block)
376
- type = rbs_block.type
376
+ blk = rbs_block.type
377
377
 
378
- # XXX
379
- raise NotImplementedError unless type.optional_keywords.empty?
380
- raise NotImplementedError unless type.required_keywords.empty?
381
- raise NotImplementedError if type.rest_keywords
382
-
383
- req = rbs_block.required
384
-
385
- lead_tys = type.required_positionals.map do |type|
386
- conv_type(type.type)
387
- end
388
- opt_tys = type.optional_positionals.map do |type|
389
- conv_type(type.type)
390
- end
378
+ lead_tys = blk.required_positionals.map {|type| conv_type(type.type) }
379
+ opt_tys = blk.optional_positionals.map {|type| conv_type(type.type) }
380
+ rest_ty = blk.rest_positionals
381
+ rest_ty = conv_type(rest_ty.type) if rest_ty
382
+ opt_kw_tys = blk.optional_keywords.to_h {|key, type| [key, conv_type(type.type)] }
383
+ req_kw_tys = blk.required_keywords.to_h {|key, type| [key, conv_type(type.type)] }
384
+ rest_kw_ty = blk.rest_keywords
385
+ rest_kw_ty = conv_type(rest_kw_ty.type) if rest_kw_ty
391
386
 
392
- ret_ty = conv_type(type.return_type)
387
+ ret_ty = conv_type(blk.return_type)
393
388
 
394
- [req, lead_tys, opt_tys, ret_ty]
389
+ {
390
+ required_block: rbs_block.required,
391
+ lead_tys: lead_tys,
392
+ opt_tys: opt_tys,
393
+ rest_ty: rest_ty,
394
+ req_kw_tys: req_kw_tys,
395
+ opt_kw_tys: opt_kw_tys,
396
+ rest_kw_ty: rest_kw_ty,
397
+ blk: blk,
398
+ ret_ty: ret_ty,
399
+ }
395
400
  end
396
401
 
397
402
  def conv_type(ty)
@@ -630,7 +635,13 @@ module TypeProf
630
635
  kw_tys = []
631
636
  req_kw_tys.each {|key, ty| kw_tys << [true, key, conv_type(ty)] }
632
637
  opt_kw_tys.each {|key, ty| kw_tys << [false, key, conv_type(ty)] }
633
- kw_rest_ty = conv_type(rest_kw_ty) if rest_kw_ty
638
+ if rest_kw_ty
639
+ ty = conv_type(rest_kw_ty)
640
+ kw_rest_ty = Type.gen_hash do |h|
641
+ k_ty = Type::Instance.new(Type::Builtin[:sym])
642
+ h[k_ty] = ty
643
+ end
644
+ end
634
645
 
635
646
  blks = conv_block(blk)
636
647
 
@@ -643,13 +654,36 @@ module TypeProf
643
654
 
644
655
  def conv_block(blk)
645
656
  return [Type.nil] unless blk
646
- req, lead_tys, opt_tys, ret_ty = blk
657
+
658
+ required_block = blk[:required_block]
659
+ lead_tys = blk[:lead_tys]
660
+ opt_tys = blk[:opt_tys]
661
+ rest_ty = blk[:rest_ty]
662
+ req_kw_tys = blk[:req_kw_tys]
663
+ opt_kw_tys = blk[:opt_kw_tys]
664
+ rest_kw_ty = blk[:rest_kw_ty]
665
+ ret_ty = blk[:ret_ty]
666
+
647
667
  lead_tys = lead_tys.map {|ty| conv_type(ty) }
648
668
  opt_tys = opt_tys.map {|ty| conv_type(ty) }
649
- msig = MethodSignature.new(lead_tys, opt_tys, nil, [], {}, nil, Type.nil)
669
+ rest_ty = conv_type(rest_ty) if rest_ty
670
+ kw_tys = []
671
+ req_kw_tys.each {|key, ty| kw_tys << [true, key, conv_type(ty)] }
672
+ opt_kw_tys.each {|key, ty| kw_tys << [false, key, conv_type(ty)] }
673
+ if rest_kw_ty
674
+ ty = conv_type(rest_kw_ty)
675
+ kw_rest_ty = Type.gen_hash do |h|
676
+ k_ty = Type::Instance.new(Type::Builtin[:sym])
677
+ h[k_ty] = ty
678
+ end
679
+ end
680
+
681
+ msig = MethodSignature.new(lead_tys, opt_tys, rest_ty, [], kw_tys, kw_rest_ty, Type.nil)
682
+
650
683
  ret_ty = conv_type(ret_ty)
684
+
651
685
  ret = [Type::Proc.new(TypedBlock.new(msig, ret_ty), Type::Builtin[:proc])]
652
- ret << Type.nil unless req
686
+ ret << Type.nil unless required_block
653
687
  ret
654
688
  end
655
689
 
@@ -694,7 +728,7 @@ module TypeProf
694
728
  end
695
729
  when :union
696
730
  tys = ty[1]
697
- Type::Union.new(Utils::Set[*tys.map {|ty2| conv_type(ty2) }], nil).normalize # XXX: Array and Hash support
731
+ Type::Union.create(Utils::Set[*tys.map {|ty2| conv_type(ty2) }], nil) # XXX: Array and Hash support
698
732
  when :var
699
733
  Type::Var.new(ty[1])
700
734
  when :proc
data/lib/typeprof/iseq.rb CHANGED
@@ -1,74 +1,67 @@
1
1
  module TypeProf
2
2
  class ISeq
3
- include Utils::StructuralEquality
4
-
5
- def self.compile(file)
6
- opt = RubyVM::InstructionSequence.compile_option
7
- opt[:inline_const_cache] = false
8
- opt[:peephole_optimization] = false
9
- opt[:specialized_instruction] = false
10
- opt[:operands_unification] = false
11
- opt[:coverage_enabled] = false
12
- new(RubyVM::InstructionSequence.compile_file(file, **opt).to_a)
3
+ # https://github.com/ruby/ruby/pull/4468
4
+ CASE_WHEN_CHECKMATCH = RubyVM::InstructionSequence.compile("case 1; when Integer; end").to_a.last.any? {|insn,| insn == :checkmatch }
5
+
6
+ class << self
7
+ def compile(file)
8
+ compile_core(nil, file)
9
+ end
10
+
11
+ def compile_str(str, path = nil)
12
+ compile_core(str, path)
13
+ end
14
+
15
+ private def compile_core(str, path)
16
+ opt = RubyVM::InstructionSequence.compile_option
17
+ opt[:inline_const_cache] = false
18
+ opt[:peephole_optimization] = false
19
+ opt[:specialized_instruction] = false
20
+ opt[:operands_unification] = false
21
+ opt[:coverage_enabled] = false
22
+
23
+ if str
24
+ iseq = RubyVM::InstructionSequence.compile(str, path, **opt)
25
+ else
26
+ iseq = RubyVM::InstructionSequence.compile_file(path, **opt)
27
+ end
28
+
29
+ return new(iseq.to_a)
30
+ end
13
31
  end
14
32
 
15
- def self.compile_str(str, path = nil)
16
- opt = RubyVM::InstructionSequence.compile_option
17
- opt[:inline_const_cache] = false
18
- opt[:peephole_optimization] = false
19
- opt[:specialized_instruction] = false
20
- opt[:operands_unification] = false
21
- opt[:coverage_enabled] = false
22
- new(RubyVM::InstructionSequence.compile(str, path, **opt).to_a)
33
+ Insn = Struct.new(:insn, :operands, :lineno)
34
+ class Insn
35
+ def check?(insn_cmp, operands_cmp = nil)
36
+ return insn == insn_cmp && (!operands_cmp || operands == operands_cmp)
37
+ end
23
38
  end
24
39
 
25
- FRESH_ID = [0]
40
+ ISEQ_FRESH_ID = [0]
26
41
 
27
42
  def initialize(iseq)
28
- @id = FRESH_ID[0]
29
- FRESH_ID[0] += 1
43
+ @id = (ISEQ_FRESH_ID[0] += 1)
30
44
 
31
45
  _magic, _major_version, _minor_version, _format_type, _misc,
32
46
  @name, @path, @absolute_path, @start_lineno, @type,
33
47
  @locals, @fargs_format, catch_table, insns = *iseq
34
48
 
35
- case @type
36
- when :method, :block
37
- if @fargs_format[:opt]
38
- label = @fargs_format[:opt].last
39
- i = insns.index(label) + 1
40
- else
41
- i = insns.find_index {|insn| insn.is_a?(Array) }
42
- end
43
- # skip keyword initialization
44
- while insns[i][0] == :checkkeyword
45
- raise if insns[i + 1][0] != :branchif
46
- label = insns[i + 1][1]
47
- i = insns.index(label) + 1
48
- end
49
- insns[i, 0] = [[:_iseq_body_start]]
50
- end
49
+ convert_insns(insns)
51
50
 
52
- # rescue/ensure clauses need to have a dedicated return addresses
53
- # because they requires to be virtually called.
54
- # So, this preprocess adds "nop" to make a new insn for their return addresses
55
- special_labels = {}
56
- catch_table.map do |type, iseq, first, last, cont, stack_depth|
57
- special_labels[cont] = true if type == :rescue || type == :ensure
58
- end
51
+ add_body_start_marker(insns)
52
+
53
+ add_exception_cont_marker(insns, catch_table)
59
54
 
60
- @insns = []
61
- @linenos = []
55
+ labels = create_label_table(insns)
62
56
 
63
- labels = setup_iseq(insns, special_labels)
57
+ @insns = setup_insns(insns, labels)
64
58
 
65
- # checkmatch->branch
66
- # send->branch
59
+ @fargs_format[:opt] = @fargs_format[:opt].map {|l| labels[l] } if @fargs_format[:opt]
67
60
 
68
61
  @catch_table = []
69
62
  catch_table.map do |type, iseq, first, last, cont, stack_depth|
70
63
  iseq = iseq ? ISeq.new(iseq) : nil
71
- target = labels[special_labels[cont] ? :"#{ cont }_special" : cont]
64
+ target = labels[cont]
72
65
  entry = [type, iseq, target, stack_depth]
73
66
  labels[first].upto(labels[last]) do |i|
74
67
  @catch_table[i] ||= []
@@ -76,43 +69,143 @@ module TypeProf
76
69
  end
77
70
  end
78
71
 
79
- merge_branches
72
+ rename_insn_types
73
+
74
+ unify_instructions
75
+ end
76
+
77
+ def source_location(pc)
78
+ "#{ @path }:#{ @insns[pc].lineno }"
79
+ end
80
+
81
+ attr_reader :name, :path, :absolute_path, :start_lineno, :type, :locals, :fargs_format, :catch_table, :insns
82
+ attr_reader :id
80
83
 
81
- analyze_stack
84
+ def pretty_print(q)
85
+ q.text "ISeq["
86
+ q.group do
87
+ q.nest(1) do
88
+ q.breakable ""
89
+ q.text "@type= #{ @type }"
90
+ q.breakable ", "
91
+ q.text "@name= #{ @name }"
92
+ q.breakable ", "
93
+ q.text "@path= #{ @path }"
94
+ q.breakable ", "
95
+ q.text "@absolute_path= #{ @absolute_path }"
96
+ q.breakable ", "
97
+ q.text "@start_lineno= #{ @start_lineno }"
98
+ q.breakable ", "
99
+ q.text "@fargs_format= #{ @fargs_format.inspect }"
100
+ q.breakable ", "
101
+ q.text "@insns="
102
+ q.group(2) do
103
+ @insns.each_with_index do |(insn, *operands), i|
104
+ q.breakable
105
+ q.group(2, "#{ i }: #{ insn.to_s }", "") do
106
+ q.pp operands
107
+ end
108
+ end
109
+ end
110
+ end
111
+ q.breakable
112
+ end
113
+ q.text "]"
82
114
  end
83
115
 
84
116
  def <=>(other)
85
117
  @id <=> other.id
86
118
  end
87
119
 
88
- def setup_iseq(insns, special_labels)
120
+ # Remove lineno entry and convert instructions to Insn instances
121
+ def convert_insns(insns)
122
+ ninsns = []
123
+ lineno = 0
124
+ insns.each do |e|
125
+ case e
126
+ when Integer # lineno
127
+ lineno = e
128
+ when Symbol # label or trace
129
+ ninsns << e
130
+ when Array
131
+ insn, *operands = e
132
+ ninsns << Insn.new(insn, operands, lineno)
133
+ else
134
+ raise "unknown iseq entry: #{ e }"
135
+ end
136
+ end
137
+ insns.replace(ninsns)
138
+ end
139
+
140
+ # Insert a dummy instruction "_iseq_body_start"
141
+ def add_body_start_marker(insns)
142
+ case @type
143
+ when :method, :block
144
+ # skip initialization code of optional arguments
145
+ if @fargs_format[:opt]
146
+ label = @fargs_format[:opt].last
147
+ i = insns.index(label) + 1
148
+ else
149
+ i = insns.find_index {|insn| insn.is_a?(Insn) }
150
+ end
151
+
152
+ # skip initialization code of keyword arguments
153
+ while insns[i][0] == :checkkeyword
154
+ raise if insns[i + 1].insn != :branchif
155
+ label = insns[i + 1].operands[0]
156
+ i = insns.index(label) + 1
157
+ end
158
+
159
+ insns.insert(i, Insn.new(:_iseq_body_start, [], @start_lineno))
160
+ end
161
+ end
162
+
163
+ # Insert "nop" instruction to continuation point of exception handlers
164
+ def add_exception_cont_marker(insns, catch_table)
165
+ # rescue/ensure clauses need to have a dedicated return addresses
166
+ # because they requires to be virtually called.
167
+ # So, this preprocess adds "nop" to make a new insn for their return addresses
168
+ exception_cont_labels = {}
169
+ catch_table.map! do |type, iseq, first, last, cont, stack_depth|
170
+ if type == :rescue || type == :ensure
171
+ exception_cont_labels[cont] = true
172
+ cont = :"#{ cont }_exception_cont"
173
+ end
174
+ [type, iseq, first, last, cont, stack_depth]
175
+ end
176
+
89
177
  i = 0
178
+ while i < insns.size
179
+ e = insns[i]
180
+ if exception_cont_labels[e]
181
+ insns.insert(i, :"#{ e }_exception_cont", Insn.new(:nop, []))
182
+ i += 2
183
+ end
184
+ i += 1
185
+ end
186
+ end
187
+
188
+ def create_label_table(insns)
189
+ pc = 0
90
190
  labels = {}
91
- ninsns = []
92
191
  insns.each do |e|
93
- if e.is_a?(Symbol) && e.to_s.start_with?("label")
94
- if special_labels[e]
95
- labels[:"#{ e }_special"] = i
96
- ninsns << [:nop]
97
- i += 1
98
- end
99
- labels[e] = i
192
+ if e.is_a?(Symbol)
193
+ labels[e] = pc
100
194
  else
101
- i += 1 if e.is_a?(Array)
102
- ninsns << e
195
+ pc += 1
103
196
  end
104
197
  end
198
+ labels
199
+ end
105
200
 
106
- lineno = 0
107
- ninsns.each do |e|
201
+ def setup_insns(insns, labels)
202
+ ninsns = []
203
+ insns.each do |e|
108
204
  case e
109
- when Integer # lineno
110
- lineno = e
111
205
  when Symbol # label or trace
112
206
  nil
113
- when Array
114
- insn, *operands = e
115
- operands = (INSN_TABLE[insn] || []).zip(operands).map do |type, operand|
207
+ when Insn
208
+ operands = (INSN_TABLE[e.insn] || []).zip(e.operands).map do |type, operand|
116
209
  case type
117
210
  when "ISEQ"
118
211
  operand && ISeq.new(operand)
@@ -128,81 +221,64 @@ module TypeProf
128
221
  end
129
222
  end
130
223
 
131
- @insns << [insn, operands]
132
- @linenos << lineno
224
+ ninsns << Insn.new(e.insn, operands, e.lineno)
133
225
  else
134
226
  raise "unknown iseq entry: #{ e }"
135
227
  end
136
228
  end
137
-
138
- @fargs_format[:opt] = @fargs_format[:opt].map {|l| labels[l] } if @fargs_format[:opt]
139
-
140
- labels
229
+ ninsns
141
230
  end
142
231
 
143
- def merge_branches
144
- @insns.size.times do |i|
145
- insn, operands = @insns[i]
146
- case insn
232
+ def rename_insn_types
233
+ @insns.each do |insn|
234
+ case insn.insn
147
235
  when :branchif
148
- @insns[i] = [:branch, [:if] + operands]
236
+ insn.insn, insn.operands = :branch, [:if] + insn.operands
149
237
  when :branchunless
150
- @insns[i] = [:branch, [:unless] + operands]
238
+ insn.insn, insn.operands = :branch, [:unless] + insn.operands
151
239
  when :branchnil
152
- @insns[i] = [:branch, [:nil] + operands]
240
+ insn.insn, insn.operands = :branch, [:nil] + insn.operands
241
+ when :getblockparam, :getblockparamproxy
242
+ insn.insn = :getlocal
153
243
  end
154
244
  end
155
245
  end
156
246
 
157
- def source_location(pc)
158
- "#{ @path }:#{ @linenos[pc] }"
159
- end
160
-
161
- attr_reader :name, :path, :absolute_path, :start_lineno, :type, :locals, :fargs_format, :catch_table, :insns, :linenos
162
- attr_reader :id
247
+ # Unify some instructions for flow-sensitive analysis
248
+ def unify_instructions
249
+ # This method rewrites instructions to enable flow-sensitive analysis.
250
+ #
251
+ # Consider `if x; ...; else; ... end`.
252
+ # When the variable `x` is of type "Integer | nil",
253
+ # we want to make sure that `x` is "Integer" in then clause.
254
+ # So, we need to split the environment to two ones:
255
+ # one is that `x` is of type "Integer", and the other is that
256
+ # `x` is type "nil".
257
+ #
258
+ # However, `if x` is compiled to "getlocal; branch".
259
+ # TypeProf evaluates them as follows:
260
+ #
261
+ # * "getlocal" pushes the value of `x` to the stack, amd
262
+ # * "branch" checks the value on the top of the stack
263
+ #
264
+ # TypeProf does not keep where the value comes from, so
265
+ # it is difficult to split the environment when evaluating "branch".
266
+ #
267
+ # This method rewrites "getlocal; branch" to "nop; getlocal_branch".
268
+ # The two instructions are unified to "getlocal_branch" instruction,
269
+ # so TypeProf can split the environment.
270
+ #
271
+ # This is a very fragile appoach because it highly depends on the compiler of Ruby.
163
272
 
164
- def pretty_print(q)
165
- q.text "ISeq["
166
- q.group do
167
- q.nest(1) do
168
- q.breakable ""
169
- q.text "@type= #{ @type }"
170
- q.breakable ", "
171
- q.text "@name= #{ @name }"
172
- q.breakable ", "
173
- q.text "@path= #{ @path }"
174
- q.breakable ", "
175
- q.text "@absolute_path= #{ @absolute_path }"
176
- q.breakable ", "
177
- q.text "@start_lineno= #{ @start_lineno }"
178
- q.breakable ", "
179
- q.text "@fargs_format= #{ @fargs_format.inspect }"
180
- q.breakable ", "
181
- q.text "@insns="
182
- q.group(2) do
183
- @insns.each_with_index do |(insn, *operands), i|
184
- q.breakable
185
- q.group(2, "#{ i }: #{ insn.to_s }", "") do
186
- q.pp operands
187
- end
188
- end
189
- end
190
- end
191
- q.breakable
192
- end
193
- q.text "]"
194
- end
195
-
196
- def analyze_stack
197
273
  # gather branch targets
198
274
  # TODO: catch_table should be also considered
199
275
  branch_targets = {}
200
- @insns.each do |insn, operands|
201
- case insn
276
+ @insns.each do |insn|
277
+ case insn.insn
202
278
  when :branch
203
- branch_targets[operands[1]] = true
279
+ branch_targets[insn.operands[1]] = true
204
280
  when :jump
205
- branch_targets[operands[0]] = true
281
+ branch_targets[insn.operands[0]] = true
206
282
  end
207
283
  end
208
284
 
@@ -210,27 +286,29 @@ module TypeProf
210
286
  # find a pattern: getlocal, (dup, putobject(true), getconstant(class name), checkmatch, branch)* for ..Ruby 3.0
211
287
  # find a pattern: getlocal, (putobject(true), getconstant(class name), top(1), send(===), branch)* for Ruby 3.1..
212
288
  case_branch_list = []
213
- if (RUBY_VERSION.split(".") <=> %w(3 1 0)) < 0
289
+ if CASE_WHEN_CHECKMATCH
214
290
  (@insns.size - 1).times do |i|
215
- insn0, getlocal_operands = @insns[i]
216
- next unless [:getlocal, :getblockparam, :getblockparamproxy].include?(insn0) && getlocal_operands[1] == 0
291
+ insn = @insns[i]
292
+ next unless insn.insn == :getlocal && insn.operands[1] == 0
293
+ getlocal_operands = insn.operands
217
294
  nops = [i]
218
295
  new_insns = []
219
296
  j = i + 1
220
297
  while true
221
- case @insns[j]
222
- when [:dup, []]
223
- break unless @insns[j + 1] == [:putnil, []]
224
- break unless @insns[j + 2] == [:putobject, [true]]
225
- break unless @insns[j + 3][0] == :getconstant # TODO: support A::B::C
226
- break unless @insns[j + 4] == [:checkmatch, [2]]
227
- break unless @insns[j + 5][0] == :branch
228
- target_pc = @insns[j + 5][1][1]
229
- break unless @insns[target_pc] == [:pop, []]
298
+ case @insns[j].insn
299
+ when :dup
300
+ break unless @insns[j + 1].check?(:putnil, [])
301
+ break unless @insns[j + 2].check?(:putobject, [true])
302
+ break unless @insns[j + 3].check?(:getconstant) # TODO: support A::B::C
303
+ break unless @insns[j + 4].check?(:checkmatch, [2])
304
+ break unless @insns[j + 5].check?(:branch)
305
+ target_pc = @insns[j + 5].operands[1]
306
+ break unless @insns[target_pc].check?(:pop, [])
230
307
  nops << j << (j + 4) << target_pc
231
- new_insns << [j + 5, [:getlocal_checkmatch_branch, [getlocal_operands, @insns[j + 5][1]]]]
308
+ branch_operands = @insns[j + 5][1]
309
+ new_insns << [j + 5, Insn.new(:getlocal_checkmatch_branch, [getlocal_operands, branch_operands])]
232
310
  j += 6
233
- when [:pop, []]
311
+ when :pop
234
312
  nops << j
235
313
  case_branch_list << [nops, new_insns]
236
314
  break
@@ -241,25 +319,28 @@ module TypeProf
241
319
  end
242
320
  else
243
321
  (@insns.size - 1).times do |i|
244
- insn0, getlocal_operands = @insns[i]
245
- next unless [:getlocal, :getblockparam, :getblockparamproxy].include?(insn0) && getlocal_operands[1] == 0
322
+ insn = @insns[i]
323
+ next unless insn.insn == :getlocal && insn.operands[1] == 0
324
+ getlocal_operands = insn.operands
246
325
  nops = []
247
326
  new_insns = []
248
327
  j = i + 1
249
328
  while true
250
- case @insns[j]
251
- when [:putnil, []]
252
- break unless @insns[j + 1] == [:putobject, [true]]
253
- break unless @insns[j + 2][0] == :getconstant # TODO: support A::B::C
254
- break unless @insns[j + 3] == [:topn, [1]]
255
- break unless @insns[j + 4] == [:send, [{:mid=>:===, :flag=>20, :orig_argc=>1}, nil]]
256
- break unless @insns[j + 5][0] == :branch
257
- target_pc = @insns[j + 5][1][1]
258
- break unless @insns[target_pc] == [:pop, []]
329
+ insn = @insns[j]
330
+ if insn.check?(:putnil, [])
331
+ break unless @insns[j + 1].check?(:putobject, [true])
332
+ break unless @insns[j + 2].check?(:getconstant) # TODO: support A::B::C
333
+ break unless @insns[j + 3].check?(:topn, [1])
334
+ break unless @insns[j + 4].check?(:send, [{:mid=>:===, :flag=>20, :orig_argc=>1}, nil])
335
+ break unless @insns[j + 5].check?(:branch)
336
+ target_pc = @insns[j + 5].operands[1]
337
+ break unless @insns[target_pc].check?(:pop, [])
259
338
  nops << (j + 4) #<< target_pc
260
- new_insns << [j + 5, [:arg_getlocal_send_branch, [getlocal_operands, @insns[j + 4][1], @insns[j + 5][1]]]]
339
+ send_operands = @insns[j + 4][1]
340
+ branch_operands = @insns[j + 5][1]
341
+ new_insns << [j + 5, Insn.new(:arg_getlocal_send_branch, [getlocal_operands, send_operands, branch_operands])]
261
342
  j += 6
262
- when [:pop, []]
343
+ elsif insn.check?(:pop, [])
263
344
  #nops << j
264
345
  case_branch_list << [nops, new_insns]
265
346
  break
@@ -270,15 +351,15 @@ module TypeProf
270
351
  end
271
352
  end
272
353
  case_branch_list.each do |nops, new_insns|
273
- nops.each {|i| @insns[i] = [:nop, []] }
354
+ nops.each {|i| @insns[i] = Insn.new(:nop, []) }
274
355
  new_insns.each {|i, insn| @insns[i] = insn }
275
356
  end
276
357
 
277
358
  # find a pattern: getlocal(recv), ..., send (is_a?, respond_to?), branch
278
359
  recv_getlocal_send_branch_list = []
279
360
  (@insns.size - 1).times do |i|
280
- insn, operands = @insns[i]
281
- if insn == :getlocal && operands[1] == 0
361
+ insn = @insns[i]
362
+ if insn.insn == :getlocal && insn.operands[1] == 0
282
363
  j = i + 1
283
364
  sp = 1
284
365
  while @insns[j]
@@ -294,94 +375,118 @@ module TypeProf
294
375
  end
295
376
  recv_getlocal_send_branch_list.each do |i, j|
296
377
  next if (i + 1 .. j + 1).any? {|i| branch_targets[i] }
297
- _insn, getlocal_operands = @insns[i]
298
- _insn, send_operands = @insns[j]
299
- _insn, branch_operands = @insns[j + 1]
300
- @insns[j] = [:nop]
301
- @insns[j + 1] = [:recv_getlocal_send_branch, [getlocal_operands, send_operands, branch_operands]]
378
+ getlocal_operands = @insns[i].operands
379
+ send_operands = @insns[j].operands
380
+ branch_operands = @insns[j + 1].operands
381
+ @insns[j] = Insn.new(:nop, [])
382
+ @insns[j + 1] = Insn.new(:recv_getlocal_send_branch, [getlocal_operands, send_operands, branch_operands])
302
383
  end
303
384
 
304
385
  # find a pattern: getlocal, send (===), branch
305
386
  arg_getlocal_send_branch_list = []
306
387
  (@insns.size - 1).times do |i|
307
- insn1, operands1 = @insns[i]
308
- next unless insn1 == :getlocal && operands1[1] == 0
309
- insn2, operands2 = @insns[i + 1]
310
- next unless insn2 == :send
311
- send_opt = operands2[0]
312
- next unless send_opt[:flag] == 16 && send_opt[:orig_argc] == 1
313
- insn3, _operands3 = @insns[i + 2]
314
- next unless insn3 == :branch
388
+ insn1 = @insns[i]
389
+ next unless insn1.insn == :getlocal && insn1.operands[1] == 0
390
+ insn2 = @insns[i + 1]
391
+ next unless insn2.insn == :send
392
+ send_operands = insn2.operands[0]
393
+ next unless send_operands[:flag] == 16 && send_operands[:orig_argc] == 1
394
+ insn3 = @insns[i + 2]
395
+ next unless insn3.insn == :branch
315
396
  arg_getlocal_send_branch_list << i
316
397
  end
317
398
  arg_getlocal_send_branch_list.each do |i|
318
399
  next if (i .. i + 2).any? {|i| branch_targets[i] }
319
- _insn, getlocal_operands = @insns[i]
320
- _insn, send_operands = @insns[i + 1]
321
- _insn, branch_operands = @insns[i + 2]
322
- @insns[i + 1] = [:nop]
323
- @insns[i + 2] = [:arg_getlocal_send_branch, [getlocal_operands, send_operands, branch_operands]]
400
+ getlocal_operands = @insns[i].operands
401
+ send_operands = @insns[i + 1].operands
402
+ branch_operands = @insns[i + 2].operands
403
+ @insns[i + 1] = Insn.new(:nop, [])
404
+ @insns[i + 2] = Insn.new(:arg_getlocal_send_branch, [getlocal_operands, send_operands, branch_operands])
324
405
  end
325
406
 
326
407
  # find a pattern: send (block_given?), branch
327
408
  send_branch_list = []
328
409
  (@insns.size - 1).times do |i|
329
- insn, _operands = @insns[i]
330
- if insn == :send
331
- insn, _operands = @insns[i + 1]
332
- if insn == :branch
410
+ insn = @insns[i]
411
+ if insn.insn == :send
412
+ insn = @insns[i + 1]
413
+ if insn.insn == :branch
333
414
  send_branch_list << i
334
415
  end
335
416
  end
336
417
  end
337
418
  send_branch_list.each do |i|
338
419
  next if branch_targets[i + 1]
339
- _insn, send_operands = @insns[i]
340
- _insn, branch_operands = @insns[i + 1]
341
- @insns[i] = [:nop]
342
- @insns[i + 1] = [:send_branch, [send_operands, branch_operands]]
420
+ send_operands = @insns[i].operands
421
+ branch_operands = @insns[i + 1].operands
422
+ @insns[i] = Insn.new(:nop, [])
423
+ @insns[i + 1] = Insn.new(:send_branch, [send_operands, branch_operands])
343
424
  end
344
425
 
345
426
  # find a pattern: getlocal, dup, branch
346
427
  (@insns.size - 2).times do |i|
347
428
  next if branch_targets[i + 1] || branch_targets[i + 2]
348
- insn0, getlocal_operands = @insns[i]
349
- insn1, dup_operands = @insns[i + 1]
350
- insn2, branch_operands = @insns[i + 2]
351
- if insn0 == :getlocal && insn1 == :dup && insn2 == :branch && getlocal_operands[1] == 0
352
- @insns[i ] = [:nop]
353
- @insns[i + 1] = [:nop]
354
- @insns[i + 2] = [:getlocal_dup_branch, [getlocal_operands, dup_operands, branch_operands]]
429
+ insn0 = @insns[i]
430
+ insn1 = @insns[i + 1]
431
+ insn2 = @insns[i + 2]
432
+ if insn0.insn == :getlocal && insn1.insn == :dup && insn2.insn == :branch && insn0.operands[1] == 0
433
+ getlocal_operands = insn0.operands
434
+ dup_operands = insn1.operands
435
+ branch_operands = insn2.operands
436
+ @insns[i ] = Insn.new(:nop, [])
437
+ @insns[i + 1] = Insn.new(:nop, [])
438
+ @insns[i + 2] = Insn.new(:getlocal_dup_branch, [getlocal_operands, dup_operands, branch_operands])
439
+ end
440
+ end
441
+
442
+ # find a pattern: dup, setlocal, branch
443
+ (@insns.size - 2).times do |i|
444
+ next if branch_targets[i + 1] || branch_targets[i + 2]
445
+ insn0 = @insns[i]
446
+ insn1 = @insns[i + 1]
447
+ insn2 = @insns[i + 2]
448
+ if insn0.insn == :dup && insn1.insn == :setlocal && insn2.insn == :branch && insn1.operands[1] == 0
449
+ dup_operands = insn0.operands
450
+ setlocal_operands = insn1.operands
451
+ branch_operands = insn2.operands
452
+ @insns[i ] = Insn.new(:nop, [])
453
+ @insns[i + 1] = Insn.new(:nop, [])
454
+ @insns[i + 2] = Insn.new(:dup_setlocal_branch, [dup_operands, setlocal_operands, branch_operands])
355
455
  end
356
456
  end
357
457
 
358
458
  # find a pattern: dup, branch
359
459
  (@insns.size - 1).times do |i|
360
460
  next if branch_targets[i + 1]
361
- insn0, dup_operands = @insns[i]
362
- insn1, branch_operands = @insns[i + 1]
363
- if insn0 == :dup && insn1 == :branch
364
- @insns[i ] = [:nop]
365
- @insns[i + 1] = [:dup_branch, [dup_operands, branch_operands]]
461
+ insn0 = @insns[i]
462
+ insn1 = @insns[i + 1]
463
+ if insn0.insn == :dup && insn1.insn == :branch
464
+ dup_operands = insn0.operands
465
+ branch_operands = insn1.operands
466
+ @insns[i ] = Insn.new(:nop, [])
467
+ @insns[i + 1] = Insn.new(:dup_branch, [dup_operands, branch_operands])
366
468
  end
367
469
  end
368
470
 
369
471
  # find a pattern: getlocal, branch
370
472
  (@insns.size - 1).times do |i|
371
473
  next if branch_targets[i + 1]
372
- insn0, getlocal_operands = @insns[i]
373
- insn1, branch_operands = @insns[i + 1]
374
- if [:getlocal, :getblockparam, :getblockparamproxy].include?(insn0) && getlocal_operands[1] == 0 && insn1 == :branch
375
- @insns[i ] = [:nop]
376
- @insns[i + 1] = [:getlocal_branch, [getlocal_operands, branch_operands]]
474
+ insn0 = @insns[i]
475
+ insn1 = @insns[i + 1]
476
+ if insn0.insn == :getlocal && insn0.operands[1] == 0 && insn1.insn == :branch
477
+ getlocal_operands = insn0.operands
478
+ branch_operands = insn1.operands
479
+ @insns[i ] = Insn.new(:nop, [])
480
+ @insns[i + 1] = Insn.new(:getlocal_branch, [getlocal_operands, branch_operands])
377
481
  end
378
482
  end
379
483
  end
380
484
 
381
485
  def check_send_branch(sp, j)
382
- insn, operands = @insns[j]
486
+ insn = @insns[j]
487
+ operands = insn.operands
383
488
 
384
- case insn
489
+ case insn.insn
385
490
  when :putspecialobject, :putnil, :putobject, :duparray, :putstring,
386
491
  :putself
387
492
  sp += 1
@@ -419,7 +524,7 @@ module TypeProf
419
524
  argc += 1 # receiver
420
525
  argc += kw_arg.size if kw_arg
421
526
  sp -= argc
422
- return :match if insn == :send && sp == 0 && @insns[j + 1][0] == :branch
527
+ return :match if insn.insn == :send && sp == 0 && @insns[j + 1].insn == :branch
423
528
  sp += 1
424
529
  when :arg_getlocal_send_branch
425
530
  return # not implemented