nit: Added link to `CONTRIBUTING.md` from the README
[nit.git] / src / rapid_type_analysis.nit
1 # This file is part of NIT ( http://www.nitlanguage.org ).
2 #
3 # Copyright 2012 Jean Privat <jean@pryen.org>
4 #
5 # Licensed under the Apache License, Version 2.0 (the "License");
6 # you may not use this file except in compliance with the License.
7 # You may obtain a copy of the License at
8 #
9 # http://www.apache.org/licenses/LICENSE-2.0
10 #
11 # Unless required by applicable law or agreed to in writing, software
12 # distributed under the License is distributed on an "AS IS" BASIS,
13 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
14 # See the License for the specific language governing permissions and
15 # limitations under the License.
16
17
18 # Rapid type analysis on the AST
19 #
20 # Rapid type analysis is an analysis that approximates the set of live classes
21 # and the set of live methods starting from the entry point of the program.
22 # These two sets are interdependent and computed together.
23 # It is quite efficient but the type set is global and pollutes each call site.
24 module rapid_type_analysis
25
26 import semantize
27
28 import csv # for live_types_to_csv
29 private import ordered_tree # for live_methods_to_tree
30
31 private import more_collections
32
redef class ModelBuilder
	# Run a rapid type analysis on the program rooted at `mainmodule`
	# and return the completed analysis.
	#
	# When the logging option of the toolcontext is set, the live methods
	# and the live types are also written in the log directory, in files
	# named after `mainmodule`.
	fun do_rapid_type_analysis(mainmodule: MModule): RapidTypeAnalysis
	do
		var rta = new RapidTypeAnalysis(self, mainmodule)
		rta.run_analysis

		# Nothing more to do unless logs were requested
		if not toolcontext.opt_log.value then return rta

		var prefix = toolcontext.log_directory / mainmodule.name
		rta.live_methods_to_tree.write_to_file(prefix + ".rta_methods.txt")
		rta.live_types_to_csv.write_to_file(prefix + ".rta_types.csv")
		return rta
	end
end
49
# RapidTypeAnalysis looks for live types and live methods in an application.
# The entry point of the analysis is the mainmodule of the application.
#
# The sets exposed by this class are filled by `run_analysis`.
class RapidTypeAnalysis
	# The modelbuilder used to get the AST.
	var modelbuilder: ModelBuilder

	# The main module of the analysis.
	# Used to perform types operations.
	var mainmodule: MModule

	# The pool of live types.
	# During the analysis, new types are added and combined with
	# `live_methods` to determine new methoddefs to visit.
	var live_types = new HashSet[MClassType]

	# The pool of unresolved live types.
	# They are globally resolved at the end of the analysis.
	var live_open_types = new HashSet[MClassType]

	# Live (instantiated) classes.
	var live_classes = new HashSet[MClass]

	# The pool of types used to perform type checks (isa and as).
	var live_cast_types = new HashSet[MType]

	# The pool of unresolved types used to perform type checks (isa and as).
	# They are globally resolved at the end of the analysis.
	var live_open_cast_types = new HashSet[MType]

	# Live method definitions.
	var live_methoddefs = new HashSet[MMethodDef]

	# Live methods.
	var live_methods = new HashSet[MMethod]

	# Live mmodules.
	# Those with a live method definition (see `live_methoddefs`).
	var live_mmodules = new HashSet[MModule]

	# Live callsites.
	var live_callsites = new HashSet[CallSite]

	# Results of `live_targets`, indexed by normalized receiver type and property.
	private var live_targets_cache = new HashMap2[MType, MProperty, Set[MMethodDef]]

	# The live targets of a specific callsite.
	#
	# The receiver type of the callsite is anchored (when the callsite has an
	# anchor), undecorated and, for class types, replaced by the bound type of
	# the class introduction. The result contains the first definition of the
	# called property for each live class that is a subtype of that receiver.
	#
	# Results are cached: a set is computed from `live_classes` at the time of
	# the first request and is not refreshed afterwards.
	fun live_targets(callsite: CallSite): Set[MMethodDef]
	do
		var mtype = callsite.recv
		var anchor = callsite.anchor
		if anchor != null then mtype = mtype.anchor_to(callsite.mmodule, anchor)
		mtype = mtype.undecorate
		if mtype isa MClassType then mtype = mtype.mclass.intro.bound_mtype
		var mproperty = callsite.mproperty
		var res = live_targets_cache[mtype, mproperty]
		if res != null then return res
		res = new ArraySet[MMethodDef]
		live_targets_cache[mtype, mproperty] = res

		for c in live_classes do
			var tc = c.intro.bound_mtype
			if not tc.is_subtype(mainmodule, null, mtype) then continue
			var d = mproperty.lookup_first_definition(mainmodule, tc)
			res.add d
		end

		return res
	end

	# Live call-to-super.
	var live_super_sends = new HashSet[MMethodDef]

	# Return a ready-to-save CSV document object that aggregates information about live types.
	# Each discovered type is listed in a line, with its status: resolution, liveness, cast-liveness.
	# Note: types are listed in an alphanumeric order to improve human reading.
	fun live_types_to_csv: CsvDocument
	do
		# Gather all kinds of types
		var typeset = new HashSet[MType]
		typeset.add_all(live_types)
		typeset.add_all(live_open_types)
		typeset.add_all(live_cast_types)
		typeset.add_all(live_open_cast_types)
		var types = typeset.to_a
		(new CachedAlphaComparator).sort(types)
		var res = new CsvDocument
		res.separator = ';'
		res.header = ["Type", "Resolution", "Liveness", "Cast-liveness"]
		for t in types do
			var reso
			if t.need_anchor then reso = "OPEN " else reso = "CLOSED"
			var live
			if t isa MClassType and (live_types.has(t) or live_open_types.has(t)) then live = "LIVE" else live = "DEAD"
			var cast
			if live_cast_types.has(t) or live_open_cast_types.has(t) then cast = "CAST LIVE" else cast = "CAST DEAD"
			res.add_record(t, reso, live, cast)
		end
		return res
	end

	# Return a ready-to-save OrderedTree object that aggregates information about live methods.
	#
	# Each live method is a root; its live definitions are its children.
	# A definition that is a live call-to-super gets an additional `(super)`
	# entry, attached to the definition when it is live, or directly to the
	# method otherwise.
	# Note: methods are listed in an alphanumeric order to improve human reading.
	fun live_methods_to_tree: OrderedTree[Object]
	do
		var tree = new OrderedTree[Object]
		for x in live_methods do
			var xn = x.full_name
			tree.add(null, xn)
			for z in x.mpropdefs do
				var zn = z.to_s
				if live_methoddefs.has(z) then
					tree.add(xn, zn)
					if live_super_sends.has(z) then
						tree.add(zn, zn + "(super)")
					end
				else if live_super_sends.has(z) then
					tree.add(xn, zn + "(super)")
				end
			end
		end
		tree.sort_with(alpha_comparator)
		return tree
	end

	# Methods that are still candidates to the try_send
	private var totry_methods = new HashSet[MMethod]

	# Methods that are no more candidates to the try_send.
	# They are removed from `totry_methods` by `add_new`, outside of the
	# iteration on `totry_methods`.
	private var totry_methods_to_remove = new Array[MMethod]

	# Methods that are or were candidates to the try_send
	# Used to ensure that try_send is only used once
	private var try_methods = new HashSet[MMethod]

	# The method definitions that remain to visit
	private var todo = new List[MMethodDef]

	# Make live all the classes named `classname` (if any) with their own class type.
	private fun force_alive(classname: String)
	do
		var classes = self.modelbuilder.model.get_mclasses_by_name(classname)
		if classes != null then for c in classes do self.add_new(c.mclass_type, c.mclass_type)
	end

	# Run the analysis until all visitable method definitions are visited.
	#
	# Does nothing when `mainmodule` has no `sys_type` (no entry point).
	# Otherwise the entry points and the primitive types are made live, the
	# worklist of method definitions is visited until exhaustion, then the
	# open types and open cast types are resolved against the live types.
	fun run_analysis
	do
		var maintype = mainmodule.sys_type
		if maintype == null then return # No entry point

		seed_entry_points(maintype)
		force_primitive_types
		while not todo.is_empty do visit_methoddef(todo.shift)
		resolve_open_types
		resolve_open_cast_types
	end

	# Make live the main type and send it the entry-point methods.
	#
	# `init` is sent when it exists, then `run` or, when `run` does not
	# exist, `main`. `finalize` is also sent to the finalizable type when
	# both exist.
	private fun seed_entry_points(maintype: MClassType)
	do
		add_new(maintype, maintype)
		var initprop = mainmodule.try_get_primitive_method("init", maintype.mclass)
		if initprop != null then add_send(maintype, initprop)
		var mainprop = mainmodule.try_get_primitive_method("run", maintype.mclass) or else
			mainmodule.try_get_primitive_method("main", maintype.mclass)
		if mainprop != null then add_send(maintype, mainprop)

		var finalizable_type = mainmodule.finalizable_type
		if finalizable_type != null then
			var finalize_meth = mainmodule.try_get_primitive_method("finalize", finalizable_type.mclass)
			if finalize_meth != null then add_send(finalizable_type, finalize_meth)
		end
	end

	# Force the primitive types to be live.
	private fun force_primitive_types
	do
		var names = ["Bool", "Float", "Char", "Pointer", "Byte", "Int", "Int8", "Int16", "UInt16", "Int32", "UInt32"]
		for name in names do force_alive(name)
	end

	# Visit one method definition taken from the worklist.
	#
	# Definitions without a signature are skipped.
	private fun visit_methoddef(mmethoddef: MMethodDef)
	do
		var mmeth = mmethoddef.mproperty
		var msignature = mmethoddef.msignature
		if msignature == null then return # Skip broken method

		var v = new RapidTypeVisitor(self, mmethoddef.mclassdef.bound_mtype, mmethoddef)

		# The node is both given to `force_get_primitive_method` below and
		# visited at the end: look it up only once.
		var npropdef = modelbuilder.mpropdef2node(mmethoddef)

		# A vararg parameter makes live the array of its element type, the
		# matching native array, and the `with_native` method of the array.
		var vararg_rank = msignature.vararg_rank
		if vararg_rank > -1 then
			var elttype = msignature.mparameters[vararg_rank].mtype
			var vararg = mainmodule.array_type(elttype)
			v.add_type(vararg)
			var native = mainmodule.native_array_type(elttype)
			v.add_type(native)
			v.add_monomorphic_send(vararg, modelbuilder.force_get_primitive_method(npropdef, "with_native", vararg.mclass, mainmodule))
		end

		# TODO? new_msignature
		# A parameter whose type is open in the introduction of the method
		# makes the type of the parameter in this definition a cast type.
		var osig = mmeth.intro.msignature.as(not null)
		for i in [0..msignature.arity[ do
			var origtype = osig.mparameters[i].mtype
			if not origtype.need_anchor then continue # skip non covariant stuff
			add_cast(msignature.mparameters[i].mtype)
		end

		if npropdef isa AClassdef then
			# The definition is associated to a class node: only root
			# inits are expected here.
			if mmethoddef.mproperty.is_root_init then
				if not mmethoddef.is_intro then
					self.add_super_send(v.receiver, mmethoddef)
				end
			else
				npropdef.debug "cannot RTA {mmethoddef}"
				abort
			end
			return
		else if mmethoddef.constant_value != null then
			# Make the return type live
			v.add_type(msignature.return_mtype.as(MClassType))
			return
		else if npropdef == null then
			abort
		end

		if npropdef isa AMethPropdef then
			var auto_super_inits = npropdef.auto_super_inits
			if auto_super_inits != null then
				for auto_super_init in auto_super_inits do
					v.add_callsite(auto_super_init)
				end
			end
			if npropdef.auto_super_call then
				self.add_super_send(v.receiver, mmethoddef)
			end
		end

		if mmethoddef.is_intern or mmethoddef.is_extern then
			# UGLY: We force the "instantiation" of the concrete return type if any
			var ret = msignature.return_mtype
			if ret != null and ret isa MClassType and ret.mclass.kind != abstract_kind and ret.mclass.kind != interface_kind then
				v.add_type(ret)
			end
		end

		v.enter_visit(npropdef)
	end

	# Resolve the live open types with each live type, until a fixed point.
	#
	# Each newly resolved type that passes `check_depth` becomes live and is
	# in turn used to resolve the open types.
	private fun resolve_open_types
	do
		var todo_types = new List[MClassType]
		todo_types.add_all(live_types)
		while not todo_types.is_empty do
			var t = todo_types.shift
			for ot in live_open_types do
				if not ot.can_resolve_for(t, t, mainmodule) then continue
				var rt = ot.anchor_to(mainmodule, t)
				if live_types.has(rt) then continue
				if not check_depth(rt) then continue
				live_types.add(rt)
				todo_types.add(rt)
			end
		end
	end

	# Resolve the live open cast types with each live type.
	# The resolved types are added to `live_cast_types`.
	private fun resolve_open_cast_types
	do
		for ot in live_open_cast_types do
			for t in live_types do
				if not ot.can_resolve_for(t, t, mainmodule) then continue
				var rt = ot.anchor_to(mainmodule, t)
				live_cast_types.add(rt)
			end
		end
	end

	# Is the length of `mtype` acceptable (at most 255)?
	# Otherwise a fatal error is signaled to the toolcontext.
	private fun check_depth(mtype: MClassType): Bool
	do
		var d = mtype.length
		if d > 255 then
			self.modelbuilder.toolcontext.fatal_error(null, "Fatal Error: limitation in the rapidtype analysis engine: a type depth of {d} is too important, the problematic type is `{mtype}`.")
			return false
		end
		return true
	end

	# Make `mtype` live, `recv` being the closed receiver used to anchor it.
	#
	# `mtype` is registered in `live_open_types` or in `live_types` according
	# to `need_anchor`; nothing more is done if it was already registered.
	#
	# When the class of `mtype` becomes live for the first time, the
	# candidate methods and the live super-sends are tried on it, then the
	# attributes with a value of the class are visited.
	fun add_new(recv: MClassType, mtype: MClassType)
	do
		assert not recv.need_anchor
		if mtype.need_anchor then
			if live_open_types.has(mtype) then return
			live_open_types.add(mtype)
		else
			if live_types.has(mtype) then return
			live_types.add(mtype)
		end

		var mclass = mtype.mclass
		if live_classes.has(mclass) then return
		live_classes.add(mclass)

		for p in totry_methods do try_send(mtype, p)
		for p in live_super_sends do try_super_send(mtype, p)

		# Remove cleared ones
		for p in totry_methods_to_remove do totry_methods.remove(p)
		totry_methods_to_remove.clear

		# Visit the value (expression or block) of the attributes
		var bound_mtype = mtype.anchor_to(mainmodule, recv)
		for cd in bound_mtype.collect_mclassdefs(mainmodule) do
			for npropdef in modelbuilder.collect_attr_propdef(cd) do
				if not npropdef.has_value then continue

				var mpropdef = npropdef.mreadpropdef.as(not null)
				var v = new RapidTypeVisitor(self, bound_mtype, mpropdef)
				v.enter_visit(npropdef.n_expr)
				v.enter_visit(npropdef.n_block)
			end
		end
	end

	# Register `mtype` as a type used in a type check.
	# Open types go to `live_open_cast_types`, the others to `live_cast_types`.
	fun add_cast(mtype: MType)
	do
		if mtype.need_anchor then
			live_open_cast_types.add(mtype)
		else
			live_cast_types.add(mtype)
		end
	end

	# Make live the definition of `mproperty` for the class of `recv`, if any.
	#
	# `recv` is replaced by the bound type of the introduction of its class.
	# Nothing is done if that type does not have `mproperty`.
	fun try_send(recv: MClassType, mproperty: MMethod)
	do
		recv = recv.mclass.intro.bound_mtype
		if not recv.has_mproperty(mainmodule, mproperty) then return
		var d = mproperty.lookup_first_definition(mainmodule, recv)
		add_call(d)
	end

	# Make `mpropdef` live and schedule its visit.
	#
	# Nothing is done if `mpropdef` is already live.
	# When all the definitions of a method with several definitions are
	# live, the method is scheduled for removal from the candidate set.
	fun add_call(mpropdef: MMethodDef)
	do
		if live_methoddefs.has(mpropdef) then return
		live_methoddefs.add(mpropdef)
		live_mmodules.add(mpropdef.mclassdef.mmodule)
		todo.add(mpropdef)

		var mproperty = mpropdef.mproperty
		if mproperty.mpropdefs.length <= 1 then return
		# If all definitions of a method are live, we can remove the definition of the totry set
		for d in mproperty.mpropdefs do
			if not live_methoddefs.has(d) then return
		end
		totry_methods_to_remove.add(mpropdef.mproperty)
	end

	# Make `mproperty` live and try it on the live classes.
	#
	# Each method is processed only once; later calls are ignored.
	# Note: `recv` is not used by this implementation.
	fun add_send(recv: MType, mproperty: MMethod)
	do
		if try_methods.has(mproperty) then return
		live_methods.add(mproperty)
		try_methods.add(mproperty)
		if mproperty.mpropdefs.length == 1 then
			# If there is only one definition, just add the definition and do not try again the property
			var d = mproperty.mpropdefs.first
			add_call(d)
			return
		end
		# Else, the property is potentially called with various receivers
		# So just try the methods with existing receivers and register it for future receivers
		totry_methods.add(mproperty)
		for c in live_classes do
			try_send(c.intro.bound_mtype, mproperty)
		end
	end

	# Make live the definition that follows `mpropdef` for the class of `recv`, if any.
	#
	# `recv` is replaced by the bound type of the introduction of its class.
	# Nothing is done if the class definition of `mpropdef` is not one of
	# the class definitions of that type.
	fun try_super_send(recv: MClassType, mpropdef: MMethodDef)
	do
		recv = recv.mclass.intro.bound_mtype
		if not recv.collect_mclassdefs(mainmodule).has(mpropdef.mclassdef) then return
		var d = mpropdef.lookup_next_definition(mainmodule, recv)
		add_call(d)
	end

	# Register `mpropdef` as a live call-to-super and try it on the live classes.
	#
	# `mpropdef` must have a supercall.
	# Each definition is processed only once; later calls are ignored.
	# Note: `recv` is not used by this implementation.
	fun add_super_send(recv: MType, mpropdef: MMethodDef)
	do
		assert mpropdef.has_supercall
		if live_super_sends.has(mpropdef) then return
		live_super_sends.add(mpropdef)
		for c in live_classes do
			try_super_send(c.intro.bound_mtype, mpropdef)
		end
	end
end
455
# Visitor that reports to a `RapidTypeAnalysis` what the visited nodes make live.
class RapidTypeVisitor
	super Visitor

	# The analysis that receives the discovered types, sends and casts.
	var analysis: RapidTypeAnalysis

	# The receiver type used to anchor the visited types.
	# It must be closed (see `init`).
	var receiver: MClassType

	# The property definition this visitor was created for.
	var mpropdef: MPropDef

	init
	do
		assert not receiver.need_anchor
	end

	# Let `n` report what it makes live, then visit its children.
	#
	# Expressions are considered only when they have a type or are typed;
	# their implicit cast, if any, is registered as a cast type.
	redef fun visit(n)
	do
		if not n isa AExpr then
			n.accept_rapid_type_visitor(self)
		else if n.mtype != null or n.is_typed then
			n.accept_rapid_type_visitor(self)
			var cast_target = n.implicit_cast_to
			if cast_target != null then add_cast_type(cast_target)
		end

		# RTA does not enter in AAnnotations
		if n isa AAnnotations then return
		n.visit_all(self)
	end

	# Anchor `mtype` with the receiver and strip its decoration.
	#
	# Return null for the null type.
	# The result is asserted to be a closed class type.
	fun cleanup_type(mtype: MType): nullable MClassType
	do
		var anchored = mtype.anchor_to(analysis.mainmodule, receiver)
		if anchored isa MNullType then return null
		var bare = anchored.undecorate
		assert bare isa MClassType
		assert not bare.need_anchor
		return bare
	end

	# Get the method `name` of the class of `recv` (once cleaned up).
	#
	# `recv` must not clean up to null and a node must be currently visited.
	fun get_method(recv: MType, name: String): MMethod
	do
		var mclasstype = cleanup_type(recv)
		assert mclasstype != null
		var node = current_node.as(not null)
		return analysis.modelbuilder.force_get_primitive_method(node, name, mclasstype.mclass, analysis.mainmodule)
	end

	# Make `mtype` live, anchored with the receiver of the visitor.
	fun add_type(mtype: MClassType)
	do
		analysis.add_new(receiver, mtype)
	end

	# Make `mproperty` live and try it on `mtype` only.
	# `mtype` must be a class type.
	fun add_monomorphic_send(mtype: MType, mproperty: MMethod)
	do
		analysis.live_methods.add(mproperty)
		var recv = mtype.as(MClassType)
		analysis.try_send(recv, mproperty)
	end

	# Register a send of `mproperty` on `mtype` in the analysis.
	fun add_send(mtype: MType, mproperty: MMethod)
	do
		analysis.add_send(mtype, mproperty)
	end

	# Register `mtype` as a cast type in the analysis.
	fun add_cast_type(mtype: MType)
	do
		analysis.add_cast(mtype)
	end

	# Register what `callsite` makes live; a null callsite is ignored.
	#
	# The method initializers of the called definition are sent first,
	# then the called property; the callsite is finally recorded as live.
	fun add_callsite(callsite: nullable CallSite)
	do
		if callsite == null then return

		var recv = callsite.recv
		for initializer in callsite.mpropdef.initializers do
			if initializer isa MMethod then analysis.add_send(recv, initializer)
		end
		analysis.add_send(recv, callsite.mproperty)
		analysis.live_callsites.add(callsite)
	end
end
525
526 ###
527
redef class ANode
	# Hook called by `RapidTypeVisitor::visit` on the visited nodes.
	# Does nothing by default.
	private fun accept_rapid_type_visitor(v: RapidTypeVisitor) do end
end
533
redef class AExpr
	# Make the `mtype` of the expression live
	# Used by literals and instantiations
	#
	# Nothing is done when the type is not a class type.
	fun allocate_mtype(v: RapidTypeVisitor)
	do
		var static_type = self.mtype
		if static_type isa MClassType then v.add_type(static_type)
	end
end
544
redef class AIntegerExpr
	# An integer literal makes its type live.
	redef fun accept_rapid_type_visitor(v) do allocate_mtype(v)
end
551
redef class AFloatExpr
	# A float literal makes its type live.
	redef fun accept_rapid_type_visitor(v) do allocate_mtype(v)
end
558
redef class ACharExpr
	# A character literal makes its type live.
	redef fun accept_rapid_type_visitor(v) do allocate_mtype(v)
end
565
redef class AArrayExpr
	# An array literal makes live its array type, the native array of its
	# element type, the `with_native` method of the array, and the
	# `with_capacity_callsite` and `push_callsite` callsites.
	redef fun accept_rapid_type_visitor(v)
	do
		var array_mtype = self.mtype.as(MClassType)
		v.add_type(array_mtype)
		v.add_type(v.analysis.mainmodule.native_array_type(array_mtype.arguments.first))

		# The method is looked up and sent on the closed version of the type
		var closed_mtype = v.cleanup_type(array_mtype).as(not null)
		v.add_monomorphic_send(closed_mtype, v.get_method(closed_mtype, "with_native"))

		v.add_callsite(with_capacity_callsite)
		v.add_callsite(push_callsite)
	end
end
580
redef class AStringFormExpr
	# A string literal makes live the native string type and its
	# `to_s_full` method, then the optional callsites attached to the literal.
	redef fun accept_rapid_type_visitor(v)
	do
		var native_str = v.analysis.mainmodule.native_string_type
		v.add_type(native_str)
		v.add_monomorphic_send(native_str, v.get_method(native_str, "to_s_full"))

		# Optional callsites; the null ones are ignored by `add_callsite`
		v.add_callsite(self.to_re)
		v.add_callsite(self.ignore_case)
		v.add_callsite(self.newline)
		v.add_callsite(self.extended)
		v.add_callsite(self.to_bytes_with_copy)
	end
end
595
redef class ASuperstringExpr
	# A superstring makes live the array of strings and the native array of
	# strings, with the methods `join` and `with_native` of the former and
	# `native_to_s` of the latter.
	redef fun accept_rapid_type_visitor(v)
	do
		var mainmodule = v.analysis.mainmodule
		var str_type = mainmodule.string_type

		var array_of_str = mainmodule.array_type(str_type)
		v.add_type(array_of_str)
		var native_of_str = mainmodule.native_array_type(str_type)
		v.add_type(native_of_str)

		v.add_monomorphic_send(array_of_str, v.get_method(array_of_str, "join"))
		v.add_monomorphic_send(array_of_str, v.get_method(array_of_str, "with_native"))
		v.add_monomorphic_send(native_of_str, v.get_method(native_of_str, "native_to_s"))
	end
end
612
redef class ACrangeExpr
	# A range literal makes live its type and its `init_callsite`.
	# Nothing is done when the type is not a class type.
	redef fun accept_rapid_type_visitor(v)
	do
		var range_type = self.mtype
		if range_type isa MClassType then
			v.add_type(range_type)
			v.add_callsite(init_callsite)
		end
	end
end
622
redef class AOrangeExpr
	# A range literal makes live its type and its `init_callsite`.
	# Nothing is done when the type is not a class type.
	redef fun accept_rapid_type_visitor(v)
	do
		var range_type = self.mtype
		if range_type isa MClassType then
			v.add_type(range_type)
			v.add_callsite(init_callsite)
		end
	end
end
632
redef class ATrueExpr
	# The `true` literal makes its type live.
	redef fun accept_rapid_type_visitor(v) do allocate_mtype(v)
end
639
redef class AFalseExpr
	# The `false` literal makes its type live.
	redef fun accept_rapid_type_visitor(v) do allocate_mtype(v)
end
646
redef class AIsaExpr
	# An `isa` registers its `cast_type`, when known, as a cast type.
	redef fun accept_rapid_type_visitor(v)
	do
		var target = self.cast_type
		if target != null then v.add_cast_type(target)
	end
end
655
redef class AAsCastExpr
	# An `as` cast registers its `mtype`, when known, as a cast type.
	redef fun accept_rapid_type_visitor(v)
	do
		var target = self.mtype
		if target != null then v.add_cast_type(target)
	end
end
664
redef class ASendExpr
	# A send registers its callsite.
	redef fun accept_rapid_type_visitor(v) do v.add_callsite(self.callsite)
end
671
672
redef class ASendReassignFormExpr
	# A send with reassignment registers three callsites, in this order:
	# `callsite`, `reassign_callsite` and `write_callsite`.
	redef fun accept_rapid_type_visitor(v)
	do
		v.add_callsite(self.callsite)
		v.add_callsite(self.reassign_callsite)
		v.add_callsite(self.write_callsite)
	end
end
681
redef class AVarReassignExpr
	# A variable reassignment registers its `reassign_callsite`.
	redef fun accept_rapid_type_visitor(v) do v.add_callsite(self.reassign_callsite)
end
688
redef class AAttrReassignExpr
	# An attribute reassignment registers its `reassign_callsite`.
	redef fun accept_rapid_type_visitor(v) do v.add_callsite(self.reassign_callsite)
end
695
redef class ASuperExpr
	# A `super` with a callsite registers that callsite.
	# Otherwise it is registered as a super-send of its `mpropdef`.
	redef fun accept_rapid_type_visitor(v)
	do
		var cs = self.callsite
		if cs != null then
			v.add_callsite(cs)
		else
			v.analysis.add_super_send(v.receiver, mpropdef.as(not null))
		end
	end
end
708
redef class AForGroup
	# A `for` group registers the callsites of its iteration protocol.
	#
	# With one variable `method_item` is registered; with two variables
	# `method_key` then `method_item` are. Any other number of variables
	# aborts.
	redef fun accept_rapid_type_visitor(v)
	do
		v.add_callsite(self.method_iterator)
		v.add_callsite(self.method_is_ok)

		var nvars = self.variables.length
		if nvars == 2 then
			v.add_callsite(self.method_key)
			v.add_callsite(self.method_item)
		else if nvars == 1 then
			v.add_callsite(self.method_item)
		else
			abort
		end

		v.add_callsite(self.method_next)
		# `add_callsite` ignores a null callsite
		v.add_callsite(self.method_finish)
	end
end
727
redef class ANewExpr
	# A `new` makes live the instantiated type (`recvtype`, which must be
	# known) and registers the callsite of the constructor.
	redef fun accept_rapid_type_visitor(v)
	do
		v.add_type(self.recvtype.as(not null))
		v.add_callsite(self.callsite)
	end
end