@@ -106,6 +106,7 @@ function finish!(interp::AbstractInterpreter, caller::InferenceState)
106
106
# @assert last(result.valid_worlds) <= get_world_counter() || isempty(caller.edges)
107
107
if isdefined (result, :ci )
108
108
ci = result. ci
109
+ mi = result. linfo
109
110
# if we aren't cached, we don't need this edge
110
111
# but our caller might, so let's just make it anyways
111
112
if last (result. valid_worlds) >= get_world_counter ()
@@ -132,15 +133,15 @@ function finish!(interp::AbstractInterpreter, caller::InferenceState)
132
133
end
133
134
di = inferred_result. debuginfo
134
135
uncompressed = inferred_result
135
- inferred_result = maybe_compress_codeinfo (interp, result . linfo , inferred_result)
136
+ inferred_result = maybe_compress_codeinfo (interp, mi , inferred_result)
136
137
result. is_src_volatile = false
137
138
elseif ci. owner === nothing
138
139
# The global cache can only handle objects that codegen understands
139
140
inferred_result = nothing
140
141
end
141
142
end
142
143
if ! @isdefined di
143
- di = DebugInfo (result . linfo )
144
+ di = DebugInfo (mi )
144
145
end
145
146
min_world, max_world = first (result. valid_worlds), last (result. valid_worlds)
146
147
ipo_effects = encode_effects (result. ipo_effects)
@@ -149,6 +150,9 @@ function finish!(interp::AbstractInterpreter, caller::InferenceState)
149
150
UInt32, Any, Any, Any),
150
151
ci, inferred_result, rettype, exctype, rettype_const, const_flags, min_world, max_world,
151
152
ipo_effects, result. analysis_results, di, edges)
153
+ if is_cached (caller) # CACHE_MODE_GLOBAL
154
+ cache_result! (interp, mi, ci)
155
+ end
152
156
engine_reject (interp, ci)
153
157
if ! discard_src && isdefined (interp, :codegen ) && uncompressed isa CodeInfo
154
158
# record that the caller could use this result to generate code when required, if desired, to avoid repeating n^2 work
@@ -157,7 +161,6 @@ function finish!(interp::AbstractInterpreter, caller::InferenceState)
157
161
# This is necessary to get decent bootstrapping performance
158
162
# when compiling the compiler to inject everything eagerly
159
163
# where codegen can start finding and using it right away
160
- mi = result. linfo
161
164
if mi. def isa Method && isa_compileable_sig (mi)
162
165
ccall (:jl_add_codeinst_to_jit , Cvoid, (Any, Any), ci, uncompressed)
163
166
end
@@ -167,6 +170,10 @@ function finish!(interp::AbstractInterpreter, caller::InferenceState)
167
170
return nothing
168
171
end
169
172
173
+ function cache_result! (interp:: AbstractInterpreter , mi:: MethodInstance , ci:: CodeInstance )
174
+ code_cache (interp)[mi] = ci
175
+ end
176
+
170
177
function finish! (interp:: AbstractInterpreter , mi:: MethodInstance , ci:: CodeInstance , src:: CodeInfo )
171
178
user_edges = src. edges
172
179
edges = user_edges isa SimpleVector ? user_edges : user_edges === nothing ? Core. svec () : Core. svec (user_edges... )
@@ -200,11 +207,13 @@ function finish!(interp::AbstractInterpreter, mi::MethodInstance, ci::CodeInstan
200
207
end
201
208
202
209
function finish_nocycle (:: AbstractInterpreter , frame:: InferenceState )
203
- finishinfer! (frame, frame. interp)
210
+ opt_cache = IdDict {MethodInstance,CodeInstance} ()
211
+ finishinfer! (frame, frame. interp, opt_cache)
204
212
opt = frame. result. src
205
213
if opt isa OptimizationState # implies `may_optimize(caller.interp) === true`
206
214
optimize (frame. interp, opt, frame. result)
207
215
end
216
+ empty! (opt_cache)
208
217
finish! (frame. interp, frame)
209
218
if frame. cycleid != 0
210
219
frames = frame. callstack:: Vector{AbsIntState}
@@ -227,10 +236,11 @@ function finish_cycle(::AbstractInterpreter, frames::Vector{AbsIntState}, cyclei
227
236
cycle_valid_worlds = intersect (cycle_valid_worlds, caller. world. valid_worlds)
228
237
cycle_valid_effects = merge_effects (cycle_valid_effects, caller. ipo_effects)
229
238
end
239
+ opt_cache = IdDict {MethodInstance,CodeInstance} ()
230
240
for frameid = cycleid: length (frames)
231
241
caller = frames[frameid]:: InferenceState
232
242
adjust_cycle_frame! (caller, cycle_valid_worlds, cycle_valid_effects)
233
- finishinfer! (caller, caller. interp)
243
+ finishinfer! (caller, caller. interp, opt_cache )
234
244
end
235
245
for frameid = cycleid: length (frames)
236
246
caller = frames[frameid]:: InferenceState
@@ -239,6 +249,7 @@ function finish_cycle(::AbstractInterpreter, frames::Vector{AbsIntState}, cyclei
239
249
optimize (caller. interp, opt, caller. result)
240
250
end
241
251
end
252
+ empty! (opt_cache)
242
253
for frameid = cycleid: length (frames)
243
254
caller = frames[frameid]:: InferenceState
244
255
finish! (caller. interp, caller)
@@ -285,22 +296,6 @@ function maybe_compress_codeinfo(interp::AbstractInterpreter, mi::MethodInstance
285
296
end
286
297
end
287
298
288
- function cache_result! (interp:: AbstractInterpreter , result:: InferenceResult , ci:: CodeInstance )
289
- @assert isdefined (ci, :inferred )
290
- # check if the existing linfo metadata is also sufficient to describe the current inference result
291
- # to decide if it is worth caching this right now
292
- mi = result. linfo
293
- cache = WorldView (code_cache (interp), result. valid_worlds)
294
- if haskey (cache, mi)
295
- ci = cache[mi]
296
- # n.b.: accurate edge representation might cause the CodeInstance for this to be constructed later
297
- @assert isdefined (ci, :inferred )
298
- return false
299
- end
300
- code_cache (interp)[mi] = ci
301
- return true
302
- end
303
-
304
299
function cycle_fix_limited (@nospecialize (typ), sv:: InferenceState )
305
300
if typ isa LimitedAccuracy
306
301
if sv. parentid === 0
@@ -428,7 +423,8 @@ const empty_edges = Core.svec()
428
423
429
424
# inference completed on `me`
430
425
# update the MethodInstance
431
- function finishinfer! (me:: InferenceState , interp:: AbstractInterpreter )
426
+ function finishinfer! (me:: InferenceState , interp:: AbstractInterpreter ,
427
+ opt_cache:: IdDict{MethodInstance, CodeInstance} )
432
428
# prepare to run optimization passes on fulltree
433
429
@assert isempty (me. ip)
434
430
# inspect whether our inference had a limited result accuracy,
@@ -481,7 +477,7 @@ function finishinfer!(me::InferenceState, interp::AbstractInterpreter)
481
477
# disable optimization if we've already obtained very accurate result
482
478
! result_is_constabi (interp, result)
483
479
if doopt
484
- result. src = OptimizationState (me, interp)
480
+ result. src = OptimizationState (me, interp, opt_cache )
485
481
else
486
482
result. src = me. src # for reflection etc.
487
483
end
@@ -502,9 +498,11 @@ function finishinfer!(me::InferenceState, interp::AbstractInterpreter)
502
498
ci, rettype, exctype, rettype_const, const_flags, min_world, max_world,
503
499
encode_effects (result. ipo_effects), result. analysis_results, di, edges)
504
500
if is_cached (me) # CACHE_MODE_GLOBAL
505
- cached_result = cache_result! (me. interp, result, ci)
506
- if ! cached_result
501
+ already_cached = is_already_cached (me. interp, result, ci)
502
+ if already_cached
507
503
me. cache_mode = CACHE_MODE_VOLATILE
504
+ else
505
+ opt_cache[result. linfo] = ci
508
506
end
509
507
end
510
508
end
551
549
return ResultForCache (rettype, exctype, rettype_const, const_flags)
552
550
end
553
551
552
+ function is_already_cached (interp:: AbstractInterpreter , result:: InferenceResult , ci:: CodeInstance )
553
+ # check if the existing linfo metadata is also sufficient to describe the current inference result
554
+ # to decide if it is worth caching this right now
555
+ mi = result. linfo
556
+ cache = WorldView (code_cache (interp), result. valid_worlds)
557
+ if haskey (cache, mi)
558
+ # n.b.: accurate edge representation might cause the CodeInstance for this to be constructed later
559
+ @assert isdefined (cache[mi], :inferred )
560
+ return true
561
+ end
562
+ return false
563
+ end
564
+
554
565
# record the backedges
555
566
function store_backedges (caller:: CodeInstance , edges:: SimpleVector )
556
567
isa (caller. def. def, Method) || return # don't add backedges to toplevel method instance
0 commit comments