Skip to content

Commit fd959c7

Browse files
committed
wip: fix EA regression, better approach
1 parent 828c20d commit fd959c7

File tree

2 files changed

+34
-44
lines changed

2 files changed

+34
-44
lines changed

base/compiler/optimize.jl

+33-27
Original file line numberDiff line numberDiff line change
@@ -626,47 +626,51 @@ end
626626
GetNativeEscapeCache(interp::AbstractInterpreter) = GetNativeEscapeCache(code_cache(interp))
627627
function ((; code_cache)::GetNativeEscapeCache)(mi::MethodInstance)
628628
codeinst = get(code_cache, mi, nothing)
629-
codeinst isa CodeInstance || return false
630-
argescapes = traverse_analysis_results(codeinst) do @nospecialize result
629+
codeinst isa CodeInstance || return nothing
630+
return traverse_analysis_results(codeinst) do @nospecialize result
631631
return result isa EscapeAnalysis.ArgEscapeCache ? result : nothing
632632
end
633-
if argescapes !== nothing
634-
return argescapes
635-
end
636-
effects = decode_effects(codeinst.ipo_purity_bits)
637-
if is_effect_free(effects) && is_inaccessiblememonly(effects)
638-
# We might not have run EA on simple frames without any escapes (e.g. when optimization
639-
# is skipped when result is constant-folded by abstract interpretation). If those
640-
# frames aren't inlined, the accuracy of EA for caller context takes a big hit.
641-
# This is a HACK to avoid that, but obviously, a more comprehensive fix would be ideal.
642-
return true
643-
end
644-
return false
633+
end
634+
635+
analyze_and_cache_escapes!(interp::AbstractInterpreter, opt::OptimizationState, sv::PostOptAnalysisState) =
636+
analyze_and_cache_escapes!(interp, opt, sv.ir, sv.result)
637+
638+
function analyze_and_cache_escapes!(interp::AbstractInterpreter, opt::OptimizationState,
639+
ir::IRCode, result::InferenceResult)
640+
nargs = Int(opt.src.nargs)
641+
estate = EscapeAnalysis.analyze_escapes(ir, nargs, optimizer_lattice(interp), get_escape_cache(interp))
642+
argescapes = EscapeAnalysis.ArgEscapeCache(estate)
643+
stack_analysis_result!(result, argescapes)
644+
return estate
645645
end
646646

647647
function refine_effects!(interp::AbstractInterpreter, opt::OptimizationState, sv::PostOptAnalysisState)
648+
EA_cached = false
648649
if !is_effect_free(sv.result.ipo_effects) && sv.all_effect_free && !isempty(sv.ea_analysis_pending)
649-
ir = sv.ir
650-
nargs = Int(opt.src.nargs)
651-
estate = EscapeAnalysis.analyze_escapes(ir, nargs, optimizer_lattice(interp), get_escape_cache(interp))
652-
argescapes = EscapeAnalysis.ArgEscapeCache(estate)
653-
stack_analysis_result!(sv.result, argescapes)
650+
estate = analyze_and_cache_escapes!(interp, opt, sv)
654651
validate_mutable_arg_escapes!(estate, sv)
652+
EA_cached = true
655653
end
656654

657-
any_refinable(sv) || return false
658655
effects = sv.result.ipo_effects
659-
sv.result.ipo_effects = Effects(effects;
656+
any_refinable(sv) || @goto run_EA_on_simple_frame
657+
effects = sv.result.ipo_effects = Effects(effects;
660658
consistent = sv.all_retpaths_consistent ? ALWAYS_TRUE : effects.consistent,
661659
effect_free = sv.all_effect_free ? ALWAYS_TRUE :
662-
sv.effect_free_if_argmem_only === true ? EFFECT_FREE_IF_INACCESSIBLEMEMONLY : effects.effect_free,
660+
sv.effect_free_if_argmem_only === true ? EFFECT_FREE_IF_INACCESSIBLEMEMONLY : effects.effect_free,
663661
nothrow = sv.all_nothrow ? true : effects.nothrow,
664662
noub = sv.all_noub ? (sv.any_conditional_ub ? NOUB_IF_NOINBOUNDS : ALWAYS_TRUE) : effects.noub,
665663
nortcall = sv.nortcall ? true : effects.nortcall)
666-
return true
664+
665+
@label run_EA_on_simple_frame
666+
if !EA_cached && is_effect_free(effects) && is_inaccessiblememonly(effects)
667+
analyze_and_cache_escapes!(interp, opt, sv)
668+
end
669+
670+
nothing
667671
end
668672

669-
function is_ipo_dataflow_analysis_profitable(effects::Effects)
673+
function is_ipo_effects_refinable(effects::Effects)
670674
return !(is_consistent(effects) && is_effect_free(effects) &&
671675
is_nothrow(effects) && is_noub(effects))
672676
end
@@ -941,8 +945,9 @@ end
941945

942946
function ipo_dataflow_analysis!(interp::AbstractInterpreter, opt::OptimizationState,
943947
ir::IRCode, result::InferenceResult)
944-
if !is_ipo_dataflow_analysis_profitable(result.ipo_effects)
945-
return false
948+
if !is_ipo_effects_refinable(result.ipo_effects)
949+
analyze_and_cache_escapes!(interp, opt, ir, result)
950+
return nothing
946951
end
947952

948953
@assert isempty(ir.new_nodes) "IRCode should be compacted before post-opt analysis"
@@ -968,7 +973,8 @@ function ipo_dataflow_analysis!(interp::AbstractInterpreter, opt::OptimizationSt
968973
end
969974
end
970975

971-
return refine_effects!(interp, opt, sv)
976+
refine_effects!(interp, opt, sv)
977+
nothing
972978
end
973979

974980
# run the optimization work

base/compiler/ssair/EscapeAnalysis/EscapeAnalysis.jl

+1-17
Original file line numberDiff line numberDiff line change
@@ -1068,24 +1068,8 @@ function escape_invoke!(astate::AnalysisState, pc::Int, args::Vector{Any})
10681068
add_liveness_changes!(astate, pc, args, first_idx, last_idx)
10691069
# TODO inspect `astate.ir.stmts[pc][:info]` and use const-prop'ed `InferenceResult` if available
10701070
cache = astate.get_escape_cache(mi)
1071+
cache isa ArgEscapeCache || return add_conservative_changes!(astate, pc, args, 2)
10711072
ret = SSAValue(pc)
1072-
if cache isa Bool
1073-
if cache
1074-
# This method call is very simple and has good effects, so there's no need to
1075-
# escape its arguments. However, since the arguments might be returned, we need
1076-
# to consider the possibility of aliasing between them and the return value.
1077-
for argidx = first_idx:last_idx
1078-
arg = args[argidx]
1079-
if !is_mutation_free_argtype(argextype(arg, astate.ir))
1080-
add_alias_change!(astate, ret, arg)
1081-
end
1082-
end
1083-
return nothing
1084-
else
1085-
return add_conservative_changes!(astate, pc, args, 2)
1086-
end
1087-
end
1088-
cache = cache::ArgEscapeCache
10891073
retinfo = astate.estate[ret] # escape information imposed on the call statement
10901074
method = mi.def::Method
10911075
nargs = Int(method.nargs)

0 commit comments

Comments
 (0)