Skip to content

Commit efc43cb

Browse files
authored
[late-gc-lowering] null-out GC frame slots for dead objects (#52935)
Should fix #51818. MWE: ```julia function testme() X = @noinline rand(1_000_000_00) Y = @noinline sum(X) X = nothing GC.gc() return Y end ``` Note that it now stores a `NULL` in the GC frame before calling `jl_gc_collect`. Before: ```llvm ; Function Signature: testme() ; @ /Users/dnetto/Personal/test.jl:3 within `testme` define double @julia_testme_535() #0 { top: %gcframe1 = alloca [3 x ptr], align 16 call void @llvm.memset.p0.i64(ptr align 16 %gcframe1, i8 0, i64 24, i1 true) %pgcstack = call ptr inttoptr (i64 6595051180 to ptr)(i64 262) #10 store i64 4, ptr %gcframe1, align 16 %task.gcstack = load ptr, ptr %pgcstack, align 8 %frame.prev = getelementptr inbounds ptr, ptr %gcframe1, i64 1 store ptr %task.gcstack, ptr %frame.prev, align 8 store ptr %gcframe1, ptr %pgcstack, align 8 ; @ /Users/dnetto/Personal/test.jl:4 within `testme` %0 = call nonnull ptr @j_rand_539(i64 signext 100000000) %gc_slot_addr_0 = getelementptr inbounds ptr, ptr %gcframe1, i64 2 store ptr %0, ptr %gc_slot_addr_0, align 16 ; @ /Users/dnetto/Personal/test.jl:5 within `testme` %1 = call double @j_sum_541(ptr nonnull %0) ; @ /Users/dnetto/Personal/test.jl:7 within `testme` ; ┌ @ gcutils.jl:132 within `gc` @ gcutils.jl:132 call void @jlplt_ijl_gc_collect_543_got.jit(i32 1) %frame.prev4 = load ptr, ptr %frame.prev, align 8 store ptr %frame.prev4, ptr %pgcstack, align 8 ; └ ; @ /Users/dnetto/Personal/test.jl:8 within `testme` ret double %1 } ``` After: ```llvm ; Function Signature: testme() ; @ /Users/dnetto/Personal/test.jl:3 within `testme` define double @julia_testme_752() #0 { top: %gcframe1 = alloca [3 x ptr], align 16 call void @llvm.memset.p0.i64(ptr align 16 %gcframe1, i8 0, i64 24, i1 true) %pgcstack = call ptr inttoptr (i64 6595051180 to ptr)(i64 262) #10 store i64 4, ptr %gcframe1, align 16 %task.gcstack = load ptr, ptr %pgcstack, align 8 %frame.prev = getelementptr inbounds ptr, ptr %gcframe1, i64 1 store ptr %task.gcstack, ptr %frame.prev, align 8 store ptr %gcframe1, ptr %pgcstack, align 8 ; @ /Users/dnetto/Personal/test.jl:4 within `testme` %0 = call nonnull ptr @j_rand_756(i64 signext 100000000) %gc_slot_addr_0 = getelementptr inbounds ptr, ptr %gcframe1, i64 2 store ptr %0, ptr %gc_slot_addr_0, align 16 ; @ /Users/dnetto/Personal/test.jl:5 within `testme` %1 = call double @j_sum_758(ptr nonnull %0) store ptr null, ptr %gc_slot_addr_0, align 16 ; @ /Users/dnetto/Personal/test.jl:7 within `testme` ; ┌ @ gcutils.jl:132 within `gc` @ gcutils.jl:132 call void @jlplt_ijl_gc_collect_760_got.jit(i32 1) %frame.prev6 = load ptr, ptr %frame.prev, align 8 store ptr %frame.prev6, ptr %pgcstack, align 8 ; └ ; @ /Users/dnetto/Personal/test.jl:8 within `testme` ret double %1 } ```
1 parent bce3d4d commit efc43cb

File tree

4 files changed

+62
-12
lines changed

4 files changed

+62
-12
lines changed

src/llvm-gc-interface-passes.h

+4-3
Original file line numberDiff line numberDiff line change
@@ -353,10 +353,11 @@ struct LateLowerGCFrame: private JuliaPassContext {
353353
State LocalScan(Function &F);
354354
void ComputeLiveness(State &S);
355355
void ComputeLiveSets(State &S);
356-
SmallVector<int, 0> ColorRoots(const State &S);
356+
std::pair<SmallVector<int, 0>, int> ColorRoots(const State &S);
357357
void PlaceGCFrameStore(State &S, unsigned R, unsigned MinColorRoot, ArrayRef<int> Colors, Value *GCFrame, Instruction *InsertBefore);
358-
void PlaceGCFrameStores(State &S, unsigned MinColorRoot, ArrayRef<int> Colors, Value *GCFrame);
359-
void PlaceRootsAndUpdateCalls(SmallVectorImpl<int> &Colors, State &S, std::map<Value *, std::pair<int, int>>);
358+
void PlaceGCFrameStores(State &S, unsigned MinColorRoot, ArrayRef<int> Colors, int PreAssignedColors, Value *GCFrame);
359+
void PlaceGCFrameReset(State &S, unsigned R, unsigned MinColorRoot, ArrayRef<int> Colors, Value *GCFrame, Instruction *InsertBefore);
360+
void PlaceRootsAndUpdateCalls(ArrayRef<int> Colors, int PreAssignedColors, State &S, std::map<Value *, std::pair<int, int>>);
360361
void CleanupWriteBarriers(Function &F, State *S, const SmallVector<CallInst*, 0> &WriteBarriers, bool *CFGModified);
361362
bool CleanupIR(Function &F, State *S, bool *CFGModified);
362363
void NoteUseChain(State &S, BBState &BBS, User *TheUser);

src/llvm-late-gc-lowering.cpp

+29-7
Original file line numberDiff line numberDiff line change
@@ -1820,7 +1820,7 @@ JL_USED_FUNC static void dumpColorAssignments(const State &S, const ArrayRef<int
18201820
}
18211821
}
18221822

1823-
SmallVector<int, 0> LateLowerGCFrame::ColorRoots(const State &S) {
1823+
std::pair<SmallVector<int, 0>, int> LateLowerGCFrame::ColorRoots(const State &S) {
18241824
SmallVector<int, 0> Colors;
18251825
Colors.resize(S.MaxPtrNumber + 1, -1);
18261826
PEOIterator Ordering(S.Neighbors);
@@ -1862,7 +1862,7 @@ SmallVector<int, 0> LateLowerGCFrame::ColorRoots(const State &S) {
18621862
NewColor += PreAssignedColors;
18631863
Colors[ActiveElement] = NewColor;
18641864
}
1865-
return Colors;
1865+
return {Colors, PreAssignedColors};
18661866
}
18671867

18681868
// Size of T is assumed to be `sizeof(void*)`
@@ -2292,8 +2292,21 @@ void LateLowerGCFrame::PlaceGCFrameStore(State &S, unsigned R, unsigned MinColor
22922292
new StoreInst(Val, slotAddress, InsertBefore);
22932293
}
22942294

2295+
void LateLowerGCFrame::PlaceGCFrameReset(State &S, unsigned R, unsigned MinColorRoot,
2296+
ArrayRef<int> Colors, Value *GCFrame,
2297+
Instruction *InsertBefore) {
2298+
// Get the slot address.
2299+
auto slotAddress = CallInst::Create(
2300+
getOrDeclare(jl_intrinsics::getGCFrameSlot),
2301+
{GCFrame, ConstantInt::get(Type::getInt32Ty(InsertBefore->getContext()), Colors[R] + MinColorRoot)},
2302+
"gc_slot_addr_" + StringRef(std::to_string(Colors[R] + MinColorRoot)), InsertBefore);
2303+
// Reset the slot to NULL.
2304+
Value *Val = ConstantPointerNull::get(T_prjlvalue);
2305+
new StoreInst(Val, slotAddress, InsertBefore);
2306+
}
2307+
22952308
void LateLowerGCFrame::PlaceGCFrameStores(State &S, unsigned MinColorRoot,
2296-
ArrayRef<int> Colors, Value *GCFrame)
2309+
ArrayRef<int> Colors, int PreAssignedColors, Value *GCFrame)
22972310
{
22982311
for (auto &BB : *S.F) {
22992312
const BBState &BBS = S.BBStates[&BB];
@@ -2306,6 +2319,15 @@ void LateLowerGCFrame::PlaceGCFrameStores(State &S, unsigned MinColorRoot,
23062319
for(auto rit = BBS.Safepoints.rbegin();
23072320
rit != BBS.Safepoints.rend(); ++rit ) {
23082321
const LargeSparseBitVector &NowLive = S.LiveSets[*rit];
2322+
// reset slots which are no longer alive
2323+
for (int Idx : *LastLive) {
2324+
if (Idx >= PreAssignedColors && !HasBitSet(NowLive, Idx)) {
2325+
PlaceGCFrameReset(S, Idx, MinColorRoot, Colors, GCFrame,
2326+
S.ReverseSafepointNumbering[*rit]);
2327+
}
2328+
}
2329+
// store values which are alive in this safepoint but
2330+
// haven't been stored in the GC frame before
23092331
for (int Idx : NowLive) {
23102332
if (!HasBitSet(*LastLive, Idx)) {
23112333
PlaceGCFrameStore(S, Idx, MinColorRoot, Colors, GCFrame,
@@ -2317,7 +2339,7 @@ void LateLowerGCFrame::PlaceGCFrameStores(State &S, unsigned MinColorRoot,
23172339
}
23182340
}
23192341

2320-
void LateLowerGCFrame::PlaceRootsAndUpdateCalls(SmallVectorImpl<int> &Colors, State &S,
2342+
void LateLowerGCFrame::PlaceRootsAndUpdateCalls(ArrayRef<int> Colors, int PreAssignedColors, State &S,
23212343
std::map<Value *, std::pair<int, int>>) {
23222344
auto F = S.F;
23232345
auto T_int32 = Type::getInt32Ty(F->getContext());
@@ -2439,7 +2461,7 @@ void LateLowerGCFrame::PlaceRootsAndUpdateCalls(SmallVectorImpl<int> &Colors, St
24392461
pushGcframe->setArgOperand(1, NRoots);
24402462

24412463
// Insert GC frame stores
2442-
PlaceGCFrameStores(S, AllocaSlot - 2, Colors, gcframe);
2464+
PlaceGCFrameStores(S, AllocaSlot - 2, Colors, PreAssignedColors, gcframe);
24432465
// Insert GCFrame pops
24442466
for (auto &BB : *F) {
24452467
if (isa<ReturnInst>(BB.getTerminator())) {
@@ -2464,9 +2486,9 @@ bool LateLowerGCFrame::runOnFunction(Function &F, bool *CFGModified) {
24642486

24652487
State S = LocalScan(F);
24662488
ComputeLiveness(S);
2467-
SmallVector<int, 0> Colors = ColorRoots(S);
2489+
auto Colors = ColorRoots(S);
24682490
std::map<Value *, std::pair<int, int>> CallFrames; // = OptimizeCallFrames(S, Ordering);
2469-
PlaceRootsAndUpdateCalls(Colors, S, CallFrames);
2491+
PlaceRootsAndUpdateCalls(Colors.first, Colors.second, S, CallFrames);
24702492
CleanupIR(F, &S, CFGModified);
24712493
return true;
24722494
}

test/compiler/codegen.jl

+22
Original file line numberDiff line numberDiff line change
@@ -1003,3 +1003,25 @@ end
10031003
@test f55768(Vector)
10041004
@test f55768(Vector{T} where T)
10051005
@test !f55768(Vector{S} where S)
1006+
1007+
# test that values get rooted correctly over throw
1008+
for a in ((@noinline Ref{Int}(2)),
1009+
(@noinline Ref{Int}(3)),
1010+
5,
1011+
(@noinline Ref{Int}(4)),
1012+
6)
1013+
@test a[] != 0
1014+
try
1015+
b = (@noinline Ref{Int}(5),
1016+
@noinline Ref{Int}(6),
1017+
@noinline Ref{Int}(7),
1018+
@noinline Ref{Int}(8),
1019+
@noinline Ref{Int}(9),
1020+
@noinline Ref{Int}(10),
1021+
@noinline Ref{Int}(11))
1022+
GC.gc(true)
1023+
GC.@preserve b throw(a)
1024+
catch ex
1025+
@test ex === a
1026+
end
1027+
end

test/llvmpasses/returnstwicegc.ll

+7-2
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,6 @@
11
; This file is a part of Julia. License is MIT: https://julialang.org/license
22

3-
; RUN: opt --load-pass-plugin=libjulia-codegen%shlibext -passes='function(LateLowerGCFrame,FinalLowerGC)' -S %s | FileCheck %s --check-prefixes=OPAQUE
3+
; RUN: opt --load-pass-plugin=libjulia-codegen%shlibext -passes='function(LateLowerGCFrame,FinalLowerGC)' -S %s | FileCheck %s
44

55

66
declare void @boxed_simple({} addrspace(10)*, {} addrspace(10)*)
@@ -13,7 +13,12 @@ declare void @one_arg_boxed({} addrspace(10)*)
1313
define void @try_catch(i64 %a, i64 %b)
1414
{
1515
; Because of the returns_twice function, we need to keep aboxed live everywhere
16-
; OPAQUE: %gcframe = alloca ptr addrspace(10), i32 4
16+
; CHECK: %gcframe = alloca ptr addrspace(10), i32 4
17+
; CHECK: store ptr addrspace(10) %aboxed, ptr [[slot_0:%.*]],
18+
; CHECK-NOT: store {{.*}} ptr [[slot_0]]
19+
; CHECK: store ptr addrspace(10) %bboxed, ptr {{%.*}}
20+
; CHECK-NOT: store {{.*}} ptr [[slot_0]]
21+
1722
top:
1823
%sigframe = alloca [208 x i8], align 16
1924
%sigframe.sub = getelementptr inbounds [208 x i8], [208 x i8]* %sigframe, i64 0, i64 0

0 commit comments

Comments
 (0)