mirror of
https://github.com/RPCS3/llvm-mirror.git
synced 2025-01-31 20:51:52 +01:00
[coroutines] Fix spills of static array allocas
Summary: CoroFrame was not considering static array allocas, and was only ever reserving a single element in the coroutine frame. This meant that stores to the non-zero'th element would corrupt later frame data. Store static array allocas as field arrays in the coroutine frame. Added test. Committed by Gor Nishanov on behalf of ben-clayton Reviewers: GorNishanov, modocache Reviewed By: GorNishanov Subscribers: Orlando, capn, EricWF, llvm-commits Tags: #llvm Differential Revision: https://reviews.llvm.org/D61372 llvm-svn: 360636
This commit is contained in:
parent
55419fb427
commit
8de3d7fc0b
@ -402,6 +402,7 @@ static StructType *buildFrameType(Function &F, coro::Shape &Shape,
|
|||||||
if (CurrentDef == Shape.PromiseAlloca)
|
if (CurrentDef == Shape.PromiseAlloca)
|
||||||
continue;
|
continue;
|
||||||
|
|
||||||
|
uint64_t Count = 1;
|
||||||
Type *Ty = nullptr;
|
Type *Ty = nullptr;
|
||||||
if (auto *AI = dyn_cast<AllocaInst>(CurrentDef)) {
|
if (auto *AI = dyn_cast<AllocaInst>(CurrentDef)) {
|
||||||
Ty = AI->getAllocatedType();
|
Ty = AI->getAllocatedType();
|
||||||
@ -413,11 +414,18 @@ static StructType *buildFrameType(Function &F, coro::Shape &Shape,
|
|||||||
Padder.addType(PaddingTy);
|
Padder.addType(PaddingTy);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
if (auto *CI = dyn_cast<ConstantInt>(AI->getArraySize()))
|
||||||
|
Count = CI->getValue().getZExtValue();
|
||||||
|
else
|
||||||
|
report_fatal_error("Coroutines cannot handle non static allocas yet");
|
||||||
} else {
|
} else {
|
||||||
Ty = CurrentDef->getType();
|
Ty = CurrentDef->getType();
|
||||||
}
|
}
|
||||||
S.setFieldIndex(Types.size());
|
S.setFieldIndex(Types.size());
|
||||||
|
if (Count == 1)
|
||||||
Types.push_back(Ty);
|
Types.push_back(Ty);
|
||||||
|
else
|
||||||
|
Types.push_back(ArrayType::get(Ty, Count));
|
||||||
Padder.addType(Ty);
|
Padder.addType(Ty);
|
||||||
}
|
}
|
||||||
FrameTy->setBody(Types);
|
FrameTy->setBody(Types);
|
||||||
@ -470,6 +478,7 @@ static Instruction *splitBeforeCatchSwitch(CatchSwitchInst *CatchSwitch) {
|
|||||||
//
|
//
|
||||||
static Instruction *insertSpills(SpillInfo &Spills, coro::Shape &Shape) {
|
static Instruction *insertSpills(SpillInfo &Spills, coro::Shape &Shape) {
|
||||||
auto *CB = Shape.CoroBegin;
|
auto *CB = Shape.CoroBegin;
|
||||||
|
LLVMContext &C = CB->getContext();
|
||||||
IRBuilder<> Builder(CB->getNextNode());
|
IRBuilder<> Builder(CB->getNextNode());
|
||||||
StructType *FrameTy = Shape.FrameTy;
|
StructType *FrameTy = Shape.FrameTy;
|
||||||
PointerType *FramePtrTy = FrameTy->getPointerTo();
|
PointerType *FramePtrTy = FrameTy->getPointerTo();
|
||||||
@ -491,14 +500,38 @@ static Instruction *insertSpills(SpillInfo &Spills, coro::Shape &Shape) {
|
|||||||
if (Shape.PromiseAlloca)
|
if (Shape.PromiseAlloca)
|
||||||
Allocas.emplace_back(Shape.PromiseAlloca, coro::Shape::PromiseField);
|
Allocas.emplace_back(Shape.PromiseAlloca, coro::Shape::PromiseField);
|
||||||
|
|
||||||
|
// Create a GEP with the given index into the coroutine frame for the original
|
||||||
|
// value Orig. Appends an extra 0 index for array-allocas, preserving the
|
||||||
|
// original type.
|
||||||
|
auto GetFramePointer = [&](uint32_t Index, Value *Orig) -> Value * {
|
||||||
|
SmallVector<Value *, 3> Indices = {
|
||||||
|
ConstantInt::get(Type::getInt32Ty(C), 0),
|
||||||
|
ConstantInt::get(Type::getInt32Ty(C), Index),
|
||||||
|
};
|
||||||
|
|
||||||
|
if (auto *AI = dyn_cast<AllocaInst>(Orig)) {
|
||||||
|
if (auto *CI = dyn_cast<ConstantInt>(AI->getArraySize())) {
|
||||||
|
auto Count = CI->getValue().getZExtValue();
|
||||||
|
if (Count > 1) {
|
||||||
|
Indices.push_back(ConstantInt::get(Type::getInt32Ty(C), 0));
|
||||||
|
}
|
||||||
|
} else {
|
||||||
|
report_fatal_error("Coroutines cannot handle non static allocas yet");
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
return Builder.CreateInBoundsGEP(FrameTy, FramePtr, Indices);
|
||||||
|
};
|
||||||
|
|
||||||
// Create a load instruction to reload the spilled value from the coroutine
|
// Create a load instruction to reload the spilled value from the coroutine
|
||||||
// frame.
|
// frame.
|
||||||
auto CreateReload = [&](Instruction *InsertBefore) {
|
auto CreateReload = [&](Instruction *InsertBefore) {
|
||||||
assert(Index && "accessing unassigned field number");
|
assert(Index && "accessing unassigned field number");
|
||||||
Builder.SetInsertPoint(InsertBefore);
|
Builder.SetInsertPoint(InsertBefore);
|
||||||
auto *G = Builder.CreateConstInBoundsGEP2_32(FrameTy, FramePtr, 0, Index,
|
|
||||||
CurrentValue->getName() +
|
auto *G = GetFramePointer(Index, CurrentValue);
|
||||||
Twine(".reload.addr"));
|
G->setName(CurrentValue->getName() + Twine(".reload.addr"));
|
||||||
|
|
||||||
return isa<AllocaInst>(CurrentValue)
|
return isa<AllocaInst>(CurrentValue)
|
||||||
? G
|
? G
|
||||||
: Builder.CreateLoad(FrameTy->getElementType(Index), G,
|
: Builder.CreateLoad(FrameTy->getElementType(Index), G,
|
||||||
@ -588,8 +621,8 @@ static Instruction *insertSpills(SpillInfo &Spills, coro::Shape &Shape) {
|
|||||||
Builder.SetInsertPoint(&Shape.AllocaSpillBlock->front());
|
Builder.SetInsertPoint(&Shape.AllocaSpillBlock->front());
|
||||||
// If we found any allocas, replace all of their remaining uses with Geps.
|
// If we found any allocas, replace all of their remaining uses with Geps.
|
||||||
for (auto &P : Allocas) {
|
for (auto &P : Allocas) {
|
||||||
auto *G =
|
auto *G = GetFramePointer(P.second, P.first);
|
||||||
Builder.CreateConstInBoundsGEP2_32(FrameTy, FramePtr, 0, P.second);
|
|
||||||
// We are not using ReplaceInstWithInst(P.first, cast<Instruction>(G)) here,
|
// We are not using ReplaceInstWithInst(P.first, cast<Instruction>(G)) here,
|
||||||
// as we are changing location of the instruction.
|
// as we are changing location of the instruction.
|
||||||
G->takeName(P.first);
|
G->takeName(P.first);
|
||||||
|
72
test/Transforms/Coroutines/coro-frame-arrayalloca.ll
Normal file
72
test/Transforms/Coroutines/coro-frame-arrayalloca.ll
Normal file
@ -0,0 +1,72 @@
|
|||||||
|
; Check that we can handle spills of array allocas
|
||||||
|
; RUN: opt < %s -coro-split -S | FileCheck %s
|
||||||
|
|
||||||
|
declare void @consume.double.ptr(double*)
|
||||||
|
declare void @consume.i32.ptr(i32*)
|
||||||
|
|
||||||
|
define i8* @f() "coroutine.presplit"="1" {
|
||||||
|
entry:
|
||||||
|
%prefix = alloca double
|
||||||
|
%data = alloca i32, i32 4
|
||||||
|
%suffix = alloca double
|
||||||
|
%id = call token @llvm.coro.id(i32 0, i8* null, i8* null, i8* null)
|
||||||
|
%size = call i32 @llvm.coro.size.i32()
|
||||||
|
%alloc = call i8* @malloc(i32 %size)
|
||||||
|
%hdl = call i8* @llvm.coro.begin(token %id, i8* %alloc)
|
||||||
|
call void @consume.double.ptr(double* %prefix)
|
||||||
|
call void @consume.i32.ptr(i32* %data)
|
||||||
|
call void @consume.double.ptr(double* %suffix)
|
||||||
|
%0 = call i8 @llvm.coro.suspend(token none, i1 false)
|
||||||
|
switch i8 %0, label %suspend [i8 0, label %resume
|
||||||
|
i8 1, label %cleanup]
|
||||||
|
resume:
|
||||||
|
call void @consume.double.ptr(double* %prefix)
|
||||||
|
call void @consume.i32.ptr(i32* %data)
|
||||||
|
call void @consume.double.ptr(double* %suffix)
|
||||||
|
br label %cleanup
|
||||||
|
|
||||||
|
cleanup:
|
||||||
|
%mem = call i8* @llvm.coro.free(token %id, i8* %hdl)
|
||||||
|
call void @free(i8* %mem)
|
||||||
|
br label %suspend
|
||||||
|
suspend:
|
||||||
|
call i1 @llvm.coro.end(i8* %hdl, i1 0)
|
||||||
|
ret i8* %hdl
|
||||||
|
}
|
||||||
|
|
||||||
|
; See if the array alloca was stored as an array field.
|
||||||
|
; CHECK-LABEL: %f.Frame = type { void (%f.Frame*)*, void (%f.Frame*)*, i1, i1, double, [4 x i32], double }
|
||||||
|
|
||||||
|
; See if we used correct index to access prefix, data, suffix (@f)
|
||||||
|
; CHECK-LABEL: @f(
|
||||||
|
; CHECK: %prefix = getelementptr inbounds %f.Frame, %f.Frame* %FramePtr, i32 0, i32 4
|
||||||
|
; CHECK-NEXT: %data = getelementptr inbounds %f.Frame, %f.Frame* %FramePtr, i32 0, i32 5
|
||||||
|
; CHECK-NEXT: %suffix = getelementptr inbounds %f.Frame, %f.Frame* %FramePtr, i32 0, i32 6
|
||||||
|
; CHECK-NEXT: call void @consume.double.ptr(double* %prefix)
|
||||||
|
; CHECK-NEXT: call void @consume.i32.ptr(i32* %data)
|
||||||
|
; CHECK-NEXT: call void @consume.double.ptr(double* %suffix)
|
||||||
|
; CHECK: ret i8*
|
||||||
|
|
||||||
|
; See if we used correct index to access prefix, data, suffix (@f.resume)
|
||||||
|
; CHECK-LABEL: @f.resume(
|
||||||
|
; CHECK: %[[SUFFIX:.+]] = getelementptr inbounds %f.Frame, %f.Frame* %FramePtr, i32 0, i32 6
|
||||||
|
; CHECK: %[[DATA:.+]] = getelementptr inbounds %f.Frame, %f.Frame* %FramePtr, i32 0, i32 5
|
||||||
|
; CHECK: %[[PREFIX:.+]] = getelementptr inbounds %f.Frame, %f.Frame* %FramePtr, i32 0, i32 4
|
||||||
|
; CHECK: call void @consume.double.ptr(double* %[[PREFIX]])
|
||||||
|
; CHECK-NEXT: call void @consume.i32.ptr(i32* %[[DATA]])
|
||||||
|
; CHECK-NEXT: call void @consume.double.ptr(double* %[[SUFFIX]])
|
||||||
|
|
||||||
|
declare i8* @llvm.coro.free(token, i8*)
|
||||||
|
declare i32 @llvm.coro.size.i32()
|
||||||
|
declare i8 @llvm.coro.suspend(token, i1)
|
||||||
|
declare void @llvm.coro.resume(i8*)
|
||||||
|
declare void @llvm.coro.destroy(i8*)
|
||||||
|
|
||||||
|
declare token @llvm.coro.id(i32, i8*, i8*, i8*)
|
||||||
|
declare i1 @llvm.coro.alloc(token)
|
||||||
|
declare i8* @llvm.coro.begin(token, i8*)
|
||||||
|
declare i1 @llvm.coro.end(i8*, i1)
|
||||||
|
|
||||||
|
declare noalias i8* @malloc(i32)
|
||||||
|
declare double @print(double)
|
||||||
|
declare void @free(i8*)
|
Loading…
x
Reference in New Issue
Block a user