| author | Dimitry Andric <dim@FreeBSD.org> | 2022-01-27 22:06:42 +0000 |
|---|---|---|
| committer | Dimitry Andric <dim@FreeBSD.org> | 2022-01-27 22:06:42 +0000 |
| commit | 6f8fc217eaa12bf657be1c6468ed9938d10168b3 | |
| tree | a1fd89b864d9b93e2ad68fe1dcf7afee2e3c8d76 | /llvm/lib/Transforms/Coroutines |
| parent | 77fc4c146f0870ffb09c1afb823ccbe742c5e6ff | |
Diffstat (limited to 'llvm/lib/Transforms/Coroutines')
| -rw-r--r-- | llvm/lib/Transforms/Coroutines/CoroEarly.cpp | 11 |
| -rw-r--r-- | llvm/lib/Transforms/Coroutines/CoroFrame.cpp | 12 |
| -rw-r--r-- | llvm/lib/Transforms/Coroutines/CoroInstr.h | 12 |
| -rw-r--r-- | llvm/lib/Transforms/Coroutines/CoroInternal.h | 14 |
| -rw-r--r-- | llvm/lib/Transforms/Coroutines/CoroSplit.cpp | 167 |
| -rw-r--r-- | llvm/lib/Transforms/Coroutines/Coroutines.cpp | 22 |
6 files changed, 161 insertions, 77 deletions
diff --git a/llvm/lib/Transforms/Coroutines/CoroEarly.cpp b/llvm/lib/Transforms/Coroutines/CoroEarly.cpp
index 68a34bdcb1cd..1533e1805f17 100644
--- a/llvm/lib/Transforms/Coroutines/CoroEarly.cpp
+++ b/llvm/lib/Transforms/Coroutines/CoroEarly.cpp
@@ -176,11 +176,14 @@ bool Lowerer::lowerEarlyIntrinsics(Function &F) {
       lowerCoroNoop(cast<IntrinsicInst>(&I));
       break;
     case Intrinsic::coro_id:
-      // Mark a function that comes out of the frontend that has a coro.id
-      // with a coroutine attribute.
       if (auto *CII = cast<CoroIdInst>(&I)) {
         if (CII->getInfo().isPreSplit()) {
-          F.addFnAttr(CORO_PRESPLIT_ATTR, UNPREPARED_FOR_SPLIT);
+          assert(F.hasFnAttribute(CORO_PRESPLIT_ATTR) &&
+                 F.getFnAttribute(CORO_PRESPLIT_ATTR).getValueAsString() ==
+                     UNPREPARED_FOR_SPLIT &&
+                 "The frontend uses Swtich-Resumed ABI should emit "
+                 "\"coroutine.presplit\" attribute with value \"0\" for the "
+                 "coroutine.");
           setCannotDuplicate(CII);
           CII->setCoroutineSelf();
           CoroId = cast<CoroIdInst>(&I);
@@ -190,6 +193,8 @@ bool Lowerer::lowerEarlyIntrinsics(Function &F) {
     case Intrinsic::coro_id_retcon:
     case Intrinsic::coro_id_retcon_once:
     case Intrinsic::coro_id_async:
+      // TODO: Remove the line once we support it in the corresponding
+      // frontend.
       F.addFnAttr(CORO_PRESPLIT_ATTR, PREPARED_FOR_SPLIT);
       break;
     case Intrinsic::coro_resume:
diff --git a/llvm/lib/Transforms/Coroutines/CoroFrame.cpp b/llvm/lib/Transforms/Coroutines/CoroFrame.cpp
index a0d12865bd3a..92acfb93057a 100644
--- a/llvm/lib/Transforms/Coroutines/CoroFrame.cpp
+++ b/llvm/lib/Transforms/Coroutines/CoroFrame.cpp
@@ -587,7 +587,7 @@ void FrameTypeBuilder::addFieldForAllocas(const Function &F,
     }
   });
 
-  if (!Shape.ReuseFrameSlot && !EnableReuseStorageInFrame) {
+  if (!Shape.OptimizeFrame && !EnableReuseStorageInFrame) {
     for (const auto &A : FrameData.Allocas) {
       AllocaInst *Alloca = A.Alloca;
       NonOverlapedAllocas.emplace_back(AllocaSetType(1, Alloca));
@@ -808,7 +808,7 @@ static StringRef solveTypeName(Type *Ty) {
 
   if (Ty->isPointerTy()) {
     auto *PtrTy = cast<PointerType>(Ty);
-    Type *PointeeTy = PtrTy->getElementType();
+    Type *PointeeTy = PtrTy->getPointerElementType();
     auto Name = solveTypeName(PointeeTy);
     if (Name == "UnknownType")
       return "PointerType";
@@ -1659,7 +1659,7 @@ static Instruction *insertSpills(const FrameDataInfo &FrameData,
                            &*Builder.GetInsertPoint());
       // This dbg.declare is for the main function entry point. It
       // will be deleted in all coro-split functions.
-      coro::salvageDebugInfo(DbgPtrAllocaCache, DDI, Shape.ReuseFrameSlot);
+      coro::salvageDebugInfo(DbgPtrAllocaCache, DDI, Shape.OptimizeFrame);
     }
   }
 
@@ -2278,7 +2278,7 @@ static void eliminateSwiftErrorArgument(Function &F, Argument &Arg,
   IRBuilder<> Builder(F.getEntryBlock().getFirstNonPHIOrDbg());
 
   auto ArgTy = cast<PointerType>(Arg.getType());
-  auto ValueTy = ArgTy->getElementType();
+  auto ValueTy = ArgTy->getPointerElementType();
 
   // Reduce to the alloca case:
 
@@ -2506,7 +2506,7 @@ static void collectFrameAllocas(Function &F, coro::Shape &Shape,
 
 void coro::salvageDebugInfo(
     SmallDenseMap<llvm::Value *, llvm::AllocaInst *, 4> &DbgPtrAllocaCache,
-    DbgVariableIntrinsic *DVI, bool ReuseFrameSlot) {
+    DbgVariableIntrinsic *DVI, bool OptimizeFrame) {
   Function *F = DVI->getFunction();
   IRBuilder<> Builder(F->getContext());
   auto InsertPt = F->getEntryBlock().getFirstInsertionPt();
@@ -2558,7 +2558,7 @@ void coro::salvageDebugInfo(
   //
   // Avoid to create the alloca would be eliminated by optimization
   // passes and the corresponding dbg.declares would be invalid.
-  if (!ReuseFrameSlot && !EnableReuseStorageInFrame)
+  if (!OptimizeFrame && !EnableReuseStorageInFrame)
     if (auto *Arg = dyn_cast<llvm::Argument>(Storage)) {
       auto &Cached = DbgPtrAllocaCache[Storage];
       if (!Cached) {
diff --git a/llvm/lib/Transforms/Coroutines/CoroInstr.h b/llvm/lib/Transforms/Coroutines/CoroInstr.h
index bf3d781ba43e..014938c15a0a 100644
--- a/llvm/lib/Transforms/Coroutines/CoroInstr.h
+++ b/llvm/lib/Transforms/Coroutines/CoroInstr.h
@@ -599,6 +599,18 @@ public:
   }
 };
 
+/// This represents the llvm.coro.align instruction.
+class LLVM_LIBRARY_VISIBILITY CoroAlignInst : public IntrinsicInst {
+public:
+  // Methods to support type inquiry through isa, cast, and dyn_cast:
+  static bool classof(const IntrinsicInst *I) {
+    return I->getIntrinsicID() == Intrinsic::coro_align;
+  }
+  static bool classof(const Value *V) {
+    return isa<IntrinsicInst>(V) && classof(cast<IntrinsicInst>(V));
+  }
+};
+
 class LLVM_LIBRARY_VISIBILITY AnyCoroEndInst : public IntrinsicInst {
   enum { FrameArg, UnwindArg };
 
diff --git a/llvm/lib/Transforms/Coroutines/CoroInternal.h b/llvm/lib/Transforms/Coroutines/CoroInternal.h
index 27ba8524f975..9a17068df3a9 100644
--- a/llvm/lib/Transforms/Coroutines/CoroInternal.h
+++ b/llvm/lib/Transforms/Coroutines/CoroInternal.h
@@ -36,6 +36,11 @@ void initializeCoroCleanupLegacyPass(PassRegistry &);
 // adds coroutine subfunctions to the SCC to be processed by IPO pipeline.
 // Async lowering similarily triggers a restart of the pipeline after it has
 // split the coroutine.
+//
+// FIXME: Refactor these attributes as LLVM attributes instead of string
+// attributes since these attributes are already used outside LLVM's
+// coroutine module.
+// FIXME: Remove these values once we remove the Legacy PM.
 #define CORO_PRESPLIT_ATTR "coroutine.presplit"
 #define UNPREPARED_FOR_SPLIT "0"
 #define PREPARED_FOR_SPLIT "1"
@@ -54,7 +59,7 @@ void updateCallGraph(Function &Caller, ArrayRef<Function *> Funcs,
 /// holding a pointer to the coroutine frame.
 void salvageDebugInfo(
     SmallDenseMap<llvm::Value *, llvm::AllocaInst *, 4> &DbgPtrAllocaCache,
-    DbgVariableIntrinsic *DVI, bool ReuseFrameSlot);
+    DbgVariableIntrinsic *DVI, bool OptimizeFrame);
 
 // Keeps data and helper functions for lowering coroutine intrinsics.
 struct LowererBase {
@@ -99,6 +104,7 @@ struct LLVM_LIBRARY_VISIBILITY Shape {
   CoroBeginInst *CoroBegin;
   SmallVector<AnyCoroEndInst *, 4> CoroEnds;
   SmallVector<CoroSizeInst *, 2> CoroSizes;
+  SmallVector<CoroAlignInst *, 2> CoroAligns;
   SmallVector<AnyCoroSuspendInst *, 4> CoroSuspends;
   SmallVector<CallInst*, 2> SwiftErrorOps;
 
@@ -126,7 +132,7 @@ struct LLVM_LIBRARY_VISIBILITY Shape {
   BasicBlock *AllocaSpillBlock;
 
   /// This would only be true if optimization are enabled.
-  bool ReuseFrameSlot;
+  bool OptimizeFrame;
 
   struct SwitchLoweringStorage {
     SwitchInst *ResumeSwitch;
@@ -272,8 +278,8 @@ struct LLVM_LIBRARY_VISIBILITY Shape {
   void emitDealloc(IRBuilder<> &Builder, Value *Ptr, CallGraph *CG) const;
 
   Shape() = default;
-  explicit Shape(Function &F, bool ReuseFrameSlot = false)
-      : ReuseFrameSlot(ReuseFrameSlot) {
+  explicit Shape(Function &F, bool OptimizeFrame = false)
+      : OptimizeFrame(OptimizeFrame) {
     buildFrom(F);
   }
   void buildFrom(Function &F);
diff --git a/llvm/lib/Transforms/Coroutines/CoroSplit.cpp b/llvm/lib/Transforms/Coroutines/CoroSplit.cpp
index 12c1829524ef..b5129809c6a6 100644
--- a/llvm/lib/Transforms/Coroutines/CoroSplit.cpp
+++ b/llvm/lib/Transforms/Coroutines/CoroSplit.cpp
@@ -29,6 +29,7 @@
 #include "llvm/Analysis/CFG.h"
 #include "llvm/Analysis/CallGraph.h"
 #include "llvm/Analysis/CallGraphSCCPass.h"
+#include "llvm/Analysis/ConstantFolding.h"
 #include "llvm/Analysis/LazyCallGraph.h"
 #include "llvm/IR/Argument.h"
 #include "llvm/IR/Attributes.h"
@@ -617,7 +618,8 @@ static void replaceSwiftErrorOps(Function &F, coro::Shape &Shape,
   Value *CachedSlot = nullptr;
   auto getSwiftErrorSlot = [&](Type *ValueTy) -> Value * {
     if (CachedSlot) {
-      assert(CachedSlot->getType()->getPointerElementType() == ValueTy &&
+      assert(cast<PointerType>(CachedSlot->getType())
+                 ->isOpaqueOrPointeeTypeMatches(ValueTy) &&
              "multiple swifterror slots in function with different types");
       return CachedSlot;
     }
@@ -626,7 +628,8 @@ static void replaceSwiftErrorOps(Function &F, coro::Shape &Shape,
     for (auto &Arg : F.args()) {
       if (Arg.isSwiftError()) {
         CachedSlot = &Arg;
-        assert(Arg.getType()->getPointerElementType() == ValueTy &&
+        assert(cast<PointerType>(Arg.getType())
+                   ->isOpaqueOrPointeeTypeMatches(ValueTy) &&
                "swifterror argument does not have expected type");
         return &Arg;
       }
@@ -682,7 +685,7 @@ void CoroCloner::salvageDebugInfo() {
       if (auto *DVI = dyn_cast<DbgVariableIntrinsic>(&I))
         Worklist.push_back(DVI);
   for (DbgVariableIntrinsic *DVI : Worklist)
-    coro::salvageDebugInfo(DbgPtrAllocaCache, DVI, Shape.ReuseFrameSlot);
+    coro::salvageDebugInfo(DbgPtrAllocaCache, DVI, Shape.OptimizeFrame);
 
   // Remove all salvaged dbg.declare intrinsics that became
   // either unreachable or stale due to the CoroSplit transformation.
@@ -835,7 +838,7 @@ Value *CoroCloner::deriveNewFramePointer() {
 static void addFramePointerAttrs(AttributeList &Attrs, LLVMContext &Context,
                                  unsigned ParamIndex, uint64_t Size,
                                  Align Alignment) {
-  AttrBuilder ParamAttrs;
+  AttrBuilder ParamAttrs(Context);
   ParamAttrs.addAttribute(Attribute::NonNull);
   ParamAttrs.addAttribute(Attribute::NoAlias);
   ParamAttrs.addAlignmentAttr(Alignment);
@@ -845,14 +848,14 @@ static void addFramePointerAttrs(AttributeList &Attrs, LLVMContext &Context,
 
 static void addAsyncContextAttrs(AttributeList &Attrs, LLVMContext &Context,
                                  unsigned ParamIndex) {
-  AttrBuilder ParamAttrs;
+  AttrBuilder ParamAttrs(Context);
   ParamAttrs.addAttribute(Attribute::SwiftAsync);
   Attrs = Attrs.addParamAttributes(Context, ParamIndex, ParamAttrs);
 }
 
 static void addSwiftSelfAttrs(AttributeList &Attrs, LLVMContext &Context,
                               unsigned ParamIndex) {
-  AttrBuilder ParamAttrs;
+  AttrBuilder ParamAttrs(Context);
   ParamAttrs.addAttribute(Attribute::SwiftSelf);
   Attrs = Attrs.addParamAttributes(Context, ParamIndex, ParamAttrs);
 }
@@ -929,7 +932,7 @@ void CoroCloner::create() {
   case coro::ABI::Switch:
     // Bootstrap attributes by copying function attributes from the
     // original function. This should include optimization settings and so on.
-    NewAttrs = NewAttrs.addFnAttributes(Context, OrigAttrs.getFnAttrs());
+    NewAttrs = NewAttrs.addFnAttributes(Context, AttrBuilder(Context, OrigAttrs.getFnAttrs()));
 
     addFramePointerAttrs(NewAttrs, Context, 0, Shape.FrameSize,
                          Shape.FrameAlign);
@@ -952,7 +955,7 @@ void CoroCloner::create() {
 
     // Transfer the original function's attributes.
     auto FnAttrs = OrigF.getAttributes().getFnAttrs();
-    NewAttrs = NewAttrs.addFnAttributes(Context, FnAttrs);
+    NewAttrs = NewAttrs.addFnAttributes(Context, AttrBuilder(Context, FnAttrs));
     break;
   }
   case coro::ABI::Retcon:
@@ -1082,10 +1085,16 @@ static void updateAsyncFuncPointerContextSize(coro::Shape &Shape) {
   Shape.AsyncLowering.AsyncFuncPointer->setInitializer(NewFuncPtrStruct);
 }
 
-static void replaceFrameSize(coro::Shape &Shape) {
+static void replaceFrameSizeAndAlignment(coro::Shape &Shape) {
   if (Shape.ABI == coro::ABI::Async)
     updateAsyncFuncPointerContextSize(Shape);
 
+  for (CoroAlignInst *CA : Shape.CoroAligns) {
+    CA->replaceAllUsesWith(
+        ConstantInt::get(CA->getType(), Shape.FrameAlign.value()));
+    CA->eraseFromParent();
+  }
+
   if (Shape.CoroSizes.empty())
     return;
 
@@ -1197,10 +1206,34 @@ scanPHIsAndUpdateValueMap(Instruction *Prev, BasicBlock *NewBlock,
 static bool simplifyTerminatorLeadingToRet(Instruction *InitialInst) {
   DenseMap<Value *, Value *> ResolvedValues;
   BasicBlock *UnconditionalSucc = nullptr;
+  assert(InitialInst->getModule());
+  const DataLayout &DL = InitialInst->getModule()->getDataLayout();
+
+  auto GetFirstValidInstruction = [](Instruction *I) {
+    while (I) {
+      // BitCastInst wouldn't generate actual code so that we could skip it.
+      if (isa<BitCastInst>(I) || I->isDebugOrPseudoInst() ||
+          I->isLifetimeStartOrEnd())
+        I = I->getNextNode();
+      else if (isInstructionTriviallyDead(I))
+        // Duing we are in the middle of the transformation, we need to erase
+        // the dead instruction manually.
+        I = &*I->eraseFromParent();
+      else
+        break;
+    }
+    return I;
+  };
+
+  auto TryResolveConstant = [&ResolvedValues](Value *V) {
+    auto It = ResolvedValues.find(V);
+    if (It != ResolvedValues.end())
+      V = It->second;
+    return dyn_cast<ConstantInt>(V);
+  };
 
   Instruction *I = InitialInst;
-  while (I->isTerminator() ||
-         (isa<CmpInst>(I) && I->getNextNode()->isTerminator())) {
+  while (I->isTerminator() || isa<CmpInst>(I)) {
     if (isa<ReturnInst>(I)) {
       if (I != InitialInst) {
         // If InitialInst is an unconditional branch,
@@ -1213,48 +1246,68 @@ static bool simplifyTerminatorLeadingToRet(Instruction *InitialInst) {
     }
     if (auto *BR = dyn_cast<BranchInst>(I)) {
       if (BR->isUnconditional()) {
-        BasicBlock *BB = BR->getSuccessor(0);
+        BasicBlock *Succ = BR->getSuccessor(0);
         if (I == InitialInst)
-          UnconditionalSucc = BB;
-        scanPHIsAndUpdateValueMap(I, BB, ResolvedValues);
-        I = BB->getFirstNonPHIOrDbgOrLifetime();
+          UnconditionalSucc = Succ;
+        scanPHIsAndUpdateValueMap(I, Succ, ResolvedValues);
+        I = GetFirstValidInstruction(Succ->getFirstNonPHIOrDbgOrLifetime());
         continue;
       }
-    } else if (auto *CondCmp = dyn_cast<CmpInst>(I)) {
-      auto *BR = dyn_cast<BranchInst>(I->getNextNode());
-      if (BR && BR->isConditional() && CondCmp == BR->getCondition()) {
-        // If the case number of suspended switch instruction is reduced to
-        // 1, then it is simplified to CmpInst in llvm::ConstantFoldTerminator.
-        // And the comparsion looks like : %cond = icmp eq i8 %V, constant.
-        ConstantInt *CondConst = dyn_cast<ConstantInt>(CondCmp->getOperand(1));
-        if (CondConst && CondCmp->getPredicate() == CmpInst::ICMP_EQ) {
-          Value *V = CondCmp->getOperand(0);
-          auto it = ResolvedValues.find(V);
-          if (it != ResolvedValues.end())
-            V = it->second;
-
-          if (ConstantInt *Cond0 = dyn_cast<ConstantInt>(V)) {
-            BasicBlock *BB = Cond0->equalsInt(CondConst->getZExtValue())
-                                 ? BR->getSuccessor(0)
-                                 : BR->getSuccessor(1);
-            scanPHIsAndUpdateValueMap(I, BB, ResolvedValues);
-            I = BB->getFirstNonPHIOrDbgOrLifetime();
-            continue;
-          }
-        }
-      }
-    } else if (auto *SI = dyn_cast<SwitchInst>(I)) {
-      Value *V = SI->getCondition();
-      auto it = ResolvedValues.find(V);
-      if (it != ResolvedValues.end())
-        V = it->second;
-      if (ConstantInt *Cond = dyn_cast<ConstantInt>(V)) {
-        BasicBlock *BB = SI->findCaseValue(Cond)->getCaseSuccessor();
-        scanPHIsAndUpdateValueMap(I, BB, ResolvedValues);
-        I = BB->getFirstNonPHIOrDbgOrLifetime();
+
+      BasicBlock *BB = BR->getParent();
+      // Handle the case the condition of the conditional branch is constant.
+      // e.g.,
+      //
+      //  br i1 false, label %cleanup, label %CoroEnd
+      //
+      // It is possible during the transformation. We could continue the
+      // simplifying in this case.
+      if (ConstantFoldTerminator(BB, /*DeleteDeadConditions=*/true)) {
+        // Handle this branch in next iteration.
+        I = BB->getTerminator();
         continue;
       }
+    } else if (auto *CondCmp = dyn_cast<CmpInst>(I)) {
+      // If the case number of suspended switch instruction is reduced to
+      // 1, then it is simplified to CmpInst in llvm::ConstantFoldTerminator.
+      auto *BR = dyn_cast<BranchInst>(
+          GetFirstValidInstruction(CondCmp->getNextNode()));
+      if (!BR || !BR->isConditional() || CondCmp != BR->getCondition())
+        return false;
+
+      // And the comparsion looks like : %cond = icmp eq i8 %V, constant.
+      // So we try to resolve constant for the first operand only since the
+      // second operand should be literal constant by design.
+      ConstantInt *Cond0 = TryResolveConstant(CondCmp->getOperand(0));
+      auto *Cond1 = dyn_cast<ConstantInt>(CondCmp->getOperand(1));
+      if (!Cond0 || !Cond1)
+        return false;
+
+      // Both operands of the CmpInst are Constant. So that we could evaluate
+      // it immediately to get the destination.
+      auto *ConstResult =
+          dyn_cast_or_null<ConstantInt>(ConstantFoldCompareInstOperands(
+              CondCmp->getPredicate(), Cond0, Cond1, DL));
+      if (!ConstResult)
+        return false;
+
+      CondCmp->replaceAllUsesWith(ConstResult);
+      CondCmp->eraseFromParent();
+
+      // Handle this branch in next iteration.
+      I = BR;
+      continue;
+    } else if (auto *SI = dyn_cast<SwitchInst>(I)) {
+      ConstantInt *Cond = TryResolveConstant(SI->getCondition());
+      if (!Cond)
+        return false;
+
+      BasicBlock *BB = SI->findCaseValue(Cond)->getCaseSuccessor();
+      scanPHIsAndUpdateValueMap(I, BB, ResolvedValues);
+      I = GetFirstValidInstruction(BB->getFirstNonPHIOrDbgOrLifetime());
+      continue;
     }
+
     return false;
   }
   return false;
@@ -1826,20 +1879,20 @@ namespace {
 
 static coro::Shape splitCoroutine(Function &F,
                                   SmallVectorImpl<Function *> &Clones,
-                                  bool ReuseFrameSlot) {
+                                  bool OptimizeFrame) {
   PrettyStackTraceFunction prettyStackTrace(F);
 
   // The suspend-crossing algorithm in buildCoroutineFrame get tripped
   // up by uses in unreachable blocks, so remove them as a first pass.
   removeUnreachableBlocks(F);
 
-  coro::Shape Shape(F, ReuseFrameSlot);
+  coro::Shape Shape(F, OptimizeFrame);
   if (!Shape.CoroBegin)
     return Shape;
 
   simplifySuspendPoints(Shape);
   buildCoroutineFrame(F, Shape);
-  replaceFrameSize(Shape);
+  replaceFrameSizeAndAlignment(Shape);
 
   // If there are no suspend points, no split required, just remove
   // the allocation and deallocation blocks, they are not needed.
@@ -2165,7 +2218,7 @@ PreservedAnalyses CoroSplitPass::run(LazyCallGraph::SCC &C,
     F.removeFnAttr(CORO_PRESPLIT_ATTR);
 
     SmallVector<Function *, 4> Clones;
-    const coro::Shape Shape = splitCoroutine(F, Clones, ReuseFrameSlot);
+    const coro::Shape Shape = splitCoroutine(F, Clones, OptimizeFrame);
     updateCallGraphAfterCoroutineSplit(*N, Shape, Clones, C, CG, AM, UR, FAM);
 
     if (!Shape.CoroSuspends.empty()) {
@@ -2198,13 +2251,13 @@ namespace {
 struct CoroSplitLegacy : public CallGraphSCCPass {
   static char ID; // Pass identification, replacement for typeid
 
-  CoroSplitLegacy(bool ReuseFrameSlot = false)
-      : CallGraphSCCPass(ID), ReuseFrameSlot(ReuseFrameSlot) {
+  CoroSplitLegacy(bool OptimizeFrame = false)
+      : CallGraphSCCPass(ID), OptimizeFrame(OptimizeFrame) {
     initializeCoroSplitLegacyPass(*PassRegistry::getPassRegistry());
   }
 
   bool Run = false;
-  bool ReuseFrameSlot;
+  bool OptimizeFrame;
 
   // A coroutine is identified by the presence of coro.begin intrinsic, if
   // we don't have any, this pass has nothing to do.
@@ -2263,7 +2316,7 @@ struct CoroSplitLegacy : public CallGraphSCCPass {
       F->removeFnAttr(CORO_PRESPLIT_ATTR);
 
       SmallVector<Function *, 4> Clones;
-      const coro::Shape Shape = splitCoroutine(*F, Clones, ReuseFrameSlot);
+      const coro::Shape Shape = splitCoroutine(*F, Clones, OptimizeFrame);
       updateCallGraphAfterCoroutineSplit(*F, Shape, Clones, CG, SCC);
       if (Shape.ABI == coro::ABI::Async) {
         // Restart SCC passes.
@@ -2300,6 +2353,6 @@ INITIALIZE_PASS_END(
     "Split coroutine into a set of functions driving its state machine", false,
     false)
 
-Pass *llvm::createCoroSplitLegacyPass(bool ReuseFrameSlot) {
-  return new CoroSplitLegacy(ReuseFrameSlot);
+Pass *llvm::createCoroSplitLegacyPass(bool OptimizeFrame) {
+  return new CoroSplitLegacy(OptimizeFrame);
 }
diff --git a/llvm/lib/Transforms/Coroutines/Coroutines.cpp b/llvm/lib/Transforms/Coroutines/Coroutines.cpp
index fba8b03e44ba..965a146c143f 100644
--- a/llvm/lib/Transforms/Coroutines/Coroutines.cpp
+++ b/llvm/lib/Transforms/Coroutines/Coroutines.cpp
@@ -123,6 +123,7 @@ Value *coro::LowererBase::makeSubFnCall(Value *Arg, int Index,
 static bool isCoroutineIntrinsicName(StringRef Name) {
   // NOTE: Must be sorted!
   static const char *const CoroIntrinsics[] = {
+      "llvm.coro.align",
       "llvm.coro.alloc",
       "llvm.coro.async.context.alloc",
       "llvm.coro.async.context.dealloc",
@@ -268,6 +269,9 @@ void coro::Shape::buildFrom(Function &F) {
         case Intrinsic::coro_size:
           CoroSizes.push_back(cast<CoroSizeInst>(II));
           break;
+        case Intrinsic::coro_align:
+          CoroAligns.push_back(cast<CoroAlignInst>(II));
+          break;
         case Intrinsic::coro_frame:
           CoroFrames.push_back(cast<CoroFrameInst>(II));
           break;
@@ -672,8 +676,11 @@ static void checkAsyncFuncPointer(const Instruction *I, Value *V) {
   if (!AsyncFuncPtrAddr)
     fail(I, "llvm.coro.id.async async function pointer not a global", V);
 
-  auto *StructTy =
-      cast<StructType>(AsyncFuncPtrAddr->getType()->getPointerElementType());
+  if (AsyncFuncPtrAddr->getType()->isOpaquePointerTy())
+    return;
+
+  auto *StructTy = cast<StructType>(
+      AsyncFuncPtrAddr->getType()->getNonOpaquePointerElementType());
   if (StructTy->isOpaque() || !StructTy->isPacked() ||
       StructTy->getNumElements() != 2 ||
       !StructTy->getElementType(0)->isIntegerTy(32) ||
@@ -697,14 +704,16 @@ void CoroIdAsyncInst::checkWellFormed() const {
 static void checkAsyncContextProjectFunction(const Instruction *I,
                                              Function *F) {
   auto *FunTy = cast<FunctionType>(F->getValueType());
-  if (!FunTy->getReturnType()->isPointerTy() ||
-      !FunTy->getReturnType()->getPointerElementType()->isIntegerTy(8))
+  Type *Int8Ty = Type::getInt8Ty(F->getContext());
+  auto *RetPtrTy = dyn_cast<PointerType>(FunTy->getReturnType());
+  if (!RetPtrTy || !RetPtrTy->isOpaqueOrPointeeTypeMatches(Int8Ty))
     fail(I,
          "llvm.coro.suspend.async resume function projection function must "
         "return an i8* type",
         F);
   if (FunTy->getNumParams() != 1 || !FunTy->getParamType(0)->isPointerTy() ||
-      !FunTy->getParamType(0)->getPointerElementType()->isIntegerTy(8))
+      !cast<PointerType>(FunTy->getParamType(0))
+           ->isOpaqueOrPointeeTypeMatches(Int8Ty))
     fail(I,
          "llvm.coro.suspend.async resume function projection function must "
         "take one i8* type as parameter",
@@ -719,8 +728,7 @@ void CoroAsyncEndInst::checkWellFormed() const {
   auto *MustTailCallFunc = getMustTailCallFunction();
   if (!MustTailCallFunc)
     return;
-  auto *FnTy =
-      cast<FunctionType>(MustTailCallFunc->getType()->getPointerElementType());
+  auto *FnTy = MustTailCallFunc->getFunctionType();
   if (FnTy->getNumParams() != (arg_size() - 3))
     fail(this,
          "llvm.coro.end.async must tail call function argument type must "
