mirror of
https://github.com/apple/swift.git
synced 2025-12-21 12:14:44 +01:00
This follows the model of dominance info and allows me to create reachability methods on SILBasicBlock without creating dependencies from swiftSIL to swiftSILAnalysis. Swift SVN r21866
392 lines
14 KiB
C++
392 lines
14 KiB
C++
//===-- ClosureSpecializer.cpp ------ Performs Closure Specialization----===//
|
|
//
|
|
// This source file is part of the Swift.org open source project
|
|
//
|
|
// Copyright (c) 2014 - 2015 Apple Inc. and the Swift project authors
|
|
// Licensed under Apache License v2.0 with Runtime Library Exception
|
|
//
|
|
// See http://swift.org/LICENSE.txt for license information
|
|
// See http://swift.org/CONTRIBUTORS.txt for the list of Swift project authors
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
#define DEBUG_TYPE "closure-specialization"
|
|
#include "swift/SIL/SILCloner.h"
|
|
#include "swift/SIL/SILFunction.h"
|
|
#include "swift/SIL/SILInstruction.h"
|
|
#include "swift/SIL/SILModule.h"
|
|
#include "swift/SILAnalysis/CallGraphAnalysis.h"
|
|
#include "swift/SILAnalysis/LoopAnalysis.h"
|
|
#include "swift/SILPasses/Passes.h"
|
|
#include "swift/SILPasses/Transforms.h"
|
|
#include "llvm/ADT/Statistic.h"
|
|
#include "llvm/ADT/SmallString.h"
|
|
#include "llvm/Support/Debug.h"
|
|
|
|
using namespace swift;
|
|
|
|
STATISTIC(NumClosureSpecialized,
|
|
"Number of functions with closures specialized");
|
|
|
|
namespace {
|
|
|
|
/// \brief A SILCloner subclass which clones a function that takes a closure
|
|
/// argument. We update the parameter list to remove the parameter for the
|
|
/// closure argument and to append the variables captured in the closure.
|
|
/// We also need to replace the closure parameter with the partial apply
|
|
/// on the closure. We need to update the callsite to pass in the correct
|
|
/// arguments.
|
|
class ClosureSpecCloner : public SILClonerWithScopes<ClosureSpecCloner> {
|
|
public:
|
|
using SuperTy = SILClonerWithScopes<ClosureSpecCloner>;
|
|
friend class SILVisitor<ClosureSpecCloner>;
|
|
friend class SILCloner<ClosureSpecCloner>;
|
|
|
|
ClosureSpecCloner(SILFunction *Orig, PartialApplyInst *PAI,
|
|
unsigned ClosureIndex, StringRef ClonedName)
|
|
: SuperTy(*initCloned(Orig, PAI, ClosureIndex, ClonedName)),
|
|
Orig(Orig), ClosureIndex(ClosureIndex), PAI(PAI) {
|
|
}
|
|
|
|
void populateCloned();
|
|
|
|
SILFunction *getCloned() { return &getBuilder().getFunction(); }
|
|
static SILFunction *cloneFunction(SILFunction *F, PartialApplyInst *PAI,
|
|
unsigned ClosureIndex, StringRef NewName) {
|
|
ClosureSpecCloner C(F, PAI, ClosureIndex, NewName);
|
|
C.populateCloned();
|
|
++NumClosureSpecialized;
|
|
return C.getCloned();
|
|
};
|
|
|
|
private:
|
|
static SILFunction *initCloned(SILFunction *Orig, PartialApplyInst *PAI,
|
|
unsigned ClosureIndex, StringRef ClonedName);
|
|
SILFunction *Orig;
|
|
unsigned ClosureIndex;
|
|
PartialApplyInst *PAI;
|
|
};
|
|
|
|
SILFunction *ClosureSpecCloner::initCloned(SILFunction *Orig,
|
|
PartialApplyInst *PAI,
|
|
unsigned ClosureIndex,
|
|
StringRef ClonedName) {
|
|
SmallVector<SILParameterInfo, 4> ClonedInterfaceArgTys;
|
|
|
|
SILFunctionType *OrigFTI = Orig->getLoweredFunctionType();
|
|
unsigned Index = 0;
|
|
// Remove the parameter for the closure argument.
|
|
for (auto ¶m : OrigFTI->getParameters()) {
|
|
if (Index != ClosureIndex)
|
|
ClonedInterfaceArgTys.push_back(param);
|
|
++Index;
|
|
}
|
|
|
|
// Append the variables captured in the closure.
|
|
auto *FRI = cast<FunctionRefInst>(PAI->getCallee());
|
|
SILFunction *ClosureWithCaptured = FRI->getReferencedFunction();
|
|
SILFunctionType *ClosureWithCapturedFTI =
|
|
ClosureWithCaptured->getLoweredFunctionType();
|
|
auto ClosureType = PAI->getType().castTo<SILFunctionType>();
|
|
// Add the parameters of ClosureWithCapturedFTI starting from
|
|
// ClosureType->getParameters().size().
|
|
for (auto I = ClosureWithCapturedFTI->getParameters().begin() +
|
|
ClosureType->getParameters().size(),
|
|
E = ClosureWithCapturedFTI->getParameters().end(); I != E; I++)
|
|
ClonedInterfaceArgTys.push_back(*I);
|
|
|
|
SILModule &M = Orig->getModule();
|
|
auto ClonedTy =
|
|
SILFunctionType::get(OrigFTI->getGenericSignature(),
|
|
OrigFTI->getExtInfo(),
|
|
OrigFTI->getCalleeConvention(),
|
|
ClonedInterfaceArgTys,
|
|
OrigFTI->getResult(),
|
|
M.getASTContext());
|
|
|
|
auto Fn = SILFunction::create(M, Orig->getLinkage(), ClonedName, ClonedTy,
|
|
Orig->getContextGenericParams(),
|
|
Orig->getLocation(), Orig->isBare(),
|
|
Orig->isTransparent(), Orig->getInlineStrategy(),
|
|
Orig->getEffectsInfo(),
|
|
Orig, Orig->getDebugScope());
|
|
Fn->setSemanticsAttr(Orig->getSemanticsAttr());
|
|
return Fn;
|
|
}
|
|
|
|
/// \brief Populate the body of the cloned closure, modifying instructions as
|
|
/// necessary.
|
|
void ClosureSpecCloner::populateCloned() {
|
|
SILFunction *Cloned = getCloned();
|
|
SILModule &M = Cloned->getModule();
|
|
|
|
// Create arguments for the entry block.
|
|
SILBasicBlock *OrigEntryBB = Orig->begin();
|
|
SILBasicBlock *ClonedEntryBB = new (M) SILBasicBlock(Cloned);
|
|
|
|
// Remove the closure argument.
|
|
SILArgument *ClosureArg = nullptr;
|
|
for (size_t i = 0, e = OrigEntryBB->bbarg_size(); i != e; ++i) {
|
|
SILArgument *Arg = OrigEntryBB->getBBArg(i);
|
|
if (i == ClosureIndex) {
|
|
ClosureArg = Arg;
|
|
continue;
|
|
}
|
|
|
|
// Otherwise, create a new argument which copies the original argument
|
|
SILValue MappedValue =
|
|
new (M) SILArgument(Arg->getType(), ClonedEntryBB, Arg->getDecl());
|
|
ValueMap.insert(std::make_pair(Arg, MappedValue));
|
|
}
|
|
|
|
auto *FRI = cast<FunctionRefInst>(PAI->getCallee());
|
|
SILFunction *ClosureWithCaptured = FRI->getReferencedFunction();
|
|
SILBasicBlock *ClosureEntryBB = ClosureWithCaptured->begin();
|
|
auto ClosureType = PAI->getType().castTo<SILFunctionType>();
|
|
// Add the parameters of ClosureWithCapturedFTI starting from
|
|
// ClosureType->getParameters().size().
|
|
SmallVector<SILValue, 16> NewPAIArgs;
|
|
for (auto I = ClosureEntryBB->bbarg_begin() +
|
|
ClosureType->getParameters().size(),
|
|
E = ClosureEntryBB->bbarg_end(); I != E; I++) {
|
|
SILValue MappedValue =
|
|
new (M) SILArgument((*I)->getType(), ClonedEntryBB, (*I)->getDecl());
|
|
NewPAIArgs.push_back(MappedValue);
|
|
ValueMap.insert(std::make_pair(*I, MappedValue));
|
|
}
|
|
|
|
getBuilder().setInsertionPoint(ClonedEntryBB);
|
|
// Clone FRI and PAI, and replace usage of the removed closure argument
|
|
// with result of cloned PAI.
|
|
SILValue FnVal = getBuilder().createFunctionRef(FRI->getLoc(),
|
|
ClosureWithCaptured);
|
|
auto *NewPAI = getBuilder().createPartialApply(PAI->getLoc(), FnVal,
|
|
FnVal.getType(), {},
|
|
NewPAIArgs, PAI->getType());
|
|
ValueMap.insert(std::make_pair(ClosureArg, SILValue(NewPAI, 0)));
|
|
|
|
BBMap.insert(std::make_pair(OrigEntryBB, ClonedEntryBB));
|
|
// Recursively visit original BBs in depth-first preorder, starting with the
|
|
// entry block, cloning all instructions other than terminators.
|
|
visitSILBasicBlock(OrigEntryBB);
|
|
|
|
// Now iterate over the BBs and fix up the terminators.
|
|
for (auto BI = BBMap.begin(), BE = BBMap.end(); BI != BE; ++BI) {
|
|
getBuilder().setInsertionPoint(BI->second);
|
|
visit(BI->first->getTerminator());
|
|
}
|
|
}
|
|
|
|
struct ArgSpecDescriptor {
|
|
PartialApplyInst *PAI;
|
|
ApplyInst *AI;
|
|
unsigned ClosureIndex;
|
|
ArgSpecDescriptor(PartialApplyInst *PAI, ApplyInst *AI,
|
|
unsigned ClosureIndex) :
|
|
PAI(PAI), AI(AI), ClosureIndex(ClosureIndex) {
|
|
}
|
|
};
|
|
|
|
/// Update the callsite to pass in the correct arguments.
|
|
static void rewriteApplyInst(ArgSpecDescriptor &AD, SILFunction *NewF) {
|
|
SILBuilder Builder(AD.AI);
|
|
FunctionRefInst *FRI = Builder.createFunctionRef(AD.AI->getLoc(), NewF);
|
|
|
|
// Create the args for the new apply by removing the closure argument and
|
|
// appending the captured argument.
|
|
llvm::SmallVector<SILValue, 8> NewArgs;
|
|
unsigned Index = 0;
|
|
for (auto Arg : AD.AI->getArguments()) {
|
|
if (Index != AD.ClosureIndex)
|
|
NewArgs.push_back(Arg);
|
|
Index++;
|
|
}
|
|
for (auto Arg : AD.PAI->getArguments())
|
|
NewArgs.push_back(Arg);
|
|
|
|
SILType LoweredType = NewF->getLoweredType();
|
|
SILType ResultType = LoweredType.getFunctionInterfaceResultType();
|
|
ApplyInst *NewAI = Builder.createApply(AD.AI->getLoc(), FRI, LoweredType,
|
|
ResultType, ArrayRef<Substitution>(),
|
|
NewArgs, NewF->isTransparent());
|
|
|
|
// Replace all uses of the old apply with the new apply.
|
|
AD.AI->replaceAllUsesWith(NewAI);
|
|
// Erase the old apply.
|
|
AD.AI->eraseFromParent();
|
|
|
|
if (AD.PAI->use_empty())
|
|
AD.PAI->eraseFromParent();
|
|
}
|
|
|
|
struct ClosureSpecializer {
|
|
SILLoopAnalysis *LA;
|
|
|
|
ClosureSpecializer(SILLoopAnalysis *LA)
|
|
: LA(LA) {
|
|
}
|
|
|
|
bool isProfitable(ArgSpecDescriptor &AD);
|
|
bool specialize(SILFunction *Caller);
|
|
};
|
|
|
|
static unsigned getInstCount(SILFunction *F) {
|
|
unsigned Cost = 0;
|
|
for (auto &BB : *F)
|
|
Cost += BB.getInstList().size();
|
|
return Cost;
|
|
}
|
|
|
|
bool ClosureSpecializer::isProfitable(ArgSpecDescriptor &AD) {
|
|
// Check the relative size of the callee and the closure.
|
|
auto *ClosureFRI = cast<FunctionRefInst>(AD.PAI->getCallee());
|
|
// We only handle the case where callee is FunctionRefInst.
|
|
if (!isa<FunctionRefInst>(AD.AI->getCallee()))
|
|
return false;
|
|
auto *CalleeFRI = cast<FunctionRefInst>(AD.AI->getCallee());
|
|
auto *Callee = CalleeFRI->getReferencedFunction();
|
|
|
|
unsigned ClosureCount = getInstCount(ClosureFRI->getReferencedFunction());
|
|
unsigned CalleeCount = getInstCount(Callee);
|
|
if (CalleeCount < 2 * ClosureCount) {
|
|
DEBUG(llvm::dbgs() << " Callsite is not profitable: " << ClosureCount
|
|
<< ", " << CalleeCount << "\n");
|
|
return false;
|
|
}
|
|
DEBUG(llvm::dbgs() << " Callsite is profitable: " << ClosureCount
|
|
<< ", " << CalleeCount << "\n");
|
|
|
|
// Collect callsites to the closure.
|
|
SmallVector<ApplyInst*, 8> CallSites;
|
|
SILArgument *ClosureArg = Callee->begin()->getBBArg(AD.ClosureIndex);
|
|
for (auto U : ClosureArg->getUses())
|
|
if (auto CS = dyn_cast<ApplyInst>(U->getUser()))
|
|
CallSites.push_back(CS);
|
|
|
|
if (CallSites.empty())
|
|
return false;
|
|
|
|
// Check hotness of the callsite (AI) and callsites to closure inside callee.
|
|
// For now, if closure is called inside a loop, we think it is profitable.
|
|
SILLoopInfo *LI = LA->getLoopInfo(Callee);
|
|
for (auto AI : CallSites) {
|
|
if (LI->getLoopFor(AI->getParent()))
|
|
return true;
|
|
}
|
|
|
|
DEBUG(llvm::dbgs() << " Callsite is not profitable: closure not called "
|
|
"inside a loop\n");
|
|
return false;
|
|
}
|
|
|
|
static void createName(SILFunction *Callee, SILFunction *Closure,
|
|
unsigned ClosureIndex,
|
|
llvm::SmallString<64> &Name) {
|
|
llvm::raw_svector_ostream buffer(Name);
|
|
buffer << "_TTS";
|
|
buffer << Closure->getName() << "_as" << ClosureIndex
|
|
<< '_' << Callee->getName();
|
|
}
|
|
|
|
bool ClosureSpecializer::specialize(SILFunction *Caller) {
|
|
DEBUG(llvm::dbgs() << "Optimizing callsites that take closure argument in "
|
|
<< Caller->getName() << '\n');
|
|
|
|
// Collect all of the PartialApplyInsts that are used as arguments to
|
|
// ApplyInsts. Check the profitability of specializing the closure argument.
|
|
llvm::SmallVector<ArgSpecDescriptor, 8> CallSites;
|
|
for (auto &BB : *Caller) {
|
|
auto I = BB.begin(), E = BB.end();
|
|
while (I != E) {
|
|
PartialApplyInst *PAI = dyn_cast<PartialApplyInst>(I++);
|
|
if (!PAI || I == E)
|
|
continue;
|
|
auto *FRI = dyn_cast<FunctionRefInst>(PAI->getCallee());
|
|
if (!FRI)
|
|
continue;
|
|
|
|
// Make sure the next instruction is ApplyInst and PAI feeds into one
|
|
// operand.
|
|
auto *AI = dyn_cast<ApplyInst>(I);
|
|
if (!AI)
|
|
continue;
|
|
unsigned Idx = 0;
|
|
for (auto Arg : AI->getArguments()) {
|
|
if (Arg == SILValue(PAI, 0)) {
|
|
CallSites.push_back(ArgSpecDescriptor(PAI, AI, Idx));
|
|
DEBUG(llvm::dbgs() << " Found callsite with closure argument at "
|
|
<< Idx << ": " << *AI);
|
|
break;
|
|
}
|
|
Idx++;
|
|
}
|
|
}
|
|
}
|
|
|
|
bool Changed = false;
|
|
for (auto &AD : CallSites) {
|
|
if (AD.AI->hasSubstitutions() || AD.PAI->hasSubstitutions()) {
|
|
DEBUG(llvm::dbgs() << " Callsite has substitutions\n");
|
|
continue;
|
|
}
|
|
if (!isProfitable(AD))
|
|
continue;
|
|
|
|
auto *ClosureFRI = cast<FunctionRefInst>(AD.PAI->getCallee());
|
|
auto *CalleeFRI = cast<FunctionRefInst>(AD.AI->getCallee());
|
|
auto *Callee = CalleeFRI->getReferencedFunction();
|
|
|
|
llvm::SmallString<64> NewFName;
|
|
createName(Callee, ClosureFRI->getReferencedFunction(), AD.ClosureIndex,
|
|
NewFName);
|
|
DEBUG(llvm::dbgs() << " Perform optimizations with new name "
|
|
<< NewFName << '\n');
|
|
|
|
SILFunction *NewF = Callee->getModule().lookUpFunction(NewFName);
|
|
if (!NewF)
|
|
NewF = ClosureSpecCloner::cloneFunction(Callee, AD.PAI, AD.ClosureIndex,
|
|
NewFName);
|
|
|
|
rewriteApplyInst(AD, NewF);
|
|
Changed = true;
|
|
}
|
|
|
|
return Changed;
|
|
}
|
|
|
|
} // end anonymous namespace.
|
|
|
|
namespace {
|
|
class SILClosureSpecializerTransform : public SILModuleTransform {
|
|
public:
|
|
SILClosureSpecializerTransform() {}
|
|
|
|
virtual void run() {
|
|
CallGraphAnalysis* CGA = PM->getAnalysis<CallGraphAnalysis>();
|
|
SILLoopAnalysis *LA = PM->getAnalysis<SILLoopAnalysis>();
|
|
|
|
bool Changed = false;
|
|
// Specialize going bottom-up in the call graph.
|
|
for (auto *F : CGA->getCallGraph().getBottomUpFunctionOrder()) {
|
|
// If F is empty, attempt to link it. Skip it if we fail to do so.
|
|
if (F->empty() &&
|
|
!getModule()->linkFunction(F, SILModule::LinkingMode::LinkAll))
|
|
continue;
|
|
|
|
Changed |= ClosureSpecializer(LA).specialize(F);
|
|
}
|
|
|
|
// Invalidate the call graph.
|
|
if (Changed)
|
|
invalidateAnalysis(SILAnalysis::InvalidationKind::CallGraph);
|
|
}
|
|
|
|
StringRef getName() override { return "Closure Specialization"; }
|
|
};
|
|
} // end anonymous namespace
|
|
|
|
|
|
SILTransform *swift::createClosureSpecializer() {
|
|
return new SILClosureSpecializerTransform();
|
|
}
|