summaryrefslogtreecommitdiff
path: root/lib/Transforms
diff options
context:
space:
mode:
authorChris Lattner <sabre@nondot.org>2003-10-06 15:52:43 +0000
committerChris Lattner <sabre@nondot.org>2003-10-06 15:52:43 +0000
commit884d6c4e10501116a8ff45616231564a2738dadd (patch)
tree54bd9970078b53c3f11032527fd6ece56a377135 /lib/Transforms
parent2c9b913fc0fe0c6b2e41e84fc80f905a743ca054 (diff)
downloadllvm-884d6c4e10501116a8ff45616231564a2738dadd.tar.gz
llvm-884d6c4e10501116a8ff45616231564a2738dadd.tar.bz2
llvm-884d6c4e10501116a8ff45616231564a2738dadd.tar.xz
Speed up the predicate used to decide when to inline by caching the size
of callees between executions. On eon, in release mode, this changes the inliner from taking 11.5712s to taking 2.2066s. In debug mode, it went from taking 14.4148s to taking 7.0745s. In release mode, this is a 24.7% speedup of gccas, in debug mode, it's a total speedup of 11.7%. This also makes it slightly more aggressive. This could be because we are not judging the size of the functions quite as accurately as before. When we start looking at the performance of the generated code, this can be investigated further. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@8893 91177308-0d34-0410-b5e6-96231b3b80d8
Diffstat (limited to 'lib/Transforms')
-rw-r--r--lib/Transforms/IPO/InlineSimple.cpp41
1 files changed, 28 insertions, 13 deletions
diff --git a/lib/Transforms/IPO/InlineSimple.cpp b/lib/Transforms/IPO/InlineSimple.cpp
index e62a8b1344..966ac2eab5 100644
--- a/lib/Transforms/IPO/InlineSimple.cpp
+++ b/lib/Transforms/IPO/InlineSimple.cpp
@@ -11,7 +11,17 @@
#include "llvm/Transforms/IPO.h"
namespace {
- struct SimpleInliner : public Inliner {
+ // FunctionInfo - For each function, calculate the size of it in blocks and
+ // instructions.
+ struct FunctionInfo {
+ unsigned NumInsts, NumBlocks;
+
+ FunctionInfo() : NumInsts(0), NumBlocks(0) {}
+ };
+
+ class SimpleInliner : public Inliner {
+ std::map<const Function*, FunctionInfo> CachedFunctionInfo;
+ public:
int getInlineCost(CallSite CS);
};
RegisterOpt<SimpleInliner> X("inline", "Function Integration/Inlining");
@@ -19,7 +29,6 @@ namespace {
Pass *createFunctionInliningPass() { return new SimpleInliner(); }
-
// getInlineCost - The heuristic used to determine if we should inline the
// function call or not.
//
@@ -71,19 +80,25 @@ int SimpleInliner::getInlineCost(CallSite CS) {
// Now that we have considered all of the factors that make the call site more
// likely to be inlined, look at factors that make us not want to inline it.
- // As soon as the inline quality gets negative, bail out.
+ FunctionInfo &CalleeFI = CachedFunctionInfo[Callee];
- // Look at the size of the callee. Each basic block counts as 20 units, and
- // each instruction counts as 10.
- for (Function::const_iterator BB = Callee->begin(), E = Callee->end();
- BB != E; ++BB)
- InlineCost += BB->size()*10 + 20;
+ // If we haven't calculated this information yet...
+ if (CalleeFI.NumBlocks == 0) {
+ unsigned NumInsts = 0, NumBlocks = 0;
- // Don't inline into something too big, which would make it bigger. Here, we
- // count each basic block as a single unit.
- for (Function::const_iterator BB = Caller->begin(), E = Caller->end();
- BB != E; ++BB)
- InlineCost++;
+ // Look at the size of the callee. Each basic block counts as 20 units, and
+ // each instruction counts as 10.
+ for (Function::const_iterator BB = Callee->begin(), E = Callee->end();
+ BB != E; ++BB) {
+ NumInsts += BB->size();
+ NumBlocks++;
+ }
+ CalleeFI.NumBlocks = NumBlocks;
+ CalleeFI.NumInsts = NumInsts;
+ }
+ // Look at the size of the callee. Each basic block counts as 21 units, and
+ // each instruction counts as 10.
+ InlineCost += CalleeFI.NumInsts*10 + CalleeFI.NumBlocks*20;
return InlineCost;
}