Skip to content

Commit

Permalink
[MBP] Add flags to disable the BadCFGConflict check in MachineBlockPl…
Browse files Browse the repository at this point in the history
…acement.

Some benchmarks have shown that this could lead to a potential
performance benefit, and so adding some flags to try to help measure the
difference.

A possible explanation. In diamond-shaped CFGs (A followed by either
B or C both followed by D), putting B and C both in between A and
D leads to the code being less dense than it could be. Always either
B or C have to be skipped increasing the chance of cache misses etc.
Moving either B or C to after D might be beneficial on average.

In the long run, but we should probably do a better job of analyzing the
basic block and branch probabilities to move the correct one of B or
C to after D. But even if we don't use this in the long run, it is
a good baseline for benchmarking.

Original patch authored by Daniel Jasper with test tweaks and a second
flag added by me.

Differential Revision: http://reviews.llvm.org/D6969

git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@226034 91177308-0d34-0410-b5e6-96231b3b80d8
  • Loading branch information
chandlerc committed Jan 14, 2015
1 parent 11abe69 commit 8af8091
Show file tree
Hide file tree
Showing 2 changed files with 147 additions and 20 deletions.
55 changes: 35 additions & 20 deletions lib/CodeGen/MachineBlockPlacement.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -60,6 +60,17 @@ static cl::opt<unsigned> AlignAllBlock("align-all-blocks",
"blocks in the function."),
cl::init(0), cl::Hidden);

static cl::opt<bool> OnlyHotBadCFGConflictCheck(
"only-hot-bad-cfg-conflict-check",
cl::desc("Only check that a hot successor doesn't have a hot predecessor."),
cl::init(false), cl::Hidden);

static cl::opt<bool> NoBadCFGConflictCheck(
"no-bad-cfg-conflict-check",
cl::desc("Don't check whether a hot successor has a more important "
"predecessor."),
cl::init(false), cl::Hidden);

// FIXME: Find a good default for this flag and remove the flag.
static cl::opt<unsigned>
ExitBlockBias("block-placement-exit-block-bias",
Expand Down Expand Up @@ -374,29 +385,33 @@ MachineBasicBlock *MachineBlockPlacement::selectBestSuccessor(
continue;
}

// Make sure that a hot successor doesn't have a globally more important
// predecessor.
BlockFrequency CandidateEdgeFreq
= MBFI->getBlockFreq(BB) * SuccProb * HotProb.getCompl();
bool BadCFGConflict = false;
for (MachineBasicBlock::pred_iterator PI = (*SI)->pred_begin(),
PE = (*SI)->pred_end();
PI != PE; ++PI) {
if (*PI == *SI || (BlockFilter && !BlockFilter->count(*PI)) ||
BlockToChain[*PI] == &Chain)
if (!NoBadCFGConflictCheck) {
// Make sure that a hot successor doesn't have a globally more
// important predecessor.
BlockFrequency CandidateEdgeFreq =
OnlyHotBadCFGConflictCheck
? MBFI->getBlockFreq(BB) * SuccProb
: MBFI->getBlockFreq(BB) * SuccProb * HotProb.getCompl();
bool BadCFGConflict = false;
for (MachineBasicBlock::pred_iterator PI = (*SI)->pred_begin(),
PE = (*SI)->pred_end();
PI != PE; ++PI) {
if (*PI == *SI || (BlockFilter && !BlockFilter->count(*PI)) ||
BlockToChain[*PI] == &Chain)
continue;
BlockFrequency PredEdgeFreq =
MBFI->getBlockFreq(*PI) * MBPI->getEdgeProbability(*PI, *SI);
if (PredEdgeFreq >= CandidateEdgeFreq) {
BadCFGConflict = true;
break;
}
}
if (BadCFGConflict) {
DEBUG(dbgs() << " " << getBlockName(*SI) << " -> " << SuccProb
<< " (prob) (non-cold CFG conflict)\n");
continue;
BlockFrequency PredEdgeFreq
= MBFI->getBlockFreq(*PI) * MBPI->getEdgeProbability(*PI, *SI);
if (PredEdgeFreq >= CandidateEdgeFreq) {
BadCFGConflict = true;
break;
}
}
if (BadCFGConflict) {
DEBUG(dbgs() << " " << getBlockName(*SI) << " -> " << SuccProb
<< " (prob) (non-cold CFG conflict)\n");
continue;
}
}

DEBUG(dbgs() << " " << getBlockName(*SI) << " -> " << SuccProb
Expand Down
112 changes: 112 additions & 0 deletions test/CodeGen/X86/code_placement_bad_cfg_check.ll
Original file line number Diff line number Diff line change
@@ -0,0 +1,112 @@
; RUN: llc -mcpu=corei7 -mtriple=x86_64-linux < %s | FileCheck %s -check-prefix=CHECK-BAD-CFG
; RUN: llc -mcpu=corei7 -mtriple=x86_64-linux -no-bad-cfg-conflict-check < %s | FileCheck %s -check-prefix=CHECK-NO-BAD-CFG
; RUN: llc -mcpu=corei7 -mtriple=x86_64-linux -only-hot-bad-cfg-conflict-check < %s | FileCheck %s -check-prefix=CHECK-HOT-BAD-CFG

define void @foo(i32 %t) {
; Test that we lift the call to 'c' up to immediately follow the call to 'b'
; when we disable the cfg conflict check.
;
; CHECK-BAD-CFG-LABEL: foo:
; CHECK-BAD-CFG: callq b
; CHECK-BAD-CFG: callq a
; CHECK-BAD-CFG: callq c
;
; CHECK-NO-BAD-CFG-LABEL: foo:
; CHECK-NO-BAD-CFG: callq b
; CHECK-NO-BAD-CFG: callq c
; CHECK-NO-BAD-CFG: callq a
;
; CHECK-HOT-BAD-CFG-LABEL: foo:
; CHECK-HOT-BAD-CFG: callq b
; CHECK-HOT-BAD-CFG: callq c
; CHECK-HOT-BAD-CFG: callq a

entry:
%cmp = icmp eq i32 %t, 0
br i1 %cmp, label %if.then, label %if.else

if.then:
call void @a()
br label %if.end

if.else:
call void @b()
br label %if.end

if.end:
call void @c()
ret void
}

define void @bar(i32 %t1, i32 %t2, i32 %t3) {
; Test that we lift the call to 'c' up to immediately follow the call to 'b'
; when we disable the cfg conflict check.
;
; CHECK-BAD-CFG-LABEL: bar:
; CHECK-BAD-CFG: callq a
; CHECK-BAD-CFG: callq c
; CHECK-BAD-CFG: callq d
; CHECK-BAD-CFG: callq f
; CHECK-BAD-CFG: callq b
; CHECK-BAD-CFG: callq e
; CHECK-BAD-CFG: callq g
;
; CHECK-NO-BAD-CFG-LABEL: bar:
; CHECK-NO-BAD-CFG: callq a
; CHECK-NO-BAD-CFG: callq c
; CHECK-NO-BAD-CFG: callq g
; CHECK-NO-BAD-CFG: callq d
; CHECK-NO-BAD-CFG: callq f
; CHECK-NO-BAD-CFG: callq b
; CHECK-NO-BAD-CFG: callq e
;
; CHECK-HOT-BAD-CFG-LABEL: bar:
; CHECK-HOT-BAD-CFG: callq a
; CHECK-HOT-BAD-CFG: callq c
; CHECK-HOT-BAD-CFG: callq d
; CHECK-HOT-BAD-CFG: callq f
; CHECK-HOT-BAD-CFG: callq g
; CHECK-HOT-BAD-CFG: callq b
; CHECK-HOT-BAD-CFG: callq e

entry:
br i1 undef, label %if1.then, label %if1.else

if1.then:
call void @a()
%cmp2 = icmp eq i32 %t2, 0
br i1 %cmp2, label %if2.then, label %if2.else

if2.then:
call void @b()
br label %if.end

if2.else:
call void @c()
br label %if.end

if1.else:
call void @d()
%cmp3 = icmp eq i32 %t3, 0
br i1 %cmp3, label %if3.then, label %if3.else

if3.then:
call void @e()
br label %if.end

if3.else:
call void @f()
br label %if.end

if.end:
call void @g()
ret void
}

declare void @a()
declare void @b()
declare void @c()
declare void @d()
declare void @e()
declare void @f()
declare void @g()

0 comments on commit 8af8091

Please sign in to comment.