diff options
author | Juergen Ributzka <juergen@apple.com> | 2014-06-25 20:06:12 +0000 |
---|---|---|
committer | Juergen Ributzka <juergen@apple.com> | 2014-06-25 20:06:12 +0000 |
commit | d01f1c4054c73a184d08ed6f5817ad8de4513f3c (patch) | |
tree | bca7556bf8e448d04b81d11acf64ca5f28b0e288 | |
parent | 91c39aa6285247aefbf627f4210f7931076bae49 (diff) | |
download | llvm-d01f1c4054c73a184d08ed6f5817ad8de4513f3c.tar.gz llvm-d01f1c4054c73a184d08ed6f5817ad8de4513f3c.tar.bz2 llvm-d01f1c4054c73a184d08ed6f5817ad8de4513f3c.tar.xz |
[FastISel][X86] Only fold the cmp into the select when both instructions are in the same basic block.
If the cmp is in a different basic block than the select, then it is possible
that not all operands of that compare have defined registers. This can happen
when one of the operands to the cmp is a load and the load gets folded into the
cmp. In this case FastISel skips the load instruction, so the vreg that would
have held the load's result is never defined.
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@211730 91177308-0d34-0410-b5e6-96231b3b80d8
-rw-r--r-- | lib/Target/X86/X86FastISel.cpp | 20 | ||||
-rw-r--r-- | test/CodeGen/X86/fast-isel-select-cmp.ll | 50 |
2 files changed, 65 insertions, 5 deletions
diff --git a/lib/Target/X86/X86FastISel.cpp b/lib/Target/X86/X86FastISel.cpp index 6ada3977f0..92b3d62f0c 100644 --- a/lib/Target/X86/X86FastISel.cpp +++ b/lib/Target/X86/X86FastISel.cpp @@ -1754,8 +1754,11 @@ bool X86FastISel::X86FastEmitCMoveSelect(const Instruction *I) { const TargetRegisterClass *RC = TLI.getRegClassFor(RetVT); bool NeedTest = true; - // Optimize conditons coming from a compare. - if (const auto *CI = dyn_cast<CmpInst>(Cond)) { + // Optimize conditons coming from a compare if both instructions are in the + // same basic block (values defined in other basic blocks may not have + // initialized registers). + const auto *CI = dyn_cast<CmpInst>(Cond); + if (CI && (CI->getParent() == I->getParent())) { CmpInst::Predicate Predicate = optimizeCmpPredicate(CI); // FCMP_OEQ and FCMP_UNE cannot be checked with a single instruction. @@ -1927,8 +1930,11 @@ bool X86FastISel::X86FastEmitSSESelect(const Instruction *I) { if (!isTypeLegal(I->getType(), RetVT)) return false; + // Optimize conditons coming from a compare if both instructions are in the + // same basic block (values defined in other basic blocks may not have + // initialized registers). const auto *CI = dyn_cast<FCmpInst>(I->getOperand(0)); - if (!CI) + if (!CI || (CI->getParent() != I->getParent())) return false; if (I->getType() != CI->getOperand(0)->getType() || @@ -2023,8 +2029,12 @@ bool X86FastISel::X86FastEmitPseudoSelect(const Instruction *I) { const Value *Cond = I->getOperand(0); X86::CondCode CC = X86::COND_NE; - // Don't emit a test if the condition comes from a compare. - if (const auto *CI = dyn_cast<CmpInst>(Cond)) { + + // Optimize conditons coming from a compare if both instructions are in the + // same basic block (values defined in other basic blocks may not have + // initialized registers). 
+ const auto *CI = dyn_cast<CmpInst>(Cond); + if (CI && (CI->getParent() == I->getParent())) { bool NeedSwap; std::tie(CC, NeedSwap) = getX86ConditonCode(CI->getPredicate()); if (CC > X86::LAST_VALID_COND) diff --git a/test/CodeGen/X86/fast-isel-select-cmp.ll b/test/CodeGen/X86/fast-isel-select-cmp.ll new file mode 100644 index 0000000000..1af30e9f32 --- /dev/null +++ b/test/CodeGen/X86/fast-isel-select-cmp.ll @@ -0,0 +1,50 @@ +; RUN: llc < %s -O0 -mtriple=x86_64-apple-darwin10 | FileCheck %s + +; Test if we do not fold the cmp into select if the instructions are in +; different basic blocks. + +define i32 @select_cmp_cmov_i32(i32 %a, i32 %b) { +; CHECK-LABEL: select_cmp_cmov_i32 +; CHECK-LABEL: continue +; CHECK-NOT: cmp + %1 = icmp ult i32 %a, %b + br i1 %1, label %continue, label %exit + +continue: + %2 = select i1 %1, i32 %a, i32 %b + ret i32 %2 + +exit: + ret i32 -1 +} + +define float @select_fcmp_oeq_f32(float %a, float %b, float %c, float %d) { +; CHECK-LABEL: select_fcmp_oeq_f32 +; CHECK-LABEL: continue +; CHECK-NOT: cmp + %1 = fcmp oeq float %a, %b + br i1 %1, label %continue, label %exit + +continue: + %2 = select i1 %1, float %c, float %d + ret float %2 + +exit: + ret float -1.0 +} + +define float @select_fcmp_one_f32(float %a, float %b, float %c, float %d) { +; CHECK-LABEL: select_fcmp_one_f32 +; CHECK-LABEL: continue +; CHECK-NOT: ucomi + %1 = fcmp one float %a, %b + br i1 %1, label %continue, label %exit + +continue: + %2 = select i1 %1, float %c, float %d + ret float %2 + +exit: + ret float -1.0 +} + |