aboutsummaryrefslogtreecommitdiff
diff options
context:
space:
mode:
authorEvan Cheng <evan.cheng@apple.com>2008-08-29 23:22:12 +0000
committerEvan Cheng <evan.cheng@apple.com>2008-08-29 23:22:12 +0000
commit456704476f953e4bee7ba4a95f9bf6dbb724e370 (patch)
tree522a441f7ad10bfb0b0fbce307cb726f87b70080
parent97af60b3ae4085d25ea4812c9e7219dba8293c9b (diff)
Swap fp comparison operands and change predicate to allow load folding (safely this time).
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@55553 91177308-0d34-0410-b5e6-96231b3b80d8
-rw-r--r--lib/Target/X86/X86ISelLowering.cpp66
-rw-r--r--test/CodeGen/X86/cmp2.ll2
2 files changed, 51 insertions, 17 deletions
diff --git a/lib/Target/X86/X86ISelLowering.cpp b/lib/Target/X86/X86ISelLowering.cpp
index 8f7b668ca0..791adb11d4 100644
--- a/lib/Target/X86/X86ISelLowering.cpp
+++ b/lib/Target/X86/X86ISelLowering.cpp
@@ -1909,7 +1909,6 @@ SDValue X86TargetLowering::getReturnAddressFrameIndex(SelectionDAG &DAG) {
}
-
/// translateX86CC - do a one to one translation of a ISD::CondCode to the X86
/// specific condition code. It returns a false if it cannot do a direct
/// translation. X86CC is the translated CondCode. LHS/RHS are modified as
@@ -1951,36 +1950,71 @@ static bool translateX86CC(ISD::CondCode SetCCOpcode, bool isFP,
case ISD::SETUGE: X86CC = X86::COND_AE; break;
}
} else {
+ // First determine if it requires or is profitable to flip the operands.
+ bool Flip = false;
+ switch (SetCCOpcode) {
+ default: break;
+ case ISD::SETOLT:
+ case ISD::SETOLE:
+ case ISD::SETUGT:
+ case ISD::SETUGE:
+ Flip = true;
+ break;
+ }
+
+ // If LHS is a foldable load, but RHS is not, flip the condition.
+ if (!Flip &&
+ (ISD::isNON_EXTLoad(LHS.getNode()) && LHS.hasOneUse()) &&
+ !(ISD::isNON_EXTLoad(RHS.getNode()) && RHS.hasOneUse())) {
+ SetCCOpcode = getSetCCSwappedOperands(SetCCOpcode);
+ Flip = true;
+ }
+ if (Flip)
+ std::swap(LHS, RHS);
+
// On a floating point condition, the flags are set as follows:
// ZF PF CF op
// 0 | 0 | 0 | X > Y
// 0 | 0 | 1 | X < Y
// 1 | 0 | 0 | X == Y
// 1 | 1 | 1 | unordered
- bool Flip = false;
switch (SetCCOpcode) {
default: break;
case ISD::SETUEQ:
- case ISD::SETEQ: X86CC = X86::COND_E; break;
- case ISD::SETOLT: Flip = true; // Fallthrough
+ case ISD::SETEQ:
+ X86CC = X86::COND_E;
+ break;
+ case ISD::SETOLT: // flipped
case ISD::SETOGT:
- case ISD::SETGT: X86CC = X86::COND_A; break;
- case ISD::SETOLE: Flip = true; // Fallthrough
+ case ISD::SETGT:
+ X86CC = X86::COND_A;
+ break;
+ case ISD::SETOLE: // flipped
case ISD::SETOGE:
- case ISD::SETGE: X86CC = X86::COND_AE; break;
- case ISD::SETUGT: Flip = true; // Fallthrough
+ case ISD::SETGE:
+ X86CC = X86::COND_AE;
+ break;
+ case ISD::SETUGT: // flipped
case ISD::SETULT:
- case ISD::SETLT: X86CC = X86::COND_B; break;
- case ISD::SETUGE: Flip = true; // Fallthrough
+ case ISD::SETLT:
+ X86CC = X86::COND_B;
+ break;
+ case ISD::SETUGE: // flipped
case ISD::SETULE:
- case ISD::SETLE: X86CC = X86::COND_BE; break;
+ case ISD::SETLE:
+ X86CC = X86::COND_BE;
+ break;
case ISD::SETONE:
- case ISD::SETNE: X86CC = X86::COND_NE; break;
- case ISD::SETUO: X86CC = X86::COND_P; break;
- case ISD::SETO: X86CC = X86::COND_NP; break;
+ case ISD::SETNE:
+ X86CC = X86::COND_NE;
+ break;
+ case ISD::SETUO:
+ X86CC = X86::COND_P;
+ break;
+ case ISD::SETO:
+ X86CC = X86::COND_NP;
+ break;
}
- if (Flip)
- std::swap(LHS, RHS);
}
return X86CC != X86::COND_INVALID;
diff --git a/test/CodeGen/X86/cmp2.ll b/test/CodeGen/X86/cmp2.ll
index cc4027eb1b..2c046ffc08 100644
--- a/test/CodeGen/X86/cmp2.ll
+++ b/test/CodeGen/X86/cmp2.ll
@@ -3,7 +3,7 @@
define i32 @test(double %A) nounwind {
entry:
%tmp2 = fcmp ogt double %A, 1.500000e+02; <i1> [#uses=1]
- %tmp5 = fcmp olt double %A, 7.500000e+01; <i1> [#uses=1]
+ %tmp5 = fcmp ult double %A, 7.500000e+01; <i1> [#uses=1]
%bothcond = or i1 %tmp2, %tmp5; <i1> [#uses=1]
br i1 %bothcond, label %bb8, label %bb12