aboutsummaryrefslogtreecommitdiff
diff options
context:
space:
mode:
author Elena Demikhovsky <elena.demikhovsky@intel.com> 2013-01-03 08:48:33 +0000
committer Elena Demikhovsky <elena.demikhovsky@intel.com> 2013-01-03 08:48:33 +0000
commit ab7032090871abf6aeed86b2c4b836e97771d234 (patch)
tree d6012d82ead4b8e96e4d98d662a8857ba4e0fd2b
parent e33a8b8c2f003b703b0af32effd8ef25477c2165 (diff)
Simplify a TRUNCATE operation that follows a SETCC. This is possible because each SETCC result element is either 0 or -1.
Added a test. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@171467 91177308-0d34-0410-b5e6-96231b3b80d8
-rw-r--r-- lib/Target/X86/X86ISelLowering.cpp 23
-rwxr-xr-x test/CodeGen/X86/avx-trunc.ll 15
2 files changed, 35 insertions, 3 deletions
diff --git a/lib/Target/X86/X86ISelLowering.cpp b/lib/Target/X86/X86ISelLowering.cpp
index eca63f80ae..9a553d61bf 100644
--- a/lib/Target/X86/X86ISelLowering.cpp
+++ b/lib/Target/X86/X86ISelLowering.cpp
@@ -14661,12 +14661,29 @@ static SDValue PerformShuffleCombine(SDNode *N, SelectionDAG &DAG,
return EltsFromConsecutiveLoads(VT, Elts, dl, DAG);
}
-/// PerformTruncateCombine - Converts truncate operation to
-/// a sequence of vector shuffle operations.
-/// It is possible when we truncate 256-bit vector to 128-bit vector
+/// PerformTruncateCombine - Simplify a vector "truncate" whose operand is a
+/// SETCC node. Returns an empty SDValue when nothing was simplified.
static SDValue PerformTruncateCombine(SDNode *N, SelectionDAG &DAG,
TargetLowering::DAGCombinerInfo &DCI,
const X86Subtarget *Subtarget) {
+ EVT VT = N->getValueType(0);
+ if (DCI.isBeforeLegalize() || !VT.isVector())
+ return SDValue();
+
+ SDValue In = N->getOperand(0);
+ // Fold truncate(setcc): only an ISD::SETCC operand is handled here.
+ if (In.getOpcode() == ISD::SETCC) {
+ DebugLoc DL = N->getDebugLoc();
+ EVT InVT = In.getValueType();
+ // Each SETCC element is taken to be all ones or all zeros, so the low half
+ // of In is bitcast to VT. NOTE(review): confirm lanes match a truncate.
+ EVT HalfVT = EVT::getVectorVT(*DAG.getContext(), InVT.getScalarType(),
+ InVT.getVectorNumElements()/2);
+ SDValue HalfVec = DAG.getNode(ISD::EXTRACT_SUBVECTOR, DL, HalfVT, In,
+ DAG.getIntPtrConstant(0));
+ assert(HalfVT.getSizeInBits() == VT.getSizeInBits());
+ return DAG.getNode(ISD::BITCAST, DL, VT, HalfVec);
+ }
return SDValue();
}
diff --git a/test/CodeGen/X86/avx-trunc.ll b/test/CodeGen/X86/avx-trunc.ll
index d007736644..aa186a05f2 100755
--- a/test/CodeGen/X86/avx-trunc.ll
+++ b/test/CodeGen/X86/avx-trunc.ll
@@ -13,3 +13,18 @@ define <8 x i16> @trunc_32_16(<8 x i32> %A) nounwind uwtable readnone ssp{
ret <8 x i16>%B
}
+define <8 x i16> @trunc_after_setcc(<8 x float> %a, <8 x float> %b, <8 x float> %c, <8 x float> %d) {
+; CHECK: trunc_after_setcc
+; CHECK: vcmpltps
+; CHECK-NOT: vextract
+; CHECK: vcmpltps
+; CHECK-NEXT: vandps
+; CHECK-NEXT: vandps
+; CHECK: ret
+ %res1 = fcmp olt <8 x float> %a, %b
+ %res2 = fcmp olt <8 x float> %c, %d
+ %andr = and <8 x i1>%res1, %res2
+ %ex = zext <8 x i1> %andr to <8 x i16>
+ ret <8 x i16>%ex
+}
+