Fix PR18014

- When simplifying the mask generation for BLEND, check whether that mask is
  also consumed by other non-BLEND insns. If true, skip that simplification.

llvm-svn: 195476
This commit is contained in:
Michael Liao 2013-11-22 17:56:57 +00:00
parent f03789ca3f
commit 02160d580b
2 changed files with 25 additions and 0 deletions

View File

@ -17024,6 +17024,15 @@ static SDValue PerformSELECTCombine(SDNode *N, SelectionDAG &DAG,
if (BitWidth == 1)
return SDValue();
// Check all uses of that condition operand to check whether it will be
// consumed by non-BLEND instructions, which may depend on all bits are set
// properly.
for (SDNode::use_iterator I = Cond->use_begin(),
E = Cond->use_end(); I != E; ++I)
if (I->getOpcode() != ISD::VSELECT)
// TODO: Add other opcodes eventually lowered into BLEND.
return SDValue();
assert(BitWidth >= 8 && BitWidth <= 64 && "Invalid mask size");
APInt DemandedMask = APInt::getHighBitsSet(BitWidth, 1);

View File

@ -0,0 +1,16 @@
; RUN: llc < %s -mtriple=x86_64-linux-pc -mcpu=penryn | FileCheck %s
; Ensure PSRAD is generated as the condition is consumed by both PADD and
; BLENDVPS. PAND requires all bits setting properly.
define <4 x i32> @foo(<4 x i32>* %p, <4 x i1> %cond, <4 x i32> %v1, <4 x i32> %v2, <4 x i32> %v3) {
%sext_cond = sext <4 x i1> %cond to <4 x i32>
%t1 = add <4 x i32> %v1, %sext_cond
%t2 = select <4 x i1> %cond, <4 x i32> %v1, <4 x i32> %v2
store <4 x i32> %t2, <4 x i32>* %p
ret <4 x i32> %t1
; CHECK: foo
; CHECK: pslld
; CHECK: psrad
; CHECK: ret
}