From 07e4b00a1a2d28985307c0e04e7508879b4ca270 Mon Sep 17 00:00:00 2001 From: Evan Cheng Date: Mon, 16 Oct 2006 06:34:55 +0000 Subject: [PATCH] SelectScalarSSELoad should call CanBeFoldedBy as well. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@30973 91177308-0d34-0410-b5e6-96231b3b80d8 --- lib/Target/X86/X86ISelDAGToDAG.cpp | 10 +++++++--- 1 file changed, 7 insertions(+), 3 deletions(-) diff --git a/lib/Target/X86/X86ISelDAGToDAG.cpp b/lib/Target/X86/X86ISelDAGToDAG.cpp index 3721fad5c3e..550e52c856f 100644 --- a/lib/Target/X86/X86ISelDAGToDAG.cpp +++ b/lib/Target/X86/X86ISelDAGToDAG.cpp @@ -147,7 +147,8 @@ namespace { SDOperand &Index, SDOperand &Disp); bool SelectLEAAddr(SDOperand N, SDOperand &Base, SDOperand &Scale, SDOperand &Index, SDOperand &Disp); - bool SelectScalarSSELoad(SDOperand N, SDOperand &Base, SDOperand &Scale, + bool SelectScalarSSELoad(SDOperand Root, SDOperand Pred, + SDOperand N, SDOperand &Base, SDOperand &Scale, SDOperand &Index, SDOperand &Disp, SDOperand &InChain, SDOperand &OutChain); bool TryFoldLoad(SDOperand P, SDOperand N, @@ -804,13 +805,16 @@ static inline bool isZeroNode(SDOperand Elt) { /// SelectScalarSSELoad - Match a scalar SSE load. In particular, we want to /// match a load whose top elements are either undef or zeros. The load flavor /// is derived from the type of N, which is either v4f32 or v2f64. 
-bool X86DAGToDAGISel::SelectScalarSSELoad(SDOperand N, SDOperand &Base, +bool X86DAGToDAGISel::SelectScalarSSELoad(SDOperand Root, SDOperand Pred, + SDOperand N, SDOperand &Base, SDOperand &Scale, SDOperand &Index, SDOperand &Disp, SDOperand &InChain, SDOperand &OutChain) { if (N.getOpcode() == ISD::SCALAR_TO_VECTOR) { InChain = N.getOperand(0).getValue(1); - if (ISD::isNON_EXTLoad(InChain.Val) && InChain.getValue(0).hasOneUse()) { + if (ISD::isNON_EXTLoad(InChain.Val) && + InChain.getValue(0).hasOneUse() && + CanBeFoldedBy(N.Val, Pred.Val, Root.Val)) { LoadSDNode *LD = cast<LoadSDNode>(InChain); if (!SelectAddr(LD->getBasePtr(), Base, Scale, Index, Disp)) return false; -- 2.11.0