[IR] redefine 'UnsafeAlgebra' / 'reassoc' fast-math-flags and add 'trans' fast-math...

[android-x86/external-llvm.git] / lib / Transforms / Scalar / Reassociate.cpp
diff --git a/lib/Transforms/Scalar/Reassociate.cpp b/lib/Transforms/Scalar/Reassociate.cpp

index 75f646d..1f32f9f 100644 (file)
--- a/lib/Transforms/Scalar/Reassociate.cpp
+++ b/lib/Transforms/Scalar/Reassociate.cpp
@@ -21,27 +21,44 @@
  //===----------------------------------------------------------------------===//
  
  #include "llvm/Transforms/Scalar/Reassociate.h"
+#include "llvm/ADT/APFloat.h"
+#include "llvm/ADT/APInt.h"
  #include "llvm/ADT/DenseMap.h"
  #include "llvm/ADT/PostOrderIterator.h"
-#include "llvm/ADT/STLExtras.h"
  #include "llvm/ADT/SetVector.h"
+#include "llvm/ADT/SmallPtrSet.h"
+#include "llvm/ADT/SmallVector.h"
  #include "llvm/ADT/Statistic.h"
  #include "llvm/Analysis/GlobalsModRef.h"
  #include "llvm/Analysis/ValueTracking.h"
+#include "llvm/IR/Argument.h"
+#include "llvm/IR/BasicBlock.h"
  #include "llvm/IR/CFG.h"
+#include "llvm/IR/Constant.h"
  #include "llvm/IR/Constants.h"
-#include "llvm/IR/DerivedTypes.h"
  #include "llvm/IR/Function.h"
  #include "llvm/IR/IRBuilder.h"
+#include "llvm/IR/InstrTypes.h"
+#include "llvm/IR/Instruction.h"
  #include "llvm/IR/Instructions.h"
-#include "llvm/IR/IntrinsicInst.h"
+#include "llvm/IR/Operator.h"
+#include "llvm/IR/PassManager.h"
+#include "llvm/IR/PatternMatch.h"
+#include "llvm/IR/Type.h"
+#include "llvm/IR/User.h"
+#include "llvm/IR/Value.h"
  #include "llvm/IR/ValueHandle.h"
  #include "llvm/Pass.h"
+#include "llvm/Support/Casting.h"
  #include "llvm/Support/Debug.h"
+#include "llvm/Support/ErrorHandling.h"
  #include "llvm/Support/raw_ostream.h"
  #include "llvm/Transforms/Scalar.h"
  #include "llvm/Transforms/Utils/Local.h"
  #include <algorithm>
+#include <cassert>
+#include <utility>
+
  using namespace llvm;
  using namespace reassociate;
  
@@ -53,7 +70,6 @@ STATISTIC(NumFactor , "Number of multiplies factored");
  
  #ifndef NDEBUG
  /// Print out the expression identified in the Ops list.
-///
  static void PrintOps(Instruction *I, const SmallVectorImpl<ValueEntry> &Ops) {
    Module *M = I->getModule();
    dbgs() << Instruction::getOpcodeName(I->getOpcode()) << " "
@@ -106,11 +122,12 @@ XorOpnd::XorOpnd(Value *V) {
              I->getOpcode() == Instruction::And)) {
      Value *V0 = I->getOperand(0);
      Value *V1 = I->getOperand(1);
-    if (isa<ConstantInt>(V0))
+    const APInt *C;
+    if (match(V0, PatternMatch::m_APInt(C)))
        std::swap(V0, V1);
  
-    if (ConstantInt *C = dyn_cast<ConstantInt>(V1)) {
-      ConstPart = C->getValue();
+    if (match(V1, PatternMatch::m_APInt(C))) {
+      ConstPart = *C;
        SymbolicPart = V0;
        isOr = (I->getOpcode() == Instruction::Or);
        return;
@@ -119,7 +136,7 @@ XorOpnd::XorOpnd(Value *V) {
  
    // view the operand as "V | 0"
    SymbolicPart = V;
-  ConstPart = APInt::getNullValue(V->getType()->getIntegerBitWidth());
+  ConstPart = APInt::getNullValue(V->getType()->getScalarSizeInBits());
    isOr = true;
  }
  
@@ -128,8 +145,7 @@ XorOpnd::XorOpnd(Value *V) {
  static BinaryOperator *isReassociableOp(Value *V, unsigned Opcode) {
    if (V->hasOneUse() && isa<Instruction>(V) &&
        cast<Instruction>(V)->getOpcode() == Opcode &&
-      (!isa<FPMathOperator>(V) ||
-       cast<Instruction>(V)->hasUnsafeAlgebra()))
+      (!isa<FPMathOperator>(V) || cast<Instruction>(V)->isFast()))
      return cast<BinaryOperator>(V);
    return nullptr;
  }
@@ -139,33 +155,32 @@ static BinaryOperator *isReassociableOp(Value *V, unsigned Opcode1,
    if (V->hasOneUse() && isa<Instruction>(V) &&
        (cast<Instruction>(V)->getOpcode() == Opcode1 ||
         cast<Instruction>(V)->getOpcode() == Opcode2) &&
-      (!isa<FPMathOperator>(V) ||
-       cast<Instruction>(V)->hasUnsafeAlgebra()))
+      (!isa<FPMathOperator>(V) || cast<Instruction>(V)->isFast()))
      return cast<BinaryOperator>(V);
    return nullptr;
  }
  
-void ReassociatePass::BuildRankMap(
-    Function &F, ReversePostOrderTraversal<Function *> &RPOT) {
-  unsigned i = 2;
+void ReassociatePass::BuildRankMap(Function &F,
+                                   ReversePostOrderTraversal<Function*> &RPOT) {
+  unsigned Rank = 2;
  
    // Assign distinct ranks to function arguments.
-  for (Function::arg_iterator I = F.arg_begin(), E = F.arg_end(); I != E; ++I) {
-    ValueRankMap[&*I] = ++i;
-    DEBUG(dbgs() << "Calculated Rank[" << I->getName() << "] = " << i << "\n");
+  for (auto &Arg : F.args()) {
+    ValueRankMap[&Arg] = ++Rank;
+    DEBUG(dbgs() << "Calculated Rank[" << Arg.getName() << "] = " << Rank
+                 << "\n");
    }
  
-  for (ReversePostOrderTraversal<Function*>::rpo_iterator I = RPOT.begin(),
-         E = RPOT.end(); I != E; ++I) {
-    BasicBlock *BB = *I;
-    unsigned BBRank = RankMap[BB] = ++i << 16;
+  // Traverse basic blocks in ReversePostOrder
+  for (BasicBlock *BB : RPOT) {
+    unsigned BBRank = RankMap[BB] = ++Rank << 16;
  
      // Walk the basic block, adding precomputed ranks for any instructions that
      // we cannot move.  This ensures that the ranks for these instructions are
      // all different in the block.
-    for (BasicBlock::iterator I = BB->begin(), E = BB->end(); I != E; ++I)
-      if (mayBeMemoryDependent(*I))
-        ValueRankMap[&*I] = ++BBRank;
+    for (Instruction &I : *BB)
+      if (mayBeMemoryDependent(I))
+        ValueRankMap[&I] = ++BBRank;
    }
  }
  
@@ -206,13 +221,9 @@ void ReassociatePass::canonicalizeOperands(Instruction *I) {
  
    Value *LHS = I->getOperand(0);
    Value *RHS = I->getOperand(1);
-  unsigned LHSRank = getRank(LHS);
-  unsigned RHSRank = getRank(RHS);
-
-  if (isa<Constant>(RHS))
+  if (LHS == RHS || isa<Constant>(RHS))
      return;
-
-  if (isa<Constant>(LHS) || RHSRank < LHSRank)
+  if (isa<Constant>(LHS) || getRank(RHS) < getRank(LHS))
      cast<BinaryOperator>(I)->swapOperands();
  }
  
@@ -356,7 +367,7 @@ static void IncorporateWeight(APInt &LHS, const APInt &RHS, unsigned Opcode) {
    }
  }
  
-typedef std::pair<Value*, APInt> RepeatedValue;
+using RepeatedValue = std::pair<Value*, APInt>;
  
  /// Given an associative binary expression, return the leaf
  /// nodes in Ops along with their weights (how many times the leaf occurs).  The
@@ -431,7 +442,6 @@ typedef std::pair<Value*, APInt> RepeatedValue;
  /// that have all uses inside the expression (i.e. only used by non-leaf nodes
  /// of the expression) if it can turn them into binary operators of the right
  /// type and thus make the expression bigger.
-
  static bool LinearizeExprTree(BinaryOperator *I,
                                SmallVectorImpl<RepeatedValue> &Ops) {
    DEBUG(dbgs() << "LINEARIZE: " << *I << '\n');
@@ -469,12 +479,12 @@ static bool LinearizeExprTree(BinaryOperator *I,
  
    // Leaves - Keeps track of the set of putative leaves as well as the number of
    // paths to each leaf seen so far.
-  typedef DenseMap<Value*, APInt> LeafMap;
+  using LeafMap = DenseMap<Value *, APInt>;
    LeafMap Leaves; // Leaf -> Total weight so far.
-  SmallVector<Value*, 8> LeafOrder; // Ensure deterministic leaf output order.
+  SmallVector<Value *, 8> LeafOrder; // Ensure deterministic leaf output order.
  
  #ifndef NDEBUG
-  SmallPtrSet<Value*, 8> Visited; // For sanity checking the iteration scheme.
+  SmallPtrSet<Value *, 8> Visited; // For sanity checking the iteration scheme.
  #endif
    while (!Worklist.empty()) {
      std::pair<BinaryOperator*, APInt> P = Worklist.pop_back_val();
@@ -509,9 +519,10 @@ static bool LinearizeExprTree(BinaryOperator *I,
            continue;
          }
          // No uses outside the expression, try morphing it.
-      } else if (It != Leaves.end()) {
+      } else {
          // Already in the leaf map.
-        assert(Visited.count(Op) && "In leaf map but not visited!");
+        assert(It != Leaves.end() && Visited.count(Op) &&
+               "In leaf map but not visited!");
  
          // Update the number of paths to the leaf.
          IncorporateWeight(It->second, Weight, Opcode);
@@ -552,7 +563,7 @@ static bool LinearizeExprTree(BinaryOperator *I,
        assert((!isa<Instruction>(Op) ||
                cast<Instruction>(Op)->getOpcode() != Opcode
                || (isa<FPMathOperator>(Op) &&
-                  !cast<Instruction>(Op)->hasUnsafeAlgebra())) &&
+                  !cast<Instruction>(Op)->isFast())) &&
               "Should have been handled above!");
        assert(Op->hasOneUse() && "Has uses outside the expression tree!");
  
@@ -771,7 +782,7 @@ void ReassociatePass::RewriteExprTree(BinaryOperator *I,
          break;
        ExpressionChanged->moveBefore(I);
        ExpressionChanged = cast<BinaryOperator>(*ExpressionChanged->user_begin());
-    } while (1);
+    } while (true);
  
    // Throw away any left over nodes from the original expression.
    for (unsigned i = 0, e = NodesToRewrite.size(); i != e; ++i)
@@ -794,7 +805,6 @@ static Value *NegateValue(Value *V, Instruction *BI,
      return ConstantExpr::getNeg(C);
    }
  
-
    // We are trying to expose opportunity for reassociation.  One of the things
    // that we want to do to achieve this is to push a negation as deep into an
    // expression chain as possible, to expose the add instructions.  In practice,
@@ -911,7 +921,6 @@ BreakUpSubtract(Instruction *Sub, SetVector<AssertingVH<Instruction>> &ToRedo) {
    //
    // Calculate the negative value of Operand 1 of the sub instruction,
    // and set it as the RHS of the add instruction we just made.
-  //
    Value *NegVal = NegateValue(Sub->getOperand(1), Sub, ToRedo);
    BinaryOperator *New = CreateAdd(Sub->getOperand(0), NegVal, "", Sub, Sub);
    Sub->setOperand(0, Constant::getNullValue(Sub->getType())); // Drop use of op.
@@ -955,8 +964,8 @@ static BinaryOperator *ConvertShiftToMul(Instruction *Shl) {
  /// Scan backwards and forwards among values with the same rank as element i
  /// to see if X exists.  If X does not exist, return i.  This is useful when
  /// scanning for 'x' when we see '-x' because they both get the same rank.
-static unsigned FindInOperandList(SmallVectorImpl<ValueEntry> &Ops, unsigned i,
-                                  Value *X) {
+static unsigned FindInOperandList(const SmallVectorImpl<ValueEntry> &Ops,
+                                  unsigned i, Value *X) {
    unsigned XRank = Ops[i].Rank;
    unsigned e = Ops.size();
    for (unsigned j = i+1; j != e && Ops[j].Rank == XRank; ++j) {
@@ -982,7 +991,7 @@ static unsigned FindInOperandList(SmallVectorImpl<ValueEntry> &Ops, unsigned i,
  /// Emit a tree of add instructions, summing Ops together
  /// and returning the result.  Insert the tree before I.
  static Value *EmitAddTreeOfValues(Instruction *I,
-                                  SmallVectorImpl<WeakVH> &Ops){
+                                  SmallVectorImpl<WeakTrackingVH> &Ops) {
    if (Ops.size() == 1) return Ops.back();
  
    Value *V1 = Ops.back();
@@ -1028,7 +1037,7 @@ Value *ReassociatePass::RemoveFactorFromExpression(Value *V, Value *Factor) {
          }
      } else if (ConstantFP *FC1 = dyn_cast<ConstantFP>(Factor)) {
        if (ConstantFP *FC2 = dyn_cast<ConstantFP>(Factors[i].Op)) {
-        APFloat F1(FC1->getValueAPF());
+        const APFloat &F1 = FC1->getValueAPF();
          APFloat F2(FC2->getValueAPF());
          F2.changeSign();
          if (F1.compare(F2) == APFloat::cmpEqual) {
@@ -1069,8 +1078,7 @@ Value *ReassociatePass::RemoveFactorFromExpression(Value *V, Value *Factor) {
  ///
  /// Ops is the top-level list of add operands we're trying to factor.
  static void FindSingleUseMultiplyFactors(Value *V,
-                                         SmallVectorImpl<Value*> &Factors,
-                                       const SmallVectorImpl<ValueEntry> &Ops) {
+                                         SmallVectorImpl<Value*> &Factors) {
    BinaryOperator *BO = isReassociableOp(V, Instruction::Mul, Instruction::FMul);
    if (!BO) {
      Factors.push_back(V);
@@ -1078,8 +1086,8 @@ static void FindSingleUseMultiplyFactors(Value *V,
    }
  
    // Otherwise, add the LHS and RHS to the list of factors.
-  FindSingleUseMultiplyFactors(BO->getOperand(1), Factors, Ops);
-  FindSingleUseMultiplyFactors(BO->getOperand(0), Factors, Ops);
+  FindSingleUseMultiplyFactors(BO->getOperand(1), Factors);
+  FindSingleUseMultiplyFactors(BO->getOperand(0), Factors);
  }
  
  /// Optimize a series of operands to an 'and', 'or', or 'xor' instruction.
@@ -1135,20 +1143,19 @@ static Value *OptimizeAndOrXor(unsigned Opcode,
  /// instruction. There are two special cases: 1) if the constant operand is 0,
  /// it will return NULL. 2) if the constant is ~0, the symbolic operand will
  /// be returned.
-static Value *createAndInstr(Instruction *InsertBefore, Value *Opnd, 
+static Value *createAndInstr(Instruction *InsertBefore, Value *Opnd,
                               const APInt &ConstOpnd) {
-  if (ConstOpnd != 0) {
-    if (!ConstOpnd.isAllOnesValue()) {
-      LLVMContext &Ctx = Opnd->getType()->getContext();
-      Instruction *I;
-      I = BinaryOperator::CreateAnd(Opnd, ConstantInt::get(Ctx, ConstOpnd),
-                                    "and.ra", InsertBefore);
-      I->setDebugLoc(InsertBefore->getDebugLoc());
-      return I;
-    }
+  if (ConstOpnd.isNullValue())
+    return nullptr;
+
+  if (ConstOpnd.isAllOnesValue())
      return Opnd;
-  }
-  return nullptr;
+
+  Instruction *I = BinaryOperator::CreateAnd(
+      Opnd, ConstantInt::get(Opnd->getType(), ConstOpnd), "and.ra",
+      InsertBefore);
+  I->setDebugLoc(InsertBefore->getDebugLoc());
+  return I;
  }
  
  // Helper function of OptimizeXor(). It tries to simplify "Opnd1 ^ ConstOpnd"
@@ -1157,33 +1164,31 @@ static Value *createAndInstr(Instruction *InsertBefore, Value *Opnd,
  // If it was successful, true is returned, and the "R" and "C" is returned
  // via "Res" and "ConstOpnd", respectively; otherwise, false is returned,
  // and both "Res" and "ConstOpnd" remain unchanged.
-//
  bool ReassociatePass::CombineXorOpnd(Instruction *I, XorOpnd *Opnd1,
                                       APInt &ConstOpnd, Value *&Res) {
    // Xor-Rule 1: (x | c1) ^ c2 = (x | c1) ^ (c1 ^ c1) ^ c2 
    //                       = ((x | c1) ^ c1) ^ (c1 ^ c2)
    //                       = (x & ~c1) ^ (c1 ^ c2)
    // It is useful only when c1 == c2.
-  if (Opnd1->isOrExpr() && Opnd1->getConstPart() != 0) {
-    if (!Opnd1->getValue()->hasOneUse())
-      return false;
+  if (!Opnd1->isOrExpr() || Opnd1->getConstPart().isNullValue())
+    return false;
  
-    const APInt &C1 = Opnd1->getConstPart();
-    if (C1 != ConstOpnd)
-      return false;
+  if (!Opnd1->getValue()->hasOneUse())
+    return false;
  
-    Value *X = Opnd1->getSymbolicPart();
-    Res = createAndInstr(I, X, ~C1);
-    // ConstOpnd was C2, now C1 ^ C2.
-    ConstOpnd ^= C1;
+  const APInt &C1 = Opnd1->getConstPart();
+  if (C1 != ConstOpnd)
+    return false;
  
-    if (Instruction *T = dyn_cast<Instruction>(Opnd1->getValue()))
-      RedoInsts.insert(T);
-    return true;
-  }
-  return false;
-}
+  Value *X = Opnd1->getSymbolicPart();
+  Res = createAndInstr(I, X, ~C1);
+  // ConstOpnd was C2, now C1 ^ C2.
+  ConstOpnd ^= C1;
  
+  if (Instruction *T = dyn_cast<Instruction>(Opnd1->getValue()))
+    RedoInsts.insert(T);
+  return true;
+}
                             
  // Helper function of OptimizeXor(). It tries to simplify
  // "Opnd1 ^ Opnd2 ^ ConstOpnd" into "R ^ C", where C would be 0, and R is a
@@ -1222,15 +1227,14 @@ bool ReassociatePass::CombineXorOpnd(Instruction *I, XorOpnd *Opnd1,
      APInt C3((~C1) ^ C2);
  
      // Do not increase code size!
-    if (C3 != 0 && !C3.isAllOnesValue()) {
-      int NewInstNum = ConstOpnd != 0 ? 1 : 2;
+    if (!C3.isNullValue() && !C3.isAllOnesValue()) {
+      int NewInstNum = ConstOpnd.getBoolValue() ? 1 : 2;
        if (NewInstNum > DeadInstNum)
          return false;
      }
  
      Res = createAndInstr(I, X, C3);
      ConstOpnd ^= C1;
-
    } else if (Opnd1->isOrExpr()) {
      // Xor-Rule 3: (x | c1) ^ (x | c2) = (x & c3) ^ c3 where c3 = c1 ^ c2
      //
@@ -1239,8 +1243,8 @@ bool ReassociatePass::CombineXorOpnd(Instruction *I, XorOpnd *Opnd1,
      APInt C3 = C1 ^ C2;
      
      // Do not increase code size
-    if (C3 != 0 && !C3.isAllOnesValue()) {
-      int NewInstNum = ConstOpnd != 0 ? 1 : 2;
+    if (!C3.isNullValue() && !C3.isAllOnesValue()) {
+      int NewInstNum = ConstOpnd.getBoolValue() ? 1 : 2;
        if (NewInstNum > DeadInstNum)
          return false;
      }
@@ -1280,17 +1284,20 @@ Value *ReassociatePass::OptimizeXor(Instruction *I,
    SmallVector<XorOpnd, 8> Opnds;
    SmallVector<XorOpnd*, 8> OpndPtrs;
    Type *Ty = Ops[0].Op->getType();
-  APInt ConstOpnd(Ty->getIntegerBitWidth(), 0);
+  APInt ConstOpnd(Ty->getScalarSizeInBits(), 0);
  
    // Step 1: Convert ValueEntry to XorOpnd
    for (unsigned i = 0, e = Ops.size(); i != e; ++i) {
      Value *V = Ops[i].Op;
-    if (!isa<ConstantInt>(V)) {
+    const APInt *C;
+    // TODO: Support non-splat vectors.
+    if (match(V, PatternMatch::m_APInt(C))) {
+      ConstOpnd ^= *C;
+    } else {
        XorOpnd O(V);
        O.setSymbolicRank(getRank(O.getSymbolicPart()));
        Opnds.push_back(O);
-    } else
-      ConstOpnd ^= cast<ConstantInt>(V)->getValue();
+    }
    }
  
    // NOTE: From this point on, do *NOT* add/delete element to/from "Opnds".
@@ -1328,7 +1335,8 @@ Value *ReassociatePass::OptimizeXor(Instruction *I,
      Value *CV;
  
      // Step 3.1: Try simplifying "CurrOpnd ^ ConstOpnd"
-    if (ConstOpnd != 0 && CombineXorOpnd(I, CurrOpnd, ConstOpnd, CV)) {
+    if (!ConstOpnd.isNullValue() &&
+        CombineXorOpnd(I, CurrOpnd, ConstOpnd, CV)) {
        Changed = true;
        if (CV)
          *CurrOpnd = XorOpnd(CV);
@@ -1345,7 +1353,6 @@ Value *ReassociatePass::OptimizeXor(Instruction *I,
  
      // step 3.2: When previous and current operands share the same symbolic
      //  value, try to simplify "PrevOpnd ^ CurrOpnd ^ ConstOpnd" 
-    //    
      if (CombineXorOpnd(I, CurrOpnd, PrevOpnd, ConstOpnd, CV)) {
        // Remove previous operand
        PrevOpnd->Invalidate();
@@ -1370,17 +1377,17 @@ Value *ReassociatePass::OptimizeXor(Instruction *I,
        ValueEntry VE(getRank(O.getValue()), O.getValue());
        Ops.push_back(VE);
      }
-    if (ConstOpnd != 0) {
-      Value *C = ConstantInt::get(Ty->getContext(), ConstOpnd);
+    if (!ConstOpnd.isNullValue()) {
+      Value *C = ConstantInt::get(Ty, ConstOpnd);
        ValueEntry VE(getRank(C), C);
        Ops.push_back(VE);
      }
-    int Sz = Ops.size();
+    unsigned Sz = Ops.size();
      if (Sz == 1)
        return Ops.back().Op;
-    else if (Sz == 0) {
-      assert(ConstOpnd == 0);
-      return ConstantInt::get(Ty->getContext(), ConstOpnd);
+    if (Sz == 0) {
+      assert(ConstOpnd.isNullValue());
+      return ConstantInt::get(Ty, ConstOpnd);
      }
    }
  
@@ -1499,7 +1506,7 @@ Value *ReassociatePass::OptimizeAdd(Instruction *I,
  
      // Compute all of the factors of this added value.
      SmallVector<Value*, 8> Factors;
-    FindSingleUseMultiplyFactors(BOp, Factors, Ops);
+    FindSingleUseMultiplyFactors(BOp, Factors);
      assert(Factors.size() > 1 && "Bad linearize!");
  
      // Add one to FactorOccurrences for each unique factor in this op.
@@ -1521,8 +1528,8 @@ Value *ReassociatePass::OptimizeAdd(Instruction *I,
        if (ConstantInt *CI = dyn_cast<ConstantInt>(Factor)) {
          if (CI->isNegative() && !CI->isMinValue(true)) {
            Factor = ConstantInt::get(CI->getContext(), -CI->getValue());
-          assert(!Duplicates.count(Factor) &&
-                 "Shouldn't have two constant factors, missed a canonicalize");
+          if (!Duplicates.insert(Factor).second)
+            continue;
            unsigned Occ = ++FactorOccurrences[Factor];
            if (Occ > MaxOcc) {
              MaxOcc = Occ;
@@ -1534,8 +1541,8 @@ Value *ReassociatePass::OptimizeAdd(Instruction *I,
            APFloat F(CF->getValueAPF());
            F.changeSign();
            Factor = ConstantFP::get(CF->getContext(), F);
-          assert(!Duplicates.count(Factor) &&
-                 "Shouldn't have two constant factors, missed a canonicalize");
+          if (!Duplicates.insert(Factor).second)
+            continue;
            unsigned Occ = ++FactorOccurrences[Factor];
            if (Occ > MaxOcc) {
              MaxOcc = Occ;
@@ -1560,7 +1567,7 @@ Value *ReassociatePass::OptimizeAdd(Instruction *I,
              ? BinaryOperator::CreateAdd(MaxOccVal, MaxOccVal)
              : BinaryOperator::CreateFAdd(MaxOccVal, MaxOccVal);
  
-    SmallVector<WeakVH, 4> NewMulOps;
+    SmallVector<WeakTrackingVH, 4> NewMulOps;
      for (unsigned i = 0; i != Ops.size(); ++i) {
        // Only try to remove factors from expressions we're allowed to.
        BinaryOperator *BOp =
@@ -1583,7 +1590,7 @@ Value *ReassociatePass::OptimizeAdd(Instruction *I,
      }
  
      // No need for extra uses anymore.
-    delete DummyInst;
+    DummyInst->deleteValue();
  
      unsigned NumAddedValues = NewMulOps.size();
      Value *V = EmitAddTreeOfValues(I, NewMulOps);
@@ -1628,8 +1635,8 @@ Value *ReassociatePass::OptimizeAdd(Instruction *I,
  ///   ((((x*y)*x)*y)*x) -> [(x, 3), (y, 2)]
  ///
  /// \returns Whether any factors have a power greater than one.
-bool ReassociatePass::collectMultiplyFactors(SmallVectorImpl<ValueEntry> &Ops,
-                                             SmallVectorImpl<Factor> &Factors) {
+static bool collectMultiplyFactors(SmallVectorImpl<ValueEntry> &Ops,
+                                   SmallVectorImpl<Factor> &Factors) {
    // FIXME: Have Ops be (ValueEntry, Multiplicity) pairs, simplifying this.
    // Compute the sum of powers of simplifiable factors.
    unsigned FactorPowerSum = 0;
@@ -1778,6 +1785,12 @@ Value *ReassociatePass::OptimizeMul(BinaryOperator *I,
      return nullptr; // All distinct factors, so nothing left for us to do.
  
    IRBuilder<> Builder(I);
+  // The reassociate transformation for FP operations is performed only
+  // if unsafe algebra is permitted by FastMathFlags. Propagate those flags
+  // to the newly generated operations.
+  if (auto FPI = dyn_cast<FPMathOperator>(I))
+    Builder.setFastMathFlags(FPI->getFastMathFlags());
+
    Value *V = buildMinimalMultiplyDAG(Builder, Factors);
    if (Ops.empty())
      return V;
@@ -1865,6 +1878,8 @@ void ReassociatePass::RecursivelyEraseDeadInsts(
  /// Zap the given instruction, adding interesting operands to the work list.
  void ReassociatePass::EraseInst(Instruction *I) {
    assert(isInstructionTriviallyDead(I) && "Trivially dead instructions only!");
+  DEBUG(dbgs() << "Erasing dead inst: "; I->dump());
+
    SmallVector<Value*, 8> Ops(I->op_begin(), I->op_end());
    // Erase the dead instruction.
    ValueRankMap.erase(I);
@@ -1882,6 +1897,8 @@ void ReassociatePass::EraseInst(Instruction *I) {
          Op = Op->user_back();
        RedoInsts.insert(Op);
      }
+
+  MadeChange = true;
  }
  
  // Canonicalize expressions of the following form:
@@ -1915,7 +1932,7 @@ Instruction *ReassociatePass::canonicalizeNegConstExpr(Instruction *I) {
  
    // User must be a binary operator with one or more uses.
    Instruction *User = I->user_back();
-  if (!isa<BinaryOperator>(User) || !User->hasNUsesOrMore(1))
+  if (!isa<BinaryOperator>(User) || User->use_empty())
      return nullptr;
  
    unsigned UserOpcode = User->getOpcode();
@@ -1927,6 +1944,12 @@ Instruction *ReassociatePass::canonicalizeNegConstExpr(Instruction *I) {
    if (!User->isCommutative() && User->getOperand(1) != I)
      return nullptr;
  
+  // Don't canonicalize x + (-Constant * y) -> x - (Constant * y), if the
+  // resulting subtract will be broken up later.  This can get us into an
+  // infinite loop during reassociation.
+  if (UserOpcode == Instruction::FAdd && ShouldBreakUpSubtract(User))
+    return nullptr;
+
    // Change the sign of the constant.
    APFloat Val = CF->getValueAPF();
    Val.changeSign();
@@ -1992,13 +2015,8 @@ void ReassociatePass::OptimizeInst(Instruction *I) {
    if (I->isCommutative())
      canonicalizeOperands(I);
  
-  // TODO: We should optimize vector Xor instructions, but they are
-  // currently unsupported.
-  if (I->getType()->isVectorTy() && I->getOpcode() == Instruction::Xor)
-    return;
-
-  // Don't optimize floating point instructions that don't have unsafe algebra.
-  if (I->getType()->isFPOrFPVectorTy() && !I->hasUnsafeAlgebra())
+  // Don't optimize floating-point instructions unless they are 'fast'.
+  if (I->getType()->isFPOrFPVectorTy() && !I->isFast())
      return;
  
    // Do not reassociate boolean (i1) expressions.  We want to preserve the
@@ -2125,7 +2143,8 @@ void ReassociatePass::ReassociateExpression(BinaryOperator *I) {
      DEBUG(dbgs() << "Reassoc to scalar: " << *V << '\n');
      I->replaceAllUsesWith(V);
      if (Instruction *VI = dyn_cast<Instruction>(V))
-      VI->setDebugLoc(I->getDebugLoc());
+      if (I->getDebugLoc())
+        VI->setDebugLoc(I->getDebugLoc());
      RedoInsts.insert(I);
      ++NumAnnihil;
      return;
@@ -2139,7 +2158,7 @@ void ReassociatePass::ReassociateExpression(BinaryOperator *I) {
      if (I->getOpcode() == Instruction::Mul &&
          cast<Instruction>(I->user_back())->getOpcode() == Instruction::Add &&
          isa<ConstantInt>(Ops.back().Op) &&
-        cast<ConstantInt>(Ops.back().Op)->isAllOnesValue()) {
+        cast<ConstantInt>(Ops.back().Op)->isMinusOne()) {
        ValueEntry Tmp = Ops.pop_back_val();
        Ops.insert(Ops.begin(), Tmp);
      } else if (I->getOpcode() == Instruction::FMul &&
@@ -2173,29 +2192,22 @@ void ReassociatePass::ReassociateExpression(BinaryOperator *I) {
    RewriteExprTree(I, Ops);
  }
  
-PreservedAnalyses ReassociatePass::run(Function &F) {
-  // Reassociate needs for each instruction to have its operands already
-  // processed, so we first perform a RPOT of the basic blocks so that
-  // when we process a basic block, all its dominators have been processed
-  // before.
+PreservedAnalyses ReassociatePass::run(Function &F, FunctionAnalysisManager &) {
+  // Get the functions basic blocks in Reverse Post Order. This order is used by
+  // BuildRankMap to pre calculate ranks correctly. It also excludes dead basic
+  // blocks (it has been seen that the analysis in this pass could hang when
+  // analysing dead basic blocks).
    ReversePostOrderTraversal<Function *> RPOT(&F);
+
+  // Calculate the rank map for F.
    BuildRankMap(F, RPOT);
  
    MadeChange = false;
+  // Traverse the same blocks that was analysed by BuildRankMap.
    for (BasicBlock *BI : RPOT) {
-    // Use a worklist to keep track of which instructions have been processed
-    // (and which insts won't be optimized again) so when redoing insts,
-    // optimize insts rightaway which won't be processed later.
-    SmallSet<Instruction *, 8> Worklist;
-
-    // Insert all instructions in the BB
-    for (Instruction &I : *BI)
-      Worklist.insert(&I);
-
+    assert(RankMap.count(&*BI) && "BB should be ranked.");
      // Optimize every instruction in the basic block.
-    for (BasicBlock::iterator II = BI->begin(), IE = BI->end(); II != IE;) {
-      // This instruction has been processed.
-      Worklist.erase(&*II);
+    for (BasicBlock::iterator II = BI->begin(), IE = BI->end(); II != IE;)
        if (isInstructionTriviallyDead(&*II)) {
          EraseInst(&*II++);
        } else {
@@ -2204,23 +2216,30 @@ PreservedAnalyses ReassociatePass::run(Function &F) {
          ++II;
        }
  
-      // If the above optimizations produced new instructions to optimize or
-      // made modifications which need to be redone, do them now if they won't
-      // be handled later.
-      while (!RedoInsts.empty()) {
-        Instruction *I = RedoInsts.pop_back_val();
-        // Process instructions that won't be processed later, either
-        // inside the block itself or in another basic block (based on rank),
-        // since these will be processed later.
-        if ((I->getParent() != BI || !Worklist.count(I)) &&
-            RankMap[I->getParent()] <= RankMap[BI]) {
-          if (isInstructionTriviallyDead(I))
-            EraseInst(I);
-          else
-            OptimizeInst(I);
-        }
+    // Make a copy of all the instructions to be redone so we can remove dead
+    // instructions.
+    SetVector<AssertingVH<Instruction>> ToRedo(RedoInsts);
+    // Iterate over all instructions to be reevaluated and remove trivially dead
+    // instructions. If any operand of the trivially dead instruction becomes
+    // dead mark it for deletion as well. Continue this process until all
+    // trivially dead instructions have been removed.
+    while (!ToRedo.empty()) {
+      Instruction *I = ToRedo.pop_back_val();
+      if (isInstructionTriviallyDead(I)) {
+        RecursivelyEraseDeadInsts(I, ToRedo);
+        MadeChange = true;
        }
      }
+
+    // Now that we have removed dead instructions, we can reoptimize the
+    // remaining instructions.
+    while (!RedoInsts.empty()) {
+      Instruction *I = RedoInsts.pop_back_val();
+      if (isInstructionTriviallyDead(I))
+        EraseInst(I);
+      else
+        OptimizeInst(I);
+    }
    }
  
    // We are done with the rank map.
@@ -2228,9 +2247,8 @@ PreservedAnalyses ReassociatePass::run(Function &F) {
    ValueRankMap.clear();
  
    if (MadeChange) {
-    // FIXME: Reassociate should also 'preserve the CFG'.
-    // The new pass manager has currently no way to do it.
-    auto PA = PreservedAnalyses();
+    PreservedAnalyses PA;
+    PA.preserveSet<CFGAnalyses>();
      PA.preserve<GlobalsAA>();
      return PA;
    }
@@ -2239,10 +2257,13 @@ PreservedAnalyses ReassociatePass::run(Function &F) {
  }
  
  namespace {
+
    class ReassociateLegacyPass : public FunctionPass {
      ReassociatePass Impl;
+
    public:
      static char ID; // Pass identification, replacement for typeid
+
      ReassociateLegacyPass() : FunctionPass(ID) {
        initializeReassociateLegacyPassPass(*PassRegistry::getPassRegistry());
      }
@@ -2251,7 +2272,8 @@ namespace {
        if (skipFunction(F))
          return false;
  
-      auto PA = Impl.run(F);
+      FunctionAnalysisManager DummyFAM;
+      auto PA = Impl.run(F, DummyFAM);
        return !PA.areAllPreserved();
      }
  
@@ -2260,9 +2282,11 @@ namespace {
        AU.addPreserved<GlobalsAAWrapperPass>();
      }
    };
-}
+
+} // end anonymous namespace
  
  char ReassociateLegacyPass::ID = 0;
+
  INITIALIZE_PASS(ReassociateLegacyPass, "reassociate",
                  "Reassociate expressions", false, false)