Update aosp/master LLVM for rebase to r239765

[android-x86/external-llvm.git] / lib / Target / SystemZ / SystemZInstrFP.td
diff --git a/lib/Target/SystemZ/SystemZInstrFP.td b/lib/Target/SystemZ/SystemZInstrFP.td

index e8841e1..27fbd7d 100644 (file)
--- a/lib/Target/SystemZ/SystemZInstrFP.td
+++ b/lib/Target/SystemZ/SystemZInstrFP.td
@@ -26,14 +26,14 @@ defm CondStoreF64 : CondStores<FP64, nonvolatile_store,
  //===----------------------------------------------------------------------===//
  
  // Load zero.
-let neverHasSideEffects = 1, isAsCheapAsAMove = 1, isMoveImm = 1 in {
+let hasSideEffects = 0, isAsCheapAsAMove = 1, isMoveImm = 1 in {
    def LZER : InherentRRE<"lzer", 0xB374, FP32,  (fpimm0)>;
    def LZDR : InherentRRE<"lzdr", 0xB375, FP64,  (fpimm0)>;
    def LZXR : InherentRRE<"lzxr", 0xB376, FP128, (fpimm0)>;
  }
  
  // Moves between two floating-point registers.
-let neverHasSideEffects = 1 in {
+let hasSideEffects = 0 in {
    def LER : UnaryRR <"le", 0x38,   null_frag, FP32,  FP32>;
    def LDR : UnaryRR <"ld", 0x28,   null_frag, FP64,  FP64>;
    def LXR : UnaryRRE<"lx", 0xB365, null_frag, FP128, FP128>;
@@ -46,9 +46,14 @@ let Defs = [CC], CCValues = 0xF, CompareZeroCCMask = 0xF in {
    defm LTDBR : LoadAndTestRRE<"ltdb", 0xB312, FP64>;
    defm LTXBR : LoadAndTestRRE<"ltxb", 0xB342, FP128>;
  }
-defm : CompareZeroFP<LTEBRCompare, FP32>;
-defm : CompareZeroFP<LTDBRCompare, FP64>;
-defm : CompareZeroFP<LTXBRCompare, FP128>;
+// Note that the comparison against zero operation is not available if we
+// have vector support, since load-and-test instructions will partially
+// clobber the target (vector) register.
+let Predicates = [FeatureNoVector] in {
+  defm : CompareZeroFP<LTEBRCompare, FP32>;
+  defm : CompareZeroFP<LTDBRCompare, FP64>;
+  defm : CompareZeroFP<LTXBRCompare, FP128>;
+}
  
  // Moves between 64-bit integer and floating-point registers.
  def LGDR : UnaryRRE<"lgd", 0xB3CD, bitconvert, GR64, FP64>;
@@ -98,6 +103,9 @@ let canFoldAsLoad = 1, SimpleBDXLoad = 1 in {
    defm LE : UnaryRXPair<"le", 0x78, 0xED64, load, FP32, 4>;
    defm LD : UnaryRXPair<"ld", 0x68, 0xED65, load, FP64, 8>;
  
+  // For z13 we prefer LDE over LE to avoid partial register dependencies.
+  def LDE32 : UnaryRXE<"lde", 0xED24, null_frag, FP32, 4>;
+
    // These instructions are split after register allocation, so we don't
    // want a custom inserter.
    let Has20BitOffset = 1, HasIndex = 1, Is128Bit = 1 in {
@@ -141,7 +149,7 @@ def LDXBRA : UnaryRRF4<"ldxbra", 0xB345, FP128, FP128>,
               Requires<[FeatureFPExtension]>;
  
  def : Pat<(f32 (fround FP128:$src)),
-          (EXTRACT_SUBREG (LEXBR FP128:$src), subreg_hh32)>;
+          (EXTRACT_SUBREG (LEXBR FP128:$src), subreg_hr32)>;
  def : Pat<(f64 (fround FP128:$src)),
            (EXTRACT_SUBREG (LDXBR FP128:$src), subreg_h64)>;
  
@@ -345,13 +353,13 @@ def MDB  : BinaryRXE<"mdb",  0xED1C, fmul, FP64, load, 8>;
  def MDEBR : BinaryRRE<"mdeb", 0xB30C, null_frag, FP64, FP32>;
  def : Pat<(fmul (f64 (fextend FP32:$src1)), (f64 (fextend FP32:$src2))),
            (MDEBR (INSERT_SUBREG (f64 (IMPLICIT_DEF)),
-                                FP32:$src1, subreg_h32), FP32:$src2)>;
+                                FP32:$src1, subreg_r32), FP32:$src2)>;
  
  // f64 multiplication of an FP32 register and an f32 memory.
  def MDEB : BinaryRXE<"mdeb", 0xED0C, null_frag, FP64, load, 4>;
  def : Pat<(fmul (f64 (fextend FP32:$src1)),
                  (f64 (extloadf32 bdxaddr12only:$addr))),
-          (MDEB (INSERT_SUBREG (f64 (IMPLICIT_DEF)), FP32:$src1, subreg_h32),
+          (MDEB (INSERT_SUBREG (f64 (IMPLICIT_DEF)), FP32:$src1, subreg_r32),
                  bdxaddr12only:$addr)>;
  
  // f128 multiplication of two FP64 registers.