// instructions per cycle.
let IssueWidth = 4;
let MicroOpBufferSize = 192; // Based on the reorder buffer.
- let LoadLatency = 4;
+ let LoadLatency = 5;
let MispredictPenalty = 16;
// Based on the LSD (loop-stream detector) queue size and benchmarking data.
// Integer division issued on port 0.
// Modeled as its own ProcResource, declared with a unit count of 1.
def HWDivider : ProcResource<1>;
// The ReadAfterLd advance is changed in step with the load latency used
// elsewhere in this patch (LoadLatency and WriteLoad also go from 4 to 5).
-// Loads are 4 cycles, so ReadAfterLd registers needn't be available until 4
+// Loads are 5 cycles, so ReadAfterLd registers needn't be available until 5
// cycles after the memory operand.
-def : ReadAdvance<ReadAfterLd, 4>;
+def : ReadAdvance<ReadAfterLd, 5>;
// Many SchedWrites are defined in pairs with and without a folded load.
// Instructions with folded loads are usually micro-fused, so they only appear
// Register variant is using a single cycle on ExePort.
def : WriteRes<SchedRW, [ExePort]> { let Latency = Lat; }
- // Memory variant also uses a cycle on port 2/3 and adds 4 cycles to the
+ // Memory variant also uses a cycle on port 2/3 and adds 5 cycles to the
// latency.
def : WriteRes<SchedRW.Folded, [HWPort23, ExePort]> {
- let Latency = !add(Lat, 4);
+ let Latency = !add(Lat, 5);
}
}
// Store_addr on 237.
// Store_data on 4.
def : WriteRes<WriteStore, [HWPort237, HWPort4]>;
// Plain loads use HWPort23; this patch raises their latency from 4 to 5.
-def : WriteRes<WriteLoad, [HWPort23]> { let Latency = 4; }
+def : WriteRes<WriteLoad, [HWPort23]> { let Latency = 5; }
// Moves use HWPort0156; no explicit latency is set here.
def : WriteRes<WriteMove, [HWPort0156]>;
// WriteZero is bound to an empty resource list.
def : WriteRes<WriteZero, []>;
// MOVSX, MOVZX.
// r,m.
// After this patch only the rm8 forms match this pattern; the rm16
// alternative is dropped from the regex.
-def : InstRW<[WriteLoad], (instregex "MOV(S|Z)X32rm(8|16)")>;
+def : InstRW<[WriteLoad], (instregex "MOV(S|Z)X32rm8")>;
// XLAT.
def WriteXLAT : SchedWriteRes<[]> {
}
def : InstRW<[WriteMOVS], (instregex "MOVS(B|L|Q|W)")>;
-// SCAS.
-def : InstRW<[Write2P0156_P23], (instregex "SCAS(B|W|L|Q)")>;
-
// CMPS.
def WriteCMPS : SchedWriteRes<[HWPort23, HWPort0156]> {
let Latency = 4;
}
def : InstRW<[WriteFNINIT], (instregex "FNINIT")>;
-//=== Integer MMX and XMM Instructions ===//
-
-// PBLENDW.
-// x,x,i / v,v,v,i
-def WritePBLENDWr : SchedWriteRes<[HWPort5]>;
-def : InstRW<[WritePBLENDWr], (instregex "(V?)PBLENDW(Y?)rri")>;
-
-// x,m,i / v,v,m,i
-def WritePBLENDWm : SchedWriteRes<[HWPort5, HWPort23]> {
- let NumMicroOps = 2;
- let Latency = 4;
- let ResourceCycles = [1, 1];
-}
-def : InstRW<[WritePBLENDWm, ReadAfterLd], (instregex "(V?)PBLENDW(Y?)rmi")>;
-
-// PMOVMSKB.
-def WritePMOVMSKB : SchedWriteRes<[HWPort0]> {
- let Latency = 3;
-}
-def : InstRW<[WritePMOVMSKB], (instregex "(V|MMX_)?PMOVMSKB(Y?)rr")>;
-
-// VPGATHERDD.
-// x.
-def WriteVPGATHERDD128 : SchedWriteRes<[]> {
- let NumMicroOps = 20;
-}
-def : InstRW<[WriteVPGATHERDD128, ReadAfterLd], (instregex "VPGATHERDDrm")>;
-
-// y.
-def WriteVPGATHERDD256 : SchedWriteRes<[]> {
- let NumMicroOps = 34;
-}
-def : InstRW<[WriteVPGATHERDD256, ReadAfterLd], (instregex "VPGATHERDDYrm")>;
-
-// VPGATHERQD.
-// x.
-def WriteVPGATHERQD128 : SchedWriteRes<[]> {
- let NumMicroOps = 15;
-}
-def : InstRW<[WriteVPGATHERQD128, ReadAfterLd], (instregex "VPGATHERQDrm")>;
-
-// y.
-def WriteVPGATHERQD256 : SchedWriteRes<[]> {
- let NumMicroOps = 22;
-}
-def : InstRW<[WriteVPGATHERQD256, ReadAfterLd], (instregex "VPGATHERQDYrm")>;
-
-// VPGATHERDQ.
-// x.
-def WriteVPGATHERDQ128 : SchedWriteRes<[]> {
- let NumMicroOps = 12;
-}
-def : InstRW<[WriteVPGATHERDQ128, ReadAfterLd], (instregex "VPGATHERDQrm")>;
-
-// y.
-def WriteVPGATHERDQ256 : SchedWriteRes<[]> {
- let NumMicroOps = 20;
-}
-def : InstRW<[WriteVPGATHERDQ256, ReadAfterLd], (instregex "VPGATHERDQYrm")>;
-
-// VPGATHERQQ.
-// x.
-def WriteVPGATHERQQ128 : SchedWriteRes<[]> {
- let NumMicroOps = 14;
-}
-def : InstRW<[WriteVPGATHERQQ128, ReadAfterLd], (instregex "VPGATHERQQrm")>;
-
-// y.
-def WriteVPGATHERQQ256 : SchedWriteRes<[]> {
- let NumMicroOps = 22;
-}
-def : InstRW<[WriteVPGATHERQQ256, ReadAfterLd], (instregex "VPGATHERQQYrm")>;
-
-//-- Arithmetic instructions --//
-
////////////////////////////////////////////////////////////////////////////////
// Horizontal add/sub instructions.
////////////////////////////////////////////////////////////////////////////////
//=== Floating Point XMM and YMM Instructions ===//
-// VGATHERDPS.
-// x.
-def WriteVGATHERDPS128 : SchedWriteRes<[]> {
- let NumMicroOps = 20;
-}
-def : InstRW<[WriteVGATHERDPS128, ReadAfterLd], (instregex "VGATHERDPSrm")>;
-
-// y.
-def WriteVGATHERDPS256 : SchedWriteRes<[]> {
- let NumMicroOps = 34;
-}
-def : InstRW<[WriteVGATHERDPS256, ReadAfterLd], (instregex "VGATHERDPSYrm")>;
-
-// VGATHERQPS.
-// x.
-def WriteVGATHERQPS128 : SchedWriteRes<[]> {
- let NumMicroOps = 15;
-}
-def : InstRW<[WriteVGATHERQPS128, ReadAfterLd], (instregex "VGATHERQPSrm")>;
-
-// y.
-def WriteVGATHERQPS256 : SchedWriteRes<[]> {
- let NumMicroOps = 22;
-}
-def : InstRW<[WriteVGATHERQPS256, ReadAfterLd], (instregex "VGATHERQPSYrm")>;
-
-// VGATHERDPD.
-// x.
-def WriteVGATHERDPD128 : SchedWriteRes<[]> {
- let NumMicroOps = 12;
-}
-def : InstRW<[WriteVGATHERDPD128, ReadAfterLd], (instregex "VGATHERDPDrm")>;
-
-// y.
-def WriteVGATHERDPD256 : SchedWriteRes<[]> {
- let NumMicroOps = 20;
-}
-def : InstRW<[WriteVGATHERDPD256, ReadAfterLd], (instregex "VGATHERDPDYrm")>;
-
-// VGATHERQPD.
-// x.
-def WriteVGATHERQPD128 : SchedWriteRes<[]> {
- let NumMicroOps = 14;
-}
-def : InstRW<[WriteVGATHERQPD128, ReadAfterLd], (instregex "VGATHERQPDrm")>;
-
-// y.
-def WriteVGATHERQPD256 : SchedWriteRes<[]> {
- let NumMicroOps = 22;
-}
-def : InstRW<[WriteVGATHERQPD256, ReadAfterLd], (instregex "VGATHERQPDYrm")>;
-
// Remaining instrs.
// HWWriteResGroup0: one micro-op using one cycle of HWPort23.
// This patch raises the latency from 1 to 6. Every pattern removed from the
// list below reappears under HWWriteResGroup0_1 (latency 7) or
// HWWriteResGroup0_2 (latency 5).
def HWWriteResGroup0 : SchedWriteRes<[HWPort23]> {
- let Latency = 1;
+ let Latency = 6;
let NumMicroOps = 1;
let ResourceCycles = [1];
}
def: InstRW<[HWWriteResGroup0], (instregex "LDDQUrm")>;
-def: InstRW<[HWWriteResGroup0], (instregex "LD_F32m")>;
-def: InstRW<[HWWriteResGroup0], (instregex "LD_F64m")>;
-def: InstRW<[HWWriteResGroup0], (instregex "LD_F80m")>;
-def: InstRW<[HWWriteResGroup0], (instregex "MMX_MOVD64from64rm")>;
-def: InstRW<[HWWriteResGroup0], (instregex "MMX_MOVD64rm")>;
-def: InstRW<[HWWriteResGroup0], (instregex "MMX_MOVD64to64rm")>;
-def: InstRW<[HWWriteResGroup0], (instregex "MMX_MOVQ64rm")>;
-def: InstRW<[HWWriteResGroup0], (instregex "MOV(16|32|64)rm")>;
-def: InstRW<[HWWriteResGroup0], (instregex "MOV64toPQIrm")>;
-def: InstRW<[HWWriteResGroup0], (instregex "MOV8rm")>;
def: InstRW<[HWWriteResGroup0], (instregex "MOVAPDrm")>;
def: InstRW<[HWWriteResGroup0], (instregex "MOVAPSrm")>;
-def: InstRW<[HWWriteResGroup0], (instregex "MOVDDUPrm")>;
-def: InstRW<[HWWriteResGroup0], (instregex "MOVDI2PDIrm")>;
def: InstRW<[HWWriteResGroup0], (instregex "MOVDQArm")>;
def: InstRW<[HWWriteResGroup0], (instregex "MOVDQUrm")>;
def: InstRW<[HWWriteResGroup0], (instregex "MOVNTDQArm")>;
def: InstRW<[HWWriteResGroup0], (instregex "MOVSHDUPrm")>;
def: InstRW<[HWWriteResGroup0], (instregex "MOVSLDUPrm")>;
-def: InstRW<[HWWriteResGroup0], (instregex "MOVSSrm")>;
-def: InstRW<[HWWriteResGroup0], (instregex "MOVSX(16|32|64)rm16")>;
-def: InstRW<[HWWriteResGroup0], (instregex "MOVSX(16|32|64)rm32")>;
-def: InstRW<[HWWriteResGroup0], (instregex "MOVSX(16|32|64)rm8")>;
def: InstRW<[HWWriteResGroup0], (instregex "MOVUPDrm")>;
def: InstRW<[HWWriteResGroup0], (instregex "MOVUPSrm")>;
-def: InstRW<[HWWriteResGroup0], (instregex "MOVZX(16|32|64)rm16")>;
-def: InstRW<[HWWriteResGroup0], (instregex "MOVZX(16|32|64)rm8")>;
-def: InstRW<[HWWriteResGroup0], (instregex "PREFETCHNTA")>;
-def: InstRW<[HWWriteResGroup0], (instregex "PREFETCHT0")>;
-def: InstRW<[HWWriteResGroup0], (instregex "PREFETCHT1")>;
-def: InstRW<[HWWriteResGroup0], (instregex "PREFETCHT2")>;
-def: InstRW<[HWWriteResGroup0], (instregex "VBROADCASTF128")>;
-def: InstRW<[HWWriteResGroup0], (instregex "VBROADCASTI128")>;
-def: InstRW<[HWWriteResGroup0], (instregex "VBROADCASTSDYrm")>;
-def: InstRW<[HWWriteResGroup0], (instregex "VBROADCASTSSYrm")>;
def: InstRW<[HWWriteResGroup0], (instregex "VBROADCASTSSrm")>;
-def: InstRW<[HWWriteResGroup0], (instregex "VLDDQUYrm")>;
def: InstRW<[HWWriteResGroup0], (instregex "VLDDQUrm")>;
-def: InstRW<[HWWriteResGroup0], (instregex "VMOV64toPQIrm")>;
-def: InstRW<[HWWriteResGroup0], (instregex "VMOVAPDYrm")>;
def: InstRW<[HWWriteResGroup0], (instregex "VMOVAPDrm")>;
-def: InstRW<[HWWriteResGroup0], (instregex "VMOVAPSYrm")>;
def: InstRW<[HWWriteResGroup0], (instregex "VMOVAPSrm")>;
-def: InstRW<[HWWriteResGroup0], (instregex "VMOVDDUPYrm")>;
-def: InstRW<[HWWriteResGroup0], (instregex "VMOVDDUPrm")>;
-def: InstRW<[HWWriteResGroup0], (instregex "VMOVDI2PDIrm")>;
-def: InstRW<[HWWriteResGroup0], (instregex "VMOVDQAYrm")>;
def: InstRW<[HWWriteResGroup0], (instregex "VMOVDQArm")>;
-def: InstRW<[HWWriteResGroup0], (instregex "VMOVDQUYrm")>;
def: InstRW<[HWWriteResGroup0], (instregex "VMOVDQUrm")>;
-def: InstRW<[HWWriteResGroup0], (instregex "VMOVNTDQAYrm")>;
def: InstRW<[HWWriteResGroup0], (instregex "VMOVNTDQArm")>;
-def: InstRW<[HWWriteResGroup0], (instregex "VMOVQI2PQIrm")>;
-def: InstRW<[HWWriteResGroup0], (instregex "VMOVSDrm")>;
-def: InstRW<[HWWriteResGroup0], (instregex "VMOVSHDUPYrm")>;
def: InstRW<[HWWriteResGroup0], (instregex "VMOVSHDUPrm")>;
-def: InstRW<[HWWriteResGroup0], (instregex "VMOVSLDUPYrm")>;
def: InstRW<[HWWriteResGroup0], (instregex "VMOVSLDUPrm")>;
-def: InstRW<[HWWriteResGroup0], (instregex "VMOVSSrm")>;
-def: InstRW<[HWWriteResGroup0], (instregex "VMOVUPDYrm")>;
def: InstRW<[HWWriteResGroup0], (instregex "VMOVUPDrm")>;
-def: InstRW<[HWWriteResGroup0], (instregex "VMOVUPSYrm")>;
def: InstRW<[HWWriteResGroup0], (instregex "VMOVUPSrm")>;
-def: InstRW<[HWWriteResGroup0], (instregex "VPBROADCASTDYrm")>;
def: InstRW<[HWWriteResGroup0], (instregex "VPBROADCASTDrm")>;
-def: InstRW<[HWWriteResGroup0], (instregex "VPBROADCASTQYrm")>;
def: InstRW<[HWWriteResGroup0], (instregex "VPBROADCASTQrm")>;
// NOTE(review): the ROUND*/VROUND* patterns added below end in "r" rather than
// "rm", unlike the other patterns kept in this group that are visible here,
// yet they are bound to a write that only uses HWPort23 -- confirm that this
// mapping is intended.
+def: InstRW<[HWWriteResGroup0], (instregex "ROUNDPDr")>;
+def: InstRW<[HWWriteResGroup0], (instregex "ROUNDPSr")>;
+def: InstRW<[HWWriteResGroup0], (instregex "ROUNDSDr")>;
+def: InstRW<[HWWriteResGroup0], (instregex "ROUNDSSr")>;
+def: InstRW<[HWWriteResGroup0], (instregex "VROUNDPDr")>;
+def: InstRW<[HWWriteResGroup0], (instregex "VROUNDPSr")>;
+def: InstRW<[HWWriteResGroup0], (instregex "VROUNDSDr")>;
+def: InstRW<[HWWriteResGroup0], (instregex "VROUNDSSr")>;
+def: InstRW<[HWWriteResGroup0], (instregex "VROUNDYPDr")>;
+def: InstRW<[HWWriteResGroup0], (instregex "VROUNDYPSr")>;
+
// HWWriteResGroup0_1 (added by this patch): same resource usage as
// HWWriteResGroup0 (one micro-op, one cycle of HWPort23) but with latency 7.
// All patterns bound here were previously listed under HWWriteResGroup0.
+def HWWriteResGroup0_1 : SchedWriteRes<[HWPort23]> {
+ let Latency = 7;
+ let NumMicroOps = 1;
+ let ResourceCycles = [1];
+}
+def: InstRW<[HWWriteResGroup0_1], (instregex "LD_F32m")>;
+def: InstRW<[HWWriteResGroup0_1], (instregex "LD_F64m")>;
+def: InstRW<[HWWriteResGroup0_1], (instregex "LD_F80m")>;
+def: InstRW<[HWWriteResGroup0_1], (instregex "VBROADCASTF128")>;
+def: InstRW<[HWWriteResGroup0_1], (instregex "VBROADCASTI128")>;
+def: InstRW<[HWWriteResGroup0_1], (instregex "VBROADCASTSDYrm")>;
+def: InstRW<[HWWriteResGroup0_1], (instregex "VBROADCASTSSYrm")>;
+def: InstRW<[HWWriteResGroup0_1], (instregex "VLDDQUYrm")>;
+def: InstRW<[HWWriteResGroup0_1], (instregex "VMOVAPDYrm")>;
+def: InstRW<[HWWriteResGroup0_1], (instregex "VMOVAPSYrm")>;
+def: InstRW<[HWWriteResGroup0_1], (instregex "VMOVDDUPYrm")>;
+def: InstRW<[HWWriteResGroup0_1], (instregex "VMOVDQAYrm")>;
+def: InstRW<[HWWriteResGroup0_1], (instregex "VMOVDQUYrm")>;
+def: InstRW<[HWWriteResGroup0_1], (instregex "VMOVNTDQAYrm")>;
+def: InstRW<[HWWriteResGroup0_1], (instregex "VMOVSHDUPYrm")>;
+def: InstRW<[HWWriteResGroup0_1], (instregex "VMOVSLDUPYrm")>;
+def: InstRW<[HWWriteResGroup0_1], (instregex "VMOVUPDYrm")>;
+def: InstRW<[HWWriteResGroup0_1], (instregex "VMOVUPSYrm")>;
+def: InstRW<[HWWriteResGroup0_1], (instregex "VPBROADCASTDYrm")>;
+def: InstRW<[HWWriteResGroup0_1], (instregex "VPBROADCASTQYrm")>;
+
// HWWriteResGroup0_2 (added by this patch): same resource usage as
// HWWriteResGroup0 (one micro-op, one cycle of HWPort23) but with latency 5.
// All patterns bound here were previously listed under HWWriteResGroup0.
+def HWWriteResGroup0_2 : SchedWriteRes<[HWPort23]> {
+ let Latency = 5;
+ let NumMicroOps = 1;
+ let ResourceCycles = [1];
+}
+def: InstRW<[HWWriteResGroup0_2], (instregex "MMX_MOVD64from64rm")>;
+def: InstRW<[HWWriteResGroup0_2], (instregex "MMX_MOVD64rm")>;
+def: InstRW<[HWWriteResGroup0_2], (instregex "MMX_MOVD64to64rm")>;
+def: InstRW<[HWWriteResGroup0_2], (instregex "MMX_MOVQ64rm")>;
+def: InstRW<[HWWriteResGroup0_2], (instregex "MOV(16|32|64)rm")>;
+def: InstRW<[HWWriteResGroup0_2], (instregex "MOV64toPQIrm")>;
+def: InstRW<[HWWriteResGroup0_2], (instregex "MOV8rm")>;
+def: InstRW<[HWWriteResGroup0_2], (instregex "MOVDDUPrm")>;
+def: InstRW<[HWWriteResGroup0_2], (instregex "MOVDI2PDIrm")>;
+def: InstRW<[HWWriteResGroup0_2], (instregex "MOVSSrm")>;
+def: InstRW<[HWWriteResGroup0_2], (instregex "MOVSX(16|32|64)rm16")>;
+def: InstRW<[HWWriteResGroup0_2], (instregex "MOVSX(16|32|64)rm32")>;
+def: InstRW<[HWWriteResGroup0_2], (instregex "MOVSX(16|32|64)rm8")>;
+def: InstRW<[HWWriteResGroup0_2], (instregex "MOVZX(16|32|64)rm16")>;
+def: InstRW<[HWWriteResGroup0_2], (instregex "MOVZX(16|32|64)rm8")>;
+def: InstRW<[HWWriteResGroup0_2], (instregex "PREFETCHNTA")>;
+def: InstRW<[HWWriteResGroup0_2], (instregex "PREFETCHT0")>;
+def: InstRW<[HWWriteResGroup0_2], (instregex "PREFETCHT1")>;
+def: InstRW<[HWWriteResGroup0_2], (instregex "PREFETCHT2")>;
+def: InstRW<[HWWriteResGroup0_2], (instregex "VMOV64toPQIrm")>;
+def: InstRW<[HWWriteResGroup0_2], (instregex "VMOVDDUPrm")>;
+def: InstRW<[HWWriteResGroup0_2], (instregex "VMOVDI2PDIrm")>;
+def: InstRW<[HWWriteResGroup0_2], (instregex "VMOVQI2PQIrm")>;
+def: InstRW<[HWWriteResGroup0_2], (instregex "VMOVSDrm")>;
+def: InstRW<[HWWriteResGroup0_2], (instregex "VMOVSSrm")>;
def HWWriteResGroup1 : SchedWriteRes<[HWPort4,HWPort237]> {
let Latency = 1;
def: InstRW<[HWWriteResGroup10], (instregex "XOR8rr")>;
// HWWriteResGroup11: two micro-ops, one cycle each on HWPort0 and HWPort23.
// This patch raises the latency from 1 to 6. Every pattern removed from the
// list below reappears under HWWriteResGroup11_1 (latency 7) or
// HWWriteResGroup11_2 (latency 8).
def HWWriteResGroup11 : SchedWriteRes<[HWPort0,HWPort23]> {
- let Latency = 1;
+ let Latency = 6;
let NumMicroOps = 2;
let ResourceCycles = [1,1];
}
def: InstRW<[HWWriteResGroup11], (instregex "CVTPS2PDrm")>;
-def: InstRW<[HWWriteResGroup11], (instregex "CVTSS2SDrm")>;
def: InstRW<[HWWriteResGroup11], (instregex "MMX_PSLLDrm")>;
def: InstRW<[HWWriteResGroup11], (instregex "MMX_PSLLQrm")>;
def: InstRW<[HWWriteResGroup11], (instregex "MMX_PSLLWrm")>;
def: InstRW<[HWWriteResGroup11], (instregex "MMX_PSRLDrm")>;
def: InstRW<[HWWriteResGroup11], (instregex "MMX_PSRLQrm")>;
def: InstRW<[HWWriteResGroup11], (instregex "MMX_PSRLWrm")>;
-def: InstRW<[HWWriteResGroup11], (instregex "VCVTPH2PSYrm")>;
def: InstRW<[HWWriteResGroup11], (instregex "VCVTPH2PSrm")>;
def: InstRW<[HWWriteResGroup11], (instregex "VCVTPS2PDrm")>;
-def: InstRW<[HWWriteResGroup11], (instregex "VCVTSS2SDrm")>;
-def: InstRW<[HWWriteResGroup11], (instregex "VPSLLDYrm")>;
-def: InstRW<[HWWriteResGroup11], (instregex "VPSLLQYrm")>;
-def: InstRW<[HWWriteResGroup11], (instregex "VPSLLVQYrm")>;
-def: InstRW<[HWWriteResGroup11], (instregex "VPSLLVQrm")>;
-def: InstRW<[HWWriteResGroup11], (instregex "VPSLLWYrm")>;
-def: InstRW<[HWWriteResGroup11], (instregex "VPSRADYrm")>;
-def: InstRW<[HWWriteResGroup11], (instregex "VPSRAWYrm")>;
-def: InstRW<[HWWriteResGroup11], (instregex "VPSRLDYrm")>;
-def: InstRW<[HWWriteResGroup11], (instregex "VPSRLQYrm")>;
-def: InstRW<[HWWriteResGroup11], (instregex "VPSRLVQYrm")>;
-def: InstRW<[HWWriteResGroup11], (instregex "VPSRLVQrm")>;
-def: InstRW<[HWWriteResGroup11], (instregex "VPSRLWYrm")>;
-def: InstRW<[HWWriteResGroup11], (instregex "VTESTPDYrm")>;
-def: InstRW<[HWWriteResGroup11], (instregex "VTESTPDrm")>;
-def: InstRW<[HWWriteResGroup11], (instregex "VTESTPSYrm")>;
-def: InstRW<[HWWriteResGroup11], (instregex "VTESTPSrm")>;
+
// HWWriteResGroup11_1 (added by this patch): same resource usage as
// HWWriteResGroup11 (two micro-ops, one cycle each on HWPort0 and HWPort23)
// but with latency 7. All patterns bound here were previously listed under
// HWWriteResGroup11.
+def HWWriteResGroup11_1 : SchedWriteRes<[HWPort0,HWPort23]> {
+ let Latency = 7;
+ let NumMicroOps = 2;
+ let ResourceCycles = [1,1];
+}
+def: InstRW<[HWWriteResGroup11_1], (instregex "CVTSS2SDrm")>;
+def: InstRW<[HWWriteResGroup11_1], (instregex "VCVTPH2PSYrm")>;
+def: InstRW<[HWWriteResGroup11_1], (instregex "VCVTSS2SDrm")>;
+def: InstRW<[HWWriteResGroup11_1], (instregex "VPSLLVQrm")>;
+def: InstRW<[HWWriteResGroup11_1], (instregex "VPSRLVQrm")>;
+def: InstRW<[HWWriteResGroup11_1], (instregex "VTESTPDrm")>;
+def: InstRW<[HWWriteResGroup11_1], (instregex "VTESTPSrm")>;
+
// HWWriteResGroup11_2 (added by this patch): same resource usage as
// HWWriteResGroup11 (two micro-ops, one cycle each on HWPort0 and HWPort23)
// but with latency 8. All patterns bound here are Y-suffixed forms that were
// previously listed under HWWriteResGroup11.
+def HWWriteResGroup11_2 : SchedWriteRes<[HWPort0,HWPort23]> {
+ let Latency = 8;
+ let NumMicroOps = 2;
+ let ResourceCycles = [1,1];
+}
+def: InstRW<[HWWriteResGroup11_2], (instregex "VPSLLDYrm")>;
+def: InstRW<[HWWriteResGroup11_2], (instregex "VPSLLQYrm")>;
+def: InstRW<[HWWriteResGroup11_2], (instregex "VPSLLVQYrm")>;
+def: InstRW<[HWWriteResGroup11_2], (instregex "VPSLLWYrm")>;
+def: InstRW<[HWWriteResGroup11_2], (instregex "VPSRADYrm")>;
+def: InstRW<[HWWriteResGroup11_2], (instregex "VPSRAWYrm")>;
+def: InstRW<[HWWriteResGroup11_2], (instregex "VPSRLDYrm")>;
+def: InstRW<[HWWriteResGroup11_2], (instregex "VPSRLQYrm")>;
+def: InstRW<[HWWriteResGroup11_2], (instregex "VPSRLVQYrm")>;
+def: InstRW<[HWWriteResGroup11_2], (instregex "VPSRLWYrm")>;
+def: InstRW<[HWWriteResGroup11_2], (instregex "VTESTPDYrm")>;
+def: InstRW<[HWWriteResGroup11_2], (instregex "VTESTPSYrm")>;
// HWWriteResGroup12: two micro-ops, one cycle each on HWPort1 and HWPort23.
// This patch raises the latency from 1 to 8 and binds many additional
// memory-operand patterns to the group; the four FCOM*/FCOMP* patterns were
// already bound to it.
def HWWriteResGroup12 : SchedWriteRes<[HWPort1,HWPort23]> {
- let Latency = 1;
+ let Latency = 8;
let NumMicroOps = 2;
let ResourceCycles = [1,1];
}
+def: InstRW<[HWWriteResGroup12], (instregex "ADDSDrm")>;
+def: InstRW<[HWWriteResGroup12], (instregex "ADDSSrm")>;
+def: InstRW<[HWWriteResGroup12], (instregex "BSF(16|32|64)rm")>;
+def: InstRW<[HWWriteResGroup12], (instregex "BSR(16|32|64)rm")>;
+def: InstRW<[HWWriteResGroup12], (instregex "CMPSSrm")>;
+def: InstRW<[HWWriteResGroup12], (instregex "COMISDrm")>;
+def: InstRW<[HWWriteResGroup12], (instregex "COMISSrm")>;
def: InstRW<[HWWriteResGroup12], (instregex "FCOM32m")>;
def: InstRW<[HWWriteResGroup12], (instregex "FCOM64m")>;
def: InstRW<[HWWriteResGroup12], (instregex "FCOMP32m")>;
def: InstRW<[HWWriteResGroup12], (instregex "FCOMP64m")>;
+def: InstRW<[HWWriteResGroup12], (instregex "IMUL(16|32|64)m")>;
+def: InstRW<[HWWriteResGroup12], (instregex "IMUL(16|32|64)rm(i8?)")>;
+def: InstRW<[HWWriteResGroup12], (instregex "IMUL8m")>;
+def: InstRW<[HWWriteResGroup12], (instregex "LZCNT(16|32|64)rm")>;
+def: InstRW<[HWWriteResGroup12], (instregex "MAXSDrm")>;
+def: InstRW<[HWWriteResGroup12], (instregex "MAXSSrm")>;
+def: InstRW<[HWWriteResGroup12], (instregex "MINSDrm")>;
+def: InstRW<[HWWriteResGroup12], (instregex "MINSSrm")>;
+def: InstRW<[HWWriteResGroup12], (instregex "MMX_CVTPI2PSirm")>;
+def: InstRW<[HWWriteResGroup12], (instregex "MMX_CVTPS2PIirm")>;
+def: InstRW<[HWWriteResGroup12], (instregex "MMX_CVTTPS2PIirm")>;
+def: InstRW<[HWWriteResGroup12], (instregex "MUL(16|32|64)m")>;
+def: InstRW<[HWWriteResGroup12], (instregex "MUL8m")>;
+def: InstRW<[HWWriteResGroup12], (instregex "PDEP32rm")>;
+def: InstRW<[HWWriteResGroup12], (instregex "PDEP64rm")>;
+def: InstRW<[HWWriteResGroup12], (instregex "PEXT32rm")>;
+def: InstRW<[HWWriteResGroup12], (instregex "PEXT64rm")>;
+def: InstRW<[HWWriteResGroup12], (instregex "POPCNT(16|32|64)rm")>;
+def: InstRW<[HWWriteResGroup12], (instregex "SUBSDrm")>;
+def: InstRW<[HWWriteResGroup12], (instregex "SUBSSrm")>;
+def: InstRW<[HWWriteResGroup12], (instregex "TZCNT(16|32|64)rm")>;
+def: InstRW<[HWWriteResGroup12], (instregex "UCOMISDrm")>;
+def: InstRW<[HWWriteResGroup12], (instregex "UCOMISSrm")>;
+def: InstRW<[HWWriteResGroup12], (instregex "VADDSDrm")>;
+def: InstRW<[HWWriteResGroup12], (instregex "VADDSSrm")>;
+def: InstRW<[HWWriteResGroup12], (instregex "VCMPSDrm")>;
+def: InstRW<[HWWriteResGroup12], (instregex "VCMPSSrm")>;
+def: InstRW<[HWWriteResGroup12], (instregex "VCOMISDrm")>;
+def: InstRW<[HWWriteResGroup12], (instregex "VCOMISSrm")>;
+def: InstRW<[HWWriteResGroup12], (instregex "VMAXSDrm")>;
+def: InstRW<[HWWriteResGroup12], (instregex "VMAXSSrm")>;
+def: InstRW<[HWWriteResGroup12], (instregex "VMINSDrm")>;
+def: InstRW<[HWWriteResGroup12], (instregex "VMINSSrm")>;
+def: InstRW<[HWWriteResGroup12], (instregex "VSUBSDrm")>;
+def: InstRW<[HWWriteResGroup12], (instregex "VSUBSSrm")>;
+def: InstRW<[HWWriteResGroup12], (instregex "VUCOMISDrm")>;
+def: InstRW<[HWWriteResGroup12], (instregex "VUCOMISSrm")>;
// HWWriteResGroup13: two micro-ops, one cycle each on HWPort5 and HWPort23.
// This patch raises the latency from 1 to 7. Every pattern removed from the
// list below reappears under HWWriteResGroup13_1 (latency 8, Y-suffixed forms)
// or HWWriteResGroup13_2 (latency 6).
def HWWriteResGroup13 : SchedWriteRes<[HWPort5,HWPort23]> {
- let Latency = 1;
+ let Latency = 7;
let NumMicroOps = 2;
let ResourceCycles = [1,1];
}
def: InstRW<[HWWriteResGroup13], (instregex "ANDPDrm")>;
def: InstRW<[HWWriteResGroup13], (instregex "ANDPSrm")>;
def: InstRW<[HWWriteResGroup13], (instregex "INSERTPSrm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "MMX_PALIGNR64irm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "MMX_PINSRWirmi")>;
-def: InstRW<[HWWriteResGroup13], (instregex "MMX_PSHUFBrm64")>;
-def: InstRW<[HWWriteResGroup13], (instregex "MMX_PSHUFWmi")>;
-def: InstRW<[HWWriteResGroup13], (instregex "MMX_PUNPCKHBWirm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "MMX_PUNPCKHDQirm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "MMX_PUNPCKHWDirm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "MMX_PUNPCKLBWirm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "MMX_PUNPCKLDQirm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "MMX_PUNPCKLWDirm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "MOVHPDrm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "MOVHPSrm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "MOVLPDrm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "MOVLPSrm")>;
def: InstRW<[HWWriteResGroup13], (instregex "ORPDrm")>;
def: InstRW<[HWWriteResGroup13], (instregex "ORPSrm")>;
def: InstRW<[HWWriteResGroup13], (instregex "PACKSSDWrm")>;
def: InstRW<[HWWriteResGroup13], (instregex "PACKUSWBrm")>;
def: InstRW<[HWWriteResGroup13], (instregex "PALIGNRrmi")>;
def: InstRW<[HWWriteResGroup13], (instregex "PBLENDWrmi")>;
-def: InstRW<[HWWriteResGroup13], (instregex "PINSRBrm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "PINSRDrm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "PINSRQrm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "PINSRWrmi")>;
-def: InstRW<[HWWriteResGroup13], (instregex "PMOVSXBDrm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "PMOVSXBQrm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "PMOVSXBWrm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "PMOVSXDQrm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "PMOVSXWDrm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "PMOVSXWQrm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "PMOVZXBDrm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "PMOVZXBQrm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "PMOVZXBWrm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "PMOVZXDQrm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "PMOVZXWDrm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "PMOVZXWQrm")>;
def: InstRW<[HWWriteResGroup13], (instregex "PSHUFBrm")>;
def: InstRW<[HWWriteResGroup13], (instregex "PSHUFDmi")>;
def: InstRW<[HWWriteResGroup13], (instregex "PSHUFHWmi")>;
def: InstRW<[HWWriteResGroup13], (instregex "UNPCKHPSrm")>;
def: InstRW<[HWWriteResGroup13], (instregex "UNPCKLPDrm")>;
def: InstRW<[HWWriteResGroup13], (instregex "UNPCKLPSrm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "VANDNPDYrm")>;
def: InstRW<[HWWriteResGroup13], (instregex "VANDNPDrm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "VANDNPSYrm")>;
def: InstRW<[HWWriteResGroup13], (instregex "VANDNPSrm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "VANDPDYrm")>;
def: InstRW<[HWWriteResGroup13], (instregex "VANDPDrm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "VANDPSYrm")>;
def: InstRW<[HWWriteResGroup13], (instregex "VANDPSrm")>;
def: InstRW<[HWWriteResGroup13], (instregex "VINSERTPSrm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "VMOVHPDrm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "VMOVHPSrm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "VMOVLPDrm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "VMOVLPSrm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "VORPDYrm")>;
def: InstRW<[HWWriteResGroup13], (instregex "VORPDrm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "VORPSYrm")>;
def: InstRW<[HWWriteResGroup13], (instregex "VORPSrm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "VPACKSSDWYrm")>;
def: InstRW<[HWWriteResGroup13], (instregex "VPACKSSDWrm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "VPACKSSWBYrm")>;
def: InstRW<[HWWriteResGroup13], (instregex "VPACKSSWBrm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "VPACKUSDWYrm")>;
def: InstRW<[HWWriteResGroup13], (instregex "VPACKUSDWrm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "VPACKUSWBYrm")>;
def: InstRW<[HWWriteResGroup13], (instregex "VPACKUSWBrm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "VPALIGNRYrmi")>;
def: InstRW<[HWWriteResGroup13], (instregex "VPALIGNRrmi")>;
-def: InstRW<[HWWriteResGroup13], (instregex "VPBLENDWYrmi")>;
def: InstRW<[HWWriteResGroup13], (instregex "VPBLENDWrmi")>;
-def: InstRW<[HWWriteResGroup13], (instregex "VPERMILPDYmi")>;
-def: InstRW<[HWWriteResGroup13], (instregex "VPERMILPDYrm")>;
def: InstRW<[HWWriteResGroup13], (instregex "VPERMILPDmi")>;
def: InstRW<[HWWriteResGroup13], (instregex "VPERMILPDrm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "VPERMILPSYmi")>;
-def: InstRW<[HWWriteResGroup13], (instregex "VPERMILPSYrm")>;
def: InstRW<[HWWriteResGroup13], (instregex "VPERMILPSmi")>;
def: InstRW<[HWWriteResGroup13], (instregex "VPERMILPSrm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "VPINSRBrm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "VPINSRDrm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "VPINSRQrm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "VPINSRWrmi")>;
-def: InstRW<[HWWriteResGroup13], (instregex "VPMOVSXBDrm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "VPMOVSXBQrm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "VPMOVSXBWrm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "VPMOVSXDQrm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "VPMOVSXWDrm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "VPMOVSXWQrm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "VPMOVZXBDrm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "VPMOVZXBQrm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "VPMOVZXBWrm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "VPMOVZXDQrm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "VPMOVZXWDrm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "VPMOVZXWQrm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "VPSHUFBYrm")>;
def: InstRW<[HWWriteResGroup13], (instregex "VPSHUFBrm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "VPSHUFDYmi")>;
def: InstRW<[HWWriteResGroup13], (instregex "VPSHUFDmi")>;
-def: InstRW<[HWWriteResGroup13], (instregex "VPSHUFHWYmi")>;
def: InstRW<[HWWriteResGroup13], (instregex "VPSHUFHWmi")>;
-def: InstRW<[HWWriteResGroup13], (instregex "VPSHUFLWYmi")>;
def: InstRW<[HWWriteResGroup13], (instregex "VPSHUFLWmi")>;
-def: InstRW<[HWWriteResGroup13], (instregex "VPUNPCKHBWYrm")>;
def: InstRW<[HWWriteResGroup13], (instregex "VPUNPCKHBWrm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "VPUNPCKHDQYrm")>;
def: InstRW<[HWWriteResGroup13], (instregex "VPUNPCKHDQrm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "VPUNPCKHQDQYrm")>;
def: InstRW<[HWWriteResGroup13], (instregex "VPUNPCKHQDQrm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "VPUNPCKHWDYrm")>;
def: InstRW<[HWWriteResGroup13], (instregex "VPUNPCKHWDrm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "VPUNPCKLBWYrm")>;
def: InstRW<[HWWriteResGroup13], (instregex "VPUNPCKLBWrm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "VPUNPCKLDQYrm")>;
def: InstRW<[HWWriteResGroup13], (instregex "VPUNPCKLDQrm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "VPUNPCKLQDQYrm")>;
def: InstRW<[HWWriteResGroup13], (instregex "VPUNPCKLQDQrm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "VPUNPCKLWDYrm")>;
def: InstRW<[HWWriteResGroup13], (instregex "VPUNPCKLWDrm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "VSHUFPDYrmi")>;
def: InstRW<[HWWriteResGroup13], (instregex "VSHUFPDrmi")>;
-def: InstRW<[HWWriteResGroup13], (instregex "VSHUFPSYrmi")>;
def: InstRW<[HWWriteResGroup13], (instregex "VSHUFPSrmi")>;
-def: InstRW<[HWWriteResGroup13], (instregex "VUNPCKHPDYrm")>;
def: InstRW<[HWWriteResGroup13], (instregex "VUNPCKHPDrm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "VUNPCKHPSYrm")>;
def: InstRW<[HWWriteResGroup13], (instregex "VUNPCKHPSrm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "VUNPCKLPDYrm")>;
def: InstRW<[HWWriteResGroup13], (instregex "VUNPCKLPDrm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "VUNPCKLPSYrm")>;
def: InstRW<[HWWriteResGroup13], (instregex "VUNPCKLPSrm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "VXORPDYrm")>;
def: InstRW<[HWWriteResGroup13], (instregex "VXORPDrm")>;
-def: InstRW<[HWWriteResGroup13], (instregex "VXORPSYrm")>;
def: InstRW<[HWWriteResGroup13], (instregex "VXORPSrm")>;
def: InstRW<[HWWriteResGroup13], (instregex "XORPDrm")>;
def: InstRW<[HWWriteResGroup13], (instregex "XORPSrm")>;
// HWWriteResGroup13_1 (added by this patch): same resource usage as
// HWWriteResGroup13 (two micro-ops, one cycle each on HWPort5 and HWPort23)
// but with latency 8. It holds the Y-suffixed patterns moved out of
// HWWriteResGroup13, plus VPMOVSXBDYrm, VPMOVSXBQYrm and VPMOVSXWQYrm, which
// are not among the patterns removed from that group in the visible hunks.
+def HWWriteResGroup13_1 : SchedWriteRes<[HWPort5,HWPort23]> {
+ let Latency = 8;
+ let NumMicroOps = 2;
+ let ResourceCycles = [1,1];
+}
+def: InstRW<[HWWriteResGroup13_1], (instregex "VANDNPDYrm")>;
+def: InstRW<[HWWriteResGroup13_1], (instregex "VANDNPSYrm")>;
+def: InstRW<[HWWriteResGroup13_1], (instregex "VANDPDYrm")>;
+def: InstRW<[HWWriteResGroup13_1], (instregex "VANDPSYrm")>;
+def: InstRW<[HWWriteResGroup13_1], (instregex "VORPDYrm")>;
+def: InstRW<[HWWriteResGroup13_1], (instregex "VORPSYrm")>;
+def: InstRW<[HWWriteResGroup13_1], (instregex "VPACKSSDWYrm")>;
+def: InstRW<[HWWriteResGroup13_1], (instregex "VPACKSSWBYrm")>;
+def: InstRW<[HWWriteResGroup13_1], (instregex "VPACKUSDWYrm")>;
+def: InstRW<[HWWriteResGroup13_1], (instregex "VPACKUSWBYrm")>;
+def: InstRW<[HWWriteResGroup13_1], (instregex "VPALIGNRYrmi")>;
+def: InstRW<[HWWriteResGroup13_1], (instregex "VPBLENDWYrmi")>;
+def: InstRW<[HWWriteResGroup13_1], (instregex "VPERMILPDYmi")>;
+def: InstRW<[HWWriteResGroup13_1], (instregex "VPERMILPDYrm")>;
+def: InstRW<[HWWriteResGroup13_1], (instregex "VPERMILPSYmi")>;
+def: InstRW<[HWWriteResGroup13_1], (instregex "VPERMILPSYrm")>;
+def: InstRW<[HWWriteResGroup13_1], (instregex "VPMOVSXBDYrm")>;
+def: InstRW<[HWWriteResGroup13_1], (instregex "VPMOVSXBQYrm")>;
+def: InstRW<[HWWriteResGroup13_1], (instregex "VPMOVSXWQYrm")>;
+def: InstRW<[HWWriteResGroup13_1], (instregex "VPSHUFBYrm")>;
+def: InstRW<[HWWriteResGroup13_1], (instregex "VPSHUFDYmi")>;
+def: InstRW<[HWWriteResGroup13_1], (instregex "VPSHUFHWYmi")>;
+def: InstRW<[HWWriteResGroup13_1], (instregex "VPSHUFLWYmi")>;
+def: InstRW<[HWWriteResGroup13_1], (instregex "VPUNPCKHBWYrm")>;
+def: InstRW<[HWWriteResGroup13_1], (instregex "VPUNPCKHDQYrm")>;
+def: InstRW<[HWWriteResGroup13_1], (instregex "VPUNPCKHQDQYrm")>;
+def: InstRW<[HWWriteResGroup13_1], (instregex "VPUNPCKHWDYrm")>;
+def: InstRW<[HWWriteResGroup13_1], (instregex "VPUNPCKLBWYrm")>;
+def: InstRW<[HWWriteResGroup13_1], (instregex "VPUNPCKLDQYrm")>;
+def: InstRW<[HWWriteResGroup13_1], (instregex "VPUNPCKLQDQYrm")>;
+def: InstRW<[HWWriteResGroup13_1], (instregex "VPUNPCKLWDYrm")>;
+def: InstRW<[HWWriteResGroup13_1], (instregex "VSHUFPDYrmi")>;
+def: InstRW<[HWWriteResGroup13_1], (instregex "VSHUFPSYrmi")>;
+def: InstRW<[HWWriteResGroup13_1], (instregex "VUNPCKHPDYrm")>;
+def: InstRW<[HWWriteResGroup13_1], (instregex "VUNPCKHPSYrm")>;
+def: InstRW<[HWWriteResGroup13_1], (instregex "VUNPCKLPDYrm")>;
+def: InstRW<[HWWriteResGroup13_1], (instregex "VUNPCKLPSYrm")>;
+def: InstRW<[HWWriteResGroup13_1], (instregex "VXORPDYrm")>;
+def: InstRW<[HWWriteResGroup13_1], (instregex "VXORPSYrm")>;
+
// HWWriteResGroup13_2 (added by this patch): same resource usage as
// HWWriteResGroup13 (two micro-ops, one cycle each on HWPort5 and HWPort23)
// but with latency 6. All patterns bound here were previously listed under
// HWWriteResGroup13.
+def HWWriteResGroup13_2 : SchedWriteRes<[HWPort5,HWPort23]> {
+ let Latency = 6;
+ let NumMicroOps = 2;
+ let ResourceCycles = [1,1];
+}
+def: InstRW<[HWWriteResGroup13_2], (instregex "MMX_PALIGNR64irm")>;
+def: InstRW<[HWWriteResGroup13_2], (instregex "MMX_PINSRWirmi")>;
+def: InstRW<[HWWriteResGroup13_2], (instregex "MMX_PSHUFBrm64")>;
+def: InstRW<[HWWriteResGroup13_2], (instregex "MMX_PSHUFWmi")>;
+def: InstRW<[HWWriteResGroup13_2], (instregex "MMX_PUNPCKHBWirm")>;
+def: InstRW<[HWWriteResGroup13_2], (instregex "MMX_PUNPCKHDQirm")>;
+def: InstRW<[HWWriteResGroup13_2], (instregex "MMX_PUNPCKHWDirm")>;
+def: InstRW<[HWWriteResGroup13_2], (instregex "MMX_PUNPCKLBWirm")>;
+def: InstRW<[HWWriteResGroup13_2], (instregex "MMX_PUNPCKLDQirm")>;
+def: InstRW<[HWWriteResGroup13_2], (instregex "MMX_PUNPCKLWDirm")>;
+def: InstRW<[HWWriteResGroup13_2], (instregex "MOVHPDrm")>;
+def: InstRW<[HWWriteResGroup13_2], (instregex "MOVHPSrm")>;
+def: InstRW<[HWWriteResGroup13_2], (instregex "MOVLPDrm")>;
+def: InstRW<[HWWriteResGroup13_2], (instregex "MOVLPSrm")>;
+def: InstRW<[HWWriteResGroup13_2], (instregex "PINSRBrm")>;
+def: InstRW<[HWWriteResGroup13_2], (instregex "PINSRDrm")>;
+def: InstRW<[HWWriteResGroup13_2], (instregex "PINSRQrm")>;
+def: InstRW<[HWWriteResGroup13_2], (instregex "PINSRWrmi")>;
+def: InstRW<[HWWriteResGroup13_2], (instregex "PMOVSXBDrm")>;
+def: InstRW<[HWWriteResGroup13_2], (instregex "PMOVSXBQrm")>;
+def: InstRW<[HWWriteResGroup13_2], (instregex "PMOVSXBWrm")>;
+def: InstRW<[HWWriteResGroup13_2], (instregex "PMOVSXDQrm")>;
+def: InstRW<[HWWriteResGroup13_2], (instregex "PMOVSXWDrm")>;
+def: InstRW<[HWWriteResGroup13_2], (instregex "PMOVSXWQrm")>;
+def: InstRW<[HWWriteResGroup13_2], (instregex "PMOVZXBDrm")>;
+def: InstRW<[HWWriteResGroup13_2], (instregex "PMOVZXBQrm")>;
+def: InstRW<[HWWriteResGroup13_2], (instregex "PMOVZXBWrm")>;
+def: InstRW<[HWWriteResGroup13_2], (instregex "PMOVZXDQrm")>;
+def: InstRW<[HWWriteResGroup13_2], (instregex "PMOVZXWDrm")>;
+def: InstRW<[HWWriteResGroup13_2], (instregex "PMOVZXWQrm")>;
+def: InstRW<[HWWriteResGroup13_2], (instregex "VMOVHPDrm")>;
+def: InstRW<[HWWriteResGroup13_2], (instregex "VMOVHPSrm")>;
+def: InstRW<[HWWriteResGroup13_2], (instregex "VMOVLPDrm")>;
+def: InstRW<[HWWriteResGroup13_2], (instregex "VMOVLPSrm")>;
+def: InstRW<[HWWriteResGroup13_2], (instregex "VPINSRBrm")>;
+def: InstRW<[HWWriteResGroup13_2], (instregex "VPINSRDrm")>;
+def: InstRW<[HWWriteResGroup13_2], (instregex "VPINSRQrm")>;
+def: InstRW<[HWWriteResGroup13_2], (instregex "VPINSRWrmi")>;
+def: InstRW<[HWWriteResGroup13_2], (instregex "VPMOVSXBDrm")>;
+def: InstRW<[HWWriteResGroup13_2], (instregex "VPMOVSXBQrm")>;
+def: InstRW<[HWWriteResGroup13_2], (instregex "VPMOVSXBWrm")>;
+def: InstRW<[HWWriteResGroup13_2], (instregex "VPMOVSXDQrm")>;
+def: InstRW<[HWWriteResGroup13_2], (instregex "VPMOVSXWDrm")>;
+def: InstRW<[HWWriteResGroup13_2], (instregex "VPMOVSXWQrm")>;
+def: InstRW<[HWWriteResGroup13_2], (instregex "VPMOVZXBDrm")>;
+def: InstRW<[HWWriteResGroup13_2], (instregex "VPMOVZXBQrm")>;
+def: InstRW<[HWWriteResGroup13_2], (instregex "VPMOVZXBWrm")>;
+def: InstRW<[HWWriteResGroup13_2], (instregex "VPMOVZXDQrm")>;
+def: InstRW<[HWWriteResGroup13_2], (instregex "VPMOVZXWDrm")>;
+def: InstRW<[HWWriteResGroup13_2], (instregex "VPMOVZXWQrm")>;
+
// HWWriteResGroup14: 2 micro-ops spread over HWPort6 and HWPort23.
// This diff raises Latency from 1 to 6; the only user shown is the indirect
// memory jump JMP(16|32|64)m.
// NOTE(review): HWPort23 is the port WriteLoad uses, so the new value
// presumably folds in the load latency -- confirm against measurements.
def HWWriteResGroup14 : SchedWriteRes<[HWPort6,HWPort23]> {
- let Latency = 1;
+ let Latency = 6;
let NumMicroOps = 2;
let ResourceCycles = [1,1];
}
def: InstRW<[HWWriteResGroup14], (instregex "JMP(16|32|64)m")>;
// HWWriteResGroup15: 2 micro-ops over HWPort23 and HWPort06.
// Latency goes from 1 to 6 in this diff; user shown: SHRX64rm.
def HWWriteResGroup15 : SchedWriteRes<[HWPort23,HWPort06]> {
- let Latency = 1;
+ let Latency = 6;
let NumMicroOps = 2;
let ResourceCycles = [1,1];
}
def: InstRW<[HWWriteResGroup15], (instregex "SHRX64rm")>;
// HWWriteResGroup16: 2 micro-ops over HWPort23 and HWPort15.
// Latency goes from 1 to 6 in this diff. Only the MMX_PSUB* and MOVBE load
// forms remain mapped here; the SSE/AVX integer rm forms removed below
// reappear under HWWriteResGroup16_1 (names without a Y) and
// HWWriteResGroup16_2 (Y names), which carry higher latencies.
def HWWriteResGroup16 : SchedWriteRes<[HWPort23,HWPort15]> {
- let Latency = 1;
+ let Latency = 6;
let NumMicroOps = 2;
let ResourceCycles = [1,1];
}
def: InstRW<[HWWriteResGroup16], (instregex "MMX_PSUBUSWirm")>;
def: InstRW<[HWWriteResGroup16], (instregex "MMX_PSUBWirm")>;
def: InstRW<[HWWriteResGroup16], (instregex "MOVBE(16|32|64)rm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "PABSBrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "PABSDrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "PABSWrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "PADDBrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "PADDDrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "PADDQrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "PADDSBrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "PADDSWrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "PADDUSBrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "PADDUSWrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "PADDWrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "PAVGBrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "PAVGWrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "PCMPEQBrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "PCMPEQDrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "PCMPEQQrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "PCMPEQWrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "PCMPGTBrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "PCMPGTDrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "PCMPGTWrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "PMAXSBrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "PMAXSDrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "PMAXSWrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "PMAXUBrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "PMAXUDrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "PMAXUWrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "PMINSBrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "PMINSDrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "PMINSWrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "PMINUBrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "PMINUDrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "PMINUWrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "PSIGNBrm128")>;
-def: InstRW<[HWWriteResGroup16], (instregex "PSIGNDrm128")>;
-def: InstRW<[HWWriteResGroup16], (instregex "PSIGNWrm128")>;
-def: InstRW<[HWWriteResGroup16], (instregex "PSUBBrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "PSUBDrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "PSUBQrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "PSUBSBrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "PSUBSWrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "PSUBUSBrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "PSUBUSWrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "PSUBWrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPABSBYrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPABSBrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPABSDYrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPABSDrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPABSWYrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPABSWrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPADDBYrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPADDBrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPADDDYrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPADDDrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPADDQYrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPADDQrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPADDSBYrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPADDSBrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPADDSWYrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPADDSWrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPADDUSBYrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPADDUSBrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPADDUSWYrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPADDUSWrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPADDWYrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPADDWrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPAVGBYrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPAVGBrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPAVGWYrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPAVGWrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPCMPEQBYrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPCMPEQBrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPCMPEQDYrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPCMPEQDrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPCMPEQQYrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPCMPEQQrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPCMPEQWYrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPCMPEQWrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPCMPGTBYrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPCMPGTBrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPCMPGTDYrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPCMPGTDrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPCMPGTWYrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPCMPGTWrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPMAXSBYrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPMAXSBrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPMAXSDYrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPMAXSDrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPMAXSWYrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPMAXSWrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPMAXUBYrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPMAXUBrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPMAXUDYrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPMAXUDrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPMAXUWYrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPMAXUWrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPMINSBYrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPMINSBrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPMINSDYrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPMINSDrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPMINSWYrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPMINSWrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPMINUBYrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPMINUBrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPMINUDYrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPMINUDrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPMINUWYrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPMINUWrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPSIGNBYrm256")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPSIGNBrm128")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPSIGNDYrm256")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPSIGNDrm128")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPSIGNWYrm256")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPSIGNWrm128")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPSUBBYrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPSUBBrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPSUBDYrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPSUBDrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPSUBQYrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPSUBQrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPSUBSBYrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPSUBSBrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPSUBSWYrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPSUBSWrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPSUBUSBYrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPSUBUSBrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPSUBUSWYrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPSUBUSWrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPSUBWYrm")>;
-def: InstRW<[HWWriteResGroup16], (instregex "VPSUBWrm")>;
+
// HWWriteResGroup16_1 (added by this diff): same ports and micro-op count as
// HWWriteResGroup16 (HWPort23 + HWPort15, 2 micro-ops) but Latency 7.
// It receives the SSE and non-Y AVX integer rm forms that the diff removes
// from HWWriteResGroup16.
+def HWWriteResGroup16_1 : SchedWriteRes<[HWPort23,HWPort15]> {
+ let Latency = 7;
+ let NumMicroOps = 2;
+ let ResourceCycles = [1,1];
+}
+def: InstRW<[HWWriteResGroup16_1], (instregex "PABSBrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "PABSDrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "PABSWrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "PADDBrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "PADDDrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "PADDQrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "PADDSBrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "PADDSWrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "PADDUSBrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "PADDUSWrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "PADDWrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "PAVGBrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "PAVGWrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "PCMPEQBrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "PCMPEQDrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "PCMPEQQrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "PCMPEQWrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "PCMPGTBrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "PCMPGTDrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "PCMPGTWrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "PMAXSBrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "PMAXSDrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "PMAXSWrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "PMAXUBrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "PMAXUDrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "PMAXUWrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "PMINSBrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "PMINSDrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "PMINSWrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "PMINUBrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "PMINUDrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "PMINUWrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "PSIGNBrm128")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "PSIGNDrm128")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "PSIGNWrm128")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "PSUBBrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "PSUBDrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "PSUBQrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "PSUBSBrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "PSUBSWrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "PSUBUSBrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "PSUBUSWrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "PSUBWrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "VPABSBrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "VPABSDrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "VPABSWrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "VPADDBrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "VPADDDrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "VPADDQrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "VPADDSBrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "VPADDSWrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "VPADDUSBrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "VPADDUSWrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "VPADDWrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "VPAVGBrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "VPAVGWrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "VPCMPEQBrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "VPCMPEQDrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "VPCMPEQQrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "VPCMPEQWrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "VPCMPGTBrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "VPCMPGTDrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "VPCMPGTWrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "VPMAXSBrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "VPMAXSDrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "VPMAXSWrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "VPMAXUBrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "VPMAXUDrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "VPMAXUWrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "VPMINSBrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "VPMINSDrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "VPMINSWrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "VPMINUBrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "VPMINUDrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "VPMINUWrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "VPSIGNBrm128")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "VPSIGNDrm128")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "VPSIGNWrm128")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "VPSUBBrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "VPSUBDrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "VPSUBQrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "VPSUBSBrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "VPSUBSWrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "VPSUBUSBrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "VPSUBUSWrm")>;
+def: InstRW<[HWWriteResGroup16_1], (instregex "VPSUBWrm")>;
+
// HWWriteResGroup16_2 (added by this diff): HWPort23 + HWPort15, 2 micro-ops,
// Latency 8. It receives the Y-named AVX integer rm forms that the diff
// removes from HWWriteResGroup16.
+def HWWriteResGroup16_2 : SchedWriteRes<[HWPort23,HWPort15]> {
+ let Latency = 8;
+ let NumMicroOps = 2;
+ let ResourceCycles = [1,1];
+}
+def: InstRW<[HWWriteResGroup16_2], (instregex "VPABSBYrm")>;
+def: InstRW<[HWWriteResGroup16_2], (instregex "VPABSDYrm")>;
+def: InstRW<[HWWriteResGroup16_2], (instregex "VPABSWYrm")>;
+def: InstRW<[HWWriteResGroup16_2], (instregex "VPADDBYrm")>;
+def: InstRW<[HWWriteResGroup16_2], (instregex "VPADDDYrm")>;
+def: InstRW<[HWWriteResGroup16_2], (instregex "VPADDQYrm")>;
+def: InstRW<[HWWriteResGroup16_2], (instregex "VPADDSBYrm")>;
+def: InstRW<[HWWriteResGroup16_2], (instregex "VPADDSWYrm")>;
+def: InstRW<[HWWriteResGroup16_2], (instregex "VPADDUSBYrm")>;
+def: InstRW<[HWWriteResGroup16_2], (instregex "VPADDUSWYrm")>;
+def: InstRW<[HWWriteResGroup16_2], (instregex "VPADDWYrm")>;
+def: InstRW<[HWWriteResGroup16_2], (instregex "VPAVGBYrm")>;
+def: InstRW<[HWWriteResGroup16_2], (instregex "VPAVGWYrm")>;
+def: InstRW<[HWWriteResGroup16_2], (instregex "VPCMPEQBYrm")>;
+def: InstRW<[HWWriteResGroup16_2], (instregex "VPCMPEQDYrm")>;
+def: InstRW<[HWWriteResGroup16_2], (instregex "VPCMPEQQYrm")>;
+def: InstRW<[HWWriteResGroup16_2], (instregex "VPCMPEQWYrm")>;
+def: InstRW<[HWWriteResGroup16_2], (instregex "VPCMPGTBYrm")>;
+def: InstRW<[HWWriteResGroup16_2], (instregex "VPCMPGTDYrm")>;
+def: InstRW<[HWWriteResGroup16_2], (instregex "VPCMPGTWYrm")>;
+def: InstRW<[HWWriteResGroup16_2], (instregex "VPMAXSBYrm")>;
+def: InstRW<[HWWriteResGroup16_2], (instregex "VPMAXSDYrm")>;
+def: InstRW<[HWWriteResGroup16_2], (instregex "VPMAXSWYrm")>;
+def: InstRW<[HWWriteResGroup16_2], (instregex "VPMAXUBYrm")>;
+def: InstRW<[HWWriteResGroup16_2], (instregex "VPMAXUDYrm")>;
+def: InstRW<[HWWriteResGroup16_2], (instregex "VPMAXUWYrm")>;
+def: InstRW<[HWWriteResGroup16_2], (instregex "VPMINSBYrm")>;
+def: InstRW<[HWWriteResGroup16_2], (instregex "VPMINSDYrm")>;
+def: InstRW<[HWWriteResGroup16_2], (instregex "VPMINSWYrm")>;
+def: InstRW<[HWWriteResGroup16_2], (instregex "VPMINUBYrm")>;
+def: InstRW<[HWWriteResGroup16_2], (instregex "VPMINUDYrm")>;
+def: InstRW<[HWWriteResGroup16_2], (instregex "VPMINUWYrm")>;
+def: InstRW<[HWWriteResGroup16_2], (instregex "VPSIGNBYrm256")>;
+def: InstRW<[HWWriteResGroup16_2], (instregex "VPSIGNDYrm256")>;
+def: InstRW<[HWWriteResGroup16_2], (instregex "VPSIGNWYrm256")>;
+def: InstRW<[HWWriteResGroup16_2], (instregex "VPSUBBYrm")>;
+def: InstRW<[HWWriteResGroup16_2], (instregex "VPSUBDYrm")>;
+def: InstRW<[HWWriteResGroup16_2], (instregex "VPSUBQYrm")>;
+def: InstRW<[HWWriteResGroup16_2], (instregex "VPSUBSBYrm")>;
+def: InstRW<[HWWriteResGroup16_2], (instregex "VPSUBSWYrm")>;
+def: InstRW<[HWWriteResGroup16_2], (instregex "VPSUBUSBYrm")>;
+def: InstRW<[HWWriteResGroup16_2], (instregex "VPSUBUSWYrm")>;
+def: InstRW<[HWWriteResGroup16_2], (instregex "VPSUBWYrm")>;
// HWWriteResGroup17: 2 micro-ops over HWPort23 and HWPort015.
// Latency goes from 1 to 7 in this diff. The MMX logic forms removed below
// reappear under HWWriteResGroup17_1 and the Y-named forms under
// HWWriteResGroup17_2; the remaining entries stay here.
def HWWriteResGroup17 : SchedWriteRes<[HWPort23,HWPort015]> {
- let Latency = 1;
+ let Latency = 7;
let NumMicroOps = 2;
let ResourceCycles = [1,1];
}
def: InstRW<[HWWriteResGroup17], (instregex "BLENDPDrmi")>;
def: InstRW<[HWWriteResGroup17], (instregex "BLENDPSrmi")>;
-def: InstRW<[HWWriteResGroup17], (instregex "MMX_PANDNirm")>;
-def: InstRW<[HWWriteResGroup17], (instregex "MMX_PANDirm")>;
-def: InstRW<[HWWriteResGroup17], (instregex "MMX_PORirm")>;
-def: InstRW<[HWWriteResGroup17], (instregex "MMX_PXORirm")>;
def: InstRW<[HWWriteResGroup17], (instregex "PANDNrm")>;
def: InstRW<[HWWriteResGroup17], (instregex "PANDrm")>;
def: InstRW<[HWWriteResGroup17], (instregex "PORrm")>;
def: InstRW<[HWWriteResGroup17], (instregex "PXORrm")>;
-def: InstRW<[HWWriteResGroup17], (instregex "VBLENDPDYrmi")>;
def: InstRW<[HWWriteResGroup17], (instregex "VBLENDPDrmi")>;
-def: InstRW<[HWWriteResGroup17], (instregex "VBLENDPSYrmi")>;
def: InstRW<[HWWriteResGroup17], (instregex "VBLENDPSrmi")>;
def: InstRW<[HWWriteResGroup17], (instregex "VINSERTF128rm")>;
def: InstRW<[HWWriteResGroup17], (instregex "VINSERTI128rm")>;
-def: InstRW<[HWWriteResGroup17], (instregex "VPANDNYrm")>;
def: InstRW<[HWWriteResGroup17], (instregex "VPANDNrm")>;
-def: InstRW<[HWWriteResGroup17], (instregex "VPANDYrm")>;
def: InstRW<[HWWriteResGroup17], (instregex "VPANDrm")>;
-def: InstRW<[HWWriteResGroup17], (instregex "VPBLENDDYrmi")>;
def: InstRW<[HWWriteResGroup17], (instregex "VPBLENDDrmi")>;
-def: InstRW<[HWWriteResGroup17], (instregex "VPORYrm")>;
def: InstRW<[HWWriteResGroup17], (instregex "VPORrm")>;
-def: InstRW<[HWWriteResGroup17], (instregex "VPXORYrm")>;
def: InstRW<[HWWriteResGroup17], (instregex "VPXORrm")>;
// HWWriteResGroup17_1 (added by this diff): HWPort23 + HWPort015, 2 micro-ops,
// Latency 6. Holds the four MMX logic rm forms taken out of HWWriteResGroup17.
+def HWWriteResGroup17_1 : SchedWriteRes<[HWPort23,HWPort015]> {
+ let Latency = 6;
+ let NumMicroOps = 2;
+ let ResourceCycles = [1,1];
+}
+def: InstRW<[HWWriteResGroup17_1], (instregex "MMX_PANDNirm")>;
+def: InstRW<[HWWriteResGroup17_1], (instregex "MMX_PANDirm")>;
+def: InstRW<[HWWriteResGroup17_1], (instregex "MMX_PORirm")>;
+def: InstRW<[HWWriteResGroup17_1], (instregex "MMX_PXORirm")>;
+
// HWWriteResGroup17_2 (added by this diff): HWPort23 + HWPort015, 2 micro-ops,
// Latency 8. Holds the Y-named blend/logic rm forms taken out of
// HWWriteResGroup17.
+def HWWriteResGroup17_2 : SchedWriteRes<[HWPort23,HWPort015]> {
+ let Latency = 8;
+ let NumMicroOps = 2;
+ let ResourceCycles = [1,1];
+}
+def: InstRW<[HWWriteResGroup17_2], (instregex "VBLENDPDYrmi")>;
+def: InstRW<[HWWriteResGroup17_2], (instregex "VBLENDPSYrmi")>;
+def: InstRW<[HWWriteResGroup17_2], (instregex "VPANDNYrm")>;
+def: InstRW<[HWWriteResGroup17_2], (instregex "VPANDYrm")>;
+def: InstRW<[HWWriteResGroup17_2], (instregex "VPBLENDDYrmi")>;
+def: InstRW<[HWWriteResGroup17_2], (instregex "VPORYrm")>;
+def: InstRW<[HWWriteResGroup17_2], (instregex "VPXORYrm")>;
+
// HWWriteResGroup18: 2 micro-ops over HWPort23 and HWPort0156.
// Latency goes from 1 to 6 in this diff; user shown: XOR8rm.
def HWWriteResGroup18 : SchedWriteRes<[HWPort23,HWPort0156]> {
- let Latency = 1;
+ let Latency = 6;
let NumMicroOps = 2;
let ResourceCycles = [1,1];
}
def: InstRW<[HWWriteResGroup18], (instregex "XOR8rm")>;
// HWWriteResGroup19: 2 micro-ops over HWPort237 and HWPort0156.
// Latency goes from 1 to 2 in this diff; user shown: SFENCE.
// No HWPort23 is listed, and the bump is only +1 here.
def HWWriteResGroup19 : SchedWriteRes<[HWPort237,HWPort0156]> {
- let Latency = 1;
+ let Latency = 2;
let NumMicroOps = 2;
let ResourceCycles = [1,1];
}
def: InstRW<[HWWriteResGroup19], (instregex "SFENCE")>;
// HWWriteResGroup20: 3 micro-ops over HWPort4, HWPort5 and HWPort237.
// Latency goes from 1 to 2 in this diff; user shown: VSTMXCSR.
def HWWriteResGroup20 : SchedWriteRes<[HWPort4,HWPort5,HWPort237]> {
- let Latency = 1;
+ let Latency = 2;
let NumMicroOps = 3;
let ResourceCycles = [1,1,1];
}
def: InstRW<[HWWriteResGroup20], (instregex "VSTMXCSR")>;
// HWWriteResGroup21: 3 micro-ops over HWPort4, HWPort6 and HWPort237.
// Latency goes from 1 to 2 in this diff; user shown: FNSTCW16m.
def HWWriteResGroup21 : SchedWriteRes<[HWPort4,HWPort6,HWPort237]> {
- let Latency = 1;
+ let Latency = 2;
let NumMicroOps = 3;
let ResourceCycles = [1,1,1];
}
def: InstRW<[HWWriteResGroup21], (instregex "FNSTCW16m")>;
// HWWriteResGroup22: 3 micro-ops over HWPort4, HWPort237 and HWPort06.
// Latency goes from 1 to 2 in this diff; user shown: SETSm.
def HWWriteResGroup22 : SchedWriteRes<[HWPort4,HWPort237,HWPort06]> {
- let Latency = 1;
+ let Latency = 2;
let NumMicroOps = 3;
let ResourceCycles = [1,1,1];
}
def: InstRW<[HWWriteResGroup22], (instregex "SETSm")>;
// HWWriteResGroup23: 3 micro-ops over HWPort4, HWPort237 and HWPort15.
// Latency goes from 1 to 2 in this diff; user shown: MOVBE(32|64)mr.
def HWWriteResGroup23 : SchedWriteRes<[HWPort4,HWPort237,HWPort15]> {
- let Latency = 1;
+ let Latency = 2;
let NumMicroOps = 3;
let ResourceCycles = [1,1,1];
}
def: InstRW<[HWWriteResGroup23], (instregex "MOVBE(32|64)mr")>;
// HWWriteResGroup23_16: the 16-bit MOVBE store form. It uses HWPort06 where
// HWWriteResGroup23 uses HWPort15; otherwise 3 micro-ops with HWPort237 and
// HWPort4. Latency goes from 1 to 2 in this diff.
def HWWriteResGroup23_16 : SchedWriteRes<[HWPort06, HWPort237, HWPort4]> {
- let Latency = 1;
+ let Latency = 2;
let NumMicroOps = 3;
let ResourceCycles = [1,1,1];
}
def: InstRW<[HWWriteResGroup23_16], (instregex "MOVBE16mr")>;
// HWWriteResGroup24: 3 micro-ops over HWPort4, HWPort237 and HWPort0156.
// Latency goes from 1 to 2 in this diff; user shown: STOSW.
def HWWriteResGroup24 : SchedWriteRes<[HWPort4,HWPort237,HWPort0156]> {
- let Latency = 1;
+ let Latency = 2;
let NumMicroOps = 3;
let ResourceCycles = [1,1,1];
}
def: InstRW<[HWWriteResGroup24], (instregex "STOSW")>;
// HWWriteResGroup25: 4 micro-ops over HWPort4, HWPort23, HWPort237 and
// HWPort06. Latency goes from 1 to 7 in this diff; user shown: SHR8mi.
def HWWriteResGroup25 : SchedWriteRes<[HWPort4,HWPort23,HWPort237,HWPort06]> {
- let Latency = 1;
+ let Latency = 7;
let NumMicroOps = 4;
let ResourceCycles = [1,1,1,1];
}
def: InstRW<[HWWriteResGroup25], (instregex "SHR8mi")>;
// HWWriteResGroup26: 4 micro-ops over HWPort4, HWPort23, HWPort237 and
// HWPort0156. Latency goes from 1 to 7 in this diff, which also newly maps
// POP(16|32|64)rmm and PUSH(16|32|64)rmm onto this group.
def HWWriteResGroup26 : SchedWriteRes<[HWPort4,HWPort23,HWPort237,HWPort0156]> {
- let Latency = 1;
+ let Latency = 7;
let NumMicroOps = 4;
let ResourceCycles = [1,1,1,1];
}
def: InstRW<[HWWriteResGroup26], (instregex "OR(16|32|64)mr")>;
def: InstRW<[HWWriteResGroup26], (instregex "OR8mi")>;
def: InstRW<[HWWriteResGroup26], (instregex "OR8mr")>;
+def: InstRW<[HWWriteResGroup26], (instregex "POP(16|32|64)rmm")>;
+def: InstRW<[HWWriteResGroup26], (instregex "PUSH(16|32|64)rmm")>;
def: InstRW<[HWWriteResGroup26], (instregex "SUB(16|32|64)mi8")>;
def: InstRW<[HWWriteResGroup26], (instregex "SUB(16|32|64)mr")>;
def: InstRW<[HWWriteResGroup26], (instregex "SUB8mi")>;
def: InstRW<[HWWriteResGroup35], (instregex "SETBEr")>;
// HWWriteResGroup36: 3 micro-ops, ResourceCycles [2,1] over HWPort5 and
// HWPort23. Latency goes from 2 to 8 in this diff. The Y-named forms removed
// below reappear under HWWriteResGroup36_1 and the MMX_PACK* forms under
// HWWriteResGroup36_2.
def HWWriteResGroup36 : SchedWriteRes<[HWPort5,HWPort23]> {
- let Latency = 2;
+ let Latency = 8;
let NumMicroOps = 3;
let ResourceCycles = [2,1];
}
def: InstRW<[HWWriteResGroup36], (instregex "BLENDVPDrm0")>;
def: InstRW<[HWWriteResGroup36], (instregex "BLENDVPSrm0")>;
-def: InstRW<[HWWriteResGroup36], (instregex "MMX_PACKSSDWirm")>;
-def: InstRW<[HWWriteResGroup36], (instregex "MMX_PACKSSWBirm")>;
-def: InstRW<[HWWriteResGroup36], (instregex "MMX_PACKUSWBirm")>;
def: InstRW<[HWWriteResGroup36], (instregex "PBLENDVBrm0")>;
-def: InstRW<[HWWriteResGroup36], (instregex "VBLENDVPDYrm")>;
def: InstRW<[HWWriteResGroup36], (instregex "VBLENDVPDrm")>;
-def: InstRW<[HWWriteResGroup36], (instregex "VBLENDVPSYrm")>;
def: InstRW<[HWWriteResGroup36], (instregex "VBLENDVPSrm")>;
-def: InstRW<[HWWriteResGroup36], (instregex "VMASKMOVPDYrm")>;
def: InstRW<[HWWriteResGroup36], (instregex "VMASKMOVPDrm")>;
-def: InstRW<[HWWriteResGroup36], (instregex "VMASKMOVPSYrm")>;
def: InstRW<[HWWriteResGroup36], (instregex "VMASKMOVPSrm")>;
-def: InstRW<[HWWriteResGroup36], (instregex "VPBLENDVBYrm")>;
def: InstRW<[HWWriteResGroup36], (instregex "VPBLENDVBrm")>;
-def: InstRW<[HWWriteResGroup36], (instregex "VPMASKMOVDYrm")>;
def: InstRW<[HWWriteResGroup36], (instregex "VPMASKMOVDrm")>;
-def: InstRW<[HWWriteResGroup36], (instregex "VPMASKMOVQYrm")>;
def: InstRW<[HWWriteResGroup36], (instregex "VPMASKMOVQrm")>;
// HWWriteResGroup36_1 (added by this diff): HWPort5 + HWPort23, 3 micro-ops,
// ResourceCycles [2,1], Latency 9. Holds the Y-named variable-blend and
// masked-move rm forms taken out of HWWriteResGroup36.
+def HWWriteResGroup36_1 : SchedWriteRes<[HWPort5,HWPort23]> {
+ let Latency = 9;
+ let NumMicroOps = 3;
+ let ResourceCycles = [2,1];
+}
+def: InstRW<[HWWriteResGroup36_1], (instregex "VBLENDVPDYrm")>;
+def: InstRW<[HWWriteResGroup36_1], (instregex "VBLENDVPSYrm")>;
+def: InstRW<[HWWriteResGroup36_1], (instregex "VMASKMOVPDYrm")>;
+def: InstRW<[HWWriteResGroup36_1], (instregex "VMASKMOVPSYrm")>;
+def: InstRW<[HWWriteResGroup36_1], (instregex "VPBLENDVBYrm")>;
+def: InstRW<[HWWriteResGroup36_1], (instregex "VPMASKMOVDYrm")>;
+def: InstRW<[HWWriteResGroup36_1], (instregex "VPMASKMOVQYrm")>;
+
// HWWriteResGroup36_2 (added by this diff): HWPort5 + HWPort23, 3 micro-ops,
// ResourceCycles [2,1], Latency 7. Holds the three MMX_PACK* rm forms taken
// out of HWWriteResGroup36.
+def HWWriteResGroup36_2 : SchedWriteRes<[HWPort5,HWPort23]> {
+ let Latency = 7;
+ let NumMicroOps = 3;
+ let ResourceCycles = [2,1];
+}
+def: InstRW<[HWWriteResGroup36_2], (instregex "MMX_PACKSSDWirm")>;
+def: InstRW<[HWWriteResGroup36_2], (instregex "MMX_PACKSSWBirm")>;
+def: InstRW<[HWWriteResGroup36_2], (instregex "MMX_PACKUSWBirm")>;
+
// HWWriteResGroup37: 3 micro-ops, ResourceCycles [1,2] over HWPort23 and
// HWPort0156. Latency goes from 2 to 7 in this diff; user shown: SCASW.
def HWWriteResGroup37 : SchedWriteRes<[HWPort23,HWPort0156]> {
- let Latency = 2;
+ let Latency = 7;
let NumMicroOps = 3;
let ResourceCycles = [1,2];
}
def: InstRW<[HWWriteResGroup37], (instregex "SCASW")>;
// HWWriteResGroup38: 3 micro-ops over HWPort0, HWPort5 and HWPort23.
// Latency goes from 2 to 8 in this diff; user shown: VPTESTrm.
def HWWriteResGroup38 : SchedWriteRes<[HWPort0,HWPort5,HWPort23]> {
- let Latency = 2;
+ let Latency = 8;
let NumMicroOps = 3;
let ResourceCycles = [1,1,1];
}
def: InstRW<[HWWriteResGroup38], (instregex "VPTESTrm")>;
// HWWriteResGroup39: 3 micro-ops over HWPort0, HWPort01 and HWPort23.
// Latency goes from 2 to 7 in this diff; user shown: FLDCW16m.
def HWWriteResGroup39 : SchedWriteRes<[HWPort0,HWPort01,HWPort23]> {
- let Latency = 2;
+ let Latency = 7;
let NumMicroOps = 3;
let ResourceCycles = [1,1,1];
}
def: InstRW<[HWWriteResGroup39], (instregex "FLDCW16m")>;
// HWWriteResGroup40: 3 micro-ops over HWPort0, HWPort23 and HWPort0156.
// Latency goes from 2 to 7 in this diff; user shown: VLDMXCSR.
def HWWriteResGroup40 : SchedWriteRes<[HWPort0,HWPort23,HWPort0156]> {
- let Latency = 2;
+ let Latency = 7;
let NumMicroOps = 3;
let ResourceCycles = [1,1,1];
}
def: InstRW<[HWWriteResGroup40], (instregex "VLDMXCSR")>;
// HWWriteResGroup41: 3 micro-ops over HWPort6, HWPort23 and HWPort0156, used
// by the return instructions listed below. Latency goes from 2 to 7 in this
// diff, which also newly maps RETL onto the group alongside LRETQ and RETQ.
def HWWriteResGroup41 : SchedWriteRes<[HWPort6,HWPort23,HWPort0156]> {
- let Latency = 2;
+ let Latency = 7;
let NumMicroOps = 3;
let ResourceCycles = [1,1,1];
}
def: InstRW<[HWWriteResGroup41], (instregex "LRETQ")>;
+def: InstRW<[HWWriteResGroup41], (instregex "RETL")>;
def: InstRW<[HWWriteResGroup41], (instregex "RETQ")>;
// HWWriteResGroup42: 3 micro-ops over HWPort23, HWPort06 and HWPort15.
// Latency goes from 2 to 7 in this diff; user shown: BEXTR64rm.
def HWWriteResGroup42 : SchedWriteRes<[HWPort23,HWPort06,HWPort15]> {
- let Latency = 2;
+ let Latency = 7;
let NumMicroOps = 3;
let ResourceCycles = [1,1,1];
}
def: InstRW<[HWWriteResGroup42], (instregex "BEXTR64rm")>;
// HWWriteResGroup43: 3 micro-ops over HWPort23, HWPort06 and HWPort0156.
// Latency goes from 2 to 7 in this diff; user shown: SBB8rm.
def HWWriteResGroup43 : SchedWriteRes<[HWPort23,HWPort06,HWPort0156]> {
- let Latency = 2;
+ let Latency = 7;
let NumMicroOps = 3;
let ResourceCycles = [1,1,1];
}
def: InstRW<[HWWriteResGroup43], (instregex "SBB8rm")>;
// HWWriteResGroup44: 4 micro-ops over HWPort4, HWPort6, HWPort237 and
// HWPort0156. Latency goes from 2 to 3 in this diff; user shown:
// CALL(16|32|64)r. No HWPort23 is listed, and the bump is only +1 here.
def HWWriteResGroup44 : SchedWriteRes<[HWPort4,HWPort6,HWPort237,HWPort0156]> {
- let Latency = 2;
+ let Latency = 3;
let NumMicroOps = 4;
let ResourceCycles = [1,1,1,1];
}
def: InstRW<[HWWriteResGroup44], (instregex "CALL(16|32|64)r")>;
// HWWriteResGroup45: 4 micro-ops over HWPort4, HWPort237, HWPort06 and
// HWPort0156. Latency goes from 2 to 3 in this diff; user shown: SETBEm.
def HWWriteResGroup45 : SchedWriteRes<[HWPort4,HWPort237,HWPort06,HWPort0156]> {
- let Latency = 2;
+ let Latency = 3;
let NumMicroOps = 4;
let ResourceCycles = [1,1,1,1];
}
def: InstRW<[HWWriteResGroup45], (instregex "SETBEm")>;
// HWWriteResGroup46: 5 micro-ops, ResourceCycles [1,1,1,2] over HWPort4,
// HWPort23, HWPort237 and HWPort06. Latency goes from 2 to 8 in this diff;
// user shown: ROR8mi.
def HWWriteResGroup46 : SchedWriteRes<[HWPort4,HWPort23,HWPort237,HWPort06]> {
- let Latency = 2;
+ let Latency = 8;
let NumMicroOps = 5;
let ResourceCycles = [1,1,1,2];
}
def: InstRW<[HWWriteResGroup46], (instregex "ROR8mi")>;
// HWWriteResGroup47: 5 micro-ops, ResourceCycles [1,1,1,2] over HWPort4,
// HWPort23, HWPort237 and HWPort0156. Latency goes from 2 to 8 in this diff;
// user shown: XADD8rm.
def HWWriteResGroup47 : SchedWriteRes<[HWPort4,HWPort23,HWPort237,HWPort0156]> {
- let Latency = 2;
+ let Latency = 8;
let NumMicroOps = 5;
let ResourceCycles = [1,1,1,2];
}
def: InstRW<[HWWriteResGroup47], (instregex "XADD8rm")>;
// HWWriteResGroup48: 5 micro-ops over HWPort4, HWPort6, HWPort23, HWPort237
// and HWPort0156. Latency goes from 2 to 8 in this diff. The InstRW lines
// that use this group are not part of the hunk shown here.
def HWWriteResGroup48 : SchedWriteRes<[HWPort4,HWPort6,HWPort23,HWPort237,HWPort0156]> {
- let Latency = 2;
+ let Latency = 8;
let NumMicroOps = 5;
let ResourceCycles = [1,1,1,1,1];
}
def: InstRW<[HWWriteResGroup51], (instregex "VPMOVZXWQYrr")>;
// HWWriteResGroup52: 2 micro-ops over HWPort1 and HWPort23.
// Latency goes from 3 to 9 in this diff. Afterwards only non-Y packed FP rm
// forms stay mapped here. The removed x87 (ADD_F*/SUB*_F*/ILD_F*) and Y-named
// forms reappear under HWWriteResGroup52_1.
// NOTE(review): the removed scalar SSE/AVX forms (ADDSD/ADDSS, CMPSS,
// (U)COMIS*, MAX/MIN/SUB S*), BSF/BSR, LZCNT/TZCNT/POPCNT, PDEP/PEXT,
// IMUL/MUL 8/64 and MMX_CVT* entries are not re-added anywhere in the lines
// visible here -- confirm they are reassigned elsewhere in the patch.
def HWWriteResGroup52 : SchedWriteRes<[HWPort1,HWPort23]> {
- let Latency = 3;
+ let Latency = 9;
let NumMicroOps = 2;
let ResourceCycles = [1,1];
}
def: InstRW<[HWWriteResGroup52], (instregex "ADDPDrm")>;
def: InstRW<[HWWriteResGroup52], (instregex "ADDPSrm")>;
-def: InstRW<[HWWriteResGroup52], (instregex "ADDSDrm")>;
-def: InstRW<[HWWriteResGroup52], (instregex "ADDSSrm")>;
def: InstRW<[HWWriteResGroup52], (instregex "ADDSUBPDrm")>;
def: InstRW<[HWWriteResGroup52], (instregex "ADDSUBPSrm")>;
-def: InstRW<[HWWriteResGroup52], (instregex "ADD_F32m")>;
-def: InstRW<[HWWriteResGroup52], (instregex "ADD_F64m")>;
-def: InstRW<[HWWriteResGroup52], (instregex "BSF(16|32|64)rm")>;
-def: InstRW<[HWWriteResGroup52], (instregex "BSR(16|32|64)rm")>;
def: InstRW<[HWWriteResGroup52], (instregex "CMPPDrmi")>;
def: InstRW<[HWWriteResGroup52], (instregex "CMPPSrmi")>;
-def: InstRW<[HWWriteResGroup52], (instregex "CMPSSrm")>;
-def: InstRW<[HWWriteResGroup52], (instregex "COMISDrm")>;
-def: InstRW<[HWWriteResGroup52], (instregex "COMISSrm")>;
def: InstRW<[HWWriteResGroup52], (instregex "CVTDQ2PSrm")>;
def: InstRW<[HWWriteResGroup52], (instregex "CVTPS2DQrm")>;
def: InstRW<[HWWriteResGroup52], (instregex "CVTTPS2DQrm")>;
-def: InstRW<[HWWriteResGroup52], (instregex "ILD_F16m")>;
-def: InstRW<[HWWriteResGroup52], (instregex "ILD_F32m")>;
-def: InstRW<[HWWriteResGroup52], (instregex "ILD_F64m")>;
-def: InstRW<[HWWriteResGroup52], (instregex "IMUL64m")>;
-def: InstRW<[HWWriteResGroup52], (instregex "IMUL64rm(i8?)")>;
-def: InstRW<[HWWriteResGroup52], (instregex "IMUL8m")>;
-def: InstRW<[HWWriteResGroup52], (instregex "LZCNT(16|32|64)rm")>;
def: InstRW<[HWWriteResGroup52], (instregex "MAXPDrm")>;
def: InstRW<[HWWriteResGroup52], (instregex "MAXPSrm")>;
-def: InstRW<[HWWriteResGroup52], (instregex "MAXSDrm")>;
-def: InstRW<[HWWriteResGroup52], (instregex "MAXSSrm")>;
def: InstRW<[HWWriteResGroup52], (instregex "MINPDrm")>;
def: InstRW<[HWWriteResGroup52], (instregex "MINPSrm")>;
-def: InstRW<[HWWriteResGroup52], (instregex "MINSDrm")>;
-def: InstRW<[HWWriteResGroup52], (instregex "MINSSrm")>;
-def: InstRW<[HWWriteResGroup52], (instregex "MMX_CVTPI2PSirm")>;
-def: InstRW<[HWWriteResGroup52], (instregex "MMX_CVTPS2PIirm")>;
-def: InstRW<[HWWriteResGroup52], (instregex "MMX_CVTTPS2PIirm")>;
-def: InstRW<[HWWriteResGroup52], (instregex "MUL64m")>;
-def: InstRW<[HWWriteResGroup52], (instregex "MUL8m")>;
-def: InstRW<[HWWriteResGroup52], (instregex "PDEP32rm")>;
-def: InstRW<[HWWriteResGroup52], (instregex "PDEP64rm")>;
-def: InstRW<[HWWriteResGroup52], (instregex "PEXT32rm")>;
-def: InstRW<[HWWriteResGroup52], (instregex "PEXT64rm")>;
-def: InstRW<[HWWriteResGroup52], (instregex "POPCNT(16|32|64)rm")>;
def: InstRW<[HWWriteResGroup52], (instregex "SUBPDrm")>;
def: InstRW<[HWWriteResGroup52], (instregex "SUBPSrm")>;
-def: InstRW<[HWWriteResGroup52], (instregex "SUBR_F32m")>;
-def: InstRW<[HWWriteResGroup52], (instregex "SUBR_F64m")>;
-def: InstRW<[HWWriteResGroup52], (instregex "SUBSDrm")>;
-def: InstRW<[HWWriteResGroup52], (instregex "SUBSSrm")>;
-def: InstRW<[HWWriteResGroup52], (instregex "SUB_F32m")>;
-def: InstRW<[HWWriteResGroup52], (instregex "SUB_F64m")>;
-def: InstRW<[HWWriteResGroup52], (instregex "TZCNT(16|32|64)rm")>;
-def: InstRW<[HWWriteResGroup52], (instregex "UCOMISDrm")>;
-def: InstRW<[HWWriteResGroup52], (instregex "UCOMISSrm")>;
-def: InstRW<[HWWriteResGroup52], (instregex "VADDPDYrm")>;
def: InstRW<[HWWriteResGroup52], (instregex "VADDPDrm")>;
-def: InstRW<[HWWriteResGroup52], (instregex "VADDPSYrm")>;
def: InstRW<[HWWriteResGroup52], (instregex "VADDPSrm")>;
-def: InstRW<[HWWriteResGroup52], (instregex "VADDSDrm")>;
-def: InstRW<[HWWriteResGroup52], (instregex "VADDSSrm")>;
-def: InstRW<[HWWriteResGroup52], (instregex "VADDSUBPDYrm")>;
def: InstRW<[HWWriteResGroup52], (instregex "VADDSUBPDrm")>;
-def: InstRW<[HWWriteResGroup52], (instregex "VADDSUBPSYrm")>;
def: InstRW<[HWWriteResGroup52], (instregex "VADDSUBPSrm")>;
-def: InstRW<[HWWriteResGroup52], (instregex "VCMPPDYrmi")>;
def: InstRW<[HWWriteResGroup52], (instregex "VCMPPDrmi")>;
-def: InstRW<[HWWriteResGroup52], (instregex "VCMPPSYrmi")>;
def: InstRW<[HWWriteResGroup52], (instregex "VCMPPSrmi")>;
-def: InstRW<[HWWriteResGroup52], (instregex "VCMPSDrm")>;
-def: InstRW<[HWWriteResGroup52], (instregex "VCMPSSrm")>;
-def: InstRW<[HWWriteResGroup52], (instregex "VCOMISDrm")>;
-def: InstRW<[HWWriteResGroup52], (instregex "VCOMISSrm")>;
-def: InstRW<[HWWriteResGroup52], (instregex "VCVTDQ2PSYrm")>;
def: InstRW<[HWWriteResGroup52], (instregex "VCVTDQ2PSrm")>;
-def: InstRW<[HWWriteResGroup52], (instregex "VCVTPS2DQYrm")>;
def: InstRW<[HWWriteResGroup52], (instregex "VCVTPS2DQrm")>;
-def: InstRW<[HWWriteResGroup52], (instregex "VCVTTPS2DQYrm")>;
def: InstRW<[HWWriteResGroup52], (instregex "VCVTTPS2DQrm")>;
-def: InstRW<[HWWriteResGroup52], (instregex "VMAXPDYrm")>;
def: InstRW<[HWWriteResGroup52], (instregex "VMAXPDrm")>;
-def: InstRW<[HWWriteResGroup52], (instregex "VMAXPSYrm")>;
def: InstRW<[HWWriteResGroup52], (instregex "VMAXPSrm")>;
-def: InstRW<[HWWriteResGroup52], (instregex "VMAXSDrm")>;
-def: InstRW<[HWWriteResGroup52], (instregex "VMAXSSrm")>;
-def: InstRW<[HWWriteResGroup52], (instregex "VMINPDYrm")>;
def: InstRW<[HWWriteResGroup52], (instregex "VMINPDrm")>;
-def: InstRW<[HWWriteResGroup52], (instregex "VMINPSYrm")>;
def: InstRW<[HWWriteResGroup52], (instregex "VMINPSrm")>;
-def: InstRW<[HWWriteResGroup52], (instregex "VMINSDrm")>;
-def: InstRW<[HWWriteResGroup52], (instregex "VMINSSrm")>;
-def: InstRW<[HWWriteResGroup52], (instregex "VSUBPDYrm")>;
def: InstRW<[HWWriteResGroup52], (instregex "VSUBPDrm")>;
-def: InstRW<[HWWriteResGroup52], (instregex "VSUBPSYrm")>;
def: InstRW<[HWWriteResGroup52], (instregex "VSUBPSrm")>;
-def: InstRW<[HWWriteResGroup52], (instregex "VSUBSDrm")>;
-def: InstRW<[HWWriteResGroup52], (instregex "VSUBSSrm")>;
-def: InstRW<[HWWriteResGroup52], (instregex "VUCOMISDrm")>;
-def: InstRW<[HWWriteResGroup52], (instregex "VUCOMISSrm")>;
// This span removes HWWriteResGroup52_16 and HWWriteResGroup52_32 (the 16-
// and 32-bit IMUL/MUL memory forms on HWPort1 + HWPort0156 + HWPort23) and,
// reusing the closing brace of the old 52_32 def, introduces
// HWWriteResGroup52_1: HWPort1 + HWPort23, 2 micro-ops, Latency 10, for the
// x87 memory forms and Y-named packed FP rm forms.
// NOTE(review): the IMUL16/32 and MUL16/32 memory forms are not re-added in
// the lines visible here -- confirm they get a new group elsewhere.
-def HWWriteResGroup52_16 : SchedWriteRes<[HWPort1, HWPort0156, HWPort23]> {
- let Latency = 3;
- let NumMicroOps = 4;
-}
-def: InstRW<[HWWriteResGroup52_16], (instregex "IMUL16m")>;
-def: InstRW<[HWWriteResGroup52_16], (instregex "IMUL16rm(i8?)")>;
-def: InstRW<[HWWriteResGroup52_16], (instregex "MUL16m")>;
-
-def HWWriteResGroup52_32 : SchedWriteRes<[HWPort1, HWPort0156, HWPort23]> {
- let Latency = 3;
- let NumMicroOps = 3;
+def HWWriteResGroup52_1 : SchedWriteRes<[HWPort1,HWPort23]> {
+ let Latency = 10;
+ let NumMicroOps = 2;
+ let ResourceCycles = [1,1];
}
-def: InstRW<[HWWriteResGroup52_32], (instregex "IMUL32m")>;
-def: InstRW<[HWWriteResGroup52_32], (instregex "IMUL32rm(i8?)")>;
-def: InstRW<[HWWriteResGroup52_32], (instregex "MUL32m")>;
+def: InstRW<[HWWriteResGroup52_1], (instregex "ADD_F32m")>;
+def: InstRW<[HWWriteResGroup52_1], (instregex "ADD_F64m")>;
+def: InstRW<[HWWriteResGroup52_1], (instregex "ILD_F16m")>;
+def: InstRW<[HWWriteResGroup52_1], (instregex "ILD_F32m")>;
+def: InstRW<[HWWriteResGroup52_1], (instregex "ILD_F64m")>;
+def: InstRW<[HWWriteResGroup52_1], (instregex "SUBR_F32m")>;
+def: InstRW<[HWWriteResGroup52_1], (instregex "SUBR_F64m")>;
+def: InstRW<[HWWriteResGroup52_1], (instregex "SUB_F32m")>;
+def: InstRW<[HWWriteResGroup52_1], (instregex "SUB_F64m")>;
+def: InstRW<[HWWriteResGroup52_1], (instregex "VADDPDYrm")>;
+def: InstRW<[HWWriteResGroup52_1], (instregex "VADDPSYrm")>;
+def: InstRW<[HWWriteResGroup52_1], (instregex "VADDSUBPDYrm")>;
+def: InstRW<[HWWriteResGroup52_1], (instregex "VADDSUBPSYrm")>;
+def: InstRW<[HWWriteResGroup52_1], (instregex "VCMPPDYrmi")>;
+def: InstRW<[HWWriteResGroup52_1], (instregex "VCMPPSYrmi")>;
+def: InstRW<[HWWriteResGroup52_1], (instregex "VCVTDQ2PSYrm")>;
+def: InstRW<[HWWriteResGroup52_1], (instregex "VCVTPS2DQYrm")>;
+def: InstRW<[HWWriteResGroup52_1], (instregex "VCVTTPS2DQYrm")>;
+def: InstRW<[HWWriteResGroup52_1], (instregex "VMAXPDYrm")>;
+def: InstRW<[HWWriteResGroup52_1], (instregex "VMAXPSYrm")>;
+def: InstRW<[HWWriteResGroup52_1], (instregex "VMINPDYrm")>;
+def: InstRW<[HWWriteResGroup52_1], (instregex "VMINPSYrm")>;
+def: InstRW<[HWWriteResGroup52_1], (instregex "VSUBPDYrm")>;
+def: InstRW<[HWWriteResGroup52_1], (instregex "VSUBPSYrm")>;
// HWWriteResGroup53: 2 micro-ops, one cycle each on HWPort5 and HWPort23;
// latency is raised from 3 to 10. All VPMOVSX*Yrm bindings and VPMOVZXWDYrm
// are removed from this class; the VPERM* and other VPMOVZX*Yrm bindings stay.
def HWWriteResGroup53 : SchedWriteRes<[HWPort5,HWPort23]> {
- let Latency = 3;
+ let Latency = 10;
let NumMicroOps = 2;
let ResourceCycles = [1,1];
}
def: InstRW<[HWWriteResGroup53], (instregex "VPERMPDYmi")>;
def: InstRW<[HWWriteResGroup53], (instregex "VPERMPSYrm")>;
def: InstRW<[HWWriteResGroup53], (instregex "VPERMQYmi")>;
-def: InstRW<[HWWriteResGroup53], (instregex "VPMOVSXBDYrm")>;
-def: InstRW<[HWWriteResGroup53], (instregex "VPMOVSXBQYrm")>;
-def: InstRW<[HWWriteResGroup53], (instregex "VPMOVSXBWYrm")>;
-def: InstRW<[HWWriteResGroup53], (instregex "VPMOVSXDQYrm")>;
-def: InstRW<[HWWriteResGroup53], (instregex "VPMOVSXWDYrm")>;
-def: InstRW<[HWWriteResGroup53], (instregex "VPMOVSXWQYrm")>;
def: InstRW<[HWWriteResGroup53], (instregex "VPMOVZXBDYrm")>;
def: InstRW<[HWWriteResGroup53], (instregex "VPMOVZXBQYrm")>;
def: InstRW<[HWWriteResGroup53], (instregex "VPMOVZXBWYrm")>;
def: InstRW<[HWWriteResGroup53], (instregex "VPMOVZXDQYrm")>;
-def: InstRW<[HWWriteResGroup53], (instregex "VPMOVZXWDYrm")>;
def: InstRW<[HWWriteResGroup53], (instregex "VPMOVZXWQYrm")>;
// HWWriteResGroup53_1: new class with the same ports, micro-op count and
// resource cycles as HWWriteResGroup53 but latency 9. It is bound to
// VPMOVSXBWYrm, VPMOVSXDQYrm, VPMOVSXWDYrm and VPMOVZXWDYrm.
+def HWWriteResGroup53_1 : SchedWriteRes<[HWPort5,HWPort23]> {
+ let Latency = 9;
+ let NumMicroOps = 2;
+ let ResourceCycles = [1,1];
+}
+def: InstRW<[HWWriteResGroup53_1], (instregex "VPMOVSXBWYrm")>;
+def: InstRW<[HWWriteResGroup53_1], (instregex "VPMOVSXDQYrm")>;
+def: InstRW<[HWWriteResGroup53_1], (instregex "VPMOVSXWDYrm")>;
+def: InstRW<[HWWriteResGroup53_1], (instregex "VPMOVZXWDYrm")>;
+
def HWWriteResGroup54 : SchedWriteRes<[HWPort0156]> {
let Latency = 3;
let NumMicroOps = 3;
def: InstRW<[HWWriteResGroup60], (instregex "SHR8rCL")>;
// HWWriteResGroup61 (bound to FNSTSWm): 3 micro-ops, one cycle each on HWPort0,
// HWPort4 and HWPort237; latency is raised from 3 to 4.
def HWWriteResGroup61 : SchedWriteRes<[HWPort0,HWPort4,HWPort237]> {
- let Latency = 3;
+ let Latency = 4;
let NumMicroOps = 3;
let ResourceCycles = [1,1,1];
}
def: InstRW<[HWWriteResGroup61], (instregex "FNSTSWm")>;
// HWWriteResGroup62 (bound to IST_FP64m): 3 micro-ops, one cycle each on
// HWPort1, HWPort4 and HWPort237; latency is raised from 3 to 4.
def HWWriteResGroup62 : SchedWriteRes<[HWPort1,HWPort4,HWPort237]> {
- let Latency = 3;
+ let Latency = 4;
let NumMicroOps = 3;
let ResourceCycles = [1,1,1];
}
def: InstRW<[HWWriteResGroup62], (instregex "IST_FP64m")>;
// HWWriteResGroup63: 4 micro-ops, two cycles on HWPort0 and one each on HWPort5
// and HWPort23; latency is raised from 3 to 10. Only the Y-suffixed variable
// shifts stay bound here; VPSLLVDrm, VPSRAVDrm and VPSRLVDrm are removed.
def HWWriteResGroup63 : SchedWriteRes<[HWPort0,HWPort5,HWPort23]> {
- let Latency = 3;
+ let Latency = 10;
let NumMicroOps = 4;
let ResourceCycles = [2,1,1];
}
def: InstRW<[HWWriteResGroup63], (instregex "VPSLLVDYrm")>;
-def: InstRW<[HWWriteResGroup63], (instregex "VPSLLVDrm")>;
def: InstRW<[HWWriteResGroup63], (instregex "VPSRAVDYrm")>;
-def: InstRW<[HWWriteResGroup63], (instregex "VPSRAVDrm")>;
def: InstRW<[HWWriteResGroup63], (instregex "VPSRLVDYrm")>;
-def: InstRW<[HWWriteResGroup63], (instregex "VPSRLVDrm")>;
+
// HWWriteResGroup63_1: new class with the same ports, micro-op count and
// resource cycles as HWWriteResGroup63 but latency 9. It is bound to
// VPSLLVDrm, VPSRAVDrm and VPSRLVDrm.
+def HWWriteResGroup63_1 : SchedWriteRes<[HWPort0,HWPort5,HWPort23]> {
+ let Latency = 9;
+ let NumMicroOps = 4;
+ let ResourceCycles = [2,1,1];
+}
+def: InstRW<[HWWriteResGroup63_1], (instregex "VPSLLVDrm")>;
+def: InstRW<[HWWriteResGroup63_1], (instregex "VPSRAVDrm")>;
+def: InstRW<[HWWriteResGroup63_1], (instregex "VPSRLVDrm")>;
// HWWriteResGroup64: 4 micro-ops, two cycles on HWPort5 and one each on
// HWPort23 and HWPort15; latency is raised from 3 to 8. Only the MMX_PHSUB*
// bindings shown stay; every PHADD*/PHSUB* and VPHADD*/VPHSUB* binding is
// removed from this class.
def HWWriteResGroup64 : SchedWriteRes<[HWPort5,HWPort23,HWPort15]> {
- let Latency = 3;
+ let Latency = 8;
let NumMicroOps = 4;
let ResourceCycles = [2,1,1];
}
def: InstRW<[HWWriteResGroup64], (instregex "MMX_PHSUBDrm64")>;
def: InstRW<[HWWriteResGroup64], (instregex "MMX_PHSUBSWrm64")>;
def: InstRW<[HWWriteResGroup64], (instregex "MMX_PHSUBWrm64")>;
-def: InstRW<[HWWriteResGroup64], (instregex "PHADDDrm")>;
-def: InstRW<[HWWriteResGroup64], (instregex "PHADDSWrm128")>;
-def: InstRW<[HWWriteResGroup64], (instregex "PHADDWrm")>;
-def: InstRW<[HWWriteResGroup64], (instregex "PHSUBDrm")>;
-def: InstRW<[HWWriteResGroup64], (instregex "PHSUBSWrm128")>;
-def: InstRW<[HWWriteResGroup64], (instregex "PHSUBWrm")>;
-def: InstRW<[HWWriteResGroup64], (instregex "VPHADDDYrm")>;
-def: InstRW<[HWWriteResGroup64], (instregex "VPHADDDrm")>;
-def: InstRW<[HWWriteResGroup64], (instregex "VPHADDSWrm128")>;
-def: InstRW<[HWWriteResGroup64], (instregex "VPHADDSWrm256")>;
-def: InstRW<[HWWriteResGroup64], (instregex "VPHADDWYrm")>;
-def: InstRW<[HWWriteResGroup64], (instregex "VPHADDWrm")>;
-def: InstRW<[HWWriteResGroup64], (instregex "VPHSUBDYrm")>;
-def: InstRW<[HWWriteResGroup64], (instregex "VPHSUBDrm")>;
-def: InstRW<[HWWriteResGroup64], (instregex "VPHSUBSWrm128")>;
-def: InstRW<[HWWriteResGroup64], (instregex "VPHSUBSWrm256")>;
-def: InstRW<[HWWriteResGroup64], (instregex "VPHSUBWYrm")>;
-def: InstRW<[HWWriteResGroup64], (instregex "VPHSUBWrm")>;
+
// HWWriteResGroup64_1: new class with the same ports, micro-op count and
// resource cycles as HWWriteResGroup64 but latency 10. It is bound to the
// Y-suffixed / rm256 VPHADD* and VPHSUB* instructions.
+def HWWriteResGroup64_1 : SchedWriteRes<[HWPort5,HWPort23,HWPort15]> {
+ let Latency = 10;
+ let NumMicroOps = 4;
+ let ResourceCycles = [2,1,1];
+}
+def: InstRW<[HWWriteResGroup64_1], (instregex "VPHADDDYrm")>;
+def: InstRW<[HWWriteResGroup64_1], (instregex "VPHADDSWrm256")>;
+def: InstRW<[HWWriteResGroup64_1], (instregex "VPHADDWYrm")>;
+def: InstRW<[HWWriteResGroup64_1], (instregex "VPHSUBDYrm")>;
+def: InstRW<[HWWriteResGroup64_1], (instregex "VPHSUBSWrm256")>;
+def: InstRW<[HWWriteResGroup64_1], (instregex "VPHSUBWYrm")>;
+
// HWWriteResGroup64_2: new class with the same ports, micro-op count and
// resource cycles as HWWriteResGroup64 but latency 9. It is bound to the
// PHADD*/PHSUB* instructions and the non-Y (rm / rm128) VPHADD*/VPHSUB* ones.
+def HWWriteResGroup64_2 : SchedWriteRes<[HWPort5,HWPort23,HWPort15]> {
+ let Latency = 9;
+ let NumMicroOps = 4;
+ let ResourceCycles = [2,1,1];
+}
+def: InstRW<[HWWriteResGroup64_2], (instregex "PHADDDrm")>;
+def: InstRW<[HWWriteResGroup64_2], (instregex "PHADDSWrm128")>;
+def: InstRW<[HWWriteResGroup64_2], (instregex "PHADDWrm")>;
+def: InstRW<[HWWriteResGroup64_2], (instregex "PHSUBDrm")>;
+def: InstRW<[HWWriteResGroup64_2], (instregex "PHSUBSWrm128")>;
+def: InstRW<[HWWriteResGroup64_2], (instregex "PHSUBWrm")>;
+def: InstRW<[HWWriteResGroup64_2], (instregex "VPHADDDrm")>;
+def: InstRW<[HWWriteResGroup64_2], (instregex "VPHADDSWrm128")>;
+def: InstRW<[HWWriteResGroup64_2], (instregex "VPHADDWrm")>;
+def: InstRW<[HWWriteResGroup64_2], (instregex "VPHSUBDrm")>;
+def: InstRW<[HWWriteResGroup64_2], (instregex "VPHSUBSWrm128")>;
+def: InstRW<[HWWriteResGroup64_2], (instregex "VPHSUBWrm")>;
// HWWriteResGroup65 (bound to CMOVBE(16|32|64)rm): 4 micro-ops, one cycle each
// on HWPort23 and HWPort06 plus two on HWPort0156; latency is raised from 3 to 8.
def HWWriteResGroup65 : SchedWriteRes<[HWPort23,HWPort06,HWPort0156]> {
- let Latency = 3;
+ let Latency = 8;
let NumMicroOps = 4;
let ResourceCycles = [1,1,2];
}
def: InstRW<[HWWriteResGroup65], (instregex "CMOVBE(16|32|64)rm")>;
// HWWriteResGroup66 (bound to RCR8mi): 5 micro-ops, one cycle each on HWPort23,
// HWPort237 and HWPort06 plus two on HWPort0156; latency is raised from 3 to 9.
def HWWriteResGroup66 : SchedWriteRes<[HWPort23,HWPort237,HWPort06,HWPort0156]> {
- let Latency = 3;
+ let Latency = 9;
let NumMicroOps = 5;
let ResourceCycles = [1,1,1,2];
}
def: InstRW<[HWWriteResGroup66], (instregex "RCR8mi")>;
// HWWriteResGroup67 (bound to ROR8mCL): 5 micro-ops on the same four ports as
// HWWriteResGroup66, but with the two-cycle entry on HWPort06 instead of
// HWPort0156; latency is raised from 3 to 9.
def HWWriteResGroup67 : SchedWriteRes<[HWPort23,HWPort237,HWPort06,HWPort0156]> {
- let Latency = 3;
+ let Latency = 9;
let NumMicroOps = 5;
let ResourceCycles = [1,1,2,1];
}
def: InstRW<[HWWriteResGroup67], (instregex "ROR8mCL")>;
// HWWriteResGroup68 (bound to XOR8mi): 6 micro-ops, one cycle each on HWPort4,
// HWPort23 and HWPort237 plus three on HWPort0156; latency is raised from 3 to 9.
def HWWriteResGroup68 : SchedWriteRes<[HWPort4,HWPort23,HWPort237,HWPort0156]> {
- let Latency = 3;
+ let Latency = 9;
let NumMicroOps = 6;
let ResourceCycles = [1,1,1,3];
}
def: InstRW<[HWWriteResGroup68], (instregex "XOR8mi")>;
// HWWriteResGroup69: 6 micro-ops spread over five ports (two cycles on
// HWPort06, one on each of the others); latency is raised from 3 to 9.
// Its InstRW bindings fall outside this excerpt.
def HWWriteResGroup69 : SchedWriteRes<[HWPort4,HWPort23,HWPort237,HWPort06,HWPort0156]> {
- let Latency = 3;
+ let Latency = 9;
let NumMicroOps = 6;
let ResourceCycles = [1,1,1,2,1];
}
def: InstRW<[HWWriteResGroup74_32], (instregex "MUL32r")>;
// HWWriteResGroup75 (bound to FICOMP32m): 3 micro-ops, two cycles on HWPort1
// and one on HWPort23; latency is raised from 4 to 11.
def HWWriteResGroup75 : SchedWriteRes<[HWPort1,HWPort23]> {
- let Latency = 4;
+ let Latency = 11;
let NumMicroOps = 3;
let ResourceCycles = [2,1];
}
def: InstRW<[HWWriteResGroup75], (instregex "FICOMP32m")>;
// HWWriteResGroup76 (bound to VCVTTSS2SIrm): 3 micro-ops, one cycle each on
// HWPort0, HWPort1 and HWPort23; latency is raised from 4 to 9.
def HWWriteResGroup76 : SchedWriteRes<[HWPort0,HWPort1,HWPort23]> {
- let Latency = 4;
+ let Latency = 9;
let NumMicroOps = 3;
let ResourceCycles = [1,1,1];
}
def: InstRW<[HWWriteResGroup76], (instregex "VCVTTSS2SIrm")>;
// HWWriteResGroup77: 3 micro-ops, one cycle each on HWPort0, HWPort5 and
// HWPort23; latency is raised from 4 to 10. VCVTPS2PDYrm stays bound here,
// while the VPTESTYrm binding is removed.
def HWWriteResGroup77 : SchedWriteRes<[HWPort0,HWPort5,HWPort23]> {
- let Latency = 4;
+ let Latency = 10;
let NumMicroOps = 3;
let ResourceCycles = [1,1,1];
}
def: InstRW<[HWWriteResGroup77], (instregex "VCVTPS2PDYrm")>;
-def: InstRW<[HWWriteResGroup77], (instregex "VPTESTYrm")>;
+
// HWWriteResGroup77_1: new class with the same ports, micro-op count and
// resource cycles as HWWriteResGroup77 but latency 11; bound to VPTESTYrm.
+def HWWriteResGroup77_1 : SchedWriteRes<[HWPort0,HWPort5,HWPort23]> {
+ let Latency = 11;
+ let NumMicroOps = 3;
+ let ResourceCycles = [1,1,1];
+}
+def: InstRW<[HWWriteResGroup77_1], (instregex "VPTESTYrm")>;
// HWWriteResGroup78: 3 micro-ops, one cycle each on HWPort1, HWPort5 and
// HWPort23; latency is raised from 4 to 10. The CVTSD2SSrm, MMX_CVTPI2PDirm
// and VCVTSD2SSrm bindings are removed from this class.
def HWWriteResGroup78 : SchedWriteRes<[HWPort1,HWPort5,HWPort23]> {
- let Latency = 4;
+ let Latency = 10;
let NumMicroOps = 3;
let ResourceCycles = [1,1,1];
}
def: InstRW<[HWWriteResGroup78], (instregex "CVTDQ2PDrm")>;
def: InstRW<[HWWriteResGroup78], (instregex "CVTPD2DQrm")>;
def: InstRW<[HWWriteResGroup78], (instregex "CVTPD2PSrm")>;
-def: InstRW<[HWWriteResGroup78], (instregex "CVTSD2SSrm")>;
def: InstRW<[HWWriteResGroup78], (instregex "CVTTPD2DQrm")>;
def: InstRW<[HWWriteResGroup78], (instregex "MMX_CVTPD2PIirm")>;
-def: InstRW<[HWWriteResGroup78], (instregex "MMX_CVTPI2PDirm")>;
def: InstRW<[HWWriteResGroup78], (instregex "MMX_CVTTPD2PIirm")>;
def: InstRW<[HWWriteResGroup78], (instregex "VCVTDQ2PDrm")>;
-def: InstRW<[HWWriteResGroup78], (instregex "VCVTSD2SSrm")>;
+
// HWWriteResGroup78_1: new class with the same ports, micro-op count and
// resource cycles as HWWriteResGroup78 but latency 9. It is bound to
// CVTSD2SSrm, MMX_CVTPI2PDirm and VCVTSD2SSrm.
+def HWWriteResGroup78_1 : SchedWriteRes<[HWPort1,HWPort5,HWPort23]> {
+ let Latency = 9;
+ let NumMicroOps = 3;
+ let ResourceCycles = [1,1,1];
+}
+def: InstRW<[HWWriteResGroup78_1], (instregex "CVTSD2SSrm")>;
+def: InstRW<[HWWriteResGroup78_1], (instregex "MMX_CVTPI2PDirm")>;
+def: InstRW<[HWWriteResGroup78_1], (instregex "VCVTSD2SSrm")>;
// HWWriteResGroup79 (bound to MULX64rm): 3 micro-ops, one cycle each on
// HWPort1, HWPort6 and HWPort23; latency is raised from 4 to 9.
def HWWriteResGroup79 : SchedWriteRes<[HWPort1,HWPort6,HWPort23]> {
- let Latency = 4;
+ let Latency = 9;
let NumMicroOps = 3;
let ResourceCycles = [1,1,1];
}
def: InstRW<[HWWriteResGroup79], (instregex "MULX64rm")>;
// HWWriteResGroup80: 3 micro-ops, one cycle each on HWPort5, HWPort23 and
// HWPort015; latency is raised from 4 to 9. Its InstRW bindings fall outside
// this excerpt.
def HWWriteResGroup80 : SchedWriteRes<[HWPort5,HWPort23,HWPort015]> {
- let Latency = 4;
+ let Latency = 9;
let NumMicroOps = 3;
let ResourceCycles = [1,1,1];
}
def: InstRW<[HWWriteResGroup83], (instregex "LAR(16|32|64)rr")>;
// HWWriteResGroup84 (bound to VPMASKMOVQmr): 4 micro-ops, one cycle each on
// HWPort0, HWPort4, HWPort237 and HWPort15; latency is raised from 4 to 5.
def HWWriteResGroup84 : SchedWriteRes<[HWPort0,HWPort4,HWPort237,HWPort15]> {
- let Latency = 4;
+ let Latency = 5;
let NumMicroOps = 4;
let ResourceCycles = [1,1,1,1];
}
def: InstRW<[HWWriteResGroup84], (instregex "VPMASKMOVQmr")>;
// HWWriteResGroup85 (bound to VCVTPS2PHmr): 4 micro-ops, one cycle each on
// HWPort1, HWPort4, HWPort5 and HWPort237; latency is raised from 4 to 5.
def HWWriteResGroup85 : SchedWriteRes<[HWPort1,HWPort4,HWPort5,HWPort237]> {
- let Latency = 4;
+ let Latency = 5;
let NumMicroOps = 4;
let ResourceCycles = [1,1,1,1];
}
def: InstRW<[HWWriteResGroup85], (instregex "VCVTPS2PHmr")>;
// HWWriteResGroup86 (bound to SHRD(16|32|64)mri8): 4 micro-ops, one cycle each
// on HWPort1, HWPort23, HWPort237 and HWPort0156; latency is raised from 4 to 10.
def HWWriteResGroup86 : SchedWriteRes<[HWPort1,HWPort23,HWPort237,HWPort0156]> {
- let Latency = 4;
+ let Latency = 10;
let NumMicroOps = 4;
let ResourceCycles = [1,1,1,1];
}
def: InstRW<[HWWriteResGroup86], (instregex "SHRD(16|32|64)mri8")>;
// HWWriteResGroup87 (bound to LSL(16|32|64)rm): 5 micro-ops, two cycles on
// HWPort6 and one each on HWPort1, HWPort23 and HWPort0156; latency is raised
// from 4 to 9.
def HWWriteResGroup87 : SchedWriteRes<[HWPort1,HWPort6,HWPort23,HWPort0156]> {
- let Latency = 4;
+ let Latency = 9;
let NumMicroOps = 5;
let ResourceCycles = [1,2,1,1];
}
def: InstRW<[HWWriteResGroup87], (instregex "LSL(16|32|64)rm")>;
// HWWriteResGroup88: 6 micro-ops, one cycle each on HWPort4 and HWPort237 plus
// four on HWPort0156; latency is raised from 4 to 5. Its InstRW bindings fall
// outside this excerpt.
def HWWriteResGroup88 : SchedWriteRes<[HWPort4,HWPort237,HWPort0156]> {
- let Latency = 4;
+ let Latency = 5;
let NumMicroOps = 6;
let ResourceCycles = [1,1,4];
}
def: InstRW<[HWWriteResGroup90], (instregex "VMULSSrr")>;
// HWWriteResGroup91: 2 micro-ops, one cycle each on HWPort0 and HWPort23;
// latency is raised from 5 to 10. Only the MMX_PMULLWirm, MMX_PMULUDQirm,
// MMX_PSADBWirm, RCPSSm, RSQRTSSm, VRCPSSm and VRSQRTSSm bindings stay; every
// other binding is removed from this class.
def HWWriteResGroup91 : SchedWriteRes<[HWPort0,HWPort23]> {
- let Latency = 5;
+ let Latency = 10;
let NumMicroOps = 2;
let ResourceCycles = [1,1];
}
def: InstRW<[HWWriteResGroup91], (instregex "MMX_PMULLWirm")>;
def: InstRW<[HWWriteResGroup91], (instregex "MMX_PMULUDQirm")>;
def: InstRW<[HWWriteResGroup91], (instregex "MMX_PSADBWirm")>;
-def: InstRW<[HWWriteResGroup91], (instregex "MUL_F32m")>;
-def: InstRW<[HWWriteResGroup91], (instregex "MUL_F64m")>;
-def: InstRW<[HWWriteResGroup91], (instregex "PCMPGTQrm")>;
-def: InstRW<[HWWriteResGroup91], (instregex "PHMINPOSUWrm128")>;
-def: InstRW<[HWWriteResGroup91], (instregex "PMADDUBSWrm")>;
-def: InstRW<[HWWriteResGroup91], (instregex "PMADDWDrm")>;
-def: InstRW<[HWWriteResGroup91], (instregex "PMULDQrm")>;
-def: InstRW<[HWWriteResGroup91], (instregex "PMULHRSWrm")>;
-def: InstRW<[HWWriteResGroup91], (instregex "PMULHUWrm")>;
-def: InstRW<[HWWriteResGroup91], (instregex "PMULHWrm")>;
-def: InstRW<[HWWriteResGroup91], (instregex "PMULLWrm")>;
-def: InstRW<[HWWriteResGroup91], (instregex "PMULUDQrm")>;
-def: InstRW<[HWWriteResGroup91], (instregex "PSADBWrm")>;
-def: InstRW<[HWWriteResGroup91], (instregex "RCPPSm")>;
def: InstRW<[HWWriteResGroup91], (instregex "RCPSSm")>;
-def: InstRW<[HWWriteResGroup91], (instregex "RSQRTPSm")>;
def: InstRW<[HWWriteResGroup91], (instregex "RSQRTSSm")>;
-def: InstRW<[HWWriteResGroup91], (instregex "VPCMPGTQYrm")>;
-def: InstRW<[HWWriteResGroup91], (instregex "VPCMPGTQrm")>;
-def: InstRW<[HWWriteResGroup91], (instregex "VPHMINPOSUWrm128")>;
-def: InstRW<[HWWriteResGroup91], (instregex "VPMADDUBSWYrm")>;
-def: InstRW<[HWWriteResGroup91], (instregex "VPMADDUBSWrm")>;
-def: InstRW<[HWWriteResGroup91], (instregex "VPMADDWDYrm")>;
-def: InstRW<[HWWriteResGroup91], (instregex "VPMADDWDrm")>;
-def: InstRW<[HWWriteResGroup91], (instregex "VPMULDQYrm")>;
-def: InstRW<[HWWriteResGroup91], (instregex "VPMULDQrm")>;
-def: InstRW<[HWWriteResGroup91], (instregex "VPMULHRSWYrm")>;
-def: InstRW<[HWWriteResGroup91], (instregex "VPMULHRSWrm")>;
-def: InstRW<[HWWriteResGroup91], (instregex "VPMULHUWYrm")>;
-def: InstRW<[HWWriteResGroup91], (instregex "VPMULHUWrm")>;
-def: InstRW<[HWWriteResGroup91], (instregex "VPMULHWYrm")>;
-def: InstRW<[HWWriteResGroup91], (instregex "VPMULHWrm")>;
-def: InstRW<[HWWriteResGroup91], (instregex "VPMULLWYrm")>;
-def: InstRW<[HWWriteResGroup91], (instregex "VPMULLWrm")>;
-def: InstRW<[HWWriteResGroup91], (instregex "VPMULUDQYrm")>;
-def: InstRW<[HWWriteResGroup91], (instregex "VPMULUDQrm")>;
-def: InstRW<[HWWriteResGroup91], (instregex "VPSADBWYrm")>;
-def: InstRW<[HWWriteResGroup91], (instregex "VPSADBWrm")>;
-def: InstRW<[HWWriteResGroup91], (instregex "VRCPPSm")>;
def: InstRW<[HWWriteResGroup91], (instregex "VRCPSSm")>;
-def: InstRW<[HWWriteResGroup91], (instregex "VRSQRTPSm")>;
def: InstRW<[HWWriteResGroup91], (instregex "VRSQRTSSm")>;
// HWWriteResGroup91_1: new class with the same ports, micro-op count and
// resource cycles as HWWriteResGroup91 but latency 18; bound to SQRTSSm and
// VDIVSSrm.
+def HWWriteResGroup91_1 : SchedWriteRes<[HWPort0,HWPort23]> {
+ let Latency = 18;
+ let NumMicroOps = 2;
+ let ResourceCycles = [1,1];
+}
+def: InstRW<[HWWriteResGroup91_1], (instregex "SQRTSSm")>;
+def: InstRW<[HWWriteResGroup91_1], (instregex "VDIVSSrm")>;
+
// HWWriteResGroup91_2: new class with the same ports, micro-op count and
// resource cycles as HWWriteResGroup91 but latency 11. It is bound to the
// non-Y integer multiply / PSADBW / PCMPGTQ / PHMINPOSUW memory-operand names
// listed below and to the packed RCPPS/RSQRTPS ones.
+def HWWriteResGroup91_2 : SchedWriteRes<[HWPort0,HWPort23]> {
+ let Latency = 11;
+ let NumMicroOps = 2;
+ let ResourceCycles = [1,1];
+}
+def: InstRW<[HWWriteResGroup91_2], (instregex "PCMPGTQrm")>;
+def: InstRW<[HWWriteResGroup91_2], (instregex "PHMINPOSUWrm128")>;
+def: InstRW<[HWWriteResGroup91_2], (instregex "PMADDUBSWrm")>;
+def: InstRW<[HWWriteResGroup91_2], (instregex "PMADDWDrm")>;
+def: InstRW<[HWWriteResGroup91_2], (instregex "PMULDQrm")>;
+def: InstRW<[HWWriteResGroup91_2], (instregex "PMULHRSWrm")>;
+def: InstRW<[HWWriteResGroup91_2], (instregex "PMULHUWrm")>;
+def: InstRW<[HWWriteResGroup91_2], (instregex "PMULHWrm")>;
+def: InstRW<[HWWriteResGroup91_2], (instregex "PMULLWrm")>;
+def: InstRW<[HWWriteResGroup91_2], (instregex "PMULUDQrm")>;
+def: InstRW<[HWWriteResGroup91_2], (instregex "PSADBWrm")>;
+def: InstRW<[HWWriteResGroup91_2], (instregex "RCPPSm")>;
+def: InstRW<[HWWriteResGroup91_2], (instregex "RSQRTPSm")>;
+def: InstRW<[HWWriteResGroup91_2], (instregex "VPCMPGTQrm")>;
+def: InstRW<[HWWriteResGroup91_2], (instregex "VPHMINPOSUWrm128")>;
+def: InstRW<[HWWriteResGroup91_2], (instregex "VPMADDUBSWrm")>;
+def: InstRW<[HWWriteResGroup91_2], (instregex "VPMADDWDrm")>;
+def: InstRW<[HWWriteResGroup91_2], (instregex "VPMULDQrm")>;
+def: InstRW<[HWWriteResGroup91_2], (instregex "VPMULHRSWrm")>;
+def: InstRW<[HWWriteResGroup91_2], (instregex "VPMULHUWrm")>;
+def: InstRW<[HWWriteResGroup91_2], (instregex "VPMULHWrm")>;
+def: InstRW<[HWWriteResGroup91_2], (instregex "VPMULLWrm")>;
+def: InstRW<[HWWriteResGroup91_2], (instregex "VPMULUDQrm")>;
+def: InstRW<[HWWriteResGroup91_2], (instregex "VPSADBWrm")>;
+def: InstRW<[HWWriteResGroup91_2], (instregex "VRCPPSm")>;
+def: InstRW<[HWWriteResGroup91_2], (instregex "VRSQRTPSm")>;
+
// HWWriteResGroup91_3: new class with the same ports, micro-op count and
// resource cycles as HWWriteResGroup91 but latency 12. It is bound to
// MUL_F32m/MUL_F64m and to the Y-suffixed counterparts of the integer
// multiply / PSADBW / PCMPGTQ names.
+def HWWriteResGroup91_3 : SchedWriteRes<[HWPort0,HWPort23]> {
+ let Latency = 12;
+ let NumMicroOps = 2;
+ let ResourceCycles = [1,1];
+}
+def: InstRW<[HWWriteResGroup91_3], (instregex "MUL_F32m")>;
+def: InstRW<[HWWriteResGroup91_3], (instregex "MUL_F64m")>;
+def: InstRW<[HWWriteResGroup91_3], (instregex "VPCMPGTQYrm")>;
+def: InstRW<[HWWriteResGroup91_3], (instregex "VPMADDUBSWYrm")>;
+def: InstRW<[HWWriteResGroup91_3], (instregex "VPMADDWDYrm")>;
+def: InstRW<[HWWriteResGroup91_3], (instregex "VPMULDQYrm")>;
+def: InstRW<[HWWriteResGroup91_3], (instregex "VPMULHRSWYrm")>;
+def: InstRW<[HWWriteResGroup91_3], (instregex "VPMULHUWYrm")>;
+def: InstRW<[HWWriteResGroup91_3], (instregex "VPMULHWYrm")>;
+def: InstRW<[HWWriteResGroup91_3], (instregex "VPMULLWYrm")>;
+def: InstRW<[HWWriteResGroup91_3], (instregex "VPMULUDQYrm")>;
+def: InstRW<[HWWriteResGroup91_3], (instregex "VPSADBWYrm")>;
+
+
// HWWriteResGroup92: 2 micro-ops, one cycle each on HWPort01 and HWPort23;
// latency is raised from 5 to 11. The non-Y packed (PD/PS) multiply and FMA
// memory-operand bindings stay; every Y-suffixed and every scalar (SD/SS)
// binding is removed from this class.
def HWWriteResGroup92 : SchedWriteRes<[HWPort01,HWPort23]> {
- let Latency = 5;
+ let Latency = 11;
let NumMicroOps = 2;
let ResourceCycles = [1,1];
}
def: InstRW<[HWWriteResGroup92], (instregex "MULPDrm")>;
def: InstRW<[HWWriteResGroup92], (instregex "MULPSrm")>;
-def: InstRW<[HWWriteResGroup92], (instregex "MULSDrm")>;
-def: InstRW<[HWWriteResGroup92], (instregex "MULSSrm")>;
-def: InstRW<[HWWriteResGroup92], (instregex "VFMADD132PDYm")>;
def: InstRW<[HWWriteResGroup92], (instregex "VFMADD132PDm")>;
-def: InstRW<[HWWriteResGroup92], (instregex "VFMADD132PSYm")>;
def: InstRW<[HWWriteResGroup92], (instregex "VFMADD132PSm")>;
-def: InstRW<[HWWriteResGroup92], (instregex "VFMADD132SDm")>;
-def: InstRW<[HWWriteResGroup92], (instregex "VFMADD132SSm")>;
-def: InstRW<[HWWriteResGroup92], (instregex "VFMADD213PDYm")>;
def: InstRW<[HWWriteResGroup92], (instregex "VFMADD213PDm")>;
-def: InstRW<[HWWriteResGroup92], (instregex "VFMADD213PSYm")>;
def: InstRW<[HWWriteResGroup92], (instregex "VFMADD213PSm")>;
-def: InstRW<[HWWriteResGroup92], (instregex "VFMADD213SDm")>;
-def: InstRW<[HWWriteResGroup92], (instregex "VFMADD213SSm")>;
-def: InstRW<[HWWriteResGroup92], (instregex "VFMADD231PDYm")>;
def: InstRW<[HWWriteResGroup92], (instregex "VFMADD231PDm")>;
-def: InstRW<[HWWriteResGroup92], (instregex "VFMADD231PSYm")>;
def: InstRW<[HWWriteResGroup92], (instregex "VFMADD231PSm")>;
-def: InstRW<[HWWriteResGroup92], (instregex "VFMADD231SDm")>;
-def: InstRW<[HWWriteResGroup92], (instregex "VFMADD231SSm")>;
-def: InstRW<[HWWriteResGroup92], (instregex "VFMADDSUB132PDYm")>;
def: InstRW<[HWWriteResGroup92], (instregex "VFMADDSUB132PDm")>;
-def: InstRW<[HWWriteResGroup92], (instregex "VFMADDSUB132PSYm")>;
def: InstRW<[HWWriteResGroup92], (instregex "VFMADDSUB132PSm")>;
-def: InstRW<[HWWriteResGroup92], (instregex "VFMADDSUB213PDYm")>;
def: InstRW<[HWWriteResGroup92], (instregex "VFMADDSUB213PDm")>;
-def: InstRW<[HWWriteResGroup92], (instregex "VFMADDSUB213PSYm")>;
def: InstRW<[HWWriteResGroup92], (instregex "VFMADDSUB213PSm")>;
-def: InstRW<[HWWriteResGroup92], (instregex "VFMADDSUB231PDYm")>;
def: InstRW<[HWWriteResGroup92], (instregex "VFMADDSUB231PDm")>;
-def: InstRW<[HWWriteResGroup92], (instregex "VFMADDSUB231PSYm")>;
def: InstRW<[HWWriteResGroup92], (instregex "VFMADDSUB231PSm")>;
-def: InstRW<[HWWriteResGroup92], (instregex "VFMSUB132PDYm")>;
def: InstRW<[HWWriteResGroup92], (instregex "VFMSUB132PDm")>;
-def: InstRW<[HWWriteResGroup92], (instregex "VFMSUB132PSYm")>;
def: InstRW<[HWWriteResGroup92], (instregex "VFMSUB132PSm")>;
-def: InstRW<[HWWriteResGroup92], (instregex "VFMSUB132SDm")>;
-def: InstRW<[HWWriteResGroup92], (instregex "VFMSUB132SSm")>;
-def: InstRW<[HWWriteResGroup92], (instregex "VFMSUB213PDYm")>;
def: InstRW<[HWWriteResGroup92], (instregex "VFMSUB213PDm")>;
-def: InstRW<[HWWriteResGroup92], (instregex "VFMSUB213PSYm")>;
def: InstRW<[HWWriteResGroup92], (instregex "VFMSUB213PSm")>;
-def: InstRW<[HWWriteResGroup92], (instregex "VFMSUB213SDm")>;
-def: InstRW<[HWWriteResGroup92], (instregex "VFMSUB213SSm")>;
-def: InstRW<[HWWriteResGroup92], (instregex "VFMSUB231PDYm")>;
def: InstRW<[HWWriteResGroup92], (instregex "VFMSUB231PDm")>;
-def: InstRW<[HWWriteResGroup92], (instregex "VFMSUB231PSYm")>;
def: InstRW<[HWWriteResGroup92], (instregex "VFMSUB231PSm")>;
-def: InstRW<[HWWriteResGroup92], (instregex "VFMSUB231SDm")>;
-def: InstRW<[HWWriteResGroup92], (instregex "VFMSUB231SSm")>;
-def: InstRW<[HWWriteResGroup92], (instregex "VFMSUBADD132PDYm")>;
def: InstRW<[HWWriteResGroup92], (instregex "VFMSUBADD132PDm")>;
-def: InstRW<[HWWriteResGroup92], (instregex "VFMSUBADD132PSYm")>;
def: InstRW<[HWWriteResGroup92], (instregex "VFMSUBADD132PSm")>;
-def: InstRW<[HWWriteResGroup92], (instregex "VFMSUBADD213PDYm")>;
def: InstRW<[HWWriteResGroup92], (instregex "VFMSUBADD213PDm")>;
-def: InstRW<[HWWriteResGroup92], (instregex "VFMSUBADD213PSYm")>;
def: InstRW<[HWWriteResGroup92], (instregex "VFMSUBADD213PSm")>;
-def: InstRW<[HWWriteResGroup92], (instregex "VFMSUBADD231PDYm")>;
def: InstRW<[HWWriteResGroup92], (instregex "VFMSUBADD231PDm")>;
-def: InstRW<[HWWriteResGroup92], (instregex "VFMSUBADD231PSYm")>;
def: InstRW<[HWWriteResGroup92], (instregex "VFMSUBADD231PSm")>;
-def: InstRW<[HWWriteResGroup92], (instregex "VFNMADD132PDYm")>;
def: InstRW<[HWWriteResGroup92], (instregex "VFNMADD132PDm")>;
-def: InstRW<[HWWriteResGroup92], (instregex "VFNMADD132PSYm")>;
def: InstRW<[HWWriteResGroup92], (instregex "VFNMADD132PSm")>;
-def: InstRW<[HWWriteResGroup92], (instregex "VFNMADD132SDm")>;
-def: InstRW<[HWWriteResGroup92], (instregex "VFNMADD132SSm")>;
-def: InstRW<[HWWriteResGroup92], (instregex "VFNMADD213PDYm")>;
def: InstRW<[HWWriteResGroup92], (instregex "VFNMADD213PDm")>;
-def: InstRW<[HWWriteResGroup92], (instregex "VFNMADD213PSYm")>;
def: InstRW<[HWWriteResGroup92], (instregex "VFNMADD213PSm")>;
-def: InstRW<[HWWriteResGroup92], (instregex "VFNMADD213SDm")>;
-def: InstRW<[HWWriteResGroup92], (instregex "VFNMADD213SSm")>;
-def: InstRW<[HWWriteResGroup92], (instregex "VFNMADD231PDYm")>;
def: InstRW<[HWWriteResGroup92], (instregex "VFNMADD231PDm")>;
-def: InstRW<[HWWriteResGroup92], (instregex "VFNMADD231PSYm")>;
def: InstRW<[HWWriteResGroup92], (instregex "VFNMADD231PSm")>;
-def: InstRW<[HWWriteResGroup92], (instregex "VFNMADD231SDm")>;
-def: InstRW<[HWWriteResGroup92], (instregex "VFNMADD231SSm")>;
-def: InstRW<[HWWriteResGroup92], (instregex "VFNMSUB132PDYm")>;
def: InstRW<[HWWriteResGroup92], (instregex "VFNMSUB132PDm")>;
-def: InstRW<[HWWriteResGroup92], (instregex "VFNMSUB132PSYm")>;
def: InstRW<[HWWriteResGroup92], (instregex "VFNMSUB132PSm")>;
-def: InstRW<[HWWriteResGroup92], (instregex "VFNMSUB132SDm")>;
-def: InstRW<[HWWriteResGroup92], (instregex "VFNMSUB132SSm")>;
-def: InstRW<[HWWriteResGroup92], (instregex "VFNMSUB213PDYm")>;
def: InstRW<[HWWriteResGroup92], (instregex "VFNMSUB213PDm")>;
-def: InstRW<[HWWriteResGroup92], (instregex "VFNMSUB213PSYm")>;
def: InstRW<[HWWriteResGroup92], (instregex "VFNMSUB213PSm")>;
-def: InstRW<[HWWriteResGroup92], (instregex "VFNMSUB213SDm")>;
-def: InstRW<[HWWriteResGroup92], (instregex "VFNMSUB213SSm")>;
-def: InstRW<[HWWriteResGroup92], (instregex "VFNMSUB231PDYm")>;
def: InstRW<[HWWriteResGroup92], (instregex "VFNMSUB231PDm")>;
-def: InstRW<[HWWriteResGroup92], (instregex "VFNMSUB231PSYm")>;
def: InstRW<[HWWriteResGroup92], (instregex "VFNMSUB231PSm")>;
-def: InstRW<[HWWriteResGroup92], (instregex "VFNMSUB231SDm")>;
-def: InstRW<[HWWriteResGroup92], (instregex "VFNMSUB231SSm")>;
-def: InstRW<[HWWriteResGroup92], (instregex "VMULPDYrm")>;
def: InstRW<[HWWriteResGroup92], (instregex "VMULPDrm")>;
-def: InstRW<[HWWriteResGroup92], (instregex "VMULPSYrm")>;
def: InstRW<[HWWriteResGroup92], (instregex "VMULPSrm")>;
-def: InstRW<[HWWriteResGroup92], (instregex "VMULSDrm")>;
-def: InstRW<[HWWriteResGroup92], (instregex "VMULSSrm")>;
+
// HWWriteResGroup92_1: new class with the same ports, micro-op count and
// resource cycles as HWWriteResGroup92 but latency 12. It is bound to the
// Y-suffixed FMA and VMULPD/VMULPS memory-operand names.
+def HWWriteResGroup92_1 : SchedWriteRes<[HWPort01,HWPort23]> {
+ let Latency = 12;
+ let NumMicroOps = 2;
+ let ResourceCycles = [1,1];
+}
+def: InstRW<[HWWriteResGroup92_1], (instregex "VFMADD132PDYm")>;
+def: InstRW<[HWWriteResGroup92_1], (instregex "VFMADD132PSYm")>;
+def: InstRW<[HWWriteResGroup92_1], (instregex "VFMADD213PDYm")>;
+def: InstRW<[HWWriteResGroup92_1], (instregex "VFMADD213PSYm")>;
+def: InstRW<[HWWriteResGroup92_1], (instregex "VFMADD231PDYm")>;
+def: InstRW<[HWWriteResGroup92_1], (instregex "VFMADD231PSYm")>;
+def: InstRW<[HWWriteResGroup92_1], (instregex "VFMADDSUB132PDYm")>;
+def: InstRW<[HWWriteResGroup92_1], (instregex "VFMADDSUB132PSYm")>;
+def: InstRW<[HWWriteResGroup92_1], (instregex "VFMADDSUB213PDYm")>;
+def: InstRW<[HWWriteResGroup92_1], (instregex "VFMADDSUB213PSYm")>;
+def: InstRW<[HWWriteResGroup92_1], (instregex "VFMADDSUB231PDYm")>;
+def: InstRW<[HWWriteResGroup92_1], (instregex "VFMADDSUB231PSYm")>;
+def: InstRW<[HWWriteResGroup92_1], (instregex "VFMSUB132PDYm")>;
+def: InstRW<[HWWriteResGroup92_1], (instregex "VFMSUB132PSYm")>;
+def: InstRW<[HWWriteResGroup92_1], (instregex "VFMSUB213PDYm")>;
+def: InstRW<[HWWriteResGroup92_1], (instregex "VFMSUB213PSYm")>;
+def: InstRW<[HWWriteResGroup92_1], (instregex "VFMSUB231PDYm")>;
+def: InstRW<[HWWriteResGroup92_1], (instregex "VFMSUB231PSYm")>;
+def: InstRW<[HWWriteResGroup92_1], (instregex "VFMSUBADD132PDYm")>;
+def: InstRW<[HWWriteResGroup92_1], (instregex "VFMSUBADD132PSYm")>;
+def: InstRW<[HWWriteResGroup92_1], (instregex "VFMSUBADD213PDYm")>;
+def: InstRW<[HWWriteResGroup92_1], (instregex "VFMSUBADD213PSYm")>;
+def: InstRW<[HWWriteResGroup92_1], (instregex "VFMSUBADD231PDYm")>;
+def: InstRW<[HWWriteResGroup92_1], (instregex "VFMSUBADD231PSYm")>;
+def: InstRW<[HWWriteResGroup92_1], (instregex "VFNMADD132PDYm")>;
+def: InstRW<[HWWriteResGroup92_1], (instregex "VFNMADD132PSYm")>;
+def: InstRW<[HWWriteResGroup92_1], (instregex "VFNMADD213PDYm")>;
+def: InstRW<[HWWriteResGroup92_1], (instregex "VFNMADD213PSYm")>;
+def: InstRW<[HWWriteResGroup92_1], (instregex "VFNMADD231PDYm")>;
+def: InstRW<[HWWriteResGroup92_1], (instregex "VFNMADD231PSYm")>;
+def: InstRW<[HWWriteResGroup92_1], (instregex "VFNMSUB132PDYm")>;
+def: InstRW<[HWWriteResGroup92_1], (instregex "VFNMSUB132PSYm")>;
+def: InstRW<[HWWriteResGroup92_1], (instregex "VFNMSUB213PDYm")>;
+def: InstRW<[HWWriteResGroup92_1], (instregex "VFNMSUB213PSYm")>;
+def: InstRW<[HWWriteResGroup92_1], (instregex "VFNMSUB231PDYm")>;
+def: InstRW<[HWWriteResGroup92_1], (instregex "VFNMSUB231PSYm")>;
+def: InstRW<[HWWriteResGroup92_1], (instregex "VMULPDYrm")>;
+def: InstRW<[HWWriteResGroup92_1], (instregex "VMULPSYrm")>;
+
// HWWriteResGroup92_2: new class with the same ports, micro-op count and
// resource cycles as HWWriteResGroup92 but latency 10. It is bound to the
// scalar (SD/SS) multiply and FMA memory-operand names.
+def HWWriteResGroup92_2 : SchedWriteRes<[HWPort01,HWPort23]> {
+ let Latency = 10;
+ let NumMicroOps = 2;
+ let ResourceCycles = [1,1];
+}
+def: InstRW<[HWWriteResGroup92_2], (instregex "MULSDrm")>;
+def: InstRW<[HWWriteResGroup92_2], (instregex "MULSSrm")>;
+def: InstRW<[HWWriteResGroup92_2], (instregex "VFMADD132SDm")>;
+def: InstRW<[HWWriteResGroup92_2], (instregex "VFMADD132SSm")>;
+def: InstRW<[HWWriteResGroup92_2], (instregex "VFMADD213SDm")>;
+def: InstRW<[HWWriteResGroup92_2], (instregex "VFMADD213SSm")>;
+def: InstRW<[HWWriteResGroup92_2], (instregex "VFMADD231SDm")>;
+def: InstRW<[HWWriteResGroup92_2], (instregex "VFMADD231SSm")>;
+def: InstRW<[HWWriteResGroup92_2], (instregex "VFMSUB132SDm")>;
+def: InstRW<[HWWriteResGroup92_2], (instregex "VFMSUB132SSm")>;
+def: InstRW<[HWWriteResGroup92_2], (instregex "VFMSUB213SDm")>;
+def: InstRW<[HWWriteResGroup92_2], (instregex "VFMSUB213SSm")>;
+def: InstRW<[HWWriteResGroup92_2], (instregex "VFMSUB231SDm")>;
+def: InstRW<[HWWriteResGroup92_2], (instregex "VFMSUB231SSm")>;
+def: InstRW<[HWWriteResGroup92_2], (instregex "VFNMADD132SDm")>;
+def: InstRW<[HWWriteResGroup92_2], (instregex "VFNMADD132SSm")>;
+def: InstRW<[HWWriteResGroup92_2], (instregex "VFNMADD213SDm")>;
+def: InstRW<[HWWriteResGroup92_2], (instregex "VFNMADD213SSm")>;
+def: InstRW<[HWWriteResGroup92_2], (instregex "VFNMADD231SDm")>;
+def: InstRW<[HWWriteResGroup92_2], (instregex "VFNMADD231SSm")>;
+def: InstRW<[HWWriteResGroup92_2], (instregex "VFNMSUB132SDm")>;
+def: InstRW<[HWWriteResGroup92_2], (instregex "VFNMSUB132SSm")>;
+def: InstRW<[HWWriteResGroup92_2], (instregex "VFNMSUB213SDm")>;
+def: InstRW<[HWWriteResGroup92_2], (instregex "VFNMSUB213SSm")>;
+def: InstRW<[HWWriteResGroup92_2], (instregex "VFNMSUB231SDm")>;
+def: InstRW<[HWWriteResGroup92_2], (instregex "VFNMSUB231SSm")>;
+def: InstRW<[HWWriteResGroup92_2], (instregex "VMULSDrm")>;
+def: InstRW<[HWWriteResGroup92_2], (instregex "VMULSSrm")>;
def HWWriteResGroup93 : SchedWriteRes<[HWPort1,HWPort5]> {
let Latency = 5;
def: InstRW<[HWWriteResGroup95], (instregex "MULX32rr")>;
// HWWriteResGroup96: 4 micro-ops, two cycles on HWPort5 and one each on HWPort1
// and HWPort23; latency is raised from 5 to 11. The non-Y horizontal add/sub
// bindings stay; the Y-suffixed VHADD*/VHSUB* bindings are removed.
def HWWriteResGroup96 : SchedWriteRes<[HWPort1,HWPort5,HWPort23]> {
- let Latency = 5;
+ let Latency = 11;
let NumMicroOps = 4;
let ResourceCycles = [1,2,1];
}
def: InstRW<[HWWriteResGroup96], (instregex "HADDPSrm")>;
def: InstRW<[HWWriteResGroup96], (instregex "HSUBPDrm")>;
def: InstRW<[HWWriteResGroup96], (instregex "HSUBPSrm")>;
-def: InstRW<[HWWriteResGroup96], (instregex "VHADDPDYrm")>;
def: InstRW<[HWWriteResGroup96], (instregex "VHADDPDrm")>;
-def: InstRW<[HWWriteResGroup96], (instregex "VHADDPSYrm")>;
def: InstRW<[HWWriteResGroup96], (instregex "VHADDPSrm")>;
-def: InstRW<[HWWriteResGroup96], (instregex "VHSUBPDYrm")>;
def: InstRW<[HWWriteResGroup96], (instregex "VHSUBPDrm")>;
-def: InstRW<[HWWriteResGroup96], (instregex "VHSUBPSYrm")>;
def: InstRW<[HWWriteResGroup96], (instregex "VHSUBPSrm")>;
// HWWriteResGroup96_1: new class with the same ports, micro-op count and
// resource cycles as HWWriteResGroup96 but latency 12. It is bound to the
// Y-suffixed VHADD*/VHSUB* names.
+def HWWriteResGroup96_1 : SchedWriteRes<[HWPort1,HWPort5,HWPort23]> {
+ let Latency = 12;
+ let NumMicroOps = 4;
+ let ResourceCycles = [1,2,1];
+}
+def: InstRW<[HWWriteResGroup96_1], (instregex "VHADDPDYrm")>;
+def: InstRW<[HWWriteResGroup96_1], (instregex "VHADDPSYrm")>;
+def: InstRW<[HWWriteResGroup96_1], (instregex "VHSUBPDYrm")>;
+def: InstRW<[HWWriteResGroup96_1], (instregex "VHSUBPSYrm")>;
+
// HWWriteResGroup97 (bound to CVTTSS2SI64rm): 4 micro-ops, one cycle each on
// HWPort0, HWPort1, HWPort5 and HWPort23; latency is raised from 5 to 10.
def HWWriteResGroup97 : SchedWriteRes<[HWPort0,HWPort1,HWPort5,HWPort23]> {
- let Latency = 5;
+ let Latency = 10;
let NumMicroOps = 4;
let ResourceCycles = [1,1,1,1];
}
def: InstRW<[HWWriteResGroup97], (instregex "CVTTSS2SI64rm")>;
// HWWriteResGroup98: 4 micro-ops, one cycle each on HWPort1, HWPort23, HWPort06
// and HWPort0156; latency is raised from 5 to 10. Its InstRW bindings fall
// outside this excerpt.
def HWWriteResGroup98 : SchedWriteRes<[HWPort1,HWPort23,HWPort06,HWPort0156]> {
- let Latency = 5;
+ let Latency = 10;
let NumMicroOps = 4;
let ResourceCycles = [1,1,1,1];
}
}
def: InstRW<[HWWriteResGroup101], (instregex "CMPXCHG(16|32|64)rr")>;
def: InstRW<[HWWriteResGroup101], (instregex "CMPXCHG8rr")>;
-def: InstRW<[HWWriteResGroup101], (instregex "ROUNDPDr")>;
-def: InstRW<[HWWriteResGroup101], (instregex "ROUNDPSr")>;
-def: InstRW<[HWWriteResGroup101], (instregex "ROUNDSDr")>;
-def: InstRW<[HWWriteResGroup101], (instregex "ROUNDSSr")>;
-def: InstRW<[HWWriteResGroup101], (instregex "VROUNDPDr")>;
-def: InstRW<[HWWriteResGroup101], (instregex "VROUNDPSr")>;
-def: InstRW<[HWWriteResGroup101], (instregex "VROUNDSDr")>;
-def: InstRW<[HWWriteResGroup101], (instregex "VROUNDSSr")>;
-def: InstRW<[HWWriteResGroup101], (instregex "VROUNDYPDr")>;
-def: InstRW<[HWWriteResGroup101], (instregex "VROUNDYPSr")>;
def HWWriteResGroup102 : SchedWriteRes<[HWPort1,HWPort5]> {
let Latency = 6;
def: InstRW<[HWWriteResGroup102], (instregex "VCVTTPD2DQYrr")>;
// HWWriteResGroup103: 3 micro-ops, two cycles on HWPort1 and one on HWPort23;
// latency is raised from 6 to 13. The *_FI16m/*_FI32m and VROUNDYPDm/VROUNDYPSm
// bindings stay; the ROUND*m and non-Y VROUND*m bindings are removed.
def HWWriteResGroup103 : SchedWriteRes<[HWPort1,HWPort23]> {
- let Latency = 6;
+ let Latency = 13;
let NumMicroOps = 3;
let ResourceCycles = [2,1];
}
def: InstRW<[HWWriteResGroup103], (instregex "ADD_FI16m")>;
def: InstRW<[HWWriteResGroup103], (instregex "ADD_FI32m")>;
-def: InstRW<[HWWriteResGroup103], (instregex "ROUNDPDm")>;
-def: InstRW<[HWWriteResGroup103], (instregex "ROUNDPSm")>;
-def: InstRW<[HWWriteResGroup103], (instregex "ROUNDSDm")>;
-def: InstRW<[HWWriteResGroup103], (instregex "ROUNDSSm")>;
def: InstRW<[HWWriteResGroup103], (instregex "SUBR_FI16m")>;
def: InstRW<[HWWriteResGroup103], (instregex "SUBR_FI32m")>;
def: InstRW<[HWWriteResGroup103], (instregex "SUB_FI16m")>;
def: InstRW<[HWWriteResGroup103], (instregex "SUB_FI32m")>;
-def: InstRW<[HWWriteResGroup103], (instregex "VROUNDPDm")>;
-def: InstRW<[HWWriteResGroup103], (instregex "VROUNDPSm")>;
-def: InstRW<[HWWriteResGroup103], (instregex "VROUNDSDm")>;
-def: InstRW<[HWWriteResGroup103], (instregex "VROUNDSSm")>;
def: InstRW<[HWWriteResGroup103], (instregex "VROUNDYPDm")>;
def: InstRW<[HWWriteResGroup103], (instregex "VROUNDYPSm")>;
// HWWriteResGroup103_1: new class with the same ports, micro-op count and
// resource cycles as HWWriteResGroup103 but latency 12. It is bound to the
// ROUND*m and non-Y VROUND*m names.
+def HWWriteResGroup103_1 : SchedWriteRes<[HWPort1,HWPort23]> {
+ let Latency = 12;
+ let NumMicroOps = 3;
+ let ResourceCycles = [2,1];
+}
+def: InstRW<[HWWriteResGroup103_1], (instregex "ROUNDPDm")>;
+def: InstRW<[HWWriteResGroup103_1], (instregex "ROUNDPSm")>;
+def: InstRW<[HWWriteResGroup103_1], (instregex "ROUNDSDm")>;
+def: InstRW<[HWWriteResGroup103_1], (instregex "ROUNDSSm")>;
+def: InstRW<[HWWriteResGroup103_1], (instregex "VROUNDPDm")>;
+def: InstRW<[HWWriteResGroup103_1], (instregex "VROUNDPSm")>;
+def: InstRW<[HWWriteResGroup103_1], (instregex "VROUNDSDm")>;
+def: InstRW<[HWWriteResGroup103_1], (instregex "VROUNDSSm")>;
+
// HWWriteResGroup104: 3 micro-ops, one resource cycle each on HWPort1,
// HWPort5 and HWPort23. Latency becomes 12 (was 6).
def HWWriteResGroup104 : SchedWriteRes<[HWPort1,HWPort5,HWPort23]> {
- let Latency = 6;
+ let Latency = 12;
let NumMicroOps = 3;
let ResourceCycles = [1,1,1];
}
def: InstRW<[HWWriteResGroup105], (instregex "SHRD(16|32|64)rrCL")>;
// HWWriteResGroup106: 4 micro-ops, one resource cycle each on HWPort1,
// HWPort4, HWPort5 and HWPort237. Latency becomes 7 (was 6).
def HWWriteResGroup106 : SchedWriteRes<[HWPort1,HWPort4,HWPort5,HWPort237]> {
- let Latency = 6;
+ let Latency = 7;
let NumMicroOps = 4;
let ResourceCycles = [1,1,1,1];
}
def: InstRW<[HWWriteResGroup108], (instregex "STD")>;
// HWWriteResGroup109: 6 micro-ops spread over five port groups (the last,
// HWPort0156, takes two cycles). Latency becomes 12 (was 6).
def HWWriteResGroup109 : SchedWriteRes<[HWPort1,HWPort23,HWPort237,HWPort06,HWPort0156]> {
- let Latency = 6;
+ let Latency = 12;
let NumMicroOps = 6;
let ResourceCycles = [1,1,1,1,2];
}
def: InstRW<[HWWriteResGroup110], (instregex "VAESENCrr")>;
// HWWriteResGroup111: 2 micro-ops, one resource cycle each on HWPort5 and
// HWPort23. Latency becomes 13 (was 7).
def HWWriteResGroup111 : SchedWriteRes<[HWPort5,HWPort23]> {
- let Latency = 7;
+ let Latency = 13;
let NumMicroOps = 2;
let ResourceCycles = [1,1];
}
def: InstRW<[HWWriteResGroup112], (instregex "VMPSADBWrri")>;
// HWWriteResGroup113: 4 micro-ops on HWPort0, HWPort5 (two cycles) and
// HWPort23. Latency becomes 13 (was 7). The VMPSADBWYrmi mapping is removed
// from this group; MPSADBWrmi and VMPSADBWrmi remain.
def HWWriteResGroup113 : SchedWriteRes<[HWPort0,HWPort5,HWPort23]> {
- let Latency = 7;
+ let Latency = 13;
let NumMicroOps = 4;
let ResourceCycles = [1,2,1];
}
def: InstRW<[HWWriteResGroup113], (instregex "MPSADBWrmi")>;
-def: InstRW<[HWWriteResGroup113], (instregex "VMPSADBWYrmi")>;
def: InstRW<[HWWriteResGroup113], (instregex "VMPSADBWrmi")>;
// HWWriteResGroup113_1: same ports and resource cycles as HWWriteResGroup113
// with latency 14; assigned to VMPSADBWYrmi.
+def HWWriteResGroup113_1 : SchedWriteRes<[HWPort0,HWPort5,HWPort23]> {
+ let Latency = 14;
+ let NumMicroOps = 4;
+ let ResourceCycles = [1,2,1];
+}
+def: InstRW<[HWWriteResGroup113_1], (instregex "VMPSADBWYrmi")>;
+
def HWWriteResGroup114 : SchedWriteRes<[HWPort6,HWPort06,HWPort15,HWPort0156]> {
let Latency = 7;
let NumMicroOps = 7;
def: InstRW<[HWWriteResGroup114], (instregex "LOOP")>;
// HWWriteResGroup115: 3 micro-ops, one resource cycle each on HWPort0,
// HWPort1 and HWPort23. Latency becomes 15 (was 8).
def HWWriteResGroup115 : SchedWriteRes<[HWPort0,HWPort1,HWPort23]> {
- let Latency = 8;
+ let Latency = 15;
let NumMicroOps = 3;
let ResourceCycles = [1,1,1];
}
def: InstRW<[HWWriteResGroup116], (instregex "VDPPDrri")>;
// HWWriteResGroup117: 4 micro-ops, one resource cycle each on HWPort0,
// HWPort1, HWPort5 and HWPort23. Latency becomes 15 (was 9).
def HWWriteResGroup117 : SchedWriteRes<[HWPort0,HWPort1,HWPort5,HWPort23]> {
- let Latency = 9;
+ let Latency = 15;
let NumMicroOps = 4;
let ResourceCycles = [1,1,1,1];
}
def: InstRW<[HWWriteResGroup118], (instregex "VPMULLDrr")>;
// HWWriteResGroup119: 3 micro-ops on HWPort0 (two cycles) and HWPort23.
// Latency becomes 16 (was 10). The VPMULLDYrm mapping is removed from this
// group; PMULLDrm and VPMULLDrm remain.
def HWWriteResGroup119 : SchedWriteRes<[HWPort0,HWPort23]> {
- let Latency = 10;
+ let Latency = 16;
let NumMicroOps = 3;
let ResourceCycles = [2,1];
}
def: InstRW<[HWWriteResGroup119], (instregex "PMULLDrm")>;
-def: InstRW<[HWWriteResGroup119], (instregex "VPMULLDYrm")>;
def: InstRW<[HWWriteResGroup119], (instregex "VPMULLDrm")>;
// HWWriteResGroup119_1: same ports and resource cycles as HWWriteResGroup119
// with latency 17; assigned to VPMULLDYrm.
+def HWWriteResGroup119_1 : SchedWriteRes<[HWPort0,HWPort23]> {
+ let Latency = 17;
+ let NumMicroOps = 3;
+ let ResourceCycles = [2,1];
+}
+def: InstRW<[HWWriteResGroup119_1], (instregex "VPMULLDYrm")>;
+
// HWWriteResGroup120: 10 micro-ops across six port groups; ResourceCycles
// entries pair positionally with the listed ports. Latency becomes 16 (was 10).
def HWWriteResGroup120 : SchedWriteRes<[HWPort1,HWPort23,HWPort237,HWPort06,HWPort15,HWPort0156]> {
- let Latency = 10;
+ let Latency = 16;
let NumMicroOps = 10;
let ResourceCycles = [1,1,1,4,1,2];
}
def: InstRW<[HWWriteResGroup121], (instregex "DIVSSrr")>;
// HWWriteResGroup122: 2 micro-ops, one resource cycle each on HWPort0 and
// HWPort23. Latency becomes 17 (was 11). The DIVSSrm mapping is removed from
// this group; DIVPSrm remains.
def HWWriteResGroup122 : SchedWriteRes<[HWPort0,HWPort23]> {
- let Latency = 11;
+ let Latency = 17;
let NumMicroOps = 2;
let ResourceCycles = [1,1];
}
def: InstRW<[HWWriteResGroup122], (instregex "DIVPSrm")>;
-def: InstRW<[HWWriteResGroup122], (instregex "DIVSSrm")>;
+
// HWWriteResGroup122_1: same ports and resource cycles as HWWriteResGroup122
// with latency 16; assigned to DIVSSrm.
+def HWWriteResGroup122_1 : SchedWriteRes<[HWPort0,HWPort23]> {
+ let Latency = 16;
+ let NumMicroOps = 2;
+ let ResourceCycles = [1,1];
+}
+def: InstRW<[HWWriteResGroup122_1], (instregex "DIVSSrm")>;
def HWWriteResGroup123 : SchedWriteRes<[HWPort0]> {
let Latency = 11;
def: InstRW<[HWWriteResGroup125], (instregex "VRSQRTPSYr")>;
// HWWriteResGroup126: 4 micro-ops on HWPort0 (three cycles) and HWPort23.
// Latency becomes 17 (was 11). The mapping visible here is VPCMPISTRM128rm.
def HWWriteResGroup126 : SchedWriteRes<[HWPort0,HWPort23]> {
- let Latency = 11;
+ let Latency = 17;
let NumMicroOps = 4;
let ResourceCycles = [3,1];
}
def: InstRW<[HWWriteResGroup126], (instregex "VPCMPISTRM128rm")>;
// HWWriteResGroup127: 4 micro-ops on HWPort0 (two cycles), HWPort5 and
// HWPort23. Latency becomes 17 (was 11). The mapping visible here is
// VPCLMULQDQrm.
def HWWriteResGroup127 : SchedWriteRes<[HWPort0,HWPort5,HWPort23]> {
- let Latency = 11;
+ let Latency = 17;
let NumMicroOps = 4;
let ResourceCycles = [2,1,1];
}
def: InstRW<[HWWriteResGroup127], (instregex "VPCLMULQDQrm")>;
// HWWriteResGroup128: 4 micro-ops on HWPort0 (two cycles), HWPort23 and
// HWPort015. Latency becomes 18 (was 11).
def HWWriteResGroup128 : SchedWriteRes<[HWPort0,HWPort23,HWPort015]> {
- let Latency = 11;
+ let Latency = 18;
let NumMicroOps = 4;
let ResourceCycles = [2,1,1];
}
def: InstRW<[HWWriteResGroup131], (instregex "LOOPNE")>;
// HWWriteResGroup132: 14 micro-ops across six port groups; ResourceCycles
// entries pair positionally with the listed ports. Latency becomes 17 (was 11).
def HWWriteResGroup132 : SchedWriteRes<[HWPort4,HWPort23,HWPort237,HWPort06,HWPort15,HWPort0156]> {
- let Latency = 11;
+ let Latency = 17;
let NumMicroOps = 14;
let ResourceCycles = [1,1,1,4,2,5];
}
def: InstRW<[HWWriteResGroup133], (instregex "VDIVSSrr")>;
// HWWriteResGroup134: 2 micro-ops, one resource cycle each on HWPort0 and
// HWPort23. Latency becomes 19 (was 13). DIVSDrm and VSQRTSSm are added to
// this group; SQRTPSm and VDIVPSrm remain.
// NOTE(review): SQRTSSm and VDIVSSrm are removed here and no replacement
// mapping is visible in this excerpt -- confirm they are assigned elsewhere.
def HWWriteResGroup134 : SchedWriteRes<[HWPort0,HWPort23]> {
- let Latency = 13;
+ let Latency = 19;
let NumMicroOps = 2;
let ResourceCycles = [1,1];
}
+def: InstRW<[HWWriteResGroup134], (instregex "DIVSDrm")>;
def: InstRW<[HWWriteResGroup134], (instregex "SQRTPSm")>;
-def: InstRW<[HWWriteResGroup134], (instregex "SQRTSSm")>;
def: InstRW<[HWWriteResGroup134], (instregex "VDIVPSrm")>;
-def: InstRW<[HWWriteResGroup134], (instregex "VDIVSSrm")>;
+def: InstRW<[HWWriteResGroup134], (instregex "VSQRTSSm")>;
// HWWriteResGroup135: 11 micro-ops across six port groups; ResourceCycles
// entries pair positionally with the listed ports. Latency becomes 19 (was 13).
def HWWriteResGroup135 : SchedWriteRes<[HWPort1,HWPort23,HWPort237,HWPort06,HWPort15,HWPort0156]> {
- let Latency = 13;
+ let Latency = 19;
let NumMicroOps = 11;
let ResourceCycles = [2,1,1,3,1,3];
}
def: InstRW<[HWWriteResGroup137], (instregex "VAESIMCrr")>;
// HWWriteResGroup138: 2 micro-ops, one resource cycle each on HWPort0 and
// HWPort23. Latency becomes 20 (was 14). The DIVSDrm and VSQRTSSm mappings
// are removed from this group; DIVPDrm and VSQRTPSm remain.
def HWWriteResGroup138 : SchedWriteRes<[HWPort0,HWPort23]> {
- let Latency = 14;
+ let Latency = 20;
let NumMicroOps = 2;
let ResourceCycles = [1,1];
}
def: InstRW<[HWWriteResGroup138], (instregex "DIVPDrm")>;
-def: InstRW<[HWWriteResGroup138], (instregex "DIVSDrm")>;
def: InstRW<[HWWriteResGroup138], (instregex "VSQRTPSm")>;
-def: InstRW<[HWWriteResGroup138], (instregex "VSQRTSSm")>;
// HWWriteResGroup139: 3 micro-ops on HWPort5 (two cycles) and HWPort23.
// Latency becomes 20 (was 14).
def HWWriteResGroup139 : SchedWriteRes<[HWPort5,HWPort23]> {
- let Latency = 14;
+ let Latency = 20;
let NumMicroOps = 3;
let ResourceCycles = [2,1];
}
def: InstRW<[HWWriteResGroup140], (instregex "VDPPSrri")>;
// HWWriteResGroup141: 5 micro-ops on HWPort0 (two cycles), HWPort1, HWPort5
// and HWPort23. Latency becomes 20 (was 14). The VDPPSYrmi mapping is removed
// from this group; DPPSrmi and VDPPSrmi remain.
def HWWriteResGroup141 : SchedWriteRes<[HWPort0,HWPort1,HWPort5,HWPort23]> {
- let Latency = 14;
+ let Latency = 20;
let NumMicroOps = 5;
let ResourceCycles = [2,1,1,1];
}
def: InstRW<[HWWriteResGroup141], (instregex "DPPSrmi")>;
-def: InstRW<[HWWriteResGroup141], (instregex "VDPPSYrmi")>;
def: InstRW<[HWWriteResGroup141], (instregex "VDPPSrmi")>;
// HWWriteResGroup141_1: same ports and resource cycles as HWWriteResGroup141
// with latency 21; assigned to VDPPSYrmi.
+def HWWriteResGroup141_1 : SchedWriteRes<[HWPort0,HWPort1,HWPort5,HWPort23]> {
+ let Latency = 21;
+ let NumMicroOps = 5;
+ let ResourceCycles = [2,1,1,1];
+}
+def: InstRW<[HWWriteResGroup141_1], (instregex "VDPPSYrmi")>;
+
def HWWriteResGroup142 : SchedWriteRes<[HWPort1,HWPort06,HWPort15,HWPort0156]> {
let Latency = 14;
let NumMicroOps = 10;
def: InstRW<[HWWriteResGroup142], (instregex "RCR8rCL")>;
// HWWriteResGroup143: 15 micro-ops, one cycle on HWPort23 and fourteen on
// HWPort0156. Latency becomes 19 (was 14). The mapping visible here is POPF16.
def HWWriteResGroup143 : SchedWriteRes<[HWPort23,HWPort0156]> {
- let Latency = 14;
+ let Latency = 19;
let NumMicroOps = 15;
let ResourceCycles = [1,14];
}
def: InstRW<[HWWriteResGroup143], (instregex "POPF16")>;
// HWWriteResGroup144: 8 micro-ops across seven port groups (HWPort0156 takes
// two cycles, the rest one each). Latency becomes 21 (was 15).
def HWWriteResGroup144 : SchedWriteRes<[HWPort4,HWPort5,HWPort6,HWPort23,HWPort237,HWPort06,HWPort0156]> {
- let Latency = 15;
+ let Latency = 21;
let NumMicroOps = 8;
let ResourceCycles = [1,1,1,1,1,1,2];
}
def: InstRW<[HWWriteResGroup145], (instregex "VZEROALL")>;
// HWWriteResGroup146: 19 micro-ops across seven port groups; ResourceCycles
// entries pair positionally with the listed ports. Latency becomes 22 (was 16).
def HWWriteResGroup146 : SchedWriteRes<[HWPort0,HWPort4,HWPort5,HWPort23,HWPort237,HWPort06,HWPort0156]> {
- let Latency = 16;
+ let Latency = 22;
let NumMicroOps = 19;
let ResourceCycles = [2,1,4,1,1,4,6];
}
def: InstRW<[HWWriteResGroup149], (instregex "RDTSC")>;
// HWWriteResGroup150: 9 micro-ops on HWPort0 (four cycles), HWPort5 (three),
// HWPort23 and HWPort0156. Latency becomes 24 (was 18). The mapping visible
// here is VPCMPESTRIrm.
def HWWriteResGroup150 : SchedWriteRes<[HWPort0,HWPort5,HWPort23,HWPort0156]> {
- let Latency = 18;
+ let Latency = 24;
let NumMicroOps = 9;
let ResourceCycles = [4,3,1,1];
}
def: InstRW<[HWWriteResGroup150], (instregex "VPCMPESTRIrm")>;
// HWWriteResGroup151: 19 micro-ops on HWPort6 (three cycles), HWPort23 (one)
// and HWPort0156 (fifteen). Latency becomes 23 (was 18).
def HWWriteResGroup151 : SchedWriteRes<[HWPort6,HWPort23,HWPort0156]> {
- let Latency = 18;
+ let Latency = 23;
let NumMicroOps = 19;
let ResourceCycles = [3,1,15];
}
def: InstRW<[HWWriteResGroup152], (instregex "VPCMPESTRM128rr")>;
// HWWriteResGroup153: 10 micro-ops across five port groups; ResourceCycles
// entries pair positionally with the listed ports. Latency becomes 25 (was 19).
def HWWriteResGroup153 : SchedWriteRes<[HWPort0,HWPort5,HWPort23,HWPort015,HWPort0156]> {
- let Latency = 19;
+ let Latency = 25;
let NumMicroOps = 10;
let ResourceCycles = [4,3,1,1,1];
}
def: InstRW<[HWWriteResGroup154], (instregex "VDIVSDrr")>;
// HWWriteResGroup155: 2 micro-ops, one resource cycle each on HWPort0 and
// HWPort23. Latency becomes 27 (was 20). SQRTPDm, SQRTSDm, VDIVPDrm and
// VDIVSDrm are removed from this group and VSQRTPDm is added; DIVR_F32m and
// DIVR_F64m remain.
def HWWriteResGroup155 : SchedWriteRes<[HWPort0,HWPort23]> {
- let Latency = 20;
+ let Latency = 27;
let NumMicroOps = 2;
let ResourceCycles = [1,1];
}
def: InstRW<[HWWriteResGroup155], (instregex "DIVR_F32m")>;
def: InstRW<[HWWriteResGroup155], (instregex "DIVR_F64m")>;
-def: InstRW<[HWWriteResGroup155], (instregex "SQRTPDm")>;
-def: InstRW<[HWWriteResGroup155], (instregex "SQRTSDm")>;
-def: InstRW<[HWWriteResGroup155], (instregex "VDIVPDrm")>;
-def: InstRW<[HWWriteResGroup155], (instregex "VDIVSDrm")>;
+def: InstRW<[HWWriteResGroup155], (instregex "VSQRTPDm")>;
+
// HWWriteResGroup155_1: same ports and resource cycles as HWWriteResGroup155
// with latency 26; assigned to SQRTPDm, VDIVPDrm and VSQRTSDm.
+def HWWriteResGroup155_1 : SchedWriteRes<[HWPort0,HWPort23]> {
+ let Latency = 26;
+ let NumMicroOps = 2;
+ let ResourceCycles = [1,1];
+}
+def: InstRW<[HWWriteResGroup155_1], (instregex "SQRTPDm")>;
+def: InstRW<[HWWriteResGroup155_1], (instregex "VDIVPDrm")>;
+def: InstRW<[HWWriteResGroup155_1], (instregex "VSQRTSDm")>;
+
// HWWriteResGroup155_2: same ports and resource cycles as HWWriteResGroup155
// with latency 25; assigned to SQRTSDm and VDIVSDrm.
+def HWWriteResGroup155_2 : SchedWriteRes<[HWPort0,HWPort23]> {
+ let Latency = 25;
+ let NumMicroOps = 2;
+ let ResourceCycles = [1,1];
+}
+def: InstRW<[HWWriteResGroup155_2], (instregex "SQRTSDm")>;
+def: InstRW<[HWWriteResGroup155_2], (instregex "VDIVSDrm")>;
def HWWriteResGroup156 : SchedWriteRes<[HWPort5,HWPort6,HWPort0156]> {
let Latency = 20;
def: InstRW<[HWWriteResGroup157], (instregex "VSQRTPDr")>;
def: InstRW<[HWWriteResGroup157], (instregex "VSQRTSDr")>;
-def HWWriteResGroup158 : SchedWriteRes<[HWPort0,HWPort23]> {
- let Latency = 21;
- let NumMicroOps = 2;
- let ResourceCycles = [1,1];
-}
-def: InstRW<[HWWriteResGroup158], (instregex "VSQRTPDm")>;
-def: InstRW<[HWWriteResGroup158], (instregex "VSQRTSDm")>;
-
def HWWriteResGroup159 : SchedWriteRes<[HWPort0,HWPort015]> {
let Latency = 21;
let NumMicroOps = 3;
def: InstRW<[HWWriteResGroup159], (instregex "VSQRTPSYr")>;
// HWWriteResGroup160: 4 micro-ops on HWPort0 (two cycles), HWPort23 and
// HWPort015. Latency becomes 28 (was 21). The mapping visible here is
// VSQRTPSYm.
def HWWriteResGroup160 : SchedWriteRes<[HWPort0,HWPort23,HWPort015]> {
- let Latency = 21;
+ let Latency = 28;
let NumMicroOps = 4;
let ResourceCycles = [2,1,1];
}
def: InstRW<[HWWriteResGroup160], (instregex "VSQRTPSYm")>;
// HWWriteResGroup161: 3 micro-ops, one resource cycle each on HWPort0,
// HWPort1 and HWPort23. Latency becomes 30 (was 23).
def HWWriteResGroup161 : SchedWriteRes<[HWPort0,HWPort1,HWPort23]> {
- let Latency = 23;
+ let Latency = 30;
let NumMicroOps = 3;
let ResourceCycles = [1,1,1];
}
def: InstRW<[HWWriteResGroup162], (instregex "DIVR_FrST0")>;
// HWWriteResGroup163: 2 micro-ops, one resource cycle each on HWPort0 and
// HWPort23. Latency becomes 31 (was 24). The mapping visible here is DIV_F64m.
def HWWriteResGroup163 : SchedWriteRes<[HWPort0,HWPort23]> {
- let Latency = 24;
+ let Latency = 31;
let NumMicroOps = 2;
let ResourceCycles = [1,1];
}
def: InstRW<[HWWriteResGroup163], (instregex "DIV_F64m")>;
// HWWriteResGroup164: 27 micro-ops across five port groups; ResourceCycles
// entries pair positionally with the listed ports. Latency becomes 30
// (was 24). The mapping visible here is XSAVE64.
def HWWriteResGroup164 : SchedWriteRes<[HWPort4,HWPort6,HWPort23,HWPort237,HWPort0156]> {
- let Latency = 24;
+ let Latency = 30;
let NumMicroOps = 27;
let ResourceCycles = [1,5,1,1,19];
}
def: InstRW<[HWWriteResGroup164], (instregex "XSAVE64")>;
// HWWriteResGroup165: 28 micro-ops across five port groups; ResourceCycles
// entries pair positionally with the listed ports. Latency becomes 31
// (was 25).
// NOTE(review): in the pattern "XSAVE(OPT?)" the '?' applies only to the 'T',
// so the group matches "XSAVEOP"/"XSAVEOPT" rather than making the whole
// "OPT" suffix optional -- confirm whether "XSAVE(OPT)?" was intended.
def HWWriteResGroup165 : SchedWriteRes<[HWPort4,HWPort6,HWPort23,HWPort237,HWPort0156]> {
- let Latency = 25;
+ let Latency = 31;
let NumMicroOps = 28;
let ResourceCycles = [1,6,1,1,19];
}
def: InstRW<[HWWriteResGroup165], (instregex "XSAVE(OPT?)")>;
// HWWriteResGroup166: 3 micro-ops, one resource cycle each on HWPort0,
// HWPort1 and HWPort23. Latency becomes 34 (was 27). The mapping visible
// here is DIV_FI32m.
def HWWriteResGroup166 : SchedWriteRes<[HWPort0,HWPort1,HWPort23]> {
- let Latency = 27;
+ let Latency = 34;
let NumMicroOps = 3;
let ResourceCycles = [1,1,1];
}
def: InstRW<[HWWriteResGroup166], (instregex "DIV_FI32m")>;
// HWWriteResGroup167: 11 micro-ops on HWPort0 (two cycles), HWPort5 (seven),
// HWPort23 and HWPort015. Latency becomes 34 (was 28).
def HWWriteResGroup167 : SchedWriteRes<[HWPort0,HWPort5,HWPort23,HWPort015]> {
- let Latency = 28;
+ let Latency = 34;
let NumMicroOps = 11;
let ResourceCycles = [2,7,1,1];
}
def: InstRW<[HWWriteResGroup168], (instregex "VAESKEYGENASSIST128rr")>;
// HWWriteResGroup170: 23 micro-ops across five port groups; ResourceCycles
// entries pair positionally with the listed ports. Latency becomes 35
// (was 30). The mapping visible here is IN8rr.
def HWWriteResGroup170 : SchedWriteRes<[HWPort5,HWPort6,HWPort23,HWPort06,HWPort0156]> {
- let Latency = 30;
+ let Latency = 35;
let NumMicroOps = 23;
let ResourceCycles = [1,5,3,4,10];
}
def: InstRW<[HWWriteResGroup170], (instregex "IN8rr")>;
// HWWriteResGroup171: 23 micro-ops across six port groups; ResourceCycles
// entries pair positionally with the listed ports. Latency becomes 36 (was 30).
def HWWriteResGroup171 : SchedWriteRes<[HWPort5,HWPort6,HWPort23,HWPort237,HWPort06,HWPort0156]> {
- let Latency = 30;
+ let Latency = 36;
let NumMicroOps = 23;
let ResourceCycles = [1,5,2,1,4,10];
}
def: InstRW<[HWWriteResGroup173], (instregex "VSQRTPDYr")>;
// HWWriteResGroup174: 4 micro-ops on HWPort0 (two cycles), HWPort23 and
// HWPort015. Latency becomes 42 (was 35). The mapping visible here is
// VSQRTPDYm.
def HWWriteResGroup174 : SchedWriteRes<[HWPort0,HWPort23,HWPort015]> {
- let Latency = 35;
+ let Latency = 42;
let NumMicroOps = 4;
let ResourceCycles = [2,1,1];
}
def: InstRW<[HWWriteResGroup174], (instregex "VSQRTPDYm")>;
// HWWriteResGroup175: 18 micro-ops across eight port groups; ResourceCycles
// entries pair positionally with the listed ports. Latency becomes 41 (was 35).
def HWWriteResGroup175 : SchedWriteRes<[HWPort1,HWPort4,HWPort5,HWPort6,HWPort23,HWPort237,HWPort15,HWPort0156]> {
- let Latency = 35;
+ let Latency = 41;
let NumMicroOps = 18;
let ResourceCycles = [1,1,2,3,1,1,1,8];
}
def: InstRW<[HWWriteResGroup176], (instregex "RDTSCP")>;
// HWWriteResGroup177: 64 micro-ops across seven port groups; ResourceCycles
// entries pair positionally with the listed ports. Latency becomes 61
// (was 56). The mapping visible here is FLDENVm.
def HWWriteResGroup177 : SchedWriteRes<[HWPort0,HWPort01,HWPort23,HWPort05,HWPort06,HWPort015,HWPort0156]> {
- let Latency = 56;
+ let Latency = 61;
let NumMicroOps = 64;
let ResourceCycles = [2,2,8,1,10,2,39];
}
def: InstRW<[HWWriteResGroup177], (instregex "FLDENVm")>;
// HWWriteResGroup178: 88 micro-ops across seven port groups; ResourceCycles
// entries pair positionally with the listed ports. Latency becomes 64
// (was 59). The mapping visible here is FXRSTOR64.
def HWWriteResGroup178 : SchedWriteRes<[HWPort0,HWPort6,HWPort23,HWPort05,HWPort06,HWPort15,HWPort0156]> {
- let Latency = 59;
+ let Latency = 64;
let NumMicroOps = 88;
let ResourceCycles = [4,4,31,1,2,1,45];
}
def: InstRW<[HWWriteResGroup178], (instregex "FXRSTOR64")>;
// HWWriteResGroup179: 90 micro-ops across seven port groups; ResourceCycles
// entries pair positionally with the listed ports. Latency becomes 64 (was 59).
def HWWriteResGroup179 : SchedWriteRes<[HWPort0,HWPort6,HWPort23,HWPort05,HWPort06,HWPort15,HWPort0156]> {
- let Latency = 59;
+ let Latency = 64;
let NumMicroOps = 90;
let ResourceCycles = [4,2,33,1,2,1,47];
}
def: InstRW<[HWWriteResGroup182], (instregex "IDIV(16|32|64)r")>;
// HWWriteResGroup183: 100 micro-ops across eight port groups; ResourceCycles
// entries pair positionally with the listed ports. Latency becomes 115
// (was 114).
def HWWriteResGroup183 : SchedWriteRes<[HWPort0,HWPort1,HWPort4,HWPort5,HWPort6,HWPort237,HWPort06,HWPort0156]> {
- let Latency = 114;
+ let Latency = 115;
let NumMicroOps = 100;
let ResourceCycles = [9,9,11,8,1,11,21,30];
}
// FSTENVm is mapped exactly once; a second identical InstRW entry for the
// same pattern adds nothing and only creates an overlapping mapping.
def: InstRW<[HWWriteResGroup183], (instregex "FSTENVm")>;
// HWWriteResGroup184: latency 26, 12 micro-ops; assigned to VGATHERDPDrm,
// VPGATHERDQrm and VPGATHERDDrm. ResourceCycles entries pair positionally
// with the listed ports; note this group lists HWPort15/HWPort015 before
// HWPort06, unlike the other gather groups in this excerpt.
+def HWWriteResGroup184 : SchedWriteRes<[HWPort0, HWPort5, HWPort15, HWPort015, HWPort06, HWPort23]> {
+ let Latency = 26;
+ let NumMicroOps = 12;
+ let ResourceCycles = [2,2,1,3,2,2];
+}
+def: InstRW<[HWWriteResGroup184], (instregex "VGATHERDPDrm")>;
+def: InstRW<[HWWriteResGroup184], (instregex "VPGATHERDQrm")>;
+def: InstRW<[HWWriteResGroup184], (instregex "VPGATHERDDrm")>;
+
// HWWriteResGroup185: latency 24, 22 micro-ops; assigned to VGATHERQPDYrm and
// VPGATHERQQYrm. ResourceCycles entries pair positionally with the ports.
+def HWWriteResGroup185 : SchedWriteRes<[HWPort0, HWPort5, HWPort06, HWPort15, HWPort015, HWPort23]> {
+ let Latency = 24;
+ let NumMicroOps = 22;
+ let ResourceCycles = [5,3,4,1,5,4];
+}
+def: InstRW<[HWWriteResGroup185], (instregex "VGATHERQPDYrm")>;
+def: InstRW<[HWWriteResGroup185], (instregex "VPGATHERQQYrm")>;
+
// HWWriteResGroup186: latency 28, 22 micro-ops; assigned to VPGATHERQDYrm.
// Same ports and resource cycles as HWWriteResGroup185, different latency.
+def HWWriteResGroup186 : SchedWriteRes<[HWPort0, HWPort5, HWPort06, HWPort15, HWPort015, HWPort23]> {
+ let Latency = 28;
+ let NumMicroOps = 22;
+ let ResourceCycles = [5,3,4,1,5,4];
+}
+def: InstRW<[HWWriteResGroup186], (instregex "VPGATHERQDYrm")>;
+
// HWWriteResGroup187: latency 25, 22 micro-ops; assigned to VPGATHERQDrm.
// Same ports and resource cycles as HWWriteResGroup185, different latency.
+def HWWriteResGroup187 : SchedWriteRes<[HWPort0, HWPort5, HWPort06, HWPort15, HWPort015, HWPort23]> {
+ let Latency = 25;
+ let NumMicroOps = 22;
+ let ResourceCycles = [5,3,4,1,5,4];
+}
+def: InstRW<[HWWriteResGroup187], (instregex "VPGATHERQDrm")>;
+
// HWWriteResGroup188: latency 27, 20 micro-ops; assigned to VGATHERDPDYrm and
// VPGATHERDQYrm. ResourceCycles entries pair positionally with the ports.
+def HWWriteResGroup188 : SchedWriteRes<[HWPort0, HWPort5, HWPort06, HWPort15, HWPort015, HWPort23]> {
+ let Latency = 27;
+ let NumMicroOps = 20;
+ let ResourceCycles = [3,3,4,1,5,4];
+}
+def: InstRW<[HWWriteResGroup188], (instregex "VGATHERDPDYrm")>;
+def: InstRW<[HWWriteResGroup188], (instregex "VPGATHERDQYrm")>;
+
// HWWriteResGroup189: latency 27, 34 micro-ops; assigned to VGATHERDPSYrm and
// VPGATHERDDYrm. ResourceCycles entries pair positionally with the ports.
+def HWWriteResGroup189 : SchedWriteRes<[HWPort0, HWPort5, HWPort06, HWPort15, HWPort015, HWPort23]> {
+ let Latency = 27;
+ let NumMicroOps = 34;
+ let ResourceCycles = [5,3,8,1,9,8];
+}
+def: InstRW<[HWWriteResGroup189], (instregex "VGATHERDPSYrm")>;
+def: InstRW<[HWWriteResGroup189], (instregex "VPGATHERDDYrm")>;
+
// HWWriteResGroup190: latency 23, 14 micro-ops; assigned to VGATHERQPDrm and
// VPGATHERQQrm. ResourceCycles entries pair positionally with the ports.
+def HWWriteResGroup190 : SchedWriteRes<[HWPort0, HWPort5, HWPort06, HWPort15, HWPort015, HWPort23]> {
+ let Latency = 23;
+ let NumMicroOps = 14;
+ let ResourceCycles = [3,3,2,1,3,2];
+}
+def: InstRW<[HWWriteResGroup190], (instregex "VGATHERQPDrm")>;
+def: InstRW<[HWWriteResGroup190], (instregex "VPGATHERQQrm")>;
+
// HWWriteResGroup191: latency 28, 15 micro-ops; assigned to VGATHERQPSYrm.
// ResourceCycles entries pair positionally with the listed ports.
+def HWWriteResGroup191 : SchedWriteRes<[HWPort0, HWPort5, HWPort06, HWPort15, HWPort015, HWPort23]> {
+ let Latency = 28;
+ let NumMicroOps = 15;
+ let ResourceCycles = [3,3,2,1,4,2];
+}
+def: InstRW<[HWWriteResGroup191], (instregex "VGATHERQPSYrm")>;
+
// HWWriteResGroup192: latency 25, 15 micro-ops; assigned to VGATHERQPSrm and
// VGATHERDPSrm. Same ports and resource cycles as HWWriteResGroup191,
// different latency.
+def HWWriteResGroup192 : SchedWriteRes<[HWPort0, HWPort5, HWPort06, HWPort15, HWPort015, HWPort23]> {
+ let Latency = 25;
+ let NumMicroOps = 15;
+ let ResourceCycles = [3,3,2,1,4,2];
+}
+def: InstRW<[HWWriteResGroup192], (instregex "VGATHERQPSrm")>;
+def: InstRW<[HWWriteResGroup192], (instregex "VGATHERDPSrm")>;
+
} // SchedModel
; HASWELL-LABEL: test_aesdec:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vaesdec %xmm1, %xmm0, %xmm0 # sched: [7:1.00]
-; HASWELL-NEXT: vaesdec (%rdi), %xmm0, %xmm0 # sched: [7:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vaesdec (%rdi), %xmm0, %xmm0 # sched: [13:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_aesdec:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_aesdeclast:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vaesdeclast %xmm1, %xmm0, %xmm0 # sched: [7:1.00]
-; HASWELL-NEXT: vaesdeclast (%rdi), %xmm0, %xmm0 # sched: [7:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vaesdeclast (%rdi), %xmm0, %xmm0 # sched: [13:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_aesdeclast:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_aesenc:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vaesenc %xmm1, %xmm0, %xmm0 # sched: [7:1.00]
-; HASWELL-NEXT: vaesenc (%rdi), %xmm0, %xmm0 # sched: [7:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vaesenc (%rdi), %xmm0, %xmm0 # sched: [13:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_aesenc:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_aesenclast:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vaesenclast %xmm1, %xmm0, %xmm0 # sched: [7:1.00]
-; HASWELL-NEXT: vaesenclast (%rdi), %xmm0, %xmm0 # sched: [7:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vaesenclast (%rdi), %xmm0, %xmm0 # sched: [13:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_aesenclast:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_aesimc:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vaesimc %xmm0, %xmm0 # sched: [14:2.00]
-; HASWELL-NEXT: vaesimc (%rdi), %xmm1 # sched: [14:2.00]
+; HASWELL-NEXT: vaesimc (%rdi), %xmm1 # sched: [20:2.00]
; HASWELL-NEXT: vpor %xmm1, %xmm0, %xmm0 # sched: [1:0.33]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_aesimc:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_aeskeygenassist:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vaeskeygenassist $7, %xmm0, %xmm0 # sched: [29:7.00]
-; HASWELL-NEXT: vaeskeygenassist $7, (%rdi), %xmm1 # sched: [28:7.00]
+; HASWELL-NEXT: vaeskeygenassist $7, (%rdi), %xmm1 # sched: [34:7.00]
; HASWELL-NEXT: vpor %xmm1, %xmm0, %xmm0 # sched: [1:0.33]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_aeskeygenassist:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_addpd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vaddpd %ymm1, %ymm0, %ymm0 # sched: [3:1.00]
-; HASWELL-NEXT: vaddpd (%rdi), %ymm0, %ymm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vaddpd (%rdi), %ymm0, %ymm0 # sched: [10:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_addpd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_addps:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vaddps %ymm1, %ymm0, %ymm0 # sched: [3:1.00]
-; HASWELL-NEXT: vaddps (%rdi), %ymm0, %ymm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vaddps (%rdi), %ymm0, %ymm0 # sched: [10:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_addps:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_addsubpd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vaddsubpd %ymm1, %ymm0, %ymm0 # sched: [3:1.00]
-; HASWELL-NEXT: vaddsubpd (%rdi), %ymm0, %ymm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vaddsubpd (%rdi), %ymm0, %ymm0 # sched: [10:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_addsubpd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_addsubps:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vaddsubps %ymm1, %ymm0, %ymm0 # sched: [3:1.00]
-; HASWELL-NEXT: vaddsubps (%rdi), %ymm0, %ymm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vaddsubps (%rdi), %ymm0, %ymm0 # sched: [10:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_addsubps:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_andnotpd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vandnpd %ymm1, %ymm0, %ymm0 # sched: [1:1.00]
-; HASWELL-NEXT: vandnpd (%rdi), %ymm0, %ymm0 # sched: [1:1.00]
+; HASWELL-NEXT: vandnpd (%rdi), %ymm0, %ymm0 # sched: [8:1.00]
; HASWELL-NEXT: vaddpd %ymm0, %ymm1, %ymm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_andnotpd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_andnotps:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vandnps %ymm1, %ymm0, %ymm0 # sched: [1:1.00]
-; HASWELL-NEXT: vandnps (%rdi), %ymm0, %ymm0 # sched: [1:1.00]
+; HASWELL-NEXT: vandnps (%rdi), %ymm0, %ymm0 # sched: [8:1.00]
; HASWELL-NEXT: vaddps %ymm0, %ymm1, %ymm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_andnotps:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_andpd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vandpd %ymm1, %ymm0, %ymm0 # sched: [1:1.00]
-; HASWELL-NEXT: vandpd (%rdi), %ymm0, %ymm0 # sched: [1:1.00]
+; HASWELL-NEXT: vandpd (%rdi), %ymm0, %ymm0 # sched: [8:1.00]
; HASWELL-NEXT: vaddpd %ymm0, %ymm1, %ymm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_andpd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_andps:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vandps %ymm1, %ymm0, %ymm0 # sched: [1:1.00]
-; HASWELL-NEXT: vandps (%rdi), %ymm0, %ymm0 # sched: [1:1.00]
+; HASWELL-NEXT: vandps (%rdi), %ymm0, %ymm0 # sched: [8:1.00]
; HASWELL-NEXT: vaddps %ymm0, %ymm1, %ymm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_andps:
; BROADWELL: # %bb.0:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vblendpd {{.*#+}} ymm0 = ymm0[0],ymm1[1,2],ymm0[3] sched: [1:0.33]
; HASWELL-NEXT: vaddpd %ymm0, %ymm1, %ymm0 # sched: [3:1.00]
-; HASWELL-NEXT: vblendpd {{.*#+}} ymm0 = ymm0[0],mem[1,2],ymm0[3] sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vblendpd {{.*#+}} ymm0 = ymm0[0],mem[1,2],ymm0[3] sched: [8:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_blendpd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_blendps:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vblendps {{.*#+}} ymm0 = ymm0[0],ymm1[1,2],ymm0[3,4,5,6,7] sched: [1:0.33]
-; HASWELL-NEXT: vblendps {{.*#+}} ymm0 = ymm0[0,1],mem[2],ymm0[3],mem[4,5,6],ymm0[7] sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vblendps {{.*#+}} ymm0 = ymm0[0,1],mem[2],ymm0[3],mem[4,5,6],ymm0[7] sched: [8:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_blendps:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_blendvpd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vblendvpd %ymm2, %ymm1, %ymm0, %ymm0 # sched: [2:2.00]
-; HASWELL-NEXT: vblendvpd %ymm2, (%rdi), %ymm0, %ymm0 # sched: [2:2.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vblendvpd %ymm2, (%rdi), %ymm0, %ymm0 # sched: [9:2.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_blendvpd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_blendvps:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vblendvps %ymm2, %ymm1, %ymm0, %ymm0 # sched: [2:2.00]
-; HASWELL-NEXT: vblendvps %ymm2, (%rdi), %ymm0, %ymm0 # sched: [2:2.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vblendvps %ymm2, (%rdi), %ymm0, %ymm0 # sched: [9:2.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_blendvps:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_broadcastf128:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: vbroadcastf128 {{.*#+}} ymm0 = mem[0,1,0,1] sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vbroadcastf128 {{.*#+}} ymm0 = mem[0,1,0,1] sched: [7:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_broadcastf128:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_broadcastsd_ymm:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: vbroadcastsd (%rdi), %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vbroadcastsd (%rdi), %ymm0 # sched: [7:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_broadcastsd_ymm:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_broadcastss:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: vbroadcastss (%rdi), %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vbroadcastss (%rdi), %xmm0 # sched: [6:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_broadcastss:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_broadcastss_ymm:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: vbroadcastss (%rdi), %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vbroadcastss (%rdi), %ymm0 # sched: [7:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_broadcastss_ymm:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_cmppd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vcmpeqpd %ymm1, %ymm0, %ymm1 # sched: [3:1.00]
-; HASWELL-NEXT: vcmpeqpd (%rdi), %ymm0, %ymm0 # sched: [3:1.00]
+; HASWELL-NEXT: vcmpeqpd (%rdi), %ymm0, %ymm0 # sched: [10:1.00]
; HASWELL-NEXT: vorpd %ymm0, %ymm1, %ymm0 # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_cmppd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_cmpps:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vcmpeqps %ymm1, %ymm0, %ymm1 # sched: [3:1.00]
-; HASWELL-NEXT: vcmpeqps (%rdi), %ymm0, %ymm0 # sched: [3:1.00]
+; HASWELL-NEXT: vcmpeqps (%rdi), %ymm0, %ymm0 # sched: [10:1.00]
; HASWELL-NEXT: vorps %ymm0, %ymm1, %ymm0 # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_cmpps:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_cvtdq2pd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vcvtdq2pd %xmm0, %ymm0 # sched: [6:1.00]
-; HASWELL-NEXT: vcvtdq2pd (%rdi), %ymm1 # sched: [6:1.00]
+; HASWELL-NEXT: vcvtdq2pd (%rdi), %ymm1 # sched: [12:1.00]
; HASWELL-NEXT: vaddpd %ymm1, %ymm0, %ymm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_cvtdq2pd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_cvtdq2ps:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vcvtdq2ps %ymm0, %ymm0 # sched: [3:1.00]
-; HASWELL-NEXT: vcvtdq2ps (%rdi), %ymm1 # sched: [3:1.00]
+; HASWELL-NEXT: vcvtdq2ps (%rdi), %ymm1 # sched: [10:1.00]
; HASWELL-NEXT: vaddps %ymm1, %ymm0, %ymm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_cvtdq2ps:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_cvtpd2dq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vcvtpd2dq %ymm0, %xmm0 # sched: [6:1.00]
-; HASWELL-NEXT: vcvtpd2dqy (%rdi), %xmm1 # sched: [7:1.00]
+; HASWELL-NEXT: vcvtpd2dqy (%rdi), %xmm1 # sched: [8:1.00]
; HASWELL-NEXT: vinsertf128 $1, %xmm1, %ymm0, %ymm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_cvtpd2dq:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_cvttpd2dq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vcvttpd2dq %ymm0, %xmm0 # sched: [6:1.00]
-; HASWELL-NEXT: vcvttpd2dqy (%rdi), %xmm1 # sched: [7:1.00]
+; HASWELL-NEXT: vcvttpd2dqy (%rdi), %xmm1 # sched: [8:1.00]
; HASWELL-NEXT: vinsertf128 $1, %xmm1, %ymm0, %ymm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_cvttpd2dq:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_cvtpd2ps:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vcvtpd2ps %ymm0, %xmm0 # sched: [6:1.00]
-; HASWELL-NEXT: vcvtpd2psy (%rdi), %xmm1 # sched: [7:1.00]
+; HASWELL-NEXT: vcvtpd2psy (%rdi), %xmm1 # sched: [8:1.00]
; HASWELL-NEXT: vinsertf128 $1, %xmm1, %ymm0, %ymm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_cvtpd2ps:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_cvtps2dq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vcvtps2dq %ymm0, %ymm0 # sched: [3:1.00]
-; HASWELL-NEXT: vcvtps2dq (%rdi), %ymm1 # sched: [3:1.00]
+; HASWELL-NEXT: vcvtps2dq (%rdi), %ymm1 # sched: [10:1.00]
; HASWELL-NEXT: vorpd %ymm1, %ymm0, %ymm0 # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_cvtps2dq:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_cvttps2dq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vcvttps2dq %ymm0, %ymm0 # sched: [3:1.00]
-; HASWELL-NEXT: vcvttps2dq (%rdi), %ymm1 # sched: [3:1.00]
+; HASWELL-NEXT: vcvttps2dq (%rdi), %ymm1 # sched: [10:1.00]
; HASWELL-NEXT: vorps %ymm1, %ymm0, %ymm0 # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_cvttps2dq:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_divpd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vdivpd %ymm1, %ymm0, %ymm0 # sched: [35:2.00]
-; HASWELL-NEXT: vdivpd (%rdi), %ymm0, %ymm0 # sched: [35:2.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vdivpd (%rdi), %ymm0, %ymm0 # sched: [42:2.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_divpd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_divps:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vdivps %ymm1, %ymm0, %ymm0 # sched: [21:2.00]
-; HASWELL-NEXT: vdivps (%rdi), %ymm0, %ymm0 # sched: [21:2.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vdivps (%rdi), %ymm0, %ymm0 # sched: [28:2.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_divps:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_dpps:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vdpps $7, %ymm1, %ymm0, %ymm0 # sched: [14:2.00]
-; HASWELL-NEXT: vdpps $7, (%rdi), %ymm0, %ymm0 # sched: [14:2.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vdpps $7, (%rdi), %ymm0, %ymm0 # sched: [21:2.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_dpps:
; BROADWELL: # %bb.0:
; HASWELL-NEXT: vextractf128 $1, %ymm0, %xmm0 # sched: [3:1.00]
; HASWELL-NEXT: vextractf128 $1, %ymm1, (%rdi) # sched: [1:1.00]
; HASWELL-NEXT: vzeroupper # sched: [4:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_extractf128:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_haddpd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vhaddpd %ymm1, %ymm0, %ymm0 # sched: [5:2.00]
-; HASWELL-NEXT: vhaddpd (%rdi), %ymm0, %ymm0 # sched: [5:2.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vhaddpd (%rdi), %ymm0, %ymm0 # sched: [12:2.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_haddpd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_haddps:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vhaddps %ymm1, %ymm0, %ymm0 # sched: [5:2.00]
-; HASWELL-NEXT: vhaddps (%rdi), %ymm0, %ymm0 # sched: [5:2.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vhaddps (%rdi), %ymm0, %ymm0 # sched: [12:2.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_haddps:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_hsubpd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vhsubpd %ymm1, %ymm0, %ymm0 # sched: [5:2.00]
-; HASWELL-NEXT: vhsubpd (%rdi), %ymm0, %ymm0 # sched: [5:2.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vhsubpd (%rdi), %ymm0, %ymm0 # sched: [12:2.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_hsubpd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_hsubps:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vhsubps %ymm1, %ymm0, %ymm0 # sched: [5:2.00]
-; HASWELL-NEXT: vhsubps (%rdi), %ymm0, %ymm0 # sched: [5:2.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vhsubps (%rdi), %ymm0, %ymm0 # sched: [12:2.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_hsubps:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_insertf128:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vinsertf128 $1, %xmm1, %ymm0, %ymm1 # sched: [3:1.00]
-; HASWELL-NEXT: vinsertf128 $1, (%rdi), %ymm0, %ymm0 # sched: [1:0.50]
+; HASWELL-NEXT: vinsertf128 $1, (%rdi), %ymm0, %ymm0 # sched: [7:0.50]
; HASWELL-NEXT: vaddps %ymm0, %ymm1, %ymm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_insertf128:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_lddqu:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: vlddqu (%rdi), %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vlddqu (%rdi), %ymm0 # sched: [7:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_lddqu:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_maskmovpd:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: vmaskmovpd (%rdi), %xmm0, %xmm2 # sched: [2:2.00]
-; HASWELL-NEXT: vmaskmovpd %xmm1, %xmm0, (%rdi) # sched: [4:1.00]
+; HASWELL-NEXT: vmaskmovpd (%rdi), %xmm0, %xmm2 # sched: [8:2.00]
+; HASWELL-NEXT: vmaskmovpd %xmm1, %xmm0, (%rdi) # sched: [5:1.00]
; HASWELL-NEXT: vmovapd %xmm2, %xmm0 # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_maskmovpd:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_maskmovpd_ymm:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: vmaskmovpd (%rdi), %ymm0, %ymm2 # sched: [2:2.00]
-; HASWELL-NEXT: vmaskmovpd %ymm1, %ymm0, (%rdi) # sched: [4:1.00]
+; HASWELL-NEXT: vmaskmovpd (%rdi), %ymm0, %ymm2 # sched: [9:2.00]
+; HASWELL-NEXT: vmaskmovpd %ymm1, %ymm0, (%rdi) # sched: [5:1.00]
; HASWELL-NEXT: vmovapd %ymm2, %ymm0 # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_maskmovpd_ymm:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_maskmovps:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: vmaskmovps (%rdi), %xmm0, %xmm2 # sched: [2:2.00]
-; HASWELL-NEXT: vmaskmovps %xmm1, %xmm0, (%rdi) # sched: [4:1.00]
+; HASWELL-NEXT: vmaskmovps (%rdi), %xmm0, %xmm2 # sched: [8:2.00]
+; HASWELL-NEXT: vmaskmovps %xmm1, %xmm0, (%rdi) # sched: [5:1.00]
; HASWELL-NEXT: vmovaps %xmm2, %xmm0 # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_maskmovps:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_maskmovps_ymm:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: vmaskmovps (%rdi), %ymm0, %ymm2 # sched: [2:2.00]
-; HASWELL-NEXT: vmaskmovps %ymm1, %ymm0, (%rdi) # sched: [4:1.00]
+; HASWELL-NEXT: vmaskmovps (%rdi), %ymm0, %ymm2 # sched: [9:2.00]
+; HASWELL-NEXT: vmaskmovps %ymm1, %ymm0, (%rdi) # sched: [5:1.00]
; HASWELL-NEXT: vmovaps %ymm2, %ymm0 # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_maskmovps_ymm:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_maxpd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vmaxpd %ymm1, %ymm0, %ymm0 # sched: [3:1.00]
-; HASWELL-NEXT: vmaxpd (%rdi), %ymm0, %ymm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vmaxpd (%rdi), %ymm0, %ymm0 # sched: [10:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_maxpd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_maxps:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vmaxps %ymm1, %ymm0, %ymm0 # sched: [3:1.00]
-; HASWELL-NEXT: vmaxps (%rdi), %ymm0, %ymm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vmaxps (%rdi), %ymm0, %ymm0 # sched: [10:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_maxps:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_minpd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vminpd %ymm1, %ymm0, %ymm0 # sched: [3:1.00]
-; HASWELL-NEXT: vminpd (%rdi), %ymm0, %ymm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vminpd (%rdi), %ymm0, %ymm0 # sched: [10:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_minpd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_minps:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vminps %ymm1, %ymm0, %ymm0 # sched: [3:1.00]
-; HASWELL-NEXT: vminps (%rdi), %ymm0, %ymm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vminps (%rdi), %ymm0, %ymm0 # sched: [10:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_minps:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_movapd:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: vmovapd (%rdi), %ymm0 # sched: [1:0.50]
+; HASWELL-NEXT: vmovapd (%rdi), %ymm0 # sched: [7:0.50]
; HASWELL-NEXT: vaddpd %ymm0, %ymm0, %ymm0 # sched: [3:1.00]
; HASWELL-NEXT: vmovapd %ymm0, (%rsi) # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_movapd:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_movaps:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: vmovaps (%rdi), %ymm0 # sched: [1:0.50]
+; HASWELL-NEXT: vmovaps (%rdi), %ymm0 # sched: [7:0.50]
; HASWELL-NEXT: vaddps %ymm0, %ymm0, %ymm0 # sched: [3:1.00]
; HASWELL-NEXT: vmovaps %ymm0, (%rsi) # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_movaps:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_movddup:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vmovddup {{.*#+}} ymm0 = ymm0[0,0,2,2] sched: [1:1.00]
-; HASWELL-NEXT: vmovddup {{.*#+}} ymm1 = mem[0,0,2,2] sched: [1:0.50]
+; HASWELL-NEXT: vmovddup {{.*#+}} ymm1 = mem[0,0,2,2] sched: [7:0.50]
; HASWELL-NEXT: vaddpd %ymm1, %ymm0, %ymm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_movddup:
; BROADWELL: # %bb.0:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vmovmskpd %ymm0, %eax # sched: [3:1.00]
; HASWELL-NEXT: vzeroupper # sched: [4:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_movmskpd:
; BROADWELL: # %bb.0:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vmovmskps %ymm0, %eax # sched: [3:1.00]
; HASWELL-NEXT: vzeroupper # sched: [4:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_movmskps:
; BROADWELL: # %bb.0:
; HASWELL-NEXT: vmovntdq %ymm0, (%rdi) # sched: [1:1.00]
; HASWELL-NEXT: #NO_APP
; HASWELL-NEXT: vzeroupper # sched: [4:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_movntdq:
; BROADWELL: # %bb.0:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vaddpd %ymm0, %ymm0, %ymm0 # sched: [3:1.00]
; HASWELL-NEXT: vmovntpd %ymm0, (%rdi) # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_movntpd:
; BROADWELL: # %bb.0:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vaddps %ymm0, %ymm0, %ymm0 # sched: [3:1.00]
; HASWELL-NEXT: vmovntps %ymm0, (%rdi) # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_movntps:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_movshdup:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vmovshdup {{.*#+}} ymm0 = ymm0[1,1,3,3,5,5,7,7] sched: [1:1.00]
-; HASWELL-NEXT: vmovshdup {{.*#+}} ymm1 = mem[1,1,3,3,5,5,7,7] sched: [1:0.50]
+; HASWELL-NEXT: vmovshdup {{.*#+}} ymm1 = mem[1,1,3,3,5,5,7,7] sched: [7:0.50]
; HASWELL-NEXT: vaddps %ymm1, %ymm0, %ymm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_movshdup:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_movsldup:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vmovsldup {{.*#+}} ymm0 = ymm0[0,0,2,2,4,4,6,6] sched: [1:1.00]
-; HASWELL-NEXT: vmovsldup {{.*#+}} ymm1 = mem[0,0,2,2,4,4,6,6] sched: [1:0.50]
+; HASWELL-NEXT: vmovsldup {{.*#+}} ymm1 = mem[0,0,2,2,4,4,6,6] sched: [7:0.50]
; HASWELL-NEXT: vaddps %ymm1, %ymm0, %ymm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_movsldup:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_movupd:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: vmovupd (%rdi), %ymm0 # sched: [1:0.50]
+; HASWELL-NEXT: vmovupd (%rdi), %ymm0 # sched: [7:0.50]
; HASWELL-NEXT: vaddpd %ymm0, %ymm0, %ymm0 # sched: [3:1.00]
; HASWELL-NEXT: vmovupd %ymm0, (%rsi) # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_movupd:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_movups:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: vmovups (%rdi), %ymm0 # sched: [1:0.50]
+; HASWELL-NEXT: vmovups (%rdi), %ymm0 # sched: [7:0.50]
; HASWELL-NEXT: vaddps %ymm0, %ymm0, %ymm0 # sched: [3:1.00]
; HASWELL-NEXT: vmovups %ymm0, (%rsi) # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_movups:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_mulpd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vmulpd %ymm1, %ymm0, %ymm0 # sched: [5:0.50]
-; HASWELL-NEXT: vmulpd (%rdi), %ymm0, %ymm0 # sched: [5:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vmulpd (%rdi), %ymm0, %ymm0 # sched: [12:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_mulpd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_mulps:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vmulps %ymm1, %ymm0, %ymm0 # sched: [5:0.50]
-; HASWELL-NEXT: vmulps (%rdi), %ymm0, %ymm0 # sched: [5:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vmulps (%rdi), %ymm0, %ymm0 # sched: [12:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_mulps:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: orpd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vorpd %ymm1, %ymm0, %ymm0 # sched: [1:1.00]
-; HASWELL-NEXT: vorpd (%rdi), %ymm0, %ymm0 # sched: [1:1.00]
+; HASWELL-NEXT: vorpd (%rdi), %ymm0, %ymm0 # sched: [8:1.00]
; HASWELL-NEXT: vaddpd %ymm0, %ymm1, %ymm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: orpd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_orps:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vorps %ymm1, %ymm0, %ymm0 # sched: [1:1.00]
-; HASWELL-NEXT: vorps (%rdi), %ymm0, %ymm0 # sched: [1:1.00]
+; HASWELL-NEXT: vorps (%rdi), %ymm0, %ymm0 # sched: [8:1.00]
; HASWELL-NEXT: vaddps %ymm0, %ymm1, %ymm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_orps:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_perm2f128:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vperm2f128 {{.*#+}} ymm1 = ymm0[2,3],ymm1[0,1] sched: [3:1.00]
-; HASWELL-NEXT: vperm2f128 {{.*#+}} ymm0 = ymm0[2,3],mem[0,1] sched: [3:1.00]
+; HASWELL-NEXT: vperm2f128 {{.*#+}} ymm0 = ymm0[2,3],mem[0,1] sched: [10:1.00]
; HASWELL-NEXT: vaddpd %ymm0, %ymm1, %ymm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_perm2f128:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_permilpd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpermilpd {{.*#+}} xmm0 = xmm0[1,0] sched: [1:1.00]
-; HASWELL-NEXT: vpermilpd {{.*#+}} xmm1 = mem[1,0] sched: [1:1.00]
+; HASWELL-NEXT: vpermilpd {{.*#+}} xmm1 = mem[1,0] sched: [7:1.00]
; HASWELL-NEXT: vaddpd %xmm1, %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_permilpd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_permilpd_ymm:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpermilpd {{.*#+}} ymm0 = ymm0[1,0,2,3] sched: [1:1.00]
-; HASWELL-NEXT: vpermilpd {{.*#+}} ymm1 = mem[1,0,2,3] sched: [1:1.00]
+; HASWELL-NEXT: vpermilpd {{.*#+}} ymm1 = mem[1,0,2,3] sched: [8:1.00]
; HASWELL-NEXT: vaddpd %ymm1, %ymm0, %ymm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_permilpd_ymm:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_permilps:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpermilps {{.*#+}} xmm0 = xmm0[3,2,1,0] sched: [1:1.00]
-; HASWELL-NEXT: vpermilps {{.*#+}} xmm1 = mem[3,2,1,0] sched: [1:1.00]
+; HASWELL-NEXT: vpermilps {{.*#+}} xmm1 = mem[3,2,1,0] sched: [7:1.00]
; HASWELL-NEXT: vaddps %xmm1, %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_permilps:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_permilps_ymm:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpermilps {{.*#+}} ymm0 = ymm0[3,2,1,0,7,6,5,4] sched: [1:1.00]
-; HASWELL-NEXT: vpermilps {{.*#+}} ymm1 = mem[3,2,1,0,7,6,5,4] sched: [1:1.00]
+; HASWELL-NEXT: vpermilps {{.*#+}} ymm1 = mem[3,2,1,0,7,6,5,4] sched: [8:1.00]
; HASWELL-NEXT: vaddps %ymm1, %ymm0, %ymm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_permilps_ymm:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_permilvarpd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpermilpd %xmm1, %xmm0, %xmm0 # sched: [1:1.00]
-; HASWELL-NEXT: vpermilpd (%rdi), %xmm0, %xmm0 # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpermilpd (%rdi), %xmm0, %xmm0 # sched: [7:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_permilvarpd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_permilvarpd_ymm:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpermilpd %ymm1, %ymm0, %ymm0 # sched: [1:1.00]
-; HASWELL-NEXT: vpermilpd (%rdi), %ymm0, %ymm0 # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpermilpd (%rdi), %ymm0, %ymm0 # sched: [8:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_permilvarpd_ymm:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_permilvarps:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpermilps %xmm1, %xmm0, %xmm0 # sched: [1:1.00]
-; HASWELL-NEXT: vpermilps (%rdi), %xmm0, %xmm0 # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpermilps (%rdi), %xmm0, %xmm0 # sched: [7:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_permilvarps:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_permilvarps_ymm:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpermilps %ymm1, %ymm0, %ymm0 # sched: [1:1.00]
-; HASWELL-NEXT: vpermilps (%rdi), %ymm0, %ymm0 # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpermilps (%rdi), %ymm0, %ymm0 # sched: [8:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_permilvarps_ymm:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_rcpps:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: vrcpps (%rdi), %ymm1 # sched: [11:2.00]
+; HASWELL-NEXT: vrcpps (%rdi), %ymm1 # sched: [18:2.00]
; HASWELL-NEXT: vrcpps %ymm0, %ymm0 # sched: [11:2.00]
; HASWELL-NEXT: vaddps %ymm1, %ymm0, %ymm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_rcpps:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_roundpd:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: vroundpd $7, %ymm0, %ymm0 # sched: [5:1.25]
-; HASWELL-NEXT: vroundpd $7, (%rdi), %ymm1 # sched: [6:2.00]
+; HASWELL-NEXT: vroundpd $7, %ymm0, %ymm0 # sched: [6:0.50]
+; HASWELL-NEXT: vroundpd $7, (%rdi), %ymm1 # sched: [13:2.00]
; HASWELL-NEXT: vaddpd %ymm1, %ymm0, %ymm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_roundpd:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_roundps:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: vroundps $7, %ymm0, %ymm0 # sched: [5:1.25]
-; HASWELL-NEXT: vroundps $7, (%rdi), %ymm1 # sched: [6:2.00]
+; HASWELL-NEXT: vroundps $7, %ymm0, %ymm0 # sched: [6:0.50]
+; HASWELL-NEXT: vroundps $7, (%rdi), %ymm1 # sched: [13:2.00]
; HASWELL-NEXT: vaddps %ymm1, %ymm0, %ymm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_roundps:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_rsqrtps:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: vrsqrtps (%rdi), %ymm1 # sched: [11:2.00]
+; HASWELL-NEXT: vrsqrtps (%rdi), %ymm1 # sched: [18:2.00]
; HASWELL-NEXT: vrsqrtps %ymm0, %ymm0 # sched: [11:2.00]
; HASWELL-NEXT: vaddps %ymm1, %ymm0, %ymm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_rsqrtps:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_shufpd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vshufpd {{.*#+}} ymm0 = ymm0[1],ymm1[0],ymm0[2],ymm1[3] sched: [1:1.00]
-; HASWELL-NEXT: vshufpd {{.*#+}} ymm1 = ymm1[1],mem[0],ymm1[2],mem[3] sched: [1:1.00]
+; HASWELL-NEXT: vshufpd {{.*#+}} ymm1 = ymm1[1],mem[0],ymm1[2],mem[3] sched: [8:1.00]
; HASWELL-NEXT: vaddpd %ymm1, %ymm0, %ymm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_shufpd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_shufps:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vshufps {{.*#+}} ymm0 = ymm0[0,0],ymm1[0,0],ymm0[4,4],ymm1[4,4] sched: [1:1.00]
-; HASWELL-NEXT: vshufps {{.*#+}} ymm0 = ymm0[0,3],mem[0,0],ymm0[4,7],mem[4,4] sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vshufps {{.*#+}} ymm0 = ymm0[0,3],mem[0,0],ymm0[4,7],mem[4,4] sched: [8:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_shufps:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_sqrtpd:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: vsqrtpd (%rdi), %ymm1 # sched: [35:2.00]
+; HASWELL-NEXT: vsqrtpd (%rdi), %ymm1 # sched: [42:2.00]
; HASWELL-NEXT: vsqrtpd %ymm0, %ymm0 # sched: [35:2.00]
; HASWELL-NEXT: vaddpd %ymm1, %ymm0, %ymm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_sqrtpd:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_sqrtps:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: vsqrtps (%rdi), %ymm1 # sched: [21:2.00]
+; HASWELL-NEXT: vsqrtps (%rdi), %ymm1 # sched: [28:2.00]
; HASWELL-NEXT: vsqrtps %ymm0, %ymm0 # sched: [21:2.00]
; HASWELL-NEXT: vaddps %ymm1, %ymm0, %ymm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_sqrtps:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_subpd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vsubpd %ymm1, %ymm0, %ymm0 # sched: [3:1.00]
-; HASWELL-NEXT: vsubpd (%rdi), %ymm0, %ymm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vsubpd (%rdi), %ymm0, %ymm0 # sched: [10:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_subpd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_subps:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vsubps %ymm1, %ymm0, %ymm0 # sched: [3:1.00]
-; HASWELL-NEXT: vsubps (%rdi), %ymm0, %ymm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vsubps (%rdi), %ymm0, %ymm0 # sched: [10:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_subps:
; BROADWELL: # %bb.0:
; HASWELL-NEXT: xorl %eax, %eax # sched: [1:0.25]
; HASWELL-NEXT: vtestpd %xmm1, %xmm0 # sched: [1:1.00]
; HASWELL-NEXT: setb %al # sched: [1:0.50]
-; HASWELL-NEXT: vtestpd (%rdi), %xmm0 # sched: [1:1.00]
+; HASWELL-NEXT: vtestpd (%rdi), %xmm0 # sched: [7:1.00]
; HASWELL-NEXT: adcl $0, %eax # sched: [2:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_testpd:
; BROADWELL: # %bb.0:
; HASWELL-NEXT: xorl %eax, %eax # sched: [1:0.25]
; HASWELL-NEXT: vtestpd %ymm1, %ymm0 # sched: [1:1.00]
; HASWELL-NEXT: setb %al # sched: [1:0.50]
-; HASWELL-NEXT: vtestpd (%rdi), %ymm0 # sched: [1:1.00]
+; HASWELL-NEXT: vtestpd (%rdi), %ymm0 # sched: [8:1.00]
; HASWELL-NEXT: adcl $0, %eax # sched: [2:0.50]
; HASWELL-NEXT: vzeroupper # sched: [4:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_testpd_ymm:
; BROADWELL: # %bb.0:
; HASWELL-NEXT: xorl %eax, %eax # sched: [1:0.25]
; HASWELL-NEXT: vtestps %xmm1, %xmm0 # sched: [1:1.00]
; HASWELL-NEXT: setb %al # sched: [1:0.50]
-; HASWELL-NEXT: vtestps (%rdi), %xmm0 # sched: [1:1.00]
+; HASWELL-NEXT: vtestps (%rdi), %xmm0 # sched: [7:1.00]
; HASWELL-NEXT: adcl $0, %eax # sched: [2:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_testps:
; BROADWELL: # %bb.0:
; HASWELL-NEXT: xorl %eax, %eax # sched: [1:0.25]
; HASWELL-NEXT: vtestps %ymm1, %ymm0 # sched: [1:1.00]
; HASWELL-NEXT: setb %al # sched: [1:0.50]
-; HASWELL-NEXT: vtestps (%rdi), %ymm0 # sched: [1:1.00]
+; HASWELL-NEXT: vtestps (%rdi), %ymm0 # sched: [8:1.00]
; HASWELL-NEXT: adcl $0, %eax # sched: [2:0.50]
; HASWELL-NEXT: vzeroupper # sched: [4:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_testps_ymm:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_unpckhpd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vunpckhpd {{.*#+}} ymm0 = ymm0[1],ymm1[1],ymm0[3],ymm1[3] sched: [1:1.00]
-; HASWELL-NEXT: vunpckhpd {{.*#+}} ymm1 = ymm1[1],mem[1],ymm1[3],mem[3] sched: [1:1.00]
+; HASWELL-NEXT: vunpckhpd {{.*#+}} ymm1 = ymm1[1],mem[1],ymm1[3],mem[3] sched: [8:1.00]
; HASWELL-NEXT: vaddpd %ymm1, %ymm0, %ymm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_unpckhpd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_unpckhps:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vunpckhps {{.*#+}} ymm0 = ymm0[2],ymm1[2],ymm0[3],ymm1[3],ymm0[6],ymm1[6],ymm0[7],ymm1[7] sched: [1:1.00]
-; HASWELL-NEXT: vunpckhps {{.*#+}} ymm0 = ymm0[2],mem[2],ymm0[3],mem[3],ymm0[6],mem[6],ymm0[7],mem[7] sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vunpckhps {{.*#+}} ymm0 = ymm0[2],mem[2],ymm0[3],mem[3],ymm0[6],mem[6],ymm0[7],mem[7] sched: [8:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_unpckhps:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_unpcklpd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vunpcklpd {{.*#+}} ymm0 = ymm0[0],ymm1[0],ymm0[2],ymm1[2] sched: [1:1.00]
-; HASWELL-NEXT: vunpcklpd {{.*#+}} ymm1 = ymm1[0],mem[0],ymm1[2],mem[2] sched: [1:1.00]
+; HASWELL-NEXT: vunpcklpd {{.*#+}} ymm1 = ymm1[0],mem[0],ymm1[2],mem[2] sched: [8:1.00]
; HASWELL-NEXT: vaddpd %ymm1, %ymm0, %ymm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_unpcklpd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_unpcklps:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vunpcklps {{.*#+}} ymm0 = ymm0[0],ymm1[0],ymm0[1],ymm1[1],ymm0[4],ymm1[4],ymm0[5],ymm1[5] sched: [1:1.00]
-; HASWELL-NEXT: vunpcklps {{.*#+}} ymm0 = ymm0[0],mem[0],ymm0[1],mem[1],ymm0[4],mem[4],ymm0[5],mem[5] sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vunpcklps {{.*#+}} ymm0 = ymm0[0],mem[0],ymm0[1],mem[1],ymm0[4],mem[4],ymm0[5],mem[5] sched: [8:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_unpcklps:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_xorpd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vxorpd %ymm1, %ymm0, %ymm0 # sched: [1:1.00]
-; HASWELL-NEXT: vxorpd (%rdi), %ymm0, %ymm0 # sched: [1:1.00]
+; HASWELL-NEXT: vxorpd (%rdi), %ymm0, %ymm0 # sched: [8:1.00]
; HASWELL-NEXT: vaddpd %ymm0, %ymm1, %ymm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_xorpd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_xorps:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vxorps %ymm1, %ymm0, %ymm0 # sched: [1:1.00]
-; HASWELL-NEXT: vxorps (%rdi), %ymm0, %ymm0 # sched: [1:1.00]
+; HASWELL-NEXT: vxorps (%rdi), %ymm0, %ymm0 # sched: [8:1.00]
; HASWELL-NEXT: vaddps %ymm0, %ymm1, %ymm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_xorps:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_zeroall:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vzeroall # sched: [16:16.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_zeroall:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_zeroupper:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vzeroupper # sched: [4:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_zeroupper:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_broadcasti128:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: vbroadcasti128 {{.*#+}} ymm1 = mem[0,1,0,1] sched: [1:0.50]
+; HASWELL-NEXT: vbroadcasti128 {{.*#+}} ymm1 = mem[0,1,0,1] sched: [7:0.50]
; HASWELL-NEXT: vpaddd %ymm0, %ymm1, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_broadcasti128:
; BROADWELL: # %bb.0:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vbroadcastsd %xmm0, %ymm0 # sched: [3:1.00]
; HASWELL-NEXT: vaddpd %ymm0, %ymm0, %ymm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_broadcastsd_ymm:
; BROADWELL: # %bb.0:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vbroadcastss %xmm0, %xmm0 # sched: [1:1.00]
; HASWELL-NEXT: vaddps %xmm0, %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_broadcastss:
; BROADWELL: # %bb.0:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vbroadcastss %xmm0, %ymm0 # sched: [3:1.00]
; HASWELL-NEXT: vaddps %ymm0, %ymm0, %ymm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_broadcastss_ymm:
; BROADWELL: # %bb.0:
; HASWELL-NEXT: vextracti128 $1, %ymm0, %xmm0 # sched: [3:1.00]
; HASWELL-NEXT: vextracti128 $1, %ymm2, (%rdi) # sched: [1:1.00]
; HASWELL-NEXT: vzeroupper # sched: [4:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_extracti128:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_gatherdpd:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: vgatherdpd %xmm2, (%rdi,%xmm1,2), %xmm0 # sched: [1:?]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vgatherdpd %xmm2, (%rdi,%xmm1,2), %xmm0 # sched: [26:2.67]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_gatherdpd:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_gatherdpd_ymm:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: vgatherdpd %ymm2, (%rdi,%xmm1,8), %ymm0 # sched: [1:?]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vgatherdpd %ymm2, (%rdi,%xmm1,8), %ymm0 # sched: [27:4.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_gatherdpd_ymm:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_gatherdps:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: vgatherdps %xmm2, (%rdi,%xmm1,2), %xmm0 # sched: [1:?]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vgatherdps %xmm2, (%rdi,%xmm1,2), %xmm0 # sched: [25:3.67]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_gatherdps:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_gatherdps_ymm:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: vgatherdps %ymm2, (%rdi,%ymm1,4), %ymm0 # sched: [1:?]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vgatherdps %ymm2, (%rdi,%ymm1,4), %ymm0 # sched: [27:6.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_gatherdps_ymm:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_gatherqpd:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: vgatherqpd %xmm2, (%rdi,%xmm1,2), %xmm0 # sched: [1:?]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vgatherqpd %xmm2, (%rdi,%xmm1,2), %xmm0 # sched: [23:3.33]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_gatherqpd:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_gatherqpd_ymm:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: vgatherqpd %ymm2, (%rdi,%ymm1,8), %ymm0 # sched: [1:?]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vgatherqpd %ymm2, (%rdi,%ymm1,8), %ymm0 # sched: [24:5.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_gatherqpd_ymm:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_gatherqps:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: vgatherqps %xmm2, (%rdi,%xmm1,2), %xmm0 # sched: [1:?]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vgatherqps %xmm2, (%rdi,%xmm1,2), %xmm0 # sched: [25:3.67]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_gatherqps:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_gatherqps_ymm:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: vgatherqps %xmm2, (%rdi,%ymm1,4), %xmm0 # sched: [1:?]
+; HASWELL-NEXT: vgatherqps %xmm2, (%rdi,%ymm1,4), %xmm0 # sched: [28:3.67]
; HASWELL-NEXT: vzeroupper # sched: [4:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_gatherqps_ymm:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_inserti128:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vinserti128 $1, %xmm1, %ymm0, %ymm1 # sched: [3:1.00]
-; HASWELL-NEXT: vinserti128 $1, (%rdi), %ymm0, %ymm0 # sched: [1:0.50]
+; HASWELL-NEXT: vinserti128 $1, (%rdi), %ymm0, %ymm0 # sched: [7:0.50]
; HASWELL-NEXT: vpaddd %ymm0, %ymm1, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_inserti128:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_movntdqa:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: vmovntdqa (%rdi), %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vmovntdqa (%rdi), %ymm0 # sched: [7:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_movntdqa:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_mpsadbw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vmpsadbw $7, %ymm1, %ymm0, %ymm0 # sched: [7:2.00]
-; HASWELL-NEXT: vmpsadbw $7, (%rdi), %ymm0, %ymm0 # sched: [7:2.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vmpsadbw $7, (%rdi), %ymm0, %ymm0 # sched: [14:2.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_mpsadbw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pabsb:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpabsb %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpabsb (%rdi), %ymm1 # sched: [1:0.50]
+; HASWELL-NEXT: vpabsb (%rdi), %ymm1 # sched: [8:0.50]
; HASWELL-NEXT: vpor %ymm1, %ymm0, %ymm0 # sched: [1:0.33]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pabsb:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pabsd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpabsd %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpabsd (%rdi), %ymm1 # sched: [1:0.50]
+; HASWELL-NEXT: vpabsd (%rdi), %ymm1 # sched: [8:0.50]
; HASWELL-NEXT: vpor %ymm1, %ymm0, %ymm0 # sched: [1:0.33]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pabsd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pabsw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpabsw %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpabsw (%rdi), %ymm1 # sched: [1:0.50]
+; HASWELL-NEXT: vpabsw (%rdi), %ymm1 # sched: [8:0.50]
; HASWELL-NEXT: vpor %ymm1, %ymm0, %ymm0 # sched: [1:0.33]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pabsw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_packssdw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpackssdw %ymm1, %ymm0, %ymm0 # sched: [1:1.00]
-; HASWELL-NEXT: vpackssdw (%rdi), %ymm0, %ymm0 # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpackssdw (%rdi), %ymm0, %ymm0 # sched: [8:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_packssdw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_packsswb:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpacksswb %ymm1, %ymm0, %ymm0 # sched: [1:1.00]
-; HASWELL-NEXT: vpacksswb (%rdi), %ymm0, %ymm0 # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpacksswb (%rdi), %ymm0, %ymm0 # sched: [8:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_packsswb:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_packusdw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpackusdw %ymm1, %ymm0, %ymm0 # sched: [1:1.00]
-; HASWELL-NEXT: vpackusdw (%rdi), %ymm0, %ymm0 # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpackusdw (%rdi), %ymm0, %ymm0 # sched: [8:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_packusdw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_packuswb:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpackuswb %ymm1, %ymm0, %ymm0 # sched: [1:1.00]
-; HASWELL-NEXT: vpackuswb (%rdi), %ymm0, %ymm0 # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpackuswb (%rdi), %ymm0, %ymm0 # sched: [8:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_packuswb:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_paddb:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpaddb %ymm1, %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpaddb (%rdi), %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpaddb (%rdi), %ymm0, %ymm0 # sched: [8:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_paddb:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_paddd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpaddd %ymm1, %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpaddd (%rdi), %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpaddd (%rdi), %ymm0, %ymm0 # sched: [8:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_paddd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_paddq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpaddq %ymm1, %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpaddq (%rdi), %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpaddq (%rdi), %ymm0, %ymm0 # sched: [8:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_paddq:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_paddsb:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpaddsb %ymm1, %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpaddsb (%rdi), %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpaddsb (%rdi), %ymm0, %ymm0 # sched: [8:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_paddsb:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_paddsw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpaddsw %ymm1, %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpaddsw (%rdi), %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpaddsw (%rdi), %ymm0, %ymm0 # sched: [8:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_paddsw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_paddusb:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpaddusb %ymm1, %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpaddusb (%rdi), %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpaddusb (%rdi), %ymm0, %ymm0 # sched: [8:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_paddusb:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_paddusw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpaddusw %ymm1, %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpaddusw (%rdi), %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpaddusw (%rdi), %ymm0, %ymm0 # sched: [8:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_paddusw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_paddw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpaddw %ymm1, %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpaddw (%rdi), %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpaddw (%rdi), %ymm0, %ymm0 # sched: [8:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_paddw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_palignr:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpalignr {{.*#+}} ymm0 = ymm1[1,2,3,4,5,6,7,8,9,10,11,12,13,14,15],ymm0[0],ymm1[17,18,19,20,21,22,23,24,25,26,27,28,29,30,31],ymm0[16] sched: [1:1.00]
-; HASWELL-NEXT: vpalignr {{.*#+}} ymm0 = mem[1,2,3,4,5,6,7,8,9,10,11,12,13,14,15],ymm0[0],mem[17,18,19,20,21,22,23,24,25,26,27,28,29,30,31],ymm0[16] sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpalignr {{.*#+}} ymm0 = mem[1,2,3,4,5,6,7,8,9,10,11,12,13,14,15],ymm0[0],mem[17,18,19,20,21,22,23,24,25,26,27,28,29,30,31],ymm0[16] sched: [8:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_palignr:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pand:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpand %ymm1, %ymm0, %ymm0 # sched: [1:0.33]
-; HASWELL-NEXT: vpand (%rdi), %ymm0, %ymm0 # sched: [1:0.50]
+; HASWELL-NEXT: vpand (%rdi), %ymm0, %ymm0 # sched: [8:0.50]
; HASWELL-NEXT: vpaddq %ymm1, %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pand:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pandn:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpandn %ymm1, %ymm0, %ymm0 # sched: [1:0.33]
-; HASWELL-NEXT: vpandn (%rdi), %ymm0, %ymm1 # sched: [1:0.50]
+; HASWELL-NEXT: vpandn (%rdi), %ymm0, %ymm1 # sched: [8:0.50]
; HASWELL-NEXT: vpaddq %ymm1, %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pandn:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pavgb:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpavgb %ymm1, %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpavgb (%rdi), %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpavgb (%rdi), %ymm0, %ymm0 # sched: [8:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pavgb:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pavgw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpavgw %ymm1, %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpavgw (%rdi), %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpavgw (%rdi), %ymm0, %ymm0 # sched: [8:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pavgw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pblendd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpblendd {{.*#+}} xmm1 = xmm1[0,1,2],xmm0[3] sched: [1:0.33]
-; HASWELL-NEXT: vpblendd {{.*#+}} xmm1 = mem[0],xmm1[1],mem[2],xmm1[3] sched: [1:0.50]
+; HASWELL-NEXT: vpblendd {{.*#+}} xmm1 = mem[0],xmm1[1],mem[2],xmm1[3] sched: [7:0.50]
; HASWELL-NEXT: vpaddd %xmm1, %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pblendd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pblendd_ymm:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpblendd {{.*#+}} ymm1 = ymm1[0,1,2],ymm0[3,4,5,6],ymm1[7] sched: [1:0.33]
-; HASWELL-NEXT: vpblendd {{.*#+}} ymm1 = ymm1[0],mem[1,2],ymm1[3,4,5,6,7] sched: [1:0.50]
+; HASWELL-NEXT: vpblendd {{.*#+}} ymm1 = ymm1[0],mem[1,2],ymm1[3,4,5,6,7] sched: [8:0.50]
; HASWELL-NEXT: vpaddd %ymm1, %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pblendd_ymm:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pblendvb:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpblendvb %ymm2, %ymm1, %ymm0, %ymm0 # sched: [2:2.00]
-; HASWELL-NEXT: vpblendvb %ymm3, (%rdi), %ymm0, %ymm0 # sched: [2:2.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpblendvb %ymm3, (%rdi), %ymm0, %ymm0 # sched: [9:2.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pblendvb:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pblendw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpblendw {{.*#+}} ymm0 = ymm0[0,1],ymm1[2,3,4],ymm0[5,6,7,8,9],ymm1[10,11,12],ymm0[13,14,15] sched: [1:1.00]
-; HASWELL-NEXT: vpblendw {{.*#+}} ymm0 = mem[0],ymm0[1],mem[2],ymm0[3],mem[4],ymm0[5],mem[6],ymm0[7],mem[8],ymm0[9],mem[10],ymm0[11],mem[12],ymm0[13],mem[14],ymm0[15] sched: [4:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpblendw {{.*#+}} ymm0 = mem[0],ymm0[1],mem[2],ymm0[3],mem[4],ymm0[5],mem[6],ymm0[7],mem[8],ymm0[9],mem[10],ymm0[11],mem[12],ymm0[13],mem[14],ymm0[15] sched: [8:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pblendw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pbroadcastb:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpbroadcastb %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: vpbroadcastb (%rdi), %xmm1 # sched: [4:1.00]
+; HASWELL-NEXT: vpbroadcastb (%rdi), %xmm1 # sched: [9:1.00]
; HASWELL-NEXT: vpaddb %xmm1, %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pbroadcastb:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pbroadcastb_ymm:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpbroadcastb %xmm0, %ymm0 # sched: [3:1.00]
-; HASWELL-NEXT: vpbroadcastb (%rdi), %ymm1 # sched: [4:1.00]
+; HASWELL-NEXT: vpbroadcastb (%rdi), %ymm1 # sched: [9:1.00]
; HASWELL-NEXT: vpaddb %ymm1, %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pbroadcastb_ymm:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pbroadcastd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpbroadcastd %xmm0, %xmm0 # sched: [1:1.00]
-; HASWELL-NEXT: vpbroadcastd (%rdi), %xmm1 # sched: [1:0.50]
+; HASWELL-NEXT: vpbroadcastd (%rdi), %xmm1 # sched: [6:0.50]
; HASWELL-NEXT: vpaddd %xmm1, %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pbroadcastd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pbroadcastd_ymm:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpbroadcastd %xmm0, %ymm0 # sched: [3:1.00]
-; HASWELL-NEXT: vpbroadcastd (%rdi), %ymm1 # sched: [1:0.50]
+; HASWELL-NEXT: vpbroadcastd (%rdi), %ymm1 # sched: [7:0.50]
; HASWELL-NEXT: vpaddd %ymm1, %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pbroadcastd_ymm:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pbroadcastq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpbroadcastq %xmm0, %xmm0 # sched: [1:1.00]
-; HASWELL-NEXT: vpbroadcastq (%rdi), %xmm1 # sched: [1:0.50]
+; HASWELL-NEXT: vpbroadcastq (%rdi), %xmm1 # sched: [6:0.50]
; HASWELL-NEXT: vpaddq %xmm1, %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pbroadcastq:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pbroadcastq_ymm:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpbroadcastq %xmm0, %ymm0 # sched: [3:1.00]
-; HASWELL-NEXT: vpbroadcastq (%rdi), %ymm1 # sched: [1:0.50]
+; HASWELL-NEXT: vpbroadcastq (%rdi), %ymm1 # sched: [7:0.50]
; HASWELL-NEXT: vpaddq %ymm1, %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pbroadcastq_ymm:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pbroadcastw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpbroadcastw %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: vpbroadcastw (%rdi), %xmm1 # sched: [4:1.00]
+; HASWELL-NEXT: vpbroadcastw (%rdi), %xmm1 # sched: [9:1.00]
; HASWELL-NEXT: vpaddw %xmm1, %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pbroadcastw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pbroadcastw_ymm:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpbroadcastw %xmm0, %ymm0 # sched: [3:1.00]
-; HASWELL-NEXT: vpbroadcastw (%rdi), %ymm1 # sched: [4:1.00]
+; HASWELL-NEXT: vpbroadcastw (%rdi), %ymm1 # sched: [9:1.00]
; HASWELL-NEXT: vpaddw %ymm1, %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pbroadcastw_ymm:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pcmpeqb:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpcmpeqb %ymm1, %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpcmpeqb (%rdi), %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpcmpeqb (%rdi), %ymm0, %ymm0 # sched: [8:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pcmpeqb:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pcmpeqd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpcmpeqd %ymm1, %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpcmpeqd (%rdi), %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpcmpeqd (%rdi), %ymm0, %ymm0 # sched: [8:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pcmpeqd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pcmpeqq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpcmpeqq %ymm1, %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpcmpeqq (%rdi), %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpcmpeqq (%rdi), %ymm0, %ymm0 # sched: [8:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pcmpeqq:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pcmpeqw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpcmpeqw %ymm1, %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpcmpeqw (%rdi), %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpcmpeqw (%rdi), %ymm0, %ymm0 # sched: [8:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pcmpeqw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pcmpgtb:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpcmpgtb %ymm1, %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpcmpgtb (%rdi), %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpcmpgtb (%rdi), %ymm0, %ymm0 # sched: [8:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pcmpgtb:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pcmpgtd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpcmpgtd %ymm1, %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpcmpgtd (%rdi), %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpcmpgtd (%rdi), %ymm0, %ymm0 # sched: [8:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pcmpgtd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pcmpgtq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpcmpgtq %ymm1, %ymm0, %ymm0 # sched: [5:1.00]
-; HASWELL-NEXT: vpcmpgtq (%rdi), %ymm0, %ymm0 # sched: [5:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpcmpgtq (%rdi), %ymm0, %ymm0 # sched: [12:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pcmpgtq:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pcmpgtw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpcmpgtw %ymm1, %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpcmpgtw (%rdi), %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpcmpgtw (%rdi), %ymm0, %ymm0 # sched: [8:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pcmpgtw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_perm2i128:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vperm2i128 {{.*#+}} ymm1 = ymm0[2,3],ymm1[0,1] sched: [3:1.00]
-; HASWELL-NEXT: vperm2i128 {{.*#+}} ymm0 = ymm0[2,3],mem[0,1] sched: [3:1.00]
+; HASWELL-NEXT: vperm2i128 {{.*#+}} ymm0 = ymm0[2,3],mem[0,1] sched: [10:1.00]
; HASWELL-NEXT: vpaddq %ymm0, %ymm1, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_perm2i128:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_permd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpermd %ymm1, %ymm0, %ymm1 # sched: [3:1.00]
-; HASWELL-NEXT: vpermd (%rdi), %ymm0, %ymm0 # sched: [3:1.00]
+; HASWELL-NEXT: vpermd (%rdi), %ymm0, %ymm0 # sched: [10:1.00]
; HASWELL-NEXT: vpaddd %ymm0, %ymm1, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_permd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_permpd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpermpd {{.*#+}} ymm0 = ymm0[3,2,2,3] sched: [3:1.00]
-; HASWELL-NEXT: vpermpd {{.*#+}} ymm1 = mem[0,2,2,3] sched: [3:1.00]
+; HASWELL-NEXT: vpermpd {{.*#+}} ymm1 = mem[0,2,2,3] sched: [10:1.00]
; HASWELL-NEXT: vaddpd %ymm1, %ymm0, %ymm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_permpd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_permps:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpermps %ymm1, %ymm0, %ymm1 # sched: [3:1.00]
-; HASWELL-NEXT: vpermps (%rdi), %ymm0, %ymm0 # sched: [3:1.00]
+; HASWELL-NEXT: vpermps (%rdi), %ymm0, %ymm0 # sched: [10:1.00]
; HASWELL-NEXT: vaddps %ymm0, %ymm1, %ymm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_permps:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_permq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpermq {{.*#+}} ymm0 = ymm0[3,2,2,3] sched: [3:1.00]
-; HASWELL-NEXT: vpermq {{.*#+}} ymm1 = mem[0,2,2,3] sched: [3:1.00]
+; HASWELL-NEXT: vpermq {{.*#+}} ymm1 = mem[0,2,2,3] sched: [10:1.00]
; HASWELL-NEXT: vpaddq %ymm1, %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_permq:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_pgatherdd:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: vpgatherdd %xmm2, (%rdi,%xmm1,2), %xmm0 # sched: [1:?]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpgatherdd %xmm2, (%rdi,%xmm1,2), %xmm0 # sched: [26:2.67]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pgatherdd:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_pgatherdd_ymm:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: vpgatherdd %ymm2, (%rdi,%ymm1,2), %ymm0 # sched: [1:?]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpgatherdd %ymm2, (%rdi,%ymm1,2), %ymm0 # sched: [27:6.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pgatherdd_ymm:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_pgatherdq:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: vpgatherdq %xmm2, (%rdi,%xmm1,2), %xmm0 # sched: [1:?]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpgatherdq %xmm2, (%rdi,%xmm1,2), %xmm0 # sched: [26:2.67]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pgatherdq:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_pgatherdq_ymm:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: vpgatherdq %ymm2, (%rdi,%xmm1,2), %ymm0 # sched: [1:?]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpgatherdq %ymm2, (%rdi,%xmm1,2), %ymm0 # sched: [27:4.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pgatherdq_ymm:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_pgatherqd:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: vpgatherqd %xmm2, (%rdi,%xmm1,2), %xmm0 # sched: [1:?]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpgatherqd %xmm2, (%rdi,%xmm1,2), %xmm0 # sched: [25:5.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pgatherqd:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_pgatherqd_ymm:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: vpgatherqd %xmm2, (%rdi,%ymm1,2), %xmm0 # sched: [1:?]
+; HASWELL-NEXT: vpgatherqd %xmm2, (%rdi,%ymm1,2), %xmm0 # sched: [28:5.00]
; HASWELL-NEXT: vzeroupper # sched: [4:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pgatherqd_ymm:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_pgatherqq:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: vpgatherqq %xmm2, (%rdi,%xmm1,2), %xmm0 # sched: [1:?]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpgatherqq %xmm2, (%rdi,%xmm1,2), %xmm0 # sched: [23:3.33]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pgatherqq:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_pgatherqq_ymm:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: vpgatherqq %ymm2, (%rdi,%ymm1,2), %ymm0 # sched: [1:?]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpgatherqq %ymm2, (%rdi,%ymm1,2), %ymm0 # sched: [24:5.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pgatherqq_ymm:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_phaddd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vphaddd %ymm1, %ymm0, %ymm0 # sched: [3:2.00]
-; HASWELL-NEXT: vphaddd (%rdi), %ymm0, %ymm0 # sched: [3:2.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vphaddd (%rdi), %ymm0, %ymm0 # sched: [10:2.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_phaddd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_phaddsw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vphaddsw %ymm1, %ymm0, %ymm0 # sched: [3:2.00]
-; HASWELL-NEXT: vphaddsw (%rdi), %ymm0, %ymm0 # sched: [3:2.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vphaddsw (%rdi), %ymm0, %ymm0 # sched: [10:2.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_phaddsw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_phaddw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vphaddw %ymm1, %ymm0, %ymm0 # sched: [3:2.00]
-; HASWELL-NEXT: vphaddw (%rdi), %ymm0, %ymm0 # sched: [3:2.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vphaddw (%rdi), %ymm0, %ymm0 # sched: [10:2.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_phaddw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_phsubd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vphsubd %ymm1, %ymm0, %ymm0 # sched: [3:2.00]
-; HASWELL-NEXT: vphsubd (%rdi), %ymm0, %ymm0 # sched: [3:2.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vphsubd (%rdi), %ymm0, %ymm0 # sched: [10:2.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_phsubd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_phsubsw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vphsubsw %ymm1, %ymm0, %ymm0 # sched: [3:2.00]
-; HASWELL-NEXT: vphsubsw (%rdi), %ymm0, %ymm0 # sched: [3:2.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vphsubsw (%rdi), %ymm0, %ymm0 # sched: [10:2.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_phsubsw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_phsubw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vphsubw %ymm1, %ymm0, %ymm0 # sched: [3:2.00]
-; HASWELL-NEXT: vphsubw (%rdi), %ymm0, %ymm0 # sched: [3:2.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vphsubw (%rdi), %ymm0, %ymm0 # sched: [10:2.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_phsubw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pmaddubsw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpmaddubsw %ymm1, %ymm0, %ymm0 # sched: [5:1.00]
-; HASWELL-NEXT: vpmaddubsw (%rdi), %ymm0, %ymm0 # sched: [5:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpmaddubsw (%rdi), %ymm0, %ymm0 # sched: [12:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmaddubsw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pmaddwd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpmaddwd %ymm1, %ymm0, %ymm0 # sched: [5:1.00]
-; HASWELL-NEXT: vpmaddwd (%rdi), %ymm0, %ymm0 # sched: [5:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpmaddwd (%rdi), %ymm0, %ymm0 # sched: [12:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmaddwd:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_pmaskmovd:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: vpmaskmovd (%rdi), %xmm0, %xmm2 # sched: [2:2.00]
-; HASWELL-NEXT: vpmaskmovd %xmm1, %xmm0, (%rdi) # sched: [4:1.00]
+; HASWELL-NEXT: vpmaskmovd (%rdi), %xmm0, %xmm2 # sched: [8:2.00]
+; HASWELL-NEXT: vpmaskmovd %xmm1, %xmm0, (%rdi) # sched: [5:1.00]
; HASWELL-NEXT: vmovdqa %xmm2, %xmm0 # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmaskmovd:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_pmaskmovd_ymm:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: vpmaskmovd (%rdi), %ymm0, %ymm2 # sched: [2:2.00]
-; HASWELL-NEXT: vpmaskmovd %ymm1, %ymm0, (%rdi) # sched: [4:1.00]
+; HASWELL-NEXT: vpmaskmovd (%rdi), %ymm0, %ymm2 # sched: [9:2.00]
+; HASWELL-NEXT: vpmaskmovd %ymm1, %ymm0, (%rdi) # sched: [5:1.00]
; HASWELL-NEXT: vmovdqa %ymm2, %ymm0 # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmaskmovd_ymm:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_pmaskmovq:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: vpmaskmovq (%rdi), %xmm0, %xmm2 # sched: [2:2.00]
-; HASWELL-NEXT: vpmaskmovq %xmm1, %xmm0, (%rdi) # sched: [4:1.00]
+; HASWELL-NEXT: vpmaskmovq (%rdi), %xmm0, %xmm2 # sched: [8:2.00]
+; HASWELL-NEXT: vpmaskmovq %xmm1, %xmm0, (%rdi) # sched: [5:1.00]
; HASWELL-NEXT: vmovdqa %xmm2, %xmm0 # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmaskmovq:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_pmaskmovq_ymm:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: vpmaskmovq (%rdi), %ymm0, %ymm2 # sched: [2:2.00]
-; HASWELL-NEXT: vpmaskmovq %ymm1, %ymm0, (%rdi) # sched: [4:1.00]
+; HASWELL-NEXT: vpmaskmovq (%rdi), %ymm0, %ymm2 # sched: [9:2.00]
+; HASWELL-NEXT: vpmaskmovq %ymm1, %ymm0, (%rdi) # sched: [5:1.00]
; HASWELL-NEXT: vmovdqa %ymm2, %ymm0 # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmaskmovq_ymm:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pmaxsb:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpmaxsb %ymm1, %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpmaxsb (%rdi), %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpmaxsb (%rdi), %ymm0, %ymm0 # sched: [8:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmaxsb:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pmaxsd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpmaxsd %ymm1, %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpmaxsd (%rdi), %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpmaxsd (%rdi), %ymm0, %ymm0 # sched: [8:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmaxsd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pmaxsw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpmaxsw %ymm1, %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpmaxsw (%rdi), %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpmaxsw (%rdi), %ymm0, %ymm0 # sched: [8:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmaxsw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pmaxub:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpmaxub %ymm1, %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpmaxub (%rdi), %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpmaxub (%rdi), %ymm0, %ymm0 # sched: [8:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmaxub:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pmaxud:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpmaxud %ymm1, %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpmaxud (%rdi), %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpmaxud (%rdi), %ymm0, %ymm0 # sched: [8:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmaxud:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pmaxuw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpmaxuw %ymm1, %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpmaxuw (%rdi), %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpmaxuw (%rdi), %ymm0, %ymm0 # sched: [8:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmaxuw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pminsb:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpminsb %ymm1, %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpminsb (%rdi), %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpminsb (%rdi), %ymm0, %ymm0 # sched: [8:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pminsb:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pminsd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpminsd %ymm1, %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpminsd (%rdi), %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpminsd (%rdi), %ymm0, %ymm0 # sched: [8:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pminsd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pminsw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpminsw %ymm1, %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpminsw (%rdi), %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpminsw (%rdi), %ymm0, %ymm0 # sched: [8:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pminsw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pminub:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpminub %ymm1, %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpminub (%rdi), %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpminub (%rdi), %ymm0, %ymm0 # sched: [8:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pminub:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pminud:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpminud %ymm1, %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpminud (%rdi), %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpminud (%rdi), %ymm0, %ymm0 # sched: [8:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pminud:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pminuw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpminuw %ymm1, %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpminuw (%rdi), %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpminuw (%rdi), %ymm0, %ymm0 # sched: [8:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pminuw:
; BROADWELL: # %bb.0:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpmovmskb %ymm0, %eax # sched: [3:1.00]
; HASWELL-NEXT: vzeroupper # sched: [4:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmovmskb:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pmovsxbd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpmovsxbd %xmm0, %ymm0 # sched: [3:1.00]
-; HASWELL-NEXT: vpmovsxbd (%rdi), %ymm1 # sched: [3:1.00]
+; HASWELL-NEXT: vpmovsxbd (%rdi), %ymm1 # sched: [8:1.00]
; HASWELL-NEXT: vpaddd %ymm1, %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmovsxbd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pmovsxbq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpmovsxbq %xmm0, %ymm0 # sched: [3:1.00]
-; HASWELL-NEXT: vpmovsxbq (%rdi), %ymm1 # sched: [3:1.00]
+; HASWELL-NEXT: vpmovsxbq (%rdi), %ymm1 # sched: [8:1.00]
; HASWELL-NEXT: vpaddq %ymm1, %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmovsxbq:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pmovsxbw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpmovsxbw %xmm0, %ymm0 # sched: [3:1.00]
-; HASWELL-NEXT: vpmovsxbw (%rdi), %ymm1 # sched: [3:1.00]
+; HASWELL-NEXT: vpmovsxbw (%rdi), %ymm1 # sched: [9:1.00]
; HASWELL-NEXT: vpaddw %ymm1, %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmovsxbw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pmovsxdq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpmovsxdq %xmm0, %ymm0 # sched: [3:1.00]
-; HASWELL-NEXT: vpmovsxdq (%rdi), %ymm1 # sched: [3:1.00]
+; HASWELL-NEXT: vpmovsxdq (%rdi), %ymm1 # sched: [9:1.00]
; HASWELL-NEXT: vpaddq %ymm1, %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmovsxdq:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pmovsxwd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpmovsxwd %xmm0, %ymm0 # sched: [3:1.00]
-; HASWELL-NEXT: vpmovsxwd (%rdi), %ymm1 # sched: [3:1.00]
+; HASWELL-NEXT: vpmovsxwd (%rdi), %ymm1 # sched: [9:1.00]
; HASWELL-NEXT: vpaddd %ymm1, %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmovsxwd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pmovsxwq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpmovsxwq %xmm0, %ymm0 # sched: [3:1.00]
-; HASWELL-NEXT: vpmovsxwq (%rdi), %ymm1 # sched: [3:1.00]
+; HASWELL-NEXT: vpmovsxwq (%rdi), %ymm1 # sched: [8:1.00]
; HASWELL-NEXT: vpaddq %ymm1, %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmovsxwq:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pmovzxbd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpmovzxbd {{.*#+}} ymm0 = xmm0[0],zero,zero,zero,xmm0[1],zero,zero,zero,xmm0[2],zero,zero,zero,xmm0[3],zero,zero,zero,xmm0[4],zero,zero,zero,xmm0[5],zero,zero,zero,xmm0[6],zero,zero,zero,xmm0[7],zero,zero,zero sched: [3:1.00]
-; HASWELL-NEXT: vpmovzxbd {{.*#+}} ymm1 = mem[0],zero,zero,zero,mem[1],zero,zero,zero,mem[2],zero,zero,zero,mem[3],zero,zero,zero,mem[4],zero,zero,zero,mem[5],zero,zero,zero,mem[6],zero,zero,zero,mem[7],zero,zero,zero sched: [3:1.00]
+; HASWELL-NEXT: vpmovzxbd {{.*#+}} ymm1 = mem[0],zero,zero,zero,mem[1],zero,zero,zero,mem[2],zero,zero,zero,mem[3],zero,zero,zero,mem[4],zero,zero,zero,mem[5],zero,zero,zero,mem[6],zero,zero,zero,mem[7],zero,zero,zero sched: [10:1.00]
; HASWELL-NEXT: vpaddd %ymm1, %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmovzxbd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pmovzxbq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpmovzxbq {{.*#+}} ymm0 = xmm0[0],zero,zero,zero,zero,zero,zero,zero,xmm0[1],zero,zero,zero,zero,zero,zero,zero,xmm0[2],zero,zero,zero,zero,zero,zero,zero,xmm0[3],zero,zero,zero,zero,zero,zero,zero sched: [3:1.00]
-; HASWELL-NEXT: vpmovzxbq {{.*#+}} ymm1 = mem[0],zero,zero,zero,zero,zero,zero,zero,mem[1],zero,zero,zero,zero,zero,zero,zero,mem[2],zero,zero,zero,zero,zero,zero,zero,mem[3],zero,zero,zero,zero,zero,zero,zero sched: [3:1.00]
+; HASWELL-NEXT: vpmovzxbq {{.*#+}} ymm1 = mem[0],zero,zero,zero,zero,zero,zero,zero,mem[1],zero,zero,zero,zero,zero,zero,zero,mem[2],zero,zero,zero,zero,zero,zero,zero,mem[3],zero,zero,zero,zero,zero,zero,zero sched: [10:1.00]
; HASWELL-NEXT: vpaddq %ymm1, %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmovzxbq:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pmovzxbw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpmovzxbw {{.*#+}} ymm0 = xmm0[0],zero,xmm0[1],zero,xmm0[2],zero,xmm0[3],zero,xmm0[4],zero,xmm0[5],zero,xmm0[6],zero,xmm0[7],zero,xmm0[8],zero,xmm0[9],zero,xmm0[10],zero,xmm0[11],zero,xmm0[12],zero,xmm0[13],zero,xmm0[14],zero,xmm0[15],zero sched: [3:1.00]
-; HASWELL-NEXT: vpmovzxbw {{.*#+}} ymm1 = mem[0],zero,mem[1],zero,mem[2],zero,mem[3],zero,mem[4],zero,mem[5],zero,mem[6],zero,mem[7],zero,mem[8],zero,mem[9],zero,mem[10],zero,mem[11],zero,mem[12],zero,mem[13],zero,mem[14],zero,mem[15],zero sched: [3:1.00]
+; HASWELL-NEXT: vpmovzxbw {{.*#+}} ymm1 = mem[0],zero,mem[1],zero,mem[2],zero,mem[3],zero,mem[4],zero,mem[5],zero,mem[6],zero,mem[7],zero,mem[8],zero,mem[9],zero,mem[10],zero,mem[11],zero,mem[12],zero,mem[13],zero,mem[14],zero,mem[15],zero sched: [10:1.00]
; HASWELL-NEXT: vpaddw %ymm1, %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmovzxbw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pmovzxdq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpmovzxdq {{.*#+}} ymm0 = xmm0[0],zero,xmm0[1],zero,xmm0[2],zero,xmm0[3],zero sched: [3:1.00]
-; HASWELL-NEXT: vpmovzxdq {{.*#+}} ymm1 = mem[0],zero,mem[1],zero,mem[2],zero,mem[3],zero sched: [3:1.00]
+; HASWELL-NEXT: vpmovzxdq {{.*#+}} ymm1 = mem[0],zero,mem[1],zero,mem[2],zero,mem[3],zero sched: [10:1.00]
; HASWELL-NEXT: vpaddq %ymm1, %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmovzxdq:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pmovzxwd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpmovzxwd {{.*#+}} ymm0 = xmm0[0],zero,xmm0[1],zero,xmm0[2],zero,xmm0[3],zero,xmm0[4],zero,xmm0[5],zero,xmm0[6],zero,xmm0[7],zero sched: [3:1.00]
-; HASWELL-NEXT: vpmovzxwd {{.*#+}} ymm1 = mem[0],zero,mem[1],zero,mem[2],zero,mem[3],zero,mem[4],zero,mem[5],zero,mem[6],zero,mem[7],zero sched: [3:1.00]
+; HASWELL-NEXT: vpmovzxwd {{.*#+}} ymm1 = mem[0],zero,mem[1],zero,mem[2],zero,mem[3],zero,mem[4],zero,mem[5],zero,mem[6],zero,mem[7],zero sched: [9:1.00]
; HASWELL-NEXT: vpaddd %ymm1, %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmovzxwd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pmovzxwq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpmovzxwq {{.*#+}} ymm0 = xmm0[0],zero,zero,zero,xmm0[1],zero,zero,zero,xmm0[2],zero,zero,zero,xmm0[3],zero,zero,zero sched: [3:1.00]
-; HASWELL-NEXT: vpmovzxwq {{.*#+}} ymm1 = mem[0],zero,zero,zero,mem[1],zero,zero,zero,mem[2],zero,zero,zero,mem[3],zero,zero,zero sched: [3:1.00]
+; HASWELL-NEXT: vpmovzxwq {{.*#+}} ymm1 = mem[0],zero,zero,zero,mem[1],zero,zero,zero,mem[2],zero,zero,zero,mem[3],zero,zero,zero sched: [10:1.00]
; HASWELL-NEXT: vpaddq %ymm1, %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmovzxwq:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pmuldq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpmuldq %ymm1, %ymm0, %ymm0 # sched: [5:1.00]
-; HASWELL-NEXT: vpmuldq (%rdi), %ymm0, %ymm0 # sched: [5:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpmuldq (%rdi), %ymm0, %ymm0 # sched: [12:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmuldq:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pmulhrsw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpmulhrsw %ymm1, %ymm0, %ymm0 # sched: [5:1.00]
-; HASWELL-NEXT: vpmulhrsw (%rdi), %ymm0, %ymm0 # sched: [5:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpmulhrsw (%rdi), %ymm0, %ymm0 # sched: [12:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmulhrsw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pmulhuw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpmulhuw %ymm1, %ymm0, %ymm0 # sched: [5:1.00]
-; HASWELL-NEXT: vpmulhuw (%rdi), %ymm0, %ymm0 # sched: [5:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpmulhuw (%rdi), %ymm0, %ymm0 # sched: [12:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmulhuw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pmulhw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpmulhw %ymm1, %ymm0, %ymm0 # sched: [5:1.00]
-; HASWELL-NEXT: vpmulhw (%rdi), %ymm0, %ymm0 # sched: [5:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpmulhw (%rdi), %ymm0, %ymm0 # sched: [12:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmulhw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pmulld:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpmulld %ymm1, %ymm0, %ymm0 # sched: [10:2.00]
-; HASWELL-NEXT: vpmulld (%rdi), %ymm0, %ymm0 # sched: [10:2.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpmulld (%rdi), %ymm0, %ymm0 # sched: [17:2.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmulld:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pmullw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpmullw %ymm1, %ymm0, %ymm0 # sched: [5:1.00]
-; HASWELL-NEXT: vpmullw (%rdi), %ymm0, %ymm0 # sched: [5:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpmullw (%rdi), %ymm0, %ymm0 # sched: [12:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmullw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pmuludq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpmuludq %ymm1, %ymm0, %ymm0 # sched: [5:1.00]
-; HASWELL-NEXT: vpmuludq (%rdi), %ymm0, %ymm0 # sched: [5:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpmuludq (%rdi), %ymm0, %ymm0 # sched: [12:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmuludq:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_por:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpor %ymm1, %ymm0, %ymm0 # sched: [1:0.33]
-; HASWELL-NEXT: vpor (%rdi), %ymm0, %ymm0 # sched: [1:0.50]
+; HASWELL-NEXT: vpor (%rdi), %ymm0, %ymm0 # sched: [8:0.50]
; HASWELL-NEXT: vpaddq %ymm1, %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_por:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_psadbw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpsadbw %ymm1, %ymm0, %ymm0 # sched: [5:1.00]
-; HASWELL-NEXT: vpsadbw (%rdi), %ymm0, %ymm0 # sched: [5:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpsadbw (%rdi), %ymm0, %ymm0 # sched: [12:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_psadbw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pshufb:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpshufb %ymm1, %ymm0, %ymm0 # sched: [1:1.00]
-; HASWELL-NEXT: vpshufb (%rdi), %ymm0, %ymm0 # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpshufb (%rdi), %ymm0, %ymm0 # sched: [8:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pshufb:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pshufd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpshufd {{.*#+}} ymm0 = ymm0[3,2,1,0,7,6,5,4] sched: [1:1.00]
-; HASWELL-NEXT: vpshufd {{.*#+}} ymm1 = mem[1,0,3,2,5,4,7,6] sched: [1:1.00]
+; HASWELL-NEXT: vpshufd {{.*#+}} ymm1 = mem[1,0,3,2,5,4,7,6] sched: [8:1.00]
; HASWELL-NEXT: vpaddd %ymm1, %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pshufd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pshufhw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpshufhw {{.*#+}} ymm0 = ymm0[0,1,2,3,7,6,5,4,8,9,10,11,15,14,13,12] sched: [1:1.00]
-; HASWELL-NEXT: vpshufhw {{.*#+}} ymm1 = mem[0,1,2,3,5,4,7,6,8,9,10,11,13,12,15,14] sched: [1:1.00]
+; HASWELL-NEXT: vpshufhw {{.*#+}} ymm1 = mem[0,1,2,3,5,4,7,6,8,9,10,11,13,12,15,14] sched: [8:1.00]
; HASWELL-NEXT: vpor %ymm1, %ymm0, %ymm0 # sched: [1:0.33]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pshufhw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pshuflw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpshuflw {{.*#+}} ymm0 = ymm0[3,2,1,0,4,5,6,7,11,10,9,8,12,13,14,15] sched: [1:1.00]
-; HASWELL-NEXT: vpshuflw {{.*#+}} ymm1 = mem[1,0,3,2,4,5,6,7,9,8,11,10,12,13,14,15] sched: [1:1.00]
+; HASWELL-NEXT: vpshuflw {{.*#+}} ymm1 = mem[1,0,3,2,4,5,6,7,9,8,11,10,12,13,14,15] sched: [8:1.00]
; HASWELL-NEXT: vpor %ymm1, %ymm0, %ymm0 # sched: [1:0.33]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pshuflw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_psignb:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpsignb %ymm1, %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpsignb (%rdi), %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpsignb (%rdi), %ymm0, %ymm0 # sched: [8:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_psignb:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_psignd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpsignd %ymm1, %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpsignd (%rdi), %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpsignd (%rdi), %ymm0, %ymm0 # sched: [8:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_psignd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_psignw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpsignw %ymm1, %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpsignw (%rdi), %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpsignw (%rdi), %ymm0, %ymm0 # sched: [8:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_psignw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pslld:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpslld %xmm1, %ymm0, %ymm0 # sched: [4:1.00]
-; HASWELL-NEXT: vpslld (%rdi), %ymm0, %ymm0 # sched: [1:1.00]
+; HASWELL-NEXT: vpslld (%rdi), %ymm0, %ymm0 # sched: [8:1.00]
; HASWELL-NEXT: vpslld $2, %ymm0, %ymm0 # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pslld:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pslldq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpslldq {{.*#+}} ymm0 = zero,zero,zero,ymm0[0,1,2,3,4,5,6,7,8,9,10,11,12],zero,zero,zero,ymm0[16,17,18,19,20,21,22,23,24,25,26,27,28] sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pslldq:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_psllq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpsllq %xmm1, %ymm0, %ymm0 # sched: [4:1.00]
-; HASWELL-NEXT: vpsllq (%rdi), %ymm0, %ymm0 # sched: [1:1.00]
+; HASWELL-NEXT: vpsllq (%rdi), %ymm0, %ymm0 # sched: [8:1.00]
; HASWELL-NEXT: vpsllq $2, %ymm0, %ymm0 # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_psllq:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_psllvd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpsllvd %xmm1, %xmm0, %xmm0 # sched: [3:2.00]
-; HASWELL-NEXT: vpsllvd (%rdi), %xmm0, %xmm0 # sched: [3:2.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpsllvd (%rdi), %xmm0, %xmm0 # sched: [9:2.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_psllvd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_psllvd_ymm:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpsllvd %ymm1, %ymm0, %ymm0 # sched: [3:2.00]
-; HASWELL-NEXT: vpsllvd (%rdi), %ymm0, %ymm0 # sched: [3:2.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpsllvd (%rdi), %ymm0, %ymm0 # sched: [10:2.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_psllvd_ymm:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_psllvq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpsllvq %xmm1, %xmm0, %xmm0 # sched: [1:1.00]
-; HASWELL-NEXT: vpsllvq (%rdi), %xmm0, %xmm0 # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpsllvq (%rdi), %xmm0, %xmm0 # sched: [7:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_psllvq:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_psllvq_ymm:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpsllvq %ymm1, %ymm0, %ymm0 # sched: [1:1.00]
-; HASWELL-NEXT: vpsllvq (%rdi), %ymm0, %ymm0 # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpsllvq (%rdi), %ymm0, %ymm0 # sched: [8:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_psllvq_ymm:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_psllw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpsllw %xmm1, %ymm0, %ymm0 # sched: [4:1.00]
-; HASWELL-NEXT: vpsllw (%rdi), %ymm0, %ymm0 # sched: [1:1.00]
+; HASWELL-NEXT: vpsllw (%rdi), %ymm0, %ymm0 # sched: [8:1.00]
; HASWELL-NEXT: vpsllw $2, %ymm0, %ymm0 # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_psllw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_psrad:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpsrad %xmm1, %ymm0, %ymm0 # sched: [4:1.00]
-; HASWELL-NEXT: vpsrad (%rdi), %ymm0, %ymm0 # sched: [1:1.00]
+; HASWELL-NEXT: vpsrad (%rdi), %ymm0, %ymm0 # sched: [8:1.00]
; HASWELL-NEXT: vpsrad $2, %ymm0, %ymm0 # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_psrad:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_psravd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpsravd %xmm1, %xmm0, %xmm0 # sched: [3:2.00]
-; HASWELL-NEXT: vpsravd (%rdi), %xmm0, %xmm0 # sched: [3:2.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpsravd (%rdi), %xmm0, %xmm0 # sched: [9:2.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_psravd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_psravd_ymm:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpsravd %ymm1, %ymm0, %ymm0 # sched: [3:2.00]
-; HASWELL-NEXT: vpsravd (%rdi), %ymm0, %ymm0 # sched: [3:2.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpsravd (%rdi), %ymm0, %ymm0 # sched: [10:2.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_psravd_ymm:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_psraw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpsraw %xmm1, %ymm0, %ymm0 # sched: [4:1.00]
-; HASWELL-NEXT: vpsraw (%rdi), %ymm0, %ymm0 # sched: [1:1.00]
+; HASWELL-NEXT: vpsraw (%rdi), %ymm0, %ymm0 # sched: [8:1.00]
; HASWELL-NEXT: vpsraw $2, %ymm0, %ymm0 # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_psraw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_psrld:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpsrld %xmm1, %ymm0, %ymm0 # sched: [4:1.00]
-; HASWELL-NEXT: vpsrld (%rdi), %ymm0, %ymm0 # sched: [1:1.00]
+; HASWELL-NEXT: vpsrld (%rdi), %ymm0, %ymm0 # sched: [8:1.00]
; HASWELL-NEXT: vpsrld $2, %ymm0, %ymm0 # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_psrld:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_psrldq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpsrldq {{.*#+}} ymm0 = ymm0[3,4,5,6,7,8,9,10,11,12,13,14,15],zero,zero,zero,ymm0[19,20,21,22,23,24,25,26,27,28,29,30,31],zero,zero,zero sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_psrldq:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_psrlq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpsrlq %xmm1, %ymm0, %ymm0 # sched: [4:1.00]
-; HASWELL-NEXT: vpsrlq (%rdi), %ymm0, %ymm0 # sched: [1:1.00]
+; HASWELL-NEXT: vpsrlq (%rdi), %ymm0, %ymm0 # sched: [8:1.00]
; HASWELL-NEXT: vpsrlq $2, %ymm0, %ymm0 # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_psrlq:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_psrlvd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpsrlvd %xmm1, %xmm0, %xmm0 # sched: [3:2.00]
-; HASWELL-NEXT: vpsrlvd (%rdi), %xmm0, %xmm0 # sched: [3:2.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpsrlvd (%rdi), %xmm0, %xmm0 # sched: [9:2.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_psrlvd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_psrlvd_ymm:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpsrlvd %ymm1, %ymm0, %ymm0 # sched: [3:2.00]
-; HASWELL-NEXT: vpsrlvd (%rdi), %ymm0, %ymm0 # sched: [3:2.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpsrlvd (%rdi), %ymm0, %ymm0 # sched: [10:2.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_psrlvd_ymm:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_psrlvq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpsrlvq %xmm1, %xmm0, %xmm0 # sched: [1:1.00]
-; HASWELL-NEXT: vpsrlvq (%rdi), %xmm0, %xmm0 # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpsrlvq (%rdi), %xmm0, %xmm0 # sched: [7:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_psrlvq:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_psrlvq_ymm:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpsrlvq %ymm1, %ymm0, %ymm0 # sched: [1:1.00]
-; HASWELL-NEXT: vpsrlvq (%rdi), %ymm0, %ymm0 # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpsrlvq (%rdi), %ymm0, %ymm0 # sched: [8:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_psrlvq_ymm:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_psrlw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpsrlw %xmm1, %ymm0, %ymm0 # sched: [4:1.00]
-; HASWELL-NEXT: vpsrlw (%rdi), %ymm0, %ymm0 # sched: [1:1.00]
+; HASWELL-NEXT: vpsrlw (%rdi), %ymm0, %ymm0 # sched: [8:1.00]
; HASWELL-NEXT: vpsrlw $2, %ymm0, %ymm0 # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_psrlw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_psubb:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpsubb %ymm1, %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpsubb (%rdi), %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpsubb (%rdi), %ymm0, %ymm0 # sched: [8:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_psubb:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_psubd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpsubd %ymm1, %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpsubd (%rdi), %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpsubd (%rdi), %ymm0, %ymm0 # sched: [8:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_psubd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_psubq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpsubq %ymm1, %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpsubq (%rdi), %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpsubq (%rdi), %ymm0, %ymm0 # sched: [8:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_psubq:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_psubsb:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpsubsb %ymm1, %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpsubsb (%rdi), %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpsubsb (%rdi), %ymm0, %ymm0 # sched: [8:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_psubsb:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_psubsw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpsubsw %ymm1, %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpsubsw (%rdi), %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpsubsw (%rdi), %ymm0, %ymm0 # sched: [8:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_psubsw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_psubusb:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpsubusb %ymm1, %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpsubusb (%rdi), %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpsubusb (%rdi), %ymm0, %ymm0 # sched: [8:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_psubusb:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_psubusw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpsubusw %ymm1, %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpsubusw (%rdi), %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpsubusw (%rdi), %ymm0, %ymm0 # sched: [8:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_psubusw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_psubw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpsubw %ymm1, %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpsubw (%rdi), %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpsubw (%rdi), %ymm0, %ymm0 # sched: [8:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_psubw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_punpckhbw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpunpckhbw {{.*#+}} ymm0 = ymm0[8],ymm1[8],ymm0[9],ymm1[9],ymm0[10],ymm1[10],ymm0[11],ymm1[11],ymm0[12],ymm1[12],ymm0[13],ymm1[13],ymm0[14],ymm1[14],ymm0[15],ymm1[15],ymm0[24],ymm1[24],ymm0[25],ymm1[25],ymm0[26],ymm1[26],ymm0[27],ymm1[27],ymm0[28],ymm1[28],ymm0[29],ymm1[29],ymm0[30],ymm1[30],ymm0[31],ymm1[31] sched: [1:1.00]
-; HASWELL-NEXT: vpunpckhbw {{.*#+}} ymm0 = ymm0[8],mem[8],ymm0[9],mem[9],ymm0[10],mem[10],ymm0[11],mem[11],ymm0[12],mem[12],ymm0[13],mem[13],ymm0[14],mem[14],ymm0[15],mem[15],ymm0[24],mem[24],ymm0[25],mem[25],ymm0[26],mem[26],ymm0[27],mem[27],ymm0[28],mem[28],ymm0[29],mem[29],ymm0[30],mem[30],ymm0[31],mem[31] sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpunpckhbw {{.*#+}} ymm0 = ymm0[8],mem[8],ymm0[9],mem[9],ymm0[10],mem[10],ymm0[11],mem[11],ymm0[12],mem[12],ymm0[13],mem[13],ymm0[14],mem[14],ymm0[15],mem[15],ymm0[24],mem[24],ymm0[25],mem[25],ymm0[26],mem[26],ymm0[27],mem[27],ymm0[28],mem[28],ymm0[29],mem[29],ymm0[30],mem[30],ymm0[31],mem[31] sched: [8:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_punpckhbw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_punpckhdq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpunpckhdq {{.*#+}} ymm0 = ymm0[2],ymm1[2],ymm0[3],ymm1[3],ymm0[6],ymm1[6],ymm0[7],ymm1[7] sched: [1:1.00]
-; HASWELL-NEXT: vpunpckhdq {{.*#+}} ymm0 = ymm0[2],mem[2],ymm0[3],mem[3],ymm0[6],mem[6],ymm0[7],mem[7] sched: [1:1.00]
+; HASWELL-NEXT: vpunpckhdq {{.*#+}} ymm0 = ymm0[2],mem[2],ymm0[3],mem[3],ymm0[6],mem[6],ymm0[7],mem[7] sched: [8:1.00]
; HASWELL-NEXT: vpcmpeqd %ymm1, %ymm1, %ymm1 # sched: [1:0.50]
; HASWELL-NEXT: vpsubd %ymm1, %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_punpckhdq:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_punpckhqdq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpunpckhqdq {{.*#+}} ymm1 = ymm0[1],ymm1[1],ymm0[3],ymm1[3] sched: [1:1.00]
-; HASWELL-NEXT: vpunpckhqdq {{.*#+}} ymm0 = ymm0[1],mem[1],ymm0[3],mem[3] sched: [1:1.00]
+; HASWELL-NEXT: vpunpckhqdq {{.*#+}} ymm0 = ymm0[1],mem[1],ymm0[3],mem[3] sched: [8:1.00]
; HASWELL-NEXT: vpaddq %ymm0, %ymm1, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_punpckhqdq:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_punpckhwd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpunpckhwd {{.*#+}} ymm0 = ymm0[4],ymm1[4],ymm0[5],ymm1[5],ymm0[6],ymm1[6],ymm0[7],ymm1[7],ymm0[12],ymm1[12],ymm0[13],ymm1[13],ymm0[14],ymm1[14],ymm0[15],ymm1[15] sched: [1:1.00]
-; HASWELL-NEXT: vpunpckhwd {{.*#+}} ymm0 = ymm0[4],mem[4],ymm0[5],mem[5],ymm0[6],mem[6],ymm0[7],mem[7],ymm0[12],mem[12],ymm0[13],mem[13],ymm0[14],mem[14],ymm0[15],mem[15] sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpunpckhwd {{.*#+}} ymm0 = ymm0[4],mem[4],ymm0[5],mem[5],ymm0[6],mem[6],ymm0[7],mem[7],ymm0[12],mem[12],ymm0[13],mem[13],ymm0[14],mem[14],ymm0[15],mem[15] sched: [8:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_punpckhwd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_punpcklbw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpunpcklbw {{.*#+}} ymm0 = ymm0[0],ymm1[0],ymm0[1],ymm1[1],ymm0[2],ymm1[2],ymm0[3],ymm1[3],ymm0[4],ymm1[4],ymm0[5],ymm1[5],ymm0[6],ymm1[6],ymm0[7],ymm1[7],ymm0[16],ymm1[16],ymm0[17],ymm1[17],ymm0[18],ymm1[18],ymm0[19],ymm1[19],ymm0[20],ymm1[20],ymm0[21],ymm1[21],ymm0[22],ymm1[22],ymm0[23],ymm1[23] sched: [1:1.00]
-; HASWELL-NEXT: vpunpcklbw {{.*#+}} ymm0 = ymm0[0],mem[0],ymm0[1],mem[1],ymm0[2],mem[2],ymm0[3],mem[3],ymm0[4],mem[4],ymm0[5],mem[5],ymm0[6],mem[6],ymm0[7],mem[7],ymm0[16],mem[16],ymm0[17],mem[17],ymm0[18],mem[18],ymm0[19],mem[19],ymm0[20],mem[20],ymm0[21],mem[21],ymm0[22],mem[22],ymm0[23],mem[23] sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpunpcklbw {{.*#+}} ymm0 = ymm0[0],mem[0],ymm0[1],mem[1],ymm0[2],mem[2],ymm0[3],mem[3],ymm0[4],mem[4],ymm0[5],mem[5],ymm0[6],mem[6],ymm0[7],mem[7],ymm0[16],mem[16],ymm0[17],mem[17],ymm0[18],mem[18],ymm0[19],mem[19],ymm0[20],mem[20],ymm0[21],mem[21],ymm0[22],mem[22],ymm0[23],mem[23] sched: [8:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_punpcklbw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_punpckldq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpunpckldq {{.*#+}} ymm0 = ymm0[0],ymm1[0],ymm0[1],ymm1[1],ymm0[4],ymm1[4],ymm0[5],ymm1[5] sched: [1:1.00]
-; HASWELL-NEXT: vpunpckldq {{.*#+}} ymm0 = ymm0[0],mem[0],ymm0[1],mem[1],ymm0[4],mem[4],ymm0[5],mem[5] sched: [1:1.00]
+; HASWELL-NEXT: vpunpckldq {{.*#+}} ymm0 = ymm0[0],mem[0],ymm0[1],mem[1],ymm0[4],mem[4],ymm0[5],mem[5] sched: [8:1.00]
; HASWELL-NEXT: vpcmpeqd %ymm1, %ymm1, %ymm1 # sched: [1:0.50]
; HASWELL-NEXT: vpsubd %ymm1, %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_punpckldq:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_punpcklqdq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpunpcklqdq {{.*#+}} ymm1 = ymm0[0],ymm1[0],ymm0[2],ymm1[2] sched: [1:1.00]
-; HASWELL-NEXT: vpunpcklqdq {{.*#+}} ymm0 = ymm0[0],mem[0],ymm0[2],mem[2] sched: [1:1.00]
+; HASWELL-NEXT: vpunpcklqdq {{.*#+}} ymm0 = ymm0[0],mem[0],ymm0[2],mem[2] sched: [8:1.00]
; HASWELL-NEXT: vpaddq %ymm0, %ymm1, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_punpcklqdq:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_punpcklwd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpunpcklwd {{.*#+}} ymm0 = ymm0[0],ymm1[0],ymm0[1],ymm1[1],ymm0[2],ymm1[2],ymm0[3],ymm1[3],ymm0[8],ymm1[8],ymm0[9],ymm1[9],ymm0[10],ymm1[10],ymm0[11],ymm1[11] sched: [1:1.00]
-; HASWELL-NEXT: vpunpcklwd {{.*#+}} ymm0 = ymm0[0],mem[0],ymm0[1],mem[1],ymm0[2],mem[2],ymm0[3],mem[3],ymm0[8],mem[8],ymm0[9],mem[9],ymm0[10],mem[10],ymm0[11],mem[11] sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpunpcklwd {{.*#+}} ymm0 = ymm0[0],mem[0],ymm0[1],mem[1],ymm0[2],mem[2],ymm0[3],mem[3],ymm0[8],mem[8],ymm0[9],mem[9],ymm0[10],mem[10],ymm0[11],mem[11] sched: [8:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_punpcklwd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pxor:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpxor %ymm1, %ymm0, %ymm0 # sched: [1:0.33]
-; HASWELL-NEXT: vpxor (%rdi), %ymm0, %ymm0 # sched: [1:0.50]
+; HASWELL-NEXT: vpxor (%rdi), %ymm0, %ymm0 # sched: [8:0.50]
; HASWELL-NEXT: vpaddq %ymm1, %ymm0, %ymm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pxor:
; BROADWELL: # %bb.0:
; CHECK-NEXT: movw $-21846, %ax ## imm = 0xAAAA
; CHECK-NEXT: kmovw %eax, %k1
; CHECK-NEXT: vmovdqa32 {{.*}}(%rip), %zmm1 {%k1}
-; CHECK-NEXT: vpaddd %zmm1, %zmm0, %zmm0
; CHECK-NEXT: vpaddd %zmm0, %zmm2, %zmm0
+; CHECK-NEXT: vpaddd %zmm1, %zmm0, %zmm0
; CHECK-NEXT: vcvtdq2ps %zmm0, %zmm0
; CHECK-NEXT: vmovups %zmm0, (%rdi)
; CHECK-NEXT: retq
; HASWELL: # %bb.0:
; HASWELL-NEXT: andnl %esi, %edi, %eax # sched: [1:0.50]
; HASWELL-NEXT: notl %edi # sched: [1:0.25]
-; HASWELL-NEXT: andw (%rdx), %di # sched: [1:0.50]
+; HASWELL-NEXT: andw (%rdx), %di # sched: [6:0.50]
; HASWELL-NEXT: addl %edi, %eax # sched: [1:0.25]
; HASWELL-NEXT: # kill: def %ax killed %ax killed %eax
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_andn_i16:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_andn_i32:
; HASWELL: # %bb.0:
; HASWELL-NEXT: andnl %esi, %edi, %ecx # sched: [1:0.50]
-; HASWELL-NEXT: andnl (%rdx), %edi, %eax # sched: [1:0.50]
+; HASWELL-NEXT: andnl (%rdx), %edi, %eax # sched: [6:0.50]
; HASWELL-NEXT: addl %ecx, %eax # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_andn_i32:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_andn_i64:
; HASWELL: # %bb.0:
; HASWELL-NEXT: andnq %rsi, %rdi, %rcx # sched: [1:0.50]
-; HASWELL-NEXT: andnq (%rdx), %rdi, %rax # sched: [1:0.50]
+; HASWELL-NEXT: andnq (%rdx), %rdi, %rax # sched: [6:0.50]
; HASWELL-NEXT: addq %rcx, %rax # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_andn_i64:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_bextr_i32:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: bextrl %edi, (%rdx), %ecx # sched: [2:0.50]
+; HASWELL-NEXT: bextrl %edi, (%rdx), %ecx # sched: [7:0.50]
; HASWELL-NEXT: bextrl %edi, %esi, %eax # sched: [2:0.50]
; HASWELL-NEXT: addl %ecx, %eax # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_bextr_i32:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_bextr_i64:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: bextrq %rdi, (%rdx), %rcx # sched: [2:0.50]
+; HASWELL-NEXT: bextrq %rdi, (%rdx), %rcx # sched: [7:0.50]
; HASWELL-NEXT: bextrq %rdi, %rsi, %rax # sched: [2:0.50]
; HASWELL-NEXT: addq %rcx, %rax # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_bextr_i64:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_blsi_i32:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: blsil (%rsi), %ecx # sched: [1:0.50]
+; HASWELL-NEXT: blsil (%rsi), %ecx # sched: [6:0.50]
; HASWELL-NEXT: blsil %edi, %eax # sched: [1:0.50]
; HASWELL-NEXT: addl %ecx, %eax # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_blsi_i32:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_blsi_i64:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: blsiq (%rsi), %rcx # sched: [1:0.50]
+; HASWELL-NEXT: blsiq (%rsi), %rcx # sched: [6:0.50]
; HASWELL-NEXT: blsiq %rdi, %rax # sched: [1:0.50]
; HASWELL-NEXT: addq %rcx, %rax # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_blsi_i64:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_blsmsk_i32:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: blsmskl (%rsi), %ecx # sched: [1:0.50]
+; HASWELL-NEXT: blsmskl (%rsi), %ecx # sched: [6:0.50]
; HASWELL-NEXT: blsmskl %edi, %eax # sched: [1:0.50]
; HASWELL-NEXT: addl %ecx, %eax # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_blsmsk_i32:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_blsmsk_i64:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: blsmskq (%rsi), %rcx # sched: [1:0.50]
+; HASWELL-NEXT: blsmskq (%rsi), %rcx # sched: [6:0.50]
; HASWELL-NEXT: blsmskq %rdi, %rax # sched: [1:0.50]
; HASWELL-NEXT: addq %rcx, %rax # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_blsmsk_i64:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_blsr_i32:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: blsrl (%rsi), %ecx # sched: [1:0.50]
+; HASWELL-NEXT: blsrl (%rsi), %ecx # sched: [6:0.50]
; HASWELL-NEXT: blsrl %edi, %eax # sched: [1:0.50]
; HASWELL-NEXT: addl %ecx, %eax # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_blsr_i32:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_blsr_i64:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: blsrq (%rsi), %rcx # sched: [1:0.50]
+; HASWELL-NEXT: blsrq (%rsi), %rcx # sched: [6:0.50]
; HASWELL-NEXT: blsrq %rdi, %rax # sched: [1:0.50]
; HASWELL-NEXT: addq %rcx, %rax # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_blsr_i64:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_cttz_i16:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: tzcntw (%rsi), %cx # sched: [3:1.00]
+; HASWELL-NEXT: tzcntw (%rsi), %cx # sched: [8:1.00]
; HASWELL-NEXT: tzcntw %di, %ax # sched: [3:1.00]
; HASWELL-NEXT: orl %ecx, %eax # sched: [1:0.25]
; HASWELL-NEXT: # kill: def %ax killed %ax killed %eax
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_cttz_i16:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_cttz_i32:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: tzcntl (%rsi), %ecx # sched: [3:1.00]
+; HASWELL-NEXT: tzcntl (%rsi), %ecx # sched: [8:1.00]
; HASWELL-NEXT: tzcntl %edi, %eax # sched: [3:1.00]
; HASWELL-NEXT: orl %ecx, %eax # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_cttz_i32:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_cttz_i64:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: tzcntq (%rsi), %rcx # sched: [3:1.00]
+; HASWELL-NEXT: tzcntq (%rsi), %rcx # sched: [8:1.00]
; HASWELL-NEXT: tzcntq %rdi, %rax # sched: [3:1.00]
; HASWELL-NEXT: orq %rcx, %rax # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_cttz_i64:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_bzhi_i32:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: bzhil %edi, (%rdx), %ecx # sched: [1:0.50]
+; HASWELL-NEXT: bzhil %edi, (%rdx), %ecx # sched: [6:0.50]
; HASWELL-NEXT: bzhil %edi, %esi, %eax # sched: [1:0.50]
; HASWELL-NEXT: addl %ecx, %eax # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_bzhi_i32:
; BROADWELL: # %bb.0:
;
; KNL-LABEL: test_bzhi_i32:
; KNL: # %bb.0:
-; KNL-NEXT: bzhil %edi, (%rdx), %ecx # sched: [1:0.50]
+; KNL-NEXT: bzhil %edi, (%rdx), %ecx # sched: [6:0.50]
; KNL-NEXT: bzhil %edi, %esi, %eax # sched: [1:0.50]
; KNL-NEXT: addl %ecx, %eax # sched: [1:0.25]
-; KNL-NEXT: retq # sched: [2:1.00]
+; KNL-NEXT: retq # sched: [7:1.00]
;
; ZNVER1-LABEL: test_bzhi_i32:
; ZNVER1: # %bb.0:
;
; HASWELL-LABEL: test_bzhi_i64:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: bzhiq %rdi, (%rdx), %rcx # sched: [1:0.50]
+; HASWELL-NEXT: bzhiq %rdi, (%rdx), %rcx # sched: [6:0.50]
; HASWELL-NEXT: bzhiq %rdi, %rsi, %rax # sched: [1:0.50]
; HASWELL-NEXT: addq %rcx, %rax # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_bzhi_i64:
; BROADWELL: # %bb.0:
;
; KNL-LABEL: test_bzhi_i64:
; KNL: # %bb.0:
-; KNL-NEXT: bzhiq %rdi, (%rdx), %rcx # sched: [1:0.50]
+; KNL-NEXT: bzhiq %rdi, (%rdx), %rcx # sched: [6:0.50]
; KNL-NEXT: bzhiq %rdi, %rsi, %rax # sched: [1:0.50]
; KNL-NEXT: addq %rcx, %rax # sched: [1:0.25]
-; KNL-NEXT: retq # sched: [2:1.00]
+; KNL-NEXT: retq # sched: [7:1.00]
;
; ZNVER1-LABEL: test_bzhi_i64:
; ZNVER1: # %bb.0:
; HASWELL-NEXT: movq %rdx, %rax # sched: [1:0.25]
; HASWELL-NEXT: movq %rdi, %rdx # sched: [1:0.25]
; HASWELL-NEXT: mulxq %rsi, %rsi, %rcx # sched: [4:1.00]
-; HASWELL-NEXT: mulxq (%rax), %rdx, %rax # sched: [4:1.00]
+; HASWELL-NEXT: mulxq (%rax), %rdx, %rax # sched: [9:1.00]
; HASWELL-NEXT: orq %rcx, %rax # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_mulx_i64:
; BROADWELL: # %bb.0:
; KNL-NEXT: movq %rdx, %rax # sched: [1:0.25]
; KNL-NEXT: movq %rdi, %rdx # sched: [1:0.25]
; KNL-NEXT: mulxq %rsi, %rsi, %rcx # sched: [4:1.00]
-; KNL-NEXT: mulxq (%rax), %rdx, %rax # sched: [4:1.00]
+; KNL-NEXT: mulxq (%rax), %rdx, %rax # sched: [9:1.00]
; KNL-NEXT: orq %rcx, %rax # sched: [1:0.25]
-; KNL-NEXT: retq # sched: [2:1.00]
+; KNL-NEXT: retq # sched: [7:1.00]
;
; ZNVER1-LABEL: test_mulx_i64:
; ZNVER1: # %bb.0:
;
; HASWELL-LABEL: test_pdep_i32:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: pdepl (%rdx), %edi, %ecx # sched: [3:1.00]
+; HASWELL-NEXT: pdepl (%rdx), %edi, %ecx # sched: [8:1.00]
; HASWELL-NEXT: pdepl %esi, %edi, %eax # sched: [3:1.00]
; HASWELL-NEXT: addl %ecx, %eax # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pdep_i32:
; BROADWELL: # %bb.0:
;
; KNL-LABEL: test_pdep_i32:
; KNL: # %bb.0:
-; KNL-NEXT: pdepl (%rdx), %edi, %ecx # sched: [3:1.00]
+; KNL-NEXT: pdepl (%rdx), %edi, %ecx # sched: [8:1.00]
; KNL-NEXT: pdepl %esi, %edi, %eax # sched: [3:1.00]
; KNL-NEXT: addl %ecx, %eax # sched: [1:0.25]
-; KNL-NEXT: retq # sched: [2:1.00]
+; KNL-NEXT: retq # sched: [7:1.00]
;
; ZNVER1-LABEL: test_pdep_i32:
; ZNVER1: # %bb.0:
;
; HASWELL-LABEL: test_pdep_i64:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: pdepq (%rdx), %rdi, %rcx # sched: [3:1.00]
+; HASWELL-NEXT: pdepq (%rdx), %rdi, %rcx # sched: [8:1.00]
; HASWELL-NEXT: pdepq %rsi, %rdi, %rax # sched: [3:1.00]
; HASWELL-NEXT: addq %rcx, %rax # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pdep_i64:
; BROADWELL: # %bb.0:
;
; KNL-LABEL: test_pdep_i64:
; KNL: # %bb.0:
-; KNL-NEXT: pdepq (%rdx), %rdi, %rcx # sched: [3:1.00]
+; KNL-NEXT: pdepq (%rdx), %rdi, %rcx # sched: [8:1.00]
; KNL-NEXT: pdepq %rsi, %rdi, %rax # sched: [3:1.00]
; KNL-NEXT: addq %rcx, %rax # sched: [1:0.25]
-; KNL-NEXT: retq # sched: [2:1.00]
+; KNL-NEXT: retq # sched: [7:1.00]
;
; ZNVER1-LABEL: test_pdep_i64:
; ZNVER1: # %bb.0:
;
; HASWELL-LABEL: test_pext_i32:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: pextl (%rdx), %edi, %ecx # sched: [3:1.00]
+; HASWELL-NEXT: pextl (%rdx), %edi, %ecx # sched: [8:1.00]
; HASWELL-NEXT: pextl %esi, %edi, %eax # sched: [3:1.00]
; HASWELL-NEXT: addl %ecx, %eax # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pext_i32:
; BROADWELL: # %bb.0:
;
; KNL-LABEL: test_pext_i32:
; KNL: # %bb.0:
-; KNL-NEXT: pextl (%rdx), %edi, %ecx # sched: [3:1.00]
+; KNL-NEXT: pextl (%rdx), %edi, %ecx # sched: [8:1.00]
; KNL-NEXT: pextl %esi, %edi, %eax # sched: [3:1.00]
; KNL-NEXT: addl %ecx, %eax # sched: [1:0.25]
-; KNL-NEXT: retq # sched: [2:1.00]
+; KNL-NEXT: retq # sched: [7:1.00]
;
; ZNVER1-LABEL: test_pext_i32:
; ZNVER1: # %bb.0:
;
; HASWELL-LABEL: test_pext_i64:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: pextq (%rdx), %rdi, %rcx # sched: [3:1.00]
+; HASWELL-NEXT: pextq (%rdx), %rdi, %rcx # sched: [8:1.00]
; HASWELL-NEXT: pextq %rsi, %rdi, %rax # sched: [3:1.00]
; HASWELL-NEXT: addq %rcx, %rax # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pext_i64:
; BROADWELL: # %bb.0:
;
; KNL-LABEL: test_pext_i64:
; KNL: # %bb.0:
-; KNL-NEXT: pextq (%rdx), %rdi, %rcx # sched: [3:1.00]
+; KNL-NEXT: pextq (%rdx), %rdi, %rcx # sched: [8:1.00]
; KNL-NEXT: pextq %rsi, %rdi, %rax # sched: [3:1.00]
; KNL-NEXT: addq %rcx, %rax # sched: [1:0.25]
-; KNL-NEXT: retq # sched: [2:1.00]
+; KNL-NEXT: retq # sched: [7:1.00]
;
; ZNVER1-LABEL: test_pext_i64:
; ZNVER1: # %bb.0:
; HASWELL-LABEL: test_rorx_i32:
; HASWELL: # %bb.0:
; HASWELL-NEXT: rorxl $5, %edi, %ecx # sched: [1:0.50]
-; HASWELL-NEXT: rorxl $5, (%rdx), %eax # sched: [1:0.50]
+; HASWELL-NEXT: rorxl $5, (%rdx), %eax # sched: [6:0.50]
; HASWELL-NEXT: addl %ecx, %eax # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_rorx_i32:
; BROADWELL: # %bb.0:
; KNL-LABEL: test_rorx_i32:
; KNL: # %bb.0:
; KNL-NEXT: rorxl $5, %edi, %ecx # sched: [1:0.50]
-; KNL-NEXT: rorxl $5, (%rdx), %eax # sched: [1:0.50]
+; KNL-NEXT: rorxl $5, (%rdx), %eax # sched: [6:0.50]
; KNL-NEXT: addl %ecx, %eax # sched: [1:0.25]
-; KNL-NEXT: retq # sched: [2:1.00]
+; KNL-NEXT: retq # sched: [7:1.00]
;
; ZNVER1-LABEL: test_rorx_i32:
; ZNVER1: # %bb.0:
; HASWELL-LABEL: test_rorx_i64:
; HASWELL: # %bb.0:
; HASWELL-NEXT: rorxq $5, %rdi, %rcx # sched: [1:0.50]
-; HASWELL-NEXT: rorxq $5, (%rdx), %rax # sched: [1:0.50]
+; HASWELL-NEXT: rorxq $5, (%rdx), %rax # sched: [6:0.50]
; HASWELL-NEXT: addq %rcx, %rax # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_rorx_i64:
; BROADWELL: # %bb.0:
; KNL-LABEL: test_rorx_i64:
; KNL: # %bb.0:
; KNL-NEXT: rorxq $5, %rdi, %rcx # sched: [1:0.50]
-; KNL-NEXT: rorxq $5, (%rdx), %rax # sched: [1:0.50]
+; KNL-NEXT: rorxq $5, (%rdx), %rax # sched: [6:0.50]
; KNL-NEXT: addq %rcx, %rax # sched: [1:0.25]
-; KNL-NEXT: retq # sched: [2:1.00]
+; KNL-NEXT: retq # sched: [7:1.00]
;
; ZNVER1-LABEL: test_rorx_i64:
; ZNVER1: # %bb.0:
; HASWELL-LABEL: test_sarx_i32:
; HASWELL: # %bb.0:
; HASWELL-NEXT: sarxl %esi, %edi, %ecx # sched: [1:0.50]
-; HASWELL-NEXT: sarxl %esi, (%rdx), %eax # sched: [1:0.50]
+; HASWELL-NEXT: sarxl %esi, (%rdx), %eax # sched: [6:0.50]
; HASWELL-NEXT: addl %ecx, %eax # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_sarx_i32:
; BROADWELL: # %bb.0:
; KNL-LABEL: test_sarx_i32:
; KNL: # %bb.0:
; KNL-NEXT: sarxl %esi, %edi, %ecx # sched: [1:0.50]
-; KNL-NEXT: sarxl %esi, (%rdx), %eax # sched: [1:0.50]
+; KNL-NEXT: sarxl %esi, (%rdx), %eax # sched: [6:0.50]
; KNL-NEXT: addl %ecx, %eax # sched: [1:0.25]
-; KNL-NEXT: retq # sched: [2:1.00]
+; KNL-NEXT: retq # sched: [7:1.00]
;
; ZNVER1-LABEL: test_sarx_i32:
; ZNVER1: # %bb.0:
; HASWELL-LABEL: test_sarx_i64:
; HASWELL: # %bb.0:
; HASWELL-NEXT: sarxq %rsi, %rdi, %rcx # sched: [1:0.50]
-; HASWELL-NEXT: sarxq %rsi, (%rdx), %rax # sched: [1:0.50]
+; HASWELL-NEXT: sarxq %rsi, (%rdx), %rax # sched: [6:0.50]
; HASWELL-NEXT: addq %rcx, %rax # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_sarx_i64:
; BROADWELL: # %bb.0:
; KNL-LABEL: test_sarx_i64:
; KNL: # %bb.0:
; KNL-NEXT: sarxq %rsi, %rdi, %rcx # sched: [1:0.50]
-; KNL-NEXT: sarxq %rsi, (%rdx), %rax # sched: [1:0.50]
+; KNL-NEXT: sarxq %rsi, (%rdx), %rax # sched: [6:0.50]
; KNL-NEXT: addq %rcx, %rax # sched: [1:0.25]
-; KNL-NEXT: retq # sched: [2:1.00]
+; KNL-NEXT: retq # sched: [7:1.00]
;
; ZNVER1-LABEL: test_sarx_i64:
; ZNVER1: # %bb.0:
; HASWELL-LABEL: test_shlx_i32:
; HASWELL: # %bb.0:
; HASWELL-NEXT: shlxl %esi, %edi, %ecx # sched: [1:0.50]
-; HASWELL-NEXT: shlxl %esi, (%rdx), %eax # sched: [1:0.50]
+; HASWELL-NEXT: shlxl %esi, (%rdx), %eax # sched: [6:0.50]
; HASWELL-NEXT: addl %ecx, %eax # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_shlx_i32:
; BROADWELL: # %bb.0:
; KNL-LABEL: test_shlx_i32:
; KNL: # %bb.0:
; KNL-NEXT: shlxl %esi, %edi, %ecx # sched: [1:0.50]
-; KNL-NEXT: shlxl %esi, (%rdx), %eax # sched: [1:0.50]
+; KNL-NEXT: shlxl %esi, (%rdx), %eax # sched: [6:0.50]
; KNL-NEXT: addl %ecx, %eax # sched: [1:0.25]
-; KNL-NEXT: retq # sched: [2:1.00]
+; KNL-NEXT: retq # sched: [7:1.00]
;
; ZNVER1-LABEL: test_shlx_i32:
; ZNVER1: # %bb.0:
; HASWELL-LABEL: test_shlx_i64:
; HASWELL: # %bb.0:
; HASWELL-NEXT: shlxq %rsi, %rdi, %rcx # sched: [1:0.50]
-; HASWELL-NEXT: shlxq %rsi, (%rdx), %rax # sched: [1:0.50]
+; HASWELL-NEXT: shlxq %rsi, (%rdx), %rax # sched: [6:0.50]
; HASWELL-NEXT: addq %rcx, %rax # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_shlx_i64:
; BROADWELL: # %bb.0:
; KNL-LABEL: test_shlx_i64:
; KNL: # %bb.0:
; KNL-NEXT: shlxq %rsi, %rdi, %rcx # sched: [1:0.50]
-; KNL-NEXT: shlxq %rsi, (%rdx), %rax # sched: [1:0.50]
+; KNL-NEXT: shlxq %rsi, (%rdx), %rax # sched: [6:0.50]
; KNL-NEXT: addq %rcx, %rax # sched: [1:0.25]
-; KNL-NEXT: retq # sched: [2:1.00]
+; KNL-NEXT: retq # sched: [7:1.00]
;
; ZNVER1-LABEL: test_shlx_i64:
; ZNVER1: # %bb.0:
; HASWELL-LABEL: test_shrx_i32:
; HASWELL: # %bb.0:
; HASWELL-NEXT: shrxl %esi, %edi, %ecx # sched: [1:0.50]
-; HASWELL-NEXT: shrxl %esi, (%rdx), %eax # sched: [1:0.50]
+; HASWELL-NEXT: shrxl %esi, (%rdx), %eax # sched: [6:0.50]
; HASWELL-NEXT: addl %ecx, %eax # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_shrx_i32:
; BROADWELL: # %bb.0:
; KNL-LABEL: test_shrx_i32:
; KNL: # %bb.0:
; KNL-NEXT: shrxl %esi, %edi, %ecx # sched: [1:0.50]
-; KNL-NEXT: shrxl %esi, (%rdx), %eax # sched: [1:0.50]
+; KNL-NEXT: shrxl %esi, (%rdx), %eax # sched: [6:0.50]
; KNL-NEXT: addl %ecx, %eax # sched: [1:0.25]
-; KNL-NEXT: retq # sched: [2:1.00]
+; KNL-NEXT: retq # sched: [7:1.00]
;
; ZNVER1-LABEL: test_shrx_i32:
; ZNVER1: # %bb.0:
; HASWELL-LABEL: test_shrx_i64:
; HASWELL: # %bb.0:
; HASWELL-NEXT: shrxq %rsi, %rdi, %rcx # sched: [1:0.50]
-; HASWELL-NEXT: shrxq %rsi, (%rdx), %rax # sched: [1:0.50]
+; HASWELL-NEXT: shrxq %rsi, (%rdx), %rax # sched: [6:0.50]
; HASWELL-NEXT: addq %rcx, %rax # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_shrx_i64:
; BROADWELL: # %bb.0:
; KNL-LABEL: test_shrx_i64:
; KNL: # %bb.0:
; KNL-NEXT: shrxq %rsi, %rdi, %rcx # sched: [1:0.50]
-; KNL-NEXT: shrxq %rsi, (%rdx), %rax # sched: [1:0.50]
+; KNL-NEXT: shrxq %rsi, (%rdx), %rax # sched: [6:0.50]
; KNL-NEXT: addq %rcx, %rax # sched: [1:0.25]
-; KNL-NEXT: retq # sched: [2:1.00]
+; KNL-NEXT: retq # sched: [7:1.00]
;
; ZNVER1-LABEL: test_shrx_i64:
; ZNVER1: # %bb.0:
;
; HASWELL-LABEL: test_vcvtph2ps_128:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: vcvtph2ps (%rdi), %xmm1 # sched: [1:1.00]
+; HASWELL-NEXT: vcvtph2ps (%rdi), %xmm1 # sched: [6:1.00]
; HASWELL-NEXT: vcvtph2ps %xmm0, %xmm0 # sched: [2:1.00]
; HASWELL-NEXT: vaddps %xmm0, %xmm1, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_vcvtph2ps_128:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_vcvtph2ps_256:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: vcvtph2ps (%rdi), %ymm1 # sched: [1:1.00]
+; HASWELL-NEXT: vcvtph2ps (%rdi), %ymm1 # sched: [7:1.00]
; HASWELL-NEXT: vcvtph2ps %xmm0, %ymm0 # sched: [2:1.00]
; HASWELL-NEXT: vaddps %ymm0, %ymm1, %ymm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_vcvtph2ps_256:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_vcvtps2ph_128:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vcvtps2ph $0, %xmm0, %xmm0 # sched: [4:1.00]
-; HASWELL-NEXT: vcvtps2ph $0, %xmm1, (%rdi) # sched: [4:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vcvtps2ph $0, %xmm1, (%rdi) # sched: [5:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_vcvtps2ph_128:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_vcvtps2ph_256:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vcvtps2ph $0, %ymm0, %xmm0 # sched: [6:1.00]
-; HASWELL-NEXT: vcvtps2ph $0, %ymm1, (%rdi) # sched: [6:1.00]
+; HASWELL-NEXT: vcvtps2ph $0, %ymm1, (%rdi) # sched: [7:1.00]
; HASWELL-NEXT: vzeroupper # sched: [4:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_vcvtps2ph_256:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_vfmadd213pd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vfmadd213pd %xmm2, %xmm1, %xmm0 # sched: [5:0.50]
-; HASWELL-NEXT: vfmadd213pd (%rdi), %xmm1, %xmm0 # sched: [5:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vfmadd213pd (%rdi), %xmm1, %xmm0 # sched: [11:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_vfmadd213pd:
; BROADWELL: # %bb.0:
; KNL-LABEL: test_vfmadd213pd:
; KNL: # %bb.0:
; KNL-NEXT: vfmadd213pd %xmm2, %xmm1, %xmm0 # sched: [5:0.50]
-; KNL-NEXT: vfmadd213pd (%rdi), %xmm1, %xmm0 # sched: [5:0.50]
-; KNL-NEXT: retq # sched: [2:1.00]
+; KNL-NEXT: vfmadd213pd (%rdi), %xmm1, %xmm0 # sched: [11:0.50]
+; KNL-NEXT: retq # sched: [7:1.00]
;
; SKX-LABEL: test_vfmadd213pd:
; SKX: # %bb.0:
; HASWELL-LABEL: test_vfmadd213pd_ymm:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vfmadd213pd %ymm2, %ymm1, %ymm0 # sched: [5:0.50]
-; HASWELL-NEXT: vfmadd213pd (%rdi), %ymm1, %ymm0 # sched: [5:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vfmadd213pd (%rdi), %ymm1, %ymm0 # sched: [12:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_vfmadd213pd_ymm:
; BROADWELL: # %bb.0:
; KNL-LABEL: test_vfmadd213pd_ymm:
; KNL: # %bb.0:
; KNL-NEXT: vfmadd213pd %ymm2, %ymm1, %ymm0 # sched: [5:0.50]
-; KNL-NEXT: vfmadd213pd (%rdi), %ymm1, %ymm0 # sched: [5:0.50]
-; KNL-NEXT: retq # sched: [2:1.00]
+; KNL-NEXT: vfmadd213pd (%rdi), %ymm1, %ymm0 # sched: [12:0.50]
+; KNL-NEXT: retq # sched: [7:1.00]
;
; SKX-LABEL: test_vfmadd213pd_ymm:
; SKX: # %bb.0:
; HASWELL-LABEL: test_vfmadd213ps:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vfmadd213ps %xmm2, %xmm1, %xmm0 # sched: [5:0.50]
-; HASWELL-NEXT: vfmadd213ps (%rdi), %xmm1, %xmm0 # sched: [5:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vfmadd213ps (%rdi), %xmm1, %xmm0 # sched: [11:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_vfmadd213ps:
; BROADWELL: # %bb.0:
; KNL-LABEL: test_vfmadd213ps:
; KNL: # %bb.0:
; KNL-NEXT: vfmadd213ps %xmm2, %xmm1, %xmm0 # sched: [5:0.50]
-; KNL-NEXT: vfmadd213ps (%rdi), %xmm1, %xmm0 # sched: [5:0.50]
-; KNL-NEXT: retq # sched: [2:1.00]
+; KNL-NEXT: vfmadd213ps (%rdi), %xmm1, %xmm0 # sched: [11:0.50]
+; KNL-NEXT: retq # sched: [7:1.00]
;
; SKX-LABEL: test_vfmadd213ps:
; SKX: # %bb.0:
; HASWELL-LABEL: test_vfmadd213ps_ymm:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vfmadd213ps %ymm2, %ymm1, %ymm0 # sched: [5:0.50]
-; HASWELL-NEXT: vfmadd213ps (%rdi), %ymm1, %ymm0 # sched: [5:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vfmadd213ps (%rdi), %ymm1, %ymm0 # sched: [12:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_vfmadd213ps_ymm:
; BROADWELL: # %bb.0:
; KNL-LABEL: test_vfmadd213ps_ymm:
; KNL: # %bb.0:
; KNL-NEXT: vfmadd213ps %ymm2, %ymm1, %ymm0 # sched: [5:0.50]
-; KNL-NEXT: vfmadd213ps (%rdi), %ymm1, %ymm0 # sched: [5:0.50]
-; KNL-NEXT: retq # sched: [2:1.00]
+; KNL-NEXT: vfmadd213ps (%rdi), %ymm1, %ymm0 # sched: [12:0.50]
+; KNL-NEXT: retq # sched: [7:1.00]
;
; SKX-LABEL: test_vfmadd213ps_ymm:
; SKX: # %bb.0:
; HASWELL-LABEL: test_vfmadd213sd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vfmadd213sd %xmm2, %xmm1, %xmm0 # sched: [5:0.50]
-; HASWELL-NEXT: vfmadd213sd (%rdi), %xmm1, %xmm0 # sched: [5:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vfmadd213sd (%rdi), %xmm1, %xmm0 # sched: [10:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_vfmadd213sd:
; BROADWELL: # %bb.0:
; KNL-LABEL: test_vfmadd213sd:
; KNL: # %bb.0:
; KNL-NEXT: vfmadd213sd %xmm2, %xmm1, %xmm0 # sched: [5:0.50]
-; KNL-NEXT: vfmadd213sd (%rdi), %xmm1, %xmm0 # sched: [5:0.50]
-; KNL-NEXT: retq # sched: [2:1.00]
+; KNL-NEXT: vfmadd213sd (%rdi), %xmm1, %xmm0 # sched: [10:0.50]
+; KNL-NEXT: retq # sched: [7:1.00]
;
; SKX-LABEL: test_vfmadd213sd:
; SKX: # %bb.0:
; HASWELL-LABEL: test_vfmadd213ss:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vfmadd213ss %xmm2, %xmm1, %xmm0 # sched: [5:0.50]
-; HASWELL-NEXT: vfmadd213ss (%rdi), %xmm1, %xmm0 # sched: [5:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vfmadd213ss (%rdi), %xmm1, %xmm0 # sched: [10:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_vfmadd213ss:
; BROADWELL: # %bb.0:
; KNL-LABEL: test_vfmadd213ss:
; KNL: # %bb.0:
; KNL-NEXT: vfmadd213ss %xmm2, %xmm1, %xmm0 # sched: [5:0.50]
-; KNL-NEXT: vfmadd213ss (%rdi), %xmm1, %xmm0 # sched: [5:0.50]
-; KNL-NEXT: retq # sched: [2:1.00]
+; KNL-NEXT: vfmadd213ss (%rdi), %xmm1, %xmm0 # sched: [10:0.50]
+; KNL-NEXT: retq # sched: [7:1.00]
;
; SKX-LABEL: test_vfmadd213ss:
; SKX: # %bb.0:
; HASWELL-LABEL: test_vfmaddsubpd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vfmaddsub213pd %xmm2, %xmm1, %xmm0 # sched: [5:0.50]
-; HASWELL-NEXT: vfmaddsub213pd (%rdi), %xmm1, %xmm0 # sched: [5:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vfmaddsub213pd (%rdi), %xmm1, %xmm0 # sched: [11:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_vfmaddsubpd:
; BROADWELL: # %bb.0:
; KNL-LABEL: test_vfmaddsubpd:
; KNL: # %bb.0:
; KNL-NEXT: vfmaddsub213pd %xmm2, %xmm1, %xmm0 # sched: [5:0.50]
-; KNL-NEXT: vfmaddsub213pd (%rdi), %xmm1, %xmm0 # sched: [5:0.50]
-; KNL-NEXT: retq # sched: [2:1.00]
+; KNL-NEXT: vfmaddsub213pd (%rdi), %xmm1, %xmm0 # sched: [11:0.50]
+; KNL-NEXT: retq # sched: [7:1.00]
;
; SKX-LABEL: test_vfmaddsubpd:
; SKX: # %bb.0:
; HASWELL-LABEL: test_vfmaddsubpd_ymm:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vfmaddsub213pd %ymm2, %ymm1, %ymm0 # sched: [5:0.50]
-; HASWELL-NEXT: vfmaddsub213pd (%rdi), %ymm1, %ymm0 # sched: [5:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vfmaddsub213pd (%rdi), %ymm1, %ymm0 # sched: [12:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_vfmaddsubpd_ymm:
; BROADWELL: # %bb.0:
; KNL-LABEL: test_vfmaddsubpd_ymm:
; KNL: # %bb.0:
; KNL-NEXT: vfmaddsub213pd %ymm2, %ymm1, %ymm0 # sched: [5:0.50]
-; KNL-NEXT: vfmaddsub213pd (%rdi), %ymm1, %ymm0 # sched: [5:0.50]
-; KNL-NEXT: retq # sched: [2:1.00]
+; KNL-NEXT: vfmaddsub213pd (%rdi), %ymm1, %ymm0 # sched: [12:0.50]
+; KNL-NEXT: retq # sched: [7:1.00]
;
; SKX-LABEL: test_vfmaddsubpd_ymm:
; SKX: # %bb.0:
; HASWELL-LABEL: test_vfmaddsubps:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vfmaddsub213ps %xmm2, %xmm1, %xmm0 # sched: [5:0.50]
-; HASWELL-NEXT: vfmaddsub213ps (%rdi), %xmm1, %xmm0 # sched: [5:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vfmaddsub213ps (%rdi), %xmm1, %xmm0 # sched: [11:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_vfmaddsubps:
; BROADWELL: # %bb.0:
; KNL-LABEL: test_vfmaddsubps:
; KNL: # %bb.0:
; KNL-NEXT: vfmaddsub213ps %xmm2, %xmm1, %xmm0 # sched: [5:0.50]
-; KNL-NEXT: vfmaddsub213ps (%rdi), %xmm1, %xmm0 # sched: [5:0.50]
-; KNL-NEXT: retq # sched: [2:1.00]
+; KNL-NEXT: vfmaddsub213ps (%rdi), %xmm1, %xmm0 # sched: [11:0.50]
+; KNL-NEXT: retq # sched: [7:1.00]
;
; SKX-LABEL: test_vfmaddsubps:
; SKX: # %bb.0:
; HASWELL-LABEL: test_vfmaddsubps_ymm:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vfmaddsub213ps %ymm2, %ymm1, %ymm0 # sched: [5:0.50]
-; HASWELL-NEXT: vfmaddsub213ps (%rdi), %ymm1, %ymm0 # sched: [5:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vfmaddsub213ps (%rdi), %ymm1, %ymm0 # sched: [12:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_vfmaddsubps_ymm:
; BROADWELL: # %bb.0:
; KNL-LABEL: test_vfmaddsubps_ymm:
; KNL: # %bb.0:
; KNL-NEXT: vfmaddsub213ps %ymm2, %ymm1, %ymm0 # sched: [5:0.50]
-; KNL-NEXT: vfmaddsub213ps (%rdi), %ymm1, %ymm0 # sched: [5:0.50]
-; KNL-NEXT: retq # sched: [2:1.00]
+; KNL-NEXT: vfmaddsub213ps (%rdi), %ymm1, %ymm0 # sched: [12:0.50]
+; KNL-NEXT: retq # sched: [7:1.00]
;
; SKX-LABEL: test_vfmaddsubps_ymm:
; SKX: # %bb.0:
; HASWELL-LABEL: test_vfmsubaddpd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vfmsubadd213pd %xmm2, %xmm1, %xmm0 # sched: [5:0.50]
-; HASWELL-NEXT: vfmsubadd213pd (%rdi), %xmm1, %xmm0 # sched: [5:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vfmsubadd213pd (%rdi), %xmm1, %xmm0 # sched: [11:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_vfmsubaddpd:
; BROADWELL: # %bb.0:
; KNL-LABEL: test_vfmsubaddpd:
; KNL: # %bb.0:
; KNL-NEXT: vfmsubadd213pd %xmm2, %xmm1, %xmm0 # sched: [5:0.50]
-; KNL-NEXT: vfmsubadd213pd (%rdi), %xmm1, %xmm0 # sched: [5:0.50]
-; KNL-NEXT: retq # sched: [2:1.00]
+; KNL-NEXT: vfmsubadd213pd (%rdi), %xmm1, %xmm0 # sched: [11:0.50]
+; KNL-NEXT: retq # sched: [7:1.00]
;
; SKX-LABEL: test_vfmsubaddpd:
; SKX: # %bb.0:
; HASWELL-LABEL: test_vfmsubaddpd_ymm:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vfmsubadd213pd %ymm2, %ymm1, %ymm0 # sched: [5:0.50]
-; HASWELL-NEXT: vfmsubadd213pd (%rdi), %ymm1, %ymm0 # sched: [5:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vfmsubadd213pd (%rdi), %ymm1, %ymm0 # sched: [12:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_vfmsubaddpd_ymm:
; BROADWELL: # %bb.0:
; KNL-LABEL: test_vfmsubaddpd_ymm:
; KNL: # %bb.0:
; KNL-NEXT: vfmsubadd213pd %ymm2, %ymm1, %ymm0 # sched: [5:0.50]
-; KNL-NEXT: vfmsubadd213pd (%rdi), %ymm1, %ymm0 # sched: [5:0.50]
-; KNL-NEXT: retq # sched: [2:1.00]
+; KNL-NEXT: vfmsubadd213pd (%rdi), %ymm1, %ymm0 # sched: [12:0.50]
+; KNL-NEXT: retq # sched: [7:1.00]
;
; SKX-LABEL: test_vfmsubaddpd_ymm:
; SKX: # %bb.0:
; HASWELL-LABEL: test_vfmsubaddps:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vfmsubadd213ps %xmm2, %xmm1, %xmm0 # sched: [5:0.50]
-; HASWELL-NEXT: vfmsubadd213ps (%rdi), %xmm1, %xmm0 # sched: [5:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vfmsubadd213ps (%rdi), %xmm1, %xmm0 # sched: [11:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_vfmsubaddps:
; BROADWELL: # %bb.0:
; KNL-LABEL: test_vfmsubaddps:
; KNL: # %bb.0:
; KNL-NEXT: vfmsubadd213ps %xmm2, %xmm1, %xmm0 # sched: [5:0.50]
-; KNL-NEXT: vfmsubadd213ps (%rdi), %xmm1, %xmm0 # sched: [5:0.50]
-; KNL-NEXT: retq # sched: [2:1.00]
+; KNL-NEXT: vfmsubadd213ps (%rdi), %xmm1, %xmm0 # sched: [11:0.50]
+; KNL-NEXT: retq # sched: [7:1.00]
;
; SKX-LABEL: test_vfmsubaddps:
; SKX: # %bb.0:
; HASWELL-LABEL: test_vfmsubaddps_ymm:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vfmsubadd213ps %ymm2, %ymm1, %ymm0 # sched: [5:0.50]
-; HASWELL-NEXT: vfmsubadd213ps (%rdi), %ymm1, %ymm0 # sched: [5:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vfmsubadd213ps (%rdi), %ymm1, %ymm0 # sched: [12:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_vfmsubaddps_ymm:
; BROADWELL: # %bb.0:
; KNL-LABEL: test_vfmsubaddps_ymm:
; KNL: # %bb.0:
; KNL-NEXT: vfmsubadd213ps %ymm2, %ymm1, %ymm0 # sched: [5:0.50]
-; KNL-NEXT: vfmsubadd213ps (%rdi), %ymm1, %ymm0 # sched: [5:0.50]
-; KNL-NEXT: retq # sched: [2:1.00]
+; KNL-NEXT: vfmsubadd213ps (%rdi), %ymm1, %ymm0 # sched: [12:0.50]
+; KNL-NEXT: retq # sched: [7:1.00]
;
; SKX-LABEL: test_vfmsubaddps_ymm:
; SKX: # %bb.0:
; HASWELL-LABEL: test_vfmsub213pd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vfmsub213pd %xmm2, %xmm1, %xmm0 # sched: [5:0.50]
-; HASWELL-NEXT: vfmsub213pd (%rdi), %xmm1, %xmm0 # sched: [5:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vfmsub213pd (%rdi), %xmm1, %xmm0 # sched: [11:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_vfmsub213pd:
; BROADWELL: # %bb.0:
; KNL-LABEL: test_vfmsub213pd:
; KNL: # %bb.0:
; KNL-NEXT: vfmsub213pd %xmm2, %xmm1, %xmm0 # sched: [5:0.50]
-; KNL-NEXT: vfmsub213pd (%rdi), %xmm1, %xmm0 # sched: [5:0.50]
-; KNL-NEXT: retq # sched: [2:1.00]
+; KNL-NEXT: vfmsub213pd (%rdi), %xmm1, %xmm0 # sched: [11:0.50]
+; KNL-NEXT: retq # sched: [7:1.00]
;
; SKX-LABEL: test_vfmsub213pd:
; SKX: # %bb.0:
; HASWELL-LABEL: test_vfmsub213pd_ymm:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vfmsub213pd %ymm2, %ymm1, %ymm0 # sched: [5:0.50]
-; HASWELL-NEXT: vfmsub213pd (%rdi), %ymm1, %ymm0 # sched: [5:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vfmsub213pd (%rdi), %ymm1, %ymm0 # sched: [12:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_vfmsub213pd_ymm:
; BROADWELL: # %bb.0:
; KNL-LABEL: test_vfmsub213pd_ymm:
; KNL: # %bb.0:
; KNL-NEXT: vfmsub213pd %ymm2, %ymm1, %ymm0 # sched: [5:0.50]
-; KNL-NEXT: vfmsub213pd (%rdi), %ymm1, %ymm0 # sched: [5:0.50]
-; KNL-NEXT: retq # sched: [2:1.00]
+; KNL-NEXT: vfmsub213pd (%rdi), %ymm1, %ymm0 # sched: [12:0.50]
+; KNL-NEXT: retq # sched: [7:1.00]
;
; SKX-LABEL: test_vfmsub213pd_ymm:
; SKX: # %bb.0:
; HASWELL-LABEL: test_vfmsub213ps:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vfmsub213ps %xmm2, %xmm1, %xmm0 # sched: [5:0.50]
-; HASWELL-NEXT: vfmsub213ps (%rdi), %xmm1, %xmm0 # sched: [5:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vfmsub213ps (%rdi), %xmm1, %xmm0 # sched: [11:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_vfmsub213ps:
; BROADWELL: # %bb.0:
; KNL-LABEL: test_vfmsub213ps:
; KNL: # %bb.0:
; KNL-NEXT: vfmsub213ps %xmm2, %xmm1, %xmm0 # sched: [5:0.50]
-; KNL-NEXT: vfmsub213ps (%rdi), %xmm1, %xmm0 # sched: [5:0.50]
-; KNL-NEXT: retq # sched: [2:1.00]
+; KNL-NEXT: vfmsub213ps (%rdi), %xmm1, %xmm0 # sched: [11:0.50]
+; KNL-NEXT: retq # sched: [7:1.00]
;
; SKX-LABEL: test_vfmsub213ps:
; SKX: # %bb.0:
; HASWELL-LABEL: test_vfmsub213ps_ymm:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vfmsub213ps %ymm2, %ymm1, %ymm0 # sched: [5:0.50]
-; HASWELL-NEXT: vfmsub213ps (%rdi), %ymm1, %ymm0 # sched: [5:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vfmsub213ps (%rdi), %ymm1, %ymm0 # sched: [12:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_vfmsub213ps_ymm:
; BROADWELL: # %bb.0:
; KNL-LABEL: test_vfmsub213ps_ymm:
; KNL: # %bb.0:
; KNL-NEXT: vfmsub213ps %ymm2, %ymm1, %ymm0 # sched: [5:0.50]
-; KNL-NEXT: vfmsub213ps (%rdi), %ymm1, %ymm0 # sched: [5:0.50]
-; KNL-NEXT: retq # sched: [2:1.00]
+; KNL-NEXT: vfmsub213ps (%rdi), %ymm1, %ymm0 # sched: [12:0.50]
+; KNL-NEXT: retq # sched: [7:1.00]
;
; SKX-LABEL: test_vfmsub213ps_ymm:
; SKX: # %bb.0:
; HASWELL-LABEL: test_vfmsub213sd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vfmsub213sd %xmm2, %xmm1, %xmm0 # sched: [5:0.50]
-; HASWELL-NEXT: vfmsub213sd (%rdi), %xmm1, %xmm0 # sched: [5:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vfmsub213sd (%rdi), %xmm1, %xmm0 # sched: [10:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_vfmsub213sd:
; BROADWELL: # %bb.0:
; KNL-LABEL: test_vfmsub213sd:
; KNL: # %bb.0:
; KNL-NEXT: vfmsub213sd %xmm2, %xmm1, %xmm0 # sched: [5:0.50]
-; KNL-NEXT: vfmsub213sd (%rdi), %xmm1, %xmm0 # sched: [5:0.50]
-; KNL-NEXT: retq # sched: [2:1.00]
+; KNL-NEXT: vfmsub213sd (%rdi), %xmm1, %xmm0 # sched: [10:0.50]
+; KNL-NEXT: retq # sched: [7:1.00]
;
; SKX-LABEL: test_vfmsub213sd:
; SKX: # %bb.0:
; HASWELL-LABEL: test_vfmsub213ss:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vfmsub213ss %xmm2, %xmm1, %xmm0 # sched: [5:0.50]
-; HASWELL-NEXT: vfmsub213ss (%rdi), %xmm1, %xmm0 # sched: [5:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vfmsub213ss (%rdi), %xmm1, %xmm0 # sched: [10:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_vfmsub213ss:
; BROADWELL: # %bb.0:
; KNL-LABEL: test_vfmsub213ss:
; KNL: # %bb.0:
; KNL-NEXT: vfmsub213ss %xmm2, %xmm1, %xmm0 # sched: [5:0.50]
-; KNL-NEXT: vfmsub213ss (%rdi), %xmm1, %xmm0 # sched: [5:0.50]
-; KNL-NEXT: retq # sched: [2:1.00]
+; KNL-NEXT: vfmsub213ss (%rdi), %xmm1, %xmm0 # sched: [10:0.50]
+; KNL-NEXT: retq # sched: [7:1.00]
;
; SKX-LABEL: test_vfmsub213ss:
; SKX: # %bb.0:
; HASWELL-LABEL: test_vfnmadd213pd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vfnmadd213pd %xmm2, %xmm1, %xmm0 # sched: [5:0.50]
-; HASWELL-NEXT: vfnmadd213pd (%rdi), %xmm1, %xmm0 # sched: [5:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vfnmadd213pd (%rdi), %xmm1, %xmm0 # sched: [11:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_vfnmadd213pd:
; BROADWELL: # %bb.0:
; KNL-LABEL: test_vfnmadd213pd:
; KNL: # %bb.0:
; KNL-NEXT: vfnmadd213pd %xmm2, %xmm1, %xmm0 # sched: [5:0.50]
-; KNL-NEXT: vfnmadd213pd (%rdi), %xmm1, %xmm0 # sched: [5:0.50]
-; KNL-NEXT: retq # sched: [2:1.00]
+; KNL-NEXT: vfnmadd213pd (%rdi), %xmm1, %xmm0 # sched: [11:0.50]
+; KNL-NEXT: retq # sched: [7:1.00]
;
; SKX-LABEL: test_vfnmadd213pd:
; SKX: # %bb.0:
; HASWELL-LABEL: test_vfnmadd213pd_ymm:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vfnmadd213pd %ymm2, %ymm1, %ymm0 # sched: [5:0.50]
-; HASWELL-NEXT: vfnmadd213pd (%rdi), %ymm1, %ymm0 # sched: [5:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vfnmadd213pd (%rdi), %ymm1, %ymm0 # sched: [12:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_vfnmadd213pd_ymm:
; BROADWELL: # %bb.0:
; KNL-LABEL: test_vfnmadd213pd_ymm:
; KNL: # %bb.0:
; KNL-NEXT: vfnmadd213pd %ymm2, %ymm1, %ymm0 # sched: [5:0.50]
-; KNL-NEXT: vfnmadd213pd (%rdi), %ymm1, %ymm0 # sched: [5:0.50]
-; KNL-NEXT: retq # sched: [2:1.00]
+; KNL-NEXT: vfnmadd213pd (%rdi), %ymm1, %ymm0 # sched: [12:0.50]
+; KNL-NEXT: retq # sched: [7:1.00]
;
; SKX-LABEL: test_vfnmadd213pd_ymm:
; SKX: # %bb.0:
; HASWELL-LABEL: test_vfnmadd213ps:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vfnmadd213ps %xmm2, %xmm1, %xmm0 # sched: [5:0.50]
-; HASWELL-NEXT: vfnmadd213ps (%rdi), %xmm1, %xmm0 # sched: [5:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vfnmadd213ps (%rdi), %xmm1, %xmm0 # sched: [11:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_vfnmadd213ps:
; BROADWELL: # %bb.0:
; KNL-LABEL: test_vfnmadd213ps:
; KNL: # %bb.0:
; KNL-NEXT: vfnmadd213ps %xmm2, %xmm1, %xmm0 # sched: [5:0.50]
-; KNL-NEXT: vfnmadd213ps (%rdi), %xmm1, %xmm0 # sched: [5:0.50]
-; KNL-NEXT: retq # sched: [2:1.00]
+; KNL-NEXT: vfnmadd213ps (%rdi), %xmm1, %xmm0 # sched: [11:0.50]
+; KNL-NEXT: retq # sched: [7:1.00]
;
; SKX-LABEL: test_vfnmadd213ps:
; SKX: # %bb.0:
; HASWELL-LABEL: test_vfnmadd213ps_ymm:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vfnmadd213ps %ymm2, %ymm1, %ymm0 # sched: [5:0.50]
-; HASWELL-NEXT: vfnmadd213ps (%rdi), %ymm1, %ymm0 # sched: [5:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vfnmadd213ps (%rdi), %ymm1, %ymm0 # sched: [12:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_vfnmadd213ps_ymm:
; BROADWELL: # %bb.0:
; KNL-LABEL: test_vfnmadd213ps_ymm:
; KNL: # %bb.0:
; KNL-NEXT: vfnmadd213ps %ymm2, %ymm1, %ymm0 # sched: [5:0.50]
-; KNL-NEXT: vfnmadd213ps (%rdi), %ymm1, %ymm0 # sched: [5:0.50]
-; KNL-NEXT: retq # sched: [2:1.00]
+; KNL-NEXT: vfnmadd213ps (%rdi), %ymm1, %ymm0 # sched: [12:0.50]
+; KNL-NEXT: retq # sched: [7:1.00]
;
; SKX-LABEL: test_vfnmadd213ps_ymm:
; SKX: # %bb.0:
; HASWELL-LABEL: test_vfnmadd213sd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vfnmadd213sd %xmm2, %xmm1, %xmm0 # sched: [5:0.50]
-; HASWELL-NEXT: vfnmadd213sd (%rdi), %xmm1, %xmm0 # sched: [5:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vfnmadd213sd (%rdi), %xmm1, %xmm0 # sched: [10:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_vfnmadd213sd:
; BROADWELL: # %bb.0:
; KNL-LABEL: test_vfnmadd213sd:
; KNL: # %bb.0:
; KNL-NEXT: vfnmadd213sd %xmm2, %xmm1, %xmm0 # sched: [5:0.50]
-; KNL-NEXT: vfnmadd213sd (%rdi), %xmm1, %xmm0 # sched: [5:0.50]
-; KNL-NEXT: retq # sched: [2:1.00]
+; KNL-NEXT: vfnmadd213sd (%rdi), %xmm1, %xmm0 # sched: [10:0.50]
+; KNL-NEXT: retq # sched: [7:1.00]
;
; SKX-LABEL: test_vfnmadd213sd:
; SKX: # %bb.0:
; HASWELL-LABEL: test_vfnmadd213ss:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vfnmadd213ss %xmm2, %xmm1, %xmm0 # sched: [5:0.50]
-; HASWELL-NEXT: vfnmadd213ss (%rdi), %xmm1, %xmm0 # sched: [5:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vfnmadd213ss (%rdi), %xmm1, %xmm0 # sched: [10:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_vfnmadd213ss:
; BROADWELL: # %bb.0:
; KNL-LABEL: test_vfnmadd213ss:
; KNL: # %bb.0:
; KNL-NEXT: vfnmadd213ss %xmm2, %xmm1, %xmm0 # sched: [5:0.50]
-; KNL-NEXT: vfnmadd213ss (%rdi), %xmm1, %xmm0 # sched: [5:0.50]
-; KNL-NEXT: retq # sched: [2:1.00]
+; KNL-NEXT: vfnmadd213ss (%rdi), %xmm1, %xmm0 # sched: [10:0.50]
+; KNL-NEXT: retq # sched: [7:1.00]
;
; SKX-LABEL: test_vfnmadd213ss:
; SKX: # %bb.0:
; HASWELL-LABEL: test_vfnmsub213pd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vfnmsub213pd %xmm2, %xmm1, %xmm0 # sched: [5:0.50]
-; HASWELL-NEXT: vfnmsub213pd (%rdi), %xmm1, %xmm0 # sched: [5:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vfnmsub213pd (%rdi), %xmm1, %xmm0 # sched: [11:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_vfnmsub213pd:
; BROADWELL: # %bb.0:
; KNL-LABEL: test_vfnmsub213pd:
; KNL: # %bb.0:
; KNL-NEXT: vfnmsub213pd %xmm2, %xmm1, %xmm0 # sched: [5:0.50]
-; KNL-NEXT: vfnmsub213pd (%rdi), %xmm1, %xmm0 # sched: [5:0.50]
-; KNL-NEXT: retq # sched: [2:1.00]
+; KNL-NEXT: vfnmsub213pd (%rdi), %xmm1, %xmm0 # sched: [11:0.50]
+; KNL-NEXT: retq # sched: [7:1.00]
;
; SKX-LABEL: test_vfnmsub213pd:
; SKX: # %bb.0:
; HASWELL-LABEL: test_vfnmsub213pd_ymm:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vfnmsub213pd %ymm2, %ymm1, %ymm0 # sched: [5:0.50]
-; HASWELL-NEXT: vfnmsub213pd (%rdi), %ymm1, %ymm0 # sched: [5:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vfnmsub213pd (%rdi), %ymm1, %ymm0 # sched: [12:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_vfnmsub213pd_ymm:
; BROADWELL: # %bb.0:
; KNL-LABEL: test_vfnmsub213pd_ymm:
; KNL: # %bb.0:
; KNL-NEXT: vfnmsub213pd %ymm2, %ymm1, %ymm0 # sched: [5:0.50]
-; KNL-NEXT: vfnmsub213pd (%rdi), %ymm1, %ymm0 # sched: [5:0.50]
-; KNL-NEXT: retq # sched: [2:1.00]
+; KNL-NEXT: vfnmsub213pd (%rdi), %ymm1, %ymm0 # sched: [12:0.50]
+; KNL-NEXT: retq # sched: [7:1.00]
;
; SKX-LABEL: test_vfnmsub213pd_ymm:
; SKX: # %bb.0:
; HASWELL-LABEL: test_vfnmsub213ps:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vfnmsub213ps %xmm2, %xmm1, %xmm0 # sched: [5:0.50]
-; HASWELL-NEXT: vfnmsub213ps (%rdi), %xmm1, %xmm0 # sched: [5:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vfnmsub213ps (%rdi), %xmm1, %xmm0 # sched: [11:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_vfnmsub213ps:
; BROADWELL: # %bb.0:
; KNL-LABEL: test_vfnmsub213ps:
; KNL: # %bb.0:
; KNL-NEXT: vfnmsub213ps %xmm2, %xmm1, %xmm0 # sched: [5:0.50]
-; KNL-NEXT: vfnmsub213ps (%rdi), %xmm1, %xmm0 # sched: [5:0.50]
-; KNL-NEXT: retq # sched: [2:1.00]
+; KNL-NEXT: vfnmsub213ps (%rdi), %xmm1, %xmm0 # sched: [11:0.50]
+; KNL-NEXT: retq # sched: [7:1.00]
;
; SKX-LABEL: test_vfnmsub213ps:
; SKX: # %bb.0:
; HASWELL-LABEL: test_vfnmsub213ps_ymm:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vfnmsub213ps %ymm2, %ymm1, %ymm0 # sched: [5:0.50]
-; HASWELL-NEXT: vfnmsub213ps (%rdi), %ymm1, %ymm0 # sched: [5:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vfnmsub213ps (%rdi), %ymm1, %ymm0 # sched: [12:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_vfnmsub213ps_ymm:
; BROADWELL: # %bb.0:
; KNL-LABEL: test_vfnmsub213ps_ymm:
; KNL: # %bb.0:
; KNL-NEXT: vfnmsub213ps %ymm2, %ymm1, %ymm0 # sched: [5:0.50]
-; KNL-NEXT: vfnmsub213ps (%rdi), %ymm1, %ymm0 # sched: [5:0.50]
-; KNL-NEXT: retq # sched: [2:1.00]
+; KNL-NEXT: vfnmsub213ps (%rdi), %ymm1, %ymm0 # sched: [12:0.50]
+; KNL-NEXT: retq # sched: [7:1.00]
;
; SKX-LABEL: test_vfnmsub213ps_ymm:
; SKX: # %bb.0:
; HASWELL-LABEL: test_vfnmsub213sd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vfnmsub213sd %xmm2, %xmm1, %xmm0 # sched: [5:0.50]
-; HASWELL-NEXT: vfnmsub213sd (%rdi), %xmm1, %xmm0 # sched: [5:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vfnmsub213sd (%rdi), %xmm1, %xmm0 # sched: [10:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_vfnmsub213sd:
; BROADWELL: # %bb.0:
; KNL-LABEL: test_vfnmsub213sd:
; KNL: # %bb.0:
; KNL-NEXT: vfnmsub213sd %xmm2, %xmm1, %xmm0 # sched: [5:0.50]
-; KNL-NEXT: vfnmsub213sd (%rdi), %xmm1, %xmm0 # sched: [5:0.50]
-; KNL-NEXT: retq # sched: [2:1.00]
+; KNL-NEXT: vfnmsub213sd (%rdi), %xmm1, %xmm0 # sched: [10:0.50]
+; KNL-NEXT: retq # sched: [7:1.00]
;
; SKX-LABEL: test_vfnmsub213sd:
; SKX: # %bb.0:
; HASWELL-LABEL: test_vfnmsub213ss:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vfnmsub213ss %xmm2, %xmm1, %xmm0 # sched: [5:0.50]
-; HASWELL-NEXT: vfnmsub213ss (%rdi), %xmm1, %xmm0 # sched: [5:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vfnmsub213ss (%rdi), %xmm1, %xmm0 # sched: [10:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_vfnmsub213ss:
; BROADWELL: # %bb.0:
; KNL-LABEL: test_vfnmsub213ss:
; KNL: # %bb.0:
; KNL-NEXT: vfnmsub213ss %xmm2, %xmm1, %xmm0 # sched: [5:0.50]
-; KNL-NEXT: vfnmsub213ss (%rdi), %xmm1, %xmm0 # sched: [5:0.50]
-; KNL-NEXT: retq # sched: [2:1.00]
+; KNL-NEXT: vfnmsub213ss (%rdi), %xmm1, %xmm0 # sched: [10:0.50]
+; KNL-NEXT: retq # sched: [7:1.00]
;
; SKX-LABEL: test_vfnmsub213ss:
; SKX: # %bb.0:
; HASWELL: # %bb.0:
; HASWELL-NEXT: # kill: def %edi killed %edi def %rdi
; HASWELL-NEXT: leal -24(%rdi), %eax # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_lea_offset:
; BROADWELL: # %bb.0:
; HASWELL: # %bb.0:
; HASWELL-NEXT: # kill: def %edi killed %edi def %rdi
; HASWELL-NEXT: leal 1024(%rdi), %eax # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_lea_offset_big:
; BROADWELL: # %bb.0:
; HASWELL-NEXT: # kill: def %esi killed %esi def %rsi
; HASWELL-NEXT: # kill: def %edi killed %edi def %rdi
; HASWELL-NEXT: leal (%rdi,%rsi), %eax # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_lea_add:
; BROADWELL: # %bb.0:
; HASWELL-NEXT: # kill: def %edi killed %edi def %rdi
; HASWELL-NEXT: leal (%rdi,%rsi), %eax # sched: [1:0.50]
; HASWELL-NEXT: addl $16, %eax # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_lea_add_offset:
; BROADWELL: # %bb.0:
; HASWELL-NEXT: leal (%rdi,%rsi), %eax # sched: [1:0.50]
; HASWELL-NEXT: addl $-4096, %eax # imm = 0xF000
; HASWELL-NEXT: # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_lea_add_offset_big:
; BROADWELL: # %bb.0:
; HASWELL: # %bb.0:
; HASWELL-NEXT: # kill: def %edi killed %edi def %rdi
; HASWELL-NEXT: leal (%rdi,%rdi,2), %eax # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_lea_mul:
; BROADWELL: # %bb.0:
; HASWELL-NEXT: # kill: def %edi killed %edi def %rdi
; HASWELL-NEXT: leal (%rdi,%rdi,2), %eax # sched: [1:0.50]
; HASWELL-NEXT: addl $-32, %eax # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_lea_mul_offset:
; BROADWELL: # %bb.0:
; HASWELL-NEXT: leal (%rdi,%rdi,8), %eax # sched: [1:0.50]
; HASWELL-NEXT: addl $10000, %eax # imm = 0x2710
; HASWELL-NEXT: # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_lea_mul_offset_big:
; BROADWELL: # %bb.0:
; HASWELL-NEXT: # kill: def %esi killed %esi def %rsi
; HASWELL-NEXT: # kill: def %edi killed %edi def %rdi
; HASWELL-NEXT: leal (%rdi,%rsi,2), %eax # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_lea_add_scale:
; BROADWELL: # %bb.0:
; HASWELL-NEXT: # kill: def %edi killed %edi def %rdi
; HASWELL-NEXT: leal (%rdi,%rsi,4), %eax # sched: [1:0.50]
; HASWELL-NEXT: addl $96, %eax # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_lea_add_scale_offset:
; BROADWELL: # %bb.0:
; HASWELL-NEXT: leal (%rdi,%rsi,8), %eax # sched: [1:0.50]
; HASWELL-NEXT: addl $-1200, %eax # imm = 0xFB50
; HASWELL-NEXT: # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_lea_add_scale_offset_big:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_lea_offset:
; HASWELL: # %bb.0:
; HASWELL-NEXT: leaq -24(%rdi), %rax # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_lea_offset:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_lea_offset_big:
; HASWELL: # %bb.0:
; HASWELL-NEXT: leaq 1024(%rdi), %rax # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_lea_offset_big:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_lea_add:
; HASWELL: # %bb.0:
; HASWELL-NEXT: leaq (%rdi,%rsi), %rax # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_lea_add:
; BROADWELL: # %bb.0:
; HASWELL: # %bb.0:
; HASWELL-NEXT: leaq (%rdi,%rsi), %rax # sched: [1:0.50]
; HASWELL-NEXT: addq $16, %rax # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_lea_add_offset:
; BROADWELL: # %bb.0:
; HASWELL-NEXT: leaq (%rdi,%rsi), %rax # sched: [1:0.50]
; HASWELL-NEXT: addq $-4096, %rax # imm = 0xF000
; HASWELL-NEXT: # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_lea_add_offset_big:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_lea_mul:
; HASWELL: # %bb.0:
; HASWELL-NEXT: leaq (%rdi,%rdi,2), %rax # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_lea_mul:
; BROADWELL: # %bb.0:
; HASWELL: # %bb.0:
; HASWELL-NEXT: leaq (%rdi,%rdi,2), %rax # sched: [1:0.50]
; HASWELL-NEXT: addq $-32, %rax # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_lea_mul_offset:
; BROADWELL: # %bb.0:
; HASWELL-NEXT: leaq (%rdi,%rdi,8), %rax # sched: [1:0.50]
; HASWELL-NEXT: addq $10000, %rax # imm = 0x2710
; HASWELL-NEXT: # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_lea_mul_offset_big:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_lea_add_scale:
; HASWELL: # %bb.0:
; HASWELL-NEXT: leaq (%rdi,%rsi,2), %rax # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_lea_add_scale:
; BROADWELL: # %bb.0:
; HASWELL: # %bb.0:
; HASWELL-NEXT: leaq (%rdi,%rsi,4), %rax # sched: [1:0.50]
; HASWELL-NEXT: addq $96, %rax # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_lea_add_scale_offset:
; BROADWELL: # %bb.0:
; HASWELL-NEXT: leaq (%rdi,%rsi,8), %rax # sched: [1:0.50]
; HASWELL-NEXT: addq $-1200, %rax # imm = 0xFB50
; HASWELL-NEXT: # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_lea_add_scale_offset_big:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_ctlz_i16:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: lzcntw (%rsi), %cx # sched: [3:1.00]
+; HASWELL-NEXT: lzcntw (%rsi), %cx # sched: [8:1.00]
; HASWELL-NEXT: lzcntw %di, %ax # sched: [3:1.00]
; HASWELL-NEXT: orl %ecx, %eax # sched: [1:0.25]
; HASWELL-NEXT: # kill: def %ax killed %ax killed %eax
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_ctlz_i16:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_ctlz_i32:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: lzcntl (%rsi), %ecx # sched: [3:1.00]
+; HASWELL-NEXT: lzcntl (%rsi), %ecx # sched: [8:1.00]
; HASWELL-NEXT: lzcntl %edi, %eax # sched: [3:1.00]
; HASWELL-NEXT: orl %ecx, %eax # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_ctlz_i32:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_ctlz_i64:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: lzcntq (%rsi), %rcx # sched: [3:1.00]
+; HASWELL-NEXT: lzcntq (%rsi), %rcx # sched: [8:1.00]
; HASWELL-NEXT: lzcntq %rdi, %rax # sched: [3:1.00]
; HASWELL-NEXT: orq %rcx, %rax # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_ctlz_i64:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_cvtpd2pi:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: cvtpd2pi (%rdi), %mm0 # sched: [4:1.00]
+; HASWELL-NEXT: cvtpd2pi (%rdi), %mm0 # sched: [10:1.00]
; HASWELL-NEXT: cvtpd2pi %xmm0, %mm1 # sched: [4:1.00]
; HASWELL-NEXT: por %mm1, %mm0 # sched: [1:0.33]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_cvtpd2pi:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_cvtpi2pd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: cvtpi2pd %mm0, %xmm0 # sched: [4:1.00]
-; HASWELL-NEXT: cvtpi2pd (%rdi), %xmm1 # sched: [4:1.00]
+; HASWELL-NEXT: cvtpi2pd (%rdi), %xmm1 # sched: [9:1.00]
; HASWELL-NEXT: vaddpd %xmm1, %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_cvtpi2pd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_cvtpi2ps:
; HASWELL: # %bb.0:
; HASWELL-NEXT: cvtpi2ps %mm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: cvtpi2ps (%rdi), %xmm1 # sched: [3:1.00]
+; HASWELL-NEXT: cvtpi2ps (%rdi), %xmm1 # sched: [8:1.00]
; HASWELL-NEXT: vaddps %xmm1, %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_cvtpi2ps:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_cvtps2pi:
; HASWELL: # %bb.0:
; HASWELL-NEXT: cvtps2pi %xmm0, %mm0 # sched: [4:1.00]
-; HASWELL-NEXT: cvtps2pi (%rdi), %mm1 # sched: [3:1.00]
+; HASWELL-NEXT: cvtps2pi (%rdi), %mm1 # sched: [8:1.00]
; HASWELL-NEXT: por %mm0, %mm1 # sched: [1:0.33]
; HASWELL-NEXT: movd %mm1, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_cvtps2pi:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_cvttpd2pi:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: cvttpd2pi (%rdi), %mm0 # sched: [4:1.00]
+; HASWELL-NEXT: cvttpd2pi (%rdi), %mm0 # sched: [10:1.00]
; HASWELL-NEXT: cvttpd2pi %xmm0, %mm1 # sched: [4:1.00]
; HASWELL-NEXT: por %mm1, %mm0 # sched: [1:0.33]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_cvttpd2pi:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_cvttps2pi:
; HASWELL: # %bb.0:
; HASWELL-NEXT: cvttps2pi %xmm0, %mm0 # sched: [4:1.00]
-; HASWELL-NEXT: cvttps2pi (%rdi), %mm1 # sched: [3:1.00]
+; HASWELL-NEXT: cvttps2pi (%rdi), %mm1 # sched: [8:1.00]
; HASWELL-NEXT: por %mm0, %mm1 # sched: [1:0.33]
; HASWELL-NEXT: movd %mm1, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_cvttps2pi:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_emms:
; HASWELL: # %bb.0:
; HASWELL-NEXT: emms # sched: [31:10.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_emms:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_maskmovq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: maskmovq %mm1, %mm0 # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_maskmovq:
; BROADWELL: # %bb.0:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vmovd %edi, %xmm0 # sched: [1:1.00]
; HASWELL-NEXT: vmovq %xmm0, -{{[0-9]+}}(%rsp) # sched: [1:1.00]
-; HASWELL-NEXT: movq -{{[0-9]+}}(%rsp), %mm1 # sched: [1:0.50]
-; HASWELL-NEXT: vmovss {{.*#+}} xmm0 = mem[0],zero,zero,zero sched: [1:0.50]
+; HASWELL-NEXT: movq -{{[0-9]+}}(%rsp), %mm1 # sched: [5:0.50]
+; HASWELL-NEXT: vmovss {{.*#+}} xmm0 = mem[0],zero,zero,zero sched: [5:0.50]
; HASWELL-NEXT: vmovlps %xmm0, -{{[0-9]+}}(%rsp) # sched: [1:1.00]
-; HASWELL-NEXT: paddd -{{[0-9]+}}(%rsp), %mm1 # sched: [1:0.50]
+; HASWELL-NEXT: paddd -{{[0-9]+}}(%rsp), %mm1 # sched: [6:0.50]
; HASWELL-NEXT: paddd %mm1, %mm0 # sched: [1:0.50]
; HASWELL-NEXT: movd %mm1, %ecx # sched: [1:1.00]
; HASWELL-NEXT: movd %mm0, %eax # sched: [1:1.00]
; HASWELL-NEXT: movl %ecx, (%rsi) # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_movd:
; BROADWELL: # %bb.0:
; HASWELL-NEXT: movdq2q %xmm0, %mm0 # sched: [2:0.67]
; HASWELL-NEXT: paddd %mm0, %mm0 # sched: [1:0.50]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_movdq2q:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_movntq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: movntq %mm0, (%rdi) # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_movntq:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_movq:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: movq (%rdi), %mm0 # sched: [1:0.50]
+; HASWELL-NEXT: movq (%rdi), %mm0 # sched: [5:0.50]
; HASWELL-NEXT: paddd %mm0, %mm0 # sched: [1:0.50]
; HASWELL-NEXT: movq %mm0, (%rdi) # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_movq:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_movq2dq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: movq2dq %mm0, %xmm0 # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_movq2dq:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_pabsb:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: pabsb (%rdi), %mm0 # sched: [1:0.50]
+; HASWELL-NEXT: pabsb (%rdi), %mm0 # sched: [6:0.50]
; HASWELL-NEXT: pabsb %mm0, %mm0 # sched: [1:0.50]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pabsb:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_pabsd:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: pabsd (%rdi), %mm0 # sched: [1:0.50]
+; HASWELL-NEXT: pabsd (%rdi), %mm0 # sched: [6:0.50]
; HASWELL-NEXT: pabsd %mm0, %mm0 # sched: [1:0.50]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pabsd:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_pabsw:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: pabsw (%rdi), %mm0 # sched: [1:0.50]
+; HASWELL-NEXT: pabsw (%rdi), %mm0 # sched: [6:0.50]
; HASWELL-NEXT: pabsw %mm0, %mm0 # sched: [1:0.50]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pabsw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_packssdw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: packssdw %mm1, %mm0 # sched: [3:2.00]
-; HASWELL-NEXT: packssdw (%rdi), %mm0 # sched: [2:2.00]
+; HASWELL-NEXT: packssdw (%rdi), %mm0 # sched: [7:2.00]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_packssdw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_packsswb:
; HASWELL: # %bb.0:
; HASWELL-NEXT: packsswb %mm1, %mm0 # sched: [3:2.00]
-; HASWELL-NEXT: packsswb (%rdi), %mm0 # sched: [2:2.00]
+; HASWELL-NEXT: packsswb (%rdi), %mm0 # sched: [7:2.00]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_packsswb:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_packuswb:
; HASWELL: # %bb.0:
; HASWELL-NEXT: packuswb %mm1, %mm0 # sched: [3:2.00]
-; HASWELL-NEXT: packuswb (%rdi), %mm0 # sched: [2:2.00]
+; HASWELL-NEXT: packuswb (%rdi), %mm0 # sched: [7:2.00]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_packuswb:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_paddb:
; HASWELL: # %bb.0:
; HASWELL-NEXT: paddb %mm1, %mm0 # sched: [1:0.50]
-; HASWELL-NEXT: paddb (%rdi), %mm0 # sched: [1:0.50]
+; HASWELL-NEXT: paddb (%rdi), %mm0 # sched: [6:0.50]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_paddb:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_paddd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: paddd %mm1, %mm0 # sched: [1:0.50]
-; HASWELL-NEXT: paddd (%rdi), %mm0 # sched: [1:0.50]
+; HASWELL-NEXT: paddd (%rdi), %mm0 # sched: [6:0.50]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_paddd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_paddq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: paddq %mm1, %mm0 # sched: [1:0.50]
-; HASWELL-NEXT: paddq (%rdi), %mm0 # sched: [1:0.50]
+; HASWELL-NEXT: paddq (%rdi), %mm0 # sched: [6:0.50]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_paddq:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_paddsb:
; HASWELL: # %bb.0:
; HASWELL-NEXT: paddsb %mm1, %mm0 # sched: [1:0.50]
-; HASWELL-NEXT: paddsb (%rdi), %mm0 # sched: [1:0.50]
+; HASWELL-NEXT: paddsb (%rdi), %mm0 # sched: [6:0.50]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_paddsb:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_paddsw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: paddsw %mm1, %mm0 # sched: [1:0.50]
-; HASWELL-NEXT: paddsw (%rdi), %mm0 # sched: [1:0.50]
+; HASWELL-NEXT: paddsw (%rdi), %mm0 # sched: [6:0.50]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_paddsw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_paddusb:
; HASWELL: # %bb.0:
; HASWELL-NEXT: paddusb %mm1, %mm0 # sched: [1:0.50]
-; HASWELL-NEXT: paddusb (%rdi), %mm0 # sched: [1:0.50]
+; HASWELL-NEXT: paddusb (%rdi), %mm0 # sched: [6:0.50]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_paddusb:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_paddusw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: paddusw %mm1, %mm0 # sched: [1:0.50]
-; HASWELL-NEXT: paddusw (%rdi), %mm0 # sched: [1:0.50]
+; HASWELL-NEXT: paddusw (%rdi), %mm0 # sched: [6:0.50]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_paddusw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_paddw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: paddw %mm1, %mm0 # sched: [1:0.50]
-; HASWELL-NEXT: paddw (%rdi), %mm0 # sched: [1:0.50]
+; HASWELL-NEXT: paddw (%rdi), %mm0 # sched: [6:0.50]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_paddw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_palignr:
; HASWELL: # %bb.0:
; HASWELL-NEXT: palignr $1, %mm1, %mm0 # sched: [1:1.00]
-; HASWELL-NEXT: palignr $1, (%rdi), %mm0 # sched: [1:1.00]
+; HASWELL-NEXT: palignr $1, (%rdi), %mm0 # sched: [6:1.00]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_palignr:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pand:
; HASWELL: # %bb.0:
; HASWELL-NEXT: pand %mm1, %mm0 # sched: [1:0.33]
-; HASWELL-NEXT: pand (%rdi), %mm0 # sched: [1:0.50]
+; HASWELL-NEXT: pand (%rdi), %mm0 # sched: [6:0.50]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pand:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pandn:
; HASWELL: # %bb.0:
; HASWELL-NEXT: pandn %mm1, %mm0 # sched: [1:0.33]
-; HASWELL-NEXT: pandn (%rdi), %mm0 # sched: [1:0.50]
+; HASWELL-NEXT: pandn (%rdi), %mm0 # sched: [6:0.50]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pandn:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pavgb:
; HASWELL: # %bb.0:
; HASWELL-NEXT: pavgb %mm1, %mm0 # sched: [1:0.50]
-; HASWELL-NEXT: pavgb (%rdi), %mm0 # sched: [1:0.50]
+; HASWELL-NEXT: pavgb (%rdi), %mm0 # sched: [6:0.50]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pavgb:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pavgw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: pavgw %mm1, %mm0 # sched: [1:0.50]
-; HASWELL-NEXT: pavgw (%rdi), %mm0 # sched: [1:0.50]
+; HASWELL-NEXT: pavgw (%rdi), %mm0 # sched: [6:0.50]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pavgw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pcmpeqb:
; HASWELL: # %bb.0:
; HASWELL-NEXT: pcmpeqb %mm1, %mm0 # sched: [1:0.50]
-; HASWELL-NEXT: pcmpeqb (%rdi), %mm0 # sched: [1:0.50]
+; HASWELL-NEXT: pcmpeqb (%rdi), %mm0 # sched: [6:0.50]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pcmpeqb:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pcmpeqd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: pcmpeqd %mm1, %mm0 # sched: [1:0.50]
-; HASWELL-NEXT: pcmpeqd (%rdi), %mm0 # sched: [1:0.50]
+; HASWELL-NEXT: pcmpeqd (%rdi), %mm0 # sched: [6:0.50]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pcmpeqd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pcmpeqw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: pcmpeqw %mm1, %mm0 # sched: [1:0.50]
-; HASWELL-NEXT: pcmpeqw (%rdi), %mm0 # sched: [1:0.50]
+; HASWELL-NEXT: pcmpeqw (%rdi), %mm0 # sched: [6:0.50]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pcmpeqw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pcmpgtb:
; HASWELL: # %bb.0:
; HASWELL-NEXT: pcmpgtb %mm1, %mm0 # sched: [1:0.50]
-; HASWELL-NEXT: pcmpgtb (%rdi), %mm0 # sched: [1:0.50]
+; HASWELL-NEXT: pcmpgtb (%rdi), %mm0 # sched: [6:0.50]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pcmpgtb:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pcmpgtd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: pcmpgtd %mm1, %mm0 # sched: [1:0.50]
-; HASWELL-NEXT: pcmpgtd (%rdi), %mm0 # sched: [1:0.50]
+; HASWELL-NEXT: pcmpgtd (%rdi), %mm0 # sched: [6:0.50]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pcmpgtd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pcmpgtw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: pcmpgtw %mm1, %mm0 # sched: [1:0.50]
-; HASWELL-NEXT: pcmpgtw (%rdi), %mm0 # sched: [1:0.50]
+; HASWELL-NEXT: pcmpgtw (%rdi), %mm0 # sched: [6:0.50]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pcmpgtw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pextrw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: pextrw $0, %mm0, %eax # sched: [2:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pextrw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_phaddd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: phaddd %mm1, %mm0 # sched: [3:2.00]
-; HASWELL-NEXT: phaddd (%rdi), %mm0 # sched: [3:2.00]
+; HASWELL-NEXT: phaddd (%rdi), %mm0 # sched: [8:2.00]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_phaddd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_phaddsw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: phaddsw %mm1, %mm0 # sched: [3:2.00]
-; HASWELL-NEXT: phaddsw (%rdi), %mm0 # sched: [3:2.00]
+; HASWELL-NEXT: phaddsw (%rdi), %mm0 # sched: [8:2.00]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_phaddsw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_phaddw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: phaddw %mm1, %mm0 # sched: [3:2.00]
-; HASWELL-NEXT: phaddw (%rdi), %mm0 # sched: [3:2.00]
+; HASWELL-NEXT: phaddw (%rdi), %mm0 # sched: [8:2.00]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_phaddw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_phsubd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: phsubd %mm1, %mm0 # sched: [3:2.00]
-; HASWELL-NEXT: phsubd (%rdi), %mm0 # sched: [3:2.00]
+; HASWELL-NEXT: phsubd (%rdi), %mm0 # sched: [8:2.00]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_phsubd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_phsubsw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: phsubsw %mm1, %mm0 # sched: [3:2.00]
-; HASWELL-NEXT: phsubsw (%rdi), %mm0 # sched: [3:2.00]
+; HASWELL-NEXT: phsubsw (%rdi), %mm0 # sched: [8:2.00]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_phsubsw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_phsubw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: phsubw %mm1, %mm0 # sched: [3:2.00]
-; HASWELL-NEXT: phsubw (%rdi), %mm0 # sched: [3:2.00]
+; HASWELL-NEXT: phsubw (%rdi), %mm0 # sched: [8:2.00]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_phsubw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pinsrw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: pinsrw $0, %edi, %mm0 # sched: [2:2.00]
-; HASWELL-NEXT: movswl (%rsi), %eax # sched: [4:0.50]
+; HASWELL-NEXT: movswl (%rsi), %eax # sched: [5:0.50]
; HASWELL-NEXT: pinsrw $1, %eax, %mm0 # sched: [2:2.00]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pinsrw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pmaddwd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: pmaddwd %mm1, %mm0 # sched: [5:1.00]
-; HASWELL-NEXT: pmaddwd (%rdi), %mm0 # sched: [5:1.00]
+; HASWELL-NEXT: pmaddwd (%rdi), %mm0 # sched: [10:1.00]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmaddwd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pmaddubsw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: pmaddubsw %mm1, %mm0 # sched: [5:1.00]
-; HASWELL-NEXT: pmaddubsw (%rdi), %mm0 # sched: [5:1.00]
+; HASWELL-NEXT: pmaddubsw (%rdi), %mm0 # sched: [10:1.00]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmaddubsw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pmaxsw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: pmaxsw %mm1, %mm0 # sched: [1:0.50]
-; HASWELL-NEXT: pmaxsw (%rdi), %mm0 # sched: [1:0.50]
+; HASWELL-NEXT: pmaxsw (%rdi), %mm0 # sched: [6:0.50]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmaxsw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pmaxub:
; HASWELL: # %bb.0:
; HASWELL-NEXT: pmaxub %mm1, %mm0 # sched: [1:0.50]
-; HASWELL-NEXT: pmaxub (%rdi), %mm0 # sched: [1:0.50]
+; HASWELL-NEXT: pmaxub (%rdi), %mm0 # sched: [6:0.50]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmaxub:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pminsw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: pminsw %mm1, %mm0 # sched: [1:0.50]
-; HASWELL-NEXT: pminsw (%rdi), %mm0 # sched: [1:0.50]
+; HASWELL-NEXT: pminsw (%rdi), %mm0 # sched: [6:0.50]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pminsw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pminub:
; HASWELL: # %bb.0:
; HASWELL-NEXT: pminub %mm1, %mm0 # sched: [1:0.50]
-; HASWELL-NEXT: pminub (%rdi), %mm0 # sched: [1:0.50]
+; HASWELL-NEXT: pminub (%rdi), %mm0 # sched: [6:0.50]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pminub:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_pmovmskb:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: pmovmskb %mm0, %eax # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: pmovmskb %mm0, %eax # sched: [1:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmovmskb:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pmulhrsw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: pmulhrsw %mm1, %mm0 # sched: [5:1.00]
-; HASWELL-NEXT: pmulhrsw (%rdi), %mm0 # sched: [5:1.00]
+; HASWELL-NEXT: pmulhrsw (%rdi), %mm0 # sched: [10:1.00]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmulhrsw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pmulhw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: pmulhw %mm1, %mm0 # sched: [5:1.00]
-; HASWELL-NEXT: pmulhw (%rdi), %mm0 # sched: [5:1.00]
+; HASWELL-NEXT: pmulhw (%rdi), %mm0 # sched: [10:1.00]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmulhw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pmulhuw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: pmulhuw %mm1, %mm0 # sched: [5:1.00]
-; HASWELL-NEXT: pmulhuw (%rdi), %mm0 # sched: [5:1.00]
+; HASWELL-NEXT: pmulhuw (%rdi), %mm0 # sched: [10:1.00]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmulhuw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pmullw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: pmullw %mm1, %mm0 # sched: [5:1.00]
-; HASWELL-NEXT: pmullw (%rdi), %mm0 # sched: [5:1.00]
+; HASWELL-NEXT: pmullw (%rdi), %mm0 # sched: [10:1.00]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmullw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pmuludq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: pmuludq %mm1, %mm0 # sched: [5:1.00]
-; HASWELL-NEXT: pmuludq (%rdi), %mm0 # sched: [5:1.00]
+; HASWELL-NEXT: pmuludq (%rdi), %mm0 # sched: [10:1.00]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmuludq:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_por:
; HASWELL: # %bb.0:
; HASWELL-NEXT: por %mm1, %mm0 # sched: [1:0.33]
-; HASWELL-NEXT: por (%rdi), %mm0 # sched: [1:0.50]
+; HASWELL-NEXT: por (%rdi), %mm0 # sched: [6:0.50]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_por:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_psadbw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: psadbw %mm1, %mm0 # sched: [5:1.00]
-; HASWELL-NEXT: psadbw (%rdi), %mm0 # sched: [5:1.00]
+; HASWELL-NEXT: psadbw (%rdi), %mm0 # sched: [10:1.00]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_psadbw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pshufb:
; HASWELL: # %bb.0:
; HASWELL-NEXT: pshufb %mm1, %mm0 # sched: [1:1.00]
-; HASWELL-NEXT: pshufb (%rdi), %mm0 # sched: [1:1.00]
+; HASWELL-NEXT: pshufb (%rdi), %mm0 # sched: [6:1.00]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pshufb:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_pshufw:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: pshufw $0, (%rdi), %mm0 # mm0 = mem[0,0,0,0] sched: [1:1.00]
+; HASWELL-NEXT: pshufw $0, (%rdi), %mm0 # mm0 = mem[0,0,0,0] sched: [6:1.00]
; HASWELL-NEXT: pshufw $0, %mm0, %mm0 # mm0 = mm0[0,0,0,0] sched: [1:1.00]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pshufw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_psignb:
; HASWELL: # %bb.0:
; HASWELL-NEXT: psignb %mm1, %mm0 # sched: [1:0.50]
-; HASWELL-NEXT: psignb (%rdi), %mm0 # sched: [1:0.50]
+; HASWELL-NEXT: psignb (%rdi), %mm0 # sched: [6:0.50]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_psignb:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_psignd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: psignd %mm1, %mm0 # sched: [1:0.50]
-; HASWELL-NEXT: psignd (%rdi), %mm0 # sched: [1:0.50]
+; HASWELL-NEXT: psignd (%rdi), %mm0 # sched: [6:0.50]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_psignd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_psignw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: psignw %mm1, %mm0 # sched: [1:0.50]
-; HASWELL-NEXT: psignw (%rdi), %mm0 # sched: [1:0.50]
+; HASWELL-NEXT: psignw (%rdi), %mm0 # sched: [6:0.50]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_psignw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pslld:
; HASWELL: # %bb.0:
; HASWELL-NEXT: pslld %mm1, %mm0 # sched: [1:1.00]
-; HASWELL-NEXT: pslld (%rdi), %mm0 # sched: [1:1.00]
+; HASWELL-NEXT: pslld (%rdi), %mm0 # sched: [6:1.00]
; HASWELL-NEXT: pslld $7, %mm0 # sched: [1:1.00]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pslld:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_psllq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: psllq %mm1, %mm0 # sched: [1:1.00]
-; HASWELL-NEXT: psllq (%rdi), %mm0 # sched: [1:1.00]
+; HASWELL-NEXT: psllq (%rdi), %mm0 # sched: [6:1.00]
; HASWELL-NEXT: psllq $7, %mm0 # sched: [1:1.00]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_psllq:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_psllw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: psllw %mm1, %mm0 # sched: [1:1.00]
-; HASWELL-NEXT: psllw (%rdi), %mm0 # sched: [1:1.00]
+; HASWELL-NEXT: psllw (%rdi), %mm0 # sched: [6:1.00]
; HASWELL-NEXT: psllw $7, %mm0 # sched: [1:1.00]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_psllw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_psrad:
; HASWELL: # %bb.0:
; HASWELL-NEXT: psrad %mm1, %mm0 # sched: [1:1.00]
-; HASWELL-NEXT: psrad (%rdi), %mm0 # sched: [1:1.00]
+; HASWELL-NEXT: psrad (%rdi), %mm0 # sched: [6:1.00]
; HASWELL-NEXT: psrad $7, %mm0 # sched: [1:1.00]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_psrad:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_psraw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: psraw %mm1, %mm0 # sched: [1:1.00]
-; HASWELL-NEXT: psraw (%rdi), %mm0 # sched: [1:1.00]
+; HASWELL-NEXT: psraw (%rdi), %mm0 # sched: [6:1.00]
; HASWELL-NEXT: psraw $7, %mm0 # sched: [1:1.00]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_psraw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_psrld:
; HASWELL: # %bb.0:
; HASWELL-NEXT: psrld %mm1, %mm0 # sched: [1:1.00]
-; HASWELL-NEXT: psrld (%rdi), %mm0 # sched: [1:1.00]
+; HASWELL-NEXT: psrld (%rdi), %mm0 # sched: [6:1.00]
; HASWELL-NEXT: psrld $7, %mm0 # sched: [1:1.00]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_psrld:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_psrlq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: psrlq %mm1, %mm0 # sched: [1:1.00]
-; HASWELL-NEXT: psrlq (%rdi), %mm0 # sched: [1:1.00]
+; HASWELL-NEXT: psrlq (%rdi), %mm0 # sched: [6:1.00]
; HASWELL-NEXT: psrlq $7, %mm0 # sched: [1:1.00]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_psrlq:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_psrlw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: psrlw %mm1, %mm0 # sched: [1:1.00]
-; HASWELL-NEXT: psrlw (%rdi), %mm0 # sched: [1:1.00]
+; HASWELL-NEXT: psrlw (%rdi), %mm0 # sched: [6:1.00]
; HASWELL-NEXT: psrlw $7, %mm0 # sched: [1:1.00]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_psrlw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_psubb:
; HASWELL: # %bb.0:
; HASWELL-NEXT: psubb %mm1, %mm0 # sched: [1:0.50]
-; HASWELL-NEXT: psubb (%rdi), %mm0 # sched: [1:0.50]
+; HASWELL-NEXT: psubb (%rdi), %mm0 # sched: [6:0.50]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_psubb:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_psubd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: psubd %mm1, %mm0 # sched: [1:0.50]
-; HASWELL-NEXT: psubd (%rdi), %mm0 # sched: [1:0.50]
+; HASWELL-NEXT: psubd (%rdi), %mm0 # sched: [6:0.50]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_psubd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_psubq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: psubq %mm1, %mm0 # sched: [1:0.50]
-; HASWELL-NEXT: psubq (%rdi), %mm0 # sched: [1:0.50]
+; HASWELL-NEXT: psubq (%rdi), %mm0 # sched: [6:0.50]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_psubq:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_psubsb:
; HASWELL: # %bb.0:
; HASWELL-NEXT: psubsb %mm1, %mm0 # sched: [1:0.50]
-; HASWELL-NEXT: psubsb (%rdi), %mm0 # sched: [1:0.50]
+; HASWELL-NEXT: psubsb (%rdi), %mm0 # sched: [6:0.50]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_psubsb:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_psubsw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: psubsw %mm1, %mm0 # sched: [1:0.50]
-; HASWELL-NEXT: psubsw (%rdi), %mm0 # sched: [1:0.50]
+; HASWELL-NEXT: psubsw (%rdi), %mm0 # sched: [6:0.50]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_psubsw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_psubusb:
; HASWELL: # %bb.0:
; HASWELL-NEXT: psubusb %mm1, %mm0 # sched: [1:0.50]
-; HASWELL-NEXT: psubusb (%rdi), %mm0 # sched: [1:0.50]
+; HASWELL-NEXT: psubusb (%rdi), %mm0 # sched: [6:0.50]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_psubusb:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_psubusw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: psubusw %mm1, %mm0 # sched: [1:0.50]
-; HASWELL-NEXT: psubusw (%rdi), %mm0 # sched: [1:0.50]
+; HASWELL-NEXT: psubusw (%rdi), %mm0 # sched: [6:0.50]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_psubusw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_psubw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: psubw %mm1, %mm0 # sched: [1:0.50]
-; HASWELL-NEXT: psubw (%rdi), %mm0 # sched: [1:0.50]
+; HASWELL-NEXT: psubw (%rdi), %mm0 # sched: [6:0.50]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_psubw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_punpckhbw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: punpckhbw %mm1, %mm0 # mm0 = mm0[4],mm1[4],mm0[5],mm1[5],mm0[6],mm1[6],mm0[7],mm1[7] sched: [1:1.00]
-; HASWELL-NEXT: punpckhbw (%rdi), %mm0 # mm0 = mm0[4],mem[4],mm0[5],mem[5],mm0[6],mem[6],mm0[7],mem[7] sched: [1:1.00]
+; HASWELL-NEXT: punpckhbw (%rdi), %mm0 # mm0 = mm0[4],mem[4],mm0[5],mem[5],mm0[6],mem[6],mm0[7],mem[7] sched: [6:1.00]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_punpckhbw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_punpckhdq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: punpckhdq %mm1, %mm0 # mm0 = mm0[1],mm1[1] sched: [1:1.00]
-; HASWELL-NEXT: punpckhdq (%rdi), %mm0 # mm0 = mm0[1],mem[1] sched: [1:1.00]
+; HASWELL-NEXT: punpckhdq (%rdi), %mm0 # mm0 = mm0[1],mem[1] sched: [6:1.00]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_punpckhdq:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_punpckhwd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: punpckhwd %mm1, %mm0 # mm0 = mm0[2],mm1[2],mm0[3],mm1[3] sched: [1:1.00]
-; HASWELL-NEXT: punpckhwd (%rdi), %mm0 # mm0 = mm0[2],mem[2],mm0[3],mem[3] sched: [1:1.00]
+; HASWELL-NEXT: punpckhwd (%rdi), %mm0 # mm0 = mm0[2],mem[2],mm0[3],mem[3] sched: [6:1.00]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_punpckhwd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_punpcklbw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: punpcklbw %mm1, %mm0 # mm0 = mm0[0],mm1[0],mm0[1],mm1[1],mm0[2],mm1[2],mm0[3],mm1[3] sched: [1:1.00]
-; HASWELL-NEXT: punpcklbw (%rdi), %mm0 # mm0 = mm0[0],mem[0],mm0[1],mem[1],mm0[2],mem[2],mm0[3],mem[3] sched: [1:1.00]
+; HASWELL-NEXT: punpcklbw (%rdi), %mm0 # mm0 = mm0[0],mem[0],mm0[1],mem[1],mm0[2],mem[2],mm0[3],mem[3] sched: [6:1.00]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_punpcklbw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_punpckldq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: punpckldq %mm1, %mm0 # mm0 = mm0[0],mm1[0] sched: [1:1.00]
-; HASWELL-NEXT: punpckldq (%rdi), %mm0 # mm0 = mm0[0],mem[0] sched: [1:1.00]
+; HASWELL-NEXT: punpckldq (%rdi), %mm0 # mm0 = mm0[0],mem[0] sched: [6:1.00]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_punpckldq:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_punpcklwd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: punpcklwd %mm1, %mm0 # mm0 = mm0[0],mm1[0],mm0[1],mm1[1] sched: [1:1.00]
-; HASWELL-NEXT: punpcklwd (%rdi), %mm0 # mm0 = mm0[0],mem[0],mm0[1],mem[1] sched: [1:1.00]
+; HASWELL-NEXT: punpcklwd (%rdi), %mm0 # mm0 = mm0[0],mem[0],mm0[1],mem[1] sched: [6:1.00]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_punpcklwd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pxor:
; HASWELL: # %bb.0:
; HASWELL-NEXT: pxor %mm1, %mm0 # sched: [1:0.33]
-; HASWELL-NEXT: pxor (%rdi), %mm0 # sched: [1:0.50]
+; HASWELL-NEXT: pxor (%rdi), %mm0 # sched: [6:0.50]
; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pxor:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_movbe_i16:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: movbew (%rdi), %ax # sched: [1:0.50]
-; HASWELL-NEXT: movbew %si, (%rdx) # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: movbew (%rdi), %ax # sched: [6:0.50]
+; HASWELL-NEXT: movbew %si, (%rdx) # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_movbe_i16:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_movbe_i32:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: movbel (%rdi), %eax # sched: [1:0.50]
-; HASWELL-NEXT: movbel %esi, (%rdx) # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: movbel (%rdi), %eax # sched: [6:0.50]
+; HASWELL-NEXT: movbel %esi, (%rdx) # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_movbe_i32:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_movbe_i64:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: movbeq (%rdi), %rax # sched: [1:0.50]
-; HASWELL-NEXT: movbeq %rsi, (%rdx) # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: movbeq (%rdi), %rax # sched: [6:0.50]
+; HASWELL-NEXT: movbeq %rsi, (%rdx) # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_movbe_i64:
; BROADWELL: # %bb.0:
; X64-HSW-LABEL: test_mul_by_1:
; X64-HSW: # %bb.0:
; X64-HSW-NEXT: movl %edi, %eax # sched: [1:0.25]
-; X64-HSW-NEXT: retq # sched: [2:1.00]
+; X64-HSW-NEXT: retq # sched: [7:1.00]
;
; X64-JAG-LABEL: test_mul_by_1:
; X64-JAG: # %bb.0:
; HSW-NOOPT-LABEL: test_mul_by_1:
; HSW-NOOPT: # %bb.0:
; HSW-NOOPT-NEXT: movl %edi, %eax # sched: [1:0.25]
-; HSW-NOOPT-NEXT: retq # sched: [2:1.00]
+; HSW-NOOPT-NEXT: retq # sched: [7:1.00]
;
; JAG-NOOPT-LABEL: test_mul_by_1:
; JAG-NOOPT: # %bb.0:
; X64-HSW: # %bb.0:
; X64-HSW-NEXT: # kill: def %edi killed %edi def %rdi
; X64-HSW-NEXT: leal (%rdi,%rdi), %eax # sched: [1:0.50]
-; X64-HSW-NEXT: retq # sched: [2:1.00]
+; X64-HSW-NEXT: retq # sched: [7:1.00]
;
; X64-JAG-LABEL: test_mul_by_2:
; X64-JAG: # %bb.0:
; HSW-NOOPT: # %bb.0:
; HSW-NOOPT-NEXT: # kill: def %edi killed %edi def %rdi
; HSW-NOOPT-NEXT: leal (%rdi,%rdi), %eax # sched: [1:0.50]
-; HSW-NOOPT-NEXT: retq # sched: [2:1.00]
+; HSW-NOOPT-NEXT: retq # sched: [7:1.00]
;
; JAG-NOOPT-LABEL: test_mul_by_2:
; JAG-NOOPT: # %bb.0:
; X64-HSW: # %bb.0:
; X64-HSW-NEXT: # kill: def %edi killed %edi def %rdi
; X64-HSW-NEXT: leal (%rdi,%rdi,2), %eax # sched: [1:0.50]
-; X64-HSW-NEXT: retq # sched: [2:1.00]
+; X64-HSW-NEXT: retq # sched: [7:1.00]
;
; X64-JAG-LABEL: test_mul_by_3:
; X64-JAG: # %bb.0:
; HSW-NOOPT: # %bb.0:
; HSW-NOOPT-NEXT: # kill: def %edi killed %edi def %rdi
; HSW-NOOPT-NEXT: leal (%rdi,%rdi,2), %eax # sched: [1:0.50]
-; HSW-NOOPT-NEXT: retq # sched: [2:1.00]
+; HSW-NOOPT-NEXT: retq # sched: [7:1.00]
;
; JAG-NOOPT-LABEL: test_mul_by_3:
; JAG-NOOPT: # %bb.0:
; X64-HSW: # %bb.0:
; X64-HSW-NEXT: # kill: def %edi killed %edi def %rdi
; X64-HSW-NEXT: leal (,%rdi,4), %eax # sched: [1:0.50]
-; X64-HSW-NEXT: retq # sched: [2:1.00]
+; X64-HSW-NEXT: retq # sched: [7:1.00]
;
; X64-JAG-LABEL: test_mul_by_4:
; X64-JAG: # %bb.0:
; HSW-NOOPT: # %bb.0:
; HSW-NOOPT-NEXT: # kill: def %edi killed %edi def %rdi
; HSW-NOOPT-NEXT: leal (,%rdi,4), %eax # sched: [1:0.50]
-; HSW-NOOPT-NEXT: retq # sched: [2:1.00]
+; HSW-NOOPT-NEXT: retq # sched: [7:1.00]
;
; JAG-NOOPT-LABEL: test_mul_by_4:
; JAG-NOOPT: # %bb.0:
; X64-HSW: # %bb.0:
; X64-HSW-NEXT: # kill: def %edi killed %edi def %rdi
; X64-HSW-NEXT: leal (%rdi,%rdi,4), %eax # sched: [1:0.50]
-; X64-HSW-NEXT: retq # sched: [2:1.00]
+; X64-HSW-NEXT: retq # sched: [7:1.00]
;
; X64-JAG-LABEL: test_mul_by_5:
; X64-JAG: # %bb.0:
; HSW-NOOPT: # %bb.0:
; HSW-NOOPT-NEXT: # kill: def %edi killed %edi def %rdi
; HSW-NOOPT-NEXT: leal (%rdi,%rdi,4), %eax # sched: [1:0.50]
-; HSW-NOOPT-NEXT: retq # sched: [2:1.00]
+; HSW-NOOPT-NEXT: retq # sched: [7:1.00]
;
; JAG-NOOPT-LABEL: test_mul_by_5:
; JAG-NOOPT: # %bb.0:
; X64-HSW-NEXT: # kill: def %edi killed %edi def %rdi
; X64-HSW-NEXT: addl %edi, %edi # sched: [1:0.25]
; X64-HSW-NEXT: leal (%rdi,%rdi,2), %eax # sched: [1:0.50]
-; X64-HSW-NEXT: retq # sched: [2:1.00]
+; X64-HSW-NEXT: retq # sched: [7:1.00]
;
; X64-JAG-LABEL: test_mul_by_6:
; X64-JAG: # %bb.0:
; HSW-NOOPT-LABEL: test_mul_by_6:
; HSW-NOOPT: # %bb.0:
; HSW-NOOPT-NEXT: imull $6, %edi, %eax # sched: [3:1.00]
-; HSW-NOOPT-NEXT: retq # sched: [2:1.00]
+; HSW-NOOPT-NEXT: retq # sched: [7:1.00]
;
; JAG-NOOPT-LABEL: test_mul_by_6:
; JAG-NOOPT: # %bb.0:
; X64-HSW-NEXT: # kill: def %edi killed %edi def %rdi
; X64-HSW-NEXT: leal (,%rdi,8), %eax # sched: [1:0.50]
; X64-HSW-NEXT: subl %edi, %eax # sched: [1:0.25]
-; X64-HSW-NEXT: retq # sched: [2:1.00]
+; X64-HSW-NEXT: retq # sched: [7:1.00]
;
; X64-JAG-LABEL: test_mul_by_7:
; X64-JAG: # %bb.0:
; HSW-NOOPT-LABEL: test_mul_by_7:
; HSW-NOOPT: # %bb.0:
; HSW-NOOPT-NEXT: imull $7, %edi, %eax # sched: [3:1.00]
-; HSW-NOOPT-NEXT: retq # sched: [2:1.00]
+; HSW-NOOPT-NEXT: retq # sched: [7:1.00]
;
; JAG-NOOPT-LABEL: test_mul_by_7:
; JAG-NOOPT: # %bb.0:
; X64-HSW: # %bb.0:
; X64-HSW-NEXT: # kill: def %edi killed %edi def %rdi
; X64-HSW-NEXT: leal (,%rdi,8), %eax # sched: [1:0.50]
-; X64-HSW-NEXT: retq # sched: [2:1.00]
+; X64-HSW-NEXT: retq # sched: [7:1.00]
;
; X64-JAG-LABEL: test_mul_by_8:
; X64-JAG: # %bb.0:
; HSW-NOOPT: # %bb.0:
; HSW-NOOPT-NEXT: # kill: def %edi killed %edi def %rdi
; HSW-NOOPT-NEXT: leal (,%rdi,8), %eax # sched: [1:0.50]
-; HSW-NOOPT-NEXT: retq # sched: [2:1.00]
+; HSW-NOOPT-NEXT: retq # sched: [7:1.00]
;
; JAG-NOOPT-LABEL: test_mul_by_8:
; JAG-NOOPT: # %bb.0:
; X64-HSW: # %bb.0:
; X64-HSW-NEXT: # kill: def %edi killed %edi def %rdi
; X64-HSW-NEXT: leal (%rdi,%rdi,8), %eax # sched: [1:0.50]
-; X64-HSW-NEXT: retq # sched: [2:1.00]
+; X64-HSW-NEXT: retq # sched: [7:1.00]
;
; X64-JAG-LABEL: test_mul_by_9:
; X64-JAG: # %bb.0:
; HSW-NOOPT: # %bb.0:
; HSW-NOOPT-NEXT: # kill: def %edi killed %edi def %rdi
; HSW-NOOPT-NEXT: leal (%rdi,%rdi,8), %eax # sched: [1:0.50]
-; HSW-NOOPT-NEXT: retq # sched: [2:1.00]
+; HSW-NOOPT-NEXT: retq # sched: [7:1.00]
;
; JAG-NOOPT-LABEL: test_mul_by_9:
; JAG-NOOPT: # %bb.0:
; X64-HSW-NEXT: # kill: def %edi killed %edi def %rdi
; X64-HSW-NEXT: addl %edi, %edi # sched: [1:0.25]
; X64-HSW-NEXT: leal (%rdi,%rdi,4), %eax # sched: [1:0.50]
-; X64-HSW-NEXT: retq # sched: [2:1.00]
+; X64-HSW-NEXT: retq # sched: [7:1.00]
;
; X64-JAG-LABEL: test_mul_by_10:
; X64-JAG: # %bb.0:
; HSW-NOOPT-LABEL: test_mul_by_10:
; HSW-NOOPT: # %bb.0:
; HSW-NOOPT-NEXT: imull $10, %edi, %eax # sched: [3:1.00]
-; HSW-NOOPT-NEXT: retq # sched: [2:1.00]
+; HSW-NOOPT-NEXT: retq # sched: [7:1.00]
;
; JAG-NOOPT-LABEL: test_mul_by_10:
; JAG-NOOPT: # %bb.0:
; X64-HSW-NEXT: # kill: def %edi killed %edi def %rdi
; X64-HSW-NEXT: leal (%rdi,%rdi,4), %eax # sched: [1:0.50]
; X64-HSW-NEXT: leal (%rdi,%rax,2), %eax # sched: [1:0.50]
-; X64-HSW-NEXT: retq # sched: [2:1.00]
+; X64-HSW-NEXT: retq # sched: [7:1.00]
;
; X64-JAG-LABEL: test_mul_by_11:
; X64-JAG: # %bb.0:
; HSW-NOOPT-LABEL: test_mul_by_11:
; HSW-NOOPT: # %bb.0:
; HSW-NOOPT-NEXT: imull $11, %edi, %eax # sched: [3:1.00]
-; HSW-NOOPT-NEXT: retq # sched: [2:1.00]
+; HSW-NOOPT-NEXT: retq # sched: [7:1.00]
;
; JAG-NOOPT-LABEL: test_mul_by_11:
; JAG-NOOPT: # %bb.0:
; X64-HSW-NEXT: # kill: def %edi killed %edi def %rdi
; X64-HSW-NEXT: shll $2, %edi # sched: [1:0.50]
; X64-HSW-NEXT: leal (%rdi,%rdi,2), %eax # sched: [1:0.50]
-; X64-HSW-NEXT: retq # sched: [2:1.00]
+; X64-HSW-NEXT: retq # sched: [7:1.00]
;
; X64-JAG-LABEL: test_mul_by_12:
; X64-JAG: # %bb.0:
; HSW-NOOPT-LABEL: test_mul_by_12:
; HSW-NOOPT: # %bb.0:
; HSW-NOOPT-NEXT: imull $12, %edi, %eax # sched: [3:1.00]
-; HSW-NOOPT-NEXT: retq # sched: [2:1.00]
+; HSW-NOOPT-NEXT: retq # sched: [7:1.00]
;
; JAG-NOOPT-LABEL: test_mul_by_12:
; JAG-NOOPT: # %bb.0:
; X64-HSW-NEXT: # kill: def %edi killed %edi def %rdi
; X64-HSW-NEXT: leal (%rdi,%rdi,2), %eax # sched: [1:0.50]
; X64-HSW-NEXT: leal (%rdi,%rax,4), %eax # sched: [1:0.50]
-; X64-HSW-NEXT: retq # sched: [2:1.00]
+; X64-HSW-NEXT: retq # sched: [7:1.00]
;
; X64-JAG-LABEL: test_mul_by_13:
; X64-JAG: # %bb.0:
; HSW-NOOPT-LABEL: test_mul_by_13:
; HSW-NOOPT: # %bb.0:
; HSW-NOOPT-NEXT: imull $13, %edi, %eax # sched: [3:1.00]
-; HSW-NOOPT-NEXT: retq # sched: [2:1.00]
+; HSW-NOOPT-NEXT: retq # sched: [7:1.00]
;
; JAG-NOOPT-LABEL: test_mul_by_13:
; JAG-NOOPT: # %bb.0:
; X64-HSW-NEXT: leal (%rdi,%rdi,2), %eax # sched: [1:0.50]
; X64-HSW-NEXT: leal (%rdi,%rax,4), %eax # sched: [1:0.50]
; X64-HSW-NEXT: addl %edi, %eax # sched: [1:0.25]
-; X64-HSW-NEXT: retq # sched: [2:1.00]
+; X64-HSW-NEXT: retq # sched: [7:1.00]
;
; X64-JAG-LABEL: test_mul_by_14:
; X64-JAG: # %bb.0:
; HSW-NOOPT-LABEL: test_mul_by_14:
; HSW-NOOPT: # %bb.0:
; HSW-NOOPT-NEXT: imull $14, %edi, %eax # sched: [3:1.00]
-; HSW-NOOPT-NEXT: retq # sched: [2:1.00]
+; HSW-NOOPT-NEXT: retq # sched: [7:1.00]
;
; JAG-NOOPT-LABEL: test_mul_by_14:
; JAG-NOOPT: # %bb.0:
; X64-HSW-NEXT: # kill: def %edi killed %edi def %rdi
; X64-HSW-NEXT: leal (%rdi,%rdi,4), %eax # sched: [1:0.50]
; X64-HSW-NEXT: leal (%rax,%rax,2), %eax # sched: [1:0.50]
-; X64-HSW-NEXT: retq # sched: [2:1.00]
+; X64-HSW-NEXT: retq # sched: [7:1.00]
;
; X64-JAG-LABEL: test_mul_by_15:
; X64-JAG: # %bb.0:
; HSW-NOOPT-LABEL: test_mul_by_15:
; HSW-NOOPT: # %bb.0:
; HSW-NOOPT-NEXT: imull $15, %edi, %eax # sched: [3:1.00]
-; HSW-NOOPT-NEXT: retq # sched: [2:1.00]
+; HSW-NOOPT-NEXT: retq # sched: [7:1.00]
;
; JAG-NOOPT-LABEL: test_mul_by_15:
; JAG-NOOPT: # %bb.0:
; X64-HSW: # %bb.0:
; X64-HSW-NEXT: shll $4, %edi # sched: [1:0.50]
; X64-HSW-NEXT: movl %edi, %eax # sched: [1:0.25]
-; X64-HSW-NEXT: retq # sched: [2:1.00]
+; X64-HSW-NEXT: retq # sched: [7:1.00]
;
; X64-JAG-LABEL: test_mul_by_16:
; X64-JAG: # %bb.0:
; HSW-NOOPT: # %bb.0:
; HSW-NOOPT-NEXT: shll $4, %edi # sched: [1:0.50]
; HSW-NOOPT-NEXT: movl %edi, %eax # sched: [1:0.25]
-; HSW-NOOPT-NEXT: retq # sched: [2:1.00]
+; HSW-NOOPT-NEXT: retq # sched: [7:1.00]
;
; JAG-NOOPT-LABEL: test_mul_by_16:
; JAG-NOOPT: # %bb.0:
; X64-HSW-NEXT: movl %edi, %eax # sched: [1:0.25]
; X64-HSW-NEXT: shll $4, %eax # sched: [1:0.50]
; X64-HSW-NEXT: leal (%rax,%rdi), %eax # sched: [1:0.50]
-; X64-HSW-NEXT: retq # sched: [2:1.00]
+; X64-HSW-NEXT: retq # sched: [7:1.00]
;
; X64-JAG-LABEL: test_mul_by_17:
; X64-JAG: # %bb.0:
; HSW-NOOPT-LABEL: test_mul_by_17:
; HSW-NOOPT: # %bb.0:
; HSW-NOOPT-NEXT: imull $17, %edi, %eax # sched: [3:1.00]
-; HSW-NOOPT-NEXT: retq # sched: [2:1.00]
+; HSW-NOOPT-NEXT: retq # sched: [7:1.00]
;
; JAG-NOOPT-LABEL: test_mul_by_17:
; JAG-NOOPT: # %bb.0:
; X64-HSW-NEXT: # kill: def %edi killed %edi def %rdi
; X64-HSW-NEXT: addl %edi, %edi # sched: [1:0.25]
; X64-HSW-NEXT: leal (%rdi,%rdi,8), %eax # sched: [1:0.50]
-; X64-HSW-NEXT: retq # sched: [2:1.00]
+; X64-HSW-NEXT: retq # sched: [7:1.00]
;
; X64-JAG-LABEL: test_mul_by_18:
; X64-JAG: # %bb.0:
; HSW-NOOPT-LABEL: test_mul_by_18:
; HSW-NOOPT: # %bb.0:
; HSW-NOOPT-NEXT: imull $18, %edi, %eax # sched: [3:1.00]
-; HSW-NOOPT-NEXT: retq # sched: [2:1.00]
+; HSW-NOOPT-NEXT: retq # sched: [7:1.00]
;
; JAG-NOOPT-LABEL: test_mul_by_18:
; JAG-NOOPT: # %bb.0:
; X64-HSW-NEXT: leal (%rdi,%rdi,4), %eax # sched: [1:0.50]
; X64-HSW-NEXT: shll $2, %eax # sched: [1:0.50]
; X64-HSW-NEXT: subl %edi, %eax # sched: [1:0.25]
-; X64-HSW-NEXT: retq # sched: [2:1.00]
+; X64-HSW-NEXT: retq # sched: [7:1.00]
;
; X64-JAG-LABEL: test_mul_by_19:
; X64-JAG: # %bb.0:
; HSW-NOOPT-LABEL: test_mul_by_19:
; HSW-NOOPT: # %bb.0:
; HSW-NOOPT-NEXT: imull $19, %edi, %eax # sched: [3:1.00]
-; HSW-NOOPT-NEXT: retq # sched: [2:1.00]
+; HSW-NOOPT-NEXT: retq # sched: [7:1.00]
;
; JAG-NOOPT-LABEL: test_mul_by_19:
; JAG-NOOPT: # %bb.0:
; X64-HSW-NEXT: # kill: def %edi killed %edi def %rdi
; X64-HSW-NEXT: shll $2, %edi # sched: [1:0.50]
; X64-HSW-NEXT: leal (%rdi,%rdi,4), %eax # sched: [1:0.50]
-; X64-HSW-NEXT: retq # sched: [2:1.00]
+; X64-HSW-NEXT: retq # sched: [7:1.00]
;
; X64-JAG-LABEL: test_mul_by_20:
; X64-JAG: # %bb.0:
; HSW-NOOPT-LABEL: test_mul_by_20:
; HSW-NOOPT: # %bb.0:
; HSW-NOOPT-NEXT: imull $20, %edi, %eax # sched: [3:1.00]
-; HSW-NOOPT-NEXT: retq # sched: [2:1.00]
+; HSW-NOOPT-NEXT: retq # sched: [7:1.00]
;
; JAG-NOOPT-LABEL: test_mul_by_20:
; JAG-NOOPT: # %bb.0:
; X64-HSW-NEXT: # kill: def %edi killed %edi def %rdi
; X64-HSW-NEXT: leal (%rdi,%rdi,4), %eax # sched: [1:0.50]
; X64-HSW-NEXT: leal (%rdi,%rax,4), %eax # sched: [1:0.50]
-; X64-HSW-NEXT: retq # sched: [2:1.00]
+; X64-HSW-NEXT: retq # sched: [7:1.00]
;
; X64-JAG-LABEL: test_mul_by_21:
; X64-JAG: # %bb.0:
; HSW-NOOPT-LABEL: test_mul_by_21:
; HSW-NOOPT: # %bb.0:
; HSW-NOOPT-NEXT: imull $21, %edi, %eax # sched: [3:1.00]
-; HSW-NOOPT-NEXT: retq # sched: [2:1.00]
+; HSW-NOOPT-NEXT: retq # sched: [7:1.00]
;
; JAG-NOOPT-LABEL: test_mul_by_21:
; JAG-NOOPT: # %bb.0:
; X64-HSW-NEXT: leal (%rdi,%rdi,4), %eax # sched: [1:0.50]
; X64-HSW-NEXT: leal (%rdi,%rax,4), %eax # sched: [1:0.50]
; X64-HSW-NEXT: addl %edi, %eax # sched: [1:0.25]
-; X64-HSW-NEXT: retq # sched: [2:1.00]
+; X64-HSW-NEXT: retq # sched: [7:1.00]
;
; X64-JAG-LABEL: test_mul_by_22:
; X64-JAG: # %bb.0:
; HSW-NOOPT-LABEL: test_mul_by_22:
; HSW-NOOPT: # %bb.0:
; HSW-NOOPT-NEXT: imull $22, %edi, %eax # sched: [3:1.00]
-; HSW-NOOPT-NEXT: retq # sched: [2:1.00]
+; HSW-NOOPT-NEXT: retq # sched: [7:1.00]
;
; JAG-NOOPT-LABEL: test_mul_by_22:
; JAG-NOOPT: # %bb.0:
; X64-HSW-NEXT: leal (%rdi,%rdi,2), %eax # sched: [1:0.50]
; X64-HSW-NEXT: shll $3, %eax # sched: [1:0.50]
; X64-HSW-NEXT: subl %edi, %eax # sched: [1:0.25]
-; X64-HSW-NEXT: retq # sched: [2:1.00]
+; X64-HSW-NEXT: retq # sched: [7:1.00]
;
; X64-JAG-LABEL: test_mul_by_23:
; X64-JAG: # %bb.0:
; HSW-NOOPT-LABEL: test_mul_by_23:
; HSW-NOOPT: # %bb.0:
; HSW-NOOPT-NEXT: imull $23, %edi, %eax # sched: [3:1.00]
-; HSW-NOOPT-NEXT: retq # sched: [2:1.00]
+; HSW-NOOPT-NEXT: retq # sched: [7:1.00]
;
; JAG-NOOPT-LABEL: test_mul_by_23:
; JAG-NOOPT: # %bb.0:
; X64-HSW-NEXT: # kill: def %edi killed %edi def %rdi
; X64-HSW-NEXT: shll $3, %edi # sched: [1:0.50]
; X64-HSW-NEXT: leal (%rdi,%rdi,2), %eax # sched: [1:0.50]
-; X64-HSW-NEXT: retq # sched: [2:1.00]
+; X64-HSW-NEXT: retq # sched: [7:1.00]
;
; X64-JAG-LABEL: test_mul_by_24:
; X64-JAG: # %bb.0:
; HSW-NOOPT-LABEL: test_mul_by_24:
; HSW-NOOPT: # %bb.0:
; HSW-NOOPT-NEXT: imull $24, %edi, %eax # sched: [3:1.00]
-; HSW-NOOPT-NEXT: retq # sched: [2:1.00]
+; HSW-NOOPT-NEXT: retq # sched: [7:1.00]
;
; JAG-NOOPT-LABEL: test_mul_by_24:
; JAG-NOOPT: # %bb.0:
; X64-HSW-NEXT: # kill: def %edi killed %edi def %rdi
; X64-HSW-NEXT: leal (%rdi,%rdi,4), %eax # sched: [1:0.50]
; X64-HSW-NEXT: leal (%rax,%rax,4), %eax # sched: [1:0.50]
-; X64-HSW-NEXT: retq # sched: [2:1.00]
+; X64-HSW-NEXT: retq # sched: [7:1.00]
;
; X64-JAG-LABEL: test_mul_by_25:
; X64-JAG: # %bb.0:
; HSW-NOOPT-LABEL: test_mul_by_25:
; HSW-NOOPT: # %bb.0:
; HSW-NOOPT-NEXT: imull $25, %edi, %eax # sched: [3:1.00]
-; HSW-NOOPT-NEXT: retq # sched: [2:1.00]
+; HSW-NOOPT-NEXT: retq # sched: [7:1.00]
;
; JAG-NOOPT-LABEL: test_mul_by_25:
; JAG-NOOPT: # %bb.0:
; X64-HSW-NEXT: leal (%rdi,%rdi,8), %eax # sched: [1:0.50]
; X64-HSW-NEXT: leal (%rax,%rax,2), %eax # sched: [1:0.50]
; X64-HSW-NEXT: subl %edi, %eax # sched: [1:0.25]
-; X64-HSW-NEXT: retq # sched: [2:1.00]
+; X64-HSW-NEXT: retq # sched: [7:1.00]
;
; X64-JAG-LABEL: test_mul_by_26:
; X64-JAG: # %bb.0:
; HSW-NOOPT-LABEL: test_mul_by_26:
; HSW-NOOPT: # %bb.0:
; HSW-NOOPT-NEXT: imull $26, %edi, %eax # sched: [3:1.00]
-; HSW-NOOPT-NEXT: retq # sched: [2:1.00]
+; HSW-NOOPT-NEXT: retq # sched: [7:1.00]
;
; JAG-NOOPT-LABEL: test_mul_by_26:
; JAG-NOOPT: # %bb.0:
; X64-HSW-NEXT: # kill: def %edi killed %edi def %rdi
; X64-HSW-NEXT: leal (%rdi,%rdi,8), %eax # sched: [1:0.50]
; X64-HSW-NEXT: leal (%rax,%rax,2), %eax # sched: [1:0.50]
-; X64-HSW-NEXT: retq # sched: [2:1.00]
+; X64-HSW-NEXT: retq # sched: [7:1.00]
;
; X64-JAG-LABEL: test_mul_by_27:
; X64-JAG: # %bb.0:
; HSW-NOOPT-LABEL: test_mul_by_27:
; HSW-NOOPT: # %bb.0:
; HSW-NOOPT-NEXT: imull $27, %edi, %eax # sched: [3:1.00]
-; HSW-NOOPT-NEXT: retq # sched: [2:1.00]
+; HSW-NOOPT-NEXT: retq # sched: [7:1.00]
;
; JAG-NOOPT-LABEL: test_mul_by_27:
; JAG-NOOPT: # %bb.0:
; X64-HSW-NEXT: leal (%rdi,%rdi,8), %eax # sched: [1:0.50]
; X64-HSW-NEXT: leal (%rax,%rax,2), %eax # sched: [1:0.50]
; X64-HSW-NEXT: addl %edi, %eax # sched: [1:0.25]
-; X64-HSW-NEXT: retq # sched: [2:1.00]
+; X64-HSW-NEXT: retq # sched: [7:1.00]
;
; X64-JAG-LABEL: test_mul_by_28:
; X64-JAG: # %bb.0:
; HSW-NOOPT-LABEL: test_mul_by_28:
; HSW-NOOPT: # %bb.0:
; HSW-NOOPT-NEXT: imull $28, %edi, %eax # sched: [3:1.00]
-; HSW-NOOPT-NEXT: retq # sched: [2:1.00]
+; HSW-NOOPT-NEXT: retq # sched: [7:1.00]
;
; JAG-NOOPT-LABEL: test_mul_by_28:
; JAG-NOOPT: # %bb.0:
; X64-HSW-NEXT: leal (%rax,%rax,2), %eax # sched: [1:0.50]
; X64-HSW-NEXT: addl %edi, %eax # sched: [1:0.25]
; X64-HSW-NEXT: addl %edi, %eax # sched: [1:0.25]
-; X64-HSW-NEXT: retq # sched: [2:1.00]
+; X64-HSW-NEXT: retq # sched: [7:1.00]
;
; X64-JAG-LABEL: test_mul_by_29:
; X64-JAG: # %bb.0:
; HSW-NOOPT-LABEL: test_mul_by_29:
; HSW-NOOPT: # %bb.0:
; HSW-NOOPT-NEXT: imull $29, %edi, %eax # sched: [3:1.00]
-; HSW-NOOPT-NEXT: retq # sched: [2:1.00]
+; HSW-NOOPT-NEXT: retq # sched: [7:1.00]
;
; JAG-NOOPT-LABEL: test_mul_by_29:
; JAG-NOOPT: # %bb.0:
; X64-HSW-NEXT: shll $5, %eax # sched: [1:0.50]
; X64-HSW-NEXT: subl %edi, %eax # sched: [1:0.25]
; X64-HSW-NEXT: subl %edi, %eax # sched: [1:0.25]
-; X64-HSW-NEXT: retq # sched: [2:1.00]
+; X64-HSW-NEXT: retq # sched: [7:1.00]
;
; X64-JAG-LABEL: test_mul_by_30:
; X64-JAG: # %bb.0:
; HSW-NOOPT-LABEL: test_mul_by_30:
; HSW-NOOPT: # %bb.0:
; HSW-NOOPT-NEXT: imull $30, %edi, %eax # sched: [3:1.00]
-; HSW-NOOPT-NEXT: retq # sched: [2:1.00]
+; HSW-NOOPT-NEXT: retq # sched: [7:1.00]
;
; JAG-NOOPT-LABEL: test_mul_by_30:
; JAG-NOOPT: # %bb.0:
; X64-HSW-NEXT: movl %edi, %eax # sched: [1:0.25]
; X64-HSW-NEXT: shll $5, %eax # sched: [1:0.50]
; X64-HSW-NEXT: subl %edi, %eax # sched: [1:0.25]
-; X64-HSW-NEXT: retq # sched: [2:1.00]
+; X64-HSW-NEXT: retq # sched: [7:1.00]
;
; X64-JAG-LABEL: test_mul_by_31:
; X64-JAG: # %bb.0:
; HSW-NOOPT-LABEL: test_mul_by_31:
; HSW-NOOPT: # %bb.0:
; HSW-NOOPT-NEXT: imull $31, %edi, %eax # sched: [3:1.00]
-; HSW-NOOPT-NEXT: retq # sched: [2:1.00]
+; HSW-NOOPT-NEXT: retq # sched: [7:1.00]
;
; JAG-NOOPT-LABEL: test_mul_by_31:
; JAG-NOOPT: # %bb.0:
; X64-HSW: # %bb.0:
; X64-HSW-NEXT: shll $5, %edi # sched: [1:0.50]
; X64-HSW-NEXT: movl %edi, %eax # sched: [1:0.25]
-; X64-HSW-NEXT: retq # sched: [2:1.00]
+; X64-HSW-NEXT: retq # sched: [7:1.00]
;
; X64-JAG-LABEL: test_mul_by_32:
; X64-JAG: # %bb.0:
; HSW-NOOPT: # %bb.0:
; HSW-NOOPT-NEXT: shll $5, %edi # sched: [1:0.50]
; HSW-NOOPT-NEXT: movl %edi, %eax # sched: [1:0.25]
-; HSW-NOOPT-NEXT: retq # sched: [2:1.00]
+; HSW-NOOPT-NEXT: retq # sched: [7:1.00]
;
; JAG-NOOPT-LABEL: test_mul_by_32:
; JAG-NOOPT: # %bb.0:
; X64-HSW-NEXT: leal (%rdi,%rdi,4), %eax # sched: [1:0.50]
; X64-HSW-NEXT: addl $2, %eax # sched: [1:0.25]
; X64-HSW-NEXT: imull %ecx, %eax # sched: [4:1.00]
-; X64-HSW-NEXT: retq # sched: [2:1.00]
+; X64-HSW-NEXT: retq # sched: [7:1.00]
;
; X64-JAG-LABEL: test_mul_spec:
; X64-JAG: # %bb.0:
; HSW-NOOPT-NEXT: leal (%rdi,%rdi,4), %eax # sched: [1:0.50]
; HSW-NOOPT-NEXT: addl $2, %eax # sched: [1:0.25]
; HSW-NOOPT-NEXT: imull %ecx, %eax # sched: [4:1.00]
-; HSW-NOOPT-NEXT: retq # sched: [2:1.00]
+; HSW-NOOPT-NEXT: retq # sched: [7:1.00]
;
; JAG-NOOPT-LABEL: test_mul_spec:
; JAG-NOOPT: # %bb.0:
; X64-HSW-LABEL: test_mul_by_1:
; X64-HSW: # %bb.0:
; X64-HSW-NEXT: movq %rdi, %rax # sched: [1:0.25]
-; X64-HSW-NEXT: retq # sched: [2:1.00]
+; X64-HSW-NEXT: retq # sched: [7:1.00]
;
; X64-JAG-LABEL: test_mul_by_1:
; X64-JAG: # %bb.0:
; HSW-NOOPT-LABEL: test_mul_by_1:
; HSW-NOOPT: # %bb.0:
; HSW-NOOPT-NEXT: movq %rdi, %rax # sched: [1:0.25]
-; HSW-NOOPT-NEXT: retq # sched: [2:1.00]
+; HSW-NOOPT-NEXT: retq # sched: [7:1.00]
;
; JAG-NOOPT-LABEL: test_mul_by_1:
; JAG-NOOPT: # %bb.0:
; X64-HSW-LABEL: test_mul_by_2:
; X64-HSW: # %bb.0:
; X64-HSW-NEXT: leaq (%rdi,%rdi), %rax # sched: [1:0.50]
-; X64-HSW-NEXT: retq # sched: [2:1.00]
+; X64-HSW-NEXT: retq # sched: [7:1.00]
;
; X64-JAG-LABEL: test_mul_by_2:
; X64-JAG: # %bb.0:
; HSW-NOOPT-LABEL: test_mul_by_2:
; HSW-NOOPT: # %bb.0:
; HSW-NOOPT-NEXT: leaq (%rdi,%rdi), %rax # sched: [1:0.50]
-; HSW-NOOPT-NEXT: retq # sched: [2:1.00]
+; HSW-NOOPT-NEXT: retq # sched: [7:1.00]
;
; JAG-NOOPT-LABEL: test_mul_by_2:
; JAG-NOOPT: # %bb.0:
; X64-HSW-LABEL: test_mul_by_3:
; X64-HSW: # %bb.0:
; X64-HSW-NEXT: leaq (%rdi,%rdi,2), %rax # sched: [1:0.50]
-; X64-HSW-NEXT: retq # sched: [2:1.00]
+; X64-HSW-NEXT: retq # sched: [7:1.00]
;
; X64-JAG-LABEL: test_mul_by_3:
; X64-JAG: # %bb.0:
; HSW-NOOPT-LABEL: test_mul_by_3:
; HSW-NOOPT: # %bb.0:
; HSW-NOOPT-NEXT: leaq (%rdi,%rdi,2), %rax # sched: [1:0.50]
-; HSW-NOOPT-NEXT: retq # sched: [2:1.00]
+; HSW-NOOPT-NEXT: retq # sched: [7:1.00]
;
; JAG-NOOPT-LABEL: test_mul_by_3:
; JAG-NOOPT: # %bb.0:
; X64-HSW-LABEL: test_mul_by_4:
; X64-HSW: # %bb.0:
; X64-HSW-NEXT: leaq (,%rdi,4), %rax # sched: [1:0.50]
-; X64-HSW-NEXT: retq # sched: [2:1.00]
+; X64-HSW-NEXT: retq # sched: [7:1.00]
;
; X64-JAG-LABEL: test_mul_by_4:
; X64-JAG: # %bb.0:
; HSW-NOOPT-LABEL: test_mul_by_4:
; HSW-NOOPT: # %bb.0:
; HSW-NOOPT-NEXT: leaq (,%rdi,4), %rax # sched: [1:0.50]
-; HSW-NOOPT-NEXT: retq # sched: [2:1.00]
+; HSW-NOOPT-NEXT: retq # sched: [7:1.00]
;
; JAG-NOOPT-LABEL: test_mul_by_4:
; JAG-NOOPT: # %bb.0:
; X64-HSW-LABEL: test_mul_by_5:
; X64-HSW: # %bb.0:
; X64-HSW-NEXT: leaq (%rdi,%rdi,4), %rax # sched: [1:0.50]
-; X64-HSW-NEXT: retq # sched: [2:1.00]
+; X64-HSW-NEXT: retq # sched: [7:1.00]
;
; X64-JAG-LABEL: test_mul_by_5:
; X64-JAG: # %bb.0:
; HSW-NOOPT-LABEL: test_mul_by_5:
; HSW-NOOPT: # %bb.0:
; HSW-NOOPT-NEXT: leaq (%rdi,%rdi,4), %rax # sched: [1:0.50]
-; HSW-NOOPT-NEXT: retq # sched: [2:1.00]
+; HSW-NOOPT-NEXT: retq # sched: [7:1.00]
;
; JAG-NOOPT-LABEL: test_mul_by_5:
; JAG-NOOPT: # %bb.0:
; X64-HSW: # %bb.0:
; X64-HSW-NEXT: addq %rdi, %rdi # sched: [1:0.25]
; X64-HSW-NEXT: leaq (%rdi,%rdi,2), %rax # sched: [1:0.50]
-; X64-HSW-NEXT: retq # sched: [2:1.00]
+; X64-HSW-NEXT: retq # sched: [7:1.00]
;
; X64-JAG-LABEL: test_mul_by_6:
; X64-JAG: # %bb.0:
; HSW-NOOPT-LABEL: test_mul_by_6:
; HSW-NOOPT: # %bb.0:
; HSW-NOOPT-NEXT: imulq $6, %rdi, %rax # sched: [3:1.00]
-; HSW-NOOPT-NEXT: retq # sched: [2:1.00]
+; HSW-NOOPT-NEXT: retq # sched: [7:1.00]
;
; JAG-NOOPT-LABEL: test_mul_by_6:
; JAG-NOOPT: # %bb.0:
; X64-HSW: # %bb.0:
; X64-HSW-NEXT: leaq (,%rdi,8), %rax # sched: [1:0.50]
; X64-HSW-NEXT: subq %rdi, %rax # sched: [1:0.25]
-; X64-HSW-NEXT: retq # sched: [2:1.00]
+; X64-HSW-NEXT: retq # sched: [7:1.00]
;
; X64-JAG-LABEL: test_mul_by_7:
; X64-JAG: # %bb.0:
; HSW-NOOPT-LABEL: test_mul_by_7:
; HSW-NOOPT: # %bb.0:
; HSW-NOOPT-NEXT: imulq $7, %rdi, %rax # sched: [3:1.00]
-; HSW-NOOPT-NEXT: retq # sched: [2:1.00]
+; HSW-NOOPT-NEXT: retq # sched: [7:1.00]
;
; JAG-NOOPT-LABEL: test_mul_by_7:
; JAG-NOOPT: # %bb.0:
; X64-HSW-LABEL: test_mul_by_8:
; X64-HSW: # %bb.0:
; X64-HSW-NEXT: leaq (,%rdi,8), %rax # sched: [1:0.50]
-; X64-HSW-NEXT: retq # sched: [2:1.00]
+; X64-HSW-NEXT: retq # sched: [7:1.00]
;
; X64-JAG-LABEL: test_mul_by_8:
; X64-JAG: # %bb.0:
; HSW-NOOPT-LABEL: test_mul_by_8:
; HSW-NOOPT: # %bb.0:
; HSW-NOOPT-NEXT: leaq (,%rdi,8), %rax # sched: [1:0.50]
-; HSW-NOOPT-NEXT: retq # sched: [2:1.00]
+; HSW-NOOPT-NEXT: retq # sched: [7:1.00]
;
; JAG-NOOPT-LABEL: test_mul_by_8:
; JAG-NOOPT: # %bb.0:
; X64-HSW-LABEL: test_mul_by_9:
; X64-HSW: # %bb.0:
; X64-HSW-NEXT: leaq (%rdi,%rdi,8), %rax # sched: [1:0.50]
-; X64-HSW-NEXT: retq # sched: [2:1.00]
+; X64-HSW-NEXT: retq # sched: [7:1.00]
;
; X64-JAG-LABEL: test_mul_by_9:
; X64-JAG: # %bb.0:
; HSW-NOOPT-LABEL: test_mul_by_9:
; HSW-NOOPT: # %bb.0:
; HSW-NOOPT-NEXT: leaq (%rdi,%rdi,8), %rax # sched: [1:0.50]
-; HSW-NOOPT-NEXT: retq # sched: [2:1.00]
+; HSW-NOOPT-NEXT: retq # sched: [7:1.00]
;
; JAG-NOOPT-LABEL: test_mul_by_9:
; JAG-NOOPT: # %bb.0:
; X64-HSW: # %bb.0:
; X64-HSW-NEXT: addq %rdi, %rdi # sched: [1:0.25]
; X64-HSW-NEXT: leaq (%rdi,%rdi,4), %rax # sched: [1:0.50]
-; X64-HSW-NEXT: retq # sched: [2:1.00]
+; X64-HSW-NEXT: retq # sched: [7:1.00]
;
; X64-JAG-LABEL: test_mul_by_10:
; X64-JAG: # %bb.0:
; HSW-NOOPT-LABEL: test_mul_by_10:
; HSW-NOOPT: # %bb.0:
; HSW-NOOPT-NEXT: imulq $10, %rdi, %rax # sched: [3:1.00]
-; HSW-NOOPT-NEXT: retq # sched: [2:1.00]
+; HSW-NOOPT-NEXT: retq # sched: [7:1.00]
;
; JAG-NOOPT-LABEL: test_mul_by_10:
; JAG-NOOPT: # %bb.0:
; X64-HSW: # %bb.0:
; X64-HSW-NEXT: leaq (%rdi,%rdi,4), %rax # sched: [1:0.50]
; X64-HSW-NEXT: leaq (%rdi,%rax,2), %rax # sched: [1:0.50]
-; X64-HSW-NEXT: retq # sched: [2:1.00]
+; X64-HSW-NEXT: retq # sched: [7:1.00]
;
; X64-JAG-LABEL: test_mul_by_11:
; X64-JAG: # %bb.0:
; HSW-NOOPT-LABEL: test_mul_by_11:
; HSW-NOOPT: # %bb.0:
; HSW-NOOPT-NEXT: imulq $11, %rdi, %rax # sched: [3:1.00]
-; HSW-NOOPT-NEXT: retq # sched: [2:1.00]
+; HSW-NOOPT-NEXT: retq # sched: [7:1.00]
;
; JAG-NOOPT-LABEL: test_mul_by_11:
; JAG-NOOPT: # %bb.0:
; X64-HSW: # %bb.0:
; X64-HSW-NEXT: shlq $2, %rdi # sched: [1:0.50]
; X64-HSW-NEXT: leaq (%rdi,%rdi,2), %rax # sched: [1:0.50]
-; X64-HSW-NEXT: retq # sched: [2:1.00]
+; X64-HSW-NEXT: retq # sched: [7:1.00]
;
; X64-JAG-LABEL: test_mul_by_12:
; X64-JAG: # %bb.0:
; HSW-NOOPT-LABEL: test_mul_by_12:
; HSW-NOOPT: # %bb.0:
; HSW-NOOPT-NEXT: imulq $12, %rdi, %rax # sched: [3:1.00]
-; HSW-NOOPT-NEXT: retq # sched: [2:1.00]
+; HSW-NOOPT-NEXT: retq # sched: [7:1.00]
;
; JAG-NOOPT-LABEL: test_mul_by_12:
; JAG-NOOPT: # %bb.0:
; X64-HSW: # %bb.0:
; X64-HSW-NEXT: leaq (%rdi,%rdi,2), %rax # sched: [1:0.50]
; X64-HSW-NEXT: leaq (%rdi,%rax,4), %rax # sched: [1:0.50]
-; X64-HSW-NEXT: retq # sched: [2:1.00]
+; X64-HSW-NEXT: retq # sched: [7:1.00]
;
; X64-JAG-LABEL: test_mul_by_13:
; X64-JAG: # %bb.0:
; HSW-NOOPT-LABEL: test_mul_by_13:
; HSW-NOOPT: # %bb.0:
; HSW-NOOPT-NEXT: imulq $13, %rdi, %rax # sched: [3:1.00]
-; HSW-NOOPT-NEXT: retq # sched: [2:1.00]
+; HSW-NOOPT-NEXT: retq # sched: [7:1.00]
;
; JAG-NOOPT-LABEL: test_mul_by_13:
; JAG-NOOPT: # %bb.0:
; X64-HSW-NEXT: leaq (%rdi,%rdi,2), %rax # sched: [1:0.50]
; X64-HSW-NEXT: leaq (%rdi,%rax,4), %rax # sched: [1:0.50]
; X64-HSW-NEXT: addq %rdi, %rax # sched: [1:0.25]
-; X64-HSW-NEXT: retq # sched: [2:1.00]
+; X64-HSW-NEXT: retq # sched: [7:1.00]
;
; X64-JAG-LABEL: test_mul_by_14:
; X64-JAG: # %bb.0:
; HSW-NOOPT-LABEL: test_mul_by_14:
; HSW-NOOPT: # %bb.0:
; HSW-NOOPT-NEXT: imulq $14, %rdi, %rax # sched: [3:1.00]
-; HSW-NOOPT-NEXT: retq # sched: [2:1.00]
+; HSW-NOOPT-NEXT: retq # sched: [7:1.00]
;
; JAG-NOOPT-LABEL: test_mul_by_14:
; JAG-NOOPT: # %bb.0:
; X64-HSW: # %bb.0:
; X64-HSW-NEXT: leaq (%rdi,%rdi,4), %rax # sched: [1:0.50]
; X64-HSW-NEXT: leaq (%rax,%rax,2), %rax # sched: [1:0.50]
-; X64-HSW-NEXT: retq # sched: [2:1.00]
+; X64-HSW-NEXT: retq # sched: [7:1.00]
;
; X64-JAG-LABEL: test_mul_by_15:
; X64-JAG: # %bb.0:
; HSW-NOOPT-LABEL: test_mul_by_15:
; HSW-NOOPT: # %bb.0:
; HSW-NOOPT-NEXT: imulq $15, %rdi, %rax # sched: [3:1.00]
-; HSW-NOOPT-NEXT: retq # sched: [2:1.00]
+; HSW-NOOPT-NEXT: retq # sched: [7:1.00]
;
; JAG-NOOPT-LABEL: test_mul_by_15:
; JAG-NOOPT: # %bb.0:
; X64-HSW: # %bb.0:
; X64-HSW-NEXT: shlq $4, %rdi # sched: [1:0.50]
; X64-HSW-NEXT: movq %rdi, %rax # sched: [1:0.25]
-; X64-HSW-NEXT: retq # sched: [2:1.00]
+; X64-HSW-NEXT: retq # sched: [7:1.00]
;
; X64-JAG-LABEL: test_mul_by_16:
; X64-JAG: # %bb.0:
; HSW-NOOPT: # %bb.0:
; HSW-NOOPT-NEXT: shlq $4, %rdi # sched: [1:0.50]
; HSW-NOOPT-NEXT: movq %rdi, %rax # sched: [1:0.25]
-; HSW-NOOPT-NEXT: retq # sched: [2:1.00]
+; HSW-NOOPT-NEXT: retq # sched: [7:1.00]
;
; JAG-NOOPT-LABEL: test_mul_by_16:
; JAG-NOOPT: # %bb.0:
; X64-HSW-NEXT: movq %rdi, %rax # sched: [1:0.25]
; X64-HSW-NEXT: shlq $4, %rax # sched: [1:0.50]
; X64-HSW-NEXT: leaq (%rax,%rdi), %rax # sched: [1:0.50]
-; X64-HSW-NEXT: retq # sched: [2:1.00]
+; X64-HSW-NEXT: retq # sched: [7:1.00]
;
; X64-JAG-LABEL: test_mul_by_17:
; X64-JAG: # %bb.0:
; HSW-NOOPT-LABEL: test_mul_by_17:
; HSW-NOOPT: # %bb.0:
; HSW-NOOPT-NEXT: imulq $17, %rdi, %rax # sched: [3:1.00]
-; HSW-NOOPT-NEXT: retq # sched: [2:1.00]
+; HSW-NOOPT-NEXT: retq # sched: [7:1.00]
;
; JAG-NOOPT-LABEL: test_mul_by_17:
; JAG-NOOPT: # %bb.0:
; X64-HSW: # %bb.0:
; X64-HSW-NEXT: addq %rdi, %rdi # sched: [1:0.25]
; X64-HSW-NEXT: leaq (%rdi,%rdi,8), %rax # sched: [1:0.50]
-; X64-HSW-NEXT: retq # sched: [2:1.00]
+; X64-HSW-NEXT: retq # sched: [7:1.00]
;
; X64-JAG-LABEL: test_mul_by_18:
; X64-JAG: # %bb.0:
; HSW-NOOPT-LABEL: test_mul_by_18:
; HSW-NOOPT: # %bb.0:
; HSW-NOOPT-NEXT: imulq $18, %rdi, %rax # sched: [3:1.00]
-; HSW-NOOPT-NEXT: retq # sched: [2:1.00]
+; HSW-NOOPT-NEXT: retq # sched: [7:1.00]
;
; JAG-NOOPT-LABEL: test_mul_by_18:
; JAG-NOOPT: # %bb.0:
; X64-HSW-NEXT: leaq (%rdi,%rdi,4), %rax # sched: [1:0.50]
; X64-HSW-NEXT: shlq $2, %rax # sched: [1:0.50]
; X64-HSW-NEXT: subq %rdi, %rax # sched: [1:0.25]
-; X64-HSW-NEXT: retq # sched: [2:1.00]
+; X64-HSW-NEXT: retq # sched: [7:1.00]
;
; X64-JAG-LABEL: test_mul_by_19:
; X64-JAG: # %bb.0:
; HSW-NOOPT-LABEL: test_mul_by_19:
; HSW-NOOPT: # %bb.0:
; HSW-NOOPT-NEXT: imulq $19, %rdi, %rax # sched: [3:1.00]
-; HSW-NOOPT-NEXT: retq # sched: [2:1.00]
+; HSW-NOOPT-NEXT: retq # sched: [7:1.00]
;
; JAG-NOOPT-LABEL: test_mul_by_19:
; JAG-NOOPT: # %bb.0:
; X64-HSW: # %bb.0:
; X64-HSW-NEXT: shlq $2, %rdi # sched: [1:0.50]
; X64-HSW-NEXT: leaq (%rdi,%rdi,4), %rax # sched: [1:0.50]
-; X64-HSW-NEXT: retq # sched: [2:1.00]
+; X64-HSW-NEXT: retq # sched: [7:1.00]
;
; X64-JAG-LABEL: test_mul_by_20:
; X64-JAG: # %bb.0:
; HSW-NOOPT-LABEL: test_mul_by_20:
; HSW-NOOPT: # %bb.0:
; HSW-NOOPT-NEXT: imulq $20, %rdi, %rax # sched: [3:1.00]
-; HSW-NOOPT-NEXT: retq # sched: [2:1.00]
+; HSW-NOOPT-NEXT: retq # sched: [7:1.00]
;
; JAG-NOOPT-LABEL: test_mul_by_20:
; JAG-NOOPT: # %bb.0:
; X64-HSW: # %bb.0:
; X64-HSW-NEXT: leaq (%rdi,%rdi,4), %rax # sched: [1:0.50]
; X64-HSW-NEXT: leaq (%rdi,%rax,4), %rax # sched: [1:0.50]
-; X64-HSW-NEXT: retq # sched: [2:1.00]
+; X64-HSW-NEXT: retq # sched: [7:1.00]
;
; X64-JAG-LABEL: test_mul_by_21:
; X64-JAG: # %bb.0:
; HSW-NOOPT-LABEL: test_mul_by_21:
; HSW-NOOPT: # %bb.0:
; HSW-NOOPT-NEXT: imulq $21, %rdi, %rax # sched: [3:1.00]
-; HSW-NOOPT-NEXT: retq # sched: [2:1.00]
+; HSW-NOOPT-NEXT: retq # sched: [7:1.00]
;
; JAG-NOOPT-LABEL: test_mul_by_21:
; JAG-NOOPT: # %bb.0:
; X64-HSW-NEXT: leaq (%rdi,%rdi,4), %rax # sched: [1:0.50]
; X64-HSW-NEXT: leaq (%rdi,%rax,4), %rax # sched: [1:0.50]
; X64-HSW-NEXT: addq %rdi, %rax # sched: [1:0.25]
-; X64-HSW-NEXT: retq # sched: [2:1.00]
+; X64-HSW-NEXT: retq # sched: [7:1.00]
;
; X64-JAG-LABEL: test_mul_by_22:
; X64-JAG: # %bb.0:
; HSW-NOOPT-LABEL: test_mul_by_22:
; HSW-NOOPT: # %bb.0:
; HSW-NOOPT-NEXT: imulq $22, %rdi, %rax # sched: [3:1.00]
-; HSW-NOOPT-NEXT: retq # sched: [2:1.00]
+; HSW-NOOPT-NEXT: retq # sched: [7:1.00]
;
; JAG-NOOPT-LABEL: test_mul_by_22:
; JAG-NOOPT: # %bb.0:
; X64-HSW-NEXT: leaq (%rdi,%rdi,2), %rax # sched: [1:0.50]
; X64-HSW-NEXT: shlq $3, %rax # sched: [1:0.50]
; X64-HSW-NEXT: subq %rdi, %rax # sched: [1:0.25]
-; X64-HSW-NEXT: retq # sched: [2:1.00]
+; X64-HSW-NEXT: retq # sched: [7:1.00]
;
; X64-JAG-LABEL: test_mul_by_23:
; X64-JAG: # %bb.0:
; HSW-NOOPT-LABEL: test_mul_by_23:
; HSW-NOOPT: # %bb.0:
; HSW-NOOPT-NEXT: imulq $23, %rdi, %rax # sched: [3:1.00]
-; HSW-NOOPT-NEXT: retq # sched: [2:1.00]
+; HSW-NOOPT-NEXT: retq # sched: [7:1.00]
;
; JAG-NOOPT-LABEL: test_mul_by_23:
; JAG-NOOPT: # %bb.0:
; X64-HSW: # %bb.0:
; X64-HSW-NEXT: shlq $3, %rdi # sched: [1:0.50]
; X64-HSW-NEXT: leaq (%rdi,%rdi,2), %rax # sched: [1:0.50]
-; X64-HSW-NEXT: retq # sched: [2:1.00]
+; X64-HSW-NEXT: retq # sched: [7:1.00]
;
; X64-JAG-LABEL: test_mul_by_24:
; X64-JAG: # %bb.0:
; HSW-NOOPT-LABEL: test_mul_by_24:
; HSW-NOOPT: # %bb.0:
; HSW-NOOPT-NEXT: imulq $24, %rdi, %rax # sched: [3:1.00]
-; HSW-NOOPT-NEXT: retq # sched: [2:1.00]
+; HSW-NOOPT-NEXT: retq # sched: [7:1.00]
;
; JAG-NOOPT-LABEL: test_mul_by_24:
; JAG-NOOPT: # %bb.0:
; X64-HSW: # %bb.0:
; X64-HSW-NEXT: leaq (%rdi,%rdi,4), %rax # sched: [1:0.50]
; X64-HSW-NEXT: leaq (%rax,%rax,4), %rax # sched: [1:0.50]
-; X64-HSW-NEXT: retq # sched: [2:1.00]
+; X64-HSW-NEXT: retq # sched: [7:1.00]
;
; X64-JAG-LABEL: test_mul_by_25:
; X64-JAG: # %bb.0:
; HSW-NOOPT-LABEL: test_mul_by_25:
; HSW-NOOPT: # %bb.0:
; HSW-NOOPT-NEXT: imulq $25, %rdi, %rax # sched: [3:1.00]
-; HSW-NOOPT-NEXT: retq # sched: [2:1.00]
+; HSW-NOOPT-NEXT: retq # sched: [7:1.00]
;
; JAG-NOOPT-LABEL: test_mul_by_25:
; JAG-NOOPT: # %bb.0:
; X64-HSW-NEXT: leaq (%rdi,%rdi,8), %rax # sched: [1:0.50]
; X64-HSW-NEXT: leaq (%rax,%rax,2), %rax # sched: [1:0.50]
; X64-HSW-NEXT: subq %rdi, %rax # sched: [1:0.25]
-; X64-HSW-NEXT: retq # sched: [2:1.00]
+; X64-HSW-NEXT: retq # sched: [7:1.00]
;
; X64-JAG-LABEL: test_mul_by_26:
; X64-JAG: # %bb.0:
; HSW-NOOPT-LABEL: test_mul_by_26:
; HSW-NOOPT: # %bb.0:
; HSW-NOOPT-NEXT: imulq $26, %rdi, %rax # sched: [3:1.00]
-; HSW-NOOPT-NEXT: retq # sched: [2:1.00]
+; HSW-NOOPT-NEXT: retq # sched: [7:1.00]
;
; JAG-NOOPT-LABEL: test_mul_by_26:
; JAG-NOOPT: # %bb.0:
; X64-HSW: # %bb.0:
; X64-HSW-NEXT: leaq (%rdi,%rdi,8), %rax # sched: [1:0.50]
; X64-HSW-NEXT: leaq (%rax,%rax,2), %rax # sched: [1:0.50]
-; X64-HSW-NEXT: retq # sched: [2:1.00]
+; X64-HSW-NEXT: retq # sched: [7:1.00]
;
; X64-JAG-LABEL: test_mul_by_27:
; X64-JAG: # %bb.0:
; HSW-NOOPT-LABEL: test_mul_by_27:
; HSW-NOOPT: # %bb.0:
; HSW-NOOPT-NEXT: imulq $27, %rdi, %rax # sched: [3:1.00]
-; HSW-NOOPT-NEXT: retq # sched: [2:1.00]
+; HSW-NOOPT-NEXT: retq # sched: [7:1.00]
;
; JAG-NOOPT-LABEL: test_mul_by_27:
; JAG-NOOPT: # %bb.0:
; X64-HSW-NEXT: leaq (%rdi,%rdi,8), %rax # sched: [1:0.50]
; X64-HSW-NEXT: leaq (%rax,%rax,2), %rax # sched: [1:0.50]
; X64-HSW-NEXT: addq %rdi, %rax # sched: [1:0.25]
-; X64-HSW-NEXT: retq # sched: [2:1.00]
+; X64-HSW-NEXT: retq # sched: [7:1.00]
;
; X64-JAG-LABEL: test_mul_by_28:
; X64-JAG: # %bb.0:
; HSW-NOOPT-LABEL: test_mul_by_28:
; HSW-NOOPT: # %bb.0:
; HSW-NOOPT-NEXT: imulq $28, %rdi, %rax # sched: [3:1.00]
-; HSW-NOOPT-NEXT: retq # sched: [2:1.00]
+; HSW-NOOPT-NEXT: retq # sched: [7:1.00]
;
; JAG-NOOPT-LABEL: test_mul_by_28:
; JAG-NOOPT: # %bb.0:
; X64-HSW-NEXT: leaq (%rax,%rax,2), %rax # sched: [1:0.50]
; X64-HSW-NEXT: addq %rdi, %rax # sched: [1:0.25]
; X64-HSW-NEXT: addq %rdi, %rax # sched: [1:0.25]
-; X64-HSW-NEXT: retq # sched: [2:1.00]
+; X64-HSW-NEXT: retq # sched: [7:1.00]
;
; X64-JAG-LABEL: test_mul_by_29:
; X64-JAG: # %bb.0:
; HSW-NOOPT-LABEL: test_mul_by_29:
; HSW-NOOPT: # %bb.0:
; HSW-NOOPT-NEXT: imulq $29, %rdi, %rax # sched: [3:1.00]
-; HSW-NOOPT-NEXT: retq # sched: [2:1.00]
+; HSW-NOOPT-NEXT: retq # sched: [7:1.00]
;
; JAG-NOOPT-LABEL: test_mul_by_29:
; JAG-NOOPT: # %bb.0:
; X64-HSW-NEXT: shlq $5, %rax # sched: [1:0.50]
; X64-HSW-NEXT: subq %rdi, %rax # sched: [1:0.25]
; X64-HSW-NEXT: subq %rdi, %rax # sched: [1:0.25]
-; X64-HSW-NEXT: retq # sched: [2:1.00]
+; X64-HSW-NEXT: retq # sched: [7:1.00]
;
; X64-JAG-LABEL: test_mul_by_30:
; X64-JAG: # %bb.0:
; HSW-NOOPT-LABEL: test_mul_by_30:
; HSW-NOOPT: # %bb.0:
; HSW-NOOPT-NEXT: imulq $30, %rdi, %rax # sched: [3:1.00]
-; HSW-NOOPT-NEXT: retq # sched: [2:1.00]
+; HSW-NOOPT-NEXT: retq # sched: [7:1.00]
;
; JAG-NOOPT-LABEL: test_mul_by_30:
; JAG-NOOPT: # %bb.0:
; X64-HSW-NEXT: movq %rdi, %rax # sched: [1:0.25]
; X64-HSW-NEXT: shlq $5, %rax # sched: [1:0.50]
; X64-HSW-NEXT: subq %rdi, %rax # sched: [1:0.25]
-; X64-HSW-NEXT: retq # sched: [2:1.00]
+; X64-HSW-NEXT: retq # sched: [7:1.00]
;
; X64-JAG-LABEL: test_mul_by_31:
; X64-JAG: # %bb.0:
; HSW-NOOPT-LABEL: test_mul_by_31:
; HSW-NOOPT: # %bb.0:
; HSW-NOOPT-NEXT: imulq $31, %rdi, %rax # sched: [3:1.00]
-; HSW-NOOPT-NEXT: retq # sched: [2:1.00]
+; HSW-NOOPT-NEXT: retq # sched: [7:1.00]
;
; JAG-NOOPT-LABEL: test_mul_by_31:
; JAG-NOOPT: # %bb.0:
; X64-HSW: # %bb.0:
; X64-HSW-NEXT: shlq $5, %rdi # sched: [1:0.50]
; X64-HSW-NEXT: movq %rdi, %rax # sched: [1:0.25]
-; X64-HSW-NEXT: retq # sched: [2:1.00]
+; X64-HSW-NEXT: retq # sched: [7:1.00]
;
; X64-JAG-LABEL: test_mul_by_32:
; X64-JAG: # %bb.0:
; HSW-NOOPT: # %bb.0:
; HSW-NOOPT-NEXT: shlq $5, %rdi # sched: [1:0.50]
; HSW-NOOPT-NEXT: movq %rdi, %rax # sched: [1:0.25]
-; HSW-NOOPT-NEXT: retq # sched: [2:1.00]
+; HSW-NOOPT-NEXT: retq # sched: [7:1.00]
;
; JAG-NOOPT-LABEL: test_mul_by_32:
; JAG-NOOPT: # %bb.0:
; X64-HSW-NEXT: leaq (%rdi,%rdi,4), %rax # sched: [1:0.50]
; X64-HSW-NEXT: addq $2, %rax # sched: [1:0.25]
; X64-HSW-NEXT: imulq %rcx, %rax # sched: [4:1.00]
-; X64-HSW-NEXT: retq # sched: [2:1.00]
+; X64-HSW-NEXT: retq # sched: [7:1.00]
;
; X64-JAG-LABEL: test_mul_spec:
; X64-JAG: # %bb.0:
; HSW-NOOPT-NEXT: leaq (%rdi,%rdi,4), %rax # sched: [1:0.50]
; HSW-NOOPT-NEXT: addq $2, %rax # sched: [1:0.25]
; HSW-NOOPT-NEXT: imulq %rcx, %rax # sched: [4:1.00]
-; HSW-NOOPT-NEXT: retq # sched: [2:1.00]
+; HSW-NOOPT-NEXT: retq # sched: [7:1.00]
;
; JAG-NOOPT-LABEL: test_mul_spec:
; JAG-NOOPT: # %bb.0:
;
; HASWELL-LABEL: test_ctpop_i16:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: popcntw (%rsi), %cx # sched: [3:1.00]
+; HASWELL-NEXT: popcntw (%rsi), %cx # sched: [8:1.00]
; HASWELL-NEXT: popcntw %di, %ax # sched: [3:1.00]
; HASWELL-NEXT: orl %ecx, %eax # sched: [1:0.25]
; HASWELL-NEXT: # kill: def %ax killed %ax killed %eax
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_ctpop_i16:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_ctpop_i32:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: popcntl (%rsi), %ecx # sched: [3:1.00]
+; HASWELL-NEXT: popcntl (%rsi), %ecx # sched: [8:1.00]
; HASWELL-NEXT: popcntl %edi, %eax # sched: [3:1.00]
; HASWELL-NEXT: orl %ecx, %eax # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_ctpop_i32:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_ctpop_i64:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: popcntq (%rsi), %rcx # sched: [3:1.00]
+; HASWELL-NEXT: popcntq (%rsi), %rcx # sched: [8:1.00]
; HASWELL-NEXT: popcntq %rdi, %rax # sched: [3:1.00]
; HASWELL-NEXT: orq %rcx, %rax # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_ctpop_i64:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_rdrand_16:
; HASWELL: # %bb.0:
; HASWELL-NEXT: rdrandw %ax # sched: [1:5.33]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_rdrand_16:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_rdrand_32:
; HASWELL: # %bb.0:
; HASWELL-NEXT: rdrandl %eax # sched: [1:5.33]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_rdrand_32:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_rdrand_64:
; HASWELL: # %bb.0:
; HASWELL-NEXT: rdrandq %rax # sched: [1:5.33]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_rdrand_64:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: f32_no_estimate:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: vmovss {{.*#+}} xmm1 = mem[0],zero,zero,zero sched: [1:0.50]
+; HASWELL-NEXT: vmovss {{.*#+}} xmm1 = mem[0],zero,zero,zero sched: [5:0.50]
; HASWELL-NEXT: vdivss %xmm0, %xmm1, %xmm0 # sched: [13:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; HASWELL-NO-FMA-LABEL: f32_no_estimate:
; HASWELL-NO-FMA: # %bb.0:
;
; KNL-LABEL: f32_no_estimate:
; KNL: # %bb.0:
-; KNL-NEXT: vmovss {{.*#+}} xmm1 = mem[0],zero,zero,zero sched: [1:0.50]
+; KNL-NEXT: vmovss {{.*#+}} xmm1 = mem[0],zero,zero,zero sched: [5:0.50]
; KNL-NEXT: vdivss %xmm0, %xmm1, %xmm0 # sched: [13:1.00]
-; KNL-NEXT: retq # sched: [2:1.00]
+; KNL-NEXT: retq # sched: [7:1.00]
;
; SKX-LABEL: f32_no_estimate:
; SKX: # %bb.0:
; HASWELL-LABEL: f32_one_step:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vrcpss %xmm0, %xmm0, %xmm1 # sched: [5:1.00]
-; HASWELL-NEXT: vfnmadd213ss {{.*}}(%rip), %xmm1, %xmm0 # sched: [5:0.50]
+; HASWELL-NEXT: vfnmadd213ss {{.*}}(%rip), %xmm1, %xmm0 # sched: [10:0.50]
; HASWELL-NEXT: vfmadd132ss %xmm1, %xmm1, %xmm0 # sched: [5:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; HASWELL-NO-FMA-LABEL: f32_one_step:
; HASWELL-NO-FMA: # %bb.0:
; KNL-LABEL: f32_one_step:
; KNL: # %bb.0:
; KNL-NEXT: vrcpss %xmm0, %xmm0, %xmm1 # sched: [5:1.00]
-; KNL-NEXT: vfnmadd213ss {{.*}}(%rip), %xmm1, %xmm0 # sched: [5:0.50]
+; KNL-NEXT: vfnmadd213ss {{.*}}(%rip), %xmm1, %xmm0 # sched: [10:0.50]
; KNL-NEXT: vfmadd132ss %xmm1, %xmm1, %xmm0 # sched: [5:0.50]
-; KNL-NEXT: retq # sched: [2:1.00]
+; KNL-NEXT: retq # sched: [7:1.00]
;
; SKX-LABEL: f32_one_step:
; SKX: # %bb.0:
; HASWELL-LABEL: f32_two_step:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vrcpss %xmm0, %xmm0, %xmm1 # sched: [5:1.00]
-; HASWELL-NEXT: vmovss {{.*#+}} xmm2 = mem[0],zero,zero,zero sched: [1:0.50]
+; HASWELL-NEXT: vmovss {{.*#+}} xmm2 = mem[0],zero,zero,zero sched: [5:0.50]
; HASWELL-NEXT: vmovaps %xmm1, %xmm3 # sched: [1:1.00]
; HASWELL-NEXT: vfnmadd213ss %xmm2, %xmm0, %xmm3 # sched: [5:0.50]
; HASWELL-NEXT: vfmadd132ss %xmm1, %xmm1, %xmm3 # sched: [5:0.50]
; HASWELL-NEXT: vfnmadd213ss %xmm2, %xmm3, %xmm0 # sched: [5:0.50]
; HASWELL-NEXT: vfmadd132ss %xmm3, %xmm3, %xmm0 # sched: [5:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; HASWELL-NO-FMA-LABEL: f32_two_step:
; HASWELL-NO-FMA: # %bb.0:
; KNL-LABEL: f32_two_step:
; KNL: # %bb.0:
; KNL-NEXT: vrcpss %xmm0, %xmm0, %xmm1 # sched: [5:1.00]
-; KNL-NEXT: vmovss {{.*#+}} xmm2 = mem[0],zero,zero,zero sched: [1:0.50]
+; KNL-NEXT: vmovss {{.*#+}} xmm2 = mem[0],zero,zero,zero sched: [5:0.50]
; KNL-NEXT: vmovaps %xmm1, %xmm3 # sched: [1:1.00]
; KNL-NEXT: vfnmadd213ss %xmm2, %xmm0, %xmm3 # sched: [5:0.50]
; KNL-NEXT: vfmadd132ss %xmm1, %xmm1, %xmm3 # sched: [5:0.50]
; KNL-NEXT: vfnmadd213ss %xmm2, %xmm3, %xmm0 # sched: [5:0.50]
; KNL-NEXT: vfmadd132ss %xmm3, %xmm3, %xmm0 # sched: [5:0.50]
-; KNL-NEXT: retq # sched: [2:1.00]
+; KNL-NEXT: retq # sched: [7:1.00]
;
; SKX-LABEL: f32_two_step:
; SKX: # %bb.0:
;
; HASWELL-LABEL: v4f32_no_estimate:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: vbroadcastss {{.*#+}} xmm1 = [1,1,1,1] sched: [1:0.50]
+; HASWELL-NEXT: vbroadcastss {{.*#+}} xmm1 = [1,1,1,1] sched: [6:0.50]
; HASWELL-NEXT: vdivps %xmm0, %xmm1, %xmm0 # sched: [13:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; HASWELL-NO-FMA-LABEL: v4f32_no_estimate:
; HASWELL-NO-FMA: # %bb.0:
;
; KNL-LABEL: v4f32_no_estimate:
; KNL: # %bb.0:
-; KNL-NEXT: vbroadcastss {{.*#+}} xmm1 = [1,1,1,1] sched: [1:0.50]
+; KNL-NEXT: vbroadcastss {{.*#+}} xmm1 = [1,1,1,1] sched: [6:0.50]
; KNL-NEXT: vdivps %xmm0, %xmm1, %xmm0 # sched: [13:1.00]
-; KNL-NEXT: retq # sched: [2:1.00]
+; KNL-NEXT: retq # sched: [7:1.00]
;
; SKX-LABEL: v4f32_no_estimate:
; SKX: # %bb.0:
; HASWELL-LABEL: v4f32_one_step:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vrcpps %xmm0, %xmm1 # sched: [5:1.00]
-; HASWELL-NEXT: vbroadcastss {{.*#+}} xmm2 = [1,1,1,1] sched: [1:0.50]
+; HASWELL-NEXT: vbroadcastss {{.*#+}} xmm2 = [1,1,1,1] sched: [6:0.50]
; HASWELL-NEXT: vfnmadd213ps %xmm2, %xmm1, %xmm0 # sched: [5:0.50]
; HASWELL-NEXT: vfmadd132ps %xmm1, %xmm1, %xmm0 # sched: [5:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; HASWELL-NO-FMA-LABEL: v4f32_one_step:
; HASWELL-NO-FMA: # %bb.0:
; KNL-LABEL: v4f32_one_step:
; KNL: # %bb.0:
; KNL-NEXT: vrcpps %xmm0, %xmm1 # sched: [5:1.00]
-; KNL-NEXT: vbroadcastss {{.*#+}} xmm2 = [1,1,1,1] sched: [1:0.50]
+; KNL-NEXT: vbroadcastss {{.*#+}} xmm2 = [1,1,1,1] sched: [6:0.50]
; KNL-NEXT: vfnmadd213ps %xmm2, %xmm1, %xmm0 # sched: [5:0.50]
; KNL-NEXT: vfmadd132ps %xmm1, %xmm1, %xmm0 # sched: [5:0.50]
-; KNL-NEXT: retq # sched: [2:1.00]
+; KNL-NEXT: retq # sched: [7:1.00]
;
; SKX-LABEL: v4f32_one_step:
; SKX: # %bb.0:
; HASWELL-LABEL: v4f32_two_step:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vrcpps %xmm0, %xmm1 # sched: [5:1.00]
-; HASWELL-NEXT: vbroadcastss {{.*#+}} xmm2 = [1,1,1,1] sched: [1:0.50]
+; HASWELL-NEXT: vbroadcastss {{.*#+}} xmm2 = [1,1,1,1] sched: [6:0.50]
; HASWELL-NEXT: vmovaps %xmm1, %xmm3 # sched: [1:1.00]
; HASWELL-NEXT: vfnmadd213ps %xmm2, %xmm0, %xmm3 # sched: [5:0.50]
; HASWELL-NEXT: vfmadd132ps %xmm1, %xmm1, %xmm3 # sched: [5:0.50]
; HASWELL-NEXT: vfnmadd213ps %xmm2, %xmm3, %xmm0 # sched: [5:0.50]
; HASWELL-NEXT: vfmadd132ps %xmm3, %xmm3, %xmm0 # sched: [5:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; HASWELL-NO-FMA-LABEL: v4f32_two_step:
; HASWELL-NO-FMA: # %bb.0:
; KNL-LABEL: v4f32_two_step:
; KNL: # %bb.0:
; KNL-NEXT: vrcpps %xmm0, %xmm1 # sched: [5:1.00]
-; KNL-NEXT: vbroadcastss {{.*#+}} xmm2 = [1,1,1,1] sched: [1:0.50]
+; KNL-NEXT: vbroadcastss {{.*#+}} xmm2 = [1,1,1,1] sched: [6:0.50]
; KNL-NEXT: vmovaps %xmm1, %xmm3 # sched: [1:1.00]
; KNL-NEXT: vfnmadd213ps %xmm2, %xmm0, %xmm3 # sched: [5:0.50]
; KNL-NEXT: vfmadd132ps %xmm1, %xmm1, %xmm3 # sched: [5:0.50]
; KNL-NEXT: vfnmadd213ps %xmm2, %xmm3, %xmm0 # sched: [5:0.50]
; KNL-NEXT: vfmadd132ps %xmm3, %xmm3, %xmm0 # sched: [5:0.50]
-; KNL-NEXT: retq # sched: [2:1.00]
+; KNL-NEXT: retq # sched: [7:1.00]
;
; SKX-LABEL: v4f32_two_step:
; SKX: # %bb.0:
;
; HASWELL-LABEL: v8f32_no_estimate:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: vbroadcastss {{.*#+}} ymm1 = [1,1,1,1,1,1,1,1] sched: [1:0.50]
+; HASWELL-NEXT: vbroadcastss {{.*#+}} ymm1 = [1,1,1,1,1,1,1,1] sched: [7:0.50]
; HASWELL-NEXT: vdivps %ymm0, %ymm1, %ymm0 # sched: [21:2.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; HASWELL-NO-FMA-LABEL: v8f32_no_estimate:
; HASWELL-NO-FMA: # %bb.0:
;
; KNL-LABEL: v8f32_no_estimate:
; KNL: # %bb.0:
-; KNL-NEXT: vbroadcastss {{.*#+}} ymm1 = [1,1,1,1,1,1,1,1] sched: [1:0.50]
+; KNL-NEXT: vbroadcastss {{.*#+}} ymm1 = [1,1,1,1,1,1,1,1] sched: [7:0.50]
; KNL-NEXT: vdivps %ymm0, %ymm1, %ymm0 # sched: [21:2.00]
-; KNL-NEXT: retq # sched: [2:1.00]
+; KNL-NEXT: retq # sched: [7:1.00]
;
; SKX-LABEL: v8f32_no_estimate:
; SKX: # %bb.0:
; HASWELL-LABEL: v8f32_one_step:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vrcpps %ymm0, %ymm1 # sched: [11:2.00]
-; HASWELL-NEXT: vbroadcastss {{.*#+}} ymm2 = [1,1,1,1,1,1,1,1] sched: [1:0.50]
+; HASWELL-NEXT: vbroadcastss {{.*#+}} ymm2 = [1,1,1,1,1,1,1,1] sched: [7:0.50]
; HASWELL-NEXT: vfnmadd213ps %ymm2, %ymm1, %ymm0 # sched: [5:0.50]
; HASWELL-NEXT: vfmadd132ps %ymm1, %ymm1, %ymm0 # sched: [5:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; HASWELL-NO-FMA-LABEL: v8f32_one_step:
; HASWELL-NO-FMA: # %bb.0:
; KNL-LABEL: v8f32_one_step:
; KNL: # %bb.0:
; KNL-NEXT: vrcpps %ymm0, %ymm1 # sched: [11:2.00]
-; KNL-NEXT: vbroadcastss {{.*#+}} ymm2 = [1,1,1,1,1,1,1,1] sched: [1:0.50]
+; KNL-NEXT: vbroadcastss {{.*#+}} ymm2 = [1,1,1,1,1,1,1,1] sched: [7:0.50]
; KNL-NEXT: vfnmadd213ps %ymm2, %ymm1, %ymm0 # sched: [5:0.50]
; KNL-NEXT: vfmadd132ps %ymm1, %ymm1, %ymm0 # sched: [5:0.50]
-; KNL-NEXT: retq # sched: [2:1.00]
+; KNL-NEXT: retq # sched: [7:1.00]
;
; SKX-LABEL: v8f32_one_step:
; SKX: # %bb.0:
; HASWELL-LABEL: v8f32_two_step:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vrcpps %ymm0, %ymm1 # sched: [11:2.00]
-; HASWELL-NEXT: vbroadcastss {{.*#+}} ymm2 = [1,1,1,1,1,1,1,1] sched: [1:0.50]
+; HASWELL-NEXT: vbroadcastss {{.*#+}} ymm2 = [1,1,1,1,1,1,1,1] sched: [7:0.50]
; HASWELL-NEXT: vmovaps %ymm1, %ymm3 # sched: [1:1.00]
; HASWELL-NEXT: vfnmadd213ps %ymm2, %ymm0, %ymm3 # sched: [5:0.50]
; HASWELL-NEXT: vfmadd132ps %ymm1, %ymm1, %ymm3 # sched: [5:0.50]
; HASWELL-NEXT: vfnmadd213ps %ymm2, %ymm3, %ymm0 # sched: [5:0.50]
; HASWELL-NEXT: vfmadd132ps %ymm3, %ymm3, %ymm0 # sched: [5:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; HASWELL-NO-FMA-LABEL: v8f32_two_step:
; HASWELL-NO-FMA: # %bb.0:
; KNL-LABEL: v8f32_two_step:
; KNL: # %bb.0:
; KNL-NEXT: vrcpps %ymm0, %ymm1 # sched: [11:2.00]
-; KNL-NEXT: vbroadcastss {{.*#+}} ymm2 = [1,1,1,1,1,1,1,1] sched: [1:0.50]
+; KNL-NEXT: vbroadcastss {{.*#+}} ymm2 = [1,1,1,1,1,1,1,1] sched: [7:0.50]
; KNL-NEXT: vmovaps %ymm1, %ymm3 # sched: [1:1.00]
; KNL-NEXT: vfnmadd213ps %ymm2, %ymm0, %ymm3 # sched: [5:0.50]
; KNL-NEXT: vfmadd132ps %ymm1, %ymm1, %ymm3 # sched: [5:0.50]
; KNL-NEXT: vfnmadd213ps %ymm2, %ymm3, %ymm0 # sched: [5:0.50]
; KNL-NEXT: vfmadd132ps %ymm3, %ymm3, %ymm0 # sched: [5:0.50]
-; KNL-NEXT: retq # sched: [2:1.00]
+; KNL-NEXT: retq # sched: [7:1.00]
;
; SKX-LABEL: v8f32_two_step:
; SKX: # %bb.0:
; HASWELL-LABEL: f32_no_step_2:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vrcpss %xmm0, %xmm0, %xmm0 # sched: [5:1.00]
-; HASWELL-NEXT: vmulss {{.*}}(%rip), %xmm0, %xmm0 # sched: [5:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vmulss {{.*}}(%rip), %xmm0, %xmm0 # sched: [10:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; HASWELL-NO-FMA-LABEL: f32_no_step_2:
; HASWELL-NO-FMA: # %bb.0:
; HASWELL-NO-FMA-NEXT: vrcpss %xmm0, %xmm0, %xmm0 # sched: [5:1.00]
-; HASWELL-NO-FMA-NEXT: vmulss {{.*}}(%rip), %xmm0, %xmm0 # sched: [5:0.50]
-; HASWELL-NO-FMA-NEXT: retq # sched: [2:1.00]
+; HASWELL-NO-FMA-NEXT: vmulss {{.*}}(%rip), %xmm0, %xmm0 # sched: [10:0.50]
+; HASWELL-NO-FMA-NEXT: retq # sched: [7:1.00]
;
; KNL-LABEL: f32_no_step_2:
; KNL: # %bb.0:
; KNL-NEXT: vrcpss %xmm0, %xmm0, %xmm0 # sched: [5:1.00]
-; KNL-NEXT: vmulss {{.*}}(%rip), %xmm0, %xmm0 # sched: [5:0.50]
-; KNL-NEXT: retq # sched: [2:1.00]
+; KNL-NEXT: vmulss {{.*}}(%rip), %xmm0, %xmm0 # sched: [10:0.50]
+; KNL-NEXT: retq # sched: [7:1.00]
;
; SKX-LABEL: f32_no_step_2:
; SKX: # %bb.0:
; HASWELL-LABEL: f32_one_step_2:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vrcpss %xmm0, %xmm0, %xmm1 # sched: [5:1.00]
-; HASWELL-NEXT: vfnmadd213ss {{.*}}(%rip), %xmm1, %xmm0 # sched: [5:0.50]
+; HASWELL-NEXT: vfnmadd213ss {{.*}}(%rip), %xmm1, %xmm0 # sched: [10:0.50]
; HASWELL-NEXT: vfmadd132ss %xmm1, %xmm1, %xmm0 # sched: [5:0.50]
-; HASWELL-NEXT: vmulss {{.*}}(%rip), %xmm0, %xmm0 # sched: [5:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vmulss {{.*}}(%rip), %xmm0, %xmm0 # sched: [10:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; HASWELL-NO-FMA-LABEL: f32_one_step_2:
; HASWELL-NO-FMA: # %bb.0:
; HASWELL-NO-FMA-NEXT: vrcpss %xmm0, %xmm0, %xmm1 # sched: [5:1.00]
; HASWELL-NO-FMA-NEXT: vmulss %xmm1, %xmm0, %xmm0 # sched: [5:0.50]
-; HASWELL-NO-FMA-NEXT: vmovss {{.*#+}} xmm2 = mem[0],zero,zero,zero sched: [1:0.50]
+; HASWELL-NO-FMA-NEXT: vmovss {{.*#+}} xmm2 = mem[0],zero,zero,zero sched: [5:0.50]
; HASWELL-NO-FMA-NEXT: vsubss %xmm0, %xmm2, %xmm0 # sched: [3:1.00]
; HASWELL-NO-FMA-NEXT: vmulss %xmm0, %xmm1, %xmm0 # sched: [5:0.50]
; HASWELL-NO-FMA-NEXT: vaddss %xmm0, %xmm1, %xmm0 # sched: [3:1.00]
-; HASWELL-NO-FMA-NEXT: vmulss {{.*}}(%rip), %xmm0, %xmm0 # sched: [5:0.50]
-; HASWELL-NO-FMA-NEXT: retq # sched: [2:1.00]
+; HASWELL-NO-FMA-NEXT: vmulss {{.*}}(%rip), %xmm0, %xmm0 # sched: [10:0.50]
+; HASWELL-NO-FMA-NEXT: retq # sched: [7:1.00]
;
; KNL-LABEL: f32_one_step_2:
; KNL: # %bb.0:
; KNL-NEXT: vrcpss %xmm0, %xmm0, %xmm1 # sched: [5:1.00]
-; KNL-NEXT: vfnmadd213ss {{.*}}(%rip), %xmm1, %xmm0 # sched: [5:0.50]
+; KNL-NEXT: vfnmadd213ss {{.*}}(%rip), %xmm1, %xmm0 # sched: [10:0.50]
; KNL-NEXT: vfmadd132ss %xmm1, %xmm1, %xmm0 # sched: [5:0.50]
-; KNL-NEXT: vmulss {{.*}}(%rip), %xmm0, %xmm0 # sched: [5:0.50]
-; KNL-NEXT: retq # sched: [2:1.00]
+; KNL-NEXT: vmulss {{.*}}(%rip), %xmm0, %xmm0 # sched: [10:0.50]
+; KNL-NEXT: retq # sched: [7:1.00]
;
; SKX-LABEL: f32_one_step_2:
; SKX: # %bb.0:
; HASWELL-LABEL: f32_one_step_2_divs:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vrcpss %xmm0, %xmm0, %xmm1 # sched: [5:1.00]
-; HASWELL-NEXT: vfnmadd213ss {{.*}}(%rip), %xmm1, %xmm0 # sched: [5:0.50]
+; HASWELL-NEXT: vfnmadd213ss {{.*}}(%rip), %xmm1, %xmm0 # sched: [10:0.50]
; HASWELL-NEXT: vfmadd132ss %xmm1, %xmm1, %xmm0 # sched: [5:0.50]
-; HASWELL-NEXT: vmulss {{.*}}(%rip), %xmm0, %xmm1 # sched: [5:0.50]
+; HASWELL-NEXT: vmulss {{.*}}(%rip), %xmm0, %xmm1 # sched: [10:0.50]
; HASWELL-NEXT: vmulss %xmm0, %xmm1, %xmm0 # sched: [5:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; HASWELL-NO-FMA-LABEL: f32_one_step_2_divs:
; HASWELL-NO-FMA: # %bb.0:
; HASWELL-NO-FMA-NEXT: vrcpss %xmm0, %xmm0, %xmm1 # sched: [5:1.00]
; HASWELL-NO-FMA-NEXT: vmulss %xmm1, %xmm0, %xmm0 # sched: [5:0.50]
-; HASWELL-NO-FMA-NEXT: vmovss {{.*#+}} xmm2 = mem[0],zero,zero,zero sched: [1:0.50]
+; HASWELL-NO-FMA-NEXT: vmovss {{.*#+}} xmm2 = mem[0],zero,zero,zero sched: [5:0.50]
; HASWELL-NO-FMA-NEXT: vsubss %xmm0, %xmm2, %xmm0 # sched: [3:1.00]
; HASWELL-NO-FMA-NEXT: vmulss %xmm0, %xmm1, %xmm0 # sched: [5:0.50]
; HASWELL-NO-FMA-NEXT: vaddss %xmm0, %xmm1, %xmm0 # sched: [3:1.00]
-; HASWELL-NO-FMA-NEXT: vmulss {{.*}}(%rip), %xmm0, %xmm1 # sched: [5:0.50]
+; HASWELL-NO-FMA-NEXT: vmulss {{.*}}(%rip), %xmm0, %xmm1 # sched: [10:0.50]
; HASWELL-NO-FMA-NEXT: vmulss %xmm0, %xmm1, %xmm0 # sched: [5:0.50]
-; HASWELL-NO-FMA-NEXT: retq # sched: [2:1.00]
+; HASWELL-NO-FMA-NEXT: retq # sched: [7:1.00]
;
; KNL-LABEL: f32_one_step_2_divs:
; KNL: # %bb.0:
; KNL-NEXT: vrcpss %xmm0, %xmm0, %xmm1 # sched: [5:1.00]
-; KNL-NEXT: vfnmadd213ss {{.*}}(%rip), %xmm1, %xmm0 # sched: [5:0.50]
+; KNL-NEXT: vfnmadd213ss {{.*}}(%rip), %xmm1, %xmm0 # sched: [10:0.50]
; KNL-NEXT: vfmadd132ss %xmm1, %xmm1, %xmm0 # sched: [5:0.50]
-; KNL-NEXT: vmulss {{.*}}(%rip), %xmm0, %xmm1 # sched: [5:0.50]
+; KNL-NEXT: vmulss {{.*}}(%rip), %xmm0, %xmm1 # sched: [10:0.50]
; KNL-NEXT: vmulss %xmm0, %xmm1, %xmm0 # sched: [5:0.50]
-; KNL-NEXT: retq # sched: [2:1.00]
+; KNL-NEXT: retq # sched: [7:1.00]
;
; SKX-LABEL: f32_one_step_2_divs:
; SKX: # %bb.0:
; HASWELL-LABEL: f32_two_step_2:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vrcpss %xmm0, %xmm0, %xmm1 # sched: [5:1.00]
-; HASWELL-NEXT: vmovss {{.*#+}} xmm2 = mem[0],zero,zero,zero sched: [1:0.50]
+; HASWELL-NEXT: vmovss {{.*#+}} xmm2 = mem[0],zero,zero,zero sched: [5:0.50]
; HASWELL-NEXT: vmovaps %xmm1, %xmm3 # sched: [1:1.00]
; HASWELL-NEXT: vfnmadd213ss %xmm2, %xmm0, %xmm3 # sched: [5:0.50]
; HASWELL-NEXT: vfmadd132ss %xmm1, %xmm1, %xmm3 # sched: [5:0.50]
; HASWELL-NEXT: vfnmadd213ss %xmm2, %xmm3, %xmm0 # sched: [5:0.50]
; HASWELL-NEXT: vfmadd132ss %xmm3, %xmm3, %xmm0 # sched: [5:0.50]
-; HASWELL-NEXT: vmulss {{.*}}(%rip), %xmm0, %xmm0 # sched: [5:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vmulss {{.*}}(%rip), %xmm0, %xmm0 # sched: [10:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; HASWELL-NO-FMA-LABEL: f32_two_step_2:
; HASWELL-NO-FMA: # %bb.0:
; HASWELL-NO-FMA-NEXT: vrcpss %xmm0, %xmm0, %xmm1 # sched: [5:1.00]
; HASWELL-NO-FMA-NEXT: vmulss %xmm1, %xmm0, %xmm2 # sched: [5:0.50]
-; HASWELL-NO-FMA-NEXT: vmovss {{.*#+}} xmm3 = mem[0],zero,zero,zero sched: [1:0.50]
+; HASWELL-NO-FMA-NEXT: vmovss {{.*#+}} xmm3 = mem[0],zero,zero,zero sched: [5:0.50]
; HASWELL-NO-FMA-NEXT: vsubss %xmm2, %xmm3, %xmm2 # sched: [3:1.00]
; HASWELL-NO-FMA-NEXT: vmulss %xmm2, %xmm1, %xmm2 # sched: [5:0.50]
; HASWELL-NO-FMA-NEXT: vaddss %xmm2, %xmm1, %xmm1 # sched: [3:1.00]
; HASWELL-NO-FMA-NEXT: vsubss %xmm0, %xmm3, %xmm0 # sched: [3:1.00]
; HASWELL-NO-FMA-NEXT: vmulss %xmm0, %xmm1, %xmm0 # sched: [5:0.50]
; HASWELL-NO-FMA-NEXT: vaddss %xmm0, %xmm1, %xmm0 # sched: [3:1.00]
-; HASWELL-NO-FMA-NEXT: vmulss {{.*}}(%rip), %xmm0, %xmm0 # sched: [5:0.50]
-; HASWELL-NO-FMA-NEXT: retq # sched: [2:1.00]
+; HASWELL-NO-FMA-NEXT: vmulss {{.*}}(%rip), %xmm0, %xmm0 # sched: [10:0.50]
+; HASWELL-NO-FMA-NEXT: retq # sched: [7:1.00]
;
; KNL-LABEL: f32_two_step_2:
; KNL: # %bb.0:
; KNL-NEXT: vrcpss %xmm0, %xmm0, %xmm1 # sched: [5:1.00]
-; KNL-NEXT: vmovss {{.*#+}} xmm2 = mem[0],zero,zero,zero sched: [1:0.50]
+; KNL-NEXT: vmovss {{.*#+}} xmm2 = mem[0],zero,zero,zero sched: [5:0.50]
; KNL-NEXT: vmovaps %xmm1, %xmm3 # sched: [1:1.00]
; KNL-NEXT: vfnmadd213ss %xmm2, %xmm0, %xmm3 # sched: [5:0.50]
; KNL-NEXT: vfmadd132ss %xmm1, %xmm1, %xmm3 # sched: [5:0.50]
; KNL-NEXT: vfnmadd213ss %xmm2, %xmm3, %xmm0 # sched: [5:0.50]
; KNL-NEXT: vfmadd132ss %xmm3, %xmm3, %xmm0 # sched: [5:0.50]
-; KNL-NEXT: vmulss {{.*}}(%rip), %xmm0, %xmm0 # sched: [5:0.50]
-; KNL-NEXT: retq # sched: [2:1.00]
+; KNL-NEXT: vmulss {{.*}}(%rip), %xmm0, %xmm0 # sched: [10:0.50]
+; KNL-NEXT: retq # sched: [7:1.00]
;
; SKX-LABEL: f32_two_step_2:
; SKX: # %bb.0:
; HASWELL-LABEL: v4f32_one_step2:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vrcpps %xmm0, %xmm1 # sched: [5:1.00]
-; HASWELL-NEXT: vbroadcastss {{.*#+}} xmm2 = [1,1,1,1] sched: [1:0.50]
+; HASWELL-NEXT: vbroadcastss {{.*#+}} xmm2 = [1,1,1,1] sched: [6:0.50]
; HASWELL-NEXT: vfnmadd213ps %xmm2, %xmm1, %xmm0 # sched: [5:0.50]
; HASWELL-NEXT: vfmadd132ps %xmm1, %xmm1, %xmm0 # sched: [5:0.50]
-; HASWELL-NEXT: vmulps {{.*}}(%rip), %xmm0, %xmm0 # sched: [5:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vmulps {{.*}}(%rip), %xmm0, %xmm0 # sched: [11:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; HASWELL-NO-FMA-LABEL: v4f32_one_step2:
; HASWELL-NO-FMA: # %bb.0:
; HASWELL-NO-FMA-NEXT: vrcpps %xmm0, %xmm1 # sched: [5:1.00]
; HASWELL-NO-FMA-NEXT: vmulps %xmm1, %xmm0, %xmm0 # sched: [5:0.50]
-; HASWELL-NO-FMA-NEXT: vbroadcastss {{.*#+}} xmm2 = [1,1,1,1] sched: [1:0.50]
+; HASWELL-NO-FMA-NEXT: vbroadcastss {{.*#+}} xmm2 = [1,1,1,1] sched: [6:0.50]
; HASWELL-NO-FMA-NEXT: vsubps %xmm0, %xmm2, %xmm0 # sched: [3:1.00]
; HASWELL-NO-FMA-NEXT: vmulps %xmm0, %xmm1, %xmm0 # sched: [5:0.50]
; HASWELL-NO-FMA-NEXT: vaddps %xmm0, %xmm1, %xmm0 # sched: [3:1.00]
-; HASWELL-NO-FMA-NEXT: vmulps {{.*}}(%rip), %xmm0, %xmm0 # sched: [5:0.50]
-; HASWELL-NO-FMA-NEXT: retq # sched: [2:1.00]
+; HASWELL-NO-FMA-NEXT: vmulps {{.*}}(%rip), %xmm0, %xmm0 # sched: [11:0.50]
+; HASWELL-NO-FMA-NEXT: retq # sched: [7:1.00]
;
; KNL-LABEL: v4f32_one_step2:
; KNL: # %bb.0:
; KNL-NEXT: vrcpps %xmm0, %xmm1 # sched: [5:1.00]
-; KNL-NEXT: vbroadcastss {{.*#+}} xmm2 = [1,1,1,1] sched: [1:0.50]
+; KNL-NEXT: vbroadcastss {{.*#+}} xmm2 = [1,1,1,1] sched: [6:0.50]
; KNL-NEXT: vfnmadd213ps %xmm2, %xmm1, %xmm0 # sched: [5:0.50]
; KNL-NEXT: vfmadd132ps %xmm1, %xmm1, %xmm0 # sched: [5:0.50]
-; KNL-NEXT: vmulps {{.*}}(%rip), %xmm0, %xmm0 # sched: [5:0.50]
-; KNL-NEXT: retq # sched: [2:1.00]
+; KNL-NEXT: vmulps {{.*}}(%rip), %xmm0, %xmm0 # sched: [11:0.50]
+; KNL-NEXT: retq # sched: [7:1.00]
;
; SKX-LABEL: v4f32_one_step2:
; SKX: # %bb.0:
; HASWELL-LABEL: v4f32_one_step_2_divs:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vrcpps %xmm0, %xmm1 # sched: [5:1.00]
-; HASWELL-NEXT: vbroadcastss {{.*#+}} xmm2 = [1,1,1,1] sched: [1:0.50]
+; HASWELL-NEXT: vbroadcastss {{.*#+}} xmm2 = [1,1,1,1] sched: [6:0.50]
; HASWELL-NEXT: vfnmadd213ps %xmm2, %xmm1, %xmm0 # sched: [5:0.50]
; HASWELL-NEXT: vfmadd132ps %xmm1, %xmm1, %xmm0 # sched: [5:0.50]
-; HASWELL-NEXT: vmulps {{.*}}(%rip), %xmm0, %xmm1 # sched: [5:0.50]
+; HASWELL-NEXT: vmulps {{.*}}(%rip), %xmm0, %xmm1 # sched: [11:0.50]
; HASWELL-NEXT: vmulps %xmm0, %xmm1, %xmm0 # sched: [5:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; HASWELL-NO-FMA-LABEL: v4f32_one_step_2_divs:
; HASWELL-NO-FMA: # %bb.0:
; HASWELL-NO-FMA-NEXT: vrcpps %xmm0, %xmm1 # sched: [5:1.00]
; HASWELL-NO-FMA-NEXT: vmulps %xmm1, %xmm0, %xmm0 # sched: [5:0.50]
-; HASWELL-NO-FMA-NEXT: vbroadcastss {{.*#+}} xmm2 = [1,1,1,1] sched: [1:0.50]
+; HASWELL-NO-FMA-NEXT: vbroadcastss {{.*#+}} xmm2 = [1,1,1,1] sched: [6:0.50]
; HASWELL-NO-FMA-NEXT: vsubps %xmm0, %xmm2, %xmm0 # sched: [3:1.00]
; HASWELL-NO-FMA-NEXT: vmulps %xmm0, %xmm1, %xmm0 # sched: [5:0.50]
; HASWELL-NO-FMA-NEXT: vaddps %xmm0, %xmm1, %xmm0 # sched: [3:1.00]
-; HASWELL-NO-FMA-NEXT: vmulps {{.*}}(%rip), %xmm0, %xmm1 # sched: [5:0.50]
+; HASWELL-NO-FMA-NEXT: vmulps {{.*}}(%rip), %xmm0, %xmm1 # sched: [11:0.50]
; HASWELL-NO-FMA-NEXT: vmulps %xmm0, %xmm1, %xmm0 # sched: [5:0.50]
-; HASWELL-NO-FMA-NEXT: retq # sched: [2:1.00]
+; HASWELL-NO-FMA-NEXT: retq # sched: [7:1.00]
;
; KNL-LABEL: v4f32_one_step_2_divs:
; KNL: # %bb.0:
; KNL-NEXT: vrcpps %xmm0, %xmm1 # sched: [5:1.00]
-; KNL-NEXT: vbroadcastss {{.*#+}} xmm2 = [1,1,1,1] sched: [1:0.50]
+; KNL-NEXT: vbroadcastss {{.*#+}} xmm2 = [1,1,1,1] sched: [6:0.50]
; KNL-NEXT: vfnmadd213ps %xmm2, %xmm1, %xmm0 # sched: [5:0.50]
; KNL-NEXT: vfmadd132ps %xmm1, %xmm1, %xmm0 # sched: [5:0.50]
-; KNL-NEXT: vmulps {{.*}}(%rip), %xmm0, %xmm1 # sched: [5:0.50]
+; KNL-NEXT: vmulps {{.*}}(%rip), %xmm0, %xmm1 # sched: [11:0.50]
; KNL-NEXT: vmulps %xmm0, %xmm1, %xmm0 # sched: [5:0.50]
-; KNL-NEXT: retq # sched: [2:1.00]
+; KNL-NEXT: retq # sched: [7:1.00]
;
; SKX-LABEL: v4f32_one_step_2_divs:
; SKX: # %bb.0:
; HASWELL-LABEL: v4f32_two_step2:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vrcpps %xmm0, %xmm1 # sched: [5:1.00]
-; HASWELL-NEXT: vbroadcastss {{.*#+}} xmm2 = [1,1,1,1] sched: [1:0.50]
+; HASWELL-NEXT: vbroadcastss {{.*#+}} xmm2 = [1,1,1,1] sched: [6:0.50]
; HASWELL-NEXT: vmovaps %xmm1, %xmm3 # sched: [1:1.00]
; HASWELL-NEXT: vfnmadd213ps %xmm2, %xmm0, %xmm3 # sched: [5:0.50]
; HASWELL-NEXT: vfmadd132ps %xmm1, %xmm1, %xmm3 # sched: [5:0.50]
; HASWELL-NEXT: vfnmadd213ps %xmm2, %xmm3, %xmm0 # sched: [5:0.50]
; HASWELL-NEXT: vfmadd132ps %xmm3, %xmm3, %xmm0 # sched: [5:0.50]
-; HASWELL-NEXT: vmulps {{.*}}(%rip), %xmm0, %xmm0 # sched: [5:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vmulps {{.*}}(%rip), %xmm0, %xmm0 # sched: [11:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; HASWELL-NO-FMA-LABEL: v4f32_two_step2:
; HASWELL-NO-FMA: # %bb.0:
; HASWELL-NO-FMA-NEXT: vrcpps %xmm0, %xmm1 # sched: [5:1.00]
; HASWELL-NO-FMA-NEXT: vmulps %xmm1, %xmm0, %xmm2 # sched: [5:0.50]
-; HASWELL-NO-FMA-NEXT: vbroadcastss {{.*#+}} xmm3 = [1,1,1,1] sched: [1:0.50]
+; HASWELL-NO-FMA-NEXT: vbroadcastss {{.*#+}} xmm3 = [1,1,1,1] sched: [6:0.50]
; HASWELL-NO-FMA-NEXT: vsubps %xmm2, %xmm3, %xmm2 # sched: [3:1.00]
; HASWELL-NO-FMA-NEXT: vmulps %xmm2, %xmm1, %xmm2 # sched: [5:0.50]
; HASWELL-NO-FMA-NEXT: vaddps %xmm2, %xmm1, %xmm1 # sched: [3:1.00]
; HASWELL-NO-FMA-NEXT: vsubps %xmm0, %xmm3, %xmm0 # sched: [3:1.00]
; HASWELL-NO-FMA-NEXT: vmulps %xmm0, %xmm1, %xmm0 # sched: [5:0.50]
; HASWELL-NO-FMA-NEXT: vaddps %xmm0, %xmm1, %xmm0 # sched: [3:1.00]
-; HASWELL-NO-FMA-NEXT: vmulps {{.*}}(%rip), %xmm0, %xmm0 # sched: [5:0.50]
-; HASWELL-NO-FMA-NEXT: retq # sched: [2:1.00]
+; HASWELL-NO-FMA-NEXT: vmulps {{.*}}(%rip), %xmm0, %xmm0 # sched: [11:0.50]
+; HASWELL-NO-FMA-NEXT: retq # sched: [7:1.00]
;
; KNL-LABEL: v4f32_two_step2:
; KNL: # %bb.0:
; KNL-NEXT: vrcpps %xmm0, %xmm1 # sched: [5:1.00]
-; KNL-NEXT: vbroadcastss {{.*#+}} xmm2 = [1,1,1,1] sched: [1:0.50]
+; KNL-NEXT: vbroadcastss {{.*#+}} xmm2 = [1,1,1,1] sched: [6:0.50]
; KNL-NEXT: vmovaps %xmm1, %xmm3 # sched: [1:1.00]
; KNL-NEXT: vfnmadd213ps %xmm2, %xmm0, %xmm3 # sched: [5:0.50]
; KNL-NEXT: vfmadd132ps %xmm1, %xmm1, %xmm3 # sched: [5:0.50]
; KNL-NEXT: vfnmadd213ps %xmm2, %xmm3, %xmm0 # sched: [5:0.50]
; KNL-NEXT: vfmadd132ps %xmm3, %xmm3, %xmm0 # sched: [5:0.50]
-; KNL-NEXT: vmulps {{.*}}(%rip), %xmm0, %xmm0 # sched: [5:0.50]
-; KNL-NEXT: retq # sched: [2:1.00]
+; KNL-NEXT: vmulps {{.*}}(%rip), %xmm0, %xmm0 # sched: [11:0.50]
+; KNL-NEXT: retq # sched: [7:1.00]
;
; SKX-LABEL: v4f32_two_step2:
; SKX: # %bb.0:
; HASWELL-LABEL: v8f32_one_step2:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vrcpps %ymm0, %ymm1 # sched: [11:2.00]
-; HASWELL-NEXT: vbroadcastss {{.*#+}} ymm2 = [1,1,1,1,1,1,1,1] sched: [1:0.50]
+; HASWELL-NEXT: vbroadcastss {{.*#+}} ymm2 = [1,1,1,1,1,1,1,1] sched: [7:0.50]
; HASWELL-NEXT: vfnmadd213ps %ymm2, %ymm1, %ymm0 # sched: [5:0.50]
; HASWELL-NEXT: vfmadd132ps %ymm1, %ymm1, %ymm0 # sched: [5:0.50]
-; HASWELL-NEXT: vmulps {{.*}}(%rip), %ymm0, %ymm0 # sched: [5:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vmulps {{.*}}(%rip), %ymm0, %ymm0 # sched: [12:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; HASWELL-NO-FMA-LABEL: v8f32_one_step2:
; HASWELL-NO-FMA: # %bb.0:
; HASWELL-NO-FMA-NEXT: vrcpps %ymm0, %ymm1 # sched: [11:2.00]
; HASWELL-NO-FMA-NEXT: vmulps %ymm1, %ymm0, %ymm0 # sched: [5:0.50]
-; HASWELL-NO-FMA-NEXT: vbroadcastss {{.*#+}} ymm2 = [1,1,1,1,1,1,1,1] sched: [1:0.50]
+; HASWELL-NO-FMA-NEXT: vbroadcastss {{.*#+}} ymm2 = [1,1,1,1,1,1,1,1] sched: [7:0.50]
; HASWELL-NO-FMA-NEXT: vsubps %ymm0, %ymm2, %ymm0 # sched: [3:1.00]
; HASWELL-NO-FMA-NEXT: vmulps %ymm0, %ymm1, %ymm0 # sched: [5:0.50]
; HASWELL-NO-FMA-NEXT: vaddps %ymm0, %ymm1, %ymm0 # sched: [3:1.00]
-; HASWELL-NO-FMA-NEXT: vmulps {{.*}}(%rip), %ymm0, %ymm0 # sched: [5:0.50]
-; HASWELL-NO-FMA-NEXT: retq # sched: [2:1.00]
+; HASWELL-NO-FMA-NEXT: vmulps {{.*}}(%rip), %ymm0, %ymm0 # sched: [12:0.50]
+; HASWELL-NO-FMA-NEXT: retq # sched: [7:1.00]
;
; KNL-LABEL: v8f32_one_step2:
; KNL: # %bb.0:
; KNL-NEXT: vrcpps %ymm0, %ymm1 # sched: [11:2.00]
-; KNL-NEXT: vbroadcastss {{.*#+}} ymm2 = [1,1,1,1,1,1,1,1] sched: [1:0.50]
+; KNL-NEXT: vbroadcastss {{.*#+}} ymm2 = [1,1,1,1,1,1,1,1] sched: [7:0.50]
; KNL-NEXT: vfnmadd213ps %ymm2, %ymm1, %ymm0 # sched: [5:0.50]
; KNL-NEXT: vfmadd132ps %ymm1, %ymm1, %ymm0 # sched: [5:0.50]
-; KNL-NEXT: vmulps {{.*}}(%rip), %ymm0, %ymm0 # sched: [5:0.50]
-; KNL-NEXT: retq # sched: [2:1.00]
+; KNL-NEXT: vmulps {{.*}}(%rip), %ymm0, %ymm0 # sched: [12:0.50]
+; KNL-NEXT: retq # sched: [7:1.00]
;
; SKX-LABEL: v8f32_one_step2:
; SKX: # %bb.0:
; HASWELL-LABEL: v8f32_one_step_2_divs:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vrcpps %ymm0, %ymm1 # sched: [11:2.00]
-; HASWELL-NEXT: vbroadcastss {{.*#+}} ymm2 = [1,1,1,1,1,1,1,1] sched: [1:0.50]
+; HASWELL-NEXT: vbroadcastss {{.*#+}} ymm2 = [1,1,1,1,1,1,1,1] sched: [7:0.50]
; HASWELL-NEXT: vfnmadd213ps %ymm2, %ymm1, %ymm0 # sched: [5:0.50]
; HASWELL-NEXT: vfmadd132ps %ymm1, %ymm1, %ymm0 # sched: [5:0.50]
-; HASWELL-NEXT: vmulps {{.*}}(%rip), %ymm0, %ymm1 # sched: [5:0.50]
+; HASWELL-NEXT: vmulps {{.*}}(%rip), %ymm0, %ymm1 # sched: [12:0.50]
; HASWELL-NEXT: vmulps %ymm0, %ymm1, %ymm0 # sched: [5:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; HASWELL-NO-FMA-LABEL: v8f32_one_step_2_divs:
; HASWELL-NO-FMA: # %bb.0:
; HASWELL-NO-FMA-NEXT: vrcpps %ymm0, %ymm1 # sched: [11:2.00]
; HASWELL-NO-FMA-NEXT: vmulps %ymm1, %ymm0, %ymm0 # sched: [5:0.50]
-; HASWELL-NO-FMA-NEXT: vbroadcastss {{.*#+}} ymm2 = [1,1,1,1,1,1,1,1] sched: [1:0.50]
+; HASWELL-NO-FMA-NEXT: vbroadcastss {{.*#+}} ymm2 = [1,1,1,1,1,1,1,1] sched: [7:0.50]
; HASWELL-NO-FMA-NEXT: vsubps %ymm0, %ymm2, %ymm0 # sched: [3:1.00]
; HASWELL-NO-FMA-NEXT: vmulps %ymm0, %ymm1, %ymm0 # sched: [5:0.50]
; HASWELL-NO-FMA-NEXT: vaddps %ymm0, %ymm1, %ymm0 # sched: [3:1.00]
-; HASWELL-NO-FMA-NEXT: vmulps {{.*}}(%rip), %ymm0, %ymm1 # sched: [5:0.50]
+; HASWELL-NO-FMA-NEXT: vmulps {{.*}}(%rip), %ymm0, %ymm1 # sched: [12:0.50]
; HASWELL-NO-FMA-NEXT: vmulps %ymm0, %ymm1, %ymm0 # sched: [5:0.50]
-; HASWELL-NO-FMA-NEXT: retq # sched: [2:1.00]
+; HASWELL-NO-FMA-NEXT: retq # sched: [7:1.00]
;
; KNL-LABEL: v8f32_one_step_2_divs:
; KNL: # %bb.0:
; KNL-NEXT: vrcpps %ymm0, %ymm1 # sched: [11:2.00]
-; KNL-NEXT: vbroadcastss {{.*#+}} ymm2 = [1,1,1,1,1,1,1,1] sched: [1:0.50]
+; KNL-NEXT: vbroadcastss {{.*#+}} ymm2 = [1,1,1,1,1,1,1,1] sched: [7:0.50]
; KNL-NEXT: vfnmadd213ps %ymm2, %ymm1, %ymm0 # sched: [5:0.50]
; KNL-NEXT: vfmadd132ps %ymm1, %ymm1, %ymm0 # sched: [5:0.50]
-; KNL-NEXT: vmulps {{.*}}(%rip), %ymm0, %ymm1 # sched: [5:0.50]
+; KNL-NEXT: vmulps {{.*}}(%rip), %ymm0, %ymm1 # sched: [12:0.50]
; KNL-NEXT: vmulps %ymm0, %ymm1, %ymm0 # sched: [5:0.50]
-; KNL-NEXT: retq # sched: [2:1.00]
+; KNL-NEXT: retq # sched: [7:1.00]
;
; SKX-LABEL: v8f32_one_step_2_divs:
; SKX: # %bb.0:
; HASWELL-LABEL: v8f32_two_step2:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vrcpps %ymm0, %ymm1 # sched: [11:2.00]
-; HASWELL-NEXT: vbroadcastss {{.*#+}} ymm2 = [1,1,1,1,1,1,1,1] sched: [1:0.50]
+; HASWELL-NEXT: vbroadcastss {{.*#+}} ymm2 = [1,1,1,1,1,1,1,1] sched: [7:0.50]
; HASWELL-NEXT: vmovaps %ymm1, %ymm3 # sched: [1:1.00]
; HASWELL-NEXT: vfnmadd213ps %ymm2, %ymm0, %ymm3 # sched: [5:0.50]
; HASWELL-NEXT: vfmadd132ps %ymm1, %ymm1, %ymm3 # sched: [5:0.50]
; HASWELL-NEXT: vfnmadd213ps %ymm2, %ymm3, %ymm0 # sched: [5:0.50]
; HASWELL-NEXT: vfmadd132ps %ymm3, %ymm3, %ymm0 # sched: [5:0.50]
-; HASWELL-NEXT: vmulps {{.*}}(%rip), %ymm0, %ymm0 # sched: [5:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vmulps {{.*}}(%rip), %ymm0, %ymm0 # sched: [12:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; HASWELL-NO-FMA-LABEL: v8f32_two_step2:
; HASWELL-NO-FMA: # %bb.0:
; HASWELL-NO-FMA-NEXT: vrcpps %ymm0, %ymm1 # sched: [11:2.00]
; HASWELL-NO-FMA-NEXT: vmulps %ymm1, %ymm0, %ymm2 # sched: [5:0.50]
-; HASWELL-NO-FMA-NEXT: vbroadcastss {{.*#+}} ymm3 = [1,1,1,1,1,1,1,1] sched: [1:0.50]
+; HASWELL-NO-FMA-NEXT: vbroadcastss {{.*#+}} ymm3 = [1,1,1,1,1,1,1,1] sched: [7:0.50]
; HASWELL-NO-FMA-NEXT: vsubps %ymm2, %ymm3, %ymm2 # sched: [3:1.00]
; HASWELL-NO-FMA-NEXT: vmulps %ymm2, %ymm1, %ymm2 # sched: [5:0.50]
; HASWELL-NO-FMA-NEXT: vaddps %ymm2, %ymm1, %ymm1 # sched: [3:1.00]
; HASWELL-NO-FMA-NEXT: vsubps %ymm0, %ymm3, %ymm0 # sched: [3:1.00]
; HASWELL-NO-FMA-NEXT: vmulps %ymm0, %ymm1, %ymm0 # sched: [5:0.50]
; HASWELL-NO-FMA-NEXT: vaddps %ymm0, %ymm1, %ymm0 # sched: [3:1.00]
-; HASWELL-NO-FMA-NEXT: vmulps {{.*}}(%rip), %ymm0, %ymm0 # sched: [5:0.50]
-; HASWELL-NO-FMA-NEXT: retq # sched: [2:1.00]
+; HASWELL-NO-FMA-NEXT: vmulps {{.*}}(%rip), %ymm0, %ymm0 # sched: [12:0.50]
+; HASWELL-NO-FMA-NEXT: retq # sched: [7:1.00]
;
; KNL-LABEL: v8f32_two_step2:
; KNL: # %bb.0:
; KNL-NEXT: vrcpps %ymm0, %ymm1 # sched: [11:2.00]
-; KNL-NEXT: vbroadcastss {{.*#+}} ymm2 = [1,1,1,1,1,1,1,1] sched: [1:0.50]
+; KNL-NEXT: vbroadcastss {{.*#+}} ymm2 = [1,1,1,1,1,1,1,1] sched: [7:0.50]
; KNL-NEXT: vmovaps %ymm1, %ymm3 # sched: [1:1.00]
; KNL-NEXT: vfnmadd213ps %ymm2, %ymm0, %ymm3 # sched: [5:0.50]
; KNL-NEXT: vfmadd132ps %ymm1, %ymm1, %ymm3 # sched: [5:0.50]
; KNL-NEXT: vfnmadd213ps %ymm2, %ymm3, %ymm0 # sched: [5:0.50]
; KNL-NEXT: vfmadd132ps %ymm3, %ymm3, %ymm0 # sched: [5:0.50]
-; KNL-NEXT: vmulps {{.*}}(%rip), %ymm0, %ymm0 # sched: [5:0.50]
-; KNL-NEXT: retq # sched: [2:1.00]
+; KNL-NEXT: vmulps {{.*}}(%rip), %ymm0, %ymm0 # sched: [12:0.50]
+; KNL-NEXT: retq # sched: [7:1.00]
;
; SKX-LABEL: v8f32_two_step2:
; SKX: # %bb.0:
; HASWELL-LABEL: v8f32_no_step:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vrcpps %ymm0, %ymm0 # sched: [11:2.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; HASWELL-NO-FMA-LABEL: v8f32_no_step:
; HASWELL-NO-FMA: # %bb.0:
; HASWELL-NO-FMA-NEXT: vrcpps %ymm0, %ymm0 # sched: [11:2.00]
-; HASWELL-NO-FMA-NEXT: retq # sched: [2:1.00]
+; HASWELL-NO-FMA-NEXT: retq # sched: [7:1.00]
;
; KNL-LABEL: v8f32_no_step:
; KNL: # %bb.0:
; KNL-NEXT: vrcpps %ymm0, %ymm0 # sched: [11:2.00]
-; KNL-NEXT: retq # sched: [2:1.00]
+; KNL-NEXT: retq # sched: [7:1.00]
;
; SKX-LABEL: v8f32_no_step:
; SKX: # %bb.0:
; HASWELL-LABEL: v8f32_no_step2:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vrcpps %ymm0, %ymm0 # sched: [11:2.00]
-; HASWELL-NEXT: vmulps {{.*}}(%rip), %ymm0, %ymm0 # sched: [5:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vmulps {{.*}}(%rip), %ymm0, %ymm0 # sched: [12:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; HASWELL-NO-FMA-LABEL: v8f32_no_step2:
; HASWELL-NO-FMA: # %bb.0:
; HASWELL-NO-FMA-NEXT: vrcpps %ymm0, %ymm0 # sched: [11:2.00]
-; HASWELL-NO-FMA-NEXT: vmulps {{.*}}(%rip), %ymm0, %ymm0 # sched: [5:0.50]
-; HASWELL-NO-FMA-NEXT: retq # sched: [2:1.00]
+; HASWELL-NO-FMA-NEXT: vmulps {{.*}}(%rip), %ymm0, %ymm0 # sched: [12:0.50]
+; HASWELL-NO-FMA-NEXT: retq # sched: [7:1.00]
;
; KNL-LABEL: v8f32_no_step2:
; KNL: # %bb.0:
; KNL-NEXT: vrcpps %ymm0, %ymm0 # sched: [11:2.00]
-; KNL-NEXT: vmulps {{.*}}(%rip), %ymm0, %ymm0 # sched: [5:0.50]
-; KNL-NEXT: retq # sched: [2:1.00]
+; KNL-NEXT: vmulps {{.*}}(%rip), %ymm0, %ymm0 # sched: [12:0.50]
+; KNL-NEXT: retq # sched: [7:1.00]
;
; SKX-LABEL: v8f32_no_step2:
; SKX: # %bb.0:
;
; HASWELL-LABEL: test_aaa:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: movb {{[0-9]+}}(%esp), %al # sched: [1:0.50]
+; HASWELL-NEXT: movb {{[0-9]+}}(%esp), %al # sched: [5:0.50]
; HASWELL-NEXT: #APP
; HASWELL-NEXT: aaa # sched: [100:0.25]
; HASWELL-NEXT: #NO_APP
-; HASWELL-NEXT: retl # sched: [5:0.50]
+; HASWELL-NEXT: retl # sched: [7:1.00]
;
; BROADWELL-LABEL: test_aaa:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_aad:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: movzwl {{[0-9]+}}(%esp), %eax # sched: [4:0.50]
+; HASWELL-NEXT: movzwl {{[0-9]+}}(%esp), %eax # sched: [5:0.50]
; HASWELL-NEXT: #APP
; HASWELL-NEXT: aad # sched: [100:0.25]
; HASWELL-NEXT: #NO_APP
-; HASWELL-NEXT: retl # sched: [5:0.50]
+; HASWELL-NEXT: retl # sched: [7:1.00]
;
; BROADWELL-LABEL: test_aad:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_aam:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: movb {{[0-9]+}}(%esp), %al # sched: [1:0.50]
+; HASWELL-NEXT: movb {{[0-9]+}}(%esp), %al # sched: [5:0.50]
; HASWELL-NEXT: #APP
; HASWELL-NEXT: aam # sched: [100:0.25]
; HASWELL-NEXT: #NO_APP
-; HASWELL-NEXT: retl # sched: [5:0.50]
+; HASWELL-NEXT: retl # sched: [7:1.00]
;
; BROADWELL-LABEL: test_aam:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_aas:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: movb {{[0-9]+}}(%esp), %al # sched: [1:0.50]
+; HASWELL-NEXT: movb {{[0-9]+}}(%esp), %al # sched: [5:0.50]
; HASWELL-NEXT: #APP
; HASWELL-NEXT: aas # sched: [100:0.25]
; HASWELL-NEXT: #NO_APP
-; HASWELL-NEXT: retl # sched: [5:0.50]
+; HASWELL-NEXT: retl # sched: [7:1.00]
;
; BROADWELL-LABEL: test_aas:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_daa:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: movb {{[0-9]+}}(%esp), %al # sched: [1:0.50]
+; HASWELL-NEXT: movb {{[0-9]+}}(%esp), %al # sched: [5:0.50]
; HASWELL-NEXT: #APP
; HASWELL-NEXT: daa # sched: [100:0.25]
; HASWELL-NEXT: #NO_APP
-; HASWELL-NEXT: retl # sched: [5:0.50]
+; HASWELL-NEXT: retl # sched: [7:1.00]
;
; BROADWELL-LABEL: test_daa:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_das:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: movb {{[0-9]+}}(%esp), %al # sched: [1:0.50]
+; HASWELL-NEXT: movb {{[0-9]+}}(%esp), %al # sched: [5:0.50]
; HASWELL-NEXT: #APP
; HASWELL-NEXT: das # sched: [100:0.25]
; HASWELL-NEXT: #NO_APP
-; HASWELL-NEXT: retl # sched: [5:0.50]
+; HASWELL-NEXT: retl # sched: [7:1.00]
;
; BROADWELL-LABEL: test_das:
; BROADWELL: # %bb.0:
; HASWELL-NEXT: #APP
; HASWELL-NEXT: salc # sched: [1:0.25]
; HASWELL-NEXT: #NO_APP
-; HASWELL-NEXT: retl # sched: [5:0.50]
+; HASWELL-NEXT: retl # sched: [7:1.00]
;
; BROADWELL-LABEL: test_salc:
; BROADWELL: # %bb.0:
; HASWELL: # %bb.0:
; HASWELL-NEXT: #APP
; HASWELL-NEXT: bsfw %di, %ax # sched: [3:1.00]
-; HASWELL-NEXT: bsfw (%rsi), %cx # sched: [3:1.00]
+; HASWELL-NEXT: bsfw (%rsi), %cx # sched: [8:1.00]
; HASWELL-NEXT: #NO_APP
; HASWELL-NEXT: orl %ecx, %eax # sched: [1:0.25]
; HASWELL-NEXT: # kill: def %ax killed %ax killed %eax
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_bsf16:
; BROADWELL: # %bb.0:
; HASWELL: # %bb.0:
; HASWELL-NEXT: #APP
; HASWELL-NEXT: bsfl %edi, %eax # sched: [3:1.00]
-; HASWELL-NEXT: bsfl (%rsi), %ecx # sched: [3:1.00]
+; HASWELL-NEXT: bsfl (%rsi), %ecx # sched: [8:1.00]
; HASWELL-NEXT: #NO_APP
; HASWELL-NEXT: orl %ecx, %eax # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_bsf32:
; BROADWELL: # %bb.0:
; HASWELL: # %bb.0:
; HASWELL-NEXT: #APP
; HASWELL-NEXT: bsfq %rdi, %rax # sched: [3:1.00]
-; HASWELL-NEXT: bsfq (%rsi), %rcx # sched: [3:1.00]
+; HASWELL-NEXT: bsfq (%rsi), %rcx # sched: [8:1.00]
; HASWELL-NEXT: #NO_APP
; HASWELL-NEXT: orq %rcx, %rax # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_bsf64:
; BROADWELL: # %bb.0:
; HASWELL: # %bb.0:
; HASWELL-NEXT: #APP
; HASWELL-NEXT: bsrw %di, %ax # sched: [3:1.00]
-; HASWELL-NEXT: bsrw (%rsi), %cx # sched: [3:1.00]
+; HASWELL-NEXT: bsrw (%rsi), %cx # sched: [8:1.00]
; HASWELL-NEXT: #NO_APP
; HASWELL-NEXT: orl %ecx, %eax # sched: [1:0.25]
; HASWELL-NEXT: # kill: def %ax killed %ax killed %eax
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_bsr16:
; BROADWELL: # %bb.0:
; HASWELL: # %bb.0:
; HASWELL-NEXT: #APP
; HASWELL-NEXT: bsrl %edi, %eax # sched: [3:1.00]
-; HASWELL-NEXT: bsrl (%rsi), %ecx # sched: [3:1.00]
+; HASWELL-NEXT: bsrl (%rsi), %ecx # sched: [8:1.00]
; HASWELL-NEXT: #NO_APP
; HASWELL-NEXT: orl %ecx, %eax # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_bsr32:
; BROADWELL: # %bb.0:
; HASWELL: # %bb.0:
; HASWELL-NEXT: #APP
; HASWELL-NEXT: bsrq %rdi, %rax # sched: [3:1.00]
-; HASWELL-NEXT: bsrq (%rsi), %rcx # sched: [3:1.00]
+; HASWELL-NEXT: bsrq (%rsi), %rcx # sched: [8:1.00]
; HASWELL-NEXT: #NO_APP
; HASWELL-NEXT: orq %rcx, %rax # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_bsr64:
; BROADWELL: # %bb.0:
; HASWELL: # %bb.0:
; HASWELL-NEXT: bswapl %edi # sched: [2:0.50]
; HASWELL-NEXT: movl %edi, %eax # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_bswap32:
; BROADWELL: # %bb.0:
; HASWELL: # %bb.0:
; HASWELL-NEXT: bswapq %rdi # sched: [2:0.50]
; HASWELL-NEXT: movq %rdi, %rax # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_bswap64:
; BROADWELL: # %bb.0:
; HASWELL-NEXT: cwtd # sched: [2:0.50]
; HASWELL-NEXT: cwtl # sched: [1:0.25]
; HASWELL-NEXT: #NO_APP
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_cbw_cdq_cdqe_cqo_cwd_cwde:
; BROADWELL: # %bb.0:
; HASWELL-NEXT: cld # sched: [3:1.00]
; HASWELL-NEXT: cmc # sched: [1:0.25]
; HASWELL-NEXT: #NO_APP
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_clc_cld_cmc:
; BROADWELL: # %bb.0:
; HASWELL-NEXT: #APP
; HASWELL-NEXT: cpuid # sched: [18:2.00]
; HASWELL-NEXT: #NO_APP
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_cpuid:
; BROADWELL: # %bb.0:
; HASWELL-NEXT: invlpg (%rdi) # sched: [100:0.25]
; HASWELL-NEXT: invlpga %ecx, %rax # sched: [100:0.25]
; HASWELL-NEXT: #NO_APP
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_invlpg_invlpga:
; BROADWELL: # %bb.0:
; HASWELL-NEXT: lahf # sched: [1:0.25]
; HASWELL-NEXT: sahf # sched: [1:0.25]
; HASWELL-NEXT: #NO_APP
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_lahf_sahf:
; BROADWELL: # %bb.0:
; HASWELL-NEXT: #APP
; HASWELL-NEXT: shldw %cl, %si, %di # sched: [6:1.00]
; HASWELL-NEXT: shrdw %cl, %si, %di # sched: [6:1.00]
-; HASWELL-NEXT: shldw %cl, %si, (%rdx) # sched: [6:1.00]
-; HASWELL-NEXT: shrdw %cl, %si, (%rdx) # sched: [6:1.00]
+; HASWELL-NEXT: shldw %cl, %si, (%rdx) # sched: [12:1.00]
+; HASWELL-NEXT: shrdw %cl, %si, (%rdx) # sched: [12:1.00]
; HASWELL-NEXT: shldw $7, %si, %di # sched: [3:1.00]
; HASWELL-NEXT: shrdw $7, %si, %di # sched: [3:1.00]
-; HASWELL-NEXT: shldw $7, %si, (%rdx) # sched: [4:1.00]
-; HASWELL-NEXT: shrdw $7, %si, (%rdx) # sched: [4:1.00]
+; HASWELL-NEXT: shldw $7, %si, (%rdx) # sched: [10:1.00]
+; HASWELL-NEXT: shrdw $7, %si, (%rdx) # sched: [10:1.00]
; HASWELL-NEXT: #NO_APP
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_shld_shrd_16:
; BROADWELL: # %bb.0:
; HASWELL-NEXT: #APP
; HASWELL-NEXT: shldl %cl, %esi, %edi # sched: [6:1.00]
; HASWELL-NEXT: shrdl %cl, %esi, %edi # sched: [6:1.00]
-; HASWELL-NEXT: shldl %cl, %esi, (%rdx) # sched: [6:1.00]
-; HASWELL-NEXT: shrdl %cl, %esi, (%rdx) # sched: [6:1.00]
+; HASWELL-NEXT: shldl %cl, %esi, (%rdx) # sched: [12:1.00]
+; HASWELL-NEXT: shrdl %cl, %esi, (%rdx) # sched: [12:1.00]
; HASWELL-NEXT: shldl $7, %esi, %edi # sched: [3:1.00]
; HASWELL-NEXT: shrdl $7, %esi, %edi # sched: [3:1.00]
-; HASWELL-NEXT: shldl $7, %esi, (%rdx) # sched: [4:1.00]
-; HASWELL-NEXT: shrdl $7, %esi, (%rdx) # sched: [4:1.00]
+; HASWELL-NEXT: shldl $7, %esi, (%rdx) # sched: [10:1.00]
+; HASWELL-NEXT: shrdl $7, %esi, (%rdx) # sched: [10:1.00]
; HASWELL-NEXT: #NO_APP
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_shld_shrd_32:
; BROADWELL: # %bb.0:
; HASWELL-NEXT: #APP
; HASWELL-NEXT: shldq %cl, %rsi, %rdi # sched: [6:1.00]
; HASWELL-NEXT: shrdq %cl, %rsi, %rdi # sched: [6:1.00]
-; HASWELL-NEXT: shldq %cl, %rsi, (%rdx) # sched: [6:1.00]
-; HASWELL-NEXT: shrdq %cl, %rsi, (%rdx) # sched: [6:1.00]
+; HASWELL-NEXT: shldq %cl, %rsi, (%rdx) # sched: [12:1.00]
+; HASWELL-NEXT: shrdq %cl, %rsi, (%rdx) # sched: [12:1.00]
; HASWELL-NEXT: shldq $7, %rsi, %rdi # sched: [3:1.00]
; HASWELL-NEXT: shrdq $7, %rsi, %rdi # sched: [3:1.00]
-; HASWELL-NEXT: shldq $7, %rsi, (%rdx) # sched: [4:1.00]
-; HASWELL-NEXT: shrdq $7, %rsi, (%rdx) # sched: [4:1.00]
+; HASWELL-NEXT: shldq $7, %rsi, (%rdx) # sched: [10:1.00]
+; HASWELL-NEXT: shrdq $7, %rsi, (%rdx) # sched: [10:1.00]
; HASWELL-NEXT: #NO_APP
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_shld_shrd_64:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_addps:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vaddps %xmm1, %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: vaddps (%rdi), %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vaddps (%rdi), %xmm0, %xmm0 # sched: [9:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_addps:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_addss:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vaddss %xmm1, %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: vaddss (%rdi), %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vaddss (%rdi), %xmm0, %xmm0 # sched: [8:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_addss:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_andps:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vandps %xmm1, %xmm0, %xmm0 # sched: [1:1.00]
-; HASWELL-NEXT: vandps (%rdi), %xmm0, %xmm0 # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vandps (%rdi), %xmm0, %xmm0 # sched: [7:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_andps:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_andnotps:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vandnps %xmm1, %xmm0, %xmm0 # sched: [1:1.00]
-; HASWELL-NEXT: vandnps (%rdi), %xmm0, %xmm0 # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vandnps (%rdi), %xmm0, %xmm0 # sched: [7:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_andnotps:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_cmpps:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vcmpeqps %xmm1, %xmm0, %xmm1 # sched: [3:1.00]
-; HASWELL-NEXT: vcmpeqps (%rdi), %xmm0, %xmm0 # sched: [3:1.00]
+; HASWELL-NEXT: vcmpeqps (%rdi), %xmm0, %xmm0 # sched: [9:1.00]
; HASWELL-NEXT: vorps %xmm0, %xmm1, %xmm0 # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_cmpps:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_cmpss:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vcmpeqss %xmm1, %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: vcmpeqss (%rdi), %xmm0, %xmm0 # sched: [7:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vcmpeqss (%rdi), %xmm0, %xmm0 # sched: [8:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_cmpss:
; BROADWELL: # %bb.0:
; HASWELL-NEXT: setnp %al # sched: [1:0.50]
; HASWELL-NEXT: sete %cl # sched: [1:0.50]
; HASWELL-NEXT: andb %al, %cl # sched: [1:0.25]
-; HASWELL-NEXT: vcomiss (%rdi), %xmm0 # sched: [7:1.00]
+; HASWELL-NEXT: vcomiss (%rdi), %xmm0 # sched: [8:1.00]
; HASWELL-NEXT: setnp %al # sched: [1:0.50]
; HASWELL-NEXT: sete %dl # sched: [1:0.50]
; HASWELL-NEXT: andb %al, %dl # sched: [1:0.25]
; HASWELL-NEXT: orb %cl, %dl # sched: [1:0.25]
; HASWELL-NEXT: movzbl %dl, %eax # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_comiss:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_cvtsi2ss:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vcvtsi2ssl %edi, %xmm0, %xmm0 # sched: [4:1.00]
-; HASWELL-NEXT: vcvtsi2ssl (%rsi), %xmm1, %xmm1 # sched: [8:1.00]
+; HASWELL-NEXT: vcvtsi2ssl (%rsi), %xmm1, %xmm1 # sched: [9:1.00]
; HASWELL-NEXT: vaddss %xmm1, %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_cvtsi2ss:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_cvtsi2ssq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vcvtsi2ssq %rdi, %xmm0, %xmm0 # sched: [5:2.00]
-; HASWELL-NEXT: vcvtsi2ssq (%rsi), %xmm1, %xmm1 # sched: [8:1.00]
+; HASWELL-NEXT: vcvtsi2ssq (%rsi), %xmm1, %xmm1 # sched: [9:1.00]
; HASWELL-NEXT: vaddss %xmm1, %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_cvtsi2ssq:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_cvtss2si:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vcvtss2si %xmm0, %ecx # sched: [4:1.00]
-; HASWELL-NEXT: vcvtss2si (%rdi), %eax # sched: [4:1.00]
+; HASWELL-NEXT: vcvtss2si (%rdi), %eax # sched: [9:1.00]
; HASWELL-NEXT: addl %ecx, %eax # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_cvtss2si:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_cvtss2siq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vcvtss2si %xmm0, %rcx # sched: [4:1.00]
-; HASWELL-NEXT: vcvtss2si (%rdi), %rax # sched: [4:1.00]
+; HASWELL-NEXT: vcvtss2si (%rdi), %rax # sched: [9:1.00]
; HASWELL-NEXT: addq %rcx, %rax # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_cvtss2siq:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_cvttss2si:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vcvttss2si %xmm0, %ecx # sched: [4:1.00]
-; HASWELL-NEXT: vcvttss2si (%rdi), %eax # sched: [4:1.00]
+; HASWELL-NEXT: vcvttss2si (%rdi), %eax # sched: [9:1.00]
; HASWELL-NEXT: addl %ecx, %eax # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_cvttss2si:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_cvttss2siq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vcvttss2si %xmm0, %rcx # sched: [4:1.00]
-; HASWELL-NEXT: vcvttss2si (%rdi), %rax # sched: [4:1.00]
+; HASWELL-NEXT: vcvttss2si (%rdi), %rax # sched: [9:1.00]
; HASWELL-NEXT: addq %rcx, %rax # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_cvttss2siq:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_divps:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vdivps %xmm1, %xmm0, %xmm0 # sched: [13:1.00]
-; HASWELL-NEXT: vdivps (%rdi), %xmm0, %xmm0 # sched: [13:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vdivps (%rdi), %xmm0, %xmm0 # sched: [19:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_divps:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_divss:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vdivss %xmm1, %xmm0, %xmm0 # sched: [13:1.00]
-; HASWELL-NEXT: vdivss (%rdi), %xmm0, %xmm0 # sched: [13:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vdivss (%rdi), %xmm0, %xmm0 # sched: [18:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_divss:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_ldmxcsr:
; HASWELL: # %bb.0:
; HASWELL-NEXT: movl %edi, -{{[0-9]+}}(%rsp) # sched: [1:1.00]
-; HASWELL-NEXT: vldmxcsr -{{[0-9]+}}(%rsp) # sched: [2:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vldmxcsr -{{[0-9]+}}(%rsp) # sched: [7:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_ldmxcsr:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_maxps:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vmaxps %xmm1, %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: vmaxps (%rdi), %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vmaxps (%rdi), %xmm0, %xmm0 # sched: [9:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_maxps:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_maxss:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vmaxss %xmm1, %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: vmaxss (%rdi), %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vmaxss (%rdi), %xmm0, %xmm0 # sched: [8:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_maxss:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_minps:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vminps %xmm1, %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: vminps (%rdi), %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vminps (%rdi), %xmm0, %xmm0 # sched: [9:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_minps:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_minss:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vminss %xmm1, %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: vminss (%rdi), %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vminss (%rdi), %xmm0, %xmm0 # sched: [8:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_minss:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_movaps:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: vmovaps (%rdi), %xmm0 # sched: [1:0.50]
+; HASWELL-NEXT: vmovaps (%rdi), %xmm0 # sched: [6:0.50]
; HASWELL-NEXT: vaddps %xmm0, %xmm0, %xmm0 # sched: [3:1.00]
; HASWELL-NEXT: vmovaps %xmm0, (%rsi) # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_movaps:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_movhlps:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vunpckhpd {{.*#+}} xmm0 = xmm1[1],xmm0[1] sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_movhlps:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_movhps:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: vmovhpd {{.*#+}} xmm1 = xmm1[0],mem[0] sched: [1:1.00]
+; HASWELL-NEXT: vmovhpd {{.*#+}} xmm1 = xmm1[0],mem[0] sched: [6:1.00]
; HASWELL-NEXT: vaddps %xmm1, %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: vpextrq $1, %xmm0, (%rdi) # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpextrq $1, %xmm0, (%rdi) # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_movhps:
; BROADWELL: # %bb.0:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vmovlhps {{.*#+}} xmm0 = xmm0[0],xmm1[0] sched: [1:1.00]
; HASWELL-NEXT: vaddps %xmm0, %xmm1, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_movlhps:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_movlps:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: vmovlpd {{.*#+}} xmm1 = mem[0],xmm1[1] sched: [1:1.00]
+; HASWELL-NEXT: vmovlpd {{.*#+}} xmm1 = mem[0],xmm1[1] sched: [6:1.00]
; HASWELL-NEXT: vaddps %xmm1, %xmm0, %xmm0 # sched: [3:1.00]
; HASWELL-NEXT: vmovlps %xmm0, (%rdi) # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_movlps:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_movmskps:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vmovmskps %xmm0, %eax # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_movmskps:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_movntps:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vmovntps %xmm0, (%rdi) # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_movntps:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_movss_mem:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: vmovss {{.*#+}} xmm0 = mem[0],zero,zero,zero sched: [1:0.50]
+; HASWELL-NEXT: vmovss {{.*#+}} xmm0 = mem[0],zero,zero,zero sched: [5:0.50]
; HASWELL-NEXT: vaddss %xmm0, %xmm0, %xmm0 # sched: [3:1.00]
; HASWELL-NEXT: vmovss %xmm0, (%rsi) # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_movss_mem:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_movss_reg:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vblendps {{.*#+}} xmm0 = xmm1[0],xmm0[1,2,3] sched: [1:0.33]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_movss_reg:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_movups:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: vmovups (%rdi), %xmm0 # sched: [1:0.50]
+; HASWELL-NEXT: vmovups (%rdi), %xmm0 # sched: [6:0.50]
; HASWELL-NEXT: vaddps %xmm0, %xmm0, %xmm0 # sched: [3:1.00]
; HASWELL-NEXT: vmovups %xmm0, (%rsi) # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_movups:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_mulps:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vmulps %xmm1, %xmm0, %xmm0 # sched: [5:0.50]
-; HASWELL-NEXT: vmulps (%rdi), %xmm0, %xmm0 # sched: [5:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vmulps (%rdi), %xmm0, %xmm0 # sched: [11:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_mulps:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_mulss:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vmulss %xmm1, %xmm0, %xmm0 # sched: [5:0.50]
-; HASWELL-NEXT: vmulss (%rdi), %xmm0, %xmm0 # sched: [5:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vmulss (%rdi), %xmm0, %xmm0 # sched: [10:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_mulss:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_orps:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vorps %xmm1, %xmm0, %xmm0 # sched: [1:1.00]
-; HASWELL-NEXT: vorps (%rdi), %xmm0, %xmm0 # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vorps (%rdi), %xmm0, %xmm0 # sched: [7:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_orps:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_prefetchnta:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: prefetchnta (%rdi) # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: prefetchnta (%rdi) # sched: [5:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_prefetchnta:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_rcpps:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vrcpps %xmm0, %xmm0 # sched: [5:1.00]
-; HASWELL-NEXT: vrcpps (%rdi), %xmm1 # sched: [5:1.00]
+; HASWELL-NEXT: vrcpps (%rdi), %xmm1 # sched: [11:1.00]
; HASWELL-NEXT: vaddps %xmm1, %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_rcpps:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_rcpss:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vrcpss %xmm0, %xmm0, %xmm0 # sched: [5:1.00]
-; HASWELL-NEXT: vmovss {{.*#+}} xmm1 = mem[0],zero,zero,zero sched: [1:0.50]
+; HASWELL-NEXT: vmovss {{.*#+}} xmm1 = mem[0],zero,zero,zero sched: [5:0.50]
; HASWELL-NEXT: vrcpss %xmm1, %xmm1, %xmm1 # sched: [5:1.00]
; HASWELL-NEXT: vaddps %xmm1, %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_rcpss:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_rsqrtps:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vrsqrtps %xmm0, %xmm0 # sched: [5:1.00]
-; HASWELL-NEXT: vrsqrtps (%rdi), %xmm1 # sched: [5:1.00]
+; HASWELL-NEXT: vrsqrtps (%rdi), %xmm1 # sched: [11:1.00]
; HASWELL-NEXT: vaddps %xmm1, %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_rsqrtps:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_rsqrtss:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vrsqrtss %xmm0, %xmm0, %xmm0 # sched: [5:1.00]
-; HASWELL-NEXT: vmovss {{.*#+}} xmm1 = mem[0],zero,zero,zero sched: [1:0.50]
+; HASWELL-NEXT: vmovss {{.*#+}} xmm1 = mem[0],zero,zero,zero sched: [5:0.50]
; HASWELL-NEXT: vrsqrtss %xmm1, %xmm1, %xmm1 # sched: [5:1.00]
; HASWELL-NEXT: vaddps %xmm1, %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_rsqrtss:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_sfence:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: sfence # sched: [1:0.33]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: sfence # sched: [2:0.33]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_sfence:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_shufps:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vshufps {{.*#+}} xmm0 = xmm0[0,0],xmm1[0,0] sched: [1:1.00]
-; HASWELL-NEXT: vshufps {{.*#+}} xmm0 = xmm0[0,3],mem[0,0] sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vshufps {{.*#+}} xmm0 = xmm0[0,3],mem[0,0] sched: [7:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_shufps:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_sqrtps:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vsqrtps %xmm0, %xmm0 # sched: [14:1.00]
-; HASWELL-NEXT: vsqrtps (%rdi), %xmm1 # sched: [14:1.00]
+; HASWELL-NEXT: vsqrtps (%rdi), %xmm1 # sched: [20:1.00]
; HASWELL-NEXT: vaddps %xmm1, %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_sqrtps:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_sqrtss:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vsqrtss %xmm0, %xmm0, %xmm0 # sched: [14:1.00]
-; HASWELL-NEXT: vmovaps (%rdi), %xmm1 # sched: [1:0.50]
+; HASWELL-NEXT: vmovaps (%rdi), %xmm1 # sched: [6:0.50]
; HASWELL-NEXT: vsqrtss %xmm1, %xmm1, %xmm1 # sched: [14:1.00]
; HASWELL-NEXT: vaddps %xmm1, %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_sqrtss:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_stmxcsr:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: vstmxcsr -{{[0-9]+}}(%rsp) # sched: [1:1.00]
-; HASWELL-NEXT: movl -{{[0-9]+}}(%rsp), %eax # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vstmxcsr -{{[0-9]+}}(%rsp) # sched: [2:1.00]
+; HASWELL-NEXT: movl -{{[0-9]+}}(%rsp), %eax # sched: [5:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_stmxcsr:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_subps:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vsubps %xmm1, %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: vsubps (%rdi), %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vsubps (%rdi), %xmm0, %xmm0 # sched: [9:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_subps:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_subss:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vsubss %xmm1, %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: vsubss (%rdi), %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vsubss (%rdi), %xmm0, %xmm0 # sched: [8:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_subss:
; BROADWELL: # %bb.0:
; HASWELL-NEXT: setnp %al # sched: [1:0.50]
; HASWELL-NEXT: sete %cl # sched: [1:0.50]
; HASWELL-NEXT: andb %al, %cl # sched: [1:0.25]
-; HASWELL-NEXT: vucomiss (%rdi), %xmm0 # sched: [7:1.00]
+; HASWELL-NEXT: vucomiss (%rdi), %xmm0 # sched: [8:1.00]
; HASWELL-NEXT: setnp %al # sched: [1:0.50]
; HASWELL-NEXT: sete %dl # sched: [1:0.50]
; HASWELL-NEXT: andb %al, %dl # sched: [1:0.25]
; HASWELL-NEXT: orb %cl, %dl # sched: [1:0.25]
; HASWELL-NEXT: movzbl %dl, %eax # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_ucomiss:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_unpckhps:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vunpckhps {{.*#+}} xmm0 = xmm0[2],xmm1[2],xmm0[3],xmm1[3] sched: [1:1.00]
-; HASWELL-NEXT: vunpckhps {{.*#+}} xmm0 = xmm0[2],mem[2],xmm0[3],mem[3] sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vunpckhps {{.*#+}} xmm0 = xmm0[2],mem[2],xmm0[3],mem[3] sched: [7:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_unpckhps:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_unpcklps:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vunpcklps {{.*#+}} xmm0 = xmm0[0],xmm1[0],xmm0[1],xmm1[1] sched: [1:1.00]
-; HASWELL-NEXT: vunpcklps {{.*#+}} xmm0 = xmm0[0],mem[0],xmm0[1],mem[1] sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vunpcklps {{.*#+}} xmm0 = xmm0[0],mem[0],xmm0[1],mem[1] sched: [7:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_unpcklps:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_xorps:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vxorps %xmm1, %xmm0, %xmm0 # sched: [1:1.00]
-; HASWELL-NEXT: vxorps (%rdi), %xmm0, %xmm0 # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vxorps (%rdi), %xmm0, %xmm0 # sched: [7:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_xorps:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_addpd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vaddpd %xmm1, %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: vaddpd (%rdi), %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vaddpd (%rdi), %xmm0, %xmm0 # sched: [9:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_addpd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_addsd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vaddsd %xmm1, %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: vaddsd (%rdi), %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vaddsd (%rdi), %xmm0, %xmm0 # sched: [8:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_addsd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_andpd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vandpd %xmm1, %xmm0, %xmm0 # sched: [1:1.00]
-; HASWELL-NEXT: vandpd (%rdi), %xmm0, %xmm0 # sched: [1:1.00]
+; HASWELL-NEXT: vandpd (%rdi), %xmm0, %xmm0 # sched: [7:1.00]
; HASWELL-NEXT: vaddpd %xmm0, %xmm1, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_andpd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_andnotpd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vandnpd %xmm1, %xmm0, %xmm0 # sched: [1:1.00]
-; HASWELL-NEXT: vandnpd (%rdi), %xmm0, %xmm0 # sched: [1:1.00]
+; HASWELL-NEXT: vandnpd (%rdi), %xmm0, %xmm0 # sched: [7:1.00]
; HASWELL-NEXT: vaddpd %xmm0, %xmm1, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_andnotpd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_clflush:
; HASWELL: # %bb.0:
; HASWELL-NEXT: clflush (%rdi) # sched: [2:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_clflush:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_cmppd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vcmpeqpd %xmm1, %xmm0, %xmm1 # sched: [3:1.00]
-; HASWELL-NEXT: vcmpeqpd (%rdi), %xmm0, %xmm0 # sched: [3:1.00]
+; HASWELL-NEXT: vcmpeqpd (%rdi), %xmm0, %xmm0 # sched: [9:1.00]
; HASWELL-NEXT: vorpd %xmm0, %xmm1, %xmm0 # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_cmppd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_cmpsd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vcmpeqsd %xmm1, %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: vcmpeqsd (%rdi), %xmm0, %xmm0 # sched: [7:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vcmpeqsd (%rdi), %xmm0, %xmm0 # sched: [8:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_cmpsd:
; BROADWELL: # %bb.0:
; HASWELL-NEXT: setnp %al # sched: [1:0.50]
; HASWELL-NEXT: sete %cl # sched: [1:0.50]
; HASWELL-NEXT: andb %al, %cl # sched: [1:0.25]
-; HASWELL-NEXT: vcomisd (%rdi), %xmm0 # sched: [7:1.00]
+; HASWELL-NEXT: vcomisd (%rdi), %xmm0 # sched: [8:1.00]
; HASWELL-NEXT: setnp %al # sched: [1:0.50]
; HASWELL-NEXT: sete %dl # sched: [1:0.50]
; HASWELL-NEXT: andb %al, %dl # sched: [1:0.25]
; HASWELL-NEXT: orb %cl, %dl # sched: [1:0.25]
; HASWELL-NEXT: movzbl %dl, %eax # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_comisd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_cvtdq2pd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vcvtdq2pd %xmm0, %xmm0 # sched: [4:1.00]
-; HASWELL-NEXT: vcvtdq2pd (%rdi), %xmm1 # sched: [4:1.00]
+; HASWELL-NEXT: vcvtdq2pd (%rdi), %xmm1 # sched: [10:1.00]
; HASWELL-NEXT: vaddpd %xmm1, %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_cvtdq2pd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_cvtdq2ps:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vcvtdq2ps %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: vcvtdq2ps (%rdi), %xmm1 # sched: [3:1.00]
+; HASWELL-NEXT: vcvtdq2ps (%rdi), %xmm1 # sched: [9:1.00]
; HASWELL-NEXT: vaddps %xmm1, %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_cvtdq2ps:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_cvtpd2dq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vcvtpd2dq %xmm0, %xmm0 # sched: [4:1.00]
-; HASWELL-NEXT: vcvtpd2dqx (%rdi), %xmm1 # sched: [7:1.00]
+; HASWELL-NEXT: vcvtpd2dqx (%rdi), %xmm1 # sched: [8:1.00]
; HASWELL-NEXT: vpaddd %xmm1, %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_cvtpd2dq:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_cvtpd2ps:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vcvtpd2ps %xmm0, %xmm0 # sched: [4:1.00]
-; HASWELL-NEXT: vcvtpd2psx (%rdi), %xmm1 # sched: [7:1.00]
+; HASWELL-NEXT: vcvtpd2psx (%rdi), %xmm1 # sched: [8:1.00]
; HASWELL-NEXT: vaddps %xmm1, %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_cvtpd2ps:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_cvtps2dq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vcvtps2dq %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: vcvtps2dq (%rdi), %xmm1 # sched: [3:1.00]
+; HASWELL-NEXT: vcvtps2dq (%rdi), %xmm1 # sched: [9:1.00]
; HASWELL-NEXT: vpaddd %xmm1, %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_cvtps2dq:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_cvtps2pd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vcvtps2pd %xmm0, %xmm0 # sched: [2:1.00]
-; HASWELL-NEXT: vcvtps2pd (%rdi), %xmm1 # sched: [1:1.00]
+; HASWELL-NEXT: vcvtps2pd (%rdi), %xmm1 # sched: [6:1.00]
; HASWELL-NEXT: vaddpd %xmm1, %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_cvtps2pd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_cvtsd2si:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vcvtsd2si %xmm0, %ecx # sched: [4:1.00]
-; HASWELL-NEXT: vcvtsd2si (%rdi), %eax # sched: [4:1.00]
+; HASWELL-NEXT: vcvtsd2si (%rdi), %eax # sched: [9:1.00]
; HASWELL-NEXT: addl %ecx, %eax # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_cvtsd2si:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_cvtsd2siq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vcvtsd2si %xmm0, %rcx # sched: [4:1.00]
-; HASWELL-NEXT: vcvtsd2si (%rdi), %rax # sched: [4:1.00]
+; HASWELL-NEXT: vcvtsd2si (%rdi), %rax # sched: [9:1.00]
; HASWELL-NEXT: addq %rcx, %rax # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_cvtsd2siq:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_cvtsd2ss:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vcvtsd2ss %xmm0, %xmm0, %xmm0 # sched: [4:1.00]
-; HASWELL-NEXT: vmovsd {{.*#+}} xmm1 = mem[0],zero sched: [1:0.50]
+; HASWELL-NEXT: vmovsd {{.*#+}} xmm1 = mem[0],zero sched: [5:0.50]
; HASWELL-NEXT: vcvtsd2ss %xmm1, %xmm1, %xmm1 # sched: [4:1.00]
; HASWELL-NEXT: vaddss %xmm1, %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_cvtsd2ss:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_cvtsi2sd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vcvtsi2sdl %edi, %xmm0, %xmm0 # sched: [4:1.00]
-; HASWELL-NEXT: vcvtsi2sdl (%rsi), %xmm1, %xmm1 # sched: [8:1.00]
+; HASWELL-NEXT: vcvtsi2sdl (%rsi), %xmm1, %xmm1 # sched: [9:1.00]
; HASWELL-NEXT: vaddsd %xmm1, %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_cvtsi2sd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_cvtsi2sdq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vcvtsi2sdq %rdi, %xmm0, %xmm0 # sched: [4:1.00]
-; HASWELL-NEXT: vcvtsi2sdq (%rsi), %xmm1, %xmm1 # sched: [8:1.00]
+; HASWELL-NEXT: vcvtsi2sdq (%rsi), %xmm1, %xmm1 # sched: [9:1.00]
; HASWELL-NEXT: vaddsd %xmm1, %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_cvtsi2sdq:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_cvtss2sd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vcvtss2sd %xmm0, %xmm0, %xmm0 # sched: [2:1.00]
-; HASWELL-NEXT: vmovss {{.*#+}} xmm1 = mem[0],zero,zero,zero sched: [1:0.50]
+; HASWELL-NEXT: vmovss {{.*#+}} xmm1 = mem[0],zero,zero,zero sched: [5:0.50]
; HASWELL-NEXT: vcvtss2sd %xmm1, %xmm1, %xmm1 # sched: [2:1.00]
; HASWELL-NEXT: vaddsd %xmm1, %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_cvtss2sd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_cvttpd2dq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vcvttpd2dq %xmm0, %xmm0 # sched: [4:1.00]
-; HASWELL-NEXT: vcvttpd2dqx (%rdi), %xmm1 # sched: [7:1.00]
+; HASWELL-NEXT: vcvttpd2dqx (%rdi), %xmm1 # sched: [8:1.00]
; HASWELL-NEXT: vpaddd %xmm1, %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_cvttpd2dq:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_cvttps2dq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vcvttps2dq %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: vcvttps2dq (%rdi), %xmm1 # sched: [3:1.00]
+; HASWELL-NEXT: vcvttps2dq (%rdi), %xmm1 # sched: [9:1.00]
; HASWELL-NEXT: vpaddd %xmm1, %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_cvttps2dq:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_cvttsd2si:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vcvttsd2si %xmm0, %ecx # sched: [4:1.00]
-; HASWELL-NEXT: vcvttsd2si (%rdi), %eax # sched: [4:1.00]
+; HASWELL-NEXT: vcvttsd2si (%rdi), %eax # sched: [9:1.00]
; HASWELL-NEXT: addl %ecx, %eax # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_cvttsd2si:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_cvttsd2siq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vcvttsd2si %xmm0, %rcx # sched: [4:1.00]
-; HASWELL-NEXT: vcvttsd2si (%rdi), %rax # sched: [4:1.00]
+; HASWELL-NEXT: vcvttsd2si (%rdi), %rax # sched: [9:1.00]
; HASWELL-NEXT: addq %rcx, %rax # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_cvttsd2siq:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_divpd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vdivpd %xmm1, %xmm0, %xmm0 # sched: [20:1.00]
-; HASWELL-NEXT: vdivpd (%rdi), %xmm0, %xmm0 # sched: [20:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vdivpd (%rdi), %xmm0, %xmm0 # sched: [26:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_divpd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_divsd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vdivsd %xmm1, %xmm0, %xmm0 # sched: [20:1.00]
-; HASWELL-NEXT: vdivsd (%rdi), %xmm0, %xmm0 # sched: [20:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vdivsd (%rdi), %xmm0, %xmm0 # sched: [25:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_divsd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_lfence:
; HASWELL: # %bb.0:
; HASWELL-NEXT: lfence # sched: [2:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_lfence:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_mfence:
; HASWELL: # %bb.0:
; HASWELL-NEXT: mfence # sched: [2:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_mfence:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_maskmovdqu:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vmaskmovdqu %xmm1, %xmm0 # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_maskmovdqu:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_maxpd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vmaxpd %xmm1, %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: vmaxpd (%rdi), %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vmaxpd (%rdi), %xmm0, %xmm0 # sched: [9:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_maxpd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_maxsd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vmaxsd %xmm1, %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: vmaxsd (%rdi), %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vmaxsd (%rdi), %xmm0, %xmm0 # sched: [8:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_maxsd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_minpd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vminpd %xmm1, %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: vminpd (%rdi), %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vminpd (%rdi), %xmm0, %xmm0 # sched: [9:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_minpd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_minsd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vminsd %xmm1, %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: vminsd (%rdi), %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vminsd (%rdi), %xmm0, %xmm0 # sched: [8:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_minsd:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_movapd:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: vmovapd (%rdi), %xmm0 # sched: [1:0.50]
+; HASWELL-NEXT: vmovapd (%rdi), %xmm0 # sched: [6:0.50]
; HASWELL-NEXT: vaddpd %xmm0, %xmm0, %xmm0 # sched: [3:1.00]
; HASWELL-NEXT: vmovapd %xmm0, (%rsi) # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_movapd:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_movdqa:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: vmovdqa (%rdi), %xmm0 # sched: [1:0.50]
+; HASWELL-NEXT: vmovdqa (%rdi), %xmm0 # sched: [6:0.50]
; HASWELL-NEXT: vpaddq %xmm0, %xmm0, %xmm0 # sched: [1:0.50]
; HASWELL-NEXT: vmovdqa %xmm0, (%rsi) # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_movdqa:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_movdqu:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: vmovdqu (%rdi), %xmm0 # sched: [1:0.50]
+; HASWELL-NEXT: vmovdqu (%rdi), %xmm0 # sched: [6:0.50]
; HASWELL-NEXT: vpaddq %xmm0, %xmm0, %xmm0 # sched: [1:0.50]
; HASWELL-NEXT: vmovdqu %xmm0, (%rsi) # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_movdqu:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_movd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vmovd %edi, %xmm1 # sched: [1:1.00]
-; HASWELL-NEXT: vmovd {{.*#+}} xmm2 = mem[0],zero,zero,zero sched: [1:0.50]
+; HASWELL-NEXT: vmovd {{.*#+}} xmm2 = mem[0],zero,zero,zero sched: [5:0.50]
; HASWELL-NEXT: vpaddd %xmm1, %xmm0, %xmm1 # sched: [1:0.50]
; HASWELL-NEXT: vpaddd %xmm2, %xmm0, %xmm0 # sched: [1:0.50]
; HASWELL-NEXT: vmovd %xmm0, %eax # sched: [1:1.00]
; HASWELL-NEXT: vmovd %xmm1, (%rsi) # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_movd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_movd_64:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vmovq %rdi, %xmm1 # sched: [1:1.00]
-; HASWELL-NEXT: vmovq {{.*#+}} xmm2 = mem[0],zero sched: [1:0.50]
+; HASWELL-NEXT: vmovq {{.*#+}} xmm2 = mem[0],zero sched: [5:0.50]
; HASWELL-NEXT: vpaddq %xmm1, %xmm0, %xmm1 # sched: [1:0.50]
; HASWELL-NEXT: vpaddq %xmm2, %xmm0, %xmm0 # sched: [1:0.50]
; HASWELL-NEXT: vmovq %xmm0, %rax # sched: [1:1.00]
; HASWELL-NEXT: vmovq %xmm1, (%rsi) # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_movd_64:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_movhpd:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: vmovhpd {{.*#+}} xmm1 = xmm1[0],mem[0] sched: [1:1.00]
+; HASWELL-NEXT: vmovhpd {{.*#+}} xmm1 = xmm1[0],mem[0] sched: [6:1.00]
; HASWELL-NEXT: vaddpd %xmm1, %xmm0, %xmm0 # sched: [3:1.00]
; HASWELL-NEXT: vmovhpd %xmm0, (%rdi) # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_movhpd:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_movlpd:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: vmovlpd {{.*#+}} xmm1 = mem[0],xmm1[1] sched: [1:1.00]
+; HASWELL-NEXT: vmovlpd {{.*#+}} xmm1 = mem[0],xmm1[1] sched: [6:1.00]
; HASWELL-NEXT: vaddpd %xmm1, %xmm0, %xmm0 # sched: [3:1.00]
; HASWELL-NEXT: vmovlpd %xmm0, (%rdi) # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_movlpd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_movmskpd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vmovmskpd %xmm0, %eax # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_movmskpd:
; BROADWELL: # %bb.0:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpaddq %xmm0, %xmm0, %xmm0 # sched: [1:0.50]
; HASWELL-NEXT: vmovntdq %xmm0, (%rdi) # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_movntdqa:
; BROADWELL: # %bb.0:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vaddpd %xmm0, %xmm0, %xmm0 # sched: [3:1.00]
; HASWELL-NEXT: vmovntpd %xmm0, (%rdi) # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_movntpd:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_movq_mem:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: vmovq {{.*#+}} xmm1 = mem[0],zero sched: [1:0.50]
+; HASWELL-NEXT: vmovq {{.*#+}} xmm1 = mem[0],zero sched: [5:0.50]
; HASWELL-NEXT: vpaddq %xmm1, %xmm0, %xmm0 # sched: [1:0.50]
; HASWELL-NEXT: vmovq %xmm0, (%rdi) # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_movq_mem:
; BROADWELL: # %bb.0:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vmovq {{.*#+}} xmm0 = xmm0[0],zero sched: [1:0.33]
; HASWELL-NEXT: vpaddq %xmm0, %xmm1, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_movq_reg:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_movsd_mem:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: vmovsd {{.*#+}} xmm0 = mem[0],zero sched: [1:0.50]
+; HASWELL-NEXT: vmovsd {{.*#+}} xmm0 = mem[0],zero sched: [5:0.50]
; HASWELL-NEXT: vaddsd %xmm0, %xmm0, %xmm0 # sched: [3:1.00]
; HASWELL-NEXT: vmovsd %xmm0, (%rsi) # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_movsd_mem:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_movsd_reg:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vmovlhps {{.*#+}} xmm0 = xmm1[0],xmm0[0] sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_movsd_reg:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_movupd:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: vmovupd (%rdi), %xmm0 # sched: [1:0.50]
+; HASWELL-NEXT: vmovupd (%rdi), %xmm0 # sched: [6:0.50]
; HASWELL-NEXT: vaddpd %xmm0, %xmm0, %xmm0 # sched: [3:1.00]
; HASWELL-NEXT: vmovupd %xmm0, (%rsi) # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_movupd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_mulpd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vmulpd %xmm1, %xmm0, %xmm0 # sched: [5:0.50]
-; HASWELL-NEXT: vmulpd (%rdi), %xmm0, %xmm0 # sched: [5:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vmulpd (%rdi), %xmm0, %xmm0 # sched: [11:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_mulpd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_mulsd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vmulsd %xmm1, %xmm0, %xmm0 # sched: [5:0.50]
-; HASWELL-NEXT: vmulsd (%rdi), %xmm0, %xmm0 # sched: [5:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vmulsd (%rdi), %xmm0, %xmm0 # sched: [10:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_mulsd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_orpd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vorpd %xmm1, %xmm0, %xmm0 # sched: [1:1.00]
-; HASWELL-NEXT: vorpd (%rdi), %xmm0, %xmm0 # sched: [1:1.00]
+; HASWELL-NEXT: vorpd (%rdi), %xmm0, %xmm0 # sched: [7:1.00]
; HASWELL-NEXT: vaddpd %xmm0, %xmm1, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_orpd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_packssdw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpackssdw %xmm1, %xmm0, %xmm0 # sched: [1:1.00]
-; HASWELL-NEXT: vpackssdw (%rdi), %xmm0, %xmm0 # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpackssdw (%rdi), %xmm0, %xmm0 # sched: [7:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_packssdw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_packsswb:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpacksswb %xmm1, %xmm0, %xmm0 # sched: [1:1.00]
-; HASWELL-NEXT: vpacksswb (%rdi), %xmm0, %xmm0 # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpacksswb (%rdi), %xmm0, %xmm0 # sched: [7:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_packsswb:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_packuswb:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpackuswb %xmm1, %xmm0, %xmm0 # sched: [1:1.00]
-; HASWELL-NEXT: vpackuswb (%rdi), %xmm0, %xmm0 # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpackuswb (%rdi), %xmm0, %xmm0 # sched: [7:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_packuswb:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_paddb:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpaddb %xmm1, %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpaddb (%rdi), %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpaddb (%rdi), %xmm0, %xmm0 # sched: [7:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_paddb:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_paddd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpaddd %xmm1, %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpaddd (%rdi), %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpaddd (%rdi), %xmm0, %xmm0 # sched: [7:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_paddd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_paddq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpaddq %xmm1, %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpaddq (%rdi), %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpaddq (%rdi), %xmm0, %xmm0 # sched: [7:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_paddq:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_paddsb:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpaddsb %xmm1, %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpaddsb (%rdi), %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpaddsb (%rdi), %xmm0, %xmm0 # sched: [7:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_paddsb:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_paddsw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpaddsw %xmm1, %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpaddsw (%rdi), %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpaddsw (%rdi), %xmm0, %xmm0 # sched: [7:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_paddsw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_paddusb:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpaddusb %xmm1, %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpaddusb (%rdi), %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpaddusb (%rdi), %xmm0, %xmm0 # sched: [7:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_paddusb:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_paddusw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpaddusw %xmm1, %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpaddusw (%rdi), %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpaddusw (%rdi), %xmm0, %xmm0 # sched: [7:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_paddusw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_paddw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpaddw %xmm1, %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpaddw (%rdi), %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpaddw (%rdi), %xmm0, %xmm0 # sched: [7:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_paddw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pand:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpand %xmm1, %xmm0, %xmm0 # sched: [1:0.33]
-; HASWELL-NEXT: vpand (%rdi), %xmm0, %xmm0 # sched: [1:0.50]
+; HASWELL-NEXT: vpand (%rdi), %xmm0, %xmm0 # sched: [7:0.50]
; HASWELL-NEXT: vpaddq %xmm1, %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pand:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pandn:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpandn %xmm1, %xmm0, %xmm0 # sched: [1:0.33]
-; HASWELL-NEXT: vpandn (%rdi), %xmm0, %xmm1 # sched: [1:0.50]
+; HASWELL-NEXT: vpandn (%rdi), %xmm0, %xmm1 # sched: [7:0.50]
; HASWELL-NEXT: vpaddq %xmm1, %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pandn:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pavgb:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpavgb %xmm1, %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpavgb (%rdi), %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpavgb (%rdi), %xmm0, %xmm0 # sched: [7:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pavgb:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pavgw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpavgw %xmm1, %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpavgw (%rdi), %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpavgw (%rdi), %xmm0, %xmm0 # sched: [7:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pavgw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pcmpeqb:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpcmpeqb %xmm1, %xmm0, %xmm1 # sched: [1:0.50]
-; HASWELL-NEXT: vpcmpeqb (%rdi), %xmm0, %xmm0 # sched: [1:0.50]
+; HASWELL-NEXT: vpcmpeqb (%rdi), %xmm0, %xmm0 # sched: [7:0.50]
; HASWELL-NEXT: vpor %xmm0, %xmm1, %xmm0 # sched: [1:0.33]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pcmpeqb:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pcmpeqd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpcmpeqd %xmm1, %xmm0, %xmm1 # sched: [1:0.50]
-; HASWELL-NEXT: vpcmpeqd (%rdi), %xmm0, %xmm0 # sched: [1:0.50]
+; HASWELL-NEXT: vpcmpeqd (%rdi), %xmm0, %xmm0 # sched: [7:0.50]
; HASWELL-NEXT: vpor %xmm0, %xmm1, %xmm0 # sched: [1:0.33]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pcmpeqd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pcmpeqw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpcmpeqw %xmm1, %xmm0, %xmm1 # sched: [1:0.50]
-; HASWELL-NEXT: vpcmpeqw (%rdi), %xmm0, %xmm0 # sched: [1:0.50]
+; HASWELL-NEXT: vpcmpeqw (%rdi), %xmm0, %xmm0 # sched: [7:0.50]
; HASWELL-NEXT: vpor %xmm0, %xmm1, %xmm0 # sched: [1:0.33]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pcmpeqw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pcmpgtb:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpcmpgtb %xmm1, %xmm0, %xmm1 # sched: [1:0.50]
-; HASWELL-NEXT: vpcmpgtb (%rdi), %xmm0, %xmm0 # sched: [1:0.50]
+; HASWELL-NEXT: vpcmpgtb (%rdi), %xmm0, %xmm0 # sched: [7:0.50]
; HASWELL-NEXT: vpor %xmm0, %xmm1, %xmm0 # sched: [1:0.33]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pcmpgtb:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pcmpgtd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpcmpgtd %xmm1, %xmm0, %xmm1 # sched: [1:0.50]
-; HASWELL-NEXT: vpcmpeqd (%rdi), %xmm0, %xmm0 # sched: [1:0.50]
+; HASWELL-NEXT: vpcmpeqd (%rdi), %xmm0, %xmm0 # sched: [7:0.50]
; HASWELL-NEXT: vpor %xmm0, %xmm1, %xmm0 # sched: [1:0.33]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pcmpgtd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pcmpgtw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpcmpgtw %xmm1, %xmm0, %xmm1 # sched: [1:0.50]
-; HASWELL-NEXT: vpcmpgtw (%rdi), %xmm0, %xmm0 # sched: [1:0.50]
+; HASWELL-NEXT: vpcmpgtw (%rdi), %xmm0, %xmm0 # sched: [7:0.50]
; HASWELL-NEXT: vpor %xmm0, %xmm1, %xmm0 # sched: [1:0.33]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pcmpgtw:
; BROADWELL: # %bb.0:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpextrw $6, %xmm0, %eax # sched: [2:1.00]
; HASWELL-NEXT: # kill: def %ax killed %ax killed %eax
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pextrw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pinsrw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpinsrw $1, %edi, %xmm0, %xmm0 # sched: [2:2.00]
-; HASWELL-NEXT: vpinsrw $3, (%rsi), %xmm0, %xmm0 # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpinsrw $3, (%rsi), %xmm0, %xmm0 # sched: [6:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pinsrw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pmaddwd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpmaddwd %xmm1, %xmm0, %xmm0 # sched: [5:1.00]
-; HASWELL-NEXT: vpmaddwd (%rdi), %xmm0, %xmm0 # sched: [5:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpmaddwd (%rdi), %xmm0, %xmm0 # sched: [11:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmaddwd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pmaxsw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpmaxsw %xmm1, %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpmaxsw (%rdi), %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpmaxsw (%rdi), %xmm0, %xmm0 # sched: [7:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmaxsw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pmaxub:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpmaxub %xmm1, %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpmaxub (%rdi), %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpmaxub (%rdi), %xmm0, %xmm0 # sched: [7:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmaxub:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pminsw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpminsw %xmm1, %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpminsw (%rdi), %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpminsw (%rdi), %xmm0, %xmm0 # sched: [7:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pminsw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pminub:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpminub %xmm1, %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpminub (%rdi), %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpminub (%rdi), %xmm0, %xmm0 # sched: [7:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pminub:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pmovmskb:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpmovmskb %xmm0, %eax # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmovmskb:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pmulhuw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpmulhuw %xmm1, %xmm0, %xmm0 # sched: [5:1.00]
-; HASWELL-NEXT: vpmulhuw (%rdi), %xmm0, %xmm0 # sched: [5:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpmulhuw (%rdi), %xmm0, %xmm0 # sched: [11:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmulhuw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pmulhw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpmulhw %xmm1, %xmm0, %xmm0 # sched: [5:1.00]
-; HASWELL-NEXT: vpmulhw (%rdi), %xmm0, %xmm0 # sched: [5:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpmulhw (%rdi), %xmm0, %xmm0 # sched: [11:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmulhw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pmullw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpmullw %xmm1, %xmm0, %xmm0 # sched: [5:1.00]
-; HASWELL-NEXT: vpmullw (%rdi), %xmm0, %xmm0 # sched: [5:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpmullw (%rdi), %xmm0, %xmm0 # sched: [11:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmullw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pmuludq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpmuludq %xmm1, %xmm0, %xmm0 # sched: [5:1.00]
-; HASWELL-NEXT: vpmuludq (%rdi), %xmm0, %xmm0 # sched: [5:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpmuludq (%rdi), %xmm0, %xmm0 # sched: [11:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmuludq:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_por:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpor %xmm1, %xmm0, %xmm0 # sched: [1:0.33]
-; HASWELL-NEXT: vpor (%rdi), %xmm0, %xmm0 # sched: [1:0.50]
+; HASWELL-NEXT: vpor (%rdi), %xmm0, %xmm0 # sched: [7:0.50]
; HASWELL-NEXT: vpaddq %xmm1, %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_por:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_psadbw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpsadbw %xmm1, %xmm0, %xmm0 # sched: [5:1.00]
-; HASWELL-NEXT: vpsadbw (%rdi), %xmm0, %xmm0 # sched: [5:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpsadbw (%rdi), %xmm0, %xmm0 # sched: [11:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_psadbw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pshufd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpshufd {{.*#+}} xmm0 = xmm0[1,0,3,2] sched: [1:1.00]
-; HASWELL-NEXT: vpshufd {{.*#+}} xmm1 = mem[3,2,1,0] sched: [1:1.00]
+; HASWELL-NEXT: vpshufd {{.*#+}} xmm1 = mem[3,2,1,0] sched: [7:1.00]
; HASWELL-NEXT: vpaddd %xmm1, %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pshufd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pshufhw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpshufhw {{.*#+}} xmm0 = xmm0[0,1,2,3,5,4,7,6] sched: [1:1.00]
-; HASWELL-NEXT: vpshufhw {{.*#+}} xmm1 = mem[0,1,2,3,7,6,5,4] sched: [1:1.00]
+; HASWELL-NEXT: vpshufhw {{.*#+}} xmm1 = mem[0,1,2,3,7,6,5,4] sched: [7:1.00]
; HASWELL-NEXT: vpaddw %xmm1, %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pshufhw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pshuflw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpshuflw {{.*#+}} xmm0 = xmm0[1,0,3,2,4,5,6,7] sched: [1:1.00]
-; HASWELL-NEXT: vpshuflw {{.*#+}} xmm1 = mem[3,2,1,0,4,5,6,7] sched: [1:1.00]
+; HASWELL-NEXT: vpshuflw {{.*#+}} xmm1 = mem[3,2,1,0,4,5,6,7] sched: [7:1.00]
; HASWELL-NEXT: vpaddw %xmm1, %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pshuflw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pslld:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpslld %xmm1, %xmm0, %xmm0 # sched: [2:1.00]
-; HASWELL-NEXT: vpslld (%rdi), %xmm0, %xmm0 # sched: [2:1.00]
+; HASWELL-NEXT: vpslld (%rdi), %xmm0, %xmm0 # sched: [8:1.00]
; HASWELL-NEXT: vpslld $2, %xmm0, %xmm0 # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pslld:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pslldq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpslldq {{.*#+}} xmm0 = zero,zero,zero,zero,xmm0[0,1,2,3,4,5,6,7,8,9,10,11] sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pslldq:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_psllq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpsllq %xmm1, %xmm0, %xmm0 # sched: [2:1.00]
-; HASWELL-NEXT: vpsllq (%rdi), %xmm0, %xmm0 # sched: [2:1.00]
+; HASWELL-NEXT: vpsllq (%rdi), %xmm0, %xmm0 # sched: [8:1.00]
; HASWELL-NEXT: vpsllq $2, %xmm0, %xmm0 # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_psllq:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_psllw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpsllw %xmm1, %xmm0, %xmm0 # sched: [2:1.00]
-; HASWELL-NEXT: vpsllw (%rdi), %xmm0, %xmm0 # sched: [2:1.00]
+; HASWELL-NEXT: vpsllw (%rdi), %xmm0, %xmm0 # sched: [8:1.00]
; HASWELL-NEXT: vpsllw $2, %xmm0, %xmm0 # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_psllw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_psrad:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpsrad %xmm1, %xmm0, %xmm0 # sched: [2:1.00]
-; HASWELL-NEXT: vpsrad (%rdi), %xmm0, %xmm0 # sched: [2:1.00]
+; HASWELL-NEXT: vpsrad (%rdi), %xmm0, %xmm0 # sched: [8:1.00]
; HASWELL-NEXT: vpsrad $2, %xmm0, %xmm0 # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_psrad:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_psraw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpsraw %xmm1, %xmm0, %xmm0 # sched: [2:1.00]
-; HASWELL-NEXT: vpsraw (%rdi), %xmm0, %xmm0 # sched: [2:1.00]
+; HASWELL-NEXT: vpsraw (%rdi), %xmm0, %xmm0 # sched: [8:1.00]
; HASWELL-NEXT: vpsraw $2, %xmm0, %xmm0 # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_psraw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_psrld:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpsrld %xmm1, %xmm0, %xmm0 # sched: [2:1.00]
-; HASWELL-NEXT: vpsrld (%rdi), %xmm0, %xmm0 # sched: [2:1.00]
+; HASWELL-NEXT: vpsrld (%rdi), %xmm0, %xmm0 # sched: [8:1.00]
; HASWELL-NEXT: vpsrld $2, %xmm0, %xmm0 # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_psrld:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_psrldq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpsrldq {{.*#+}} xmm0 = xmm0[4,5,6,7,8,9,10,11,12,13,14,15],zero,zero,zero,zero sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_psrldq:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_psrlq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpsrlq %xmm1, %xmm0, %xmm0 # sched: [2:1.00]
-; HASWELL-NEXT: vpsrlq (%rdi), %xmm0, %xmm0 # sched: [2:1.00]
+; HASWELL-NEXT: vpsrlq (%rdi), %xmm0, %xmm0 # sched: [8:1.00]
; HASWELL-NEXT: vpsrlq $2, %xmm0, %xmm0 # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_psrlq:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_psrlw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpsrlw %xmm1, %xmm0, %xmm0 # sched: [2:1.00]
-; HASWELL-NEXT: vpsrlw (%rdi), %xmm0, %xmm0 # sched: [2:1.00]
+; HASWELL-NEXT: vpsrlw (%rdi), %xmm0, %xmm0 # sched: [8:1.00]
; HASWELL-NEXT: vpsrlw $2, %xmm0, %xmm0 # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_psrlw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_psubb:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpsubb %xmm1, %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpsubb (%rdi), %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpsubb (%rdi), %xmm0, %xmm0 # sched: [7:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_psubb:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_psubd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpsubd %xmm1, %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpsubd (%rdi), %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpsubd (%rdi), %xmm0, %xmm0 # sched: [7:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_psubd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_psubq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpsubq %xmm1, %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpsubq (%rdi), %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpsubq (%rdi), %xmm0, %xmm0 # sched: [7:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_psubq:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_psubsb:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpsubsb %xmm1, %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpsubsb (%rdi), %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpsubsb (%rdi), %xmm0, %xmm0 # sched: [7:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_psubsb:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_psubsw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpsubsw %xmm1, %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpsubsw (%rdi), %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpsubsw (%rdi), %xmm0, %xmm0 # sched: [7:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_psubsw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_psubusb:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpsubusb %xmm1, %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpsubusb (%rdi), %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpsubusb (%rdi), %xmm0, %xmm0 # sched: [7:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_psubusb:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_psubusw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpsubusw %xmm1, %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpsubusw (%rdi), %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpsubusw (%rdi), %xmm0, %xmm0 # sched: [7:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_psubusw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_psubw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpsubw %xmm1, %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpsubw (%rdi), %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpsubw (%rdi), %xmm0, %xmm0 # sched: [7:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_psubw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_punpckhbw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpunpckhbw {{.*#+}} xmm0 = xmm0[8],xmm1[8],xmm0[9],xmm1[9],xmm0[10],xmm1[10],xmm0[11],xmm1[11],xmm0[12],xmm1[12],xmm0[13],xmm1[13],xmm0[14],xmm1[14],xmm0[15],xmm1[15] sched: [1:1.00]
-; HASWELL-NEXT: vpunpckhbw {{.*#+}} xmm0 = xmm0[8],mem[8],xmm0[9],mem[9],xmm0[10],mem[10],xmm0[11],mem[11],xmm0[12],mem[12],xmm0[13],mem[13],xmm0[14],mem[14],xmm0[15],mem[15] sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpunpckhbw {{.*#+}} xmm0 = xmm0[8],mem[8],xmm0[9],mem[9],xmm0[10],mem[10],xmm0[11],mem[11],xmm0[12],mem[12],xmm0[13],mem[13],xmm0[14],mem[14],xmm0[15],mem[15] sched: [7:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_punpckhbw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_punpckhdq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpunpckhdq {{.*#+}} xmm0 = xmm0[2],xmm1[2],xmm0[3],xmm1[3] sched: [1:1.00]
-; HASWELL-NEXT: vpunpckhdq {{.*#+}} xmm1 = xmm1[2],mem[2],xmm1[3],mem[3] sched: [1:1.00]
+; HASWELL-NEXT: vpunpckhdq {{.*#+}} xmm1 = xmm1[2],mem[2],xmm1[3],mem[3] sched: [7:1.00]
; HASWELL-NEXT: vpaddd %xmm1, %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_punpckhdq:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_punpckhqdq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpunpckhqdq {{.*#+}} xmm0 = xmm0[1],xmm1[1] sched: [1:1.00]
-; HASWELL-NEXT: vpunpckhqdq {{.*#+}} xmm1 = xmm1[1],mem[1] sched: [1:1.00]
+; HASWELL-NEXT: vpunpckhqdq {{.*#+}} xmm1 = xmm1[1],mem[1] sched: [7:1.00]
; HASWELL-NEXT: vpaddq %xmm1, %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_punpckhqdq:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_punpckhwd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpunpckhwd {{.*#+}} xmm0 = xmm0[4],xmm1[4],xmm0[5],xmm1[5],xmm0[6],xmm1[6],xmm0[7],xmm1[7] sched: [1:1.00]
-; HASWELL-NEXT: vpunpckhwd {{.*#+}} xmm0 = xmm0[4],mem[4],xmm0[5],mem[5],xmm0[6],mem[6],xmm0[7],mem[7] sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpunpckhwd {{.*#+}} xmm0 = xmm0[4],mem[4],xmm0[5],mem[5],xmm0[6],mem[6],xmm0[7],mem[7] sched: [7:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_punpckhwd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_punpcklbw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpunpcklbw {{.*#+}} xmm0 = xmm0[0],xmm1[0],xmm0[1],xmm1[1],xmm0[2],xmm1[2],xmm0[3],xmm1[3],xmm0[4],xmm1[4],xmm0[5],xmm1[5],xmm0[6],xmm1[6],xmm0[7],xmm1[7] sched: [1:1.00]
-; HASWELL-NEXT: vpunpcklbw {{.*#+}} xmm0 = xmm0[0],mem[0],xmm0[1],mem[1],xmm0[2],mem[2],xmm0[3],mem[3],xmm0[4],mem[4],xmm0[5],mem[5],xmm0[6],mem[6],xmm0[7],mem[7] sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpunpcklbw {{.*#+}} xmm0 = xmm0[0],mem[0],xmm0[1],mem[1],xmm0[2],mem[2],xmm0[3],mem[3],xmm0[4],mem[4],xmm0[5],mem[5],xmm0[6],mem[6],xmm0[7],mem[7] sched: [7:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_punpcklbw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_punpckldq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpunpckldq {{.*#+}} xmm0 = xmm0[0],xmm1[0],xmm0[1],xmm1[1] sched: [1:1.00]
-; HASWELL-NEXT: vpunpckldq {{.*#+}} xmm1 = xmm1[0],mem[0],xmm1[1],mem[1] sched: [1:1.00]
+; HASWELL-NEXT: vpunpckldq {{.*#+}} xmm1 = xmm1[0],mem[0],xmm1[1],mem[1] sched: [7:1.00]
; HASWELL-NEXT: vpaddd %xmm1, %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_punpckldq:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_punpcklqdq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpunpcklqdq {{.*#+}} xmm0 = xmm0[0],xmm1[0] sched: [1:1.00]
-; HASWELL-NEXT: vpunpcklqdq {{.*#+}} xmm1 = xmm1[0],mem[0] sched: [1:1.00]
+; HASWELL-NEXT: vpunpcklqdq {{.*#+}} xmm1 = xmm1[0],mem[0] sched: [7:1.00]
; HASWELL-NEXT: vpaddq %xmm1, %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_punpcklqdq:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_punpcklwd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpunpcklwd {{.*#+}} xmm0 = xmm0[0],xmm1[0],xmm0[1],xmm1[1],xmm0[2],xmm1[2],xmm0[3],xmm1[3] sched: [1:1.00]
-; HASWELL-NEXT: vpunpcklwd {{.*#+}} xmm0 = xmm0[0],mem[0],xmm0[1],mem[1],xmm0[2],mem[2],xmm0[3],mem[3] sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpunpcklwd {{.*#+}} xmm0 = xmm0[0],mem[0],xmm0[1],mem[1],xmm0[2],mem[2],xmm0[3],mem[3] sched: [7:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_punpcklwd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pxor:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpxor %xmm1, %xmm0, %xmm0 # sched: [1:0.33]
-; HASWELL-NEXT: vpxor (%rdi), %xmm0, %xmm0 # sched: [1:0.50]
+; HASWELL-NEXT: vpxor (%rdi), %xmm0, %xmm0 # sched: [7:0.50]
; HASWELL-NEXT: vpaddq %xmm1, %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pxor:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_shufpd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vshufpd {{.*#+}} xmm0 = xmm0[1],xmm1[0] sched: [1:1.00]
-; HASWELL-NEXT: vshufpd {{.*#+}} xmm1 = xmm1[1],mem[0] sched: [1:1.00]
+; HASWELL-NEXT: vshufpd {{.*#+}} xmm1 = xmm1[1],mem[0] sched: [7:1.00]
; HASWELL-NEXT: vaddpd %xmm1, %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_shufpd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_sqrtpd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vsqrtpd %xmm0, %xmm0 # sched: [21:1.00]
-; HASWELL-NEXT: vsqrtpd (%rdi), %xmm1 # sched: [21:1.00]
+; HASWELL-NEXT: vsqrtpd (%rdi), %xmm1 # sched: [27:1.00]
; HASWELL-NEXT: vaddpd %xmm1, %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_sqrtpd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_sqrtsd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vsqrtsd %xmm0, %xmm0, %xmm0 # sched: [21:1.00]
-; HASWELL-NEXT: vmovapd (%rdi), %xmm1 # sched: [1:0.50]
+; HASWELL-NEXT: vmovapd (%rdi), %xmm1 # sched: [6:0.50]
; HASWELL-NEXT: vsqrtsd %xmm1, %xmm1, %xmm1 # sched: [21:1.00]
; HASWELL-NEXT: vaddpd %xmm1, %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_sqrtsd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_subpd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vsubpd %xmm1, %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: vsubpd (%rdi), %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vsubpd (%rdi), %xmm0, %xmm0 # sched: [9:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_subpd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_subsd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vsubsd %xmm1, %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: vsubsd (%rdi), %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vsubsd (%rdi), %xmm0, %xmm0 # sched: [8:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_subsd:
; BROADWELL: # %bb.0:
; HASWELL-NEXT: setnp %al # sched: [1:0.50]
; HASWELL-NEXT: sete %cl # sched: [1:0.50]
; HASWELL-NEXT: andb %al, %cl # sched: [1:0.25]
-; HASWELL-NEXT: vucomisd (%rdi), %xmm0 # sched: [7:1.00]
+; HASWELL-NEXT: vucomisd (%rdi), %xmm0 # sched: [8:1.00]
; HASWELL-NEXT: setnp %al # sched: [1:0.50]
; HASWELL-NEXT: sete %dl # sched: [1:0.50]
; HASWELL-NEXT: andb %al, %dl # sched: [1:0.25]
; HASWELL-NEXT: orb %cl, %dl # sched: [1:0.25]
; HASWELL-NEXT: movzbl %dl, %eax # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_ucomisd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_unpckhpd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vunpckhpd {{.*#+}} xmm0 = xmm0[1],xmm1[1] sched: [1:1.00]
-; HASWELL-NEXT: vunpckhpd {{.*#+}} xmm1 = xmm1[1],mem[1] sched: [1:1.00]
+; HASWELL-NEXT: vunpckhpd {{.*#+}} xmm1 = xmm1[1],mem[1] sched: [7:1.00]
; HASWELL-NEXT: vaddpd %xmm1, %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_unpckhpd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_unpcklpd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vunpcklpd {{.*#+}} xmm0 = xmm0[0],xmm1[0] sched: [1:1.00]
-; HASWELL-NEXT: vunpcklpd {{.*#+}} xmm1 = xmm0[0],mem[0] sched: [1:1.00]
+; HASWELL-NEXT: vunpcklpd {{.*#+}} xmm1 = xmm0[0],mem[0] sched: [7:1.00]
; HASWELL-NEXT: vaddpd %xmm1, %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_unpcklpd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_xorpd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vxorpd %xmm1, %xmm0, %xmm0 # sched: [1:1.00]
-; HASWELL-NEXT: vxorpd (%rdi), %xmm0, %xmm0 # sched: [1:1.00]
+; HASWELL-NEXT: vxorpd (%rdi), %xmm0, %xmm0 # sched: [7:1.00]
; HASWELL-NEXT: vaddpd %xmm0, %xmm1, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_xorpd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_addsubpd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vaddsubpd %xmm1, %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: vaddsubpd (%rdi), %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vaddsubpd (%rdi), %xmm0, %xmm0 # sched: [9:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_addsubpd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_addsubps:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vaddsubps %xmm1, %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: vaddsubps (%rdi), %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vaddsubps (%rdi), %xmm0, %xmm0 # sched: [9:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_addsubps:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_haddpd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vhaddpd %xmm1, %xmm0, %xmm0 # sched: [5:2.00]
-; HASWELL-NEXT: vhaddpd (%rdi), %xmm0, %xmm0 # sched: [5:2.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vhaddpd (%rdi), %xmm0, %xmm0 # sched: [11:2.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_haddpd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_haddps:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vhaddps %xmm1, %xmm0, %xmm0 # sched: [5:2.00]
-; HASWELL-NEXT: vhaddps (%rdi), %xmm0, %xmm0 # sched: [5:2.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vhaddps (%rdi), %xmm0, %xmm0 # sched: [11:2.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_haddps:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_hsubpd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vhsubpd %xmm1, %xmm0, %xmm0 # sched: [5:2.00]
-; HASWELL-NEXT: vhsubpd (%rdi), %xmm0, %xmm0 # sched: [5:2.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vhsubpd (%rdi), %xmm0, %xmm0 # sched: [11:2.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_hsubpd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_hsubps:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vhsubps %xmm1, %xmm0, %xmm0 # sched: [5:2.00]
-; HASWELL-NEXT: vhsubps (%rdi), %xmm0, %xmm0 # sched: [5:2.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vhsubps (%rdi), %xmm0, %xmm0 # sched: [11:2.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_hsubps:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_lddqu:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: vlddqu (%rdi), %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vlddqu (%rdi), %xmm0 # sched: [6:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_lddqu:
; BROADWELL: # %bb.0:
; HASWELL-NEXT: leaq (%rdi), %rax # sched: [1:0.50]
; HASWELL-NEXT: movl %esi, %ecx # sched: [1:0.25]
; HASWELL-NEXT: monitor # sched: [100:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_monitor:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_movddup:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vmovddup {{.*#+}} xmm0 = xmm0[0,0] sched: [1:1.00]
-; HASWELL-NEXT: vmovddup {{.*#+}} xmm1 = mem[0,0] sched: [1:0.50]
+; HASWELL-NEXT: vmovddup {{.*#+}} xmm1 = mem[0,0] sched: [5:0.50]
; HASWELL-NEXT: vsubpd %xmm0, %xmm1, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_movddup:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_movshdup:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vmovshdup {{.*#+}} xmm0 = xmm0[1,1,3,3] sched: [1:1.00]
-; HASWELL-NEXT: vmovshdup {{.*#+}} xmm1 = mem[1,1,3,3] sched: [1:0.50]
+; HASWELL-NEXT: vmovshdup {{.*#+}} xmm1 = mem[1,1,3,3] sched: [6:0.50]
; HASWELL-NEXT: vaddps %xmm1, %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_movshdup:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_movsldup:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vmovsldup {{.*#+}} xmm0 = xmm0[0,0,2,2] sched: [1:1.00]
-; HASWELL-NEXT: vmovsldup {{.*#+}} xmm1 = mem[0,0,2,2] sched: [1:0.50]
+; HASWELL-NEXT: vmovsldup {{.*#+}} xmm1 = mem[0,0,2,2] sched: [6:0.50]
; HASWELL-NEXT: vaddps %xmm1, %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_movsldup:
; BROADWELL: # %bb.0:
; HASWELL-NEXT: movl %edi, %ecx # sched: [1:0.25]
; HASWELL-NEXT: movl %esi, %eax # sched: [1:0.25]
; HASWELL-NEXT: mwait # sched: [20:2.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_mwait:
; BROADWELL: # %bb.0:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vblendpd {{.*#+}} xmm0 = xmm0[0],xmm1[1] sched: [1:0.33]
; HASWELL-NEXT: vaddpd %xmm0, %xmm1, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: vblendpd {{.*#+}} xmm0 = xmm0[0],mem[1] sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vblendpd {{.*#+}} xmm0 = xmm0[0],mem[1] sched: [7:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_blendpd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_blendps:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vblendps {{.*#+}} xmm0 = xmm0[0],xmm1[1,2],xmm0[3] sched: [1:0.33]
-; HASWELL-NEXT: vblendps {{.*#+}} xmm0 = xmm0[0],mem[1],xmm0[2,3] sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vblendps {{.*#+}} xmm0 = xmm0[0],mem[1],xmm0[2,3] sched: [7:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_blendps:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_blendvpd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vblendvpd %xmm2, %xmm1, %xmm0, %xmm0 # sched: [2:2.00]
-; HASWELL-NEXT: vblendvpd %xmm2, (%rdi), %xmm0, %xmm0 # sched: [2:2.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vblendvpd %xmm2, (%rdi), %xmm0, %xmm0 # sched: [8:2.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_blendvpd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_blendvps:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vblendvps %xmm2, %xmm1, %xmm0, %xmm0 # sched: [2:2.00]
-; HASWELL-NEXT: vblendvps %xmm2, (%rdi), %xmm0, %xmm0 # sched: [2:2.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vblendvps %xmm2, (%rdi), %xmm0, %xmm0 # sched: [8:2.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_blendvps:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_dppd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vdppd $7, %xmm1, %xmm0, %xmm0 # sched: [9:1.00]
-; HASWELL-NEXT: vdppd $7, (%rdi), %xmm0, %xmm0 # sched: [9:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vdppd $7, (%rdi), %xmm0, %xmm0 # sched: [15:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_dppd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_dpps:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vdpps $7, %xmm1, %xmm0, %xmm0 # sched: [14:2.00]
-; HASWELL-NEXT: vdpps $7, (%rdi), %xmm0, %xmm0 # sched: [14:2.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vdpps $7, (%rdi), %xmm0, %xmm0 # sched: [20:2.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_dpps:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_extractps:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vextractps $3, %xmm0, %eax # sched: [2:1.00]
-; HASWELL-NEXT: vextractps $1, %xmm0, (%rdi) # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vextractps $1, %xmm0, (%rdi) # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_extractps:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_insertps:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vinsertps {{.*#+}} xmm0 = zero,xmm1[0],xmm0[2,3] sched: [1:1.00]
-; HASWELL-NEXT: vinsertps {{.*#+}} xmm0 = xmm0[0,1,2],mem[0] sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vinsertps {{.*#+}} xmm0 = xmm0[0,1,2],mem[0] sched: [7:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_insertps:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_movntdqa:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: vmovntdqa (%rdi), %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vmovntdqa (%rdi), %xmm0 # sched: [6:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_movntdqa:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_mpsadbw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vmpsadbw $7, %xmm1, %xmm0, %xmm0 # sched: [7:2.00]
-; HASWELL-NEXT: vmpsadbw $7, (%rdi), %xmm0, %xmm0 # sched: [7:2.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vmpsadbw $7, (%rdi), %xmm0, %xmm0 # sched: [13:2.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_mpsadbw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_packusdw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpackusdw %xmm1, %xmm0, %xmm0 # sched: [1:1.00]
-; HASWELL-NEXT: vpackusdw (%rdi), %xmm0, %xmm0 # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpackusdw (%rdi), %xmm0, %xmm0 # sched: [7:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_packusdw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pblendvb:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpblendvb %xmm2, %xmm1, %xmm0, %xmm0 # sched: [2:2.00]
-; HASWELL-NEXT: vpblendvb %xmm2, (%rdi), %xmm0, %xmm0 # sched: [2:2.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpblendvb %xmm2, (%rdi), %xmm0, %xmm0 # sched: [8:2.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pblendvb:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pblendw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpblendw {{.*#+}} xmm0 = xmm0[0],xmm1[1],xmm0[2],xmm1[3],xmm0[4],xmm1[5],xmm0[6],xmm1[7] sched: [1:1.00]
-; HASWELL-NEXT: vpblendw {{.*#+}} xmm0 = xmm0[0,1],mem[2,3],xmm0[4,5,6],mem[7] sched: [4:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpblendw {{.*#+}} xmm0 = xmm0[0,1],mem[2,3],xmm0[4,5,6],mem[7] sched: [7:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pblendw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pcmpeqq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpcmpeqq %xmm1, %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpcmpeqq (%rdi), %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpcmpeqq (%rdi), %xmm0, %xmm0 # sched: [7:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pcmpeqq:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pextrb:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpextrb $3, %xmm0, %eax # sched: [2:1.00]
-; HASWELL-NEXT: vpextrb $1, %xmm0, (%rdi) # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpextrb $1, %xmm0, (%rdi) # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pextrb:
; BROADWELL: # %bb.0:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpaddd %xmm0, %xmm0, %xmm0 # sched: [1:0.50]
; HASWELL-NEXT: vpextrd $3, %xmm0, %eax # sched: [2:1.00]
-; HASWELL-NEXT: vpextrd $1, %xmm0, (%rdi) # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpextrd $1, %xmm0, (%rdi) # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pextrd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pextrq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpextrq $1, %xmm0, %rax # sched: [2:1.00]
-; HASWELL-NEXT: vpextrq $1, %xmm0, (%rdi) # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpextrq $1, %xmm0, (%rdi) # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pextrq:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pextrw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpextrw $3, %xmm0, %eax # sched: [2:1.00]
-; HASWELL-NEXT: vpextrw $1, %xmm0, (%rdi) # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpextrw $1, %xmm0, (%rdi) # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pextrw:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_phminposuw:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: vphminposuw (%rdi), %xmm0 # sched: [5:1.00]
+; HASWELL-NEXT: vphminposuw (%rdi), %xmm0 # sched: [11:1.00]
; HASWELL-NEXT: vphminposuw %xmm0, %xmm0 # sched: [5:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_phminposuw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pinsrb:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpinsrb $1, %edi, %xmm0, %xmm0 # sched: [2:2.00]
-; HASWELL-NEXT: vpinsrb $3, (%rsi), %xmm0, %xmm0 # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpinsrb $3, (%rsi), %xmm0, %xmm0 # sched: [6:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pinsrb:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pinsrd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpinsrd $1, %edi, %xmm0, %xmm0 # sched: [2:2.00]
-; HASWELL-NEXT: vpinsrd $3, (%rsi), %xmm0, %xmm0 # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpinsrd $3, (%rsi), %xmm0, %xmm0 # sched: [6:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pinsrd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pinsrq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpinsrq $1, %rdi, %xmm0, %xmm0 # sched: [2:2.00]
-; HASWELL-NEXT: vpinsrq $1, (%rsi), %xmm1, %xmm1 # sched: [1:1.00]
+; HASWELL-NEXT: vpinsrq $1, (%rsi), %xmm1, %xmm1 # sched: [6:1.00]
; HASWELL-NEXT: vpaddq %xmm1, %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pinsrq:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pmaxsb:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpmaxsb %xmm1, %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpmaxsb (%rdi), %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpmaxsb (%rdi), %xmm0, %xmm0 # sched: [7:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmaxsb:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pmaxsd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpmaxsd %xmm1, %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpmaxsd (%rdi), %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpmaxsd (%rdi), %xmm0, %xmm0 # sched: [7:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmaxsd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pmaxud:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpmaxud %xmm1, %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpmaxud (%rdi), %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpmaxud (%rdi), %xmm0, %xmm0 # sched: [7:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmaxud:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pmaxuw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpmaxuw %xmm1, %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpmaxuw (%rdi), %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpmaxuw (%rdi), %xmm0, %xmm0 # sched: [7:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmaxuw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pminsb:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpminsb %xmm1, %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpminsb (%rdi), %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpminsb (%rdi), %xmm0, %xmm0 # sched: [7:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pminsb:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pminsd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpminsd %xmm1, %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpminsd (%rdi), %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpminsd (%rdi), %xmm0, %xmm0 # sched: [7:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pminsd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pminud:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpminud %xmm1, %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpminud (%rdi), %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpminud (%rdi), %xmm0, %xmm0 # sched: [7:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pminud:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pminuw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpminuw %xmm1, %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpminuw (%rdi), %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpminuw (%rdi), %xmm0, %xmm0 # sched: [7:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pminuw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pmovsxbw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpmovsxbw %xmm0, %xmm0 # sched: [1:1.00]
-; HASWELL-NEXT: vpmovsxbw (%rdi), %xmm1 # sched: [1:1.00]
+; HASWELL-NEXT: vpmovsxbw (%rdi), %xmm1 # sched: [6:1.00]
; HASWELL-NEXT: vpaddw %xmm1, %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmovsxbw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pmovsxbd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpmovsxbd %xmm0, %xmm0 # sched: [1:1.00]
-; HASWELL-NEXT: vpmovsxbd (%rdi), %xmm1 # sched: [1:1.00]
+; HASWELL-NEXT: vpmovsxbd (%rdi), %xmm1 # sched: [6:1.00]
; HASWELL-NEXT: vpaddd %xmm1, %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmovsxbd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pmovsxbq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpmovsxbq %xmm0, %xmm0 # sched: [1:1.00]
-; HASWELL-NEXT: vpmovsxbq (%rdi), %xmm1 # sched: [1:1.00]
+; HASWELL-NEXT: vpmovsxbq (%rdi), %xmm1 # sched: [6:1.00]
; HASWELL-NEXT: vpaddq %xmm1, %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmovsxbq:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pmovsxdq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpmovsxdq %xmm0, %xmm0 # sched: [1:1.00]
-; HASWELL-NEXT: vpmovsxdq (%rdi), %xmm1 # sched: [1:1.00]
+; HASWELL-NEXT: vpmovsxdq (%rdi), %xmm1 # sched: [6:1.00]
; HASWELL-NEXT: vpaddq %xmm1, %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmovsxdq:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pmovsxwd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpmovsxwd %xmm0, %xmm0 # sched: [1:1.00]
-; HASWELL-NEXT: vpmovsxwd (%rdi), %xmm1 # sched: [1:1.00]
+; HASWELL-NEXT: vpmovsxwd (%rdi), %xmm1 # sched: [6:1.00]
; HASWELL-NEXT: vpaddd %xmm1, %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmovsxwd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pmovsxwq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpmovsxwq %xmm0, %xmm0 # sched: [1:1.00]
-; HASWELL-NEXT: vpmovsxwq (%rdi), %xmm1 # sched: [1:1.00]
+; HASWELL-NEXT: vpmovsxwq (%rdi), %xmm1 # sched: [6:1.00]
; HASWELL-NEXT: vpaddq %xmm1, %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmovsxwq:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pmovzxbw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpmovzxbw {{.*#+}} xmm0 = xmm0[0],zero,xmm0[1],zero,xmm0[2],zero,xmm0[3],zero,xmm0[4],zero,xmm0[5],zero,xmm0[6],zero,xmm0[7],zero sched: [1:1.00]
-; HASWELL-NEXT: vpmovzxbw {{.*#+}} xmm1 = mem[0],zero,mem[1],zero,mem[2],zero,mem[3],zero,mem[4],zero,mem[5],zero,mem[6],zero,mem[7],zero sched: [1:1.00]
+; HASWELL-NEXT: vpmovzxbw {{.*#+}} xmm1 = mem[0],zero,mem[1],zero,mem[2],zero,mem[3],zero,mem[4],zero,mem[5],zero,mem[6],zero,mem[7],zero sched: [6:1.00]
; HASWELL-NEXT: vpaddw %xmm1, %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmovzxbw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pmovzxbd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpmovzxbd {{.*#+}} xmm0 = xmm0[0],zero,zero,zero,xmm0[1],zero,zero,zero,xmm0[2],zero,zero,zero,xmm0[3],zero,zero,zero sched: [1:1.00]
-; HASWELL-NEXT: vpmovzxbd {{.*#+}} xmm1 = mem[0],zero,zero,zero,mem[1],zero,zero,zero,mem[2],zero,zero,zero,mem[3],zero,zero,zero sched: [1:1.00]
+; HASWELL-NEXT: vpmovzxbd {{.*#+}} xmm1 = mem[0],zero,zero,zero,mem[1],zero,zero,zero,mem[2],zero,zero,zero,mem[3],zero,zero,zero sched: [6:1.00]
; HASWELL-NEXT: vpaddd %xmm1, %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmovzxbd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pmovzxbq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpmovzxbq {{.*#+}} xmm0 = xmm0[0],zero,zero,zero,zero,zero,zero,zero,xmm0[1],zero,zero,zero,zero,zero,zero,zero sched: [1:1.00]
-; HASWELL-NEXT: vpmovzxbq {{.*#+}} xmm1 = mem[0],zero,zero,zero,zero,zero,zero,zero,mem[1],zero,zero,zero,zero,zero,zero,zero sched: [1:1.00]
+; HASWELL-NEXT: vpmovzxbq {{.*#+}} xmm1 = mem[0],zero,zero,zero,zero,zero,zero,zero,mem[1],zero,zero,zero,zero,zero,zero,zero sched: [6:1.00]
; HASWELL-NEXT: vpaddq %xmm1, %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmovzxbq:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pmovzxdq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpmovzxdq {{.*#+}} xmm0 = xmm0[0],zero,xmm0[1],zero sched: [1:1.00]
-; HASWELL-NEXT: vpmovzxdq {{.*#+}} xmm1 = mem[0],zero,mem[1],zero sched: [1:1.00]
+; HASWELL-NEXT: vpmovzxdq {{.*#+}} xmm1 = mem[0],zero,mem[1],zero sched: [6:1.00]
; HASWELL-NEXT: vpaddq %xmm1, %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmovzxdq:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pmovzxwd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpmovzxwd {{.*#+}} xmm0 = xmm0[0],zero,xmm0[1],zero,xmm0[2],zero,xmm0[3],zero sched: [1:1.00]
-; HASWELL-NEXT: vpmovzxwd {{.*#+}} xmm1 = mem[0],zero,mem[1],zero,mem[2],zero,mem[3],zero sched: [1:1.00]
+; HASWELL-NEXT: vpmovzxwd {{.*#+}} xmm1 = mem[0],zero,mem[1],zero,mem[2],zero,mem[3],zero sched: [6:1.00]
; HASWELL-NEXT: vpaddd %xmm1, %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmovzxwd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pmovzxwq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpmovzxwq {{.*#+}} xmm0 = xmm0[0],zero,zero,zero,xmm0[1],zero,zero,zero sched: [1:1.00]
-; HASWELL-NEXT: vpmovzxwq {{.*#+}} xmm1 = mem[0],zero,zero,zero,mem[1],zero,zero,zero sched: [1:1.00]
+; HASWELL-NEXT: vpmovzxwq {{.*#+}} xmm1 = mem[0],zero,zero,zero,mem[1],zero,zero,zero sched: [6:1.00]
; HASWELL-NEXT: vpaddq %xmm1, %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmovzxwq:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pmuldq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpmuldq %xmm1, %xmm0, %xmm0 # sched: [5:1.00]
-; HASWELL-NEXT: vpmuldq (%rdi), %xmm0, %xmm0 # sched: [5:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpmuldq (%rdi), %xmm0, %xmm0 # sched: [11:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmuldq:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pmulld:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpmulld %xmm1, %xmm0, %xmm0 # sched: [10:2.00]
-; HASWELL-NEXT: vpmulld (%rdi), %xmm0, %xmm0 # sched: [10:2.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpmulld (%rdi), %xmm0, %xmm0 # sched: [16:2.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmulld:
; BROADWELL: # %bb.0:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vptest %xmm1, %xmm0 # sched: [2:1.00]
; HASWELL-NEXT: setb %al # sched: [1:0.50]
-; HASWELL-NEXT: vptest (%rdi), %xmm0 # sched: [2:1.00]
+; HASWELL-NEXT: vptest (%rdi), %xmm0 # sched: [8:1.00]
; HASWELL-NEXT: setb %cl # sched: [1:0.50]
; HASWELL-NEXT: andb %al, %cl # sched: [1:0.25]
; HASWELL-NEXT: movzbl %cl, %eax # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_ptest:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_roundpd:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: vroundpd $7, %xmm0, %xmm0 # sched: [5:1.25]
-; HASWELL-NEXT: vroundpd $7, (%rdi), %xmm1 # sched: [6:2.00]
+; HASWELL-NEXT: vroundpd $7, %xmm0, %xmm0 # sched: [6:0.50]
+; HASWELL-NEXT: vroundpd $7, (%rdi), %xmm1 # sched: [12:2.00]
; HASWELL-NEXT: vaddpd %xmm1, %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_roundpd:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_roundps:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: vroundps $7, %xmm0, %xmm0 # sched: [5:1.25]
-; HASWELL-NEXT: vroundps $7, (%rdi), %xmm1 # sched: [6:2.00]
+; HASWELL-NEXT: vroundps $7, %xmm0, %xmm0 # sched: [6:0.50]
+; HASWELL-NEXT: vroundps $7, (%rdi), %xmm1 # sched: [12:2.00]
; HASWELL-NEXT: vaddps %xmm1, %xmm0, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_roundps:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_roundsd:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: vroundsd $7, %xmm1, %xmm0, %xmm1 # sched: [5:1.25]
-; HASWELL-NEXT: vroundsd $7, (%rdi), %xmm0, %xmm0 # sched: [6:2.00]
+; HASWELL-NEXT: vroundsd $7, %xmm1, %xmm0, %xmm1 # sched: [6:0.50]
+; HASWELL-NEXT: vroundsd $7, (%rdi), %xmm0, %xmm0 # sched: [12:2.00]
; HASWELL-NEXT: vaddpd %xmm0, %xmm1, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_roundsd:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_roundss:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: vroundss $7, %xmm1, %xmm0, %xmm1 # sched: [5:1.25]
-; HASWELL-NEXT: vroundss $7, (%rdi), %xmm0, %xmm0 # sched: [6:2.00]
+; HASWELL-NEXT: vroundss $7, %xmm1, %xmm0, %xmm1 # sched: [6:0.50]
+; HASWELL-NEXT: vroundss $7, (%rdi), %xmm0, %xmm0 # sched: [12:2.00]
; HASWELL-NEXT: vaddps %xmm0, %xmm1, %xmm0 # sched: [3:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_roundss:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: crc32_32_8:
; HASWELL: # %bb.0:
; HASWELL-NEXT: crc32b %sil, %edi # sched: [3:1.00]
-; HASWELL-NEXT: crc32b (%rdx), %edi # sched: [7:1.00]
+; HASWELL-NEXT: crc32b (%rdx), %edi # sched: [8:1.00]
; HASWELL-NEXT: movl %edi, %eax # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: crc32_32_8:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: crc32_32_16:
; HASWELL: # %bb.0:
; HASWELL-NEXT: crc32w %si, %edi # sched: [3:1.00]
-; HASWELL-NEXT: crc32w (%rdx), %edi # sched: [7:1.00]
+; HASWELL-NEXT: crc32w (%rdx), %edi # sched: [8:1.00]
; HASWELL-NEXT: movl %edi, %eax # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: crc32_32_16:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: crc32_32_32:
; HASWELL: # %bb.0:
; HASWELL-NEXT: crc32l %esi, %edi # sched: [3:1.00]
-; HASWELL-NEXT: crc32l (%rdx), %edi # sched: [7:1.00]
+; HASWELL-NEXT: crc32l (%rdx), %edi # sched: [8:1.00]
; HASWELL-NEXT: movl %edi, %eax # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: crc32_32_32:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: crc32_64_8:
; HASWELL: # %bb.0:
; HASWELL-NEXT: crc32b %sil, %edi # sched: [3:1.00]
-; HASWELL-NEXT: crc32b (%rdx), %edi # sched: [7:1.00]
+; HASWELL-NEXT: crc32b (%rdx), %edi # sched: [8:1.00]
; HASWELL-NEXT: movq %rdi, %rax # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: crc32_64_8:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: crc32_64_64:
; HASWELL: # %bb.0:
; HASWELL-NEXT: crc32q %rsi, %rdi # sched: [3:1.00]
-; HASWELL-NEXT: crc32q (%rdx), %rdi # sched: [7:1.00]
+; HASWELL-NEXT: crc32q (%rdx), %rdi # sched: [8:1.00]
; HASWELL-NEXT: movq %rdi, %rax # sched: [1:0.25]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: crc32_64_64:
; BROADWELL: # %bb.0:
; HASWELL-NEXT: movl %ecx, %esi # sched: [1:0.25]
; HASWELL-NEXT: movl $7, %eax # sched: [1:0.25]
; HASWELL-NEXT: movl $7, %edx # sched: [1:0.25]
-; HASWELL-NEXT: vpcmpestri $7, (%rdi), %xmm0 # sched: [18:4.00]
+; HASWELL-NEXT: vpcmpestri $7, (%rdi), %xmm0 # sched: [24:4.00]
; HASWELL-NEXT: # kill: def %ecx killed %ecx def %rcx
; HASWELL-NEXT: leal (%rcx,%rsi), %eax # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pcmpestri:
; BROADWELL: # %bb.0:
; HASWELL-NEXT: vpcmpestrm $7, %xmm1, %xmm0 # sched: [19:4.00]
; HASWELL-NEXT: movl $7, %eax # sched: [1:0.25]
; HASWELL-NEXT: movl $7, %edx # sched: [1:0.25]
-; HASWELL-NEXT: vpcmpestrm $7, (%rdi), %xmm0 # sched: [19:4.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpcmpestrm $7, (%rdi), %xmm0 # sched: [25:4.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pcmpestrm:
; BROADWELL: # %bb.0:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpcmpistri $7, %xmm1, %xmm0 # sched: [11:3.00]
; HASWELL-NEXT: movl %ecx, %eax # sched: [1:0.25]
-; HASWELL-NEXT: vpcmpistri $7, (%rdi), %xmm0 # sched: [11:3.00]
+; HASWELL-NEXT: vpcmpistri $7, (%rdi), %xmm0 # sched: [17:3.00]
; HASWELL-NEXT: # kill: def %ecx killed %ecx def %rcx
; HASWELL-NEXT: leal (%rcx,%rax), %eax # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pcmpistri:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pcmpistrm:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpcmpistrm $7, %xmm1, %xmm0 # sched: [11:3.00]
-; HASWELL-NEXT: vpcmpistrm $7, (%rdi), %xmm0 # sched: [11:3.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpcmpistrm $7, (%rdi), %xmm0 # sched: [17:3.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pcmpistrm:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pcmpgtq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpcmpgtq %xmm1, %xmm0, %xmm0 # sched: [5:1.00]
-; HASWELL-NEXT: vpcmpgtq (%rdi), %xmm0, %xmm0 # sched: [5:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpcmpgtq (%rdi), %xmm0, %xmm0 # sched: [11:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pcmpgtq:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pclmulqdq:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpclmulqdq $0, %xmm1, %xmm0, %xmm0 # sched: [11:2.00]
-; HASWELL-NEXT: vpclmulqdq $0, (%rdi), %xmm0, %xmm0 # sched: [11:2.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpclmulqdq $0, (%rdi), %xmm0, %xmm0 # sched: [17:2.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pclmulqdq:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pabsb:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpabsb %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpabsb (%rdi), %xmm1 # sched: [1:0.50]
+; HASWELL-NEXT: vpabsb (%rdi), %xmm1 # sched: [7:0.50]
; HASWELL-NEXT: vpor %xmm1, %xmm0, %xmm0 # sched: [1:0.33]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pabsb:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pabsd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpabsd %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpabsd (%rdi), %xmm1 # sched: [1:0.50]
+; HASWELL-NEXT: vpabsd (%rdi), %xmm1 # sched: [7:0.50]
; HASWELL-NEXT: vpor %xmm1, %xmm0, %xmm0 # sched: [1:0.33]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pabsd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pabsw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpabsw %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpabsw (%rdi), %xmm1 # sched: [1:0.50]
+; HASWELL-NEXT: vpabsw (%rdi), %xmm1 # sched: [7:0.50]
; HASWELL-NEXT: vpor %xmm1, %xmm0, %xmm0 # sched: [1:0.33]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pabsw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_palignr:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpalignr {{.*#+}} xmm0 = xmm0[6,7,8,9,10,11,12,13,14,15],xmm1[0,1,2,3,4,5] sched: [1:1.00]
-; HASWELL-NEXT: vpalignr {{.*#+}} xmm0 = mem[14,15],xmm0[0,1,2,3,4,5,6,7,8,9,10,11,12,13] sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpalignr {{.*#+}} xmm0 = mem[14,15],xmm0[0,1,2,3,4,5,6,7,8,9,10,11,12,13] sched: [7:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_palignr:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_phaddd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vphaddd %xmm1, %xmm0, %xmm0 # sched: [3:2.00]
-; HASWELL-NEXT: vphaddd (%rdi), %xmm0, %xmm0 # sched: [3:2.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vphaddd (%rdi), %xmm0, %xmm0 # sched: [9:2.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_phaddd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_phaddsw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vphaddsw %xmm1, %xmm0, %xmm0 # sched: [3:2.00]
-; HASWELL-NEXT: vphaddsw (%rdi), %xmm0, %xmm0 # sched: [3:2.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vphaddsw (%rdi), %xmm0, %xmm0 # sched: [9:2.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_phaddsw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_phaddw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vphaddw %xmm1, %xmm0, %xmm0 # sched: [3:2.00]
-; HASWELL-NEXT: vphaddw (%rdi), %xmm0, %xmm0 # sched: [3:2.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vphaddw (%rdi), %xmm0, %xmm0 # sched: [9:2.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_phaddw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_phsubd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vphsubd %xmm1, %xmm0, %xmm0 # sched: [3:2.00]
-; HASWELL-NEXT: vphsubd (%rdi), %xmm0, %xmm0 # sched: [3:2.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vphsubd (%rdi), %xmm0, %xmm0 # sched: [9:2.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_phsubd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_phsubsw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vphsubsw %xmm1, %xmm0, %xmm0 # sched: [3:2.00]
-; HASWELL-NEXT: vphsubsw (%rdi), %xmm0, %xmm0 # sched: [3:2.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vphsubsw (%rdi), %xmm0, %xmm0 # sched: [9:2.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_phsubsw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_phsubw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vphsubw %xmm1, %xmm0, %xmm0 # sched: [3:2.00]
-; HASWELL-NEXT: vphsubw (%rdi), %xmm0, %xmm0 # sched: [3:2.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vphsubw (%rdi), %xmm0, %xmm0 # sched: [9:2.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_phsubw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pmaddubsw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpmaddubsw %xmm1, %xmm0, %xmm0 # sched: [5:1.00]
-; HASWELL-NEXT: vpmaddubsw (%rdi), %xmm0, %xmm0 # sched: [5:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpmaddubsw (%rdi), %xmm0, %xmm0 # sched: [11:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmaddubsw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pmulhrsw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpmulhrsw %xmm1, %xmm0, %xmm0 # sched: [5:1.00]
-; HASWELL-NEXT: vpmulhrsw (%rdi), %xmm0, %xmm0 # sched: [5:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpmulhrsw (%rdi), %xmm0, %xmm0 # sched: [11:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pmulhrsw:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_pshufb:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpshufb %xmm1, %xmm0, %xmm0 # sched: [1:1.00]
-; HASWELL-NEXT: vpshufb (%rdi), %xmm0, %xmm0 # sched: [1:1.00]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpshufb (%rdi), %xmm0, %xmm0 # sched: [7:1.00]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_pshufb:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_psignb:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpsignb %xmm1, %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpsignb (%rdi), %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpsignb (%rdi), %xmm0, %xmm0 # sched: [7:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_psignb:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_psignd:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpsignd %xmm1, %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpsignd (%rdi), %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpsignd (%rdi), %xmm0, %xmm0 # sched: [7:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_psignd:
; BROADWELL: # %bb.0:
; HASWELL-LABEL: test_psignw:
; HASWELL: # %bb.0:
; HASWELL-NEXT: vpsignw %xmm1, %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: vpsignw (%rdi), %xmm0, %xmm0 # sched: [1:0.50]
-; HASWELL-NEXT: retq # sched: [2:1.00]
+; HASWELL-NEXT: vpsignw (%rdi), %xmm0, %xmm0 # sched: [7:0.50]
+; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_psignw:
; BROADWELL: # %bb.0:
; HASWELL-NEXT: #APP
; HASWELL-NEXT: f2xm1 # sched: [100:0.25]
; HASWELL-NEXT: #NO_APP
-; HASWELL-NEXT: retl # sched: [5:0.50]
+; HASWELL-NEXT: retl # sched: [7:1.00]
;
; BROADWELL-LABEL: test_f2xm1:
; BROADWELL: # %bb.0:
; HASWELL-NEXT: #APP
; HASWELL-NEXT: fabs # sched: [1:1.00]
; HASWELL-NEXT: #NO_APP
-; HASWELL-NEXT: retl # sched: [5:0.50]
+; HASWELL-NEXT: retl # sched: [7:1.00]
;
; BROADWELL-LABEL: test_fabs:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_fadd:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %eax # sched: [1:0.50]
-; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %ecx # sched: [1:0.50]
+; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %eax # sched: [5:0.50]
+; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %ecx # sched: [5:0.50]
; HASWELL-NEXT: #APP
; HASWELL-NEXT: fadd %st(0), %st(1) # sched: [3:1.00]
; HASWELL-NEXT: fadd %st(2) # sched: [3:1.00]
-; HASWELL-NEXT: fadds (%ecx) # sched: [3:1.00]
-; HASWELL-NEXT: faddl (%eax) # sched: [3:1.00]
+; HASWELL-NEXT: fadds (%ecx) # sched: [10:1.00]
+; HASWELL-NEXT: faddl (%eax) # sched: [10:1.00]
; HASWELL-NEXT: #NO_APP
-; HASWELL-NEXT: retl # sched: [5:0.50]
+; HASWELL-NEXT: retl # sched: [7:1.00]
;
; BROADWELL-LABEL: test_fadd:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_faddp_fiadd:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %eax # sched: [1:0.50]
-; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %ecx # sched: [1:0.50]
+; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %eax # sched: [5:0.50]
+; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %ecx # sched: [5:0.50]
; HASWELL-NEXT: #APP
; HASWELL-NEXT: faddp %st(1) # sched: [3:1.00]
; HASWELL-NEXT: faddp %st(2) # sched: [3:1.00]
-; HASWELL-NEXT: fiadds (%ecx) # sched: [6:2.00]
-; HASWELL-NEXT: fiaddl (%eax) # sched: [6:2.00]
+; HASWELL-NEXT: fiadds (%ecx) # sched: [13:2.00]
+; HASWELL-NEXT: fiaddl (%eax) # sched: [13:2.00]
; HASWELL-NEXT: #NO_APP
-; HASWELL-NEXT: retl # sched: [5:0.50]
+; HASWELL-NEXT: retl # sched: [7:1.00]
;
; BROADWELL-LABEL: test_faddp_fiadd:
; BROADWELL: # %bb.0:
; HASWELL-NEXT: #APP
; HASWELL-NEXT: fchs # sched: [1:1.00]
; HASWELL-NEXT: #NO_APP
-; HASWELL-NEXT: retl # sched: [5:0.50]
+; HASWELL-NEXT: retl # sched: [7:1.00]
;
; BROADWELL-LABEL: test_fchs:
; BROADWELL: # %bb.0:
; HASWELL-NEXT: fnclex # sched: [1:1.25]
; HASWELL-NEXT: fnclex # sched: [1:1.25]
; HASWELL-NEXT: #NO_APP
-; HASWELL-NEXT: retl # sched: [5:0.50]
+; HASWELL-NEXT: retl # sched: [7:1.00]
;
; BROADWELL-LABEL: test_fclex_fnclex:
; BROADWELL: # %bb.0:
; HASWELL-NEXT: fcmovnu %st(1), %st(0) # sched: [3:1.00]
; HASWELL-NEXT: fcmovu %st(1), %st(0) # sched: [3:1.00]
; HASWELL-NEXT: #NO_APP
-; HASWELL-NEXT: retl # sched: [5:0.50]
+; HASWELL-NEXT: retl # sched: [7:1.00]
;
; BROADWELL-LABEL: test_fcmov:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_fcom:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %eax # sched: [1:0.50]
-; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %ecx # sched: [1:0.50]
+; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %eax # sched: [5:0.50]
+; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %ecx # sched: [5:0.50]
; HASWELL-NEXT: #APP
; HASWELL-NEXT: fcom %st(1) # sched: [1:1.00]
; HASWELL-NEXT: fcom %st(3) # sched: [1:1.00]
-; HASWELL-NEXT: fcoms (%ecx) # sched: [1:1.00]
-; HASWELL-NEXT: fcoml (%eax) # sched: [1:1.00]
+; HASWELL-NEXT: fcoms (%ecx) # sched: [8:1.00]
+; HASWELL-NEXT: fcoml (%eax) # sched: [8:1.00]
; HASWELL-NEXT: #NO_APP
-; HASWELL-NEXT: retl # sched: [5:0.50]
+; HASWELL-NEXT: retl # sched: [7:1.00]
;
; BROADWELL-LABEL: test_fcom:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_fcomp_fcompp:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %eax # sched: [1:0.50]
-; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %ecx # sched: [1:0.50]
+; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %eax # sched: [5:0.50]
+; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %ecx # sched: [5:0.50]
; HASWELL-NEXT: #APP
; HASWELL-NEXT: fcomp %st(1) # sched: [1:1.00]
; HASWELL-NEXT: fcomp %st(3) # sched: [1:1.00]
-; HASWELL-NEXT: fcomps (%ecx) # sched: [1:1.00]
-; HASWELL-NEXT: fcompl (%eax) # sched: [1:1.00]
+; HASWELL-NEXT: fcomps (%ecx) # sched: [8:1.00]
+; HASWELL-NEXT: fcompl (%eax) # sched: [8:1.00]
; HASWELL-NEXT: fcompp # sched: [1:0.50]
; HASWELL-NEXT: #NO_APP
-; HASWELL-NEXT: retl # sched: [5:0.50]
+; HASWELL-NEXT: retl # sched: [7:1.00]
;
; BROADWELL-LABEL: test_fcomp_fcompp:
; BROADWELL: # %bb.0:
; HASWELL-NEXT: fcomi %st(3) # sched: [1:0.50]
; HASWELL-NEXT: fcompi %st(3) # sched: [1:0.50]
; HASWELL-NEXT: #NO_APP
-; HASWELL-NEXT: retl # sched: [5:0.50]
+; HASWELL-NEXT: retl # sched: [7:1.00]
;
; BROADWELL-LABEL: test_fcomi_fcomip:
; BROADWELL: # %bb.0:
; HASWELL-NEXT: #APP
; HASWELL-NEXT: fcos # sched: [100:0.25]
; HASWELL-NEXT: #NO_APP
-; HASWELL-NEXT: retl # sched: [5:0.50]
+; HASWELL-NEXT: retl # sched: [7:1.00]
;
; BROADWELL-LABEL: test_fcos:
; BROADWELL: # %bb.0:
; HASWELL-NEXT: #APP
; HASWELL-NEXT: fdecstp # sched: [2:1.00]
; HASWELL-NEXT: #NO_APP
-; HASWELL-NEXT: retl # sched: [5:0.50]
+; HASWELL-NEXT: retl # sched: [7:1.00]
;
; BROADWELL-LABEL: test_fdecstp:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_fdiv:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %eax # sched: [1:0.50]
-; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %ecx # sched: [1:0.50]
+; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %eax # sched: [5:0.50]
+; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %ecx # sched: [5:0.50]
; HASWELL-NEXT: #APP
; HASWELL-NEXT: fdiv %st(0), %st(1) # sched: [24:1.00]
; HASWELL-NEXT: fdiv %st(2) # sched: [20:1.00]
-; HASWELL-NEXT: fdivs (%ecx) # sched: [24:1.00]
-; HASWELL-NEXT: fdivl (%eax) # sched: [24:1.00]
+; HASWELL-NEXT: fdivs (%ecx) # sched: [31:1.00]
+; HASWELL-NEXT: fdivl (%eax) # sched: [31:1.00]
; HASWELL-NEXT: #NO_APP
-; HASWELL-NEXT: retl # sched: [5:0.50]
+; HASWELL-NEXT: retl # sched: [7:1.00]
;
; BROADWELL-LABEL: test_fdiv:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_fdivp_fidiv:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %eax # sched: [1:0.50]
-; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %ecx # sched: [1:0.50]
+; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %eax # sched: [5:0.50]
+; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %ecx # sched: [5:0.50]
; HASWELL-NEXT: #APP
; HASWELL-NEXT: fdivp %st(1) # sched: [24:1.00]
; HASWELL-NEXT: fdivp %st(2) # sched: [24:1.00]
-; HASWELL-NEXT: fidivs (%ecx) # sched: [27:1.00]
-; HASWELL-NEXT: fidivl (%eax) # sched: [27:1.00]
+; HASWELL-NEXT: fidivs (%ecx) # sched: [34:1.00]
+; HASWELL-NEXT: fidivl (%eax) # sched: [34:1.00]
; HASWELL-NEXT: #NO_APP
-; HASWELL-NEXT: retl # sched: [5:0.50]
+; HASWELL-NEXT: retl # sched: [7:1.00]
;
; BROADWELL-LABEL: test_fdivp_fidiv:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_fdivr:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %eax # sched: [1:0.50]
-; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %ecx # sched: [1:0.50]
+; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %eax # sched: [5:0.50]
+; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %ecx # sched: [5:0.50]
; HASWELL-NEXT: #APP
; HASWELL-NEXT: fdivr %st(0), %st(1) # sched: [20:1.00]
; HASWELL-NEXT: fdivr %st(2) # sched: [24:1.00]
-; HASWELL-NEXT: fdivrs (%ecx) # sched: [20:1.00]
-; HASWELL-NEXT: fdivrl (%eax) # sched: [20:1.00]
+; HASWELL-NEXT: fdivrs (%ecx) # sched: [27:1.00]
+; HASWELL-NEXT: fdivrl (%eax) # sched: [27:1.00]
; HASWELL-NEXT: #NO_APP
-; HASWELL-NEXT: retl # sched: [5:0.50]
+; HASWELL-NEXT: retl # sched: [7:1.00]
;
; BROADWELL-LABEL: test_fdivr:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_fdivrp_fidivr:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %eax # sched: [1:0.50]
-; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %ecx # sched: [1:0.50]
+; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %eax # sched: [5:0.50]
+; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %ecx # sched: [5:0.50]
; HASWELL-NEXT: #APP
; HASWELL-NEXT: fdivrp %st(1) # sched: [20:1.00]
; HASWELL-NEXT: fdivrp %st(2) # sched: [20:1.00]
-; HASWELL-NEXT: fidivrs (%ecx) # sched: [23:1.00]
-; HASWELL-NEXT: fidivrl (%eax) # sched: [23:1.00]
+; HASWELL-NEXT: fidivrs (%ecx) # sched: [30:1.00]
+; HASWELL-NEXT: fidivrl (%eax) # sched: [30:1.00]
; HASWELL-NEXT: #NO_APP
-; HASWELL-NEXT: retl # sched: [5:0.50]
+; HASWELL-NEXT: retl # sched: [7:1.00]
;
; BROADWELL-LABEL: test_fdivrp_fidivr:
; BROADWELL: # %bb.0:
; HASWELL-NEXT: #APP
; HASWELL-NEXT: ffree %st(0) # sched: [1:0.50]
; HASWELL-NEXT: #NO_APP
-; HASWELL-NEXT: retl # sched: [5:0.50]
+; HASWELL-NEXT: retl # sched: [7:1.00]
;
; BROADWELL-LABEL: test_ffree:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_ficom:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %eax # sched: [1:0.50]
-; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %ecx # sched: [1:0.50]
+; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %eax # sched: [5:0.50]
+; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %ecx # sched: [5:0.50]
; HASWELL-NEXT: #APP
-; HASWELL-NEXT: ficoms (%ecx) # sched: [4:2.00]
-; HASWELL-NEXT: ficoml (%eax) # sched: [4:2.00]
-; HASWELL-NEXT: ficomps (%ecx) # sched: [4:2.00]
-; HASWELL-NEXT: ficompl (%eax) # sched: [4:2.00]
+; HASWELL-NEXT: ficoms (%ecx) # sched: [11:2.00]
+; HASWELL-NEXT: ficoml (%eax) # sched: [11:2.00]
+; HASWELL-NEXT: ficomps (%ecx) # sched: [11:2.00]
+; HASWELL-NEXT: ficompl (%eax) # sched: [11:2.00]
; HASWELL-NEXT: #NO_APP
-; HASWELL-NEXT: retl # sched: [5:0.50]
+; HASWELL-NEXT: retl # sched: [7:1.00]
;
; BROADWELL-LABEL: test_ficom:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_fild:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %eax # sched: [1:0.50]
-; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %ecx # sched: [1:0.50]
-; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %edx # sched: [1:0.50]
+; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %eax # sched: [5:0.50]
+; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %ecx # sched: [5:0.50]
+; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %edx # sched: [5:0.50]
; HASWELL-NEXT: #APP
-; HASWELL-NEXT: filds (%edx) # sched: [3:1.00]
-; HASWELL-NEXT: fildl (%ecx) # sched: [3:1.00]
-; HASWELL-NEXT: fildll (%eax) # sched: [3:1.00]
+; HASWELL-NEXT: filds (%edx) # sched: [10:1.00]
+; HASWELL-NEXT: fildl (%ecx) # sched: [10:1.00]
+; HASWELL-NEXT: fildll (%eax) # sched: [10:1.00]
; HASWELL-NEXT: #NO_APP
-; HASWELL-NEXT: retl # sched: [5:0.50]
+; HASWELL-NEXT: retl # sched: [7:1.00]
;
; BROADWELL-LABEL: test_fild:
; BROADWELL: # %bb.0:
; HASWELL-NEXT: #APP
; HASWELL-NEXT: fincstp # sched: [1:0.50]
; HASWELL-NEXT: #NO_APP
-; HASWELL-NEXT: retl # sched: [5:0.50]
+; HASWELL-NEXT: retl # sched: [7:1.00]
;
; BROADWELL-LABEL: test_fincstp:
; BROADWELL: # %bb.0:
; HASWELL-NEXT: fninit # sched: [1:?]
; HASWELL-NEXT: fninit # sched: [1:?]
; HASWELL-NEXT: #NO_APP
-; HASWELL-NEXT: retl # sched: [5:0.50]
+; HASWELL-NEXT: retl # sched: [7:1.00]
;
; BROADWELL-LABEL: test_finit_fninit:
; BROADWELL: # %bb.0:
; HASWELL-NEXT: fldpi # sched: [1:0.50]
; HASWELL-NEXT: fldz # sched: [1:0.50]
; HASWELL-NEXT: #NO_APP
-; HASWELL-NEXT: retl # sched: [5:0.50]
+; HASWELL-NEXT: retl # sched: [7:1.00]
;
; BROADWELL-LABEL: test_fld1_fldl2e_fldl2t_fldlg2_fldln2_fldpi_fldz:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_fmul:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %eax # sched: [1:0.50]
-; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %ecx # sched: [1:0.50]
+; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %eax # sched: [5:0.50]
+; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %ecx # sched: [5:0.50]
; HASWELL-NEXT: #APP
; HASWELL-NEXT: fmul %st(0), %st(1) # sched: [5:1.00]
; HASWELL-NEXT: fmul %st(2) # sched: [5:1.00]
-; HASWELL-NEXT: fmuls (%ecx) # sched: [5:1.00]
-; HASWELL-NEXT: fmull (%eax) # sched: [5:1.00]
+; HASWELL-NEXT: fmuls (%ecx) # sched: [12:1.00]
+; HASWELL-NEXT: fmull (%eax) # sched: [12:1.00]
; HASWELL-NEXT: #NO_APP
-; HASWELL-NEXT: retl # sched: [5:0.50]
+; HASWELL-NEXT: retl # sched: [7:1.00]
;
; BROADWELL-LABEL: test_fmul:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_fmulp_fimul:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %eax # sched: [1:0.50]
-; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %ecx # sched: [1:0.50]
+; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %eax # sched: [5:0.50]
+; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %ecx # sched: [5:0.50]
; HASWELL-NEXT: #APP
; HASWELL-NEXT: fmulp %st(1) # sched: [5:1.00]
; HASWELL-NEXT: fmulp %st(2) # sched: [5:1.00]
-; HASWELL-NEXT: fimuls (%ecx) # sched: [8:1.00]
-; HASWELL-NEXT: fimull (%eax) # sched: [8:1.00]
+; HASWELL-NEXT: fimuls (%ecx) # sched: [15:1.00]
+; HASWELL-NEXT: fimull (%eax) # sched: [15:1.00]
; HASWELL-NEXT: #NO_APP
-; HASWELL-NEXT: retl # sched: [5:0.50]
+; HASWELL-NEXT: retl # sched: [7:1.00]
;
; BROADWELL-LABEL: test_fmulp_fimul:
; BROADWELL: # %bb.0:
; HASWELL-NEXT: #APP
; HASWELL-NEXT: fnop # sched: [1:0.50]
; HASWELL-NEXT: #NO_APP
-; HASWELL-NEXT: retl # sched: [5:0.50]
+; HASWELL-NEXT: retl # sched: [7:1.00]
;
; BROADWELL-LABEL: test_fnop:
; BROADWELL: # %bb.0:
; HASWELL-NEXT: #APP
; HASWELL-NEXT: fpatan # sched: [100:0.25]
; HASWELL-NEXT: #NO_APP
-; HASWELL-NEXT: retl # sched: [5:0.50]
+; HASWELL-NEXT: retl # sched: [7:1.00]
;
; BROADWELL-LABEL: test_fpatan:
; BROADWELL: # %bb.0:
; HASWELL-NEXT: fprem # sched: [19:?]
; HASWELL-NEXT: fprem1 # sched: [19:?]
; HASWELL-NEXT: #NO_APP
-; HASWELL-NEXT: retl # sched: [5:0.50]
+; HASWELL-NEXT: retl # sched: [7:1.00]
;
; BROADWELL-LABEL: test_fprem_fprem1:
; BROADWELL: # %bb.0:
; HASWELL-NEXT: #APP
; HASWELL-NEXT: fptan # sched: [100:0.25]
; HASWELL-NEXT: #NO_APP
-; HASWELL-NEXT: retl # sched: [5:0.50]
+; HASWELL-NEXT: retl # sched: [7:1.00]
;
; BROADWELL-LABEL: test_fptan:
; BROADWELL: # %bb.0:
; HASWELL-NEXT: #APP
; HASWELL-NEXT: frndint # sched: [11:?]
; HASWELL-NEXT: #NO_APP
-; HASWELL-NEXT: retl # sched: [5:0.50]
+; HASWELL-NEXT: retl # sched: [7:1.00]
;
; BROADWELL-LABEL: test_frndint:
; BROADWELL: # %bb.0:
; HASWELL-NEXT: #APP
; HASWELL-NEXT: fscale # sched: [75:?]
; HASWELL-NEXT: #NO_APP
-; HASWELL-NEXT: retl # sched: [5:0.50]
+; HASWELL-NEXT: retl # sched: [7:1.00]
;
; BROADWELL-LABEL: test_fscale:
; BROADWELL: # %bb.0:
; HASWELL-NEXT: #APP
; HASWELL-NEXT: fsin # sched: [100:0.25]
; HASWELL-NEXT: #NO_APP
-; HASWELL-NEXT: retl # sched: [5:0.50]
+; HASWELL-NEXT: retl # sched: [7:1.00]
;
; BROADWELL-LABEL: test_fsin:
; BROADWELL: # %bb.0:
; HASWELL-NEXT: #APP
; HASWELL-NEXT: fsincos # sched: [100:0.25]
; HASWELL-NEXT: #NO_APP
-; HASWELL-NEXT: retl # sched: [5:0.50]
+; HASWELL-NEXT: retl # sched: [7:1.00]
;
; BROADWELL-LABEL: test_fsincos:
; BROADWELL: # %bb.0:
; HASWELL-NEXT: #APP
; HASWELL-NEXT: fsqrt # sched: [15:1.00]
; HASWELL-NEXT: #NO_APP
-; HASWELL-NEXT: retl # sched: [5:0.50]
+; HASWELL-NEXT: retl # sched: [7:1.00]
;
; BROADWELL-LABEL: test_fsqrt:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_fsub:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %eax # sched: [1:0.50]
-; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %ecx # sched: [1:0.50]
+; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %eax # sched: [5:0.50]
+; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %ecx # sched: [5:0.50]
; HASWELL-NEXT: #APP
; HASWELL-NEXT: fsub %st(0), %st(1) # sched: [3:1.00]
; HASWELL-NEXT: fsub %st(2) # sched: [3:1.00]
-; HASWELL-NEXT: fsubs (%ecx) # sched: [3:1.00]
-; HASWELL-NEXT: fsubl (%eax) # sched: [3:1.00]
+; HASWELL-NEXT: fsubs (%ecx) # sched: [10:1.00]
+; HASWELL-NEXT: fsubl (%eax) # sched: [10:1.00]
; HASWELL-NEXT: #NO_APP
-; HASWELL-NEXT: retl # sched: [5:0.50]
+; HASWELL-NEXT: retl # sched: [7:1.00]
;
; BROADWELL-LABEL: test_fsub:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_fsubp_fisub:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %eax # sched: [1:0.50]
-; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %ecx # sched: [1:0.50]
+; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %eax # sched: [5:0.50]
+; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %ecx # sched: [5:0.50]
; HASWELL-NEXT: #APP
; HASWELL-NEXT: fsubp %st(1) # sched: [3:1.00]
; HASWELL-NEXT: fsubp %st(2) # sched: [3:1.00]
-; HASWELL-NEXT: fisubs (%ecx) # sched: [6:2.00]
-; HASWELL-NEXT: fisubl (%eax) # sched: [6:2.00]
+; HASWELL-NEXT: fisubs (%ecx) # sched: [13:2.00]
+; HASWELL-NEXT: fisubl (%eax) # sched: [13:2.00]
; HASWELL-NEXT: #NO_APP
-; HASWELL-NEXT: retl # sched: [5:0.50]
+; HASWELL-NEXT: retl # sched: [7:1.00]
;
; BROADWELL-LABEL: test_fsubp_fisub:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_fsubr:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %eax # sched: [1:0.50]
-; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %ecx # sched: [1:0.50]
+; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %eax # sched: [5:0.50]
+; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %ecx # sched: [5:0.50]
; HASWELL-NEXT: #APP
; HASWELL-NEXT: fsubr %st(0), %st(1) # sched: [3:1.00]
; HASWELL-NEXT: fsubr %st(2) # sched: [3:1.00]
-; HASWELL-NEXT: fsubrs (%ecx) # sched: [3:1.00]
-; HASWELL-NEXT: fsubrl (%eax) # sched: [3:1.00]
+; HASWELL-NEXT: fsubrs (%ecx) # sched: [10:1.00]
+; HASWELL-NEXT: fsubrl (%eax) # sched: [10:1.00]
; HASWELL-NEXT: #NO_APP
-; HASWELL-NEXT: retl # sched: [5:0.50]
+; HASWELL-NEXT: retl # sched: [7:1.00]
;
; BROADWELL-LABEL: test_fsubr:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_fsubrp_fisubr:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %eax # sched: [1:0.50]
-; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %ecx # sched: [1:0.50]
+; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %eax # sched: [5:0.50]
+; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %ecx # sched: [5:0.50]
; HASWELL-NEXT: #APP
; HASWELL-NEXT: fsubrp %st(1) # sched: [3:1.00]
; HASWELL-NEXT: fsubrp %st(2) # sched: [3:1.00]
-; HASWELL-NEXT: fisubrs (%ecx) # sched: [6:2.00]
-; HASWELL-NEXT: fisubrl (%eax) # sched: [6:2.00]
+; HASWELL-NEXT: fisubrs (%ecx) # sched: [13:2.00]
+; HASWELL-NEXT: fisubrl (%eax) # sched: [13:2.00]
; HASWELL-NEXT: #NO_APP
-; HASWELL-NEXT: retl # sched: [5:0.50]
+; HASWELL-NEXT: retl # sched: [7:1.00]
;
; BROADWELL-LABEL: test_fsubrp_fisubr:
; BROADWELL: # %bb.0:
; HASWELL-NEXT: #APP
; HASWELL-NEXT: ftst # sched: [1:1.00]
; HASWELL-NEXT: #NO_APP
-; HASWELL-NEXT: retl # sched: [5:0.50]
+; HASWELL-NEXT: retl # sched: [7:1.00]
;
; BROADWELL-LABEL: test_ftst:
; BROADWELL: # %bb.0:
; HASWELL-NEXT: fucomp %st(3) # sched: [1:1.00]
; HASWELL-NEXT: fucompp # sched: [1:0.50]
; HASWELL-NEXT: #NO_APP
-; HASWELL-NEXT: retl # sched: [5:0.50]
+; HASWELL-NEXT: retl # sched: [7:1.00]
;
; BROADWELL-LABEL: test_fucom_fucomp_fucompp:
; BROADWELL: # %bb.0:
; HASWELL-NEXT: fucomi %st(3) # sched: [1:0.50]
; HASWELL-NEXT: fucompi %st(3) # sched: [1:0.50]
; HASWELL-NEXT: #NO_APP
-; HASWELL-NEXT: retl # sched: [5:0.50]
+; HASWELL-NEXT: retl # sched: [7:1.00]
;
; BROADWELL-LABEL: test_fucomi_fucomip:
; BROADWELL: # %bb.0:
; HASWELL-NEXT: #APP
; HASWELL-NEXT: wait # sched: [1:0.50]
; HASWELL-NEXT: #NO_APP
-; HASWELL-NEXT: retl # sched: [5:0.50]
+; HASWELL-NEXT: retl # sched: [7:1.00]
;
; BROADWELL-LABEL: test_fwait:
; BROADWELL: # %bb.0:
; HASWELL-NEXT: #APP
; HASWELL-NEXT: fxam # sched: [1:2.00]
; HASWELL-NEXT: #NO_APP
-; HASWELL-NEXT: retl # sched: [5:0.50]
+; HASWELL-NEXT: retl # sched: [7:1.00]
;
; BROADWELL-LABEL: test_fxam:
; BROADWELL: # %bb.0:
; HASWELL-NEXT: fxch %st(1) # sched: [17:4.00]
; HASWELL-NEXT: fxch %st(3) # sched: [17:4.00]
; HASWELL-NEXT: #NO_APP
-; HASWELL-NEXT: retl # sched: [5:0.50]
+; HASWELL-NEXT: retl # sched: [7:1.00]
;
; BROADWELL-LABEL: test_fxch:
; BROADWELL: # %bb.0:
;
; HASWELL-LABEL: test_fxrstor_fxsave:
; HASWELL: # %bb.0:
-; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %eax # sched: [1:0.50]
+; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %eax # sched: [5:0.50]
; HASWELL-NEXT: #APP
-; HASWELL-NEXT: fxrstor (%eax) # sched: [59:16.50]
+; HASWELL-NEXT: fxrstor (%eax) # sched: [64:16.50]
; HASWELL-NEXT: fxsave (%eax) # sched: [100:0.25]
; HASWELL-NEXT: #NO_APP
-; HASWELL-NEXT: retl # sched: [5:0.50]
+; HASWELL-NEXT: retl # sched: [7:1.00]
;
; BROADWELL-LABEL: test_fxrstor_fxsave:
; BROADWELL: # %bb.0:
; HASWELL-NEXT: #APP
; HASWELL-NEXT: fxtract # sched: [15:?]
; HASWELL-NEXT: #NO_APP
-; HASWELL-NEXT: retl # sched: [5:0.50]
+; HASWELL-NEXT: retl # sched: [7:1.00]
;
; BROADWELL-LABEL: test_fxtract:
; BROADWELL: # %bb.0:
; HASWELL-NEXT: #APP
; HASWELL-NEXT: fyl2x # sched: [100:0.25]
; HASWELL-NEXT: #NO_APP
-; HASWELL-NEXT: retl # sched: [5:0.50]
+; HASWELL-NEXT: retl # sched: [7:1.00]
;
; BROADWELL-LABEL: test_fyl2x:
; BROADWELL: # %bb.0:
; HASWELL-NEXT: #APP
; HASWELL-NEXT: fyl2xp1 # sched: [100:0.25]
; HASWELL-NEXT: #NO_APP
-; HASWELL-NEXT: retl # sched: [5:0.50]
+; HASWELL-NEXT: retl # sched: [7:1.00]
;
; BROADWELL-LABEL: test_fyl2xp1:
; BROADWELL: # %bb.0: