Index: lib/Target/X86/X86SchedHaswell.td =================================================================== --- lib/Target/X86/X86SchedHaswell.td +++ lib/Target/X86/X86SchedHaswell.td @@ -17,7 +17,7 @@ // instructions per cycle. let IssueWidth = 4; let MicroOpBufferSize = 192; // Based on the reorder buffer. - let LoadLatency = 4; + let LoadLatency = 5; let MispredictPenalty = 16; // Based on the LSD (loop-stream detector) queue size and benchmarking data. @@ -70,9 +70,9 @@ // Integer division issued on port 0. def HWDivider : ProcResource<1>; -// Loads are 4 cycles, so ReadAfterLd registers needn't be available until 4 +// Loads are 5 cycles, so ReadAfterLd registers needn't be available until 5 // cycles after the memory operand. -def : ReadAdvance; +def : ReadAdvance; // Many SchedWrites are defined in pairs with and without a folded load. // Instructions with folded loads are usually micro-fused, so they only appear @@ -85,10 +85,10 @@ // Register variant is using a single cycle on ExePort. def : WriteRes { let Latency = Lat; } - // Memory variant also uses a cycle on port 2/3 and adds 4 cycles to the + // Memory variant also uses a cycle on port 2/3 and adds 5 cycles to the // latency. def : WriteRes { - let Latency = !add(Lat, 4); + let Latency = !add(Lat, 5); } } @@ -99,7 +99,7 @@ // Store_addr on 237. // Store_data on 4. def : WriteRes; -def : WriteRes { let Latency = 4; } +def : WriteRes { let Latency = 5; } def : WriteRes; def : WriteRes; @@ -435,7 +435,7 @@ // MOVSX, MOVZX. // r,m. -def : InstRW<[WriteLoad], (instregex "MOV(S|Z)X32rm(8|16)")>; +def : InstRW<[WriteLoad], (instregex "MOV(S|Z)X32rm8")>; // XLAT. def WriteXLAT : SchedWriteRes<[]> { @@ -535,9 +535,6 @@ } def : InstRW<[WriteMOVS], (instregex "MOVS(B|L|Q|W)")>; -// SCAS. -def : InstRW<[Write2P0156_P23], (instregex "SCAS(B|W|L|Q)")>; - // CMPS. def WriteCMPS : SchedWriteRes<[HWPort23, HWPort0156]> { let Latency = 4; @@ -678,81 +675,6 @@ } def : InstRW<[WriteFNINIT], (instregex "FNINIT")>; -//=== Integer MMX and XMM Instructions ===// - -// PBLENDW. -// x,x,i / v,v,v,i -def WritePBLENDWr : SchedWriteRes<[HWPort5]>; -def : InstRW<[WritePBLENDWr], (instregex "(V?)PBLENDW(Y?)rri")>; - -// x,m,i / v,v,m,i -def WritePBLENDWm : SchedWriteRes<[HWPort5, HWPort23]> { - let NumMicroOps = 2; - let Latency = 4; - let ResourceCycles = [1, 1]; -} -def : InstRW<[WritePBLENDWm, ReadAfterLd], (instregex "(V?)PBLENDW(Y?)rmi")>; - -// PMOVMSKB. -def WritePMOVMSKB : SchedWriteRes<[HWPort0]> { - let Latency = 3; -} -def : InstRW<[WritePMOVMSKB], (instregex "(V|MMX_)?PMOVMSKB(Y?)rr")>; - -// VPGATHERDD. -// x. -def WriteVPGATHERDD128 : SchedWriteRes<[]> { - let NumMicroOps = 20; -} -def : InstRW<[WriteVPGATHERDD128, ReadAfterLd], (instregex "VPGATHERDDrm")>; - -// y. -def WriteVPGATHERDD256 : SchedWriteRes<[]> { - let NumMicroOps = 34; -} -def : InstRW<[WriteVPGATHERDD256, ReadAfterLd], (instregex "VPGATHERDDYrm")>; - -// VPGATHERQD. -// x. -def WriteVPGATHERQD128 : SchedWriteRes<[]> { - let NumMicroOps = 15; -} -def : InstRW<[WriteVPGATHERQD128, ReadAfterLd], (instregex "VPGATHERQDrm")>; - -// y. -def WriteVPGATHERQD256 : SchedWriteRes<[]> { - let NumMicroOps = 22; -} -def : InstRW<[WriteVPGATHERQD256, ReadAfterLd], (instregex "VPGATHERQDYrm")>; - -// VPGATHERDQ. -// x. -def WriteVPGATHERDQ128 : SchedWriteRes<[]> { - let NumMicroOps = 12; -} -def : InstRW<[WriteVPGATHERDQ128, ReadAfterLd], (instregex "VPGATHERDQrm")>; - -// y. -def WriteVPGATHERDQ256 : SchedWriteRes<[]> { - let NumMicroOps = 20; -} -def : InstRW<[WriteVPGATHERDQ256, ReadAfterLd], (instregex "VPGATHERDQYrm")>; - -// VPGATHERQQ. -// x. -def WriteVPGATHERQQ128 : SchedWriteRes<[]> { - let NumMicroOps = 14; -} -def : InstRW<[WriteVPGATHERQQ128, ReadAfterLd], (instregex "VPGATHERQQrm")>; - -// y. -def WriteVPGATHERQQ256 : SchedWriteRes<[]> { - let NumMicroOps = 22; -} -def : InstRW<[WriteVPGATHERQQ256, ReadAfterLd], (instregex "VPGATHERQQYrm")>; - -//-- Arithmetic instructions --// - //////////////////////////////////////////////////////////////////////////////// // Horizontal add/sub instructions. //////////////////////////////////////////////////////////////////////////////// @@ -788,133 +710,103 @@ //=== Floating Point XMM and YMM Instructions ===// -// VGATHERDPS. -// x. -def WriteVGATHERDPS128 : SchedWriteRes<[]> { - let NumMicroOps = 20; -} -def : InstRW<[WriteVGATHERDPS128, ReadAfterLd], (instregex "VGATHERDPSrm")>; - -// y. -def WriteVGATHERDPS256 : SchedWriteRes<[]> { - let NumMicroOps = 34; -} -def : InstRW<[WriteVGATHERDPS256, ReadAfterLd], (instregex "VGATHERDPSYrm")>; - -// VGATHERQPS. -// x. -def WriteVGATHERQPS128 : SchedWriteRes<[]> { - let NumMicroOps = 15; -} -def : InstRW<[WriteVGATHERQPS128, ReadAfterLd], (instregex "VGATHERQPSrm")>; - -// y. -def WriteVGATHERQPS256 : SchedWriteRes<[]> { - let NumMicroOps = 22; -} -def : InstRW<[WriteVGATHERQPS256, ReadAfterLd], (instregex "VGATHERQPSYrm")>; - -// VGATHERDPD. -// x. -def WriteVGATHERDPD128 : SchedWriteRes<[]> { - let NumMicroOps = 12; -} -def : InstRW<[WriteVGATHERDPD128, ReadAfterLd], (instregex "VGATHERDPDrm")>; - -// y. -def WriteVGATHERDPD256 : SchedWriteRes<[]> { - let NumMicroOps = 20; -} -def : InstRW<[WriteVGATHERDPD256, ReadAfterLd], (instregex "VGATHERDPDYrm")>; - -// VGATHERQPD. -// x. -def WriteVGATHERQPD128 : SchedWriteRes<[]> { - let NumMicroOps = 14; -} -def : InstRW<[WriteVGATHERQPD128, ReadAfterLd], (instregex "VGATHERQPDrm")>; - -// y. -def WriteVGATHERQPD256 : SchedWriteRes<[]> { - let NumMicroOps = 22; -} -def : InstRW<[WriteVGATHERQPD256, ReadAfterLd], (instregex "VGATHERQPDYrm")>; - // Remaining instrs. def HWWriteResGroup0 : SchedWriteRes<[HWPort23]> { - let Latency = 1; + let Latency = 6; let NumMicroOps = 1; let ResourceCycles = [1]; } def: InstRW<[HWWriteResGroup0], (instregex "LDDQUrm")>; -def: InstRW<[HWWriteResGroup0], (instregex "LD_F32m")>; -def: InstRW<[HWWriteResGroup0], (instregex "LD_F64m")>; -def: InstRW<[HWWriteResGroup0], (instregex "LD_F80m")>; -def: InstRW<[HWWriteResGroup0], (instregex "MMX_MOVD64from64rm")>; -def: InstRW<[HWWriteResGroup0], (instregex "MMX_MOVD64rm")>; -def: InstRW<[HWWriteResGroup0], (instregex "MMX_MOVD64to64rm")>; -def: InstRW<[HWWriteResGroup0], (instregex "MMX_MOVQ64rm")>; -def: InstRW<[HWWriteResGroup0], (instregex "MOV(16|32|64)rm")>; -def: InstRW<[HWWriteResGroup0], (instregex "MOV64toPQIrm")>; -def: InstRW<[HWWriteResGroup0], (instregex "MOV8rm")>; def: InstRW<[HWWriteResGroup0], (instregex "MOVAPDrm")>; def: InstRW<[HWWriteResGroup0], (instregex "MOVAPSrm")>; -def: InstRW<[HWWriteResGroup0], (instregex "MOVDDUPrm")>; -def: InstRW<[HWWriteResGroup0], (instregex "MOVDI2PDIrm")>; def: InstRW<[HWWriteResGroup0], (instregex "MOVDQArm")>; def: InstRW<[HWWriteResGroup0], (instregex "MOVDQUrm")>; def: InstRW<[HWWriteResGroup0], (instregex "MOVNTDQArm")>; def: InstRW<[HWWriteResGroup0], (instregex "MOVSHDUPrm")>; def: InstRW<[HWWriteResGroup0], (instregex "MOVSLDUPrm")>; -def: InstRW<[HWWriteResGroup0], (instregex "MOVSSrm")>; -def: InstRW<[HWWriteResGroup0], (instregex "MOVSX(16|32|64)rm16")>; -def: InstRW<[HWWriteResGroup0], (instregex "MOVSX(16|32|64)rm32")>; -def: InstRW<[HWWriteResGroup0], (instregex "MOVSX(16|32|64)rm8")>; def: InstRW<[HWWriteResGroup0], (instregex "MOVUPDrm")>; def: InstRW<[HWWriteResGroup0], (instregex "MOVUPSrm")>; -def: InstRW<[HWWriteResGroup0], (instregex "MOVZX(16|32|64)rm16")>; -def: InstRW<[HWWriteResGroup0], (instregex "MOVZX(16|32|64)rm8")>; -def: InstRW<[HWWriteResGroup0], (instregex "PREFETCHNTA")>; -def: InstRW<[HWWriteResGroup0], (instregex "PREFETCHT0")>; -def: InstRW<[HWWriteResGroup0], (instregex "PREFETCHT1")>; -def: InstRW<[HWWriteResGroup0], (instregex "PREFETCHT2")>; -def: InstRW<[HWWriteResGroup0], (instregex "VBROADCASTF128")>; -def: InstRW<[HWWriteResGroup0], (instregex "VBROADCASTI128")>; -def: InstRW<[HWWriteResGroup0], (instregex "VBROADCASTSDYrm")>; -def: InstRW<[HWWriteResGroup0], (instregex "VBROADCASTSSYrm")>; def: InstRW<[HWWriteResGroup0], (instregex "VBROADCASTSSrm")>; -def: InstRW<[HWWriteResGroup0], (instregex "VLDDQUYrm")>; def: InstRW<[HWWriteResGroup0], (instregex "VLDDQUrm")>; -def: InstRW<[HWWriteResGroup0], (instregex "VMOV64toPQIrm")>; -def: InstRW<[HWWriteResGroup0], (instregex "VMOVAPDYrm")>; def: InstRW<[HWWriteResGroup0], (instregex "VMOVAPDrm")>; -def: InstRW<[HWWriteResGroup0], (instregex "VMOVAPSYrm")>; def: InstRW<[HWWriteResGroup0], (instregex "VMOVAPSrm")>; -def: InstRW<[HWWriteResGroup0], (instregex "VMOVDDUPYrm")>; -def: InstRW<[HWWriteResGroup0], (instregex "VMOVDDUPrm")>; -def: InstRW<[HWWriteResGroup0], (instregex "VMOVDI2PDIrm")>; -def: InstRW<[HWWriteResGroup0], (instregex "VMOVDQAYrm")>; def: InstRW<[HWWriteResGroup0], (instregex "VMOVDQArm")>; -def: InstRW<[HWWriteResGroup0], (instregex "VMOVDQUYrm")>; def: InstRW<[HWWriteResGroup0], (instregex "VMOVDQUrm")>; -def: InstRW<[HWWriteResGroup0], (instregex "VMOVNTDQAYrm")>; def: InstRW<[HWWriteResGroup0], (instregex "VMOVNTDQArm")>; -def: InstRW<[HWWriteResGroup0], (instregex "VMOVQI2PQIrm")>; -def: InstRW<[HWWriteResGroup0], (instregex "VMOVSDrm")>; -def: InstRW<[HWWriteResGroup0], (instregex "VMOVSHDUPYrm")>; def: InstRW<[HWWriteResGroup0], (instregex "VMOVSHDUPrm")>; -def: InstRW<[HWWriteResGroup0], (instregex "VMOVSLDUPYrm")>; def: InstRW<[HWWriteResGroup0], (instregex "VMOVSLDUPrm")>; -def: InstRW<[HWWriteResGroup0], (instregex "VMOVSSrm")>; -def: InstRW<[HWWriteResGroup0], (instregex "VMOVUPDYrm")>; def: InstRW<[HWWriteResGroup0], (instregex "VMOVUPDrm")>; -def: InstRW<[HWWriteResGroup0], (instregex "VMOVUPSYrm")>; def: InstRW<[HWWriteResGroup0], (instregex "VMOVUPSrm")>; -def: InstRW<[HWWriteResGroup0], (instregex "VPBROADCASTDYrm")>; def: InstRW<[HWWriteResGroup0], (instregex "VPBROADCASTDrm")>; -def: InstRW<[HWWriteResGroup0], (instregex "VPBROADCASTQYrm")>; def: InstRW<[HWWriteResGroup0], (instregex "VPBROADCASTQrm")>; +def: InstRW<[HWWriteResGroup0], (instregex "ROUNDPDr")>; +def: InstRW<[HWWriteResGroup0], (instregex "ROUNDPSr")>; +def: InstRW<[HWWriteResGroup0], (instregex "ROUNDSDr")>; +def: InstRW<[HWWriteResGroup0], (instregex "ROUNDSSr")>; +def: InstRW<[HWWriteResGroup0], (instregex "VROUNDPDr")>; +def: InstRW<[HWWriteResGroup0], (instregex "VROUNDPSr")>; +def: InstRW<[HWWriteResGroup0], (instregex "VROUNDSDr")>; +def: InstRW<[HWWriteResGroup0], (instregex "VROUNDSSr")>; +def: InstRW<[HWWriteResGroup0], (instregex "VROUNDYPDr")>; +def: InstRW<[HWWriteResGroup0], (instregex "VROUNDYPSr")>; + +def HWWriteResGroup0_1 : SchedWriteRes<[HWPort23]> { + let Latency = 7; + let NumMicroOps = 1; + let ResourceCycles = [1]; +} +def: InstRW<[HWWriteResGroup0_1], (instregex "LD_F32m")>; +def: InstRW<[HWWriteResGroup0_1], (instregex "LD_F64m")>; +def: InstRW<[HWWriteResGroup0_1], (instregex "LD_F80m")>; +def: InstRW<[HWWriteResGroup0_1], (instregex "VBROADCASTF128")>; +def: InstRW<[HWWriteResGroup0_1], (instregex "VBROADCASTI128")>; +def: InstRW<[HWWriteResGroup0_1], (instregex "VBROADCASTSDYrm")>; +def: InstRW<[HWWriteResGroup0_1], (instregex "VBROADCASTSSYrm")>; +def: InstRW<[HWWriteResGroup0_1], (instregex "VLDDQUYrm")>; +def: InstRW<[HWWriteResGroup0_1], (instregex "VMOVAPDYrm")>; +def: InstRW<[HWWriteResGroup0_1], (instregex "VMOVAPSYrm")>; +def: InstRW<[HWWriteResGroup0_1], (instregex "VMOVDDUPYrm")>; +def: InstRW<[HWWriteResGroup0_1], (instregex "VMOVDQAYrm")>; +def: InstRW<[HWWriteResGroup0_1], (instregex "VMOVDQUYrm")>; +def: InstRW<[HWWriteResGroup0_1], (instregex "VMOVNTDQAYrm")>; +def: InstRW<[HWWriteResGroup0_1], (instregex "VMOVSHDUPYrm")>; +def: InstRW<[HWWriteResGroup0_1], (instregex "VMOVSLDUPYrm")>; +def: InstRW<[HWWriteResGroup0_1], (instregex "VMOVUPDYrm")>; +def: InstRW<[HWWriteResGroup0_1], (instregex "VMOVUPSYrm")>; +def: InstRW<[HWWriteResGroup0_1], (instregex "VPBROADCASTDYrm")>; +def: InstRW<[HWWriteResGroup0_1], (instregex "VPBROADCASTQYrm")>; + +def HWWriteResGroup0_2 : SchedWriteRes<[HWPort23]> { + let Latency = 5; + let NumMicroOps = 1; + let ResourceCycles = [1]; +} +def: InstRW<[HWWriteResGroup0_2], (instregex "MMX_MOVD64from64rm")>; +def: InstRW<[HWWriteResGroup0_2], (instregex "MMX_MOVD64rm")>; +def: InstRW<[HWWriteResGroup0_2], (instregex "MMX_MOVD64to64rm")>; +def: InstRW<[HWWriteResGroup0_2], (instregex "MMX_MOVQ64rm")>; +def: InstRW<[HWWriteResGroup0_2], (instregex "MOV(16|32|64)rm")>; +def: InstRW<[HWWriteResGroup0_2], (instregex "MOV64toPQIrm")>; +def: InstRW<[HWWriteResGroup0_2], (instregex "MOV8rm")>; +def: InstRW<[HWWriteResGroup0_2], (instregex "MOVDDUPrm")>; +def: InstRW<[HWWriteResGroup0_2], (instregex "MOVDI2PDIrm")>; +def: InstRW<[HWWriteResGroup0_2], (instregex "MOVSSrm")>; +def: InstRW<[HWWriteResGroup0_2], (instregex "MOVSX(16|32|64)rm16")>; +def: InstRW<[HWWriteResGroup0_2], (instregex "MOVSX(16|32|64)rm32")>; +def: InstRW<[HWWriteResGroup0_2], (instregex "MOVSX(16|32|64)rm8")>; +def: InstRW<[HWWriteResGroup0_2], (instregex "MOVZX(16|32|64)rm16")>; +def: InstRW<[HWWriteResGroup0_2], (instregex "MOVZX(16|32|64)rm8")>; +def: InstRW<[HWWriteResGroup0_2], (instregex "PREFETCHNTA")>; +def: InstRW<[HWWriteResGroup0_2], (instregex "PREFETCHT0")>; +def: InstRW<[HWWriteResGroup0_2], (instregex "PREFETCHT1")>; +def: InstRW<[HWWriteResGroup0_2], (instregex "PREFETCHT2")>; +def: InstRW<[HWWriteResGroup0_2], (instregex "VMOV64toPQIrm")>; +def: InstRW<[HWWriteResGroup0_2], (instregex "VMOVDDUPrm")>; +def: InstRW<[HWWriteResGroup0_2], (instregex "VMOVDI2PDIrm")>; +def: InstRW<[HWWriteResGroup0_2], (instregex "VMOVQI2PQIrm")>; +def: InstRW<[HWWriteResGroup0_2], (instregex "VMOVSDrm")>; +def: InstRW<[HWWriteResGroup0_2], (instregex "VMOVSSrm")>; def HWWriteResGroup1 : SchedWriteRes<[HWPort4,HWPort237]> { let Latency = 1; @@ -1638,12 +1530,11 @@ def: InstRW<[HWWriteResGroup10], (instregex "XOR8rr")>; def HWWriteResGroup11 : SchedWriteRes<[HWPort0,HWPort23]> { - let Latency = 1; + let Latency = 6; let NumMicroOps = 2; let ResourceCycles = [1,1]; } def: InstRW<[HWWriteResGroup11], (instregex "CVTPS2PDrm")>; -def: InstRW<[HWWriteResGroup11], (instregex "CVTSS2SDrm")>; def: InstRW<[HWWriteResGroup11], (instregex "MMX_PSLLDrm")>; def: InstRW<[HWWriteResGroup11], (instregex "MMX_PSLLQrm")>; def: InstRW<[HWWriteResGroup11], (instregex "MMX_PSLLWrm")>; @@ -1652,39 +1543,96 @@ def: InstRW<[HWWriteResGroup11], (instregex "MMX_PSRLDrm")>; def: InstRW<[HWWriteResGroup11], (instregex "MMX_PSRLQrm")>; def: InstRW<[HWWriteResGroup11], (instregex "MMX_PSRLWrm")>; -def: InstRW<[HWWriteResGroup11], (instregex "VCVTPH2PSYrm")>; def: InstRW<[HWWriteResGroup11], (instregex "VCVTPH2PSrm")>; def: InstRW<[HWWriteResGroup11], (instregex "VCVTPS2PDrm")>; -def: InstRW<[HWWriteResGroup11], (instregex "VCVTSS2SDrm")>; -def: InstRW<[HWWriteResGroup11], (instregex "VPSLLDYrm")>; -def: InstRW<[HWWriteResGroup11], (instregex "VPSLLQYrm")>; -def: InstRW<[HWWriteResGroup11], (instregex "VPSLLVQYrm")>; -def: InstRW<[HWWriteResGroup11], (instregex "VPSLLVQrm")>; -def: InstRW<[HWWriteResGroup11], (instregex "VPSLLWYrm")>; -def: InstRW<[HWWriteResGroup11], (instregex "VPSRADYrm")>; -def: InstRW<[HWWriteResGroup11], (instregex "VPSRAWYrm")>; -def: InstRW<[HWWriteResGroup11], (instregex "VPSRLDYrm")>; -def: InstRW<[HWWriteResGroup11], (instregex "VPSRLQYrm")>; -def: InstRW<[HWWriteResGroup11], (instregex "VPSRLVQYrm")>; -def: InstRW<[HWWriteResGroup11], (instregex "VPSRLVQrm")>; -def: InstRW<[HWWriteResGroup11], (instregex "VPSRLWYrm")>; -def: InstRW<[HWWriteResGroup11], (instregex "VTESTPDYrm")>; -def: InstRW<[HWWriteResGroup11], (instregex "VTESTPDrm")>; -def: InstRW<[HWWriteResGroup11], (instregex "VTESTPSYrm")>; -def: InstRW<[HWWriteResGroup11], (instregex "VTESTPSrm")>; + +def HWWriteResGroup11_1 : SchedWriteRes<[HWPort0,HWPort23]> { + let Latency = 7; + let NumMicroOps = 2; + let ResourceCycles = [1,1]; +} +def: InstRW<[HWWriteResGroup11_1], (instregex "CVTSS2SDrm")>; +def: InstRW<[HWWriteResGroup11_1], (instregex "VCVTPH2PSYrm")>; +def: InstRW<[HWWriteResGroup11_1], (instregex "VCVTSS2SDrm")>; +def: InstRW<[HWWriteResGroup11_1], (instregex "VPSLLVQrm")>; +def: InstRW<[HWWriteResGroup11_1], (instregex "VPSRLVQrm")>; +def: InstRW<[HWWriteResGroup11_1], (instregex "VTESTPDrm")>; +def: InstRW<[HWWriteResGroup11_1], (instregex "VTESTPSrm")>; + +def HWWriteResGroup11_2 : SchedWriteRes<[HWPort0,HWPort23]> { + let Latency = 8; + let NumMicroOps = 2; + let ResourceCycles = [1,1]; +} +def: InstRW<[HWWriteResGroup11_2], (instregex "VPSLLDYrm")>; +def: InstRW<[HWWriteResGroup11_2], (instregex "VPSLLQYrm")>; +def: InstRW<[HWWriteResGroup11_2], (instregex "VPSLLVQYrm")>; +def: InstRW<[HWWriteResGroup11_2], (instregex "VPSLLWYrm")>; +def: InstRW<[HWWriteResGroup11_2], (instregex "VPSRADYrm")>; +def: InstRW<[HWWriteResGroup11_2], (instregex "VPSRAWYrm")>; +def: InstRW<[HWWriteResGroup11_2], (instregex "VPSRLDYrm")>; +def: InstRW<[HWWriteResGroup11_2], (instregex "VPSRLQYrm")>; +def: InstRW<[HWWriteResGroup11_2], (instregex "VPSRLVQYrm")>; +def: InstRW<[HWWriteResGroup11_2], (instregex "VPSRLWYrm")>; +def: InstRW<[HWWriteResGroup11_2], (instregex "VTESTPDYrm")>; +def: InstRW<[HWWriteResGroup11_2], (instregex "VTESTPSYrm")>; def HWWriteResGroup12 : SchedWriteRes<[HWPort1,HWPort23]> { - let Latency = 1; + let Latency = 8; let NumMicroOps = 2; let ResourceCycles = [1,1]; } +def: InstRW<[HWWriteResGroup12], (instregex "ADDSDrm")>; +def: InstRW<[HWWriteResGroup12], (instregex "ADDSSrm")>; +def: InstRW<[HWWriteResGroup12], (instregex "BSF(16|32|64)rm")>; +def: InstRW<[HWWriteResGroup12], (instregex "BSR(16|32|64)rm")>; +def: InstRW<[HWWriteResGroup12], (instregex "CMPSSrm")>; +def: InstRW<[HWWriteResGroup12], (instregex "COMISDrm")>; +def: InstRW<[HWWriteResGroup12], (instregex "COMISSrm")>; def: InstRW<[HWWriteResGroup12], (instregex "FCOM32m")>; def: InstRW<[HWWriteResGroup12], (instregex "FCOM64m")>; def: InstRW<[HWWriteResGroup12], (instregex "FCOMP32m")>; def: InstRW<[HWWriteResGroup12], (instregex "FCOMP64m")>; +def: InstRW<[HWWriteResGroup12], (instregex "IMUL(16|32|64)m")>; +def: InstRW<[HWWriteResGroup12], (instregex "IMUL(16|32|64)rm(i8?)")>; +def: InstRW<[HWWriteResGroup12], (instregex "IMUL8m")>; +def: InstRW<[HWWriteResGroup12], (instregex "LZCNT(16|32|64)rm")>; +def: InstRW<[HWWriteResGroup12], (instregex "MAXSDrm")>; +def: InstRW<[HWWriteResGroup12], (instregex "MAXSSrm")>; +def: InstRW<[HWWriteResGroup12], (instregex "MINSDrm")>; +def: InstRW<[HWWriteResGroup12], (instregex "MINSSrm")>; +def: InstRW<[HWWriteResGroup12], (instregex "MMX_CVTPI2PSirm")>; +def: InstRW<[HWWriteResGroup12], (instregex "MMX_CVTPS2PIirm")>; +def: InstRW<[HWWriteResGroup12], (instregex "MMX_CVTTPS2PIirm")>; +def: InstRW<[HWWriteResGroup12], (instregex "MUL(16|32|64)m")>; +def: InstRW<[HWWriteResGroup12], (instregex "MUL8m")>; +def: InstRW<[HWWriteResGroup12], (instregex "PDEP32rm")>; +def: InstRW<[HWWriteResGroup12], (instregex "PDEP64rm")>; +def: InstRW<[HWWriteResGroup12], (instregex "PEXT32rm")>; +def: InstRW<[HWWriteResGroup12], (instregex "PEXT64rm")>; +def: InstRW<[HWWriteResGroup12], (instregex "POPCNT(16|32|64)rm")>; +def: InstRW<[HWWriteResGroup12], (instregex "SUBSDrm")>; +def: InstRW<[HWWriteResGroup12], (instregex "SUBSSrm")>; +def: InstRW<[HWWriteResGroup12], (instregex "TZCNT(16|32|64)rm")>; +def: InstRW<[HWWriteResGroup12], (instregex "UCOMISDrm")>; +def: InstRW<[HWWriteResGroup12], (instregex "UCOMISSrm")>; +def: InstRW<[HWWriteResGroup12], (instregex "VADDSDrm")>; +def: InstRW<[HWWriteResGroup12], (instregex "VADDSSrm")>; +def: InstRW<[HWWriteResGroup12], (instregex "VCMPSDrm")>; +def: InstRW<[HWWriteResGroup12], (instregex "VCMPSSrm")>; +def: InstRW<[HWWriteResGroup12], (instregex "VCOMISDrm")>; +def: InstRW<[HWWriteResGroup12], (instregex "VCOMISSrm")>; +def: InstRW<[HWWriteResGroup12], (instregex "VMAXSDrm")>; +def: InstRW<[HWWriteResGroup12], (instregex "VMAXSSrm")>; +def: InstRW<[HWWriteResGroup12], (instregex "VMINSDrm")>; +def: InstRW<[HWWriteResGroup12], (instregex "VMINSSrm")>; +def: InstRW<[HWWriteResGroup12], (instregex "VSUBSDrm")>; +def: InstRW<[HWWriteResGroup12], (instregex "VSUBSSrm")>; +def: InstRW<[HWWriteResGroup12], (instregex "VUCOMISDrm")>; +def: InstRW<[HWWriteResGroup12], (instregex "VUCOMISSrm")>; def HWWriteResGroup13 : SchedWriteRes<[HWPort5,HWPort23]> { - let Latency = 1; + let Latency = 7; let NumMicroOps = 2; let ResourceCycles = [1,1]; } @@ -1693,20 +1641,6 @@ def: InstRW<[HWWriteResGroup13], (instregex "ANDPDrm")>; def: InstRW<[HWWriteResGroup13], (instregex "ANDPSrm")>; def: InstRW<[HWWriteResGroup13], (instregex "INSERTPSrm")>; -def: InstRW<[HWWriteResGroup13], (instregex "MMX_PALIGNR64irm")>; -def: InstRW<[HWWriteResGroup13], (instregex "MMX_PINSRWirmi")>; -def: InstRW<[HWWriteResGroup13], (instregex "MMX_PSHUFBrm64")>; -def: InstRW<[HWWriteResGroup13], (instregex "MMX_PSHUFWmi")>; -def: InstRW<[HWWriteResGroup13], (instregex "MMX_PUNPCKHBWirm")>; -def: InstRW<[HWWriteResGroup13], (instregex "MMX_PUNPCKHDQirm")>; -def: InstRW<[HWWriteResGroup13], (instregex "MMX_PUNPCKHWDirm")>; -def: InstRW<[HWWriteResGroup13], (instregex "MMX_PUNPCKLBWirm")>; -def: InstRW<[HWWriteResGroup13], (instregex "MMX_PUNPCKLDQirm")>; -def: InstRW<[HWWriteResGroup13], (instregex "MMX_PUNPCKLWDirm")>; -def: InstRW<[HWWriteResGroup13], (instregex "MOVHPDrm")>; -def: InstRW<[HWWriteResGroup13], (instregex "MOVHPSrm")>; -def: InstRW<[HWWriteResGroup13], (instregex "MOVLPDrm")>; -def: InstRW<[HWWriteResGroup13], (instregex "MOVLPSrm")>; def: InstRW<[HWWriteResGroup13], (instregex "ORPDrm")>; def: InstRW<[HWWriteResGroup13], (instregex "ORPSrm")>; def: InstRW<[HWWriteResGroup13], (instregex "PACKSSDWrm")>; @@ -1715,22 +1649,6 @@ def: InstRW<[HWWriteResGroup13], (instregex "PACKUSWBrm")>; def: InstRW<[HWWriteResGroup13], (instregex "PALIGNRrmi")>; def: InstRW<[HWWriteResGroup13], (instregex "PBLENDWrmi")>; -def: InstRW<[HWWriteResGroup13], (instregex "PINSRBrm")>; -def: InstRW<[HWWriteResGroup13], (instregex "PINSRDrm")>; -def: InstRW<[HWWriteResGroup13], (instregex "PINSRQrm")>; -def: InstRW<[HWWriteResGroup13], (instregex "PINSRWrmi")>; -def: InstRW<[HWWriteResGroup13], (instregex "PMOVSXBDrm")>; -def: InstRW<[HWWriteResGroup13], (instregex "PMOVSXBQrm")>; -def: InstRW<[HWWriteResGroup13], (instregex "PMOVSXBWrm")>; -def: InstRW<[HWWriteResGroup13], (instregex "PMOVSXDQrm")>; -def: InstRW<[HWWriteResGroup13], (instregex "PMOVSXWDrm")>; -def: InstRW<[HWWriteResGroup13], (instregex "PMOVSXWQrm")>; -def: InstRW<[HWWriteResGroup13], (instregex "PMOVZXBDrm")>; -def: InstRW<[HWWriteResGroup13], (instregex "PMOVZXBQrm")>; -def: InstRW<[HWWriteResGroup13], (instregex "PMOVZXBWrm")>; -def: InstRW<[HWWriteResGroup13], (instregex "PMOVZXDQrm")>; -def: InstRW<[HWWriteResGroup13], (instregex "PMOVZXWDrm")>; -def: InstRW<[HWWriteResGroup13], (instregex "PMOVZXWQrm")>; def: InstRW<[HWWriteResGroup13], (instregex "PSHUFBrm")>; def: InstRW<[HWWriteResGroup13], (instregex "PSHUFDmi")>; def: InstRW<[HWWriteResGroup13], (instregex "PSHUFHWmi")>; @@ -1749,104 +1667,149 @@ def: InstRW<[HWWriteResGroup13], (instregex "UNPCKHPSrm")>; def: InstRW<[HWWriteResGroup13], (instregex "UNPCKLPDrm")>; def: InstRW<[HWWriteResGroup13], (instregex "UNPCKLPSrm")>; -def: InstRW<[HWWriteResGroup13], (instregex "VANDNPDYrm")>; def: InstRW<[HWWriteResGroup13], (instregex "VANDNPDrm")>; -def: InstRW<[HWWriteResGroup13], (instregex "VANDNPSYrm")>; def: InstRW<[HWWriteResGroup13], (instregex "VANDNPSrm")>; -def: InstRW<[HWWriteResGroup13], (instregex "VANDPDYrm")>; def: InstRW<[HWWriteResGroup13], (instregex "VANDPDrm")>; -def: InstRW<[HWWriteResGroup13], (instregex "VANDPSYrm")>; def: InstRW<[HWWriteResGroup13], (instregex "VANDPSrm")>; def: InstRW<[HWWriteResGroup13], (instregex "VINSERTPSrm")>; -def: InstRW<[HWWriteResGroup13], (instregex "VMOVHPDrm")>; -def: InstRW<[HWWriteResGroup13], (instregex "VMOVHPSrm")>; -def: InstRW<[HWWriteResGroup13], (instregex "VMOVLPDrm")>; -def: InstRW<[HWWriteResGroup13], (instregex "VMOVLPSrm")>; -def: InstRW<[HWWriteResGroup13], (instregex "VORPDYrm")>; def: InstRW<[HWWriteResGroup13], (instregex "VORPDrm")>; -def: InstRW<[HWWriteResGroup13], (instregex "VORPSYrm")>; def: InstRW<[HWWriteResGroup13], (instregex "VORPSrm")>; -def: InstRW<[HWWriteResGroup13], (instregex "VPACKSSDWYrm")>; def: InstRW<[HWWriteResGroup13], (instregex "VPACKSSDWrm")>; -def: InstRW<[HWWriteResGroup13], (instregex "VPACKSSWBYrm")>; def: InstRW<[HWWriteResGroup13], (instregex "VPACKSSWBrm")>; -def: InstRW<[HWWriteResGroup13], (instregex "VPACKUSDWYrm")>; def: InstRW<[HWWriteResGroup13], (instregex "VPACKUSDWrm")>; -def: InstRW<[HWWriteResGroup13], (instregex "VPACKUSWBYrm")>; def: InstRW<[HWWriteResGroup13], (instregex "VPACKUSWBrm")>; -def: InstRW<[HWWriteResGroup13], (instregex "VPALIGNRYrmi")>; def: InstRW<[HWWriteResGroup13], (instregex "VPALIGNRrmi")>; -def: InstRW<[HWWriteResGroup13], (instregex "VPBLENDWYrmi")>; def: InstRW<[HWWriteResGroup13], (instregex "VPBLENDWrmi")>; -def: InstRW<[HWWriteResGroup13], (instregex "VPERMILPDYmi")>; -def: InstRW<[HWWriteResGroup13], (instregex "VPERMILPDYrm")>; def: InstRW<[HWWriteResGroup13], (instregex "VPERMILPDmi")>; def: InstRW<[HWWriteResGroup13], (instregex "VPERMILPDrm")>; -def: InstRW<[HWWriteResGroup13], (instregex "VPERMILPSYmi")>; -def: InstRW<[HWWriteResGroup13], (instregex "VPERMILPSYrm")>; def: InstRW<[HWWriteResGroup13], (instregex "VPERMILPSmi")>; def: InstRW<[HWWriteResGroup13], (instregex "VPERMILPSrm")>; -def: InstRW<[HWWriteResGroup13], (instregex "VPINSRBrm")>; -def: InstRW<[HWWriteResGroup13], (instregex "VPINSRDrm")>; -def: InstRW<[HWWriteResGroup13], (instregex "VPINSRQrm")>; -def: InstRW<[HWWriteResGroup13], (instregex "VPINSRWrmi")>; -def: InstRW<[HWWriteResGroup13], (instregex "VPMOVSXBDrm")>; -def: InstRW<[HWWriteResGroup13], (instregex "VPMOVSXBQrm")>; -def: InstRW<[HWWriteResGroup13], (instregex "VPMOVSXBWrm")>; -def: InstRW<[HWWriteResGroup13], (instregex "VPMOVSXDQrm")>; -def: InstRW<[HWWriteResGroup13], (instregex "VPMOVSXWDrm")>; -def: InstRW<[HWWriteResGroup13], (instregex "VPMOVSXWQrm")>; -def: InstRW<[HWWriteResGroup13], (instregex "VPMOVZXBDrm")>; -def: InstRW<[HWWriteResGroup13], (instregex "VPMOVZXBQrm")>; -def: InstRW<[HWWriteResGroup13], (instregex "VPMOVZXBWrm")>; -def: InstRW<[HWWriteResGroup13], (instregex "VPMOVZXDQrm")>; -def: InstRW<[HWWriteResGroup13], (instregex "VPMOVZXWDrm")>; -def: InstRW<[HWWriteResGroup13], (instregex "VPMOVZXWQrm")>; -def: InstRW<[HWWriteResGroup13], (instregex "VPSHUFBYrm")>; def: InstRW<[HWWriteResGroup13], (instregex "VPSHUFBrm")>; -def: InstRW<[HWWriteResGroup13], (instregex "VPSHUFDYmi")>; def: InstRW<[HWWriteResGroup13], (instregex "VPSHUFDmi")>; -def: InstRW<[HWWriteResGroup13], (instregex "VPSHUFHWYmi")>; def: InstRW<[HWWriteResGroup13], (instregex "VPSHUFHWmi")>; -def: InstRW<[HWWriteResGroup13], (instregex "VPSHUFLWYmi")>; def: InstRW<[HWWriteResGroup13], (instregex "VPSHUFLWmi")>; -def: InstRW<[HWWriteResGroup13], (instregex "VPUNPCKHBWYrm")>; def: InstRW<[HWWriteResGroup13], (instregex "VPUNPCKHBWrm")>; -def: InstRW<[HWWriteResGroup13], (instregex "VPUNPCKHDQYrm")>; def: InstRW<[HWWriteResGroup13], (instregex "VPUNPCKHDQrm")>; -def: InstRW<[HWWriteResGroup13], (instregex "VPUNPCKHQDQYrm")>; def: InstRW<[HWWriteResGroup13], (instregex "VPUNPCKHQDQrm")>; -def: InstRW<[HWWriteResGroup13], (instregex "VPUNPCKHWDYrm")>; def: InstRW<[HWWriteResGroup13], (instregex "VPUNPCKHWDrm")>; -def: InstRW<[HWWriteResGroup13], (instregex "VPUNPCKLBWYrm")>; def: InstRW<[HWWriteResGroup13], (instregex "VPUNPCKLBWrm")>; -def: InstRW<[HWWriteResGroup13], (instregex "VPUNPCKLDQYrm")>; def: InstRW<[HWWriteResGroup13], (instregex "VPUNPCKLDQrm")>; -def: InstRW<[HWWriteResGroup13], (instregex "VPUNPCKLQDQYrm")>; def: InstRW<[HWWriteResGroup13], (instregex "VPUNPCKLQDQrm")>; -def: InstRW<[HWWriteResGroup13], (instregex "VPUNPCKLWDYrm")>; def: InstRW<[HWWriteResGroup13], (instregex "VPUNPCKLWDrm")>; -def: InstRW<[HWWriteResGroup13], (instregex "VSHUFPDYrmi")>; def: InstRW<[HWWriteResGroup13], (instregex "VSHUFPDrmi")>; -def: InstRW<[HWWriteResGroup13], (instregex "VSHUFPSYrmi")>; def: InstRW<[HWWriteResGroup13], (instregex "VSHUFPSrmi")>; -def: InstRW<[HWWriteResGroup13], (instregex "VUNPCKHPDYrm")>; def: InstRW<[HWWriteResGroup13], (instregex "VUNPCKHPDrm")>; -def: InstRW<[HWWriteResGroup13], (instregex "VUNPCKHPSYrm")>; def: InstRW<[HWWriteResGroup13], (instregex "VUNPCKHPSrm")>; -def: InstRW<[HWWriteResGroup13], (instregex "VUNPCKLPDYrm")>; def: InstRW<[HWWriteResGroup13], (instregex "VUNPCKLPDrm")>; -def: InstRW<[HWWriteResGroup13], (instregex "VUNPCKLPSYrm")>; def: InstRW<[HWWriteResGroup13], (instregex "VUNPCKLPSrm")>; -def: InstRW<[HWWriteResGroup13], (instregex "VXORPDYrm")>; def: InstRW<[HWWriteResGroup13], (instregex "VXORPDrm")>; -def: InstRW<[HWWriteResGroup13], (instregex "VXORPSYrm")>; def: InstRW<[HWWriteResGroup13], (instregex "VXORPSrm")>; def: InstRW<[HWWriteResGroup13], (instregex "XORPDrm")>; def: InstRW<[HWWriteResGroup13], (instregex "XORPSrm")>; +def HWWriteResGroup13_1 : SchedWriteRes<[HWPort5,HWPort23]> { + let Latency = 8; + let NumMicroOps = 2; + let ResourceCycles = [1,1]; +} +def: InstRW<[HWWriteResGroup13_1], (instregex "VANDNPDYrm")>; +def: InstRW<[HWWriteResGroup13_1], (instregex "VANDNPSYrm")>; +def: InstRW<[HWWriteResGroup13_1], (instregex "VANDPDYrm")>; +def: InstRW<[HWWriteResGroup13_1], (instregex "VANDPSYrm")>; +def: InstRW<[HWWriteResGroup13_1], (instregex "VORPDYrm")>; +def: InstRW<[HWWriteResGroup13_1], (instregex "VORPSYrm")>; +def: InstRW<[HWWriteResGroup13_1], (instregex "VPACKSSDWYrm")>; +def: InstRW<[HWWriteResGroup13_1], (instregex "VPACKSSWBYrm")>; +def: InstRW<[HWWriteResGroup13_1], (instregex "VPACKUSDWYrm")>; +def: InstRW<[HWWriteResGroup13_1], (instregex "VPACKUSWBYrm")>; +def: InstRW<[HWWriteResGroup13_1], (instregex "VPALIGNRYrmi")>; +def: InstRW<[HWWriteResGroup13_1], (instregex "VPBLENDWYrmi")>; +def: InstRW<[HWWriteResGroup13_1], (instregex "VPERMILPDYmi")>; +def: InstRW<[HWWriteResGroup13_1], (instregex "VPERMILPDYrm")>; +def: InstRW<[HWWriteResGroup13_1], (instregex "VPERMILPSYmi")>; +def: InstRW<[HWWriteResGroup13_1], (instregex "VPERMILPSYrm")>; +def: InstRW<[HWWriteResGroup13_1], (instregex "VPMOVSXBDYrm")>; +def: InstRW<[HWWriteResGroup13_1], (instregex "VPMOVSXBQYrm")>; +def: InstRW<[HWWriteResGroup13_1], (instregex "VPMOVSXWQYrm")>; +def: InstRW<[HWWriteResGroup13_1], (instregex "VPSHUFBYrm")>; +def: InstRW<[HWWriteResGroup13_1], (instregex "VPSHUFDYmi")>; +def: InstRW<[HWWriteResGroup13_1], (instregex "VPSHUFHWYmi")>; +def: InstRW<[HWWriteResGroup13_1], (instregex "VPSHUFLWYmi")>; +def: InstRW<[HWWriteResGroup13_1], (instregex "VPUNPCKHBWYrm")>; +def: InstRW<[HWWriteResGroup13_1], (instregex "VPUNPCKHDQYrm")>; +def: InstRW<[HWWriteResGroup13_1], (instregex "VPUNPCKHQDQYrm")>; +def: InstRW<[HWWriteResGroup13_1], (instregex "VPUNPCKHWDYrm")>; +def: InstRW<[HWWriteResGroup13_1], (instregex "VPUNPCKLBWYrm")>; +def: InstRW<[HWWriteResGroup13_1], (instregex "VPUNPCKLDQYrm")>; +def: InstRW<[HWWriteResGroup13_1], (instregex "VPUNPCKLQDQYrm")>; +def: InstRW<[HWWriteResGroup13_1], (instregex "VPUNPCKLWDYrm")>; +def: InstRW<[HWWriteResGroup13_1], (instregex "VSHUFPDYrmi")>; +def: InstRW<[HWWriteResGroup13_1], (instregex "VSHUFPSYrmi")>; +def: InstRW<[HWWriteResGroup13_1], (instregex "VUNPCKHPDYrm")>; +def: InstRW<[HWWriteResGroup13_1], (instregex "VUNPCKHPSYrm")>; +def: InstRW<[HWWriteResGroup13_1], (instregex "VUNPCKLPDYrm")>; +def: InstRW<[HWWriteResGroup13_1], (instregex "VUNPCKLPSYrm")>; +def: InstRW<[HWWriteResGroup13_1], (instregex "VXORPDYrm")>; +def: InstRW<[HWWriteResGroup13_1], (instregex "VXORPSYrm")>; + +def HWWriteResGroup13_2 : SchedWriteRes<[HWPort5,HWPort23]> { + let Latency = 6; + let NumMicroOps = 2; + let ResourceCycles = [1,1]; +} +def: InstRW<[HWWriteResGroup13_2], (instregex "MMX_PALIGNR64irm")>; +def: InstRW<[HWWriteResGroup13_2], (instregex "MMX_PINSRWirmi")>; +def: InstRW<[HWWriteResGroup13_2], (instregex "MMX_PSHUFBrm64")>; +def: InstRW<[HWWriteResGroup13_2], (instregex "MMX_PSHUFWmi")>; +def: InstRW<[HWWriteResGroup13_2], (instregex "MMX_PUNPCKHBWirm")>; +def: InstRW<[HWWriteResGroup13_2], (instregex "MMX_PUNPCKHDQirm")>; +def: InstRW<[HWWriteResGroup13_2], (instregex "MMX_PUNPCKHWDirm")>; +def: InstRW<[HWWriteResGroup13_2], (instregex "MMX_PUNPCKLBWirm")>; +def: InstRW<[HWWriteResGroup13_2], (instregex "MMX_PUNPCKLDQirm")>; +def: InstRW<[HWWriteResGroup13_2], (instregex "MMX_PUNPCKLWDirm")>; +def: InstRW<[HWWriteResGroup13_2], (instregex "MOVHPDrm")>; +def: InstRW<[HWWriteResGroup13_2], (instregex "MOVHPSrm")>; +def: InstRW<[HWWriteResGroup13_2], (instregex "MOVLPDrm")>; +def: InstRW<[HWWriteResGroup13_2], (instregex "MOVLPSrm")>; +def: InstRW<[HWWriteResGroup13_2], (instregex "PINSRBrm")>; +def: InstRW<[HWWriteResGroup13_2], (instregex "PINSRDrm")>; +def: InstRW<[HWWriteResGroup13_2], (instregex "PINSRQrm")>; +def: InstRW<[HWWriteResGroup13_2], (instregex "PINSRWrmi")>; +def: InstRW<[HWWriteResGroup13_2], (instregex "PMOVSXBDrm")>; +def: InstRW<[HWWriteResGroup13_2], (instregex "PMOVSXBQrm")>; +def: InstRW<[HWWriteResGroup13_2], (instregex "PMOVSXBWrm")>; +def: InstRW<[HWWriteResGroup13_2], (instregex "PMOVSXDQrm")>; +def: InstRW<[HWWriteResGroup13_2], (instregex "PMOVSXWDrm")>; +def: InstRW<[HWWriteResGroup13_2], (instregex "PMOVSXWQrm")>; +def: InstRW<[HWWriteResGroup13_2], (instregex "PMOVZXBDrm")>; +def: InstRW<[HWWriteResGroup13_2], (instregex "PMOVZXBQrm")>; +def: InstRW<[HWWriteResGroup13_2], (instregex "PMOVZXBWrm")>; +def: InstRW<[HWWriteResGroup13_2], (instregex "PMOVZXDQrm")>; +def: InstRW<[HWWriteResGroup13_2], (instregex "PMOVZXWDrm")>; +def: InstRW<[HWWriteResGroup13_2], (instregex "PMOVZXWQrm")>; +def: InstRW<[HWWriteResGroup13_2], (instregex "VMOVHPDrm")>; +def: InstRW<[HWWriteResGroup13_2], (instregex "VMOVHPSrm")>; +def: InstRW<[HWWriteResGroup13_2], (instregex "VMOVLPDrm")>; +def: InstRW<[HWWriteResGroup13_2], (instregex "VMOVLPSrm")>; +def: InstRW<[HWWriteResGroup13_2], (instregex "VPINSRBrm")>; +def: InstRW<[HWWriteResGroup13_2], (instregex "VPINSRDrm")>; +def: InstRW<[HWWriteResGroup13_2], (instregex "VPINSRQrm")>; +def: InstRW<[HWWriteResGroup13_2], (instregex "VPINSRWrmi")>; +def: InstRW<[HWWriteResGroup13_2], (instregex "VPMOVSXBDrm")>; +def: InstRW<[HWWriteResGroup13_2], (instregex "VPMOVSXBQrm")>; +def: InstRW<[HWWriteResGroup13_2], (instregex "VPMOVSXBWrm")>; +def: InstRW<[HWWriteResGroup13_2], (instregex "VPMOVSXDQrm")>; +def: InstRW<[HWWriteResGroup13_2], (instregex "VPMOVSXWDrm")>; +def: InstRW<[HWWriteResGroup13_2], (instregex "VPMOVSXWQrm")>; +def: InstRW<[HWWriteResGroup13_2], (instregex "VPMOVZXBDrm")>; +def: InstRW<[HWWriteResGroup13_2], (instregex "VPMOVZXBQrm")>; +def: InstRW<[HWWriteResGroup13_2], (instregex "VPMOVZXBWrm")>; +def: InstRW<[HWWriteResGroup13_2], (instregex "VPMOVZXDQrm")>; +def: InstRW<[HWWriteResGroup13_2], (instregex "VPMOVZXWDrm")>; +def: InstRW<[HWWriteResGroup13_2], (instregex "VPMOVZXWQrm")>; + def HWWriteResGroup14 : SchedWriteRes<[HWPort6,HWPort23]> { - let Latency = 1; + let Latency = 6; let NumMicroOps = 2; let ResourceCycles = [1,1]; } @@ -1854,7 +1817,7 @@ def: InstRW<[HWWriteResGroup14], (instregex "JMP(16|32|64)m")>; def HWWriteResGroup15 : SchedWriteRes<[HWPort23,HWPort06]> { - let Latency = 1; + let Latency = 6; let NumMicroOps = 2; let ResourceCycles = [1,1]; } @@ -1869,7 +1832,7 @@ def: InstRW<[HWWriteResGroup15], (instregex "SHRX64rm")>; def HWWriteResGroup16 : SchedWriteRes<[HWPort23,HWPort15]> { - let Latency = 1; + let Latency = 6; let NumMicroOps = 2; let ResourceCycles = [1,1]; } @@ -1918,170 +1881,194 @@ def: InstRW<[HWWriteResGroup16], (instregex "MMX_PSUBUSWirm")>; def: InstRW<[HWWriteResGroup16], (instregex "MMX_PSUBWirm")>; def: InstRW<[HWWriteResGroup16], (instregex "MOVBE(16|32|64)rm")>; -def: InstRW<[HWWriteResGroup16], (instregex "PABSBrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "PABSDrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "PABSWrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "PADDBrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "PADDDrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "PADDQrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "PADDSBrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "PADDSWrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "PADDUSBrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "PADDUSWrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "PADDWrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "PAVGBrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "PAVGWrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "PCMPEQBrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "PCMPEQDrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "PCMPEQQrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "PCMPEQWrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "PCMPGTBrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "PCMPGTDrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "PCMPGTWrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "PMAXSBrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "PMAXSDrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "PMAXSWrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "PMAXUBrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "PMAXUDrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "PMAXUWrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "PMINSBrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "PMINSDrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "PMINSWrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "PMINUBrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "PMINUDrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "PMINUWrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "PSIGNBrm128")>; -def: InstRW<[HWWriteResGroup16], (instregex "PSIGNDrm128")>; -def: InstRW<[HWWriteResGroup16], (instregex "PSIGNWrm128")>; -def: InstRW<[HWWriteResGroup16], (instregex "PSUBBrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "PSUBDrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "PSUBQrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "PSUBSBrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "PSUBSWrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "PSUBUSBrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "PSUBUSWrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "PSUBWrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPABSBYrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPABSBrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPABSDYrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPABSDrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPABSWYrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPABSWrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPADDBYrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPADDBrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPADDDYrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPADDDrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPADDQYrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPADDQrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPADDSBYrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPADDSBrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPADDSWYrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPADDSWrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPADDUSBYrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPADDUSBrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPADDUSWYrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPADDUSWrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPADDWYrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPADDWrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPAVGBYrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPAVGBrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPAVGWYrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPAVGWrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPCMPEQBYrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPCMPEQBrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPCMPEQDYrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPCMPEQDrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPCMPEQQYrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPCMPEQQrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPCMPEQWYrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPCMPEQWrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPCMPGTBYrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPCMPGTBrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPCMPGTDYrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPCMPGTDrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPCMPGTWYrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPCMPGTWrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPMAXSBYrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPMAXSBrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPMAXSDYrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPMAXSDrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPMAXSWYrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPMAXSWrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPMAXUBYrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPMAXUBrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPMAXUDYrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPMAXUDrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPMAXUWYrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPMAXUWrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPMINSBYrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPMINSBrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPMINSDYrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPMINSDrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPMINSWYrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPMINSWrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPMINUBYrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPMINUBrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPMINUDYrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPMINUDrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPMINUWYrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPMINUWrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPSIGNBYrm256")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPSIGNBrm128")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPSIGNDYrm256")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPSIGNDrm128")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPSIGNWYrm256")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPSIGNWrm128")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPSUBBYrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPSUBBrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPSUBDYrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPSUBDrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPSUBQYrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPSUBQrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPSUBSBYrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPSUBSBrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPSUBSWYrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPSUBSWrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPSUBUSBYrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPSUBUSBrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPSUBUSWYrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPSUBUSWrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPSUBWYrm")>; -def: InstRW<[HWWriteResGroup16], (instregex "VPSUBWrm")>; + +def HWWriteResGroup16_1 : SchedWriteRes<[HWPort23,HWPort15]> { + let Latency = 7; + let NumMicroOps = 2; + let ResourceCycles = [1,1]; +} +def: InstRW<[HWWriteResGroup16_1], (instregex "PABSBrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "PABSDrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "PABSWrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "PADDBrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "PADDDrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "PADDQrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "PADDSBrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "PADDSWrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "PADDUSBrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "PADDUSWrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "PADDWrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "PAVGBrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "PAVGWrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "PCMPEQBrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "PCMPEQDrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "PCMPEQQrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "PCMPEQWrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "PCMPGTBrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "PCMPGTDrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "PCMPGTWrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "PMAXSBrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "PMAXSDrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "PMAXSWrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "PMAXUBrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "PMAXUDrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "PMAXUWrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "PMINSBrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "PMINSDrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "PMINSWrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "PMINUBrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "PMINUDrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "PMINUWrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "PSIGNBrm128")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "PSIGNDrm128")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "PSIGNWrm128")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "PSUBBrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "PSUBDrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "PSUBQrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "PSUBSBrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "PSUBSWrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "PSUBUSBrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "PSUBUSWrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "PSUBWrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "VPABSBrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "VPABSDrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "VPABSWrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "VPADDBrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "VPADDDrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "VPADDQrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "VPADDSBrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "VPADDSWrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "VPADDUSBrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "VPADDUSWrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "VPADDWrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "VPAVGBrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "VPAVGWrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "VPCMPEQBrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "VPCMPEQDrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "VPCMPEQQrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "VPCMPEQWrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "VPCMPGTBrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "VPCMPGTDrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "VPCMPGTWrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "VPMAXSBrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "VPMAXSDrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "VPMAXSWrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "VPMAXUBrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "VPMAXUDrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "VPMAXUWrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "VPMINSBrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "VPMINSDrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "VPMINSWrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "VPMINUBrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "VPMINUDrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "VPMINUWrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "VPSIGNBrm128")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "VPSIGNDrm128")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "VPSIGNWrm128")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "VPSUBBrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "VPSUBDrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "VPSUBQrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "VPSUBSBrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "VPSUBSWrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "VPSUBUSBrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "VPSUBUSWrm")>; +def: InstRW<[HWWriteResGroup16_1], (instregex "VPSUBWrm")>; + +def HWWriteResGroup16_2 : SchedWriteRes<[HWPort23,HWPort15]> { + let Latency = 8; + let NumMicroOps = 2; + let ResourceCycles = [1,1]; +} +def: InstRW<[HWWriteResGroup16_2], (instregex "VPABSBYrm")>; +def: InstRW<[HWWriteResGroup16_2], (instregex "VPABSDYrm")>; +def: InstRW<[HWWriteResGroup16_2], (instregex "VPABSWYrm")>; +def: InstRW<[HWWriteResGroup16_2], (instregex "VPADDBYrm")>; +def: InstRW<[HWWriteResGroup16_2], (instregex "VPADDDYrm")>; +def: InstRW<[HWWriteResGroup16_2], (instregex "VPADDQYrm")>; +def: InstRW<[HWWriteResGroup16_2], (instregex "VPADDSBYrm")>; +def: InstRW<[HWWriteResGroup16_2], (instregex "VPADDSWYrm")>; +def: InstRW<[HWWriteResGroup16_2], (instregex "VPADDUSBYrm")>; +def: InstRW<[HWWriteResGroup16_2], (instregex "VPADDUSWYrm")>; +def: InstRW<[HWWriteResGroup16_2], (instregex "VPADDWYrm")>; +def: InstRW<[HWWriteResGroup16_2], (instregex "VPAVGBYrm")>; +def: InstRW<[HWWriteResGroup16_2], (instregex "VPAVGWYrm")>; +def: InstRW<[HWWriteResGroup16_2], (instregex "VPCMPEQBYrm")>; +def: InstRW<[HWWriteResGroup16_2], (instregex "VPCMPEQDYrm")>; +def: InstRW<[HWWriteResGroup16_2], (instregex "VPCMPEQQYrm")>; +def: InstRW<[HWWriteResGroup16_2], (instregex "VPCMPEQWYrm")>; +def: InstRW<[HWWriteResGroup16_2], (instregex "VPCMPGTBYrm")>; +def: InstRW<[HWWriteResGroup16_2], (instregex "VPCMPGTDYrm")>; +def: InstRW<[HWWriteResGroup16_2], (instregex "VPCMPGTWYrm")>; +def: InstRW<[HWWriteResGroup16_2], (instregex "VPMAXSBYrm")>; +def: InstRW<[HWWriteResGroup16_2], (instregex "VPMAXSDYrm")>; +def: InstRW<[HWWriteResGroup16_2], (instregex "VPMAXSWYrm")>; +def: InstRW<[HWWriteResGroup16_2], (instregex "VPMAXUBYrm")>; +def: InstRW<[HWWriteResGroup16_2], (instregex "VPMAXUDYrm")>; +def: InstRW<[HWWriteResGroup16_2], (instregex "VPMAXUWYrm")>; +def: InstRW<[HWWriteResGroup16_2], (instregex "VPMINSBYrm")>; +def: InstRW<[HWWriteResGroup16_2], (instregex "VPMINSDYrm")>; +def: InstRW<[HWWriteResGroup16_2], (instregex "VPMINSWYrm")>; +def: InstRW<[HWWriteResGroup16_2], (instregex "VPMINUBYrm")>; +def: InstRW<[HWWriteResGroup16_2], (instregex "VPMINUDYrm")>; +def: InstRW<[HWWriteResGroup16_2], (instregex "VPMINUWYrm")>; +def: InstRW<[HWWriteResGroup16_2], (instregex "VPSIGNBYrm256")>; +def: InstRW<[HWWriteResGroup16_2], (instregex "VPSIGNDYrm256")>; +def: InstRW<[HWWriteResGroup16_2], (instregex "VPSIGNWYrm256")>; +def: InstRW<[HWWriteResGroup16_2], (instregex "VPSUBBYrm")>; +def: InstRW<[HWWriteResGroup16_2], (instregex "VPSUBDYrm")>; +def: InstRW<[HWWriteResGroup16_2], (instregex "VPSUBQYrm")>; +def: InstRW<[HWWriteResGroup16_2], (instregex "VPSUBSBYrm")>; +def: InstRW<[HWWriteResGroup16_2], (instregex "VPSUBSWYrm")>; +def: InstRW<[HWWriteResGroup16_2], (instregex "VPSUBUSBYrm")>; +def: InstRW<[HWWriteResGroup16_2], (instregex "VPSUBUSWYrm")>; +def: InstRW<[HWWriteResGroup16_2], (instregex "VPSUBWYrm")>; def HWWriteResGroup17 : SchedWriteRes<[HWPort23,HWPort015]> { - let Latency = 1; + let Latency = 7; let NumMicroOps = 2; let ResourceCycles = [1,1]; } def: InstRW<[HWWriteResGroup17], (instregex "BLENDPDrmi")>; def: InstRW<[HWWriteResGroup17], (instregex "BLENDPSrmi")>; -def: InstRW<[HWWriteResGroup17], (instregex "MMX_PANDNirm")>; -def: InstRW<[HWWriteResGroup17], (instregex "MMX_PANDirm")>; -def: InstRW<[HWWriteResGroup17], (instregex "MMX_PORirm")>; -def: InstRW<[HWWriteResGroup17], (instregex "MMX_PXORirm")>; def: InstRW<[HWWriteResGroup17], (instregex "PANDNrm")>; def: InstRW<[HWWriteResGroup17], (instregex "PANDrm")>; def: InstRW<[HWWriteResGroup17], (instregex "PORrm")>; def: InstRW<[HWWriteResGroup17], (instregex "PXORrm")>; -def: InstRW<[HWWriteResGroup17], (instregex "VBLENDPDYrmi")>; def: InstRW<[HWWriteResGroup17], (instregex "VBLENDPDrmi")>; -def: InstRW<[HWWriteResGroup17], (instregex "VBLENDPSYrmi")>; def: InstRW<[HWWriteResGroup17], (instregex "VBLENDPSrmi")>; def: InstRW<[HWWriteResGroup17], (instregex "VINSERTF128rm")>; def: InstRW<[HWWriteResGroup17], (instregex "VINSERTI128rm")>; -def: InstRW<[HWWriteResGroup17], (instregex "VPANDNYrm")>; def: InstRW<[HWWriteResGroup17], (instregex "VPANDNrm")>; -def: InstRW<[HWWriteResGroup17], (instregex "VPANDYrm")>; def: InstRW<[HWWriteResGroup17], (instregex "VPANDrm")>; -def: InstRW<[HWWriteResGroup17], (instregex "VPBLENDDYrmi")>; def: InstRW<[HWWriteResGroup17], (instregex "VPBLENDDrmi")>; -def: InstRW<[HWWriteResGroup17], (instregex "VPORYrm")>; def: InstRW<[HWWriteResGroup17], (instregex "VPORrm")>; -def: InstRW<[HWWriteResGroup17], (instregex "VPXORYrm")>; def: InstRW<[HWWriteResGroup17], (instregex "VPXORrm")>; +def HWWriteResGroup17_1 : SchedWriteRes<[HWPort23,HWPort015]> { + let Latency = 6; + let NumMicroOps = 2; + let ResourceCycles = [1,1]; +} +def: InstRW<[HWWriteResGroup17_1], (instregex "MMX_PANDNirm")>; +def: InstRW<[HWWriteResGroup17_1], (instregex "MMX_PANDirm")>; +def: InstRW<[HWWriteResGroup17_1], (instregex "MMX_PORirm")>; +def: InstRW<[HWWriteResGroup17_1], (instregex "MMX_PXORirm")>; + +def HWWriteResGroup17_2 : SchedWriteRes<[HWPort23,HWPort015]> { + let Latency = 8; + let NumMicroOps = 2; + let ResourceCycles = [1,1]; +} +def: InstRW<[HWWriteResGroup17_2], (instregex "VBLENDPDYrmi")>; +def: InstRW<[HWWriteResGroup17_2], (instregex "VBLENDPSYrmi")>; +def: InstRW<[HWWriteResGroup17_2], (instregex "VPANDNYrm")>; +def: InstRW<[HWWriteResGroup17_2], (instregex "VPANDYrm")>; +def: InstRW<[HWWriteResGroup17_2], (instregex "VPBLENDDYrmi")>; +def: InstRW<[HWWriteResGroup17_2], (instregex "VPORYrm")>; +def: InstRW<[HWWriteResGroup17_2], (instregex "VPXORYrm")>; + def HWWriteResGroup18 : SchedWriteRes<[HWPort23,HWPort0156]> { - let Latency = 1; + let Latency = 6; let NumMicroOps = 2; let ResourceCycles = [1,1]; } @@ -2107,14 +2094,14 @@ def: InstRW<[HWWriteResGroup18], (instregex "XOR8rm")>; def HWWriteResGroup19 : SchedWriteRes<[HWPort237,HWPort0156]> { - let Latency = 1; + let Latency = 2; let NumMicroOps = 2; let ResourceCycles = [1,1]; } def: InstRW<[HWWriteResGroup19], (instregex "SFENCE")>; def HWWriteResGroup20 : SchedWriteRes<[HWPort4,HWPort5,HWPort237]> { - let Latency = 1; + let Latency = 2; let NumMicroOps = 3; let ResourceCycles = [1,1,1]; } @@ -2132,14 +2119,14 @@ def: InstRW<[HWWriteResGroup20], (instregex "VSTMXCSR")>; def HWWriteResGroup21 : SchedWriteRes<[HWPort4,HWPort6,HWPort237]> { - let Latency = 1; + let Latency = 2; let NumMicroOps = 3; let ResourceCycles = [1,1,1]; } def: InstRW<[HWWriteResGroup21], (instregex "FNSTCW16m")>; def HWWriteResGroup22 : SchedWriteRes<[HWPort4,HWPort237,HWPort06]> { - let Latency = 1; + let Latency = 2; let NumMicroOps = 3; let ResourceCycles = [1,1,1]; } @@ -2159,21 +2146,21 @@ def: InstRW<[HWWriteResGroup22], (instregex "SETSm")>; def HWWriteResGroup23 : SchedWriteRes<[HWPort4,HWPort237,HWPort15]> { - let Latency = 1; + let Latency = 2; let NumMicroOps = 3; let ResourceCycles = [1,1,1]; } def: InstRW<[HWWriteResGroup23], (instregex "MOVBE(32|64)mr")>; def HWWriteResGroup23_16 : SchedWriteRes<[HWPort06, HWPort237, HWPort4]> { - let Latency = 1; + let Latency = 2; let NumMicroOps = 3; let ResourceCycles = [1,1,1]; } def: InstRW<[HWWriteResGroup23_16], (instregex "MOVBE16mr")>; def HWWriteResGroup24 : SchedWriteRes<[HWPort4,HWPort237,HWPort0156]> { - let Latency = 1; + let Latency = 2; let NumMicroOps = 3; let ResourceCycles = [1,1,1]; } @@ -2185,7 +2172,7 @@ def: InstRW<[HWWriteResGroup24], (instregex "STOSW")>; def HWWriteResGroup25 : SchedWriteRes<[HWPort4,HWPort23,HWPort237,HWPort06]> { - let Latency = 1; + let Latency = 7; let NumMicroOps = 4; let ResourceCycles = [1,1,1,1]; } @@ -2206,7 +2193,7 @@ def: InstRW<[HWWriteResGroup25], (instregex "SHR8mi")>; def HWWriteResGroup26 : SchedWriteRes<[HWPort4,HWPort23,HWPort237,HWPort0156]> { - let Latency = 1; + let Latency = 7; let NumMicroOps = 4; let ResourceCycles = [1,1,1,1]; } @@ -2230,6 +2217,8 @@ def: InstRW<[HWWriteResGroup26], (instregex "OR(16|32|64)mr")>; def: InstRW<[HWWriteResGroup26], (instregex "OR8mi")>; def: InstRW<[HWWriteResGroup26], (instregex "OR8mr")>; +def: InstRW<[HWWriteResGroup26], (instregex "POP(16|32|64)rmm")>; +def: InstRW<[HWWriteResGroup26], (instregex "PUSH(16|32|64)rmm")>; def: InstRW<[HWWriteResGroup26], (instregex "SUB(16|32|64)mi8")>; def: InstRW<[HWWriteResGroup26], (instregex "SUB(16|32|64)mr")>; def: InstRW<[HWWriteResGroup26], (instregex "SUB8mi")>; @@ -2395,33 +2384,45 @@ def: InstRW<[HWWriteResGroup35], (instregex "SETBEr")>; def HWWriteResGroup36 : SchedWriteRes<[HWPort5,HWPort23]> { - let Latency = 2; + let Latency = 8; let NumMicroOps = 3; let ResourceCycles = [2,1]; } def: InstRW<[HWWriteResGroup36], (instregex "BLENDVPDrm0")>; def: InstRW<[HWWriteResGroup36], (instregex "BLENDVPSrm0")>; -def: InstRW<[HWWriteResGroup36], (instregex "MMX_PACKSSDWirm")>; -def: InstRW<[HWWriteResGroup36], (instregex "MMX_PACKSSWBirm")>; -def: InstRW<[HWWriteResGroup36], (instregex "MMX_PACKUSWBirm")>; def: InstRW<[HWWriteResGroup36], (instregex "PBLENDVBrm0")>; -def: InstRW<[HWWriteResGroup36], (instregex "VBLENDVPDYrm")>; def: InstRW<[HWWriteResGroup36], (instregex "VBLENDVPDrm")>; -def: InstRW<[HWWriteResGroup36], (instregex "VBLENDVPSYrm")>; def: InstRW<[HWWriteResGroup36], (instregex "VBLENDVPSrm")>; -def: InstRW<[HWWriteResGroup36], (instregex "VMASKMOVPDYrm")>; def: InstRW<[HWWriteResGroup36], (instregex "VMASKMOVPDrm")>; -def: InstRW<[HWWriteResGroup36], (instregex "VMASKMOVPSYrm")>; def: InstRW<[HWWriteResGroup36], (instregex "VMASKMOVPSrm")>; -def: InstRW<[HWWriteResGroup36], (instregex "VPBLENDVBYrm")>; def: InstRW<[HWWriteResGroup36], (instregex "VPBLENDVBrm")>; -def: InstRW<[HWWriteResGroup36], (instregex "VPMASKMOVDYrm")>; def: InstRW<[HWWriteResGroup36], (instregex "VPMASKMOVDrm")>; -def: InstRW<[HWWriteResGroup36], (instregex "VPMASKMOVQYrm")>; def: InstRW<[HWWriteResGroup36], (instregex "VPMASKMOVQrm")>; +def HWWriteResGroup36_1 : SchedWriteRes<[HWPort5,HWPort23]> { + let Latency = 9; + let NumMicroOps = 3; + let ResourceCycles = [2,1]; +} +def: InstRW<[HWWriteResGroup36_1], (instregex "VBLENDVPDYrm")>; +def: InstRW<[HWWriteResGroup36_1], (instregex "VBLENDVPSYrm")>; +def: InstRW<[HWWriteResGroup36_1], (instregex "VMASKMOVPDYrm")>; +def: InstRW<[HWWriteResGroup36_1], (instregex "VMASKMOVPSYrm")>; +def: InstRW<[HWWriteResGroup36_1], (instregex "VPBLENDVBYrm")>; +def: InstRW<[HWWriteResGroup36_1], (instregex "VPMASKMOVDYrm")>; +def: InstRW<[HWWriteResGroup36_1], (instregex "VPMASKMOVQYrm")>; + +def HWWriteResGroup36_2 : SchedWriteRes<[HWPort5,HWPort23]> { + let Latency = 7; + let NumMicroOps = 3; + let ResourceCycles = [2,1]; +} +def: InstRW<[HWWriteResGroup36_2], (instregex "MMX_PACKSSDWirm")>; +def: InstRW<[HWWriteResGroup36_2], (instregex "MMX_PACKSSWBirm")>; +def: InstRW<[HWWriteResGroup36_2], (instregex "MMX_PACKUSWBirm")>; + def HWWriteResGroup37 : SchedWriteRes<[HWPort23,HWPort0156]> { - let Latency = 2; + let Latency = 7; let NumMicroOps = 3; let ResourceCycles = [1,2]; } @@ -2432,7 +2433,7 @@ def: InstRW<[HWWriteResGroup37], (instregex "SCASW")>; def HWWriteResGroup38 : SchedWriteRes<[HWPort0,HWPort5,HWPort23]> { - let Latency = 2; + let Latency = 8; let NumMicroOps = 3; let ResourceCycles = [1,1,1]; } @@ -2456,14 +2457,14 @@ def: InstRW<[HWWriteResGroup38], (instregex "VPTESTrm")>; def HWWriteResGroup39 : SchedWriteRes<[HWPort0,HWPort01,HWPort23]> { - let Latency = 2; + let Latency = 7; let NumMicroOps = 3; let ResourceCycles = [1,1,1]; } def: InstRW<[HWWriteResGroup39], (instregex "FLDCW16m")>; def HWWriteResGroup40 : SchedWriteRes<[HWPort0,HWPort23,HWPort0156]> { - let Latency = 2; + let Latency = 7; let NumMicroOps = 3; let ResourceCycles = [1,1,1]; } @@ -2471,15 +2472,16 @@ def: InstRW<[HWWriteResGroup40], (instregex "VLDMXCSR")>; def HWWriteResGroup41 : SchedWriteRes<[HWPort6,HWPort23,HWPort0156]> { - let Latency = 2; + let Latency = 7; let NumMicroOps = 3; let ResourceCycles = [1,1,1]; } def: InstRW<[HWWriteResGroup41], (instregex "LRETQ")>; +def: InstRW<[HWWriteResGroup41], (instregex "RETL")>; def: InstRW<[HWWriteResGroup41], (instregex "RETQ")>; def HWWriteResGroup42 : SchedWriteRes<[HWPort23,HWPort06,HWPort15]> { - let Latency = 2; + let Latency = 7; let NumMicroOps = 3; let ResourceCycles = [1,1,1]; } @@ -2487,7 +2489,7 @@ def: InstRW<[HWWriteResGroup42], (instregex "BEXTR64rm")>; def HWWriteResGroup43 : SchedWriteRes<[HWPort23,HWPort06,HWPort0156]> { - let Latency = 2; + let Latency = 7; let NumMicroOps = 3; let ResourceCycles = [1,1,1]; } @@ -2511,14 +2513,14 @@ def: InstRW<[HWWriteResGroup43], (instregex "SBB8rm")>; def HWWriteResGroup44 : SchedWriteRes<[HWPort4,HWPort6,HWPort237,HWPort0156]> { - let Latency = 2; + let Latency = 3; let NumMicroOps = 4; let ResourceCycles = [1,1,1,1]; } def: InstRW<[HWWriteResGroup44], (instregex "CALL(16|32|64)r")>; def HWWriteResGroup45 : SchedWriteRes<[HWPort4,HWPort237,HWPort06,HWPort0156]> { - let Latency = 2; + let Latency = 3; let NumMicroOps = 4; let ResourceCycles = [1,1,1,1]; } @@ -2527,7 +2529,7 @@ def: InstRW<[HWWriteResGroup45], (instregex "SETBEm")>; def HWWriteResGroup46 : SchedWriteRes<[HWPort4,HWPort23,HWPort237,HWPort06]> { - let Latency = 2; + let Latency = 8; let NumMicroOps = 5; let ResourceCycles = [1,1,1,2]; } @@ -2541,7 +2543,7 @@ def: InstRW<[HWWriteResGroup46], (instregex "ROR8mi")>; def HWWriteResGroup47 : SchedWriteRes<[HWPort4,HWPort23,HWPort237,HWPort0156]> { - let Latency = 2; + let Latency = 8; let NumMicroOps = 5; let ResourceCycles = [1,1,1,2]; } @@ -2549,7 +2551,7 @@ def: InstRW<[HWWriteResGroup47], (instregex "XADD8rm")>; def HWWriteResGroup48 : SchedWriteRes<[HWPort4,HWPort6,HWPort23,HWPort237,HWPort0156]> { - let Latency = 2; + let Latency = 8; let NumMicroOps = 5; let ResourceCycles = [1,1,1,1,1]; } @@ -2722,127 +2724,73 @@ def: InstRW<[HWWriteResGroup51], (instregex "VPMOVZXWQYrr")>; def HWWriteResGroup52 : SchedWriteRes<[HWPort1,HWPort23]> { - let Latency = 3; + let Latency = 9; let NumMicroOps = 2; let ResourceCycles = [1,1]; } def: InstRW<[HWWriteResGroup52], (instregex "ADDPDrm")>; def: InstRW<[HWWriteResGroup52], (instregex "ADDPSrm")>; -def: InstRW<[HWWriteResGroup52], (instregex "ADDSDrm")>; -def: InstRW<[HWWriteResGroup52], (instregex "ADDSSrm")>; def: InstRW<[HWWriteResGroup52], (instregex "ADDSUBPDrm")>; def: InstRW<[HWWriteResGroup52], (instregex "ADDSUBPSrm")>; -def: InstRW<[HWWriteResGroup52], (instregex "ADD_F32m")>; -def: InstRW<[HWWriteResGroup52], (instregex "ADD_F64m")>; -def: InstRW<[HWWriteResGroup52], (instregex "BSF(16|32|64)rm")>; -def: InstRW<[HWWriteResGroup52], (instregex "BSR(16|32|64)rm")>; def: InstRW<[HWWriteResGroup52], (instregex "CMPPDrmi")>; def: InstRW<[HWWriteResGroup52], (instregex "CMPPSrmi")>; -def: InstRW<[HWWriteResGroup52], (instregex "CMPSSrm")>; -def: InstRW<[HWWriteResGroup52], (instregex "COMISDrm")>; -def: InstRW<[HWWriteResGroup52], (instregex "COMISSrm")>; def: InstRW<[HWWriteResGroup52], (instregex "CVTDQ2PSrm")>; def: InstRW<[HWWriteResGroup52], (instregex "CVTPS2DQrm")>; def: InstRW<[HWWriteResGroup52], (instregex "CVTTPS2DQrm")>; -def: InstRW<[HWWriteResGroup52], (instregex "ILD_F16m")>; -def: InstRW<[HWWriteResGroup52], (instregex "ILD_F32m")>; -def: InstRW<[HWWriteResGroup52], (instregex "ILD_F64m")>; -def: InstRW<[HWWriteResGroup52], (instregex "IMUL64m")>; -def: InstRW<[HWWriteResGroup52], (instregex "IMUL64rm(i8?)")>; -def: InstRW<[HWWriteResGroup52], (instregex "IMUL8m")>; -def: InstRW<[HWWriteResGroup52], (instregex "LZCNT(16|32|64)rm")>; def: InstRW<[HWWriteResGroup52], (instregex "MAXPDrm")>; def: InstRW<[HWWriteResGroup52], (instregex "MAXPSrm")>; -def: InstRW<[HWWriteResGroup52], (instregex "MAXSDrm")>; -def: InstRW<[HWWriteResGroup52], (instregex "MAXSSrm")>; def: InstRW<[HWWriteResGroup52], (instregex "MINPDrm")>; def: InstRW<[HWWriteResGroup52], (instregex "MINPSrm")>; -def: InstRW<[HWWriteResGroup52], (instregex "MINSDrm")>; -def: InstRW<[HWWriteResGroup52], (instregex "MINSSrm")>; -def: InstRW<[HWWriteResGroup52], (instregex "MMX_CVTPI2PSirm")>; -def: InstRW<[HWWriteResGroup52], (instregex "MMX_CVTPS2PIirm")>; -def: InstRW<[HWWriteResGroup52], (instregex "MMX_CVTTPS2PIirm")>; -def: InstRW<[HWWriteResGroup52], (instregex "MUL64m")>; -def: InstRW<[HWWriteResGroup52], (instregex "MUL8m")>; -def: InstRW<[HWWriteResGroup52], (instregex "PDEP32rm")>; -def: InstRW<[HWWriteResGroup52], (instregex "PDEP64rm")>; -def: InstRW<[HWWriteResGroup52], (instregex "PEXT32rm")>; -def: InstRW<[HWWriteResGroup52], (instregex "PEXT64rm")>; -def: InstRW<[HWWriteResGroup52], (instregex "POPCNT(16|32|64)rm")>; def: InstRW<[HWWriteResGroup52], (instregex "SUBPDrm")>; def: InstRW<[HWWriteResGroup52], (instregex "SUBPSrm")>; -def: InstRW<[HWWriteResGroup52], (instregex "SUBR_F32m")>; -def: InstRW<[HWWriteResGroup52], (instregex "SUBR_F64m")>; -def: InstRW<[HWWriteResGroup52], (instregex "SUBSDrm")>; -def: InstRW<[HWWriteResGroup52], (instregex "SUBSSrm")>; -def: InstRW<[HWWriteResGroup52], (instregex "SUB_F32m")>; -def: InstRW<[HWWriteResGroup52], (instregex "SUB_F64m")>; -def: InstRW<[HWWriteResGroup52], (instregex "TZCNT(16|32|64)rm")>; -def: InstRW<[HWWriteResGroup52], (instregex "UCOMISDrm")>; -def: InstRW<[HWWriteResGroup52], (instregex "UCOMISSrm")>; -def: InstRW<[HWWriteResGroup52], (instregex "VADDPDYrm")>; def: InstRW<[HWWriteResGroup52], (instregex "VADDPDrm")>; -def: InstRW<[HWWriteResGroup52], (instregex "VADDPSYrm")>; def: InstRW<[HWWriteResGroup52], (instregex "VADDPSrm")>; -def: InstRW<[HWWriteResGroup52], (instregex "VADDSDrm")>; -def: InstRW<[HWWriteResGroup52], (instregex "VADDSSrm")>; -def: InstRW<[HWWriteResGroup52], (instregex "VADDSUBPDYrm")>; def: InstRW<[HWWriteResGroup52], (instregex "VADDSUBPDrm")>; -def: InstRW<[HWWriteResGroup52], (instregex "VADDSUBPSYrm")>; def: InstRW<[HWWriteResGroup52], (instregex "VADDSUBPSrm")>; -def: InstRW<[HWWriteResGroup52], (instregex "VCMPPDYrmi")>; def: InstRW<[HWWriteResGroup52], (instregex "VCMPPDrmi")>; -def: InstRW<[HWWriteResGroup52], (instregex "VCMPPSYrmi")>; def: InstRW<[HWWriteResGroup52], (instregex "VCMPPSrmi")>; -def: InstRW<[HWWriteResGroup52], (instregex "VCMPSDrm")>; -def: InstRW<[HWWriteResGroup52], (instregex "VCMPSSrm")>; -def: InstRW<[HWWriteResGroup52], (instregex "VCOMISDrm")>; -def: InstRW<[HWWriteResGroup52], (instregex "VCOMISSrm")>; -def: InstRW<[HWWriteResGroup52], (instregex "VCVTDQ2PSYrm")>; def: InstRW<[HWWriteResGroup52], (instregex "VCVTDQ2PSrm")>; -def: InstRW<[HWWriteResGroup52], (instregex "VCVTPS2DQYrm")>; def: InstRW<[HWWriteResGroup52], (instregex "VCVTPS2DQrm")>; -def: InstRW<[HWWriteResGroup52], (instregex "VCVTTPS2DQYrm")>; def: InstRW<[HWWriteResGroup52], (instregex "VCVTTPS2DQrm")>; -def: InstRW<[HWWriteResGroup52], (instregex "VMAXPDYrm")>; def: InstRW<[HWWriteResGroup52], (instregex "VMAXPDrm")>; -def: InstRW<[HWWriteResGroup52], (instregex "VMAXPSYrm")>; def: InstRW<[HWWriteResGroup52], (instregex "VMAXPSrm")>; -def: InstRW<[HWWriteResGroup52], (instregex "VMAXSDrm")>; -def: InstRW<[HWWriteResGroup52], (instregex "VMAXSSrm")>; -def: InstRW<[HWWriteResGroup52], (instregex "VMINPDYrm")>; def: InstRW<[HWWriteResGroup52], (instregex "VMINPDrm")>; -def: InstRW<[HWWriteResGroup52], (instregex "VMINPSYrm")>; def: InstRW<[HWWriteResGroup52], (instregex "VMINPSrm")>; -def: InstRW<[HWWriteResGroup52], (instregex "VMINSDrm")>; -def: InstRW<[HWWriteResGroup52], (instregex "VMINSSrm")>; -def: InstRW<[HWWriteResGroup52], (instregex "VSUBPDYrm")>; def: InstRW<[HWWriteResGroup52], (instregex "VSUBPDrm")>; -def: InstRW<[HWWriteResGroup52], (instregex "VSUBPSYrm")>; def: InstRW<[HWWriteResGroup52], (instregex "VSUBPSrm")>; -def: InstRW<[HWWriteResGroup52], (instregex "VSUBSDrm")>; -def: InstRW<[HWWriteResGroup52], (instregex "VSUBSSrm")>; -def: InstRW<[HWWriteResGroup52], (instregex "VUCOMISDrm")>; -def: InstRW<[HWWriteResGroup52], (instregex "VUCOMISSrm")>; -def HWWriteResGroup52_16 : SchedWriteRes<[HWPort1, HWPort0156, HWPort23]> { - let Latency = 3; - let NumMicroOps = 4; -} -def: InstRW<[HWWriteResGroup52_16], (instregex "IMUL16m")>; -def: InstRW<[HWWriteResGroup52_16], (instregex "IMUL16rm(i8?)")>; -def: InstRW<[HWWriteResGroup52_16], (instregex "MUL16m")>; - -def HWWriteResGroup52_32 : SchedWriteRes<[HWPort1, HWPort0156, HWPort23]> { - let Latency = 3; - let NumMicroOps = 3; +def HWWriteResGroup52_1 : SchedWriteRes<[HWPort1,HWPort23]> { + let Latency = 10; + let NumMicroOps = 2; + let ResourceCycles = [1,1]; } -def: InstRW<[HWWriteResGroup52_32], (instregex "IMUL32m")>; -def: InstRW<[HWWriteResGroup52_32], (instregex "IMUL32rm(i8?)")>; -def: InstRW<[HWWriteResGroup52_32], (instregex "MUL32m")>; +def: InstRW<[HWWriteResGroup52_1], (instregex "ADD_F32m")>; +def: InstRW<[HWWriteResGroup52_1], (instregex "ADD_F64m")>; +def: InstRW<[HWWriteResGroup52_1], (instregex "ILD_F16m")>; +def: InstRW<[HWWriteResGroup52_1], (instregex "ILD_F32m")>; +def: InstRW<[HWWriteResGroup52_1], (instregex "ILD_F64m")>; +def: InstRW<[HWWriteResGroup52_1], (instregex "SUBR_F32m")>; +def: InstRW<[HWWriteResGroup52_1], (instregex "SUBR_F64m")>; +def: InstRW<[HWWriteResGroup52_1], (instregex "SUB_F32m")>; +def: InstRW<[HWWriteResGroup52_1], (instregex "SUB_F64m")>; +def: InstRW<[HWWriteResGroup52_1], (instregex "VADDPDYrm")>; +def: InstRW<[HWWriteResGroup52_1], (instregex "VADDPSYrm")>; +def: InstRW<[HWWriteResGroup52_1], (instregex "VADDSUBPDYrm")>; +def: InstRW<[HWWriteResGroup52_1], (instregex "VADDSUBPSYrm")>; +def: InstRW<[HWWriteResGroup52_1], (instregex "VCMPPDYrmi")>; +def: InstRW<[HWWriteResGroup52_1], (instregex "VCMPPSYrmi")>; +def: InstRW<[HWWriteResGroup52_1], (instregex "VCVTDQ2PSYrm")>; +def: InstRW<[HWWriteResGroup52_1], (instregex "VCVTPS2DQYrm")>; +def: InstRW<[HWWriteResGroup52_1], (instregex "VCVTTPS2DQYrm")>; +def: InstRW<[HWWriteResGroup52_1], (instregex "VMAXPDYrm")>; +def: InstRW<[HWWriteResGroup52_1], (instregex "VMAXPSYrm")>; +def: InstRW<[HWWriteResGroup52_1], (instregex "VMINPDYrm")>; +def: InstRW<[HWWriteResGroup52_1], (instregex "VMINPSYrm")>; +def: InstRW<[HWWriteResGroup52_1], (instregex "VSUBPDYrm")>; +def: InstRW<[HWWriteResGroup52_1], (instregex "VSUBPSYrm")>; def HWWriteResGroup53 : SchedWriteRes<[HWPort5,HWPort23]> { - let Latency = 3; + let Latency = 10; let NumMicroOps = 2; let ResourceCycles = [1,1]; } @@ -2852,19 +2800,22 @@ def: InstRW<[HWWriteResGroup53], (instregex "VPERMPDYmi")>; def: InstRW<[HWWriteResGroup53], (instregex "VPERMPSYrm")>; def: InstRW<[HWWriteResGroup53], (instregex "VPERMQYmi")>; -def: InstRW<[HWWriteResGroup53], (instregex "VPMOVSXBDYrm")>; -def: InstRW<[HWWriteResGroup53], (instregex "VPMOVSXBQYrm")>; -def: InstRW<[HWWriteResGroup53], (instregex "VPMOVSXBWYrm")>; -def: InstRW<[HWWriteResGroup53], (instregex "VPMOVSXDQYrm")>; -def: InstRW<[HWWriteResGroup53], (instregex "VPMOVSXWDYrm")>; -def: InstRW<[HWWriteResGroup53], (instregex "VPMOVSXWQYrm")>; def: InstRW<[HWWriteResGroup53], (instregex "VPMOVZXBDYrm")>; def: InstRW<[HWWriteResGroup53], (instregex "VPMOVZXBQYrm")>; def: InstRW<[HWWriteResGroup53], (instregex "VPMOVZXBWYrm")>; def: InstRW<[HWWriteResGroup53], (instregex "VPMOVZXDQYrm")>; -def: InstRW<[HWWriteResGroup53], (instregex "VPMOVZXWDYrm")>; def: InstRW<[HWWriteResGroup53], (instregex "VPMOVZXWQYrm")>; +def HWWriteResGroup53_1 : SchedWriteRes<[HWPort5,HWPort23]> { + let Latency = 9; + let NumMicroOps = 2; + let ResourceCycles = [1,1]; +} +def: InstRW<[HWWriteResGroup53_1], (instregex "VPMOVSXBWYrm")>; +def: InstRW<[HWWriteResGroup53_1], (instregex "VPMOVSXDQYrm")>; +def: InstRW<[HWWriteResGroup53_1], (instregex "VPMOVSXWDYrm")>; +def: InstRW<[HWWriteResGroup53_1], (instregex "VPMOVZXWDYrm")>; + def HWWriteResGroup54 : SchedWriteRes<[HWPort0156]> { let Latency = 3; let NumMicroOps = 3; @@ -2965,14 +2916,14 @@ def: InstRW<[HWWriteResGroup60], (instregex "SHR8rCL")>; def HWWriteResGroup61 : SchedWriteRes<[HWPort0,HWPort4,HWPort237]> { - let Latency = 3; + let Latency = 4; let NumMicroOps = 3; let ResourceCycles = [1,1,1]; } def: InstRW<[HWWriteResGroup61], (instregex "FNSTSWm")>; def HWWriteResGroup62 : SchedWriteRes<[HWPort1,HWPort4,HWPort237]> { - let Latency = 3; + let Latency = 4; let NumMicroOps = 3; let ResourceCycles = [1,1,1]; } @@ -2986,19 +2937,25 @@ def: InstRW<[HWWriteResGroup62], (instregex "IST_FP64m")>; def HWWriteResGroup63 : SchedWriteRes<[HWPort0,HWPort5,HWPort23]> { - let Latency = 3; + let Latency = 10; let NumMicroOps = 4; let ResourceCycles = [2,1,1]; } def: InstRW<[HWWriteResGroup63], (instregex "VPSLLVDYrm")>; -def: InstRW<[HWWriteResGroup63], (instregex "VPSLLVDrm")>; def: InstRW<[HWWriteResGroup63], (instregex "VPSRAVDYrm")>; -def: InstRW<[HWWriteResGroup63], (instregex "VPSRAVDrm")>; def: InstRW<[HWWriteResGroup63], (instregex "VPSRLVDYrm")>; -def: InstRW<[HWWriteResGroup63], (instregex "VPSRLVDrm")>; + +def HWWriteResGroup63_1 : SchedWriteRes<[HWPort0,HWPort5,HWPort23]> { + let Latency = 9; + let NumMicroOps = 4; + let ResourceCycles = [2,1,1]; +} +def: InstRW<[HWWriteResGroup63_1], (instregex "VPSLLVDrm")>; +def: InstRW<[HWWriteResGroup63_1], (instregex "VPSRAVDrm")>; +def: InstRW<[HWWriteResGroup63_1], (instregex "VPSRLVDrm")>; def HWWriteResGroup64 : SchedWriteRes<[HWPort5,HWPort23,HWPort15]> { - let Latency = 3; + let Latency = 8; let NumMicroOps = 4; let ResourceCycles = [2,1,1]; } @@ -3008,27 +2965,39 @@ def: InstRW<[HWWriteResGroup64], (instregex "MMX_PHSUBDrm64")>; def: InstRW<[HWWriteResGroup64], (instregex "MMX_PHSUBSWrm64")>; def: InstRW<[HWWriteResGroup64], (instregex "MMX_PHSUBWrm64")>; -def: InstRW<[HWWriteResGroup64], (instregex "PHADDDrm")>; -def: InstRW<[HWWriteResGroup64], (instregex "PHADDSWrm128")>; -def: InstRW<[HWWriteResGroup64], (instregex "PHADDWrm")>; -def: InstRW<[HWWriteResGroup64], (instregex "PHSUBDrm")>; -def: InstRW<[HWWriteResGroup64], (instregex "PHSUBSWrm128")>; -def: InstRW<[HWWriteResGroup64], (instregex "PHSUBWrm")>; -def: InstRW<[HWWriteResGroup64], (instregex "VPHADDDYrm")>; -def: InstRW<[HWWriteResGroup64], (instregex "VPHADDDrm")>; -def: InstRW<[HWWriteResGroup64], (instregex "VPHADDSWrm128")>; -def: InstRW<[HWWriteResGroup64], (instregex "VPHADDSWrm256")>; -def: InstRW<[HWWriteResGroup64], (instregex "VPHADDWYrm")>; -def: InstRW<[HWWriteResGroup64], (instregex "VPHADDWrm")>; -def: InstRW<[HWWriteResGroup64], (instregex "VPHSUBDYrm")>; -def: InstRW<[HWWriteResGroup64], (instregex "VPHSUBDrm")>; -def: InstRW<[HWWriteResGroup64], (instregex "VPHSUBSWrm128")>; -def: InstRW<[HWWriteResGroup64], (instregex "VPHSUBSWrm256")>; -def: InstRW<[HWWriteResGroup64], (instregex "VPHSUBWYrm")>; -def: InstRW<[HWWriteResGroup64], (instregex "VPHSUBWrm")>; + +def HWWriteResGroup64_1 : SchedWriteRes<[HWPort5,HWPort23,HWPort15]> { + let Latency = 10; + let NumMicroOps = 4; + let ResourceCycles = [2,1,1]; +} +def: InstRW<[HWWriteResGroup64_1], (instregex "VPHADDDYrm")>; +def: InstRW<[HWWriteResGroup64_1], (instregex "VPHADDSWrm256")>; +def: InstRW<[HWWriteResGroup64_1], (instregex "VPHADDWYrm")>; +def: InstRW<[HWWriteResGroup64_1], (instregex "VPHSUBDYrm")>; +def: InstRW<[HWWriteResGroup64_1], (instregex "VPHSUBSWrm256")>; +def: InstRW<[HWWriteResGroup64_1], (instregex "VPHSUBWYrm")>; + +def HWWriteResGroup64_2 : SchedWriteRes<[HWPort5,HWPort23,HWPort15]> { + let Latency = 9; + let NumMicroOps = 4; + let ResourceCycles = [2,1,1]; +} +def: InstRW<[HWWriteResGroup64_2], (instregex "PHADDDrm")>; +def: InstRW<[HWWriteResGroup64_2], (instregex "PHADDSWrm128")>; +def: InstRW<[HWWriteResGroup64_2], (instregex "PHADDWrm")>; +def: InstRW<[HWWriteResGroup64_2], (instregex "PHSUBDrm")>; +def: InstRW<[HWWriteResGroup64_2], (instregex "PHSUBSWrm128")>; +def: InstRW<[HWWriteResGroup64_2], (instregex "PHSUBWrm")>; +def: InstRW<[HWWriteResGroup64_2], (instregex "VPHADDDrm")>; +def: InstRW<[HWWriteResGroup64_2], (instregex "VPHADDSWrm128")>; +def: InstRW<[HWWriteResGroup64_2], (instregex "VPHADDWrm")>; +def: InstRW<[HWWriteResGroup64_2], (instregex "VPHSUBDrm")>; +def: InstRW<[HWWriteResGroup64_2], (instregex "VPHSUBSWrm128")>; +def: InstRW<[HWWriteResGroup64_2], (instregex "VPHSUBWrm")>; def HWWriteResGroup65 : SchedWriteRes<[HWPort23,HWPort06,HWPort0156]> { - let Latency = 3; + let Latency = 8; let NumMicroOps = 4; let ResourceCycles = [1,1,2]; } @@ -3036,7 +3005,7 @@ def: InstRW<[HWWriteResGroup65], (instregex "CMOVBE(16|32|64)rm")>; def HWWriteResGroup66 : SchedWriteRes<[HWPort23,HWPort237,HWPort06,HWPort0156]> { - let Latency = 3; + let Latency = 9; let NumMicroOps = 5; let ResourceCycles = [1,1,1,2]; } @@ -3050,7 +3019,7 @@ def: InstRW<[HWWriteResGroup66], (instregex "RCR8mi")>; def HWWriteResGroup67 : SchedWriteRes<[HWPort23,HWPort237,HWPort06,HWPort0156]> { - let Latency = 3; + let Latency = 9; let NumMicroOps = 5; let ResourceCycles = [1,1,2,1]; } @@ -3058,7 +3027,7 @@ def: InstRW<[HWWriteResGroup67], (instregex "ROR8mCL")>; def HWWriteResGroup68 : SchedWriteRes<[HWPort4,HWPort23,HWPort237,HWPort0156]> { - let Latency = 3; + let Latency = 9; let NumMicroOps = 6; let ResourceCycles = [1,1,1,3]; } @@ -3073,7 +3042,7 @@ def: InstRW<[HWWriteResGroup68], (instregex "XOR8mi")>; def HWWriteResGroup69 : SchedWriteRes<[HWPort4,HWPort23,HWPort237,HWPort06,HWPort0156]> { - let Latency = 3; + let Latency = 9; let NumMicroOps = 6; let ResourceCycles = [1,1,1,2,1]; } @@ -3191,7 +3160,7 @@ def: InstRW<[HWWriteResGroup74_32], (instregex "MUL32r")>; def HWWriteResGroup75 : SchedWriteRes<[HWPort1,HWPort23]> { - let Latency = 4; + let Latency = 11; let NumMicroOps = 3; let ResourceCycles = [2,1]; } @@ -3201,7 +3170,7 @@ def: InstRW<[HWWriteResGroup75], (instregex "FICOMP32m")>; def HWWriteResGroup76 : SchedWriteRes<[HWPort0,HWPort1,HWPort23]> { - let Latency = 4; + let Latency = 9; let NumMicroOps = 3; let ResourceCycles = [1,1,1]; } @@ -3222,38 +3191,50 @@ def: InstRW<[HWWriteResGroup76], (instregex "VCVTTSS2SIrm")>; def HWWriteResGroup77 : SchedWriteRes<[HWPort0,HWPort5,HWPort23]> { - let Latency = 4; + let Latency = 10; let NumMicroOps = 3; let ResourceCycles = [1,1,1]; } def: InstRW<[HWWriteResGroup77], (instregex "VCVTPS2PDYrm")>; -def: InstRW<[HWWriteResGroup77], (instregex "VPTESTYrm")>; + +def HWWriteResGroup77_1 : SchedWriteRes<[HWPort0,HWPort5,HWPort23]> { + let Latency = 11; + let NumMicroOps = 3; + let ResourceCycles = [1,1,1]; +} +def: InstRW<[HWWriteResGroup77_1], (instregex "VPTESTYrm")>; def HWWriteResGroup78 : SchedWriteRes<[HWPort1,HWPort5,HWPort23]> { - let Latency = 4; + let Latency = 10; let NumMicroOps = 3; let ResourceCycles = [1,1,1]; } def: InstRW<[HWWriteResGroup78], (instregex "CVTDQ2PDrm")>; def: InstRW<[HWWriteResGroup78], (instregex "CVTPD2DQrm")>; def: InstRW<[HWWriteResGroup78], (instregex "CVTPD2PSrm")>; -def: InstRW<[HWWriteResGroup78], (instregex "CVTSD2SSrm")>; def: InstRW<[HWWriteResGroup78], (instregex "CVTTPD2DQrm")>; def: InstRW<[HWWriteResGroup78], (instregex "MMX_CVTPD2PIirm")>; -def: InstRW<[HWWriteResGroup78], (instregex "MMX_CVTPI2PDirm")>; def: InstRW<[HWWriteResGroup78], (instregex "MMX_CVTTPD2PIirm")>; def: InstRW<[HWWriteResGroup78], (instregex "VCVTDQ2PDrm")>; -def: InstRW<[HWWriteResGroup78], (instregex "VCVTSD2SSrm")>; + +def HWWriteResGroup78_1 : SchedWriteRes<[HWPort1,HWPort5,HWPort23]> { + let Latency = 9; + let NumMicroOps = 3; + let ResourceCycles = [1,1,1]; +} +def: InstRW<[HWWriteResGroup78_1], (instregex "CVTSD2SSrm")>; +def: InstRW<[HWWriteResGroup78_1], (instregex "MMX_CVTPI2PDirm")>; +def: InstRW<[HWWriteResGroup78_1], (instregex "VCVTSD2SSrm")>; def HWWriteResGroup79 : SchedWriteRes<[HWPort1,HWPort6,HWPort23]> { - let Latency = 4; + let Latency = 9; let NumMicroOps = 3; let ResourceCycles = [1,1,1]; } def: InstRW<[HWWriteResGroup79], (instregex "MULX64rm")>; def HWWriteResGroup80 : SchedWriteRes<[HWPort5,HWPort23,HWPort015]> { - let Latency = 4; + let Latency = 9; let NumMicroOps = 3; let ResourceCycles = [1,1,1]; } @@ -3284,7 +3265,7 @@ def: InstRW<[HWWriteResGroup83], (instregex "LAR(16|32|64)rr")>; def HWWriteResGroup84 : SchedWriteRes<[HWPort0,HWPort4,HWPort237,HWPort15]> { - let Latency = 4; + let Latency = 5; let NumMicroOps = 4; let ResourceCycles = [1,1,1,1]; } @@ -3298,14 +3279,14 @@ def: InstRW<[HWWriteResGroup84], (instregex "VPMASKMOVQmr")>; def HWWriteResGroup85 : SchedWriteRes<[HWPort1,HWPort4,HWPort5,HWPort237]> { - let Latency = 4; + let Latency = 5; let NumMicroOps = 4; let ResourceCycles = [1,1,1,1]; } def: InstRW<[HWWriteResGroup85], (instregex "VCVTPS2PHmr")>; def HWWriteResGroup86 : SchedWriteRes<[HWPort1,HWPort23,HWPort237,HWPort0156]> { - let Latency = 4; + let Latency = 10; let NumMicroOps = 4; let ResourceCycles = [1,1,1,1]; } @@ -3313,7 +3294,7 @@ def: InstRW<[HWWriteResGroup86], (instregex "SHRD(16|32|64)mri8")>; def HWWriteResGroup87 : SchedWriteRes<[HWPort1,HWPort6,HWPort23,HWPort0156]> { - let Latency = 4; + let Latency = 9; let NumMicroOps = 5; let ResourceCycles = [1,2,1,1]; } @@ -3321,7 +3302,7 @@ def: InstRW<[HWWriteResGroup87], (instregex "LSL(16|32|64)rm")>; def HWWriteResGroup88 : SchedWriteRes<[HWPort4,HWPort237,HWPort0156]> { - let Latency = 4; + let Latency = 5; let NumMicroOps = 6; let ResourceCycles = [1,1,4]; } @@ -3498,7 +3479,7 @@ def: InstRW<[HWWriteResGroup90], (instregex "VMULSSrr")>; def HWWriteResGroup91 : SchedWriteRes<[HWPort0,HWPort23]> { - let Latency = 5; + let Latency = 10; let NumMicroOps = 2; let ResourceCycles = [1,1]; } @@ -3510,160 +3491,192 @@ def: InstRW<[HWWriteResGroup91], (instregex "MMX_PMULLWirm")>; def: InstRW<[HWWriteResGroup91], (instregex "MMX_PMULUDQirm")>; def: InstRW<[HWWriteResGroup91], (instregex "MMX_PSADBWirm")>; -def: InstRW<[HWWriteResGroup91], (instregex "MUL_F32m")>; -def: InstRW<[HWWriteResGroup91], (instregex "MUL_F64m")>; -def: InstRW<[HWWriteResGroup91], (instregex "PCMPGTQrm")>; -def: InstRW<[HWWriteResGroup91], (instregex "PHMINPOSUWrm128")>; -def: InstRW<[HWWriteResGroup91], (instregex "PMADDUBSWrm")>; -def: InstRW<[HWWriteResGroup91], (instregex "PMADDWDrm")>; -def: InstRW<[HWWriteResGroup91], (instregex "PMULDQrm")>; -def: InstRW<[HWWriteResGroup91], (instregex "PMULHRSWrm")>; -def: InstRW<[HWWriteResGroup91], (instregex "PMULHUWrm")>; -def: InstRW<[HWWriteResGroup91], (instregex "PMULHWrm")>; -def: InstRW<[HWWriteResGroup91], (instregex "PMULLWrm")>; -def: InstRW<[HWWriteResGroup91], (instregex "PMULUDQrm")>; -def: InstRW<[HWWriteResGroup91], (instregex "PSADBWrm")>; -def: InstRW<[HWWriteResGroup91], (instregex "RCPPSm")>; def: InstRW<[HWWriteResGroup91], (instregex "RCPSSm")>; -def: InstRW<[HWWriteResGroup91], (instregex "RSQRTPSm")>; def: InstRW<[HWWriteResGroup91], (instregex "RSQRTSSm")>; -def: InstRW<[HWWriteResGroup91], (instregex "VPCMPGTQYrm")>; -def: InstRW<[HWWriteResGroup91], (instregex "VPCMPGTQrm")>; -def: InstRW<[HWWriteResGroup91], (instregex "VPHMINPOSUWrm128")>; -def: InstRW<[HWWriteResGroup91], (instregex "VPMADDUBSWYrm")>; -def: InstRW<[HWWriteResGroup91], (instregex "VPMADDUBSWrm")>; -def: InstRW<[HWWriteResGroup91], (instregex "VPMADDWDYrm")>; -def: InstRW<[HWWriteResGroup91], (instregex "VPMADDWDrm")>; -def: InstRW<[HWWriteResGroup91], (instregex "VPMULDQYrm")>; -def: InstRW<[HWWriteResGroup91], (instregex "VPMULDQrm")>; -def: InstRW<[HWWriteResGroup91], (instregex "VPMULHRSWYrm")>; -def: InstRW<[HWWriteResGroup91], (instregex "VPMULHRSWrm")>; -def: InstRW<[HWWriteResGroup91], (instregex "VPMULHUWYrm")>; -def: InstRW<[HWWriteResGroup91], (instregex "VPMULHUWrm")>; -def: InstRW<[HWWriteResGroup91], (instregex "VPMULHWYrm")>; -def: InstRW<[HWWriteResGroup91], (instregex "VPMULHWrm")>; -def: InstRW<[HWWriteResGroup91], (instregex "VPMULLWYrm")>; -def: InstRW<[HWWriteResGroup91], (instregex "VPMULLWrm")>; -def: InstRW<[HWWriteResGroup91], (instregex "VPMULUDQYrm")>; -def: InstRW<[HWWriteResGroup91], (instregex "VPMULUDQrm")>; -def: InstRW<[HWWriteResGroup91], (instregex "VPSADBWYrm")>; -def: InstRW<[HWWriteResGroup91], (instregex "VPSADBWrm")>; -def: InstRW<[HWWriteResGroup91], (instregex "VRCPPSm")>; def: InstRW<[HWWriteResGroup91], (instregex "VRCPSSm")>; -def: InstRW<[HWWriteResGroup91], (instregex "VRSQRTPSm")>; def: InstRW<[HWWriteResGroup91], (instregex "VRSQRTSSm")>; +def HWWriteResGroup91_1 : SchedWriteRes<[HWPort0,HWPort23]> { + let Latency = 18; + let NumMicroOps = 2; + let ResourceCycles = [1,1]; +} +def: InstRW<[HWWriteResGroup91_1], (instregex "SQRTSSm")>; +def: InstRW<[HWWriteResGroup91_1], (instregex "VDIVSSrm")>; + +def HWWriteResGroup91_2 : SchedWriteRes<[HWPort0,HWPort23]> { + let Latency = 11; + let NumMicroOps = 2; + let ResourceCycles = [1,1]; +} +def: InstRW<[HWWriteResGroup91_2], (instregex "PCMPGTQrm")>; +def: InstRW<[HWWriteResGroup91_2], (instregex "PHMINPOSUWrm128")>; +def: InstRW<[HWWriteResGroup91_2], (instregex "PMADDUBSWrm")>; +def: InstRW<[HWWriteResGroup91_2], (instregex "PMADDWDrm")>; +def: InstRW<[HWWriteResGroup91_2], (instregex "PMULDQrm")>; +def: InstRW<[HWWriteResGroup91_2], (instregex "PMULHRSWrm")>; +def: InstRW<[HWWriteResGroup91_2], (instregex "PMULHUWrm")>; +def: InstRW<[HWWriteResGroup91_2], (instregex "PMULHWrm")>; +def: InstRW<[HWWriteResGroup91_2], (instregex "PMULLWrm")>; +def: InstRW<[HWWriteResGroup91_2], (instregex "PMULUDQrm")>; +def: InstRW<[HWWriteResGroup91_2], (instregex "PSADBWrm")>; +def: InstRW<[HWWriteResGroup91_2], (instregex "RCPPSm")>; +def: InstRW<[HWWriteResGroup91_2], (instregex "RSQRTPSm")>; +def: InstRW<[HWWriteResGroup91_2], (instregex "VPCMPGTQrm")>; +def: InstRW<[HWWriteResGroup91_2], (instregex "VPHMINPOSUWrm128")>; +def: InstRW<[HWWriteResGroup91_2], (instregex "VPMADDUBSWrm")>; +def: InstRW<[HWWriteResGroup91_2], (instregex "VPMADDWDrm")>; +def: InstRW<[HWWriteResGroup91_2], (instregex "VPMULDQrm")>; +def: InstRW<[HWWriteResGroup91_2], (instregex "VPMULHRSWrm")>; +def: InstRW<[HWWriteResGroup91_2], (instregex "VPMULHUWrm")>; +def: InstRW<[HWWriteResGroup91_2], (instregex "VPMULHWrm")>; +def: InstRW<[HWWriteResGroup91_2], (instregex "VPMULLWrm")>; +def: InstRW<[HWWriteResGroup91_2], (instregex "VPMULUDQrm")>; +def: InstRW<[HWWriteResGroup91_2], (instregex "VPSADBWrm")>; +def: InstRW<[HWWriteResGroup91_2], (instregex "VRCPPSm")>; +def: InstRW<[HWWriteResGroup91_2], (instregex "VRSQRTPSm")>; + +def HWWriteResGroup91_3 : SchedWriteRes<[HWPort0,HWPort23]> { + let Latency = 12; + let NumMicroOps = 2; + let ResourceCycles = [1,1]; +} +def: InstRW<[HWWriteResGroup91_3], (instregex "MUL_F32m")>; +def: InstRW<[HWWriteResGroup91_3], (instregex "MUL_F64m")>; +def: InstRW<[HWWriteResGroup91_3], (instregex "VPCMPGTQYrm")>; +def: InstRW<[HWWriteResGroup91_3], (instregex "VPMADDUBSWYrm")>; +def: InstRW<[HWWriteResGroup91_3], (instregex "VPMADDWDYrm")>; +def: InstRW<[HWWriteResGroup91_3], (instregex "VPMULDQYrm")>; +def: InstRW<[HWWriteResGroup91_3], (instregex "VPMULHRSWYrm")>; +def: InstRW<[HWWriteResGroup91_3], (instregex "VPMULHUWYrm")>; +def: InstRW<[HWWriteResGroup91_3], (instregex "VPMULHWYrm")>; +def: InstRW<[HWWriteResGroup91_3], (instregex "VPMULLWYrm")>; +def: InstRW<[HWWriteResGroup91_3], (instregex "VPMULUDQYrm")>; +def: InstRW<[HWWriteResGroup91_3], (instregex "VPSADBWYrm")>; + def HWWriteResGroup92 : SchedWriteRes<[HWPort01,HWPort23]> { - let Latency = 5; + let Latency = 11; let NumMicroOps = 2; let ResourceCycles = [1,1]; } def: InstRW<[HWWriteResGroup92], (instregex "MULPDrm")>; def: InstRW<[HWWriteResGroup92], (instregex "MULPSrm")>; -def: InstRW<[HWWriteResGroup92], (instregex "MULSDrm")>; -def: InstRW<[HWWriteResGroup92], (instregex "MULSSrm")>; -def: InstRW<[HWWriteResGroup92], (instregex "VFMADD132PDYm")>; def: InstRW<[HWWriteResGroup92], (instregex "VFMADD132PDm")>; -def: InstRW<[HWWriteResGroup92], (instregex "VFMADD132PSYm")>; def: InstRW<[HWWriteResGroup92], (instregex "VFMADD132PSm")>; -def: InstRW<[HWWriteResGroup92], (instregex "VFMADD132SDm")>; -def: InstRW<[HWWriteResGroup92], (instregex "VFMADD132SSm")>; -def: InstRW<[HWWriteResGroup92], (instregex "VFMADD213PDYm")>; def: InstRW<[HWWriteResGroup92], (instregex "VFMADD213PDm")>; -def: InstRW<[HWWriteResGroup92], (instregex "VFMADD213PSYm")>; def: InstRW<[HWWriteResGroup92], (instregex "VFMADD213PSm")>; -def: InstRW<[HWWriteResGroup92], (instregex "VFMADD213SDm")>; -def: InstRW<[HWWriteResGroup92], (instregex "VFMADD213SSm")>; -def: InstRW<[HWWriteResGroup92], (instregex "VFMADD231PDYm")>; def: InstRW<[HWWriteResGroup92], (instregex "VFMADD231PDm")>; -def: InstRW<[HWWriteResGroup92], (instregex "VFMADD231PSYm")>; def: InstRW<[HWWriteResGroup92], (instregex "VFMADD231PSm")>; -def: InstRW<[HWWriteResGroup92], (instregex "VFMADD231SDm")>; -def: InstRW<[HWWriteResGroup92], (instregex "VFMADD231SSm")>; -def: InstRW<[HWWriteResGroup92], (instregex "VFMADDSUB132PDYm")>; def: InstRW<[HWWriteResGroup92], (instregex "VFMADDSUB132PDm")>; -def: InstRW<[HWWriteResGroup92], (instregex "VFMADDSUB132PSYm")>; def: InstRW<[HWWriteResGroup92], (instregex "VFMADDSUB132PSm")>; -def: InstRW<[HWWriteResGroup92], (instregex "VFMADDSUB213PDYm")>; def: InstRW<[HWWriteResGroup92], (instregex "VFMADDSUB213PDm")>; -def: InstRW<[HWWriteResGroup92], (instregex "VFMADDSUB213PSYm")>; def: InstRW<[HWWriteResGroup92], (instregex "VFMADDSUB213PSm")>; -def: InstRW<[HWWriteResGroup92], (instregex "VFMADDSUB231PDYm")>; def: InstRW<[HWWriteResGroup92], (instregex "VFMADDSUB231PDm")>; -def: InstRW<[HWWriteResGroup92], (instregex "VFMADDSUB231PSYm")>; def: InstRW<[HWWriteResGroup92], (instregex "VFMADDSUB231PSm")>; -def: InstRW<[HWWriteResGroup92], (instregex "VFMSUB132PDYm")>; def: InstRW<[HWWriteResGroup92], (instregex "VFMSUB132PDm")>; -def: InstRW<[HWWriteResGroup92], (instregex "VFMSUB132PSYm")>; def: InstRW<[HWWriteResGroup92], (instregex "VFMSUB132PSm")>; -def: InstRW<[HWWriteResGroup92], (instregex "VFMSUB132SDm")>; -def: InstRW<[HWWriteResGroup92], (instregex "VFMSUB132SSm")>; -def: InstRW<[HWWriteResGroup92], (instregex "VFMSUB213PDYm")>; def: InstRW<[HWWriteResGroup92], (instregex "VFMSUB213PDm")>; -def: InstRW<[HWWriteResGroup92], (instregex "VFMSUB213PSYm")>; def: InstRW<[HWWriteResGroup92], (instregex "VFMSUB213PSm")>; -def: InstRW<[HWWriteResGroup92], (instregex "VFMSUB213SDm")>; -def: InstRW<[HWWriteResGroup92], (instregex "VFMSUB213SSm")>; -def: InstRW<[HWWriteResGroup92], (instregex "VFMSUB231PDYm")>; def: InstRW<[HWWriteResGroup92], (instregex "VFMSUB231PDm")>; -def: InstRW<[HWWriteResGroup92], (instregex "VFMSUB231PSYm")>; def: InstRW<[HWWriteResGroup92], (instregex "VFMSUB231PSm")>; -def: InstRW<[HWWriteResGroup92], (instregex "VFMSUB231SDm")>; -def: InstRW<[HWWriteResGroup92], (instregex "VFMSUB231SSm")>; -def: InstRW<[HWWriteResGroup92], (instregex "VFMSUBADD132PDYm")>; def: InstRW<[HWWriteResGroup92], (instregex "VFMSUBADD132PDm")>; -def: InstRW<[HWWriteResGroup92], (instregex "VFMSUBADD132PSYm")>; def: InstRW<[HWWriteResGroup92], (instregex "VFMSUBADD132PSm")>; -def: InstRW<[HWWriteResGroup92], (instregex "VFMSUBADD213PDYm")>; def: InstRW<[HWWriteResGroup92], (instregex "VFMSUBADD213PDm")>; -def: InstRW<[HWWriteResGroup92], (instregex "VFMSUBADD213PSYm")>; def: InstRW<[HWWriteResGroup92], (instregex "VFMSUBADD213PSm")>; -def: InstRW<[HWWriteResGroup92], (instregex "VFMSUBADD231PDYm")>; def: InstRW<[HWWriteResGroup92], (instregex "VFMSUBADD231PDm")>; -def: InstRW<[HWWriteResGroup92], (instregex "VFMSUBADD231PSYm")>; def: InstRW<[HWWriteResGroup92], (instregex "VFMSUBADD231PSm")>; -def: InstRW<[HWWriteResGroup92], (instregex "VFNMADD132PDYm")>; def: InstRW<[HWWriteResGroup92], (instregex "VFNMADD132PDm")>; -def: InstRW<[HWWriteResGroup92], (instregex "VFNMADD132PSYm")>; def: InstRW<[HWWriteResGroup92], (instregex "VFNMADD132PSm")>; -def: InstRW<[HWWriteResGroup92], (instregex "VFNMADD132SDm")>; -def: InstRW<[HWWriteResGroup92], (instregex "VFNMADD132SSm")>; -def: InstRW<[HWWriteResGroup92], (instregex "VFNMADD213PDYm")>; def: InstRW<[HWWriteResGroup92], (instregex "VFNMADD213PDm")>; -def: InstRW<[HWWriteResGroup92], (instregex "VFNMADD213PSYm")>; def: InstRW<[HWWriteResGroup92], (instregex "VFNMADD213PSm")>; -def: InstRW<[HWWriteResGroup92], (instregex "VFNMADD213SDm")>; -def: InstRW<[HWWriteResGroup92], (instregex "VFNMADD213SSm")>; -def: InstRW<[HWWriteResGroup92], (instregex "VFNMADD231PDYm")>; def: InstRW<[HWWriteResGroup92], (instregex "VFNMADD231PDm")>; -def: InstRW<[HWWriteResGroup92], (instregex "VFNMADD231PSYm")>; def: InstRW<[HWWriteResGroup92], (instregex "VFNMADD231PSm")>; -def: InstRW<[HWWriteResGroup92], (instregex "VFNMADD231SDm")>; -def: InstRW<[HWWriteResGroup92], (instregex "VFNMADD231SSm")>; -def: InstRW<[HWWriteResGroup92], (instregex "VFNMSUB132PDYm")>; def: InstRW<[HWWriteResGroup92], (instregex "VFNMSUB132PDm")>; -def: InstRW<[HWWriteResGroup92], (instregex "VFNMSUB132PSYm")>; def: InstRW<[HWWriteResGroup92], (instregex "VFNMSUB132PSm")>; -def: InstRW<[HWWriteResGroup92], (instregex "VFNMSUB132SDm")>; -def: InstRW<[HWWriteResGroup92], (instregex "VFNMSUB132SSm")>; -def: InstRW<[HWWriteResGroup92], (instregex "VFNMSUB213PDYm")>; def: InstRW<[HWWriteResGroup92], (instregex "VFNMSUB213PDm")>; -def: InstRW<[HWWriteResGroup92], (instregex "VFNMSUB213PSYm")>; def: InstRW<[HWWriteResGroup92], (instregex "VFNMSUB213PSm")>; -def: InstRW<[HWWriteResGroup92], (instregex "VFNMSUB213SDm")>; -def: InstRW<[HWWriteResGroup92], (instregex "VFNMSUB213SSm")>; -def: InstRW<[HWWriteResGroup92], (instregex "VFNMSUB231PDYm")>; def: InstRW<[HWWriteResGroup92], (instregex "VFNMSUB231PDm")>; -def: InstRW<[HWWriteResGroup92], (instregex "VFNMSUB231PSYm")>; def: InstRW<[HWWriteResGroup92], (instregex "VFNMSUB231PSm")>; -def: InstRW<[HWWriteResGroup92], (instregex "VFNMSUB231SDm")>; -def: InstRW<[HWWriteResGroup92], (instregex "VFNMSUB231SSm")>; -def: InstRW<[HWWriteResGroup92], (instregex "VMULPDYrm")>; def: InstRW<[HWWriteResGroup92], (instregex "VMULPDrm")>; -def: InstRW<[HWWriteResGroup92], (instregex "VMULPSYrm")>; def: InstRW<[HWWriteResGroup92], (instregex "VMULPSrm")>; -def: InstRW<[HWWriteResGroup92], (instregex "VMULSDrm")>; -def: InstRW<[HWWriteResGroup92], (instregex "VMULSSrm")>; + +def HWWriteResGroup92_1 : SchedWriteRes<[HWPort01,HWPort23]> { + let Latency = 12; + let NumMicroOps = 2; + let ResourceCycles = [1,1]; +} +def: InstRW<[HWWriteResGroup92_1], (instregex "VFMADD132PDYm")>; +def: InstRW<[HWWriteResGroup92_1], (instregex "VFMADD132PSYm")>; +def: InstRW<[HWWriteResGroup92_1], (instregex "VFMADD213PDYm")>; +def: InstRW<[HWWriteResGroup92_1], (instregex "VFMADD213PSYm")>; +def: InstRW<[HWWriteResGroup92_1], (instregex "VFMADD231PDYm")>; +def: InstRW<[HWWriteResGroup92_1], (instregex "VFMADD231PSYm")>; +def: InstRW<[HWWriteResGroup92_1], (instregex "VFMADDSUB132PDYm")>; +def: InstRW<[HWWriteResGroup92_1], (instregex "VFMADDSUB132PSYm")>; +def: InstRW<[HWWriteResGroup92_1], (instregex "VFMADDSUB213PDYm")>; +def: InstRW<[HWWriteResGroup92_1], (instregex "VFMADDSUB213PSYm")>; +def: InstRW<[HWWriteResGroup92_1], (instregex "VFMADDSUB231PDYm")>; +def: InstRW<[HWWriteResGroup92_1], (instregex "VFMADDSUB231PSYm")>; +def: InstRW<[HWWriteResGroup92_1], (instregex "VFMSUB132PDYm")>; +def: InstRW<[HWWriteResGroup92_1], (instregex "VFMSUB132PSYm")>; +def: InstRW<[HWWriteResGroup92_1], (instregex "VFMSUB213PDYm")>; +def: InstRW<[HWWriteResGroup92_1], (instregex "VFMSUB213PSYm")>; +def: InstRW<[HWWriteResGroup92_1], (instregex "VFMSUB231PDYm")>; +def: InstRW<[HWWriteResGroup92_1], (instregex "VFMSUB231PSYm")>; +def: InstRW<[HWWriteResGroup92_1], (instregex "VFMSUBADD132PDYm")>; +def: InstRW<[HWWriteResGroup92_1], (instregex "VFMSUBADD132PSYm")>; +def: InstRW<[HWWriteResGroup92_1], (instregex "VFMSUBADD213PDYm")>; +def: InstRW<[HWWriteResGroup92_1], (instregex "VFMSUBADD213PSYm")>; +def: InstRW<[HWWriteResGroup92_1], (instregex "VFMSUBADD231PDYm")>; +def: InstRW<[HWWriteResGroup92_1], (instregex "VFMSUBADD231PSYm")>; +def: InstRW<[HWWriteResGroup92_1], (instregex "VFNMADD132PDYm")>; +def: InstRW<[HWWriteResGroup92_1], (instregex "VFNMADD132PSYm")>; +def: InstRW<[HWWriteResGroup92_1], (instregex "VFNMADD213PDYm")>; +def: InstRW<[HWWriteResGroup92_1], (instregex "VFNMADD213PSYm")>; +def: InstRW<[HWWriteResGroup92_1], (instregex "VFNMADD231PDYm")>; +def: InstRW<[HWWriteResGroup92_1], (instregex "VFNMADD231PSYm")>; +def: InstRW<[HWWriteResGroup92_1], (instregex "VFNMSUB132PDYm")>; +def: InstRW<[HWWriteResGroup92_1], (instregex "VFNMSUB132PSYm")>; +def: InstRW<[HWWriteResGroup92_1], (instregex "VFNMSUB213PDYm")>; +def: InstRW<[HWWriteResGroup92_1], (instregex "VFNMSUB213PSYm")>; +def: InstRW<[HWWriteResGroup92_1], (instregex "VFNMSUB231PDYm")>; +def: InstRW<[HWWriteResGroup92_1], (instregex "VFNMSUB231PSYm")>; +def: InstRW<[HWWriteResGroup92_1], (instregex "VMULPDYrm")>; +def: InstRW<[HWWriteResGroup92_1], (instregex "VMULPSYrm")>; + +def HWWriteResGroup92_2 : SchedWriteRes<[HWPort01,HWPort23]> { + let Latency = 10; + let NumMicroOps = 2; + let ResourceCycles = [1,1]; +} +def: InstRW<[HWWriteResGroup92_2], (instregex "MULSDrm")>; +def: InstRW<[HWWriteResGroup92_2], (instregex "MULSSrm")>; +def: InstRW<[HWWriteResGroup92_2], (instregex "VFMADD132SDm")>; +def: InstRW<[HWWriteResGroup92_2], (instregex "VFMADD132SSm")>; +def: InstRW<[HWWriteResGroup92_2], (instregex "VFMADD213SDm")>; +def: InstRW<[HWWriteResGroup92_2], (instregex "VFMADD213SSm")>; +def: InstRW<[HWWriteResGroup92_2], (instregex "VFMADD231SDm")>; +def: InstRW<[HWWriteResGroup92_2], (instregex "VFMADD231SSm")>; +def: InstRW<[HWWriteResGroup92_2], (instregex "VFMSUB132SDm")>; +def: InstRW<[HWWriteResGroup92_2], (instregex "VFMSUB132SSm")>; +def: InstRW<[HWWriteResGroup92_2], (instregex "VFMSUB213SDm")>; +def: InstRW<[HWWriteResGroup92_2], (instregex "VFMSUB213SSm")>; +def: InstRW<[HWWriteResGroup92_2], (instregex "VFMSUB231SDm")>; +def: InstRW<[HWWriteResGroup92_2], (instregex "VFMSUB231SSm")>; +def: InstRW<[HWWriteResGroup92_2], (instregex "VFNMADD132SDm")>; +def: InstRW<[HWWriteResGroup92_2], (instregex "VFNMADD132SSm")>; +def: InstRW<[HWWriteResGroup92_2], (instregex "VFNMADD213SDm")>; +def: InstRW<[HWWriteResGroup92_2], (instregex "VFNMADD213SSm")>; +def: InstRW<[HWWriteResGroup92_2], (instregex "VFNMADD231SDm")>; +def: InstRW<[HWWriteResGroup92_2], (instregex "VFNMADD231SSm")>; +def: InstRW<[HWWriteResGroup92_2], (instregex "VFNMSUB132SDm")>; +def: InstRW<[HWWriteResGroup92_2], (instregex "VFNMSUB132SSm")>; +def: InstRW<[HWWriteResGroup92_2], (instregex "VFNMSUB213SDm")>; +def: InstRW<[HWWriteResGroup92_2], (instregex "VFNMSUB213SSm")>; +def: InstRW<[HWWriteResGroup92_2], (instregex "VFNMSUB231SDm")>; +def: InstRW<[HWWriteResGroup92_2], (instregex "VFNMSUB231SSm")>; +def: InstRW<[HWWriteResGroup92_2], (instregex "VMULSDrm")>; +def: InstRW<[HWWriteResGroup92_2], (instregex "VMULSSrm")>; def HWWriteResGroup93 : SchedWriteRes<[HWPort1,HWPort5]> { let Latency = 5; @@ -3700,7 +3713,7 @@ def: InstRW<[HWWriteResGroup95], (instregex "MULX32rr")>; def HWWriteResGroup96 : SchedWriteRes<[HWPort1,HWPort5,HWPort23]> { - let Latency = 5; + let Latency = 11; let NumMicroOps = 4; let ResourceCycles = [1,2,1]; } @@ -3708,24 +3721,30 @@ def: InstRW<[HWWriteResGroup96], (instregex "HADDPSrm")>; def: InstRW<[HWWriteResGroup96], (instregex "HSUBPDrm")>; def: InstRW<[HWWriteResGroup96], (instregex "HSUBPSrm")>; -def: InstRW<[HWWriteResGroup96], (instregex "VHADDPDYrm")>; def: InstRW<[HWWriteResGroup96], (instregex "VHADDPDrm")>; -def: InstRW<[HWWriteResGroup96], (instregex "VHADDPSYrm")>; def: InstRW<[HWWriteResGroup96], (instregex "VHADDPSrm")>; -def: InstRW<[HWWriteResGroup96], (instregex "VHSUBPDYrm")>; def: InstRW<[HWWriteResGroup96], (instregex "VHSUBPDrm")>; -def: InstRW<[HWWriteResGroup96], (instregex "VHSUBPSYrm")>; def: InstRW<[HWWriteResGroup96], (instregex "VHSUBPSrm")>; +def HWWriteResGroup96_1 : SchedWriteRes<[HWPort1,HWPort5,HWPort23]> { + let Latency = 12; + let NumMicroOps = 4; + let ResourceCycles = [1,2,1]; +} +def: InstRW<[HWWriteResGroup96_1], (instregex "VHADDPDYrm")>; +def: InstRW<[HWWriteResGroup96_1], (instregex "VHADDPSYrm")>; +def: InstRW<[HWWriteResGroup96_1], (instregex "VHSUBPDYrm")>; +def: InstRW<[HWWriteResGroup96_1], (instregex "VHSUBPSYrm")>; + def HWWriteResGroup97 : SchedWriteRes<[HWPort0,HWPort1,HWPort5,HWPort23]> { - let Latency = 5; + let Latency = 10; let NumMicroOps = 4; let ResourceCycles = [1,1,1,1]; } def: InstRW<[HWWriteResGroup97], (instregex "CVTTSS2SI64rm")>; def HWWriteResGroup98 : SchedWriteRes<[HWPort1,HWPort23,HWPort06,HWPort0156]> { - let Latency = 5; + let Latency = 10; let NumMicroOps = 4; let ResourceCycles = [1,1,1,1]; } @@ -3752,16 +3771,6 @@ } def: InstRW<[HWWriteResGroup101], (instregex "CMPXCHG(16|32|64)rr")>; def: InstRW<[HWWriteResGroup101], (instregex "CMPXCHG8rr")>; -def: InstRW<[HWWriteResGroup101], (instregex "ROUNDPDr")>; -def: InstRW<[HWWriteResGroup101], (instregex "ROUNDPSr")>; -def: InstRW<[HWWriteResGroup101], (instregex "ROUNDSDr")>; -def: InstRW<[HWWriteResGroup101], (instregex "ROUNDSSr")>; -def: InstRW<[HWWriteResGroup101], (instregex "VROUNDPDr")>; -def: InstRW<[HWWriteResGroup101], (instregex "VROUNDPSr")>; -def: InstRW<[HWWriteResGroup101], (instregex "VROUNDSDr")>; -def: InstRW<[HWWriteResGroup101], (instregex "VROUNDSSr")>; -def: InstRW<[HWWriteResGroup101], (instregex "VROUNDYPDr")>; -def: InstRW<[HWWriteResGroup101], (instregex "VROUNDYPSr")>; def HWWriteResGroup102 : SchedWriteRes<[HWPort1,HWPort5]> { let Latency = 6; @@ -3775,29 +3784,35 @@ def: InstRW<[HWWriteResGroup102], (instregex "VCVTTPD2DQYrr")>; def HWWriteResGroup103 : SchedWriteRes<[HWPort1,HWPort23]> { - let Latency = 6; + let Latency = 13; let NumMicroOps = 3; let ResourceCycles = [2,1]; } def: InstRW<[HWWriteResGroup103], (instregex "ADD_FI16m")>; def: InstRW<[HWWriteResGroup103], (instregex "ADD_FI32m")>; -def: InstRW<[HWWriteResGroup103], (instregex "ROUNDPDm")>; -def: InstRW<[HWWriteResGroup103], (instregex "ROUNDPSm")>; -def: InstRW<[HWWriteResGroup103], (instregex "ROUNDSDm")>; -def: InstRW<[HWWriteResGroup103], (instregex "ROUNDSSm")>; def: InstRW<[HWWriteResGroup103], (instregex "SUBR_FI16m")>; def: InstRW<[HWWriteResGroup103], (instregex "SUBR_FI32m")>; def: InstRW<[HWWriteResGroup103], (instregex "SUB_FI16m")>; def: InstRW<[HWWriteResGroup103], (instregex "SUB_FI32m")>; -def: InstRW<[HWWriteResGroup103], (instregex "VROUNDPDm")>; -def: InstRW<[HWWriteResGroup103], (instregex "VROUNDPSm")>; -def: InstRW<[HWWriteResGroup103], (instregex "VROUNDSDm")>; -def: InstRW<[HWWriteResGroup103], (instregex "VROUNDSSm")>; def: InstRW<[HWWriteResGroup103], (instregex "VROUNDYPDm")>; def: InstRW<[HWWriteResGroup103], (instregex "VROUNDYPSm")>; +def HWWriteResGroup103_1 : SchedWriteRes<[HWPort1,HWPort23]> { + let Latency = 12; + let NumMicroOps = 3; + let ResourceCycles = [2,1]; +} +def: InstRW<[HWWriteResGroup103_1], (instregex "ROUNDPDm")>; +def: InstRW<[HWWriteResGroup103_1], (instregex "ROUNDPSm")>; +def: InstRW<[HWWriteResGroup103_1], (instregex "ROUNDSDm")>; +def: InstRW<[HWWriteResGroup103_1], (instregex "ROUNDSSm")>; +def: InstRW<[HWWriteResGroup103_1], (instregex "VROUNDPDm")>; +def: InstRW<[HWWriteResGroup103_1], (instregex "VROUNDPSm")>; +def: InstRW<[HWWriteResGroup103_1], (instregex "VROUNDSDm")>; +def: InstRW<[HWWriteResGroup103_1], (instregex "VROUNDSSm")>; + def HWWriteResGroup104 : SchedWriteRes<[HWPort1,HWPort5,HWPort23]> { - let Latency = 6; + let Latency = 12; let NumMicroOps = 3; let ResourceCycles = [1,1,1]; } @@ -3812,7 +3827,7 @@ def: InstRW<[HWWriteResGroup105], (instregex "SHRD(16|32|64)rrCL")>; def HWWriteResGroup106 : SchedWriteRes<[HWPort1,HWPort4,HWPort5,HWPort237]> { - let Latency = 6; + let Latency = 7; let NumMicroOps = 4; let ResourceCycles = [1,1,1,1]; } @@ -3833,7 +3848,7 @@ def: InstRW<[HWWriteResGroup108], (instregex "STD")>; def HWWriteResGroup109 : SchedWriteRes<[HWPort1,HWPort23,HWPort237,HWPort06,HWPort0156]> { - let Latency = 6; + let Latency = 12; let NumMicroOps = 6; let ResourceCycles = [1,1,1,1,2]; } @@ -3855,7 +3870,7 @@ def: InstRW<[HWWriteResGroup110], (instregex "VAESENCrr")>; def HWWriteResGroup111 : SchedWriteRes<[HWPort5,HWPort23]> { - let Latency = 7; + let Latency = 13; let NumMicroOps = 2; let ResourceCycles = [1,1]; } @@ -3878,14 +3893,20 @@ def: InstRW<[HWWriteResGroup112], (instregex "VMPSADBWrri")>; def HWWriteResGroup113 : SchedWriteRes<[HWPort0,HWPort5,HWPort23]> { - let Latency = 7; + let Latency = 13; let NumMicroOps = 4; let ResourceCycles = [1,2,1]; } def: InstRW<[HWWriteResGroup113], (instregex "MPSADBWrmi")>; -def: InstRW<[HWWriteResGroup113], (instregex "VMPSADBWYrmi")>; def: InstRW<[HWWriteResGroup113], (instregex "VMPSADBWrmi")>; +def HWWriteResGroup113_1 : SchedWriteRes<[HWPort0,HWPort5,HWPort23]> { + let Latency = 14; + let NumMicroOps = 4; + let ResourceCycles = [1,2,1]; +} +def: InstRW<[HWWriteResGroup113_1], (instregex "VMPSADBWYrmi")>; + def HWWriteResGroup114 : SchedWriteRes<[HWPort6,HWPort06,HWPort15,HWPort0156]> { let Latency = 7; let NumMicroOps = 7; @@ -3894,7 +3915,7 @@ def: InstRW<[HWWriteResGroup114], (instregex "LOOP")>; def HWWriteResGroup115 : SchedWriteRes<[HWPort0,HWPort1,HWPort23]> { - let Latency = 8; + let Latency = 15; let NumMicroOps = 3; let ResourceCycles = [1,1,1]; } @@ -3910,7 +3931,7 @@ def: InstRW<[HWWriteResGroup116], (instregex "VDPPDrri")>; def HWWriteResGroup117 : SchedWriteRes<[HWPort0,HWPort1,HWPort5,HWPort23]> { - let Latency = 9; + let Latency = 15; let NumMicroOps = 4; let ResourceCycles = [1,1,1,1]; } @@ -3927,16 +3948,22 @@ def: InstRW<[HWWriteResGroup118], (instregex "VPMULLDrr")>; def HWWriteResGroup119 : SchedWriteRes<[HWPort0,HWPort23]> { - let Latency = 10; + let Latency = 16; let NumMicroOps = 3; let ResourceCycles = [2,1]; } def: InstRW<[HWWriteResGroup119], (instregex "PMULLDrm")>; -def: InstRW<[HWWriteResGroup119], (instregex "VPMULLDYrm")>; def: InstRW<[HWWriteResGroup119], (instregex "VPMULLDrm")>; +def HWWriteResGroup119_1 : SchedWriteRes<[HWPort0,HWPort23]> { + let Latency = 17; + let NumMicroOps = 3; + let ResourceCycles = [2,1]; +} +def: InstRW<[HWWriteResGroup119_1], (instregex "VPMULLDYrm")>; + def HWWriteResGroup120 : SchedWriteRes<[HWPort1,HWPort23,HWPort237,HWPort06,HWPort15,HWPort0156]> { - let Latency = 10; + let Latency = 16; let NumMicroOps = 10; let ResourceCycles = [1,1,1,4,1,2]; } @@ -3952,12 +3979,18 @@ def: InstRW<[HWWriteResGroup121], (instregex "DIVSSrr")>; def HWWriteResGroup122 : SchedWriteRes<[HWPort0,HWPort23]> { - let Latency = 11; + let Latency = 17; let NumMicroOps = 2; let ResourceCycles = [1,1]; } def: InstRW<[HWWriteResGroup122], (instregex "DIVPSrm")>; -def: InstRW<[HWWriteResGroup122], (instregex "DIVSSrm")>; + +def HWWriteResGroup122_1 : SchedWriteRes<[HWPort0,HWPort23]> { + let Latency = 16; + let NumMicroOps = 2; + let ResourceCycles = [1,1]; +} +def: InstRW<[HWWriteResGroup122_1], (instregex "DIVSSrm")>; def HWWriteResGroup123 : SchedWriteRes<[HWPort0]> { let Latency = 11; @@ -3986,7 +4019,7 @@ def: InstRW<[HWWriteResGroup125], (instregex "VRSQRTPSYr")>; def HWWriteResGroup126 : SchedWriteRes<[HWPort0,HWPort23]> { - let Latency = 11; + let Latency = 17; let NumMicroOps = 4; let ResourceCycles = [3,1]; } @@ -3996,7 +4029,7 @@ def: InstRW<[HWWriteResGroup126], (instregex "VPCMPISTRM128rm")>; def HWWriteResGroup127 : SchedWriteRes<[HWPort0,HWPort5,HWPort23]> { - let Latency = 11; + let Latency = 17; let NumMicroOps = 4; let ResourceCycles = [2,1,1]; } @@ -4004,7 +4037,7 @@ def: InstRW<[HWWriteResGroup127], (instregex "VPCLMULQDQrm")>; def HWWriteResGroup128 : SchedWriteRes<[HWPort0,HWPort23,HWPort015]> { - let Latency = 11; + let Latency = 18; let NumMicroOps = 4; let ResourceCycles = [2,1,1]; } @@ -4035,7 +4068,7 @@ def: InstRW<[HWWriteResGroup131], (instregex "LOOPNE")>; def HWWriteResGroup132 : SchedWriteRes<[HWPort4,HWPort23,HWPort237,HWPort06,HWPort15,HWPort0156]> { - let Latency = 11; + let Latency = 17; let NumMicroOps = 14; let ResourceCycles = [1,1,1,4,2,5]; } @@ -4052,17 +4085,17 @@ def: InstRW<[HWWriteResGroup133], (instregex "VDIVSSrr")>; def HWWriteResGroup134 : SchedWriteRes<[HWPort0,HWPort23]> { - let Latency = 13; + let Latency = 19; let NumMicroOps = 2; let ResourceCycles = [1,1]; } +def: InstRW<[HWWriteResGroup134], (instregex "DIVSDrm")>; def: InstRW<[HWWriteResGroup134], (instregex "SQRTPSm")>; -def: InstRW<[HWWriteResGroup134], (instregex "SQRTSSm")>; def: InstRW<[HWWriteResGroup134], (instregex "VDIVPSrm")>; -def: InstRW<[HWWriteResGroup134], (instregex "VDIVSSrm")>; +def: InstRW<[HWWriteResGroup134], (instregex "VSQRTSSm")>; def HWWriteResGroup135 : SchedWriteRes<[HWPort1,HWPort23,HWPort237,HWPort06,HWPort15,HWPort0156]> { - let Latency = 13; + let Latency = 19; let NumMicroOps = 11; let ResourceCycles = [2,1,1,3,1,3]; } @@ -4088,17 +4121,15 @@ def: InstRW<[HWWriteResGroup137], (instregex "VAESIMCrr")>; def HWWriteResGroup138 : SchedWriteRes<[HWPort0,HWPort23]> { - let Latency = 14; + let Latency = 20; let NumMicroOps = 2; let ResourceCycles = [1,1]; } def: InstRW<[HWWriteResGroup138], (instregex "DIVPDrm")>; -def: InstRW<[HWWriteResGroup138], (instregex "DIVSDrm")>; def: InstRW<[HWWriteResGroup138], (instregex "VSQRTPSm")>; -def: InstRW<[HWWriteResGroup138], (instregex "VSQRTSSm")>; def HWWriteResGroup139 : SchedWriteRes<[HWPort5,HWPort23]> { - let Latency = 14; + let Latency = 20; let NumMicroOps = 3; let ResourceCycles = [2,1]; } @@ -4115,14 +4146,20 @@ def: InstRW<[HWWriteResGroup140], (instregex "VDPPSrri")>; def HWWriteResGroup141 : SchedWriteRes<[HWPort0,HWPort1,HWPort5,HWPort23]> { - let Latency = 14; + let Latency = 20; let NumMicroOps = 5; let ResourceCycles = [2,1,1,1]; } def: InstRW<[HWWriteResGroup141], (instregex "DPPSrmi")>; -def: InstRW<[HWWriteResGroup141], (instregex "VDPPSYrmi")>; def: InstRW<[HWWriteResGroup141], (instregex "VDPPSrmi")>; +def HWWriteResGroup141_1 : SchedWriteRes<[HWPort0,HWPort1,HWPort5,HWPort23]> { + let Latency = 21; + let NumMicroOps = 5; + let ResourceCycles = [2,1,1,1]; +} +def: InstRW<[HWWriteResGroup141_1], (instregex "VDPPSYrmi")>; + def HWWriteResGroup142 : SchedWriteRes<[HWPort1,HWPort06,HWPort15,HWPort0156]> { let Latency = 14; let NumMicroOps = 10; @@ -4131,14 +4168,14 @@ def: InstRW<[HWWriteResGroup142], (instregex "RCR8rCL")>; def HWWriteResGroup143 : SchedWriteRes<[HWPort23,HWPort0156]> { - let Latency = 14; + let Latency = 19; let NumMicroOps = 15; let ResourceCycles = [1,14]; } def: InstRW<[HWWriteResGroup143], (instregex "POPF16")>; def HWWriteResGroup144 : SchedWriteRes<[HWPort4,HWPort5,HWPort6,HWPort23,HWPort237,HWPort06,HWPort0156]> { - let Latency = 15; + let Latency = 21; let NumMicroOps = 8; let ResourceCycles = [1,1,1,1,1,1,2]; } @@ -4154,7 +4191,7 @@ def: InstRW<[HWWriteResGroup145], (instregex "VZEROALL")>; def HWWriteResGroup146 : SchedWriteRes<[HWPort0,HWPort4,HWPort5,HWPort23,HWPort237,HWPort06,HWPort0156]> { - let Latency = 16; + let Latency = 22; let NumMicroOps = 19; let ResourceCycles = [2,1,4,1,1,4,6]; } @@ -4184,7 +4221,7 @@ def: InstRW<[HWWriteResGroup149], (instregex "RDTSC")>; def HWWriteResGroup150 : SchedWriteRes<[HWPort0,HWPort5,HWPort23,HWPort0156]> { - let Latency = 18; + let Latency = 24; let NumMicroOps = 9; let ResourceCycles = [4,3,1,1]; } @@ -4192,7 +4229,7 @@ def: InstRW<[HWWriteResGroup150], (instregex "VPCMPESTRIrm")>; def HWWriteResGroup151 : SchedWriteRes<[HWPort6,HWPort23,HWPort0156]> { - let Latency = 18; + let Latency = 23; let NumMicroOps = 19; let ResourceCycles = [3,1,15]; } @@ -4207,7 +4244,7 @@ def: InstRW<[HWWriteResGroup152], (instregex "VPCMPESTRM128rr")>; def HWWriteResGroup153 : SchedWriteRes<[HWPort0,HWPort5,HWPort23,HWPort015,HWPort0156]> { - let Latency = 19; + let Latency = 25; let NumMicroOps = 10; let ResourceCycles = [4,3,1,1,1]; } @@ -4228,16 +4265,30 @@ def: InstRW<[HWWriteResGroup154], (instregex "VDIVSDrr")>; def HWWriteResGroup155 : SchedWriteRes<[HWPort0,HWPort23]> { - let Latency = 20; + let Latency = 27; let NumMicroOps = 2; let ResourceCycles = [1,1]; } def: InstRW<[HWWriteResGroup155], (instregex "DIVR_F32m")>; def: InstRW<[HWWriteResGroup155], (instregex "DIVR_F64m")>; -def: InstRW<[HWWriteResGroup155], (instregex "SQRTPDm")>; -def: InstRW<[HWWriteResGroup155], (instregex "SQRTSDm")>; -def: InstRW<[HWWriteResGroup155], (instregex "VDIVPDrm")>; -def: InstRW<[HWWriteResGroup155], (instregex "VDIVSDrm")>; +def: InstRW<[HWWriteResGroup155], (instregex "VSQRTPDm")>; + +def HWWriteResGroup155_1 : SchedWriteRes<[HWPort0,HWPort23]> { + let Latency = 26; + let NumMicroOps = 2; + let ResourceCycles = [1,1]; +} +def: InstRW<[HWWriteResGroup155_1], (instregex "SQRTPDm")>; +def: InstRW<[HWWriteResGroup155_1], (instregex "VDIVPDrm")>; +def: InstRW<[HWWriteResGroup155_1], (instregex "VSQRTSDm")>; + +def HWWriteResGroup155_2 : SchedWriteRes<[HWPort0,HWPort23]> { + let Latency = 25; + let NumMicroOps = 2; + let ResourceCycles = [1,1]; +} +def: InstRW<[HWWriteResGroup155_2], (instregex "SQRTSDm")>; +def: InstRW<[HWWriteResGroup155_2], (instregex "VDIVSDrm")>; def HWWriteResGroup156 : SchedWriteRes<[HWPort5,HWPort6,HWPort0156]> { let Latency = 20; @@ -4254,14 +4305,6 @@ def: InstRW<[HWWriteResGroup157], (instregex "VSQRTPDr")>; def: InstRW<[HWWriteResGroup157], (instregex "VSQRTSDr")>; -def HWWriteResGroup158 : SchedWriteRes<[HWPort0,HWPort23]> { - let Latency = 21; - let NumMicroOps = 2; - let ResourceCycles = [1,1]; -} -def: InstRW<[HWWriteResGroup158], (instregex "VSQRTPDm")>; -def: InstRW<[HWWriteResGroup158], (instregex "VSQRTSDm")>; - def HWWriteResGroup159 : SchedWriteRes<[HWPort0,HWPort015]> { let Latency = 21; let NumMicroOps = 3; @@ -4271,7 +4314,7 @@ def: InstRW<[HWWriteResGroup159], (instregex "VSQRTPSYr")>; def HWWriteResGroup160 : SchedWriteRes<[HWPort0,HWPort23,HWPort015]> { - let Latency = 21; + let Latency = 28; let NumMicroOps = 4; let ResourceCycles = [2,1,1]; } @@ -4279,7 +4322,7 @@ def: InstRW<[HWWriteResGroup160], (instregex "VSQRTPSYm")>; def HWWriteResGroup161 : SchedWriteRes<[HWPort0,HWPort1,HWPort23]> { - let Latency = 23; + let Latency = 30; let NumMicroOps = 3; let ResourceCycles = [1,1,1]; } @@ -4296,7 +4339,7 @@ def: InstRW<[HWWriteResGroup162], (instregex "DIVR_FrST0")>; def HWWriteResGroup163 : SchedWriteRes<[HWPort0,HWPort23]> { - let Latency = 24; + let Latency = 31; let NumMicroOps = 2; let ResourceCycles = [1,1]; } @@ -4304,21 +4347,21 @@ def: InstRW<[HWWriteResGroup163], (instregex "DIV_F64m")>; def HWWriteResGroup164 : SchedWriteRes<[HWPort4,HWPort6,HWPort23,HWPort237,HWPort0156]> { - let Latency = 24; + let Latency = 30; let NumMicroOps = 27; let ResourceCycles = [1,5,1,1,19]; } def: InstRW<[HWWriteResGroup164], (instregex "XSAVE64")>; def HWWriteResGroup165 : SchedWriteRes<[HWPort4,HWPort6,HWPort23,HWPort237,HWPort0156]> { - let Latency = 25; + let Latency = 31; let NumMicroOps = 28; let ResourceCycles = [1,6,1,1,19]; } def: InstRW<[HWWriteResGroup165], (instregex "XSAVE(OPT?)")>; def HWWriteResGroup166 : SchedWriteRes<[HWPort0,HWPort1,HWPort23]> { - let Latency = 27; + let Latency = 34; let NumMicroOps = 3; let ResourceCycles = [1,1,1]; } @@ -4326,7 +4369,7 @@ def: InstRW<[HWWriteResGroup166], (instregex "DIV_FI32m")>; def HWWriteResGroup167 : SchedWriteRes<[HWPort0,HWPort5,HWPort23,HWPort015]> { - let Latency = 28; + let Latency = 34; let NumMicroOps = 11; let ResourceCycles = [2,7,1,1]; } @@ -4342,7 +4385,7 @@ def: InstRW<[HWWriteResGroup168], (instregex "VAESKEYGENASSIST128rr")>; def HWWriteResGroup170 : SchedWriteRes<[HWPort5,HWPort6,HWPort23,HWPort06,HWPort0156]> { - let Latency = 30; + let Latency = 35; let NumMicroOps = 23; let ResourceCycles = [1,5,3,4,10]; } @@ -4352,7 +4395,7 @@ def: InstRW<[HWWriteResGroup170], (instregex "IN8rr")>; def HWWriteResGroup171 : SchedWriteRes<[HWPort5,HWPort6,HWPort23,HWPort237,HWPort06,HWPort0156]> { - let Latency = 30; + let Latency = 36; let NumMicroOps = 23; let ResourceCycles = [1,5,2,1,4,10]; } @@ -4377,7 +4420,7 @@ def: InstRW<[HWWriteResGroup173], (instregex "VSQRTPDYr")>; def HWWriteResGroup174 : SchedWriteRes<[HWPort0,HWPort23,HWPort015]> { - let Latency = 35; + let Latency = 42; let NumMicroOps = 4; let ResourceCycles = [2,1,1]; } @@ -4385,7 +4428,7 @@ def: InstRW<[HWWriteResGroup174], (instregex "VSQRTPDYm")>; def HWWriteResGroup175 : SchedWriteRes<[HWPort1,HWPort4,HWPort5,HWPort6,HWPort23,HWPort237,HWPort15,HWPort0156]> { - let Latency = 35; + let Latency = 41; let NumMicroOps = 18; let ResourceCycles = [1,1,2,3,1,1,1,8]; } @@ -4399,7 +4442,7 @@ def: InstRW<[HWWriteResGroup176], (instregex "RDTSCP")>; def HWWriteResGroup177 : SchedWriteRes<[HWPort0,HWPort01,HWPort23,HWPort05,HWPort06,HWPort015,HWPort0156]> { - let Latency = 56; + let Latency = 61; let NumMicroOps = 64; let ResourceCycles = [2,2,8,1,10,2,39]; } @@ -4407,14 +4450,14 @@ def: InstRW<[HWWriteResGroup177], (instregex "FLDENVm")>; def HWWriteResGroup178 : SchedWriteRes<[HWPort0,HWPort6,HWPort23,HWPort05,HWPort06,HWPort15,HWPort0156]> { - let Latency = 59; + let Latency = 64; let NumMicroOps = 88; let ResourceCycles = [4,4,31,1,2,1,45]; } def: InstRW<[HWWriteResGroup178], (instregex "FXRSTOR64")>; def HWWriteResGroup179 : SchedWriteRes<[HWPort0,HWPort6,HWPort23,HWPort05,HWPort06,HWPort15,HWPort0156]> { - let Latency = 59; + let Latency = 64; let NumMicroOps = 90; let ResourceCycles = [4,2,33,1,2,1,47]; } @@ -4442,11 +4485,81 @@ def: InstRW<[HWWriteResGroup182], (instregex "IDIV(16|32|64)r")>; def HWWriteResGroup183 : SchedWriteRes<[HWPort0,HWPort1,HWPort4,HWPort5,HWPort6,HWPort237,HWPort06,HWPort0156]> { - let Latency = 114; + let Latency = 115; let NumMicroOps = 100; let ResourceCycles = [9,9,11,8,1,11,21,30]; } def: InstRW<[HWWriteResGroup183], (instregex "FSTENVm")>; def: InstRW<[HWWriteResGroup183], (instregex "FSTENVm")>; +def HWWriteResGroup184 : SchedWriteRes<[HWPort0, HWPort5, HWPort15, HWPort015, HWPort06, HWPort23]> { + let Latency = 26; + let NumMicroOps = 12; + let ResourceCycles = [2,2,1,3,2,2]; +} +def: InstRW<[HWWriteResGroup184], (instregex "VGATHERDPDrm")>; +def: InstRW<[HWWriteResGroup184], (instregex "VPGATHERDQrm")>; +def: InstRW<[HWWriteResGroup184], (instregex "VPGATHERDDrm")>; + +def HWWriteResGroup185 : SchedWriteRes<[HWPort0, HWPort5, HWPort06, HWPort15, HWPort015, HWPort23]> { + let Latency = 24; + let NumMicroOps = 22; + let ResourceCycles = [5,3,4,1,5,4]; +} +def: InstRW<[HWWriteResGroup185], (instregex "VGATHERQPDYrm")>; +def: InstRW<[HWWriteResGroup185], (instregex "VPGATHERQQYrm")>; + +def HWWriteResGroup186 : SchedWriteRes<[HWPort0, HWPort5, HWPort06, HWPort15, HWPort015, HWPort23]> { + let Latency = 28; + let NumMicroOps = 22; + let ResourceCycles = [5,3,4,1,5,4]; +} +def: InstRW<[HWWriteResGroup186], (instregex "VPGATHERQDYrm")>; + +def HWWriteResGroup187 : SchedWriteRes<[HWPort0, HWPort5, HWPort06, HWPort15, HWPort015, HWPort23]> { + let Latency = 25; + let NumMicroOps = 22; + let ResourceCycles = [5,3,4,1,5,4]; +} +def: InstRW<[HWWriteResGroup187], (instregex "VPGATHERQDrm")>; + +def HWWriteResGroup188 : SchedWriteRes<[HWPort0, HWPort5, HWPort06, HWPort15, HWPort015, HWPort23]> { + let Latency = 27; + let NumMicroOps = 20; + let ResourceCycles = [3,3,4,1,5,4]; +} +def: InstRW<[HWWriteResGroup188], (instregex "VGATHERDPDYrm")>; +def: InstRW<[HWWriteResGroup188], (instregex "VPGATHERDQYrm")>; + +def HWWriteResGroup189 : SchedWriteRes<[HWPort0, HWPort5, HWPort06, HWPort15, HWPort015, HWPort23]> { + let Latency = 27; + let NumMicroOps = 34; + let ResourceCycles = [5,3,8,1,9,8]; +} +def: InstRW<[HWWriteResGroup189], (instregex "VGATHERDPSYrm")>; +def: InstRW<[HWWriteResGroup189], (instregex "VPGATHERDDYrm")>; + +def HWWriteResGroup190 : SchedWriteRes<[HWPort0, HWPort5, HWPort06, HWPort15, HWPort015, HWPort23]> { + let Latency = 23; + let NumMicroOps = 14; + let ResourceCycles = [3,3,2,1,3,2]; +} +def: InstRW<[HWWriteResGroup190], (instregex "VGATHERQPDrm")>; +def: InstRW<[HWWriteResGroup190], (instregex "VPGATHERQQrm")>; + +def HWWriteResGroup191 : SchedWriteRes<[HWPort0, HWPort5, HWPort06, HWPort15, HWPort015, HWPort23]> { + let Latency = 28; + let NumMicroOps = 15; + let ResourceCycles = [3,3,2,1,4,2]; +} +def: InstRW<[HWWriteResGroup191], (instregex "VGATHERQPSYrm")>; + +def HWWriteResGroup192 : SchedWriteRes<[HWPort0, HWPort5, HWPort06, HWPort15, HWPort015, HWPort23]> { + let Latency = 25; + let NumMicroOps = 15; + let ResourceCycles = [3,3,2,1,4,2]; +} +def: InstRW<[HWWriteResGroup192], (instregex "VGATHERQPSrm")>; +def: InstRW<[HWWriteResGroup192], (instregex "VGATHERDPSrm")>; + } // SchedModel Index: test/CodeGen/X86/aes-schedule.ll =================================================================== --- test/CodeGen/X86/aes-schedule.ll +++ test/CodeGen/X86/aes-schedule.ll @@ -32,8 +32,8 @@ ; HASWELL-LABEL: test_aesdec: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vaesdec %xmm1, %xmm0, %xmm0 # sched: [7:1.00] -; HASWELL-NEXT: vaesdec (%rdi), %xmm0, %xmm0 # sched: [7:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vaesdec (%rdi), %xmm0, %xmm0 # sched: [13:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_aesdec: ; BROADWELL: # %bb.0: @@ -87,8 +87,8 @@ ; HASWELL-LABEL: test_aesdeclast: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vaesdeclast %xmm1, %xmm0, %xmm0 # sched: [7:1.00] -; HASWELL-NEXT: vaesdeclast (%rdi), %xmm0, %xmm0 # sched: [7:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vaesdeclast (%rdi), %xmm0, %xmm0 # sched: [13:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_aesdeclast: ; BROADWELL: # %bb.0: @@ -142,8 +142,8 @@ ; HASWELL-LABEL: test_aesenc: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vaesenc %xmm1, %xmm0, %xmm0 # sched: [7:1.00] -; HASWELL-NEXT: vaesenc (%rdi), %xmm0, %xmm0 # sched: [7:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vaesenc (%rdi), %xmm0, %xmm0 # sched: [13:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_aesenc: ; BROADWELL: # %bb.0: @@ -197,8 +197,8 @@ ; HASWELL-LABEL: test_aesenclast: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vaesenclast %xmm1, %xmm0, %xmm0 # sched: [7:1.00] -; HASWELL-NEXT: vaesenclast (%rdi), %xmm0, %xmm0 # sched: [7:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vaesenclast (%rdi), %xmm0, %xmm0 # sched: [13:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_aesenclast: ; BROADWELL: # %bb.0: @@ -255,9 +255,9 @@ ; HASWELL-LABEL: test_aesimc: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vaesimc %xmm0, %xmm0 # sched: [14:2.00] -; HASWELL-NEXT: vaesimc (%rdi), %xmm1 # sched: [14:2.00] +; HASWELL-NEXT: vaesimc (%rdi), %xmm1 # sched: [20:2.00] ; HASWELL-NEXT: vpor %xmm1, %xmm0, %xmm0 # sched: [1:0.33] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_aesimc: ; BROADWELL: # %bb.0: @@ -319,9 +319,9 @@ ; HASWELL-LABEL: test_aeskeygenassist: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vaeskeygenassist $7, %xmm0, %xmm0 # sched: [29:7.00] -; HASWELL-NEXT: vaeskeygenassist $7, (%rdi), %xmm1 # sched: [28:7.00] +; HASWELL-NEXT: vaeskeygenassist $7, (%rdi), %xmm1 # sched: [34:7.00] ; HASWELL-NEXT: vpor %xmm1, %xmm0, %xmm0 # sched: [1:0.33] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_aeskeygenassist: ; BROADWELL: # %bb.0: Index: test/CodeGen/X86/avx-schedule.ll =================================================================== --- test/CodeGen/X86/avx-schedule.ll +++ test/CodeGen/X86/avx-schedule.ll @@ -25,8 +25,8 @@ ; HASWELL-LABEL: test_addpd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vaddpd %ymm1, %ymm0, %ymm0 # sched: [3:1.00] -; HASWELL-NEXT: vaddpd (%rdi), %ymm0, %ymm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vaddpd (%rdi), %ymm0, %ymm0 # sched: [10:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_addpd: ; BROADWELL: # %bb.0: @@ -79,8 +79,8 @@ ; HASWELL-LABEL: test_addps: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vaddps %ymm1, %ymm0, %ymm0 # sched: [3:1.00] -; HASWELL-NEXT: vaddps (%rdi), %ymm0, %ymm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vaddps (%rdi), %ymm0, %ymm0 # sched: [10:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_addps: ; BROADWELL: # %bb.0: @@ -133,8 +133,8 @@ ; HASWELL-LABEL: test_addsubpd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vaddsubpd %ymm1, %ymm0, %ymm0 # sched: [3:1.00] -; HASWELL-NEXT: vaddsubpd (%rdi), %ymm0, %ymm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vaddsubpd (%rdi), %ymm0, %ymm0 # sched: [10:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_addsubpd: ; BROADWELL: # %bb.0: @@ -188,8 +188,8 @@ ; HASWELL-LABEL: test_addsubps: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vaddsubps %ymm1, %ymm0, %ymm0 # sched: [3:1.00] -; HASWELL-NEXT: vaddsubps (%rdi), %ymm0, %ymm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vaddsubps (%rdi), %ymm0, %ymm0 # sched: [10:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_addsubps: ; BROADWELL: # %bb.0: @@ -245,9 +245,9 @@ ; HASWELL-LABEL: test_andnotpd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vandnpd %ymm1, %ymm0, %ymm0 # sched: [1:1.00] -; HASWELL-NEXT: vandnpd (%rdi), %ymm0, %ymm0 # sched: [1:1.00] +; HASWELL-NEXT: vandnpd (%rdi), %ymm0, %ymm0 # sched: [8:1.00] ; HASWELL-NEXT: vaddpd %ymm0, %ymm1, %ymm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_andnotpd: ; BROADWELL: # %bb.0: @@ -314,9 +314,9 @@ ; HASWELL-LABEL: test_andnotps: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vandnps %ymm1, %ymm0, %ymm0 # sched: [1:1.00] -; HASWELL-NEXT: vandnps (%rdi), %ymm0, %ymm0 # sched: [1:1.00] +; HASWELL-NEXT: vandnps (%rdi), %ymm0, %ymm0 # sched: [8:1.00] ; HASWELL-NEXT: vaddps %ymm0, %ymm1, %ymm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_andnotps: ; BROADWELL: # %bb.0: @@ -383,9 +383,9 @@ ; HASWELL-LABEL: test_andpd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vandpd %ymm1, %ymm0, %ymm0 # sched: [1:1.00] -; HASWELL-NEXT: vandpd (%rdi), %ymm0, %ymm0 # sched: [1:1.00] +; HASWELL-NEXT: vandpd (%rdi), %ymm0, %ymm0 # sched: [8:1.00] ; HASWELL-NEXT: vaddpd %ymm0, %ymm1, %ymm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_andpd: ; BROADWELL: # %bb.0: @@ -450,9 +450,9 @@ ; HASWELL-LABEL: test_andps: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vandps %ymm1, %ymm0, %ymm0 # sched: [1:1.00] -; HASWELL-NEXT: vandps (%rdi), %ymm0, %ymm0 # sched: [1:1.00] +; HASWELL-NEXT: vandps (%rdi), %ymm0, %ymm0 # sched: [8:1.00] ; HASWELL-NEXT: vaddps %ymm0, %ymm1, %ymm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_andps: ; BROADWELL: # %bb.0: @@ -518,8 +518,8 @@ ; HASWELL: # %bb.0: ; HASWELL-NEXT: vblendpd {{.*#+}} ymm0 = ymm0[0],ymm1[1,2],ymm0[3] sched: [1:0.33] ; HASWELL-NEXT: vaddpd %ymm0, %ymm1, %ymm0 # sched: [3:1.00] -; HASWELL-NEXT: vblendpd {{.*#+}} ymm0 = ymm0[0],mem[1,2],ymm0[3] sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vblendpd {{.*#+}} ymm0 = ymm0[0],mem[1,2],ymm0[3] sched: [8:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_blendpd: ; BROADWELL: # %bb.0: @@ -578,8 +578,8 @@ ; HASWELL-LABEL: test_blendps: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vblendps {{.*#+}} ymm0 = ymm0[0],ymm1[1,2],ymm0[3,4,5,6,7] sched: [1:0.33] -; HASWELL-NEXT: vblendps {{.*#+}} ymm0 = ymm0[0,1],mem[2],ymm0[3],mem[4,5,6],ymm0[7] sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vblendps {{.*#+}} ymm0 = ymm0[0,1],mem[2],ymm0[3],mem[4,5,6],ymm0[7] sched: [8:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_blendps: ; BROADWELL: # %bb.0: @@ -632,8 +632,8 @@ ; HASWELL-LABEL: test_blendvpd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vblendvpd %ymm2, %ymm1, %ymm0, %ymm0 # sched: [2:2.00] -; HASWELL-NEXT: vblendvpd %ymm2, (%rdi), %ymm0, %ymm0 # sched: [2:2.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vblendvpd %ymm2, (%rdi), %ymm0, %ymm0 # sched: [9:2.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_blendvpd: ; BROADWELL: # %bb.0: @@ -687,8 +687,8 @@ ; HASWELL-LABEL: test_blendvps: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vblendvps %ymm2, %ymm1, %ymm0, %ymm0 # sched: [2:2.00] -; HASWELL-NEXT: vblendvps %ymm2, (%rdi), %ymm0, %ymm0 # sched: [2:2.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vblendvps %ymm2, (%rdi), %ymm0, %ymm0 # sched: [9:2.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_blendvps: ; BROADWELL: # %bb.0: @@ -739,8 +739,8 @@ ; ; HASWELL-LABEL: test_broadcastf128: ; HASWELL: # %bb.0: -; HASWELL-NEXT: vbroadcastf128 {{.*#+}} ymm0 = mem[0,1,0,1] sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vbroadcastf128 {{.*#+}} ymm0 = mem[0,1,0,1] sched: [7:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_broadcastf128: ; BROADWELL: # %bb.0: @@ -784,8 +784,8 @@ ; ; HASWELL-LABEL: test_broadcastsd_ymm: ; HASWELL: # %bb.0: -; HASWELL-NEXT: vbroadcastsd (%rdi), %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vbroadcastsd (%rdi), %ymm0 # sched: [7:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_broadcastsd_ymm: ; BROADWELL: # %bb.0: @@ -830,8 +830,8 @@ ; ; HASWELL-LABEL: test_broadcastss: ; HASWELL: # %bb.0: -; HASWELL-NEXT: vbroadcastss (%rdi), %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vbroadcastss (%rdi), %xmm0 # sched: [6:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_broadcastss: ; BROADWELL: # %bb.0: @@ -876,8 +876,8 @@ ; ; HASWELL-LABEL: test_broadcastss_ymm: ; HASWELL: # %bb.0: -; HASWELL-NEXT: vbroadcastss (%rdi), %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vbroadcastss (%rdi), %ymm0 # sched: [7:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_broadcastss_ymm: ; BROADWELL: # %bb.0: @@ -927,9 +927,9 @@ ; HASWELL-LABEL: test_cmppd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vcmpeqpd %ymm1, %ymm0, %ymm1 # sched: [3:1.00] -; HASWELL-NEXT: vcmpeqpd (%rdi), %ymm0, %ymm0 # sched: [3:1.00] +; HASWELL-NEXT: vcmpeqpd (%rdi), %ymm0, %ymm0 # sched: [10:1.00] ; HASWELL-NEXT: vorpd %ymm0, %ymm1, %ymm0 # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_cmppd: ; BROADWELL: # %bb.0: @@ -995,9 +995,9 @@ ; HASWELL-LABEL: test_cmpps: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vcmpeqps %ymm1, %ymm0, %ymm1 # sched: [3:1.00] -; HASWELL-NEXT: vcmpeqps (%rdi), %ymm0, %ymm0 # sched: [3:1.00] +; HASWELL-NEXT: vcmpeqps (%rdi), %ymm0, %ymm0 # sched: [10:1.00] ; HASWELL-NEXT: vorps %ymm0, %ymm1, %ymm0 # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_cmpps: ; BROADWELL: # %bb.0: @@ -1063,9 +1063,9 @@ ; HASWELL-LABEL: test_cvtdq2pd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vcvtdq2pd %xmm0, %ymm0 # sched: [6:1.00] -; HASWELL-NEXT: vcvtdq2pd (%rdi), %ymm1 # sched: [6:1.00] +; HASWELL-NEXT: vcvtdq2pd (%rdi), %ymm1 # sched: [12:1.00] ; HASWELL-NEXT: vaddpd %ymm1, %ymm0, %ymm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_cvtdq2pd: ; BROADWELL: # %bb.0: @@ -1128,9 +1128,9 @@ ; HASWELL-LABEL: test_cvtdq2ps: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vcvtdq2ps %ymm0, %ymm0 # sched: [3:1.00] -; HASWELL-NEXT: vcvtdq2ps (%rdi), %ymm1 # sched: [3:1.00] +; HASWELL-NEXT: vcvtdq2ps (%rdi), %ymm1 # sched: [10:1.00] ; HASWELL-NEXT: vaddps %ymm1, %ymm0, %ymm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_cvtdq2ps: ; BROADWELL: # %bb.0: @@ -1191,9 +1191,9 @@ ; HASWELL-LABEL: test_cvtpd2dq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vcvtpd2dq %ymm0, %xmm0 # sched: [6:1.00] -; HASWELL-NEXT: vcvtpd2dqy (%rdi), %xmm1 # sched: [7:1.00] +; HASWELL-NEXT: vcvtpd2dqy (%rdi), %xmm1 # sched: [8:1.00] ; HASWELL-NEXT: vinsertf128 $1, %xmm1, %ymm0, %ymm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_cvtpd2dq: ; BROADWELL: # %bb.0: @@ -1255,9 +1255,9 @@ ; HASWELL-LABEL: test_cvttpd2dq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vcvttpd2dq %ymm0, %xmm0 # sched: [6:1.00] -; HASWELL-NEXT: vcvttpd2dqy (%rdi), %xmm1 # sched: [7:1.00] +; HASWELL-NEXT: vcvttpd2dqy (%rdi), %xmm1 # sched: [8:1.00] ; HASWELL-NEXT: vinsertf128 $1, %xmm1, %ymm0, %ymm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_cvttpd2dq: ; BROADWELL: # %bb.0: @@ -1318,9 +1318,9 @@ ; HASWELL-LABEL: test_cvtpd2ps: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vcvtpd2ps %ymm0, %xmm0 # sched: [6:1.00] -; HASWELL-NEXT: vcvtpd2psy (%rdi), %xmm1 # sched: [7:1.00] +; HASWELL-NEXT: vcvtpd2psy (%rdi), %xmm1 # sched: [8:1.00] ; HASWELL-NEXT: vinsertf128 $1, %xmm1, %ymm0, %ymm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_cvtpd2ps: ; BROADWELL: # %bb.0: @@ -1381,9 +1381,9 @@ ; HASWELL-LABEL: test_cvtps2dq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vcvtps2dq %ymm0, %ymm0 # sched: [3:1.00] -; HASWELL-NEXT: vcvtps2dq (%rdi), %ymm1 # sched: [3:1.00] +; HASWELL-NEXT: vcvtps2dq (%rdi), %ymm1 # sched: [10:1.00] ; HASWELL-NEXT: vorpd %ymm1, %ymm0, %ymm0 # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_cvtps2dq: ; BROADWELL: # %bb.0: @@ -1445,9 +1445,9 @@ ; HASWELL-LABEL: test_cvttps2dq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vcvttps2dq %ymm0, %ymm0 # sched: [3:1.00] -; HASWELL-NEXT: vcvttps2dq (%rdi), %ymm1 # sched: [3:1.00] +; HASWELL-NEXT: vcvttps2dq (%rdi), %ymm1 # sched: [10:1.00] ; HASWELL-NEXT: vorps %ymm1, %ymm0, %ymm0 # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_cvttps2dq: ; BROADWELL: # %bb.0: @@ -1506,8 +1506,8 @@ ; HASWELL-LABEL: test_divpd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vdivpd %ymm1, %ymm0, %ymm0 # sched: [35:2.00] -; HASWELL-NEXT: vdivpd (%rdi), %ymm0, %ymm0 # sched: [35:2.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vdivpd (%rdi), %ymm0, %ymm0 # sched: [42:2.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_divpd: ; BROADWELL: # %bb.0: @@ -1560,8 +1560,8 @@ ; HASWELL-LABEL: test_divps: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vdivps %ymm1, %ymm0, %ymm0 # sched: [21:2.00] -; HASWELL-NEXT: vdivps (%rdi), %ymm0, %ymm0 # sched: [21:2.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vdivps (%rdi), %ymm0, %ymm0 # sched: [28:2.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_divps: ; BROADWELL: # %bb.0: @@ -1614,8 +1614,8 @@ ; HASWELL-LABEL: test_dpps: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vdpps $7, %ymm1, %ymm0, %ymm0 # sched: [14:2.00] -; HASWELL-NEXT: vdpps $7, (%rdi), %ymm0, %ymm0 # sched: [14:2.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vdpps $7, (%rdi), %ymm0, %ymm0 # sched: [21:2.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_dpps: ; BROADWELL: # %bb.0: @@ -1673,7 +1673,7 @@ ; HASWELL-NEXT: vextractf128 $1, %ymm0, %xmm0 # sched: [3:1.00] ; HASWELL-NEXT: vextractf128 $1, %ymm1, (%rdi) # sched: [1:1.00] ; HASWELL-NEXT: vzeroupper # sched: [4:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_extractf128: ; BROADWELL: # %bb.0: @@ -1730,8 +1730,8 @@ ; HASWELL-LABEL: test_haddpd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vhaddpd %ymm1, %ymm0, %ymm0 # sched: [5:2.00] -; HASWELL-NEXT: vhaddpd (%rdi), %ymm0, %ymm0 # sched: [5:2.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vhaddpd (%rdi), %ymm0, %ymm0 # sched: [12:2.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_haddpd: ; BROADWELL: # %bb.0: @@ -1785,8 +1785,8 @@ ; HASWELL-LABEL: test_haddps: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vhaddps %ymm1, %ymm0, %ymm0 # sched: [5:2.00] -; HASWELL-NEXT: vhaddps (%rdi), %ymm0, %ymm0 # sched: [5:2.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vhaddps (%rdi), %ymm0, %ymm0 # sched: [12:2.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_haddps: ; BROADWELL: # %bb.0: @@ -1840,8 +1840,8 @@ ; HASWELL-LABEL: test_hsubpd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vhsubpd %ymm1, %ymm0, %ymm0 # sched: [5:2.00] -; HASWELL-NEXT: vhsubpd (%rdi), %ymm0, %ymm0 # sched: [5:2.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vhsubpd (%rdi), %ymm0, %ymm0 # sched: [12:2.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_hsubpd: ; BROADWELL: # %bb.0: @@ -1895,8 +1895,8 @@ ; HASWELL-LABEL: test_hsubps: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vhsubps %ymm1, %ymm0, %ymm0 # sched: [5:2.00] -; HASWELL-NEXT: vhsubps (%rdi), %ymm0, %ymm0 # sched: [5:2.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vhsubps (%rdi), %ymm0, %ymm0 # sched: [12:2.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_hsubps: ; BROADWELL: # %bb.0: @@ -1952,9 +1952,9 @@ ; HASWELL-LABEL: test_insertf128: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vinsertf128 $1, %xmm1, %ymm0, %ymm1 # sched: [3:1.00] -; HASWELL-NEXT: vinsertf128 $1, (%rdi), %ymm0, %ymm0 # sched: [1:0.50] +; HASWELL-NEXT: vinsertf128 $1, (%rdi), %ymm0, %ymm0 # sched: [7:0.50] ; HASWELL-NEXT: vaddps %ymm0, %ymm1, %ymm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_insertf128: ; BROADWELL: # %bb.0: @@ -2012,8 +2012,8 @@ ; ; HASWELL-LABEL: test_lddqu: ; HASWELL: # %bb.0: -; HASWELL-NEXT: vlddqu (%rdi), %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vlddqu (%rdi), %ymm0 # sched: [7:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_lddqu: ; BROADWELL: # %bb.0: @@ -2061,10 +2061,10 @@ ; ; HASWELL-LABEL: test_maskmovpd: ; HASWELL: # %bb.0: -; HASWELL-NEXT: vmaskmovpd (%rdi), %xmm0, %xmm2 # sched: [2:2.00] -; HASWELL-NEXT: vmaskmovpd %xmm1, %xmm0, (%rdi) # sched: [4:1.00] +; HASWELL-NEXT: vmaskmovpd (%rdi), %xmm0, %xmm2 # sched: [8:2.00] +; HASWELL-NEXT: vmaskmovpd %xmm1, %xmm0, (%rdi) # sched: [5:1.00] ; HASWELL-NEXT: vmovapd %xmm2, %xmm0 # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_maskmovpd: ; BROADWELL: # %bb.0: @@ -2124,10 +2124,10 @@ ; ; HASWELL-LABEL: test_maskmovpd_ymm: ; HASWELL: # %bb.0: -; HASWELL-NEXT: vmaskmovpd (%rdi), %ymm0, %ymm2 # sched: [2:2.00] -; HASWELL-NEXT: vmaskmovpd %ymm1, %ymm0, (%rdi) # sched: [4:1.00] +; HASWELL-NEXT: vmaskmovpd (%rdi), %ymm0, %ymm2 # sched: [9:2.00] +; HASWELL-NEXT: vmaskmovpd %ymm1, %ymm0, (%rdi) # sched: [5:1.00] ; HASWELL-NEXT: vmovapd %ymm2, %ymm0 # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_maskmovpd_ymm: ; BROADWELL: # %bb.0: @@ -2187,10 +2187,10 @@ ; ; HASWELL-LABEL: test_maskmovps: ; HASWELL: # %bb.0: -; HASWELL-NEXT: vmaskmovps (%rdi), %xmm0, %xmm2 # sched: [2:2.00] -; HASWELL-NEXT: vmaskmovps %xmm1, %xmm0, (%rdi) # sched: [4:1.00] +; HASWELL-NEXT: vmaskmovps (%rdi), %xmm0, %xmm2 # sched: [8:2.00] +; HASWELL-NEXT: vmaskmovps %xmm1, %xmm0, (%rdi) # sched: [5:1.00] ; HASWELL-NEXT: vmovaps %xmm2, %xmm0 # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_maskmovps: ; BROADWELL: # %bb.0: @@ -2250,10 +2250,10 @@ ; ; HASWELL-LABEL: test_maskmovps_ymm: ; HASWELL: # %bb.0: -; HASWELL-NEXT: vmaskmovps (%rdi), %ymm0, %ymm2 # sched: [2:2.00] -; HASWELL-NEXT: vmaskmovps %ymm1, %ymm0, (%rdi) # sched: [4:1.00] +; HASWELL-NEXT: vmaskmovps (%rdi), %ymm0, %ymm2 # sched: [9:2.00] +; HASWELL-NEXT: vmaskmovps %ymm1, %ymm0, (%rdi) # sched: [5:1.00] ; HASWELL-NEXT: vmovaps %ymm2, %ymm0 # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_maskmovps_ymm: ; BROADWELL: # %bb.0: @@ -2312,8 +2312,8 @@ ; HASWELL-LABEL: test_maxpd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vmaxpd %ymm1, %ymm0, %ymm0 # sched: [3:1.00] -; HASWELL-NEXT: vmaxpd (%rdi), %ymm0, %ymm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vmaxpd (%rdi), %ymm0, %ymm0 # sched: [10:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_maxpd: ; BROADWELL: # %bb.0: @@ -2367,8 +2367,8 @@ ; HASWELL-LABEL: test_maxps: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vmaxps %ymm1, %ymm0, %ymm0 # sched: [3:1.00] -; HASWELL-NEXT: vmaxps (%rdi), %ymm0, %ymm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vmaxps (%rdi), %ymm0, %ymm0 # sched: [10:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_maxps: ; BROADWELL: # %bb.0: @@ -2422,8 +2422,8 @@ ; HASWELL-LABEL: test_minpd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vminpd %ymm1, %ymm0, %ymm0 # sched: [3:1.00] -; HASWELL-NEXT: vminpd (%rdi), %ymm0, %ymm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vminpd (%rdi), %ymm0, %ymm0 # sched: [10:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_minpd: ; BROADWELL: # %bb.0: @@ -2477,8 +2477,8 @@ ; HASWELL-LABEL: test_minps: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vminps %ymm1, %ymm0, %ymm0 # sched: [3:1.00] -; HASWELL-NEXT: vminps (%rdi), %ymm0, %ymm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vminps (%rdi), %ymm0, %ymm0 # sched: [10:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_minps: ; BROADWELL: # %bb.0: @@ -2533,10 +2533,10 @@ ; ; HASWELL-LABEL: test_movapd: ; HASWELL: # %bb.0: -; HASWELL-NEXT: vmovapd (%rdi), %ymm0 # sched: [1:0.50] +; HASWELL-NEXT: vmovapd (%rdi), %ymm0 # sched: [7:0.50] ; HASWELL-NEXT: vaddpd %ymm0, %ymm0, %ymm0 # sched: [3:1.00] ; HASWELL-NEXT: vmovapd %ymm0, (%rsi) # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_movapd: ; BROADWELL: # %bb.0: @@ -2595,10 +2595,10 @@ ; ; HASWELL-LABEL: test_movaps: ; HASWELL: # %bb.0: -; HASWELL-NEXT: vmovaps (%rdi), %ymm0 # sched: [1:0.50] +; HASWELL-NEXT: vmovaps (%rdi), %ymm0 # sched: [7:0.50] ; HASWELL-NEXT: vaddps %ymm0, %ymm0, %ymm0 # sched: [3:1.00] ; HASWELL-NEXT: vmovaps %ymm0, (%rsi) # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_movaps: ; BROADWELL: # %bb.0: @@ -2658,9 +2658,9 @@ ; HASWELL-LABEL: test_movddup: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vmovddup {{.*#+}} ymm0 = ymm0[0,0,2,2] sched: [1:1.00] -; HASWELL-NEXT: vmovddup {{.*#+}} ymm1 = mem[0,0,2,2] sched: [1:0.50] +; HASWELL-NEXT: vmovddup {{.*#+}} ymm1 = mem[0,0,2,2] sched: [7:0.50] ; HASWELL-NEXT: vaddpd %ymm1, %ymm0, %ymm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_movddup: ; BROADWELL: # %bb.0: @@ -2720,7 +2720,7 @@ ; HASWELL: # %bb.0: ; HASWELL-NEXT: vmovmskpd %ymm0, %eax # sched: [3:1.00] ; HASWELL-NEXT: vzeroupper # sched: [4:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_movmskpd: ; BROADWELL: # %bb.0: @@ -2772,7 +2772,7 @@ ; HASWELL: # %bb.0: ; HASWELL-NEXT: vmovmskps %ymm0, %eax # sched: [3:1.00] ; HASWELL-NEXT: vzeroupper # sched: [4:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_movmskps: ; BROADWELL: # %bb.0: @@ -2830,7 +2830,7 @@ ; HASWELL-NEXT: vmovntdq %ymm0, (%rdi) # sched: [1:1.00] ; HASWELL-NEXT: #NO_APP ; HASWELL-NEXT: vzeroupper # sched: [4:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_movntdq: ; BROADWELL: # %bb.0: @@ -2891,7 +2891,7 @@ ; HASWELL: # %bb.0: ; HASWELL-NEXT: vaddpd %ymm0, %ymm0, %ymm0 # sched: [3:1.00] ; HASWELL-NEXT: vmovntpd %ymm0, (%rdi) # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_movntpd: ; BROADWELL: # %bb.0: @@ -2944,7 +2944,7 @@ ; HASWELL: # %bb.0: ; HASWELL-NEXT: vaddps %ymm0, %ymm0, %ymm0 # sched: [3:1.00] ; HASWELL-NEXT: vmovntps %ymm0, (%rdi) # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_movntps: ; BROADWELL: # %bb.0: @@ -2998,9 +2998,9 @@ ; HASWELL-LABEL: test_movshdup: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vmovshdup {{.*#+}} ymm0 = ymm0[1,1,3,3,5,5,7,7] sched: [1:1.00] -; HASWELL-NEXT: vmovshdup {{.*#+}} ymm1 = mem[1,1,3,3,5,5,7,7] sched: [1:0.50] +; HASWELL-NEXT: vmovshdup {{.*#+}} ymm1 = mem[1,1,3,3,5,5,7,7] sched: [7:0.50] ; HASWELL-NEXT: vaddps %ymm1, %ymm0, %ymm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_movshdup: ; BROADWELL: # %bb.0: @@ -3061,9 +3061,9 @@ ; HASWELL-LABEL: test_movsldup: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vmovsldup {{.*#+}} ymm0 = ymm0[0,0,2,2,4,4,6,6] sched: [1:1.00] -; HASWELL-NEXT: vmovsldup {{.*#+}} ymm1 = mem[0,0,2,2,4,4,6,6] sched: [1:0.50] +; HASWELL-NEXT: vmovsldup {{.*#+}} ymm1 = mem[0,0,2,2,4,4,6,6] sched: [7:0.50] ; HASWELL-NEXT: vaddps %ymm1, %ymm0, %ymm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_movsldup: ; BROADWELL: # %bb.0: @@ -3125,10 +3125,10 @@ ; ; HASWELL-LABEL: test_movupd: ; HASWELL: # %bb.0: -; HASWELL-NEXT: vmovupd (%rdi), %ymm0 # sched: [1:0.50] +; HASWELL-NEXT: vmovupd (%rdi), %ymm0 # sched: [7:0.50] ; HASWELL-NEXT: vaddpd %ymm0, %ymm0, %ymm0 # sched: [3:1.00] ; HASWELL-NEXT: vmovupd %ymm0, (%rsi) # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_movupd: ; BROADWELL: # %bb.0: @@ -3189,10 +3189,10 @@ ; ; HASWELL-LABEL: test_movups: ; HASWELL: # %bb.0: -; HASWELL-NEXT: vmovups (%rdi), %ymm0 # sched: [1:0.50] +; HASWELL-NEXT: vmovups (%rdi), %ymm0 # sched: [7:0.50] ; HASWELL-NEXT: vaddps %ymm0, %ymm0, %ymm0 # sched: [3:1.00] ; HASWELL-NEXT: vmovups %ymm0, (%rsi) # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_movups: ; BROADWELL: # %bb.0: @@ -3250,8 +3250,8 @@ ; HASWELL-LABEL: test_mulpd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vmulpd %ymm1, %ymm0, %ymm0 # sched: [5:0.50] -; HASWELL-NEXT: vmulpd (%rdi), %ymm0, %ymm0 # sched: [5:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vmulpd (%rdi), %ymm0, %ymm0 # sched: [12:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_mulpd: ; BROADWELL: # %bb.0: @@ -3304,8 +3304,8 @@ ; HASWELL-LABEL: test_mulps: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vmulps %ymm1, %ymm0, %ymm0 # sched: [5:0.50] -; HASWELL-NEXT: vmulps (%rdi), %ymm0, %ymm0 # sched: [5:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vmulps (%rdi), %ymm0, %ymm0 # sched: [12:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_mulps: ; BROADWELL: # %bb.0: @@ -3360,9 +3360,9 @@ ; HASWELL-LABEL: orpd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vorpd %ymm1, %ymm0, %ymm0 # sched: [1:1.00] -; HASWELL-NEXT: vorpd (%rdi), %ymm0, %ymm0 # sched: [1:1.00] +; HASWELL-NEXT: vorpd (%rdi), %ymm0, %ymm0 # sched: [8:1.00] ; HASWELL-NEXT: vaddpd %ymm0, %ymm1, %ymm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: orpd: ; BROADWELL: # %bb.0: @@ -3427,9 +3427,9 @@ ; HASWELL-LABEL: test_orps: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vorps %ymm1, %ymm0, %ymm0 # sched: [1:1.00] -; HASWELL-NEXT: vorps (%rdi), %ymm0, %ymm0 # sched: [1:1.00] +; HASWELL-NEXT: vorps (%rdi), %ymm0, %ymm0 # sched: [8:1.00] ; HASWELL-NEXT: vaddps %ymm0, %ymm1, %ymm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_orps: ; BROADWELL: # %bb.0: @@ -3494,9 +3494,9 @@ ; HASWELL-LABEL: test_perm2f128: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vperm2f128 {{.*#+}} ymm1 = ymm0[2,3],ymm1[0,1] sched: [3:1.00] -; HASWELL-NEXT: vperm2f128 {{.*#+}} ymm0 = ymm0[2,3],mem[0,1] sched: [3:1.00] +; HASWELL-NEXT: vperm2f128 {{.*#+}} ymm0 = ymm0[2,3],mem[0,1] sched: [10:1.00] ; HASWELL-NEXT: vaddpd %ymm0, %ymm1, %ymm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_perm2f128: ; BROADWELL: # %bb.0: @@ -3557,9 +3557,9 @@ ; HASWELL-LABEL: test_permilpd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpermilpd {{.*#+}} xmm0 = xmm0[1,0] sched: [1:1.00] -; HASWELL-NEXT: vpermilpd {{.*#+}} xmm1 = mem[1,0] sched: [1:1.00] +; HASWELL-NEXT: vpermilpd {{.*#+}} xmm1 = mem[1,0] sched: [7:1.00] ; HASWELL-NEXT: vaddpd %xmm1, %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_permilpd: ; BROADWELL: # %bb.0: @@ -3620,9 +3620,9 @@ ; HASWELL-LABEL: test_permilpd_ymm: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpermilpd {{.*#+}} ymm0 = ymm0[1,0,2,3] sched: [1:1.00] -; HASWELL-NEXT: vpermilpd {{.*#+}} ymm1 = mem[1,0,2,3] sched: [1:1.00] +; HASWELL-NEXT: vpermilpd {{.*#+}} ymm1 = mem[1,0,2,3] sched: [8:1.00] ; HASWELL-NEXT: vaddpd %ymm1, %ymm0, %ymm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_permilpd_ymm: ; BROADWELL: # %bb.0: @@ -3683,9 +3683,9 @@ ; HASWELL-LABEL: test_permilps: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpermilps {{.*#+}} xmm0 = xmm0[3,2,1,0] sched: [1:1.00] -; HASWELL-NEXT: vpermilps {{.*#+}} xmm1 = mem[3,2,1,0] sched: [1:1.00] +; HASWELL-NEXT: vpermilps {{.*#+}} xmm1 = mem[3,2,1,0] sched: [7:1.00] ; HASWELL-NEXT: vaddps %xmm1, %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_permilps: ; BROADWELL: # %bb.0: @@ -3746,9 +3746,9 @@ ; HASWELL-LABEL: test_permilps_ymm: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpermilps {{.*#+}} ymm0 = ymm0[3,2,1,0,7,6,5,4] sched: [1:1.00] -; HASWELL-NEXT: vpermilps {{.*#+}} ymm1 = mem[3,2,1,0,7,6,5,4] sched: [1:1.00] +; HASWELL-NEXT: vpermilps {{.*#+}} ymm1 = mem[3,2,1,0,7,6,5,4] sched: [8:1.00] ; HASWELL-NEXT: vaddps %ymm1, %ymm0, %ymm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_permilps_ymm: ; BROADWELL: # %bb.0: @@ -3807,8 +3807,8 @@ ; HASWELL-LABEL: test_permilvarpd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpermilpd %xmm1, %xmm0, %xmm0 # sched: [1:1.00] -; HASWELL-NEXT: vpermilpd (%rdi), %xmm0, %xmm0 # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpermilpd (%rdi), %xmm0, %xmm0 # sched: [7:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_permilvarpd: ; BROADWELL: # %bb.0: @@ -3862,8 +3862,8 @@ ; HASWELL-LABEL: test_permilvarpd_ymm: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpermilpd %ymm1, %ymm0, %ymm0 # sched: [1:1.00] -; HASWELL-NEXT: vpermilpd (%rdi), %ymm0, %ymm0 # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpermilpd (%rdi), %ymm0, %ymm0 # sched: [8:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_permilvarpd_ymm: ; BROADWELL: # %bb.0: @@ -3917,8 +3917,8 @@ ; HASWELL-LABEL: test_permilvarps: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpermilps %xmm1, %xmm0, %xmm0 # sched: [1:1.00] -; HASWELL-NEXT: vpermilps (%rdi), %xmm0, %xmm0 # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpermilps (%rdi), %xmm0, %xmm0 # sched: [7:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_permilvarps: ; BROADWELL: # %bb.0: @@ -3972,8 +3972,8 @@ ; HASWELL-LABEL: test_permilvarps_ymm: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpermilps %ymm1, %ymm0, %ymm0 # sched: [1:1.00] -; HASWELL-NEXT: vpermilps (%rdi), %ymm0, %ymm0 # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpermilps (%rdi), %ymm0, %ymm0 # sched: [8:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_permilvarps_ymm: ; BROADWELL: # %bb.0: @@ -4028,10 +4028,10 @@ ; ; HASWELL-LABEL: test_rcpps: ; HASWELL: # %bb.0: -; HASWELL-NEXT: vrcpps (%rdi), %ymm1 # sched: [11:2.00] +; HASWELL-NEXT: vrcpps (%rdi), %ymm1 # sched: [18:2.00] ; HASWELL-NEXT: vrcpps %ymm0, %ymm0 # sched: [11:2.00] ; HASWELL-NEXT: vaddps %ymm1, %ymm0, %ymm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_rcpps: ; BROADWELL: # %bb.0: @@ -4092,10 +4092,10 @@ ; ; HASWELL-LABEL: test_roundpd: ; HASWELL: # %bb.0: -; HASWELL-NEXT: vroundpd $7, %ymm0, %ymm0 # sched: [5:1.25] -; HASWELL-NEXT: vroundpd $7, (%rdi), %ymm1 # sched: [6:2.00] +; HASWELL-NEXT: vroundpd $7, %ymm0, %ymm0 # sched: [6:0.50] +; HASWELL-NEXT: vroundpd $7, (%rdi), %ymm1 # sched: [13:2.00] ; HASWELL-NEXT: vaddpd %ymm1, %ymm0, %ymm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_roundpd: ; BROADWELL: # %bb.0: @@ -4156,10 +4156,10 @@ ; ; HASWELL-LABEL: test_roundps: ; HASWELL: # %bb.0: -; HASWELL-NEXT: vroundps $7, %ymm0, %ymm0 # sched: [5:1.25] -; HASWELL-NEXT: vroundps $7, (%rdi), %ymm1 # sched: [6:2.00] +; HASWELL-NEXT: vroundps $7, %ymm0, %ymm0 # sched: [6:0.50] +; HASWELL-NEXT: vroundps $7, (%rdi), %ymm1 # sched: [13:2.00] ; HASWELL-NEXT: vaddps %ymm1, %ymm0, %ymm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_roundps: ; BROADWELL: # %bb.0: @@ -4220,10 +4220,10 @@ ; ; HASWELL-LABEL: test_rsqrtps: ; HASWELL: # %bb.0: -; HASWELL-NEXT: vrsqrtps (%rdi), %ymm1 # sched: [11:2.00] +; HASWELL-NEXT: vrsqrtps (%rdi), %ymm1 # sched: [18:2.00] ; HASWELL-NEXT: vrsqrtps %ymm0, %ymm0 # sched: [11:2.00] ; HASWELL-NEXT: vaddps %ymm1, %ymm0, %ymm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_rsqrtps: ; BROADWELL: # %bb.0: @@ -4285,9 +4285,9 @@ ; HASWELL-LABEL: test_shufpd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vshufpd {{.*#+}} ymm0 = ymm0[1],ymm1[0],ymm0[2],ymm1[3] sched: [1:1.00] -; HASWELL-NEXT: vshufpd {{.*#+}} ymm1 = ymm1[1],mem[0],ymm1[2],mem[3] sched: [1:1.00] +; HASWELL-NEXT: vshufpd {{.*#+}} ymm1 = ymm1[1],mem[0],ymm1[2],mem[3] sched: [8:1.00] ; HASWELL-NEXT: vaddpd %ymm1, %ymm0, %ymm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_shufpd: ; BROADWELL: # %bb.0: @@ -4346,8 +4346,8 @@ ; HASWELL-LABEL: test_shufps: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vshufps {{.*#+}} ymm0 = ymm0[0,0],ymm1[0,0],ymm0[4,4],ymm1[4,4] sched: [1:1.00] -; HASWELL-NEXT: vshufps {{.*#+}} ymm0 = ymm0[0,3],mem[0,0],ymm0[4,7],mem[4,4] sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vshufps {{.*#+}} ymm0 = ymm0[0,3],mem[0,0],ymm0[4,7],mem[4,4] sched: [8:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_shufps: ; BROADWELL: # %bb.0: @@ -4401,10 +4401,10 @@ ; ; HASWELL-LABEL: test_sqrtpd: ; HASWELL: # %bb.0: -; HASWELL-NEXT: vsqrtpd (%rdi), %ymm1 # sched: [35:2.00] +; HASWELL-NEXT: vsqrtpd (%rdi), %ymm1 # sched: [42:2.00] ; HASWELL-NEXT: vsqrtpd %ymm0, %ymm0 # sched: [35:2.00] ; HASWELL-NEXT: vaddpd %ymm1, %ymm0, %ymm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_sqrtpd: ; BROADWELL: # %bb.0: @@ -4465,10 +4465,10 @@ ; ; HASWELL-LABEL: test_sqrtps: ; HASWELL: # %bb.0: -; HASWELL-NEXT: vsqrtps (%rdi), %ymm1 # sched: [21:2.00] +; HASWELL-NEXT: vsqrtps (%rdi), %ymm1 # sched: [28:2.00] ; HASWELL-NEXT: vsqrtps %ymm0, %ymm0 # sched: [21:2.00] ; HASWELL-NEXT: vaddps %ymm1, %ymm0, %ymm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_sqrtps: ; BROADWELL: # %bb.0: @@ -4528,8 +4528,8 @@ ; HASWELL-LABEL: test_subpd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vsubpd %ymm1, %ymm0, %ymm0 # sched: [3:1.00] -; HASWELL-NEXT: vsubpd (%rdi), %ymm0, %ymm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vsubpd (%rdi), %ymm0, %ymm0 # sched: [10:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_subpd: ; BROADWELL: # %bb.0: @@ -4582,8 +4582,8 @@ ; HASWELL-LABEL: test_subps: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vsubps %ymm1, %ymm0, %ymm0 # sched: [3:1.00] -; HASWELL-NEXT: vsubps (%rdi), %ymm0, %ymm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vsubps (%rdi), %ymm0, %ymm0 # sched: [10:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_subps: ; BROADWELL: # %bb.0: @@ -4644,9 +4644,9 @@ ; HASWELL-NEXT: xorl %eax, %eax # sched: [1:0.25] ; HASWELL-NEXT: vtestpd %xmm1, %xmm0 # sched: [1:1.00] ; HASWELL-NEXT: setb %al # sched: [1:0.50] -; HASWELL-NEXT: vtestpd (%rdi), %xmm0 # sched: [1:1.00] +; HASWELL-NEXT: vtestpd (%rdi), %xmm0 # sched: [7:1.00] ; HASWELL-NEXT: adcl $0, %eax # sched: [2:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_testpd: ; BROADWELL: # %bb.0: @@ -4726,10 +4726,10 @@ ; HASWELL-NEXT: xorl %eax, %eax # sched: [1:0.25] ; HASWELL-NEXT: vtestpd %ymm1, %ymm0 # sched: [1:1.00] ; HASWELL-NEXT: setb %al # sched: [1:0.50] -; HASWELL-NEXT: vtestpd (%rdi), %ymm0 # sched: [1:1.00] +; HASWELL-NEXT: vtestpd (%rdi), %ymm0 # sched: [8:1.00] ; HASWELL-NEXT: adcl $0, %eax # sched: [2:0.50] ; HASWELL-NEXT: vzeroupper # sched: [4:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_testpd_ymm: ; BROADWELL: # %bb.0: @@ -4811,9 +4811,9 @@ ; HASWELL-NEXT: xorl %eax, %eax # sched: [1:0.25] ; HASWELL-NEXT: vtestps %xmm1, %xmm0 # sched: [1:1.00] ; HASWELL-NEXT: setb %al # sched: [1:0.50] -; HASWELL-NEXT: vtestps (%rdi), %xmm0 # sched: [1:1.00] +; HASWELL-NEXT: vtestps (%rdi), %xmm0 # sched: [7:1.00] ; HASWELL-NEXT: adcl $0, %eax # sched: [2:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_testps: ; BROADWELL: # %bb.0: @@ -4893,10 +4893,10 @@ ; HASWELL-NEXT: xorl %eax, %eax # sched: [1:0.25] ; HASWELL-NEXT: vtestps %ymm1, %ymm0 # sched: [1:1.00] ; HASWELL-NEXT: setb %al # sched: [1:0.50] -; HASWELL-NEXT: vtestps (%rdi), %ymm0 # sched: [1:1.00] +; HASWELL-NEXT: vtestps (%rdi), %ymm0 # sched: [8:1.00] ; HASWELL-NEXT: adcl $0, %eax # sched: [2:0.50] ; HASWELL-NEXT: vzeroupper # sched: [4:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_testps_ymm: ; BROADWELL: # %bb.0: @@ -4972,9 +4972,9 @@ ; HASWELL-LABEL: test_unpckhpd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vunpckhpd {{.*#+}} ymm0 = ymm0[1],ymm1[1],ymm0[3],ymm1[3] sched: [1:1.00] -; HASWELL-NEXT: vunpckhpd {{.*#+}} ymm1 = ymm1[1],mem[1],ymm1[3],mem[3] sched: [1:1.00] +; HASWELL-NEXT: vunpckhpd {{.*#+}} ymm1 = ymm1[1],mem[1],ymm1[3],mem[3] sched: [8:1.00] ; HASWELL-NEXT: vaddpd %ymm1, %ymm0, %ymm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_unpckhpd: ; BROADWELL: # %bb.0: @@ -5033,8 +5033,8 @@ ; HASWELL-LABEL: test_unpckhps: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vunpckhps {{.*#+}} ymm0 = ymm0[2],ymm1[2],ymm0[3],ymm1[3],ymm0[6],ymm1[6],ymm0[7],ymm1[7] sched: [1:1.00] -; HASWELL-NEXT: vunpckhps {{.*#+}} ymm0 = ymm0[2],mem[2],ymm0[3],mem[3],ymm0[6],mem[6],ymm0[7],mem[7] sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vunpckhps {{.*#+}} ymm0 = ymm0[2],mem[2],ymm0[3],mem[3],ymm0[6],mem[6],ymm0[7],mem[7] sched: [8:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_unpckhps: ; BROADWELL: # %bb.0: @@ -5089,9 +5089,9 @@ ; HASWELL-LABEL: test_unpcklpd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vunpcklpd {{.*#+}} ymm0 = ymm0[0],ymm1[0],ymm0[2],ymm1[2] sched: [1:1.00] -; HASWELL-NEXT: vunpcklpd {{.*#+}} ymm1 = ymm1[0],mem[0],ymm1[2],mem[2] sched: [1:1.00] +; HASWELL-NEXT: vunpcklpd {{.*#+}} ymm1 = ymm1[0],mem[0],ymm1[2],mem[2] sched: [8:1.00] ; HASWELL-NEXT: vaddpd %ymm1, %ymm0, %ymm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_unpcklpd: ; BROADWELL: # %bb.0: @@ -5150,8 +5150,8 @@ ; HASWELL-LABEL: test_unpcklps: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vunpcklps {{.*#+}} ymm0 = ymm0[0],ymm1[0],ymm0[1],ymm1[1],ymm0[4],ymm1[4],ymm0[5],ymm1[5] sched: [1:1.00] -; HASWELL-NEXT: vunpcklps {{.*#+}} ymm0 = ymm0[0],mem[0],ymm0[1],mem[1],ymm0[4],mem[4],ymm0[5],mem[5] sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vunpcklps {{.*#+}} ymm0 = ymm0[0],mem[0],ymm0[1],mem[1],ymm0[4],mem[4],ymm0[5],mem[5] sched: [8:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_unpcklps: ; BROADWELL: # %bb.0: @@ -5206,9 +5206,9 @@ ; HASWELL-LABEL: test_xorpd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vxorpd %ymm1, %ymm0, %ymm0 # sched: [1:1.00] -; HASWELL-NEXT: vxorpd (%rdi), %ymm0, %ymm0 # sched: [1:1.00] +; HASWELL-NEXT: vxorpd (%rdi), %ymm0, %ymm0 # sched: [8:1.00] ; HASWELL-NEXT: vaddpd %ymm0, %ymm1, %ymm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_xorpd: ; BROADWELL: # %bb.0: @@ -5273,9 +5273,9 @@ ; HASWELL-LABEL: test_xorps: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vxorps %ymm1, %ymm0, %ymm0 # sched: [1:1.00] -; HASWELL-NEXT: vxorps (%rdi), %ymm0, %ymm0 # sched: [1:1.00] +; HASWELL-NEXT: vxorps (%rdi), %ymm0, %ymm0 # sched: [8:1.00] ; HASWELL-NEXT: vaddps %ymm0, %ymm1, %ymm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_xorps: ; BROADWELL: # %bb.0: @@ -5336,7 +5336,7 @@ ; HASWELL-LABEL: test_zeroall: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vzeroall # sched: [16:16.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_zeroall: ; BROADWELL: # %bb.0: @@ -5381,7 +5381,7 @@ ; HASWELL-LABEL: test_zeroupper: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vzeroupper # sched: [4:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_zeroupper: ; BROADWELL: # %bb.0: Index: test/CodeGen/X86/avx2-schedule.ll =================================================================== --- test/CodeGen/X86/avx2-schedule.ll +++ test/CodeGen/X86/avx2-schedule.ll @@ -15,9 +15,9 @@ ; ; HASWELL-LABEL: test_broadcasti128: ; HASWELL: # %bb.0: -; HASWELL-NEXT: vbroadcasti128 {{.*#+}} ymm1 = mem[0,1,0,1] sched: [1:0.50] +; HASWELL-NEXT: vbroadcasti128 {{.*#+}} ymm1 = mem[0,1,0,1] sched: [7:0.50] ; HASWELL-NEXT: vpaddd %ymm0, %ymm1, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_broadcasti128: ; BROADWELL: # %bb.0: @@ -59,7 +59,7 @@ ; HASWELL: # %bb.0: ; HASWELL-NEXT: vbroadcastsd %xmm0, %ymm0 # sched: [3:1.00] ; HASWELL-NEXT: vaddpd %ymm0, %ymm0, %ymm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_broadcastsd_ymm: ; BROADWELL: # %bb.0: @@ -100,7 +100,7 @@ ; HASWELL: # %bb.0: ; HASWELL-NEXT: vbroadcastss %xmm0, %xmm0 # sched: [1:1.00] ; HASWELL-NEXT: vaddps %xmm0, %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_broadcastss: ; BROADWELL: # %bb.0: @@ -141,7 +141,7 @@ ; HASWELL: # %bb.0: ; HASWELL-NEXT: vbroadcastss %xmm0, %ymm0 # sched: [3:1.00] ; HASWELL-NEXT: vaddps %ymm0, %ymm0, %ymm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_broadcastss_ymm: ; BROADWELL: # %bb.0: @@ -188,7 +188,7 @@ ; HASWELL-NEXT: vextracti128 $1, %ymm0, %xmm0 # sched: [3:1.00] ; HASWELL-NEXT: vextracti128 $1, %ymm2, (%rdi) # sched: [1:1.00] ; HASWELL-NEXT: vzeroupper # sched: [4:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_extracti128: ; BROADWELL: # %bb.0: @@ -241,8 +241,8 @@ ; ; HASWELL-LABEL: test_gatherdpd: ; HASWELL: # %bb.0: -; HASWELL-NEXT: vgatherdpd %xmm2, (%rdi,%xmm1,2), %xmm0 # sched: [1:?] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vgatherdpd %xmm2, (%rdi,%xmm1,2), %xmm0 # sched: [26:2.67] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_gatherdpd: ; BROADWELL: # %bb.0: @@ -276,8 +276,8 @@ ; ; HASWELL-LABEL: test_gatherdpd_ymm: ; HASWELL: # %bb.0: -; HASWELL-NEXT: vgatherdpd %ymm2, (%rdi,%xmm1,8), %ymm0 # sched: [1:?] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vgatherdpd %ymm2, (%rdi,%xmm1,8), %ymm0 # sched: [27:4.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_gatherdpd_ymm: ; BROADWELL: # %bb.0: @@ -311,8 +311,8 @@ ; ; HASWELL-LABEL: test_gatherdps: ; HASWELL: # %bb.0: -; HASWELL-NEXT: vgatherdps %xmm2, (%rdi,%xmm1,2), %xmm0 # sched: [1:?] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vgatherdps %xmm2, (%rdi,%xmm1,2), %xmm0 # sched: [25:3.67] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_gatherdps: ; BROADWELL: # %bb.0: @@ -346,8 +346,8 @@ ; ; HASWELL-LABEL: test_gatherdps_ymm: ; HASWELL: # %bb.0: -; HASWELL-NEXT: vgatherdps %ymm2, (%rdi,%ymm1,4), %ymm0 # sched: [1:?] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vgatherdps %ymm2, (%rdi,%ymm1,4), %ymm0 # sched: [27:6.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_gatherdps_ymm: ; BROADWELL: # %bb.0: @@ -381,8 +381,8 @@ ; ; HASWELL-LABEL: test_gatherqpd: ; HASWELL: # %bb.0: -; HASWELL-NEXT: vgatherqpd %xmm2, (%rdi,%xmm1,2), %xmm0 # sched: [1:?] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vgatherqpd %xmm2, (%rdi,%xmm1,2), %xmm0 # sched: [23:3.33] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_gatherqpd: ; BROADWELL: # %bb.0: @@ -416,8 +416,8 @@ ; ; HASWELL-LABEL: test_gatherqpd_ymm: ; HASWELL: # %bb.0: -; HASWELL-NEXT: vgatherqpd %ymm2, (%rdi,%ymm1,8), %ymm0 # sched: [1:?] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vgatherqpd %ymm2, (%rdi,%ymm1,8), %ymm0 # sched: [24:5.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_gatherqpd_ymm: ; BROADWELL: # %bb.0: @@ -451,8 +451,8 @@ ; ; HASWELL-LABEL: test_gatherqps: ; HASWELL: # %bb.0: -; HASWELL-NEXT: vgatherqps %xmm2, (%rdi,%xmm1,2), %xmm0 # sched: [1:?] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vgatherqps %xmm2, (%rdi,%xmm1,2), %xmm0 # sched: [25:3.67] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_gatherqps: ; BROADWELL: # %bb.0: @@ -487,9 +487,9 @@ ; ; HASWELL-LABEL: test_gatherqps_ymm: ; HASWELL: # %bb.0: -; HASWELL-NEXT: vgatherqps %xmm2, (%rdi,%ymm1,4), %xmm0 # sched: [1:?] +; HASWELL-NEXT: vgatherqps %xmm2, (%rdi,%ymm1,4), %xmm0 # sched: [28:3.67] ; HASWELL-NEXT: vzeroupper # sched: [4:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_gatherqps_ymm: ; BROADWELL: # %bb.0: @@ -530,9 +530,9 @@ ; HASWELL-LABEL: test_inserti128: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vinserti128 $1, %xmm1, %ymm0, %ymm1 # sched: [3:1.00] -; HASWELL-NEXT: vinserti128 $1, (%rdi), %ymm0, %ymm0 # sched: [1:0.50] +; HASWELL-NEXT: vinserti128 $1, (%rdi), %ymm0, %ymm0 # sched: [7:0.50] ; HASWELL-NEXT: vpaddd %ymm0, %ymm1, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_inserti128: ; BROADWELL: # %bb.0: @@ -578,8 +578,8 @@ ; ; HASWELL-LABEL: test_movntdqa: ; HASWELL: # %bb.0: -; HASWELL-NEXT: vmovntdqa (%rdi), %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vmovntdqa (%rdi), %ymm0 # sched: [7:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_movntdqa: ; BROADWELL: # %bb.0: @@ -615,8 +615,8 @@ ; HASWELL-LABEL: test_mpsadbw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vmpsadbw $7, %ymm1, %ymm0, %ymm0 # sched: [7:2.00] -; HASWELL-NEXT: vmpsadbw $7, (%rdi), %ymm0, %ymm0 # sched: [7:2.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vmpsadbw $7, (%rdi), %ymm0, %ymm0 # sched: [14:2.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_mpsadbw: ; BROADWELL: # %bb.0: @@ -660,9 +660,9 @@ ; HASWELL-LABEL: test_pabsb: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpabsb %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: vpabsb (%rdi), %ymm1 # sched: [1:0.50] +; HASWELL-NEXT: vpabsb (%rdi), %ymm1 # sched: [8:0.50] ; HASWELL-NEXT: vpor %ymm1, %ymm0, %ymm0 # sched: [1:0.33] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pabsb: ; BROADWELL: # %bb.0: @@ -710,9 +710,9 @@ ; HASWELL-LABEL: test_pabsd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpabsd %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: vpabsd (%rdi), %ymm1 # sched: [1:0.50] +; HASWELL-NEXT: vpabsd (%rdi), %ymm1 # sched: [8:0.50] ; HASWELL-NEXT: vpor %ymm1, %ymm0, %ymm0 # sched: [1:0.33] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pabsd: ; BROADWELL: # %bb.0: @@ -760,9 +760,9 @@ ; HASWELL-LABEL: test_pabsw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpabsw %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: vpabsw (%rdi), %ymm1 # sched: [1:0.50] +; HASWELL-NEXT: vpabsw (%rdi), %ymm1 # sched: [8:0.50] ; HASWELL-NEXT: vpor %ymm1, %ymm0, %ymm0 # sched: [1:0.33] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pabsw: ; BROADWELL: # %bb.0: @@ -809,8 +809,8 @@ ; HASWELL-LABEL: test_packssdw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpackssdw %ymm1, %ymm0, %ymm0 # sched: [1:1.00] -; HASWELL-NEXT: vpackssdw (%rdi), %ymm0, %ymm0 # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpackssdw (%rdi), %ymm0, %ymm0 # sched: [8:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_packssdw: ; BROADWELL: # %bb.0: @@ -853,8 +853,8 @@ ; HASWELL-LABEL: test_packsswb: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpacksswb %ymm1, %ymm0, %ymm0 # sched: [1:1.00] -; HASWELL-NEXT: vpacksswb (%rdi), %ymm0, %ymm0 # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpacksswb (%rdi), %ymm0, %ymm0 # sched: [8:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_packsswb: ; BROADWELL: # %bb.0: @@ -897,8 +897,8 @@ ; HASWELL-LABEL: test_packusdw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpackusdw %ymm1, %ymm0, %ymm0 # sched: [1:1.00] -; HASWELL-NEXT: vpackusdw (%rdi), %ymm0, %ymm0 # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpackusdw (%rdi), %ymm0, %ymm0 # sched: [8:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_packusdw: ; BROADWELL: # %bb.0: @@ -941,8 +941,8 @@ ; HASWELL-LABEL: test_packuswb: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpackuswb %ymm1, %ymm0, %ymm0 # sched: [1:1.00] -; HASWELL-NEXT: vpackuswb (%rdi), %ymm0, %ymm0 # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpackuswb (%rdi), %ymm0, %ymm0 # sched: [8:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_packuswb: ; BROADWELL: # %bb.0: @@ -985,8 +985,8 @@ ; HASWELL-LABEL: test_paddb: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpaddb %ymm1, %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: vpaddb (%rdi), %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpaddb (%rdi), %ymm0, %ymm0 # sched: [8:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_paddb: ; BROADWELL: # %bb.0: @@ -1027,8 +1027,8 @@ ; HASWELL-LABEL: test_paddd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpaddd %ymm1, %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: vpaddd (%rdi), %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpaddd (%rdi), %ymm0, %ymm0 # sched: [8:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_paddd: ; BROADWELL: # %bb.0: @@ -1069,8 +1069,8 @@ ; HASWELL-LABEL: test_paddq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpaddq %ymm1, %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: vpaddq (%rdi), %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpaddq (%rdi), %ymm0, %ymm0 # sched: [8:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_paddq: ; BROADWELL: # %bb.0: @@ -1111,8 +1111,8 @@ ; HASWELL-LABEL: test_paddsb: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpaddsb %ymm1, %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: vpaddsb (%rdi), %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpaddsb (%rdi), %ymm0, %ymm0 # sched: [8:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_paddsb: ; BROADWELL: # %bb.0: @@ -1154,8 +1154,8 @@ ; HASWELL-LABEL: test_paddsw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpaddsw %ymm1, %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: vpaddsw (%rdi), %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpaddsw (%rdi), %ymm0, %ymm0 # sched: [8:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_paddsw: ; BROADWELL: # %bb.0: @@ -1197,8 +1197,8 @@ ; HASWELL-LABEL: test_paddusb: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpaddusb %ymm1, %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: vpaddusb (%rdi), %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpaddusb (%rdi), %ymm0, %ymm0 # sched: [8:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_paddusb: ; BROADWELL: # %bb.0: @@ -1240,8 +1240,8 @@ ; HASWELL-LABEL: test_paddusw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpaddusw %ymm1, %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: vpaddusw (%rdi), %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpaddusw (%rdi), %ymm0, %ymm0 # sched: [8:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_paddusw: ; BROADWELL: # %bb.0: @@ -1283,8 +1283,8 @@ ; HASWELL-LABEL: test_paddw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpaddw %ymm1, %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: vpaddw (%rdi), %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpaddw (%rdi), %ymm0, %ymm0 # sched: [8:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_paddw: ; BROADWELL: # %bb.0: @@ -1325,8 +1325,8 @@ ; HASWELL-LABEL: test_palignr: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpalignr {{.*#+}} ymm0 = ymm1[1,2,3,4,5,6,7,8,9,10,11,12,13,14,15],ymm0[0],ymm1[17,18,19,20,21,22,23,24,25,26,27,28,29,30,31],ymm0[16] sched: [1:1.00] -; HASWELL-NEXT: vpalignr {{.*#+}} ymm0 = mem[1,2,3,4,5,6,7,8,9,10,11,12,13,14,15],ymm0[0],mem[17,18,19,20,21,22,23,24,25,26,27,28,29,30,31],ymm0[16] sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpalignr {{.*#+}} ymm0 = mem[1,2,3,4,5,6,7,8,9,10,11,12,13,14,15],ymm0[0],mem[17,18,19,20,21,22,23,24,25,26,27,28,29,30,31],ymm0[16] sched: [8:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_palignr: ; BROADWELL: # %bb.0: @@ -1368,9 +1368,9 @@ ; HASWELL-LABEL: test_pand: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpand %ymm1, %ymm0, %ymm0 # sched: [1:0.33] -; HASWELL-NEXT: vpand (%rdi), %ymm0, %ymm0 # sched: [1:0.50] +; HASWELL-NEXT: vpand (%rdi), %ymm0, %ymm0 # sched: [8:0.50] ; HASWELL-NEXT: vpaddq %ymm1, %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pand: ; BROADWELL: # %bb.0: @@ -1417,9 +1417,9 @@ ; HASWELL-LABEL: test_pandn: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpandn %ymm1, %ymm0, %ymm0 # sched: [1:0.33] -; HASWELL-NEXT: vpandn (%rdi), %ymm0, %ymm1 # sched: [1:0.50] +; HASWELL-NEXT: vpandn (%rdi), %ymm0, %ymm1 # sched: [8:0.50] ; HASWELL-NEXT: vpaddq %ymm1, %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pandn: ; BROADWELL: # %bb.0: @@ -1467,8 +1467,8 @@ ; HASWELL-LABEL: test_pavgb: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpavgb %ymm1, %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: vpavgb (%rdi), %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpavgb (%rdi), %ymm0, %ymm0 # sched: [8:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pavgb: ; BROADWELL: # %bb.0: @@ -1519,8 +1519,8 @@ ; HASWELL-LABEL: test_pavgw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpavgw %ymm1, %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: vpavgw (%rdi), %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpavgw (%rdi), %ymm0, %ymm0 # sched: [8:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pavgw: ; BROADWELL: # %bb.0: @@ -1572,9 +1572,9 @@ ; HASWELL-LABEL: test_pblendd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpblendd {{.*#+}} xmm1 = xmm1[0,1,2],xmm0[3] sched: [1:0.33] -; HASWELL-NEXT: vpblendd {{.*#+}} xmm1 = mem[0],xmm1[1],mem[2],xmm1[3] sched: [1:0.50] +; HASWELL-NEXT: vpblendd {{.*#+}} xmm1 = mem[0],xmm1[1],mem[2],xmm1[3] sched: [7:0.50] ; HASWELL-NEXT: vpaddd %xmm1, %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pblendd: ; BROADWELL: # %bb.0: @@ -1621,9 +1621,9 @@ ; HASWELL-LABEL: test_pblendd_ymm: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpblendd {{.*#+}} ymm1 = ymm1[0,1,2],ymm0[3,4,5,6],ymm1[7] sched: [1:0.33] -; HASWELL-NEXT: vpblendd {{.*#+}} ymm1 = ymm1[0],mem[1,2],ymm1[3,4,5,6,7] sched: [1:0.50] +; HASWELL-NEXT: vpblendd {{.*#+}} ymm1 = ymm1[0],mem[1,2],ymm1[3,4,5,6,7] sched: [8:0.50] ; HASWELL-NEXT: vpaddd %ymm1, %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pblendd_ymm: ; BROADWELL: # %bb.0: @@ -1669,8 +1669,8 @@ ; HASWELL-LABEL: test_pblendvb: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpblendvb %ymm2, %ymm1, %ymm0, %ymm0 # sched: [2:2.00] -; HASWELL-NEXT: vpblendvb %ymm3, (%rdi), %ymm0, %ymm0 # sched: [2:2.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpblendvb %ymm3, (%rdi), %ymm0, %ymm0 # sched: [9:2.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pblendvb: ; BROADWELL: # %bb.0: @@ -1712,8 +1712,8 @@ ; HASWELL-LABEL: test_pblendw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpblendw {{.*#+}} ymm0 = ymm0[0,1],ymm1[2,3,4],ymm0[5,6,7,8,9],ymm1[10,11,12],ymm0[13,14,15] sched: [1:1.00] -; HASWELL-NEXT: vpblendw {{.*#+}} ymm0 = mem[0],ymm0[1],mem[2],ymm0[3],mem[4],ymm0[5],mem[6],ymm0[7],mem[8],ymm0[9],mem[10],ymm0[11],mem[12],ymm0[13],mem[14],ymm0[15] sched: [4:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpblendw {{.*#+}} ymm0 = mem[0],ymm0[1],mem[2],ymm0[3],mem[4],ymm0[5],mem[6],ymm0[7],mem[8],ymm0[9],mem[10],ymm0[11],mem[12],ymm0[13],mem[14],ymm0[15] sched: [8:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pblendw: ; BROADWELL: # %bb.0: @@ -1755,9 +1755,9 @@ ; HASWELL-LABEL: test_pbroadcastb: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpbroadcastb %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: vpbroadcastb (%rdi), %xmm1 # sched: [4:1.00] +; HASWELL-NEXT: vpbroadcastb (%rdi), %xmm1 # sched: [9:1.00] ; HASWELL-NEXT: vpaddb %xmm1, %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pbroadcastb: ; BROADWELL: # %bb.0: @@ -1804,9 +1804,9 @@ ; HASWELL-LABEL: test_pbroadcastb_ymm: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpbroadcastb %xmm0, %ymm0 # sched: [3:1.00] -; HASWELL-NEXT: vpbroadcastb (%rdi), %ymm1 # sched: [4:1.00] +; HASWELL-NEXT: vpbroadcastb (%rdi), %ymm1 # sched: [9:1.00] ; HASWELL-NEXT: vpaddb %ymm1, %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pbroadcastb_ymm: ; BROADWELL: # %bb.0: @@ -1853,9 +1853,9 @@ ; HASWELL-LABEL: test_pbroadcastd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpbroadcastd %xmm0, %xmm0 # sched: [1:1.00] -; HASWELL-NEXT: vpbroadcastd (%rdi), %xmm1 # sched: [1:0.50] +; HASWELL-NEXT: vpbroadcastd (%rdi), %xmm1 # sched: [6:0.50] ; HASWELL-NEXT: vpaddd %xmm1, %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pbroadcastd: ; BROADWELL: # %bb.0: @@ -1901,9 +1901,9 @@ ; HASWELL-LABEL: test_pbroadcastd_ymm: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpbroadcastd %xmm0, %ymm0 # sched: [3:1.00] -; HASWELL-NEXT: vpbroadcastd (%rdi), %ymm1 # sched: [1:0.50] +; HASWELL-NEXT: vpbroadcastd (%rdi), %ymm1 # sched: [7:0.50] ; HASWELL-NEXT: vpaddd %ymm1, %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pbroadcastd_ymm: ; BROADWELL: # %bb.0: @@ -1949,9 +1949,9 @@ ; HASWELL-LABEL: test_pbroadcastq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpbroadcastq %xmm0, %xmm0 # sched: [1:1.00] -; HASWELL-NEXT: vpbroadcastq (%rdi), %xmm1 # sched: [1:0.50] +; HASWELL-NEXT: vpbroadcastq (%rdi), %xmm1 # sched: [6:0.50] ; HASWELL-NEXT: vpaddq %xmm1, %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pbroadcastq: ; BROADWELL: # %bb.0: @@ -1997,9 +1997,9 @@ ; HASWELL-LABEL: test_pbroadcastq_ymm: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpbroadcastq %xmm0, %ymm0 # sched: [3:1.00] -; HASWELL-NEXT: vpbroadcastq (%rdi), %ymm1 # sched: [1:0.50] +; HASWELL-NEXT: vpbroadcastq (%rdi), %ymm1 # sched: [7:0.50] ; HASWELL-NEXT: vpaddq %ymm1, %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pbroadcastq_ymm: ; BROADWELL: # %bb.0: @@ -2045,9 +2045,9 @@ ; HASWELL-LABEL: test_pbroadcastw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpbroadcastw %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: vpbroadcastw (%rdi), %xmm1 # sched: [4:1.00] +; HASWELL-NEXT: vpbroadcastw (%rdi), %xmm1 # sched: [9:1.00] ; HASWELL-NEXT: vpaddw %xmm1, %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pbroadcastw: ; BROADWELL: # %bb.0: @@ -2094,9 +2094,9 @@ ; HASWELL-LABEL: test_pbroadcastw_ymm: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpbroadcastw %xmm0, %ymm0 # sched: [3:1.00] -; HASWELL-NEXT: vpbroadcastw (%rdi), %ymm1 # sched: [4:1.00] +; HASWELL-NEXT: vpbroadcastw (%rdi), %ymm1 # sched: [9:1.00] ; HASWELL-NEXT: vpaddw %ymm1, %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pbroadcastw_ymm: ; BROADWELL: # %bb.0: @@ -2142,8 +2142,8 @@ ; HASWELL-LABEL: test_pcmpeqb: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpcmpeqb %ymm1, %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: vpcmpeqb (%rdi), %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpcmpeqb (%rdi), %ymm0, %ymm0 # sched: [8:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pcmpeqb: ; BROADWELL: # %bb.0: @@ -2188,8 +2188,8 @@ ; HASWELL-LABEL: test_pcmpeqd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpcmpeqd %ymm1, %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: vpcmpeqd (%rdi), %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpcmpeqd (%rdi), %ymm0, %ymm0 # sched: [8:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pcmpeqd: ; BROADWELL: # %bb.0: @@ -2234,8 +2234,8 @@ ; HASWELL-LABEL: test_pcmpeqq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpcmpeqq %ymm1, %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: vpcmpeqq (%rdi), %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpcmpeqq (%rdi), %ymm0, %ymm0 # sched: [8:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pcmpeqq: ; BROADWELL: # %bb.0: @@ -2280,8 +2280,8 @@ ; HASWELL-LABEL: test_pcmpeqw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpcmpeqw %ymm1, %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: vpcmpeqw (%rdi), %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpcmpeqw (%rdi), %ymm0, %ymm0 # sched: [8:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pcmpeqw: ; BROADWELL: # %bb.0: @@ -2326,8 +2326,8 @@ ; HASWELL-LABEL: test_pcmpgtb: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpcmpgtb %ymm1, %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: vpcmpgtb (%rdi), %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpcmpgtb (%rdi), %ymm0, %ymm0 # sched: [8:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pcmpgtb: ; BROADWELL: # %bb.0: @@ -2372,8 +2372,8 @@ ; HASWELL-LABEL: test_pcmpgtd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpcmpgtd %ymm1, %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: vpcmpgtd (%rdi), %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpcmpgtd (%rdi), %ymm0, %ymm0 # sched: [8:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pcmpgtd: ; BROADWELL: # %bb.0: @@ -2418,8 +2418,8 @@ ; HASWELL-LABEL: test_pcmpgtq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpcmpgtq %ymm1, %ymm0, %ymm0 # sched: [5:1.00] -; HASWELL-NEXT: vpcmpgtq (%rdi), %ymm0, %ymm0 # sched: [5:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpcmpgtq (%rdi), %ymm0, %ymm0 # sched: [12:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pcmpgtq: ; BROADWELL: # %bb.0: @@ -2464,8 +2464,8 @@ ; HASWELL-LABEL: test_pcmpgtw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpcmpgtw %ymm1, %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: vpcmpgtw (%rdi), %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpcmpgtw (%rdi), %ymm0, %ymm0 # sched: [8:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pcmpgtw: ; BROADWELL: # %bb.0: @@ -2511,9 +2511,9 @@ ; HASWELL-LABEL: test_perm2i128: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vperm2i128 {{.*#+}} ymm1 = ymm0[2,3],ymm1[0,1] sched: [3:1.00] -; HASWELL-NEXT: vperm2i128 {{.*#+}} ymm0 = ymm0[2,3],mem[0,1] sched: [3:1.00] +; HASWELL-NEXT: vperm2i128 {{.*#+}} ymm0 = ymm0[2,3],mem[0,1] sched: [10:1.00] ; HASWELL-NEXT: vpaddq %ymm0, %ymm1, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_perm2i128: ; BROADWELL: # %bb.0: @@ -2560,9 +2560,9 @@ ; HASWELL-LABEL: test_permd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpermd %ymm1, %ymm0, %ymm1 # sched: [3:1.00] -; HASWELL-NEXT: vpermd (%rdi), %ymm0, %ymm0 # sched: [3:1.00] +; HASWELL-NEXT: vpermd (%rdi), %ymm0, %ymm0 # sched: [10:1.00] ; HASWELL-NEXT: vpaddd %ymm0, %ymm1, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_permd: ; BROADWELL: # %bb.0: @@ -2610,9 +2610,9 @@ ; HASWELL-LABEL: test_permpd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpermpd {{.*#+}} ymm0 = ymm0[3,2,2,3] sched: [3:1.00] -; HASWELL-NEXT: vpermpd {{.*#+}} ymm1 = mem[0,2,2,3] sched: [3:1.00] +; HASWELL-NEXT: vpermpd {{.*#+}} ymm1 = mem[0,2,2,3] sched: [10:1.00] ; HASWELL-NEXT: vaddpd %ymm1, %ymm0, %ymm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_permpd: ; BROADWELL: # %bb.0: @@ -2659,9 +2659,9 @@ ; HASWELL-LABEL: test_permps: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpermps %ymm1, %ymm0, %ymm1 # sched: [3:1.00] -; HASWELL-NEXT: vpermps (%rdi), %ymm0, %ymm0 # sched: [3:1.00] +; HASWELL-NEXT: vpermps (%rdi), %ymm0, %ymm0 # sched: [10:1.00] ; HASWELL-NEXT: vaddps %ymm0, %ymm1, %ymm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_permps: ; BROADWELL: # %bb.0: @@ -2709,9 +2709,9 @@ ; HASWELL-LABEL: test_permq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpermq {{.*#+}} ymm0 = ymm0[3,2,2,3] sched: [3:1.00] -; HASWELL-NEXT: vpermq {{.*#+}} ymm1 = mem[0,2,2,3] sched: [3:1.00] +; HASWELL-NEXT: vpermq {{.*#+}} ymm1 = mem[0,2,2,3] sched: [10:1.00] ; HASWELL-NEXT: vpaddq %ymm1, %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_permq: ; BROADWELL: # %bb.0: @@ -2755,8 +2755,8 @@ ; ; HASWELL-LABEL: test_pgatherdd: ; HASWELL: # %bb.0: -; HASWELL-NEXT: vpgatherdd %xmm2, (%rdi,%xmm1,2), %xmm0 # sched: [1:?] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpgatherdd %xmm2, (%rdi,%xmm1,2), %xmm0 # sched: [26:2.67] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pgatherdd: ; BROADWELL: # %bb.0: @@ -2790,8 +2790,8 @@ ; ; HASWELL-LABEL: test_pgatherdd_ymm: ; HASWELL: # %bb.0: -; HASWELL-NEXT: vpgatherdd %ymm2, (%rdi,%ymm1,2), %ymm0 # sched: [1:?] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpgatherdd %ymm2, (%rdi,%ymm1,2), %ymm0 # sched: [27:6.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pgatherdd_ymm: ; BROADWELL: # %bb.0: @@ -2825,8 +2825,8 @@ ; ; HASWELL-LABEL: test_pgatherdq: ; HASWELL: # %bb.0: -; HASWELL-NEXT: vpgatherdq %xmm2, (%rdi,%xmm1,2), %xmm0 # sched: [1:?] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpgatherdq %xmm2, (%rdi,%xmm1,2), %xmm0 # sched: [26:2.67] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pgatherdq: ; BROADWELL: # %bb.0: @@ -2860,8 +2860,8 @@ ; ; HASWELL-LABEL: test_pgatherdq_ymm: ; HASWELL: # %bb.0: -; HASWELL-NEXT: vpgatherdq %ymm2, (%rdi,%xmm1,2), %ymm0 # sched: [1:?] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpgatherdq %ymm2, (%rdi,%xmm1,2), %ymm0 # sched: [27:4.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pgatherdq_ymm: ; BROADWELL: # %bb.0: @@ -2895,8 +2895,8 @@ ; ; HASWELL-LABEL: test_pgatherqd: ; HASWELL: # %bb.0: -; HASWELL-NEXT: vpgatherqd %xmm2, (%rdi,%xmm1,2), %xmm0 # sched: [1:?] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpgatherqd %xmm2, (%rdi,%xmm1,2), %xmm0 # sched: [25:5.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pgatherqd: ; BROADWELL: # %bb.0: @@ -2931,9 +2931,9 @@ ; ; HASWELL-LABEL: test_pgatherqd_ymm: ; HASWELL: # %bb.0: -; HASWELL-NEXT: vpgatherqd %xmm2, (%rdi,%ymm1,2), %xmm0 # sched: [1:?] +; HASWELL-NEXT: vpgatherqd %xmm2, (%rdi,%ymm1,2), %xmm0 # sched: [28:5.00] ; HASWELL-NEXT: vzeroupper # sched: [4:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pgatherqd_ymm: ; BROADWELL: # %bb.0: @@ -2971,8 +2971,8 @@ ; ; HASWELL-LABEL: test_pgatherqq: ; HASWELL: # %bb.0: -; HASWELL-NEXT: vpgatherqq %xmm2, (%rdi,%xmm1,2), %xmm0 # sched: [1:?] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpgatherqq %xmm2, (%rdi,%xmm1,2), %xmm0 # sched: [23:3.33] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pgatherqq: ; BROADWELL: # %bb.0: @@ -3006,8 +3006,8 @@ ; ; HASWELL-LABEL: test_pgatherqq_ymm: ; HASWELL: # %bb.0: -; HASWELL-NEXT: vpgatherqq %ymm2, (%rdi,%ymm1,2), %ymm0 # sched: [1:?] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpgatherqq %ymm2, (%rdi,%ymm1,2), %ymm0 # sched: [24:5.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pgatherqq_ymm: ; BROADWELL: # %bb.0: @@ -3043,8 +3043,8 @@ ; HASWELL-LABEL: test_phaddd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vphaddd %ymm1, %ymm0, %ymm0 # sched: [3:2.00] -; HASWELL-NEXT: vphaddd (%rdi), %ymm0, %ymm0 # sched: [3:2.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vphaddd (%rdi), %ymm0, %ymm0 # sched: [10:2.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_phaddd: ; BROADWELL: # %bb.0: @@ -3086,8 +3086,8 @@ ; HASWELL-LABEL: test_phaddsw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vphaddsw %ymm1, %ymm0, %ymm0 # sched: [3:2.00] -; HASWELL-NEXT: vphaddsw (%rdi), %ymm0, %ymm0 # sched: [3:2.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vphaddsw (%rdi), %ymm0, %ymm0 # sched: [10:2.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_phaddsw: ; BROADWELL: # %bb.0: @@ -3129,8 +3129,8 @@ ; HASWELL-LABEL: test_phaddw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vphaddw %ymm1, %ymm0, %ymm0 # sched: [3:2.00] -; HASWELL-NEXT: vphaddw (%rdi), %ymm0, %ymm0 # sched: [3:2.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vphaddw (%rdi), %ymm0, %ymm0 # sched: [10:2.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_phaddw: ; BROADWELL: # %bb.0: @@ -3172,8 +3172,8 @@ ; HASWELL-LABEL: test_phsubd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vphsubd %ymm1, %ymm0, %ymm0 # sched: [3:2.00] -; HASWELL-NEXT: vphsubd (%rdi), %ymm0, %ymm0 # sched: [3:2.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vphsubd (%rdi), %ymm0, %ymm0 # sched: [10:2.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_phsubd: ; BROADWELL: # %bb.0: @@ -3215,8 +3215,8 @@ ; HASWELL-LABEL: test_phsubsw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vphsubsw %ymm1, %ymm0, %ymm0 # sched: [3:2.00] -; HASWELL-NEXT: vphsubsw (%rdi), %ymm0, %ymm0 # sched: [3:2.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vphsubsw (%rdi), %ymm0, %ymm0 # sched: [10:2.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_phsubsw: ; BROADWELL: # %bb.0: @@ -3258,8 +3258,8 @@ ; HASWELL-LABEL: test_phsubw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vphsubw %ymm1, %ymm0, %ymm0 # sched: [3:2.00] -; HASWELL-NEXT: vphsubw (%rdi), %ymm0, %ymm0 # sched: [3:2.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vphsubw (%rdi), %ymm0, %ymm0 # sched: [10:2.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_phsubw: ; BROADWELL: # %bb.0: @@ -3301,8 +3301,8 @@ ; HASWELL-LABEL: test_pmaddubsw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpmaddubsw %ymm1, %ymm0, %ymm0 # sched: [5:1.00] -; HASWELL-NEXT: vpmaddubsw (%rdi), %ymm0, %ymm0 # sched: [5:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpmaddubsw (%rdi), %ymm0, %ymm0 # sched: [12:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmaddubsw: ; BROADWELL: # %bb.0: @@ -3345,8 +3345,8 @@ ; HASWELL-LABEL: test_pmaddwd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpmaddwd %ymm1, %ymm0, %ymm0 # sched: [5:1.00] -; HASWELL-NEXT: vpmaddwd (%rdi), %ymm0, %ymm0 # sched: [5:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpmaddwd (%rdi), %ymm0, %ymm0 # sched: [12:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmaddwd: ; BROADWELL: # %bb.0: @@ -3389,10 +3389,10 @@ ; ; HASWELL-LABEL: test_pmaskmovd: ; HASWELL: # %bb.0: -; HASWELL-NEXT: vpmaskmovd (%rdi), %xmm0, %xmm2 # sched: [2:2.00] -; HASWELL-NEXT: vpmaskmovd %xmm1, %xmm0, (%rdi) # sched: [4:1.00] +; HASWELL-NEXT: vpmaskmovd (%rdi), %xmm0, %xmm2 # sched: [8:2.00] +; HASWELL-NEXT: vpmaskmovd %xmm1, %xmm0, (%rdi) # sched: [5:1.00] ; HASWELL-NEXT: vmovdqa %xmm2, %xmm0 # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmaskmovd: ; BROADWELL: # %bb.0: @@ -3438,10 +3438,10 @@ ; ; HASWELL-LABEL: test_pmaskmovd_ymm: ; HASWELL: # %bb.0: -; HASWELL-NEXT: vpmaskmovd (%rdi), %ymm0, %ymm2 # sched: [2:2.00] -; HASWELL-NEXT: vpmaskmovd %ymm1, %ymm0, (%rdi) # sched: [4:1.00] +; HASWELL-NEXT: vpmaskmovd (%rdi), %ymm0, %ymm2 # sched: [9:2.00] +; HASWELL-NEXT: vpmaskmovd %ymm1, %ymm0, (%rdi) # sched: [5:1.00] ; HASWELL-NEXT: vmovdqa %ymm2, %ymm0 # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmaskmovd_ymm: ; BROADWELL: # %bb.0: @@ -3487,10 +3487,10 @@ ; ; HASWELL-LABEL: test_pmaskmovq: ; HASWELL: # %bb.0: -; HASWELL-NEXT: vpmaskmovq (%rdi), %xmm0, %xmm2 # sched: [2:2.00] -; HASWELL-NEXT: vpmaskmovq %xmm1, %xmm0, (%rdi) # sched: [4:1.00] +; HASWELL-NEXT: vpmaskmovq (%rdi), %xmm0, %xmm2 # sched: [8:2.00] +; HASWELL-NEXT: vpmaskmovq %xmm1, %xmm0, (%rdi) # sched: [5:1.00] ; HASWELL-NEXT: vmovdqa %xmm2, %xmm0 # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmaskmovq: ; BROADWELL: # %bb.0: @@ -3536,10 +3536,10 @@ ; ; HASWELL-LABEL: test_pmaskmovq_ymm: ; HASWELL: # %bb.0: -; HASWELL-NEXT: vpmaskmovq (%rdi), %ymm0, %ymm2 # sched: [2:2.00] -; HASWELL-NEXT: vpmaskmovq %ymm1, %ymm0, (%rdi) # sched: [4:1.00] +; HASWELL-NEXT: vpmaskmovq (%rdi), %ymm0, %ymm2 # sched: [9:2.00] +; HASWELL-NEXT: vpmaskmovq %ymm1, %ymm0, (%rdi) # sched: [5:1.00] ; HASWELL-NEXT: vmovdqa %ymm2, %ymm0 # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmaskmovq_ymm: ; BROADWELL: # %bb.0: @@ -3585,8 +3585,8 @@ ; HASWELL-LABEL: test_pmaxsb: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpmaxsb %ymm1, %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: vpmaxsb (%rdi), %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpmaxsb (%rdi), %ymm0, %ymm0 # sched: [8:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmaxsb: ; BROADWELL: # %bb.0: @@ -3628,8 +3628,8 @@ ; HASWELL-LABEL: test_pmaxsd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpmaxsd %ymm1, %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: vpmaxsd (%rdi), %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpmaxsd (%rdi), %ymm0, %ymm0 # sched: [8:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmaxsd: ; BROADWELL: # %bb.0: @@ -3671,8 +3671,8 @@ ; HASWELL-LABEL: test_pmaxsw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpmaxsw %ymm1, %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: vpmaxsw (%rdi), %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpmaxsw (%rdi), %ymm0, %ymm0 # sched: [8:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmaxsw: ; BROADWELL: # %bb.0: @@ -3714,8 +3714,8 @@ ; HASWELL-LABEL: test_pmaxub: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpmaxub %ymm1, %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: vpmaxub (%rdi), %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpmaxub (%rdi), %ymm0, %ymm0 # sched: [8:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmaxub: ; BROADWELL: # %bb.0: @@ -3757,8 +3757,8 @@ ; HASWELL-LABEL: test_pmaxud: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpmaxud %ymm1, %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: vpmaxud (%rdi), %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpmaxud (%rdi), %ymm0, %ymm0 # sched: [8:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmaxud: ; BROADWELL: # %bb.0: @@ -3800,8 +3800,8 @@ ; HASWELL-LABEL: test_pmaxuw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpmaxuw %ymm1, %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: vpmaxuw (%rdi), %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpmaxuw (%rdi), %ymm0, %ymm0 # sched: [8:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmaxuw: ; BROADWELL: # %bb.0: @@ -3843,8 +3843,8 @@ ; HASWELL-LABEL: test_pminsb: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpminsb %ymm1, %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: vpminsb (%rdi), %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpminsb (%rdi), %ymm0, %ymm0 # sched: [8:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pminsb: ; BROADWELL: # %bb.0: @@ -3886,8 +3886,8 @@ ; HASWELL-LABEL: test_pminsd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpminsd %ymm1, %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: vpminsd (%rdi), %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpminsd (%rdi), %ymm0, %ymm0 # sched: [8:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pminsd: ; BROADWELL: # %bb.0: @@ -3929,8 +3929,8 @@ ; HASWELL-LABEL: test_pminsw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpminsw %ymm1, %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: vpminsw (%rdi), %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpminsw (%rdi), %ymm0, %ymm0 # sched: [8:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pminsw: ; BROADWELL: # %bb.0: @@ -3972,8 +3972,8 @@ ; HASWELL-LABEL: test_pminub: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpminub %ymm1, %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: vpminub (%rdi), %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpminub (%rdi), %ymm0, %ymm0 # sched: [8:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pminub: ; BROADWELL: # %bb.0: @@ -4015,8 +4015,8 @@ ; HASWELL-LABEL: test_pminud: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpminud %ymm1, %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: vpminud (%rdi), %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpminud (%rdi), %ymm0, %ymm0 # sched: [8:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pminud: ; BROADWELL: # %bb.0: @@ -4058,8 +4058,8 @@ ; HASWELL-LABEL: test_pminuw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpminuw %ymm1, %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: vpminuw (%rdi), %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpminuw (%rdi), %ymm0, %ymm0 # sched: [8:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pminuw: ; BROADWELL: # %bb.0: @@ -4102,7 +4102,7 @@ ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpmovmskb %ymm0, %eax # sched: [3:1.00] ; HASWELL-NEXT: vzeroupper # sched: [4:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmovmskb: ; BROADWELL: # %bb.0: @@ -4143,9 +4143,9 @@ ; HASWELL-LABEL: test_pmovsxbd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpmovsxbd %xmm0, %ymm0 # sched: [3:1.00] -; HASWELL-NEXT: vpmovsxbd (%rdi), %ymm1 # sched: [3:1.00] +; HASWELL-NEXT: vpmovsxbd (%rdi), %ymm1 # sched: [8:1.00] ; HASWELL-NEXT: vpaddd %ymm1, %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmovsxbd: ; BROADWELL: # %bb.0: @@ -4194,9 +4194,9 @@ ; HASWELL-LABEL: test_pmovsxbq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpmovsxbq %xmm0, %ymm0 # sched: [3:1.00] -; HASWELL-NEXT: vpmovsxbq (%rdi), %ymm1 # sched: [3:1.00] +; HASWELL-NEXT: vpmovsxbq (%rdi), %ymm1 # sched: [8:1.00] ; HASWELL-NEXT: vpaddq %ymm1, %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmovsxbq: ; BROADWELL: # %bb.0: @@ -4245,9 +4245,9 @@ ; HASWELL-LABEL: test_pmovsxbw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpmovsxbw %xmm0, %ymm0 # sched: [3:1.00] -; HASWELL-NEXT: vpmovsxbw (%rdi), %ymm1 # sched: [3:1.00] +; HASWELL-NEXT: vpmovsxbw (%rdi), %ymm1 # sched: [9:1.00] ; HASWELL-NEXT: vpaddw %ymm1, %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmovsxbw: ; BROADWELL: # %bb.0: @@ -4294,9 +4294,9 @@ ; HASWELL-LABEL: test_pmovsxdq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpmovsxdq %xmm0, %ymm0 # sched: [3:1.00] -; HASWELL-NEXT: vpmovsxdq (%rdi), %ymm1 # sched: [3:1.00] +; HASWELL-NEXT: vpmovsxdq (%rdi), %ymm1 # sched: [9:1.00] ; HASWELL-NEXT: vpaddq %ymm1, %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmovsxdq: ; BROADWELL: # %bb.0: @@ -4343,9 +4343,9 @@ ; HASWELL-LABEL: test_pmovsxwd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpmovsxwd %xmm0, %ymm0 # sched: [3:1.00] -; HASWELL-NEXT: vpmovsxwd (%rdi), %ymm1 # sched: [3:1.00] +; HASWELL-NEXT: vpmovsxwd (%rdi), %ymm1 # sched: [9:1.00] ; HASWELL-NEXT: vpaddd %ymm1, %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmovsxwd: ; BROADWELL: # %bb.0: @@ -4392,9 +4392,9 @@ ; HASWELL-LABEL: test_pmovsxwq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpmovsxwq %xmm0, %ymm0 # sched: [3:1.00] -; HASWELL-NEXT: vpmovsxwq (%rdi), %ymm1 # sched: [3:1.00] +; HASWELL-NEXT: vpmovsxwq (%rdi), %ymm1 # sched: [8:1.00] ; HASWELL-NEXT: vpaddq %ymm1, %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmovsxwq: ; BROADWELL: # %bb.0: @@ -4443,9 +4443,9 @@ ; HASWELL-LABEL: test_pmovzxbd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpmovzxbd {{.*#+}} ymm0 = xmm0[0],zero,zero,zero,xmm0[1],zero,zero,zero,xmm0[2],zero,zero,zero,xmm0[3],zero,zero,zero,xmm0[4],zero,zero,zero,xmm0[5],zero,zero,zero,xmm0[6],zero,zero,zero,xmm0[7],zero,zero,zero sched: [3:1.00] -; HASWELL-NEXT: vpmovzxbd {{.*#+}} ymm1 = mem[0],zero,zero,zero,mem[1],zero,zero,zero,mem[2],zero,zero,zero,mem[3],zero,zero,zero,mem[4],zero,zero,zero,mem[5],zero,zero,zero,mem[6],zero,zero,zero,mem[7],zero,zero,zero sched: [3:1.00] +; HASWELL-NEXT: vpmovzxbd {{.*#+}} ymm1 = mem[0],zero,zero,zero,mem[1],zero,zero,zero,mem[2],zero,zero,zero,mem[3],zero,zero,zero,mem[4],zero,zero,zero,mem[5],zero,zero,zero,mem[6],zero,zero,zero,mem[7],zero,zero,zero sched: [10:1.00] ; HASWELL-NEXT: vpaddd %ymm1, %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmovzxbd: ; BROADWELL: # %bb.0: @@ -4494,9 +4494,9 @@ ; HASWELL-LABEL: test_pmovzxbq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpmovzxbq {{.*#+}} ymm0 = xmm0[0],zero,zero,zero,zero,zero,zero,zero,xmm0[1],zero,zero,zero,zero,zero,zero,zero,xmm0[2],zero,zero,zero,zero,zero,zero,zero,xmm0[3],zero,zero,zero,zero,zero,zero,zero sched: [3:1.00] -; HASWELL-NEXT: vpmovzxbq {{.*#+}} ymm1 = mem[0],zero,zero,zero,zero,zero,zero,zero,mem[1],zero,zero,zero,zero,zero,zero,zero,mem[2],zero,zero,zero,zero,zero,zero,zero,mem[3],zero,zero,zero,zero,zero,zero,zero sched: [3:1.00] +; HASWELL-NEXT: vpmovzxbq {{.*#+}} ymm1 = mem[0],zero,zero,zero,zero,zero,zero,zero,mem[1],zero,zero,zero,zero,zero,zero,zero,mem[2],zero,zero,zero,zero,zero,zero,zero,mem[3],zero,zero,zero,zero,zero,zero,zero sched: [10:1.00] ; HASWELL-NEXT: vpaddq %ymm1, %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmovzxbq: ; BROADWELL: # %bb.0: @@ -4545,9 +4545,9 @@ ; HASWELL-LABEL: test_pmovzxbw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpmovzxbw {{.*#+}} ymm0 = xmm0[0],zero,xmm0[1],zero,xmm0[2],zero,xmm0[3],zero,xmm0[4],zero,xmm0[5],zero,xmm0[6],zero,xmm0[7],zero,xmm0[8],zero,xmm0[9],zero,xmm0[10],zero,xmm0[11],zero,xmm0[12],zero,xmm0[13],zero,xmm0[14],zero,xmm0[15],zero sched: [3:1.00] -; HASWELL-NEXT: vpmovzxbw {{.*#+}} ymm1 = mem[0],zero,mem[1],zero,mem[2],zero,mem[3],zero,mem[4],zero,mem[5],zero,mem[6],zero,mem[7],zero,mem[8],zero,mem[9],zero,mem[10],zero,mem[11],zero,mem[12],zero,mem[13],zero,mem[14],zero,mem[15],zero sched: [3:1.00] +; HASWELL-NEXT: vpmovzxbw {{.*#+}} ymm1 = mem[0],zero,mem[1],zero,mem[2],zero,mem[3],zero,mem[4],zero,mem[5],zero,mem[6],zero,mem[7],zero,mem[8],zero,mem[9],zero,mem[10],zero,mem[11],zero,mem[12],zero,mem[13],zero,mem[14],zero,mem[15],zero sched: [10:1.00] ; HASWELL-NEXT: vpaddw %ymm1, %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmovzxbw: ; BROADWELL: # %bb.0: @@ -4594,9 +4594,9 @@ ; HASWELL-LABEL: test_pmovzxdq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpmovzxdq {{.*#+}} ymm0 = xmm0[0],zero,xmm0[1],zero,xmm0[2],zero,xmm0[3],zero sched: [3:1.00] -; HASWELL-NEXT: vpmovzxdq {{.*#+}} ymm1 = mem[0],zero,mem[1],zero,mem[2],zero,mem[3],zero sched: [3:1.00] +; HASWELL-NEXT: vpmovzxdq {{.*#+}} ymm1 = mem[0],zero,mem[1],zero,mem[2],zero,mem[3],zero sched: [10:1.00] ; HASWELL-NEXT: vpaddq %ymm1, %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmovzxdq: ; BROADWELL: # %bb.0: @@ -4643,9 +4643,9 @@ ; HASWELL-LABEL: test_pmovzxwd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpmovzxwd {{.*#+}} ymm0 = xmm0[0],zero,xmm0[1],zero,xmm0[2],zero,xmm0[3],zero,xmm0[4],zero,xmm0[5],zero,xmm0[6],zero,xmm0[7],zero sched: [3:1.00] -; HASWELL-NEXT: vpmovzxwd {{.*#+}} ymm1 = mem[0],zero,mem[1],zero,mem[2],zero,mem[3],zero,mem[4],zero,mem[5],zero,mem[6],zero,mem[7],zero sched: [3:1.00] +; HASWELL-NEXT: vpmovzxwd {{.*#+}} ymm1 = mem[0],zero,mem[1],zero,mem[2],zero,mem[3],zero,mem[4],zero,mem[5],zero,mem[6],zero,mem[7],zero sched: [9:1.00] ; HASWELL-NEXT: vpaddd %ymm1, %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmovzxwd: ; BROADWELL: # %bb.0: @@ -4692,9 +4692,9 @@ ; HASWELL-LABEL: test_pmovzxwq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpmovzxwq {{.*#+}} ymm0 = xmm0[0],zero,zero,zero,xmm0[1],zero,zero,zero,xmm0[2],zero,zero,zero,xmm0[3],zero,zero,zero sched: [3:1.00] -; HASWELL-NEXT: vpmovzxwq {{.*#+}} ymm1 = mem[0],zero,zero,zero,mem[1],zero,zero,zero,mem[2],zero,zero,zero,mem[3],zero,zero,zero sched: [3:1.00] +; HASWELL-NEXT: vpmovzxwq {{.*#+}} ymm1 = mem[0],zero,zero,zero,mem[1],zero,zero,zero,mem[2],zero,zero,zero,mem[3],zero,zero,zero sched: [10:1.00] ; HASWELL-NEXT: vpaddq %ymm1, %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmovzxwq: ; BROADWELL: # %bb.0: @@ -4742,8 +4742,8 @@ ; HASWELL-LABEL: test_pmuldq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpmuldq %ymm1, %ymm0, %ymm0 # sched: [5:1.00] -; HASWELL-NEXT: vpmuldq (%rdi), %ymm0, %ymm0 # sched: [5:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpmuldq (%rdi), %ymm0, %ymm0 # sched: [12:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmuldq: ; BROADWELL: # %bb.0: @@ -4786,8 +4786,8 @@ ; HASWELL-LABEL: test_pmulhrsw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpmulhrsw %ymm1, %ymm0, %ymm0 # sched: [5:1.00] -; HASWELL-NEXT: vpmulhrsw (%rdi), %ymm0, %ymm0 # sched: [5:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpmulhrsw (%rdi), %ymm0, %ymm0 # sched: [12:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmulhrsw: ; BROADWELL: # %bb.0: @@ -4829,8 +4829,8 @@ ; HASWELL-LABEL: test_pmulhuw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpmulhuw %ymm1, %ymm0, %ymm0 # sched: [5:1.00] -; HASWELL-NEXT: vpmulhuw (%rdi), %ymm0, %ymm0 # sched: [5:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpmulhuw (%rdi), %ymm0, %ymm0 # sched: [12:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmulhuw: ; BROADWELL: # %bb.0: @@ -4872,8 +4872,8 @@ ; HASWELL-LABEL: test_pmulhw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpmulhw %ymm1, %ymm0, %ymm0 # sched: [5:1.00] -; HASWELL-NEXT: vpmulhw (%rdi), %ymm0, %ymm0 # sched: [5:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpmulhw (%rdi), %ymm0, %ymm0 # sched: [12:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmulhw: ; BROADWELL: # %bb.0: @@ -4915,8 +4915,8 @@ ; HASWELL-LABEL: test_pmulld: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpmulld %ymm1, %ymm0, %ymm0 # sched: [10:2.00] -; HASWELL-NEXT: vpmulld (%rdi), %ymm0, %ymm0 # sched: [10:2.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpmulld (%rdi), %ymm0, %ymm0 # sched: [17:2.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmulld: ; BROADWELL: # %bb.0: @@ -4957,8 +4957,8 @@ ; HASWELL-LABEL: test_pmullw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpmullw %ymm1, %ymm0, %ymm0 # sched: [5:1.00] -; HASWELL-NEXT: vpmullw (%rdi), %ymm0, %ymm0 # sched: [5:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpmullw (%rdi), %ymm0, %ymm0 # sched: [12:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmullw: ; BROADWELL: # %bb.0: @@ -4999,8 +4999,8 @@ ; HASWELL-LABEL: test_pmuludq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpmuludq %ymm1, %ymm0, %ymm0 # sched: [5:1.00] -; HASWELL-NEXT: vpmuludq (%rdi), %ymm0, %ymm0 # sched: [5:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpmuludq (%rdi), %ymm0, %ymm0 # sched: [12:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmuludq: ; BROADWELL: # %bb.0: @@ -5044,9 +5044,9 @@ ; HASWELL-LABEL: test_por: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpor %ymm1, %ymm0, %ymm0 # sched: [1:0.33] -; HASWELL-NEXT: vpor (%rdi), %ymm0, %ymm0 # sched: [1:0.50] +; HASWELL-NEXT: vpor (%rdi), %ymm0, %ymm0 # sched: [8:0.50] ; HASWELL-NEXT: vpaddq %ymm1, %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_por: ; BROADWELL: # %bb.0: @@ -5092,8 +5092,8 @@ ; HASWELL-LABEL: test_psadbw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpsadbw %ymm1, %ymm0, %ymm0 # sched: [5:1.00] -; HASWELL-NEXT: vpsadbw (%rdi), %ymm0, %ymm0 # sched: [5:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpsadbw (%rdi), %ymm0, %ymm0 # sched: [12:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_psadbw: ; BROADWELL: # %bb.0: @@ -5136,8 +5136,8 @@ ; HASWELL-LABEL: test_pshufb: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpshufb %ymm1, %ymm0, %ymm0 # sched: [1:1.00] -; HASWELL-NEXT: vpshufb (%rdi), %ymm0, %ymm0 # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpshufb (%rdi), %ymm0, %ymm0 # sched: [8:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pshufb: ; BROADWELL: # %bb.0: @@ -5180,9 +5180,9 @@ ; HASWELL-LABEL: test_pshufd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpshufd {{.*#+}} ymm0 = ymm0[3,2,1,0,7,6,5,4] sched: [1:1.00] -; HASWELL-NEXT: vpshufd {{.*#+}} ymm1 = mem[1,0,3,2,5,4,7,6] sched: [1:1.00] +; HASWELL-NEXT: vpshufd {{.*#+}} ymm1 = mem[1,0,3,2,5,4,7,6] sched: [8:1.00] ; HASWELL-NEXT: vpaddd %ymm1, %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pshufd: ; BROADWELL: # %bb.0: @@ -5229,9 +5229,9 @@ ; HASWELL-LABEL: test_pshufhw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpshufhw {{.*#+}} ymm0 = ymm0[0,1,2,3,7,6,5,4,8,9,10,11,15,14,13,12] sched: [1:1.00] -; HASWELL-NEXT: vpshufhw {{.*#+}} ymm1 = mem[0,1,2,3,5,4,7,6,8,9,10,11,13,12,15,14] sched: [1:1.00] +; HASWELL-NEXT: vpshufhw {{.*#+}} ymm1 = mem[0,1,2,3,5,4,7,6,8,9,10,11,13,12,15,14] sched: [8:1.00] ; HASWELL-NEXT: vpor %ymm1, %ymm0, %ymm0 # sched: [1:0.33] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pshufhw: ; BROADWELL: # %bb.0: @@ -5278,9 +5278,9 @@ ; HASWELL-LABEL: test_pshuflw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpshuflw {{.*#+}} ymm0 = ymm0[3,2,1,0,4,5,6,7,11,10,9,8,12,13,14,15] sched: [1:1.00] -; HASWELL-NEXT: vpshuflw {{.*#+}} ymm1 = mem[1,0,3,2,4,5,6,7,9,8,11,10,12,13,14,15] sched: [1:1.00] +; HASWELL-NEXT: vpshuflw {{.*#+}} ymm1 = mem[1,0,3,2,4,5,6,7,9,8,11,10,12,13,14,15] sched: [8:1.00] ; HASWELL-NEXT: vpor %ymm1, %ymm0, %ymm0 # sched: [1:0.33] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pshuflw: ; BROADWELL: # %bb.0: @@ -5326,8 +5326,8 @@ ; HASWELL-LABEL: test_psignb: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpsignb %ymm1, %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: vpsignb (%rdi), %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpsignb (%rdi), %ymm0, %ymm0 # sched: [8:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_psignb: ; BROADWELL: # %bb.0: @@ -5369,8 +5369,8 @@ ; HASWELL-LABEL: test_psignd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpsignd %ymm1, %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: vpsignd (%rdi), %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpsignd (%rdi), %ymm0, %ymm0 # sched: [8:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_psignd: ; BROADWELL: # %bb.0: @@ -5412,8 +5412,8 @@ ; HASWELL-LABEL: test_psignw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpsignw %ymm1, %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: vpsignw (%rdi), %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpsignw (%rdi), %ymm0, %ymm0 # sched: [8:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_psignw: ; BROADWELL: # %bb.0: @@ -5456,9 +5456,9 @@ ; HASWELL-LABEL: test_pslld: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpslld %xmm1, %ymm0, %ymm0 # sched: [4:1.00] -; HASWELL-NEXT: vpslld (%rdi), %ymm0, %ymm0 # sched: [1:1.00] +; HASWELL-NEXT: vpslld (%rdi), %ymm0, %ymm0 # sched: [8:1.00] ; HASWELL-NEXT: vpslld $2, %ymm0, %ymm0 # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pslld: ; BROADWELL: # %bb.0: @@ -5504,7 +5504,7 @@ ; HASWELL-LABEL: test_pslldq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpslldq {{.*#+}} ymm0 = zero,zero,zero,ymm0[0,1,2,3,4,5,6,7,8,9,10,11,12],zero,zero,zero,ymm0[16,17,18,19,20,21,22,23,24,25,26,27,28] sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pslldq: ; BROADWELL: # %bb.0: @@ -5540,9 +5540,9 @@ ; HASWELL-LABEL: test_psllq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpsllq %xmm1, %ymm0, %ymm0 # sched: [4:1.00] -; HASWELL-NEXT: vpsllq (%rdi), %ymm0, %ymm0 # sched: [1:1.00] +; HASWELL-NEXT: vpsllq (%rdi), %ymm0, %ymm0 # sched: [8:1.00] ; HASWELL-NEXT: vpsllq $2, %ymm0, %ymm0 # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_psllq: ; BROADWELL: # %bb.0: @@ -5589,8 +5589,8 @@ ; HASWELL-LABEL: test_psllvd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpsllvd %xmm1, %xmm0, %xmm0 # sched: [3:2.00] -; HASWELL-NEXT: vpsllvd (%rdi), %xmm0, %xmm0 # sched: [3:2.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpsllvd (%rdi), %xmm0, %xmm0 # sched: [9:2.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_psllvd: ; BROADWELL: # %bb.0: @@ -5632,8 +5632,8 @@ ; HASWELL-LABEL: test_psllvd_ymm: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpsllvd %ymm1, %ymm0, %ymm0 # sched: [3:2.00] -; HASWELL-NEXT: vpsllvd (%rdi), %ymm0, %ymm0 # sched: [3:2.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpsllvd (%rdi), %ymm0, %ymm0 # sched: [10:2.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_psllvd_ymm: ; BROADWELL: # %bb.0: @@ -5675,8 +5675,8 @@ ; HASWELL-LABEL: test_psllvq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpsllvq %xmm1, %xmm0, %xmm0 # sched: [1:1.00] -; HASWELL-NEXT: vpsllvq (%rdi), %xmm0, %xmm0 # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpsllvq (%rdi), %xmm0, %xmm0 # sched: [7:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_psllvq: ; BROADWELL: # %bb.0: @@ -5718,8 +5718,8 @@ ; HASWELL-LABEL: test_psllvq_ymm: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpsllvq %ymm1, %ymm0, %ymm0 # sched: [1:1.00] -; HASWELL-NEXT: vpsllvq (%rdi), %ymm0, %ymm0 # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpsllvq (%rdi), %ymm0, %ymm0 # sched: [8:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_psllvq_ymm: ; BROADWELL: # %bb.0: @@ -5762,9 +5762,9 @@ ; HASWELL-LABEL: test_psllw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpsllw %xmm1, %ymm0, %ymm0 # sched: [4:1.00] -; HASWELL-NEXT: vpsllw (%rdi), %ymm0, %ymm0 # sched: [1:1.00] +; HASWELL-NEXT: vpsllw (%rdi), %ymm0, %ymm0 # sched: [8:1.00] ; HASWELL-NEXT: vpsllw $2, %ymm0, %ymm0 # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_psllw: ; BROADWELL: # %bb.0: @@ -5812,9 +5812,9 @@ ; HASWELL-LABEL: test_psrad: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpsrad %xmm1, %ymm0, %ymm0 # sched: [4:1.00] -; HASWELL-NEXT: vpsrad (%rdi), %ymm0, %ymm0 # sched: [1:1.00] +; HASWELL-NEXT: vpsrad (%rdi), %ymm0, %ymm0 # sched: [8:1.00] ; HASWELL-NEXT: vpsrad $2, %ymm0, %ymm0 # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_psrad: ; BROADWELL: # %bb.0: @@ -5861,8 +5861,8 @@ ; HASWELL-LABEL: test_psravd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpsravd %xmm1, %xmm0, %xmm0 # sched: [3:2.00] -; HASWELL-NEXT: vpsravd (%rdi), %xmm0, %xmm0 # sched: [3:2.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpsravd (%rdi), %xmm0, %xmm0 # sched: [9:2.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_psravd: ; BROADWELL: # %bb.0: @@ -5904,8 +5904,8 @@ ; HASWELL-LABEL: test_psravd_ymm: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpsravd %ymm1, %ymm0, %ymm0 # sched: [3:2.00] -; HASWELL-NEXT: vpsravd (%rdi), %ymm0, %ymm0 # sched: [3:2.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpsravd (%rdi), %ymm0, %ymm0 # sched: [10:2.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_psravd_ymm: ; BROADWELL: # %bb.0: @@ -5948,9 +5948,9 @@ ; HASWELL-LABEL: test_psraw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpsraw %xmm1, %ymm0, %ymm0 # sched: [4:1.00] -; HASWELL-NEXT: vpsraw (%rdi), %ymm0, %ymm0 # sched: [1:1.00] +; HASWELL-NEXT: vpsraw (%rdi), %ymm0, %ymm0 # sched: [8:1.00] ; HASWELL-NEXT: vpsraw $2, %ymm0, %ymm0 # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_psraw: ; BROADWELL: # %bb.0: @@ -5998,9 +5998,9 @@ ; HASWELL-LABEL: test_psrld: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpsrld %xmm1, %ymm0, %ymm0 # sched: [4:1.00] -; HASWELL-NEXT: vpsrld (%rdi), %ymm0, %ymm0 # sched: [1:1.00] +; HASWELL-NEXT: vpsrld (%rdi), %ymm0, %ymm0 # sched: [8:1.00] ; HASWELL-NEXT: vpsrld $2, %ymm0, %ymm0 # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_psrld: ; BROADWELL: # %bb.0: @@ -6046,7 +6046,7 @@ ; HASWELL-LABEL: test_psrldq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpsrldq {{.*#+}} ymm0 = ymm0[3,4,5,6,7,8,9,10,11,12,13,14,15],zero,zero,zero,ymm0[19,20,21,22,23,24,25,26,27,28,29,30,31],zero,zero,zero sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_psrldq: ; BROADWELL: # %bb.0: @@ -6082,9 +6082,9 @@ ; HASWELL-LABEL: test_psrlq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpsrlq %xmm1, %ymm0, %ymm0 # sched: [4:1.00] -; HASWELL-NEXT: vpsrlq (%rdi), %ymm0, %ymm0 # sched: [1:1.00] +; HASWELL-NEXT: vpsrlq (%rdi), %ymm0, %ymm0 # sched: [8:1.00] ; HASWELL-NEXT: vpsrlq $2, %ymm0, %ymm0 # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_psrlq: ; BROADWELL: # %bb.0: @@ -6131,8 +6131,8 @@ ; HASWELL-LABEL: test_psrlvd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpsrlvd %xmm1, %xmm0, %xmm0 # sched: [3:2.00] -; HASWELL-NEXT: vpsrlvd (%rdi), %xmm0, %xmm0 # sched: [3:2.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpsrlvd (%rdi), %xmm0, %xmm0 # sched: [9:2.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_psrlvd: ; BROADWELL: # %bb.0: @@ -6174,8 +6174,8 @@ ; HASWELL-LABEL: test_psrlvd_ymm: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpsrlvd %ymm1, %ymm0, %ymm0 # sched: [3:2.00] -; HASWELL-NEXT: vpsrlvd (%rdi), %ymm0, %ymm0 # sched: [3:2.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpsrlvd (%rdi), %ymm0, %ymm0 # sched: [10:2.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_psrlvd_ymm: ; BROADWELL: # %bb.0: @@ -6217,8 +6217,8 @@ ; HASWELL-LABEL: test_psrlvq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpsrlvq %xmm1, %xmm0, %xmm0 # sched: [1:1.00] -; HASWELL-NEXT: vpsrlvq (%rdi), %xmm0, %xmm0 # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpsrlvq (%rdi), %xmm0, %xmm0 # sched: [7:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_psrlvq: ; BROADWELL: # %bb.0: @@ -6260,8 +6260,8 @@ ; HASWELL-LABEL: test_psrlvq_ymm: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpsrlvq %ymm1, %ymm0, %ymm0 # sched: [1:1.00] -; HASWELL-NEXT: vpsrlvq (%rdi), %ymm0, %ymm0 # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpsrlvq (%rdi), %ymm0, %ymm0 # sched: [8:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_psrlvq_ymm: ; BROADWELL: # %bb.0: @@ -6304,9 +6304,9 @@ ; HASWELL-LABEL: test_psrlw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpsrlw %xmm1, %ymm0, %ymm0 # sched: [4:1.00] -; HASWELL-NEXT: vpsrlw (%rdi), %ymm0, %ymm0 # sched: [1:1.00] +; HASWELL-NEXT: vpsrlw (%rdi), %ymm0, %ymm0 # sched: [8:1.00] ; HASWELL-NEXT: vpsrlw $2, %ymm0, %ymm0 # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_psrlw: ; BROADWELL: # %bb.0: @@ -6353,8 +6353,8 @@ ; HASWELL-LABEL: test_psubb: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpsubb %ymm1, %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: vpsubb (%rdi), %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpsubb (%rdi), %ymm0, %ymm0 # sched: [8:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_psubb: ; BROADWELL: # %bb.0: @@ -6395,8 +6395,8 @@ ; HASWELL-LABEL: test_psubd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpsubd %ymm1, %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: vpsubd (%rdi), %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpsubd (%rdi), %ymm0, %ymm0 # sched: [8:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_psubd: ; BROADWELL: # %bb.0: @@ -6437,8 +6437,8 @@ ; HASWELL-LABEL: test_psubq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpsubq %ymm1, %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: vpsubq (%rdi), %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpsubq (%rdi), %ymm0, %ymm0 # sched: [8:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_psubq: ; BROADWELL: # %bb.0: @@ -6479,8 +6479,8 @@ ; HASWELL-LABEL: test_psubsb: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpsubsb %ymm1, %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: vpsubsb (%rdi), %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpsubsb (%rdi), %ymm0, %ymm0 # sched: [8:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_psubsb: ; BROADWELL: # %bb.0: @@ -6522,8 +6522,8 @@ ; HASWELL-LABEL: test_psubsw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpsubsw %ymm1, %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: vpsubsw (%rdi), %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpsubsw (%rdi), %ymm0, %ymm0 # sched: [8:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_psubsw: ; BROADWELL: # %bb.0: @@ -6565,8 +6565,8 @@ ; HASWELL-LABEL: test_psubusb: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpsubusb %ymm1, %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: vpsubusb (%rdi), %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpsubusb (%rdi), %ymm0, %ymm0 # sched: [8:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_psubusb: ; BROADWELL: # %bb.0: @@ -6608,8 +6608,8 @@ ; HASWELL-LABEL: test_psubusw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpsubusw %ymm1, %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: vpsubusw (%rdi), %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpsubusw (%rdi), %ymm0, %ymm0 # sched: [8:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_psubusw: ; BROADWELL: # %bb.0: @@ -6651,8 +6651,8 @@ ; HASWELL-LABEL: test_psubw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpsubw %ymm1, %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: vpsubw (%rdi), %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpsubw (%rdi), %ymm0, %ymm0 # sched: [8:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_psubw: ; BROADWELL: # %bb.0: @@ -6693,8 +6693,8 @@ ; HASWELL-LABEL: test_punpckhbw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpunpckhbw {{.*#+}} ymm0 = ymm0[8],ymm1[8],ymm0[9],ymm1[9],ymm0[10],ymm1[10],ymm0[11],ymm1[11],ymm0[12],ymm1[12],ymm0[13],ymm1[13],ymm0[14],ymm1[14],ymm0[15],ymm1[15],ymm0[24],ymm1[24],ymm0[25],ymm1[25],ymm0[26],ymm1[26],ymm0[27],ymm1[27],ymm0[28],ymm1[28],ymm0[29],ymm1[29],ymm0[30],ymm1[30],ymm0[31],ymm1[31] sched: [1:1.00] -; HASWELL-NEXT: vpunpckhbw {{.*#+}} ymm0 = ymm0[8],mem[8],ymm0[9],mem[9],ymm0[10],mem[10],ymm0[11],mem[11],ymm0[12],mem[12],ymm0[13],mem[13],ymm0[14],mem[14],ymm0[15],mem[15],ymm0[24],mem[24],ymm0[25],mem[25],ymm0[26],mem[26],ymm0[27],mem[27],ymm0[28],mem[28],ymm0[29],mem[29],ymm0[30],mem[30],ymm0[31],mem[31] sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpunpckhbw {{.*#+}} ymm0 = ymm0[8],mem[8],ymm0[9],mem[9],ymm0[10],mem[10],ymm0[11],mem[11],ymm0[12],mem[12],ymm0[13],mem[13],ymm0[14],mem[14],ymm0[15],mem[15],ymm0[24],mem[24],ymm0[25],mem[25],ymm0[26],mem[26],ymm0[27],mem[27],ymm0[28],mem[28],ymm0[29],mem[29],ymm0[30],mem[30],ymm0[31],mem[31] sched: [8:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_punpckhbw: ; BROADWELL: # %bb.0: @@ -6737,10 +6737,10 @@ ; HASWELL-LABEL: test_punpckhdq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpunpckhdq {{.*#+}} ymm0 = ymm0[2],ymm1[2],ymm0[3],ymm1[3],ymm0[6],ymm1[6],ymm0[7],ymm1[7] sched: [1:1.00] -; HASWELL-NEXT: vpunpckhdq {{.*#+}} ymm0 = ymm0[2],mem[2],ymm0[3],mem[3],ymm0[6],mem[6],ymm0[7],mem[7] sched: [1:1.00] +; HASWELL-NEXT: vpunpckhdq {{.*#+}} ymm0 = ymm0[2],mem[2],ymm0[3],mem[3],ymm0[6],mem[6],ymm0[7],mem[7] sched: [8:1.00] ; HASWELL-NEXT: vpcmpeqd %ymm1, %ymm1, %ymm1 # sched: [1:0.50] ; HASWELL-NEXT: vpsubd %ymm1, %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_punpckhdq: ; BROADWELL: # %bb.0: @@ -6791,9 +6791,9 @@ ; HASWELL-LABEL: test_punpckhqdq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpunpckhqdq {{.*#+}} ymm1 = ymm0[1],ymm1[1],ymm0[3],ymm1[3] sched: [1:1.00] -; HASWELL-NEXT: vpunpckhqdq {{.*#+}} ymm0 = ymm0[1],mem[1],ymm0[3],mem[3] sched: [1:1.00] +; HASWELL-NEXT: vpunpckhqdq {{.*#+}} ymm0 = ymm0[1],mem[1],ymm0[3],mem[3] sched: [8:1.00] ; HASWELL-NEXT: vpaddq %ymm0, %ymm1, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_punpckhqdq: ; BROADWELL: # %bb.0: @@ -6839,8 +6839,8 @@ ; HASWELL-LABEL: test_punpckhwd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpunpckhwd {{.*#+}} ymm0 = ymm0[4],ymm1[4],ymm0[5],ymm1[5],ymm0[6],ymm1[6],ymm0[7],ymm1[7],ymm0[12],ymm1[12],ymm0[13],ymm1[13],ymm0[14],ymm1[14],ymm0[15],ymm1[15] sched: [1:1.00] -; HASWELL-NEXT: vpunpckhwd {{.*#+}} ymm0 = ymm0[4],mem[4],ymm0[5],mem[5],ymm0[6],mem[6],ymm0[7],mem[7],ymm0[12],mem[12],ymm0[13],mem[13],ymm0[14],mem[14],ymm0[15],mem[15] sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpunpckhwd {{.*#+}} ymm0 = ymm0[4],mem[4],ymm0[5],mem[5],ymm0[6],mem[6],ymm0[7],mem[7],ymm0[12],mem[12],ymm0[13],mem[13],ymm0[14],mem[14],ymm0[15],mem[15] sched: [8:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_punpckhwd: ; BROADWELL: # %bb.0: @@ -6881,8 +6881,8 @@ ; HASWELL-LABEL: test_punpcklbw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpunpcklbw {{.*#+}} ymm0 = ymm0[0],ymm1[0],ymm0[1],ymm1[1],ymm0[2],ymm1[2],ymm0[3],ymm1[3],ymm0[4],ymm1[4],ymm0[5],ymm1[5],ymm0[6],ymm1[6],ymm0[7],ymm1[7],ymm0[16],ymm1[16],ymm0[17],ymm1[17],ymm0[18],ymm1[18],ymm0[19],ymm1[19],ymm0[20],ymm1[20],ymm0[21],ymm1[21],ymm0[22],ymm1[22],ymm0[23],ymm1[23] sched: [1:1.00] -; HASWELL-NEXT: vpunpcklbw {{.*#+}} ymm0 = ymm0[0],mem[0],ymm0[1],mem[1],ymm0[2],mem[2],ymm0[3],mem[3],ymm0[4],mem[4],ymm0[5],mem[5],ymm0[6],mem[6],ymm0[7],mem[7],ymm0[16],mem[16],ymm0[17],mem[17],ymm0[18],mem[18],ymm0[19],mem[19],ymm0[20],mem[20],ymm0[21],mem[21],ymm0[22],mem[22],ymm0[23],mem[23] sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpunpcklbw {{.*#+}} ymm0 = ymm0[0],mem[0],ymm0[1],mem[1],ymm0[2],mem[2],ymm0[3],mem[3],ymm0[4],mem[4],ymm0[5],mem[5],ymm0[6],mem[6],ymm0[7],mem[7],ymm0[16],mem[16],ymm0[17],mem[17],ymm0[18],mem[18],ymm0[19],mem[19],ymm0[20],mem[20],ymm0[21],mem[21],ymm0[22],mem[22],ymm0[23],mem[23] sched: [8:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_punpcklbw: ; BROADWELL: # %bb.0: @@ -6925,10 +6925,10 @@ ; HASWELL-LABEL: test_punpckldq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpunpckldq {{.*#+}} ymm0 = ymm0[0],ymm1[0],ymm0[1],ymm1[1],ymm0[4],ymm1[4],ymm0[5],ymm1[5] sched: [1:1.00] -; HASWELL-NEXT: vpunpckldq {{.*#+}} ymm0 = ymm0[0],mem[0],ymm0[1],mem[1],ymm0[4],mem[4],ymm0[5],mem[5] sched: [1:1.00] +; HASWELL-NEXT: vpunpckldq {{.*#+}} ymm0 = ymm0[0],mem[0],ymm0[1],mem[1],ymm0[4],mem[4],ymm0[5],mem[5] sched: [8:1.00] ; HASWELL-NEXT: vpcmpeqd %ymm1, %ymm1, %ymm1 # sched: [1:0.50] ; HASWELL-NEXT: vpsubd %ymm1, %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_punpckldq: ; BROADWELL: # %bb.0: @@ -6979,9 +6979,9 @@ ; HASWELL-LABEL: test_punpcklqdq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpunpcklqdq {{.*#+}} ymm1 = ymm0[0],ymm1[0],ymm0[2],ymm1[2] sched: [1:1.00] -; HASWELL-NEXT: vpunpcklqdq {{.*#+}} ymm0 = ymm0[0],mem[0],ymm0[2],mem[2] sched: [1:1.00] +; HASWELL-NEXT: vpunpcklqdq {{.*#+}} ymm0 = ymm0[0],mem[0],ymm0[2],mem[2] sched: [8:1.00] ; HASWELL-NEXT: vpaddq %ymm0, %ymm1, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_punpcklqdq: ; BROADWELL: # %bb.0: @@ -7027,8 +7027,8 @@ ; HASWELL-LABEL: test_punpcklwd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpunpcklwd {{.*#+}} ymm0 = ymm0[0],ymm1[0],ymm0[1],ymm1[1],ymm0[2],ymm1[2],ymm0[3],ymm1[3],ymm0[8],ymm1[8],ymm0[9],ymm1[9],ymm0[10],ymm1[10],ymm0[11],ymm1[11] sched: [1:1.00] -; HASWELL-NEXT: vpunpcklwd {{.*#+}} ymm0 = ymm0[0],mem[0],ymm0[1],mem[1],ymm0[2],mem[2],ymm0[3],mem[3],ymm0[8],mem[8],ymm0[9],mem[9],ymm0[10],mem[10],ymm0[11],mem[11] sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpunpcklwd {{.*#+}} ymm0 = ymm0[0],mem[0],ymm0[1],mem[1],ymm0[2],mem[2],ymm0[3],mem[3],ymm0[8],mem[8],ymm0[9],mem[9],ymm0[10],mem[10],ymm0[11],mem[11] sched: [8:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_punpcklwd: ; BROADWELL: # %bb.0: @@ -7070,9 +7070,9 @@ ; HASWELL-LABEL: test_pxor: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpxor %ymm1, %ymm0, %ymm0 # sched: [1:0.33] -; HASWELL-NEXT: vpxor (%rdi), %ymm0, %ymm0 # sched: [1:0.50] +; HASWELL-NEXT: vpxor (%rdi), %ymm0, %ymm0 # sched: [8:0.50] ; HASWELL-NEXT: vpaddq %ymm1, %ymm0, %ymm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pxor: ; BROADWELL: # %bb.0: Index: test/CodeGen/X86/avx512-bugfix-23634.ll =================================================================== --- test/CodeGen/X86/avx512-bugfix-23634.ll +++ test/CodeGen/X86/avx512-bugfix-23634.ll @@ -16,8 +16,8 @@ ; CHECK-NEXT: movw $-21846, %ax ## imm = 0xAAAA ; CHECK-NEXT: kmovw %eax, %k1 ; CHECK-NEXT: vmovdqa32 {{.*}}(%rip), %zmm1 {%k1} -; CHECK-NEXT: vpaddd %zmm1, %zmm0, %zmm0 ; CHECK-NEXT: vpaddd %zmm0, %zmm2, %zmm0 +; CHECK-NEXT: vpaddd %zmm1, %zmm0, %zmm0 ; CHECK-NEXT: vcvtdq2ps %zmm0, %zmm0 ; CHECK-NEXT: vmovups %zmm0, (%rdi) ; CHECK-NEXT: retq Index: test/CodeGen/X86/bmi-schedule.ll =================================================================== --- test/CodeGen/X86/bmi-schedule.ll +++ test/CodeGen/X86/bmi-schedule.ll @@ -21,10 +21,10 @@ ; HASWELL: # %bb.0: ; HASWELL-NEXT: andnl %esi, %edi, %eax # sched: [1:0.50] ; HASWELL-NEXT: notl %edi # sched: [1:0.25] -; HASWELL-NEXT: andw (%rdx), %di # sched: [1:0.50] +; HASWELL-NEXT: andw (%rdx), %di # sched: [6:0.50] ; HASWELL-NEXT: addl %edi, %eax # sched: [1:0.25] ; HASWELL-NEXT: # kill: %ax %ax %eax -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_andn_i16: ; BROADWELL: # %bb.0: @@ -80,9 +80,9 @@ ; HASWELL-LABEL: test_andn_i32: ; HASWELL: # %bb.0: ; HASWELL-NEXT: andnl %esi, %edi, %ecx # sched: [1:0.50] -; HASWELL-NEXT: andnl (%rdx), %edi, %eax # sched: [1:0.50] +; HASWELL-NEXT: andnl (%rdx), %edi, %eax # sched: [6:0.50] ; HASWELL-NEXT: addl %ecx, %eax # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_andn_i32: ; BROADWELL: # %bb.0: @@ -130,9 +130,9 @@ ; HASWELL-LABEL: test_andn_i64: ; HASWELL: # %bb.0: ; HASWELL-NEXT: andnq %rsi, %rdi, %rcx # sched: [1:0.50] -; HASWELL-NEXT: andnq (%rdx), %rdi, %rax # sched: [1:0.50] +; HASWELL-NEXT: andnq (%rdx), %rdi, %rax # sched: [6:0.50] ; HASWELL-NEXT: addq %rcx, %rax # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_andn_i64: ; BROADWELL: # %bb.0: @@ -179,10 +179,10 @@ ; ; HASWELL-LABEL: test_bextr_i32: ; HASWELL: # %bb.0: -; HASWELL-NEXT: bextrl %edi, (%rdx), %ecx # sched: [2:0.50] +; HASWELL-NEXT: bextrl %edi, (%rdx), %ecx # sched: [7:0.50] ; HASWELL-NEXT: bextrl %edi, %esi, %eax # sched: [2:0.50] ; HASWELL-NEXT: addl %ecx, %eax # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_bextr_i32: ; BROADWELL: # %bb.0: @@ -229,10 +229,10 @@ ; ; HASWELL-LABEL: test_bextr_i64: ; HASWELL: # %bb.0: -; HASWELL-NEXT: bextrq %rdi, (%rdx), %rcx # sched: [2:0.50] +; HASWELL-NEXT: bextrq %rdi, (%rdx), %rcx # sched: [7:0.50] ; HASWELL-NEXT: bextrq %rdi, %rsi, %rax # sched: [2:0.50] ; HASWELL-NEXT: addq %rcx, %rax # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_bextr_i64: ; BROADWELL: # %bb.0: @@ -279,10 +279,10 @@ ; ; HASWELL-LABEL: test_blsi_i32: ; HASWELL: # %bb.0: -; HASWELL-NEXT: blsil (%rsi), %ecx # sched: [1:0.50] +; HASWELL-NEXT: blsil (%rsi), %ecx # sched: [6:0.50] ; HASWELL-NEXT: blsil %edi, %eax # sched: [1:0.50] ; HASWELL-NEXT: addl %ecx, %eax # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_blsi_i32: ; BROADWELL: # %bb.0: @@ -330,10 +330,10 @@ ; ; HASWELL-LABEL: test_blsi_i64: ; HASWELL: # %bb.0: -; HASWELL-NEXT: blsiq (%rsi), %rcx # sched: [1:0.50] +; HASWELL-NEXT: blsiq (%rsi), %rcx # sched: [6:0.50] ; HASWELL-NEXT: blsiq %rdi, %rax # sched: [1:0.50] ; HASWELL-NEXT: addq %rcx, %rax # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_blsi_i64: ; BROADWELL: # %bb.0: @@ -381,10 +381,10 @@ ; ; HASWELL-LABEL: test_blsmsk_i32: ; HASWELL: # %bb.0: -; HASWELL-NEXT: blsmskl (%rsi), %ecx # sched: [1:0.50] +; HASWELL-NEXT: blsmskl (%rsi), %ecx # sched: [6:0.50] ; HASWELL-NEXT: blsmskl %edi, %eax # sched: [1:0.50] ; HASWELL-NEXT: addl %ecx, %eax # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_blsmsk_i32: ; BROADWELL: # %bb.0: @@ -432,10 +432,10 @@ ; ; HASWELL-LABEL: test_blsmsk_i64: ; HASWELL: # %bb.0: -; HASWELL-NEXT: blsmskq (%rsi), %rcx # sched: [1:0.50] +; HASWELL-NEXT: blsmskq (%rsi), %rcx # sched: [6:0.50] ; HASWELL-NEXT: blsmskq %rdi, %rax # sched: [1:0.50] ; HASWELL-NEXT: addq %rcx, %rax # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_blsmsk_i64: ; BROADWELL: # %bb.0: @@ -483,10 +483,10 @@ ; ; HASWELL-LABEL: test_blsr_i32: ; HASWELL: # %bb.0: -; HASWELL-NEXT: blsrl (%rsi), %ecx # sched: [1:0.50] +; HASWELL-NEXT: blsrl (%rsi), %ecx # sched: [6:0.50] ; HASWELL-NEXT: blsrl %edi, %eax # sched: [1:0.50] ; HASWELL-NEXT: addl %ecx, %eax # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_blsr_i32: ; BROADWELL: # %bb.0: @@ -534,10 +534,10 @@ ; ; HASWELL-LABEL: test_blsr_i64: ; HASWELL: # %bb.0: -; HASWELL-NEXT: blsrq (%rsi), %rcx # sched: [1:0.50] +; HASWELL-NEXT: blsrq (%rsi), %rcx # sched: [6:0.50] ; HASWELL-NEXT: blsrq %rdi, %rax # sched: [1:0.50] ; HASWELL-NEXT: addq %rcx, %rax # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_blsr_i64: ; BROADWELL: # %bb.0: @@ -586,11 +586,11 @@ ; ; HASWELL-LABEL: test_cttz_i16: ; HASWELL: # %bb.0: -; HASWELL-NEXT: tzcntw (%rsi), %cx # sched: [3:1.00] +; HASWELL-NEXT: tzcntw (%rsi), %cx # sched: [8:1.00] ; HASWELL-NEXT: tzcntw %di, %ax # sched: [3:1.00] ; HASWELL-NEXT: orl %ecx, %eax # sched: [1:0.25] ; HASWELL-NEXT: # kill: %ax %ax %eax -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_cttz_i16: ; BROADWELL: # %bb.0: @@ -641,10 +641,10 @@ ; ; HASWELL-LABEL: test_cttz_i32: ; HASWELL: # %bb.0: -; HASWELL-NEXT: tzcntl (%rsi), %ecx # sched: [3:1.00] +; HASWELL-NEXT: tzcntl (%rsi), %ecx # sched: [8:1.00] ; HASWELL-NEXT: tzcntl %edi, %eax # sched: [3:1.00] ; HASWELL-NEXT: orl %ecx, %eax # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_cttz_i32: ; BROADWELL: # %bb.0: @@ -691,10 +691,10 @@ ; ; HASWELL-LABEL: test_cttz_i64: ; HASWELL: # %bb.0: -; HASWELL-NEXT: tzcntq (%rsi), %rcx # sched: [3:1.00] +; HASWELL-NEXT: tzcntq (%rsi), %rcx # sched: [8:1.00] ; HASWELL-NEXT: tzcntq %rdi, %rax # sched: [3:1.00] ; HASWELL-NEXT: orq %rcx, %rax # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_cttz_i64: ; BROADWELL: # %bb.0: Index: test/CodeGen/X86/bmi2-schedule.ll =================================================================== --- test/CodeGen/X86/bmi2-schedule.ll +++ test/CodeGen/X86/bmi2-schedule.ll @@ -16,10 +16,10 @@ ; ; HASWELL-LABEL: test_bzhi_i32: ; HASWELL: # %bb.0: -; HASWELL-NEXT: bzhil %edi, (%rdx), %ecx # sched: [1:0.50] +; HASWELL-NEXT: bzhil %edi, (%rdx), %ecx # sched: [6:0.50] ; HASWELL-NEXT: bzhil %edi, %esi, %eax # sched: [1:0.50] ; HASWELL-NEXT: addl %ecx, %eax # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_bzhi_i32: ; BROADWELL: # %bb.0: @@ -37,10 +37,10 @@ ; ; KNL-LABEL: test_bzhi_i32: ; KNL: # %bb.0: -; KNL-NEXT: bzhil %edi, (%rdx), %ecx # sched: [1:0.50] +; KNL-NEXT: bzhil %edi, (%rdx), %ecx # sched: [6:0.50] ; KNL-NEXT: bzhil %edi, %esi, %eax # sched: [1:0.50] ; KNL-NEXT: addl %ecx, %eax # sched: [1:0.25] -; KNL-NEXT: retq # sched: [2:1.00] +; KNL-NEXT: retq # sched: [7:1.00] ; ; ZNVER1-LABEL: test_bzhi_i32: ; ZNVER1: # %bb.0: @@ -66,10 +66,10 @@ ; ; HASWELL-LABEL: test_bzhi_i64: ; HASWELL: # %bb.0: -; HASWELL-NEXT: bzhiq %rdi, (%rdx), %rcx # sched: [1:0.50] +; HASWELL-NEXT: bzhiq %rdi, (%rdx), %rcx # sched: [6:0.50] ; HASWELL-NEXT: bzhiq %rdi, %rsi, %rax # sched: [1:0.50] ; HASWELL-NEXT: addq %rcx, %rax # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_bzhi_i64: ; BROADWELL: # %bb.0: @@ -87,10 +87,10 @@ ; ; KNL-LABEL: test_bzhi_i64: ; KNL: # %bb.0: -; KNL-NEXT: bzhiq %rdi, (%rdx), %rcx # sched: [1:0.50] +; KNL-NEXT: bzhiq %rdi, (%rdx), %rcx # sched: [6:0.50] ; KNL-NEXT: bzhiq %rdi, %rsi, %rax # sched: [1:0.50] ; KNL-NEXT: addq %rcx, %rax # sched: [1:0.25] -; KNL-NEXT: retq # sched: [2:1.00] +; KNL-NEXT: retq # sched: [7:1.00] ; ; ZNVER1-LABEL: test_bzhi_i64: ; ZNVER1: # %bb.0: @@ -123,9 +123,9 @@ ; HASWELL-NEXT: movq %rdx, %rax # sched: [1:0.25] ; HASWELL-NEXT: movq %rdi, %rdx # sched: [1:0.25] ; HASWELL-NEXT: mulxq %rsi, %rsi, %rcx # sched: [4:1.00] -; HASWELL-NEXT: mulxq (%rax), %rdx, %rax # sched: [4:1.00] +; HASWELL-NEXT: mulxq (%rax), %rdx, %rax # sched: [9:1.00] ; HASWELL-NEXT: orq %rcx, %rax # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_mulx_i64: ; BROADWELL: # %bb.0: @@ -150,9 +150,9 @@ ; KNL-NEXT: movq %rdx, %rax # sched: [1:0.25] ; KNL-NEXT: movq %rdi, %rdx # sched: [1:0.25] ; KNL-NEXT: mulxq %rsi, %rsi, %rcx # sched: [4:1.00] -; KNL-NEXT: mulxq (%rax), %rdx, %rax # sched: [4:1.00] +; KNL-NEXT: mulxq (%rax), %rdx, %rax # sched: [9:1.00] ; KNL-NEXT: orq %rcx, %rax # sched: [1:0.25] -; KNL-NEXT: retq # sched: [2:1.00] +; KNL-NEXT: retq # sched: [7:1.00] ; ; ZNVER1-LABEL: test_mulx_i64: ; ZNVER1: # %bb.0: @@ -186,10 +186,10 @@ ; ; HASWELL-LABEL: test_pdep_i32: ; HASWELL: # %bb.0: -; HASWELL-NEXT: pdepl (%rdx), %edi, %ecx # sched: [3:1.00] +; HASWELL-NEXT: pdepl (%rdx), %edi, %ecx # sched: [8:1.00] ; HASWELL-NEXT: pdepl %esi, %edi, %eax # sched: [3:1.00] ; HASWELL-NEXT: addl %ecx, %eax # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pdep_i32: ; BROADWELL: # %bb.0: @@ -207,10 +207,10 @@ ; ; KNL-LABEL: test_pdep_i32: ; KNL: # %bb.0: -; KNL-NEXT: pdepl (%rdx), %edi, %ecx # sched: [3:1.00] +; KNL-NEXT: pdepl (%rdx), %edi, %ecx # sched: [8:1.00] ; KNL-NEXT: pdepl %esi, %edi, %eax # sched: [3:1.00] ; KNL-NEXT: addl %ecx, %eax # sched: [1:0.25] -; KNL-NEXT: retq # sched: [2:1.00] +; KNL-NEXT: retq # sched: [7:1.00] ; ; ZNVER1-LABEL: test_pdep_i32: ; ZNVER1: # %bb.0: @@ -236,10 +236,10 @@ ; ; HASWELL-LABEL: test_pdep_i64: ; HASWELL: # %bb.0: -; HASWELL-NEXT: pdepq (%rdx), %rdi, %rcx # sched: [3:1.00] +; HASWELL-NEXT: pdepq (%rdx), %rdi, %rcx # sched: [8:1.00] ; HASWELL-NEXT: pdepq %rsi, %rdi, %rax # sched: [3:1.00] ; HASWELL-NEXT: addq %rcx, %rax # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pdep_i64: ; BROADWELL: # %bb.0: @@ -257,10 +257,10 @@ ; ; KNL-LABEL: test_pdep_i64: ; KNL: # %bb.0: -; KNL-NEXT: pdepq (%rdx), %rdi, %rcx # sched: [3:1.00] +; KNL-NEXT: pdepq (%rdx), %rdi, %rcx # sched: [8:1.00] ; KNL-NEXT: pdepq %rsi, %rdi, %rax # sched: [3:1.00] ; KNL-NEXT: addq %rcx, %rax # sched: [1:0.25] -; KNL-NEXT: retq # sched: [2:1.00] +; KNL-NEXT: retq # sched: [7:1.00] ; ; ZNVER1-LABEL: test_pdep_i64: ; ZNVER1: # %bb.0: @@ -286,10 +286,10 @@ ; ; HASWELL-LABEL: test_pext_i32: ; HASWELL: # %bb.0: -; HASWELL-NEXT: pextl (%rdx), %edi, %ecx # sched: [3:1.00] +; HASWELL-NEXT: pextl (%rdx), %edi, %ecx # sched: [8:1.00] ; HASWELL-NEXT: pextl %esi, %edi, %eax # sched: [3:1.00] ; HASWELL-NEXT: addl %ecx, %eax # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pext_i32: ; BROADWELL: # %bb.0: @@ -307,10 +307,10 @@ ; ; KNL-LABEL: test_pext_i32: ; KNL: # %bb.0: -; KNL-NEXT: pextl (%rdx), %edi, %ecx # sched: [3:1.00] +; KNL-NEXT: pextl (%rdx), %edi, %ecx # sched: [8:1.00] ; KNL-NEXT: pextl %esi, %edi, %eax # sched: [3:1.00] ; KNL-NEXT: addl %ecx, %eax # sched: [1:0.25] -; KNL-NEXT: retq # sched: [2:1.00] +; KNL-NEXT: retq # sched: [7:1.00] ; ; ZNVER1-LABEL: test_pext_i32: ; ZNVER1: # %bb.0: @@ -336,10 +336,10 @@ ; ; HASWELL-LABEL: test_pext_i64: ; HASWELL: # %bb.0: -; HASWELL-NEXT: pextq (%rdx), %rdi, %rcx # sched: [3:1.00] +; HASWELL-NEXT: pextq (%rdx), %rdi, %rcx # sched: [8:1.00] ; HASWELL-NEXT: pextq %rsi, %rdi, %rax # sched: [3:1.00] ; HASWELL-NEXT: addq %rcx, %rax # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pext_i64: ; BROADWELL: # %bb.0: @@ -357,10 +357,10 @@ ; ; KNL-LABEL: test_pext_i64: ; KNL: # %bb.0: -; KNL-NEXT: pextq (%rdx), %rdi, %rcx # sched: [3:1.00] +; KNL-NEXT: pextq (%rdx), %rdi, %rcx # sched: [8:1.00] ; KNL-NEXT: pextq %rsi, %rdi, %rax # sched: [3:1.00] ; KNL-NEXT: addq %rcx, %rax # sched: [1:0.25] -; KNL-NEXT: retq # sched: [2:1.00] +; KNL-NEXT: retq # sched: [7:1.00] ; ; ZNVER1-LABEL: test_pext_i64: ; ZNVER1: # %bb.0: @@ -387,9 +387,9 @@ ; HASWELL-LABEL: test_rorx_i32: ; HASWELL: # %bb.0: ; HASWELL-NEXT: rorxl $5, %edi, %ecx # sched: [1:0.50] -; HASWELL-NEXT: rorxl $5, (%rdx), %eax # sched: [1:0.50] +; HASWELL-NEXT: rorxl $5, (%rdx), %eax # sched: [6:0.50] ; HASWELL-NEXT: addl %ecx, %eax # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_rorx_i32: ; BROADWELL: # %bb.0: @@ -408,9 +408,9 @@ ; KNL-LABEL: test_rorx_i32: ; KNL: # %bb.0: ; KNL-NEXT: rorxl $5, %edi, %ecx # sched: [1:0.50] -; KNL-NEXT: rorxl $5, (%rdx), %eax # sched: [1:0.50] +; KNL-NEXT: rorxl $5, (%rdx), %eax # sched: [6:0.50] ; KNL-NEXT: addl %ecx, %eax # sched: [1:0.25] -; KNL-NEXT: retq # sched: [2:1.00] +; KNL-NEXT: retq # sched: [7:1.00] ; ; ZNVER1-LABEL: test_rorx_i32: ; ZNVER1: # %bb.0: @@ -440,9 +440,9 @@ ; HASWELL-LABEL: test_rorx_i64: ; HASWELL: # %bb.0: ; HASWELL-NEXT: rorxq $5, %rdi, %rcx # sched: [1:0.50] -; HASWELL-NEXT: rorxq $5, (%rdx), %rax # sched: [1:0.50] +; HASWELL-NEXT: rorxq $5, (%rdx), %rax # sched: [6:0.50] ; HASWELL-NEXT: addq %rcx, %rax # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_rorx_i64: ; BROADWELL: # %bb.0: @@ -461,9 +461,9 @@ ; KNL-LABEL: test_rorx_i64: ; KNL: # %bb.0: ; KNL-NEXT: rorxq $5, %rdi, %rcx # sched: [1:0.50] -; KNL-NEXT: rorxq $5, (%rdx), %rax # sched: [1:0.50] +; KNL-NEXT: rorxq $5, (%rdx), %rax # sched: [6:0.50] ; KNL-NEXT: addq %rcx, %rax # sched: [1:0.25] -; KNL-NEXT: retq # sched: [2:1.00] +; KNL-NEXT: retq # sched: [7:1.00] ; ; ZNVER1-LABEL: test_rorx_i64: ; ZNVER1: # %bb.0: @@ -493,9 +493,9 @@ ; HASWELL-LABEL: test_sarx_i32: ; HASWELL: # %bb.0: ; HASWELL-NEXT: sarxl %esi, %edi, %ecx # sched: [1:0.50] -; HASWELL-NEXT: sarxl %esi, (%rdx), %eax # sched: [1:0.50] +; HASWELL-NEXT: sarxl %esi, (%rdx), %eax # sched: [6:0.50] ; HASWELL-NEXT: addl %ecx, %eax # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_sarx_i32: ; BROADWELL: # %bb.0: @@ -514,9 +514,9 @@ ; KNL-LABEL: test_sarx_i32: ; KNL: # %bb.0: ; KNL-NEXT: sarxl %esi, %edi, %ecx # sched: [1:0.50] -; KNL-NEXT: sarxl %esi, (%rdx), %eax # sched: [1:0.50] +; KNL-NEXT: sarxl %esi, (%rdx), %eax # sched: [6:0.50] ; KNL-NEXT: addl %ecx, %eax # sched: [1:0.25] -; KNL-NEXT: retq # sched: [2:1.00] +; KNL-NEXT: retq # sched: [7:1.00] ; ; ZNVER1-LABEL: test_sarx_i32: ; ZNVER1: # %bb.0: @@ -542,9 +542,9 @@ ; HASWELL-LABEL: test_sarx_i64: ; HASWELL: # %bb.0: ; HASWELL-NEXT: sarxq %rsi, %rdi, %rcx # sched: [1:0.50] -; HASWELL-NEXT: sarxq %rsi, (%rdx), %rax # sched: [1:0.50] +; HASWELL-NEXT: sarxq %rsi, (%rdx), %rax # sched: [6:0.50] ; HASWELL-NEXT: addq %rcx, %rax # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_sarx_i64: ; BROADWELL: # %bb.0: @@ -563,9 +563,9 @@ ; KNL-LABEL: test_sarx_i64: ; KNL: # %bb.0: ; KNL-NEXT: sarxq %rsi, %rdi, %rcx # sched: [1:0.50] -; KNL-NEXT: sarxq %rsi, (%rdx), %rax # sched: [1:0.50] +; KNL-NEXT: sarxq %rsi, (%rdx), %rax # sched: [6:0.50] ; KNL-NEXT: addq %rcx, %rax # sched: [1:0.25] -; KNL-NEXT: retq # sched: [2:1.00] +; KNL-NEXT: retq # sched: [7:1.00] ; ; ZNVER1-LABEL: test_sarx_i64: ; ZNVER1: # %bb.0: @@ -591,9 +591,9 @@ ; HASWELL-LABEL: test_shlx_i32: ; HASWELL: # %bb.0: ; HASWELL-NEXT: shlxl %esi, %edi, %ecx # sched: [1:0.50] -; HASWELL-NEXT: shlxl %esi, (%rdx), %eax # sched: [1:0.50] +; HASWELL-NEXT: shlxl %esi, (%rdx), %eax # sched: [6:0.50] ; HASWELL-NEXT: addl %ecx, %eax # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_shlx_i32: ; BROADWELL: # %bb.0: @@ -612,9 +612,9 @@ ; KNL-LABEL: test_shlx_i32: ; KNL: # %bb.0: ; KNL-NEXT: shlxl %esi, %edi, %ecx # sched: [1:0.50] -; KNL-NEXT: shlxl %esi, (%rdx), %eax # sched: [1:0.50] +; KNL-NEXT: shlxl %esi, (%rdx), %eax # sched: [6:0.50] ; KNL-NEXT: addl %ecx, %eax # sched: [1:0.25] -; KNL-NEXT: retq # sched: [2:1.00] +; KNL-NEXT: retq # sched: [7:1.00] ; ; ZNVER1-LABEL: test_shlx_i32: ; ZNVER1: # %bb.0: @@ -640,9 +640,9 @@ ; HASWELL-LABEL: test_shlx_i64: ; HASWELL: # %bb.0: ; HASWELL-NEXT: shlxq %rsi, %rdi, %rcx # sched: [1:0.50] -; HASWELL-NEXT: shlxq %rsi, (%rdx), %rax # sched: [1:0.50] +; HASWELL-NEXT: shlxq %rsi, (%rdx), %rax # sched: [6:0.50] ; HASWELL-NEXT: addq %rcx, %rax # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_shlx_i64: ; BROADWELL: # %bb.0: @@ -661,9 +661,9 @@ ; KNL-LABEL: test_shlx_i64: ; KNL: # %bb.0: ; KNL-NEXT: shlxq %rsi, %rdi, %rcx # sched: [1:0.50] -; KNL-NEXT: shlxq %rsi, (%rdx), %rax # sched: [1:0.50] +; KNL-NEXT: shlxq %rsi, (%rdx), %rax # sched: [6:0.50] ; KNL-NEXT: addq %rcx, %rax # sched: [1:0.25] -; KNL-NEXT: retq # sched: [2:1.00] +; KNL-NEXT: retq # sched: [7:1.00] ; ; ZNVER1-LABEL: test_shlx_i64: ; ZNVER1: # %bb.0: @@ -689,9 +689,9 @@ ; HASWELL-LABEL: test_shrx_i32: ; HASWELL: # %bb.0: ; HASWELL-NEXT: shrxl %esi, %edi, %ecx # sched: [1:0.50] -; HASWELL-NEXT: shrxl %esi, (%rdx), %eax # sched: [1:0.50] +; HASWELL-NEXT: shrxl %esi, (%rdx), %eax # sched: [6:0.50] ; HASWELL-NEXT: addl %ecx, %eax # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_shrx_i32: ; BROADWELL: # %bb.0: @@ -710,9 +710,9 @@ ; KNL-LABEL: test_shrx_i32: ; KNL: # %bb.0: ; KNL-NEXT: shrxl %esi, %edi, %ecx # sched: [1:0.50] -; KNL-NEXT: shrxl %esi, (%rdx), %eax # sched: [1:0.50] +; KNL-NEXT: shrxl %esi, (%rdx), %eax # sched: [6:0.50] ; KNL-NEXT: addl %ecx, %eax # sched: [1:0.25] -; KNL-NEXT: retq # sched: [2:1.00] +; KNL-NEXT: retq # sched: [7:1.00] ; ; ZNVER1-LABEL: test_shrx_i32: ; ZNVER1: # %bb.0: @@ -738,9 +738,9 @@ ; HASWELL-LABEL: test_shrx_i64: ; HASWELL: # %bb.0: ; HASWELL-NEXT: shrxq %rsi, %rdi, %rcx # sched: [1:0.50] -; HASWELL-NEXT: shrxq %rsi, (%rdx), %rax # sched: [1:0.50] +; HASWELL-NEXT: shrxq %rsi, (%rdx), %rax # sched: [6:0.50] ; HASWELL-NEXT: addq %rcx, %rax # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_shrx_i64: ; BROADWELL: # %bb.0: @@ -759,9 +759,9 @@ ; KNL-LABEL: test_shrx_i64: ; KNL: # %bb.0: ; KNL-NEXT: shrxq %rsi, %rdi, %rcx # sched: [1:0.50] -; KNL-NEXT: shrxq %rsi, (%rdx), %rax # sched: [1:0.50] +; KNL-NEXT: shrxq %rsi, (%rdx), %rax # sched: [6:0.50] ; KNL-NEXT: addq %rcx, %rax # sched: [1:0.25] -; KNL-NEXT: retq # sched: [2:1.00] +; KNL-NEXT: retq # sched: [7:1.00] ; ; ZNVER1-LABEL: test_shrx_i64: ; ZNVER1: # %bb.0: Index: test/CodeGen/X86/f16c-schedule.ll =================================================================== --- test/CodeGen/X86/f16c-schedule.ll +++ test/CodeGen/X86/f16c-schedule.ll @@ -24,10 +24,10 @@ ; ; HASWELL-LABEL: test_vcvtph2ps_128: ; HASWELL: # %bb.0: -; HASWELL-NEXT: vcvtph2ps (%rdi), %xmm1 # sched: [1:1.00] +; HASWELL-NEXT: vcvtph2ps (%rdi), %xmm1 # sched: [6:1.00] ; HASWELL-NEXT: vcvtph2ps %xmm0, %xmm0 # sched: [2:1.00] ; HASWELL-NEXT: vaddps %xmm0, %xmm1, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_vcvtph2ps_128: ; BROADWELL: # %bb.0: @@ -81,10 +81,10 @@ ; ; HASWELL-LABEL: test_vcvtph2ps_256: ; HASWELL: # %bb.0: -; HASWELL-NEXT: vcvtph2ps (%rdi), %ymm1 # sched: [1:1.00] +; HASWELL-NEXT: vcvtph2ps (%rdi), %ymm1 # sched: [7:1.00] ; HASWELL-NEXT: vcvtph2ps %xmm0, %ymm0 # sched: [2:1.00] ; HASWELL-NEXT: vaddps %ymm0, %ymm1, %ymm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_vcvtph2ps_256: ; BROADWELL: # %bb.0: @@ -137,8 +137,8 @@ ; HASWELL-LABEL: test_vcvtps2ph_128: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vcvtps2ph $0, %xmm0, %xmm0 # sched: [4:1.00] -; HASWELL-NEXT: vcvtps2ph $0, %xmm1, (%rdi) # sched: [4:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vcvtps2ph $0, %xmm1, (%rdi) # sched: [5:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_vcvtps2ph_128: ; BROADWELL: # %bb.0: @@ -189,9 +189,9 @@ ; HASWELL-LABEL: test_vcvtps2ph_256: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vcvtps2ph $0, %ymm0, %xmm0 # sched: [6:1.00] -; HASWELL-NEXT: vcvtps2ph $0, %ymm1, (%rdi) # sched: [6:1.00] +; HASWELL-NEXT: vcvtps2ph $0, %ymm1, (%rdi) # sched: [7:1.00] ; HASWELL-NEXT: vzeroupper # sched: [4:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_vcvtps2ph_256: ; BROADWELL: # %bb.0: Index: test/CodeGen/X86/fma-schedule.ll =================================================================== --- test/CodeGen/X86/fma-schedule.ll +++ test/CodeGen/X86/fma-schedule.ll @@ -18,15 +18,15 @@ define <2 x double> @test_vfmadd213pd(<2 x double> %a0, <2 x double> %a1, <2 x double> %a2, <2 x double> *%a3) { ; GENERIC-LABEL: test_vfmadd213pd: ; GENERIC: # %bb.0: -; GENERIC-NEXT: vfmadd213pd %xmm2, %xmm1, %xmm0 -; GENERIC-NEXT: vfmadd213pd (%rdi), %xmm1, %xmm0 +; GENERIC-NEXT: vfmadd213pd %xmm2, %xmm1, %xmm0 # sched: [5:0.50] +; GENERIC-NEXT: vfmadd213pd (%rdi), %xmm1, %xmm0 # sched: [5:0.50] ; GENERIC-NEXT: retq # sched: [1:1.00] ; ; HASWELL-LABEL: test_vfmadd213pd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vfmadd213pd %xmm2, %xmm1, %xmm0 # sched: [5:0.50] -; HASWELL-NEXT: vfmadd213pd (%rdi), %xmm1, %xmm0 # sched: [5:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vfmadd213pd (%rdi), %xmm1, %xmm0 # sched: [11:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_vfmadd213pd: ; BROADWELL: # %bb.0: @@ -43,8 +43,8 @@ ; KNL-LABEL: test_vfmadd213pd: ; KNL: # %bb.0: ; KNL-NEXT: vfmadd213pd %xmm2, %xmm1, %xmm0 # sched: [5:0.50] -; KNL-NEXT: vfmadd213pd (%rdi), %xmm1, %xmm0 # sched: [5:0.50] -; KNL-NEXT: retq # sched: [2:1.00] +; KNL-NEXT: vfmadd213pd (%rdi), %xmm1, %xmm0 # sched: [11:0.50] +; KNL-NEXT: retq # sched: [7:1.00] ; ; SKX-LABEL: test_vfmadd213pd: ; SKX: # %bb.0: @@ -54,8 +54,8 @@ ; ; ZNVER1-LABEL: test_vfmadd213pd: ; ZNVER1: # %bb.0: -; ZNVER1-NEXT: vfmadd213pd %xmm2, %xmm1, %xmm0 -; ZNVER1-NEXT: vfmadd213pd (%rdi), %xmm1, %xmm0 +; ZNVER1-NEXT: vfmadd213pd %xmm2, %xmm1, %xmm0 # sched: [5:0.50] +; ZNVER1-NEXT: vfmadd213pd (%rdi), %xmm1, %xmm0 # sched: [5:0.50] ; ZNVER1-NEXT: retq # sched: [1:0.50] %1 = call <2 x double> @llvm.x86.fma.vfmadd.pd(<2 x double> %a0, <2 x double> %a1, <2 x double> %a2) %2 = load <2 x double>, <2 x double> *%a3 @@ -66,15 +66,15 @@ define <4 x double> @test_vfmadd213pd_ymm(<4 x double> %a0, <4 x double> %a1, <4 x double> %a2, <4 x double> *%a3) { ; GENERIC-LABEL: test_vfmadd213pd_ymm: ; GENERIC: # %bb.0: -; GENERIC-NEXT: vfmadd213pd %ymm2, %ymm1, %ymm0 -; GENERIC-NEXT: vfmadd213pd (%rdi), %ymm1, %ymm0 +; GENERIC-NEXT: vfmadd213pd %ymm2, %ymm1, %ymm0 # sched: [5:0.50] +; GENERIC-NEXT: vfmadd213pd (%rdi), %ymm1, %ymm0 # sched: [5:0.50] ; GENERIC-NEXT: retq # sched: [1:1.00] ; ; HASWELL-LABEL: test_vfmadd213pd_ymm: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vfmadd213pd %ymm2, %ymm1, %ymm0 # sched: [5:0.50] -; HASWELL-NEXT: vfmadd213pd (%rdi), %ymm1, %ymm0 # sched: [5:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vfmadd213pd (%rdi), %ymm1, %ymm0 # sched: [12:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_vfmadd213pd_ymm: ; BROADWELL: # %bb.0: @@ -91,8 +91,8 @@ ; KNL-LABEL: test_vfmadd213pd_ymm: ; KNL: # %bb.0: ; KNL-NEXT: vfmadd213pd %ymm2, %ymm1, %ymm0 # sched: [5:0.50] -; KNL-NEXT: vfmadd213pd (%rdi), %ymm1, %ymm0 # sched: [5:0.50] -; KNL-NEXT: retq # sched: [2:1.00] +; KNL-NEXT: vfmadd213pd (%rdi), %ymm1, %ymm0 # sched: [12:0.50] +; KNL-NEXT: retq # sched: [7:1.00] ; ; SKX-LABEL: test_vfmadd213pd_ymm: ; SKX: # %bb.0: @@ -102,8 +102,8 @@ ; ; ZNVER1-LABEL: test_vfmadd213pd_ymm: ; ZNVER1: # %bb.0: -; ZNVER1-NEXT: vfmadd213pd %ymm2, %ymm1, %ymm0 -; ZNVER1-NEXT: vfmadd213pd (%rdi), %ymm1, %ymm0 +; ZNVER1-NEXT: vfmadd213pd %ymm2, %ymm1, %ymm0 # sched: [5:0.50] +; ZNVER1-NEXT: vfmadd213pd (%rdi), %ymm1, %ymm0 # sched: [5:0.50] ; ZNVER1-NEXT: retq # sched: [1:0.50] %1 = call <4 x double> @llvm.x86.fma.vfmadd.pd.256(<4 x double> %a0, <4 x double> %a1, <4 x double> %a2) %2 = load <4 x double>, <4 x double> *%a3 @@ -114,15 +114,15 @@ define <4 x float> @test_vfmadd213ps(<4 x float> %a0, <4 x float> %a1, <4 x float> %a2, <4 x float> *%a3) { ; GENERIC-LABEL: test_vfmadd213ps: ; GENERIC: # %bb.0: -; GENERIC-NEXT: vfmadd213ps %xmm2, %xmm1, %xmm0 -; GENERIC-NEXT: vfmadd213ps (%rdi), %xmm1, %xmm0 +; GENERIC-NEXT: vfmadd213ps %xmm2, %xmm1, %xmm0 # sched: [5:0.50] +; GENERIC-NEXT: vfmadd213ps (%rdi), %xmm1, %xmm0 # sched: [5:0.50] ; GENERIC-NEXT: retq # sched: [1:1.00] ; ; HASWELL-LABEL: test_vfmadd213ps: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vfmadd213ps %xmm2, %xmm1, %xmm0 # sched: [5:0.50] -; HASWELL-NEXT: vfmadd213ps (%rdi), %xmm1, %xmm0 # sched: [5:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vfmadd213ps (%rdi), %xmm1, %xmm0 # sched: [11:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_vfmadd213ps: ; BROADWELL: # %bb.0: @@ -139,8 +139,8 @@ ; KNL-LABEL: test_vfmadd213ps: ; KNL: # %bb.0: ; KNL-NEXT: vfmadd213ps %xmm2, %xmm1, %xmm0 # sched: [5:0.50] -; KNL-NEXT: vfmadd213ps (%rdi), %xmm1, %xmm0 # sched: [5:0.50] -; KNL-NEXT: retq # sched: [2:1.00] +; KNL-NEXT: vfmadd213ps (%rdi), %xmm1, %xmm0 # sched: [11:0.50] +; KNL-NEXT: retq # sched: [7:1.00] ; ; SKX-LABEL: test_vfmadd213ps: ; SKX: # %bb.0: @@ -150,8 +150,8 @@ ; ; ZNVER1-LABEL: test_vfmadd213ps: ; ZNVER1: # %bb.0: -; ZNVER1-NEXT: vfmadd213ps %xmm2, %xmm1, %xmm0 -; ZNVER1-NEXT: vfmadd213ps (%rdi), %xmm1, %xmm0 +; ZNVER1-NEXT: vfmadd213ps %xmm2, %xmm1, %xmm0 # sched: [5:0.50] +; ZNVER1-NEXT: vfmadd213ps (%rdi), %xmm1, %xmm0 # sched: [5:0.50] ; ZNVER1-NEXT: retq # sched: [1:0.50] %1 = call <4 x float> @llvm.x86.fma.vfmadd.ps(<4 x float> %a0, <4 x float> %a1, <4 x float> %a2) %2 = load <4 x float>, <4 x float> *%a3 @@ -162,15 +162,15 @@ define <8 x float> @test_vfmadd213ps_ymm(<8 x float> %a0, <8 x float> %a1, <8 x float> %a2, <8 x float> *%a3) { ; GENERIC-LABEL: test_vfmadd213ps_ymm: ; GENERIC: # %bb.0: -; GENERIC-NEXT: vfmadd213ps %ymm2, %ymm1, %ymm0 -; GENERIC-NEXT: vfmadd213ps (%rdi), %ymm1, %ymm0 +; GENERIC-NEXT: vfmadd213ps %ymm2, %ymm1, %ymm0 # sched: [5:0.50] +; GENERIC-NEXT: vfmadd213ps (%rdi), %ymm1, %ymm0 # sched: [5:0.50] ; GENERIC-NEXT: retq # sched: [1:1.00] ; ; HASWELL-LABEL: test_vfmadd213ps_ymm: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vfmadd213ps %ymm2, %ymm1, %ymm0 # sched: [5:0.50] -; HASWELL-NEXT: vfmadd213ps (%rdi), %ymm1, %ymm0 # sched: [5:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vfmadd213ps (%rdi), %ymm1, %ymm0 # sched: [12:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_vfmadd213ps_ymm: ; BROADWELL: # %bb.0: @@ -187,8 +187,8 @@ ; KNL-LABEL: test_vfmadd213ps_ymm: ; KNL: # %bb.0: ; KNL-NEXT: vfmadd213ps %ymm2, %ymm1, %ymm0 # sched: [5:0.50] -; KNL-NEXT: vfmadd213ps (%rdi), %ymm1, %ymm0 # sched: [5:0.50] -; KNL-NEXT: retq # sched: [2:1.00] +; KNL-NEXT: vfmadd213ps (%rdi), %ymm1, %ymm0 # sched: [12:0.50] +; KNL-NEXT: retq # sched: [7:1.00] ; ; SKX-LABEL: test_vfmadd213ps_ymm: ; SKX: # %bb.0: @@ -198,8 +198,8 @@ ; ; ZNVER1-LABEL: test_vfmadd213ps_ymm: ; ZNVER1: # %bb.0: -; ZNVER1-NEXT: vfmadd213ps %ymm2, %ymm1, %ymm0 -; ZNVER1-NEXT: vfmadd213ps (%rdi), %ymm1, %ymm0 +; ZNVER1-NEXT: vfmadd213ps %ymm2, %ymm1, %ymm0 # sched: [5:0.50] +; ZNVER1-NEXT: vfmadd213ps (%rdi), %ymm1, %ymm0 # sched: [5:0.50] ; ZNVER1-NEXT: retq # sched: [1:0.50] %1 = call <8 x float> @llvm.x86.fma.vfmadd.ps.256(<8 x float> %a0, <8 x float> %a1, <8 x float> %a2) %2 = load <8 x float>, <8 x float> *%a3 @@ -210,15 +210,15 @@ define <2 x double> @test_vfmadd213sd(<2 x double> %a0, <2 x double> %a1, <2 x double> %a2, <2 x double> *%a3) { ; GENERIC-LABEL: test_vfmadd213sd: ; GENERIC: # %bb.0: -; GENERIC-NEXT: vfmadd213sd %xmm2, %xmm1, %xmm0 -; GENERIC-NEXT: vfmadd213sd (%rdi), %xmm1, %xmm0 +; GENERIC-NEXT: vfmadd213sd %xmm2, %xmm1, %xmm0 # sched: [5:0.50] +; GENERIC-NEXT: vfmadd213sd (%rdi), %xmm1, %xmm0 # sched: [5:0.50] ; GENERIC-NEXT: retq # sched: [1:1.00] ; ; HASWELL-LABEL: test_vfmadd213sd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vfmadd213sd %xmm2, %xmm1, %xmm0 # sched: [5:0.50] -; HASWELL-NEXT: vfmadd213sd (%rdi), %xmm1, %xmm0 # sched: [5:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vfmadd213sd (%rdi), %xmm1, %xmm0 # sched: [10:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_vfmadd213sd: ; BROADWELL: # %bb.0: @@ -235,8 +235,8 @@ ; KNL-LABEL: test_vfmadd213sd: ; KNL: # %bb.0: ; KNL-NEXT: vfmadd213sd %xmm2, %xmm1, %xmm0 # sched: [5:0.50] -; KNL-NEXT: vfmadd213sd (%rdi), %xmm1, %xmm0 # sched: [5:0.50] -; KNL-NEXT: retq # sched: [2:1.00] +; KNL-NEXT: vfmadd213sd (%rdi), %xmm1, %xmm0 # sched: [10:0.50] +; KNL-NEXT: retq # sched: [7:1.00] ; ; SKX-LABEL: test_vfmadd213sd: ; SKX: # %bb.0: @@ -246,8 +246,8 @@ ; ; ZNVER1-LABEL: test_vfmadd213sd: ; ZNVER1: # %bb.0: -; ZNVER1-NEXT: vfmadd213sd %xmm2, %xmm1, %xmm0 -; ZNVER1-NEXT: vfmadd213sd (%rdi), %xmm1, %xmm0 +; ZNVER1-NEXT: vfmadd213sd %xmm2, %xmm1, %xmm0 # sched: [5:0.50] +; ZNVER1-NEXT: vfmadd213sd (%rdi), %xmm1, %xmm0 # sched: [5:0.50] ; ZNVER1-NEXT: retq # sched: [1:0.50] %1 = call <2 x double> @llvm.x86.fma.vfmadd.sd(<2 x double> %a0, <2 x double> %a1, <2 x double> %a2) %2 = load <2 x double>, <2 x double> *%a3 @@ -258,15 +258,15 @@ define <4 x float> @test_vfmadd213ss(<4 x float> %a0, <4 x float> %a1, <4 x float> %a2, <4 x float> *%a3) { ; GENERIC-LABEL: test_vfmadd213ss: ; GENERIC: # %bb.0: -; GENERIC-NEXT: vfmadd213ss %xmm2, %xmm1, %xmm0 -; GENERIC-NEXT: vfmadd213ss (%rdi), %xmm1, %xmm0 +; GENERIC-NEXT: vfmadd213ss %xmm2, %xmm1, %xmm0 # sched: [5:0.50] +; GENERIC-NEXT: vfmadd213ss (%rdi), %xmm1, %xmm0 # sched: [5:0.50] ; GENERIC-NEXT: retq # sched: [1:1.00] ; ; HASWELL-LABEL: test_vfmadd213ss: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vfmadd213ss %xmm2, %xmm1, %xmm0 # sched: [5:0.50] -; HASWELL-NEXT: vfmadd213ss (%rdi), %xmm1, %xmm0 # sched: [5:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vfmadd213ss (%rdi), %xmm1, %xmm0 # sched: [10:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_vfmadd213ss: ; BROADWELL: # %bb.0: @@ -283,8 +283,8 @@ ; KNL-LABEL: test_vfmadd213ss: ; KNL: # %bb.0: ; KNL-NEXT: vfmadd213ss %xmm2, %xmm1, %xmm0 # sched: [5:0.50] -; KNL-NEXT: vfmadd213ss (%rdi), %xmm1, %xmm0 # sched: [5:0.50] -; KNL-NEXT: retq # sched: [2:1.00] +; KNL-NEXT: vfmadd213ss (%rdi), %xmm1, %xmm0 # sched: [10:0.50] +; KNL-NEXT: retq # sched: [7:1.00] ; ; SKX-LABEL: test_vfmadd213ss: ; SKX: # %bb.0: @@ -294,8 +294,8 @@ ; ; ZNVER1-LABEL: test_vfmadd213ss: ; ZNVER1: # %bb.0: -; ZNVER1-NEXT: vfmadd213ss %xmm2, %xmm1, %xmm0 -; ZNVER1-NEXT: vfmadd213ss (%rdi), %xmm1, %xmm0 +; ZNVER1-NEXT: vfmadd213ss %xmm2, %xmm1, %xmm0 # sched: [5:0.50] +; ZNVER1-NEXT: vfmadd213ss (%rdi), %xmm1, %xmm0 # sched: [5:0.50] ; ZNVER1-NEXT: retq # sched: [1:0.50] %1 = call <4 x float> @llvm.x86.fma.vfmadd.ss(<4 x float> %a0, <4 x float> %a1, <4 x float> %a2) %2 = load <4 x float>, <4 x float> *%a3 @@ -318,15 +318,15 @@ define <2 x double> @test_vfmaddsubpd(<2 x double> %a0, <2 x double> %a1, <2 x double> %a2, <2 x double> *%a3) { ; GENERIC-LABEL: test_vfmaddsubpd: ; GENERIC: # %bb.0: -; GENERIC-NEXT: vfmaddsub213pd %xmm2, %xmm1, %xmm0 -; GENERIC-NEXT: vfmaddsub213pd (%rdi), %xmm1, %xmm0 +; GENERIC-NEXT: vfmaddsub213pd %xmm2, %xmm1, %xmm0 # sched: [5:0.50] +; GENERIC-NEXT: vfmaddsub213pd (%rdi), %xmm1, %xmm0 # sched: [5:0.50] ; GENERIC-NEXT: retq # sched: [1:1.00] ; ; HASWELL-LABEL: test_vfmaddsubpd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vfmaddsub213pd %xmm2, %xmm1, %xmm0 # sched: [5:0.50] -; HASWELL-NEXT: vfmaddsub213pd (%rdi), %xmm1, %xmm0 # sched: [5:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vfmaddsub213pd (%rdi), %xmm1, %xmm0 # sched: [11:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_vfmaddsubpd: ; BROADWELL: # %bb.0: @@ -343,8 +343,8 @@ ; KNL-LABEL: test_vfmaddsubpd: ; KNL: # %bb.0: ; KNL-NEXT: vfmaddsub213pd %xmm2, %xmm1, %xmm0 # sched: [5:0.50] -; KNL-NEXT: vfmaddsub213pd (%rdi), %xmm1, %xmm0 # sched: [5:0.50] -; KNL-NEXT: retq # sched: [2:1.00] +; KNL-NEXT: vfmaddsub213pd (%rdi), %xmm1, %xmm0 # sched: [11:0.50] +; KNL-NEXT: retq # sched: [7:1.00] ; ; SKX-LABEL: test_vfmaddsubpd: ; SKX: # %bb.0: @@ -354,8 +354,8 @@ ; ; ZNVER1-LABEL: test_vfmaddsubpd: ; ZNVER1: # %bb.0: -; ZNVER1-NEXT: vfmaddsub213pd %xmm2, %xmm1, %xmm0 -; ZNVER1-NEXT: vfmaddsub213pd (%rdi), %xmm1, %xmm0 +; ZNVER1-NEXT: vfmaddsub213pd %xmm2, %xmm1, %xmm0 # sched: [5:0.50] +; ZNVER1-NEXT: vfmaddsub213pd (%rdi), %xmm1, %xmm0 # sched: [5:0.50] ; ZNVER1-NEXT: retq # sched: [1:0.50] %1 = call <2 x double> @llvm.x86.fma.vfmaddsub.pd(<2 x double> %a0, <2 x double> %a1, <2 x double> %a2) %2 = load <2 x double>, <2 x double> *%a3 @@ -366,15 +366,15 @@ define <4 x double> @test_vfmaddsubpd_ymm(<4 x double> %a0, <4 x double> %a1, <4 x double> %a4, <4 x double> *%a3) { ; GENERIC-LABEL: test_vfmaddsubpd_ymm: ; GENERIC: # %bb.0: -; GENERIC-NEXT: vfmaddsub213pd %ymm2, %ymm1, %ymm0 -; GENERIC-NEXT: vfmaddsub213pd (%rdi), %ymm1, %ymm0 +; GENERIC-NEXT: vfmaddsub213pd %ymm2, %ymm1, %ymm0 # sched: [5:0.50] +; GENERIC-NEXT: vfmaddsub213pd (%rdi), %ymm1, %ymm0 # sched: [5:0.50] ; GENERIC-NEXT: retq # sched: [1:1.00] ; ; HASWELL-LABEL: test_vfmaddsubpd_ymm: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vfmaddsub213pd %ymm2, %ymm1, %ymm0 # sched: [5:0.50] -; HASWELL-NEXT: vfmaddsub213pd (%rdi), %ymm1, %ymm0 # sched: [5:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vfmaddsub213pd (%rdi), %ymm1, %ymm0 # sched: [12:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_vfmaddsubpd_ymm: ; BROADWELL: # %bb.0: @@ -391,8 +391,8 @@ ; KNL-LABEL: test_vfmaddsubpd_ymm: ; KNL: # %bb.0: ; KNL-NEXT: vfmaddsub213pd %ymm2, %ymm1, %ymm0 # sched: [5:0.50] -; KNL-NEXT: vfmaddsub213pd (%rdi), %ymm1, %ymm0 # sched: [5:0.50] -; KNL-NEXT: retq # sched: [2:1.00] +; KNL-NEXT: vfmaddsub213pd (%rdi), %ymm1, %ymm0 # sched: [12:0.50] +; KNL-NEXT: retq # sched: [7:1.00] ; ; SKX-LABEL: test_vfmaddsubpd_ymm: ; SKX: # %bb.0: @@ -402,8 +402,8 @@ ; ; ZNVER1-LABEL: test_vfmaddsubpd_ymm: ; ZNVER1: # %bb.0: -; ZNVER1-NEXT: vfmaddsub213pd %ymm2, %ymm1, %ymm0 -; ZNVER1-NEXT: vfmaddsub213pd (%rdi), %ymm1, %ymm0 +; ZNVER1-NEXT: vfmaddsub213pd %ymm2, %ymm1, %ymm0 # sched: [5:0.50] +; ZNVER1-NEXT: vfmaddsub213pd (%rdi), %ymm1, %ymm0 # sched: [5:0.50] ; ZNVER1-NEXT: retq # sched: [1:0.50] %1 = call <4 x double> @llvm.x86.fma.vfmaddsub.pd.256(<4 x double> %a0, <4 x double> %a1, <4 x double> %a4) %2 = load <4 x double>, <4 x double> *%a3 @@ -414,15 +414,15 @@ define <4 x float> @test_vfmaddsubps(<4 x float> %a0, <4 x float> %a1, <4 x float> %a4, <4 x float> *%a3) { ; GENERIC-LABEL: test_vfmaddsubps: ; GENERIC: # %bb.0: -; GENERIC-NEXT: vfmaddsub213ps %xmm2, %xmm1, %xmm0 -; GENERIC-NEXT: vfmaddsub213ps (%rdi), %xmm1, %xmm0 +; GENERIC-NEXT: vfmaddsub213ps %xmm2, %xmm1, %xmm0 # sched: [5:0.50] +; GENERIC-NEXT: vfmaddsub213ps (%rdi), %xmm1, %xmm0 # sched: [5:0.50] ; GENERIC-NEXT: retq # sched: [1:1.00] ; ; HASWELL-LABEL: test_vfmaddsubps: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vfmaddsub213ps %xmm2, %xmm1, %xmm0 # sched: [5:0.50] -; HASWELL-NEXT: vfmaddsub213ps (%rdi), %xmm1, %xmm0 # sched: [5:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vfmaddsub213ps (%rdi), %xmm1, %xmm0 # sched: [11:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_vfmaddsubps: ; BROADWELL: # %bb.0: @@ -439,8 +439,8 @@ ; KNL-LABEL: test_vfmaddsubps: ; KNL: # %bb.0: ; KNL-NEXT: vfmaddsub213ps %xmm2, %xmm1, %xmm0 # sched: [5:0.50] -; KNL-NEXT: vfmaddsub213ps (%rdi), %xmm1, %xmm0 # sched: [5:0.50] -; KNL-NEXT: retq # sched: [2:1.00] +; KNL-NEXT: vfmaddsub213ps (%rdi), %xmm1, %xmm0 # sched: [11:0.50] +; KNL-NEXT: retq # sched: [7:1.00] ; ; SKX-LABEL: test_vfmaddsubps: ; SKX: # %bb.0: @@ -450,8 +450,8 @@ ; ; ZNVER1-LABEL: test_vfmaddsubps: ; ZNVER1: # %bb.0: -; ZNVER1-NEXT: vfmaddsub213ps %xmm2, %xmm1, %xmm0 -; ZNVER1-NEXT: vfmaddsub213ps (%rdi), %xmm1, %xmm0 +; ZNVER1-NEXT: vfmaddsub213ps %xmm2, %xmm1, %xmm0 # sched: [5:0.50] +; ZNVER1-NEXT: vfmaddsub213ps (%rdi), %xmm1, %xmm0 # sched: [5:0.50] ; ZNVER1-NEXT: retq # sched: [1:0.50] %1 = call <4 x float> @llvm.x86.fma.vfmaddsub.ps(<4 x float> %a0, <4 x float> %a1, <4 x float> %a4) %2 = load <4 x float>, <4 x float> *%a3 @@ -462,15 +462,15 @@ define <8 x float> @test_vfmaddsubps_ymm(<8 x float> %a0, <8 x float> %a1, <8 x float> %a8, <8 x float> *%a3) { ; GENERIC-LABEL: test_vfmaddsubps_ymm: ; GENERIC: # %bb.0: -; GENERIC-NEXT: vfmaddsub213ps %ymm2, %ymm1, %ymm0 -; GENERIC-NEXT: vfmaddsub213ps (%rdi), %ymm1, %ymm0 +; GENERIC-NEXT: vfmaddsub213ps %ymm2, %ymm1, %ymm0 # sched: [5:0.50] +; GENERIC-NEXT: vfmaddsub213ps (%rdi), %ymm1, %ymm0 # sched: [5:0.50] ; GENERIC-NEXT: retq # sched: [1:1.00] ; ; HASWELL-LABEL: test_vfmaddsubps_ymm: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vfmaddsub213ps %ymm2, %ymm1, %ymm0 # sched: [5:0.50] -; HASWELL-NEXT: vfmaddsub213ps (%rdi), %ymm1, %ymm0 # sched: [5:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vfmaddsub213ps (%rdi), %ymm1, %ymm0 # sched: [12:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_vfmaddsubps_ymm: ; BROADWELL: # %bb.0: @@ -487,8 +487,8 @@ ; KNL-LABEL: test_vfmaddsubps_ymm: ; KNL: # %bb.0: ; KNL-NEXT: vfmaddsub213ps %ymm2, %ymm1, %ymm0 # sched: [5:0.50] -; KNL-NEXT: vfmaddsub213ps (%rdi), %ymm1, %ymm0 # sched: [5:0.50] -; KNL-NEXT: retq # sched: [2:1.00] +; KNL-NEXT: vfmaddsub213ps (%rdi), %ymm1, %ymm0 # sched: [12:0.50] +; KNL-NEXT: retq # sched: [7:1.00] ; ; SKX-LABEL: test_vfmaddsubps_ymm: ; SKX: # %bb.0: @@ -498,8 +498,8 @@ ; ; ZNVER1-LABEL: test_vfmaddsubps_ymm: ; ZNVER1: # %bb.0: -; ZNVER1-NEXT: vfmaddsub213ps %ymm2, %ymm1, %ymm0 -; ZNVER1-NEXT: vfmaddsub213ps (%rdi), %ymm1, %ymm0 +; ZNVER1-NEXT: vfmaddsub213ps %ymm2, %ymm1, %ymm0 # sched: [5:0.50] +; ZNVER1-NEXT: vfmaddsub213ps (%rdi), %ymm1, %ymm0 # sched: [5:0.50] ; ZNVER1-NEXT: retq # sched: [1:0.50] %1 = call <8 x float> @llvm.x86.fma.vfmaddsub.ps.256(<8 x float> %a0, <8 x float> %a1, <8 x float> %a8) %2 = load <8 x float>, <8 x float> *%a3 @@ -522,15 +522,15 @@ define <2 x double> @test_vfmsubaddpd(<2 x double> %a0, <2 x double> %a1, <2 x double> %a2, <2 x double> *%a3) { ; GENERIC-LABEL: test_vfmsubaddpd: ; GENERIC: # %bb.0: -; GENERIC-NEXT: vfmsubadd213pd %xmm2, %xmm1, %xmm0 -; GENERIC-NEXT: vfmsubadd213pd (%rdi), %xmm1, %xmm0 +; GENERIC-NEXT: vfmsubadd213pd %xmm2, %xmm1, %xmm0 # sched: [5:0.50] +; GENERIC-NEXT: vfmsubadd213pd (%rdi), %xmm1, %xmm0 # sched: [5:0.50] ; GENERIC-NEXT: retq # sched: [1:1.00] ; ; HASWELL-LABEL: test_vfmsubaddpd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vfmsubadd213pd %xmm2, %xmm1, %xmm0 # sched: [5:0.50] -; HASWELL-NEXT: vfmsubadd213pd (%rdi), %xmm1, %xmm0 # sched: [5:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vfmsubadd213pd (%rdi), %xmm1, %xmm0 # sched: [11:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_vfmsubaddpd: ; BROADWELL: # %bb.0: @@ -547,8 +547,8 @@ ; KNL-LABEL: test_vfmsubaddpd: ; KNL: # %bb.0: ; KNL-NEXT: vfmsubadd213pd %xmm2, %xmm1, %xmm0 # sched: [5:0.50] -; KNL-NEXT: vfmsubadd213pd (%rdi), %xmm1, %xmm0 # sched: [5:0.50] -; KNL-NEXT: retq # sched: [2:1.00] +; KNL-NEXT: vfmsubadd213pd (%rdi), %xmm1, %xmm0 # sched: [11:0.50] +; KNL-NEXT: retq # sched: [7:1.00] ; ; SKX-LABEL: test_vfmsubaddpd: ; SKX: # %bb.0: @@ -558,8 +558,8 @@ ; ; ZNVER1-LABEL: test_vfmsubaddpd: ; ZNVER1: # %bb.0: -; ZNVER1-NEXT: vfmsubadd213pd %xmm2, %xmm1, %xmm0 -; ZNVER1-NEXT: vfmsubadd213pd (%rdi), %xmm1, %xmm0 +; ZNVER1-NEXT: vfmsubadd213pd %xmm2, %xmm1, %xmm0 # sched: [5:0.50] +; ZNVER1-NEXT: vfmsubadd213pd (%rdi), %xmm1, %xmm0 # sched: [5:0.50] ; ZNVER1-NEXT: retq # sched: [1:0.50] %1 = call <2 x double> @llvm.x86.fma.vfmsubadd.pd(<2 x double> %a0, <2 x double> %a1, <2 x double> %a2) %2 = load <2 x double>, <2 x double> *%a3 @@ -570,15 +570,15 @@ define <4 x double> @test_vfmsubaddpd_ymm(<4 x double> %a0, <4 x double> %a1, <4 x double> %a4, <4 x double> *%a3) { ; GENERIC-LABEL: test_vfmsubaddpd_ymm: ; GENERIC: # %bb.0: -; GENERIC-NEXT: vfmsubadd213pd %ymm2, %ymm1, %ymm0 -; GENERIC-NEXT: vfmsubadd213pd (%rdi), %ymm1, %ymm0 +; GENERIC-NEXT: vfmsubadd213pd %ymm2, %ymm1, %ymm0 # sched: [5:0.50] +; GENERIC-NEXT: vfmsubadd213pd (%rdi), %ymm1, %ymm0 # sched: [5:0.50] ; GENERIC-NEXT: retq # sched: [1:1.00] ; ; HASWELL-LABEL: test_vfmsubaddpd_ymm: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vfmsubadd213pd %ymm2, %ymm1, %ymm0 # sched: [5:0.50] -; HASWELL-NEXT: vfmsubadd213pd (%rdi), %ymm1, %ymm0 # sched: [5:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vfmsubadd213pd (%rdi), %ymm1, %ymm0 # sched: [12:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_vfmsubaddpd_ymm: ; BROADWELL: # %bb.0: @@ -595,8 +595,8 @@ ; KNL-LABEL: test_vfmsubaddpd_ymm: ; KNL: # %bb.0: ; KNL-NEXT: vfmsubadd213pd %ymm2, %ymm1, %ymm0 # sched: [5:0.50] -; KNL-NEXT: vfmsubadd213pd (%rdi), %ymm1, %ymm0 # sched: [5:0.50] -; KNL-NEXT: retq # sched: [2:1.00] +; KNL-NEXT: vfmsubadd213pd (%rdi), %ymm1, %ymm0 # sched: [12:0.50] +; KNL-NEXT: retq # sched: [7:1.00] ; ; SKX-LABEL: test_vfmsubaddpd_ymm: ; SKX: # %bb.0: @@ -606,8 +606,8 @@ ; ; ZNVER1-LABEL: test_vfmsubaddpd_ymm: ; ZNVER1: # %bb.0: -; ZNVER1-NEXT: vfmsubadd213pd %ymm2, %ymm1, %ymm0 -; ZNVER1-NEXT: vfmsubadd213pd (%rdi), %ymm1, %ymm0 +; ZNVER1-NEXT: vfmsubadd213pd %ymm2, %ymm1, %ymm0 # sched: [5:0.50] +; ZNVER1-NEXT: vfmsubadd213pd (%rdi), %ymm1, %ymm0 # sched: [5:0.50] ; ZNVER1-NEXT: retq # sched: [1:0.50] %1 = call <4 x double> @llvm.x86.fma.vfmsubadd.pd.256(<4 x double> %a0, <4 x double> %a1, <4 x double> %a4) %2 = load <4 x double>, <4 x double> *%a3 @@ -618,15 +618,15 @@ define <4 x float> @test_vfmsubaddps(<4 x float> %a0, <4 x float> %a1, <4 x float> %a4, <4 x float> *%a3) { ; GENERIC-LABEL: test_vfmsubaddps: ; GENERIC: # %bb.0: -; GENERIC-NEXT: vfmsubadd213ps %xmm2, %xmm1, %xmm0 -; GENERIC-NEXT: vfmsubadd213ps (%rdi), %xmm1, %xmm0 +; GENERIC-NEXT: vfmsubadd213ps %xmm2, %xmm1, %xmm0 # sched: [5:0.50] +; GENERIC-NEXT: vfmsubadd213ps (%rdi), %xmm1, %xmm0 # sched: [5:0.50] ; GENERIC-NEXT: retq # sched: [1:1.00] ; ; HASWELL-LABEL: test_vfmsubaddps: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vfmsubadd213ps %xmm2, %xmm1, %xmm0 # sched: [5:0.50] -; HASWELL-NEXT: vfmsubadd213ps (%rdi), %xmm1, %xmm0 # sched: [5:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vfmsubadd213ps (%rdi), %xmm1, %xmm0 # sched: [11:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_vfmsubaddps: ; BROADWELL: # %bb.0: @@ -643,8 +643,8 @@ ; KNL-LABEL: test_vfmsubaddps: ; KNL: # %bb.0: ; KNL-NEXT: vfmsubadd213ps %xmm2, %xmm1, %xmm0 # sched: [5:0.50] -; KNL-NEXT: vfmsubadd213ps (%rdi), %xmm1, %xmm0 # sched: [5:0.50] -; KNL-NEXT: retq # sched: [2:1.00] +; KNL-NEXT: vfmsubadd213ps (%rdi), %xmm1, %xmm0 # sched: [11:0.50] +; KNL-NEXT: retq # sched: [7:1.00] ; ; SKX-LABEL: test_vfmsubaddps: ; SKX: # %bb.0: @@ -654,8 +654,8 @@ ; ; ZNVER1-LABEL: test_vfmsubaddps: ; ZNVER1: # %bb.0: -; ZNVER1-NEXT: vfmsubadd213ps %xmm2, %xmm1, %xmm0 -; ZNVER1-NEXT: vfmsubadd213ps (%rdi), %xmm1, %xmm0 +; ZNVER1-NEXT: vfmsubadd213ps %xmm2, %xmm1, %xmm0 # sched: [5:0.50] +; ZNVER1-NEXT: vfmsubadd213ps (%rdi), %xmm1, %xmm0 # sched: [5:0.50] ; ZNVER1-NEXT: retq # sched: [1:0.50] %1 = call <4 x float> @llvm.x86.fma.vfmsubadd.ps(<4 x float> %a0, <4 x float> %a1, <4 x float> %a4) %2 = load <4 x float>, <4 x float> *%a3 @@ -666,15 +666,15 @@ define <8 x float> @test_vfmsubaddps_ymm(<8 x float> %a0, <8 x float> %a1, <8 x float> %a8, <8 x float> *%a3) { ; GENERIC-LABEL: test_vfmsubaddps_ymm: ; GENERIC: # %bb.0: -; GENERIC-NEXT: vfmsubadd213ps %ymm2, %ymm1, %ymm0 -; GENERIC-NEXT: vfmsubadd213ps (%rdi), %ymm1, %ymm0 +; GENERIC-NEXT: vfmsubadd213ps %ymm2, %ymm1, %ymm0 # sched: [5:0.50] +; GENERIC-NEXT: vfmsubadd213ps (%rdi), %ymm1, %ymm0 # sched: [5:0.50] ; GENERIC-NEXT: retq # sched: [1:1.00] ; ; HASWELL-LABEL: test_vfmsubaddps_ymm: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vfmsubadd213ps %ymm2, %ymm1, %ymm0 # sched: [5:0.50] -; HASWELL-NEXT: vfmsubadd213ps (%rdi), %ymm1, %ymm0 # sched: [5:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vfmsubadd213ps (%rdi), %ymm1, %ymm0 # sched: [12:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_vfmsubaddps_ymm: ; BROADWELL: # %bb.0: @@ -691,8 +691,8 @@ ; KNL-LABEL: test_vfmsubaddps_ymm: ; KNL: # %bb.0: ; KNL-NEXT: vfmsubadd213ps %ymm2, %ymm1, %ymm0 # sched: [5:0.50] -; KNL-NEXT: vfmsubadd213ps (%rdi), %ymm1, %ymm0 # sched: [5:0.50] -; KNL-NEXT: retq # sched: [2:1.00] +; KNL-NEXT: vfmsubadd213ps (%rdi), %ymm1, %ymm0 # sched: [12:0.50] +; KNL-NEXT: retq # sched: [7:1.00] ; ; SKX-LABEL: test_vfmsubaddps_ymm: ; SKX: # %bb.0: @@ -702,8 +702,8 @@ ; ; ZNVER1-LABEL: test_vfmsubaddps_ymm: ; ZNVER1: # %bb.0: -; ZNVER1-NEXT: vfmsubadd213ps %ymm2, %ymm1, %ymm0 -; ZNVER1-NEXT: vfmsubadd213ps (%rdi), %ymm1, %ymm0 +; ZNVER1-NEXT: vfmsubadd213ps %ymm2, %ymm1, %ymm0 # sched: [5:0.50] +; ZNVER1-NEXT: vfmsubadd213ps (%rdi), %ymm1, %ymm0 # sched: [5:0.50] ; ZNVER1-NEXT: retq # sched: [1:0.50] %1 = call <8 x float> @llvm.x86.fma.vfmsubadd.ps.256(<8 x float> %a0, <8 x float> %a1, <8 x float> %a8) %2 = load <8 x float>, <8 x float> *%a3 @@ -726,15 +726,15 @@ define <2 x double> @test_vfmsub213pd(<2 x double> %a0, <2 x double> %a1, <2 x double> %a2, <2 x double> *%a3) { ; GENERIC-LABEL: test_vfmsub213pd: ; GENERIC: # %bb.0: -; GENERIC-NEXT: vfmsub213pd %xmm2, %xmm1, %xmm0 -; GENERIC-NEXT: vfmsub213pd (%rdi), %xmm1, %xmm0 +; GENERIC-NEXT: vfmsub213pd %xmm2, %xmm1, %xmm0 # sched: [5:0.50] +; GENERIC-NEXT: vfmsub213pd (%rdi), %xmm1, %xmm0 # sched: [5:0.50] ; GENERIC-NEXT: retq # sched: [1:1.00] ; ; HASWELL-LABEL: test_vfmsub213pd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vfmsub213pd %xmm2, %xmm1, %xmm0 # sched: [5:0.50] -; HASWELL-NEXT: vfmsub213pd (%rdi), %xmm1, %xmm0 # sched: [5:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vfmsub213pd (%rdi), %xmm1, %xmm0 # sched: [11:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_vfmsub213pd: ; BROADWELL: # %bb.0: @@ -751,8 +751,8 @@ ; KNL-LABEL: test_vfmsub213pd: ; KNL: # %bb.0: ; KNL-NEXT: vfmsub213pd %xmm2, %xmm1, %xmm0 # sched: [5:0.50] -; KNL-NEXT: vfmsub213pd (%rdi), %xmm1, %xmm0 # sched: [5:0.50] -; KNL-NEXT: retq # sched: [2:1.00] +; KNL-NEXT: vfmsub213pd (%rdi), %xmm1, %xmm0 # sched: [11:0.50] +; KNL-NEXT: retq # sched: [7:1.00] ; ; SKX-LABEL: test_vfmsub213pd: ; SKX: # %bb.0: @@ -762,8 +762,8 @@ ; ; ZNVER1-LABEL: test_vfmsub213pd: ; ZNVER1: # %bb.0: -; ZNVER1-NEXT: vfmsub213pd %xmm2, %xmm1, %xmm0 -; ZNVER1-NEXT: vfmsub213pd (%rdi), %xmm1, %xmm0 +; ZNVER1-NEXT: vfmsub213pd %xmm2, %xmm1, %xmm0 # sched: [5:0.50] +; ZNVER1-NEXT: vfmsub213pd (%rdi), %xmm1, %xmm0 # sched: [5:0.50] ; ZNVER1-NEXT: retq # sched: [1:0.50] %1 = call <2 x double> @llvm.x86.fma.vfmsub.pd(<2 x double> %a0, <2 x double> %a1, <2 x double> %a2) %2 = load <2 x double>, <2 x double> *%a3 @@ -774,15 +774,15 @@ define <4 x double> @test_vfmsub213pd_ymm(<4 x double> %a0, <4 x double> %a1, <4 x double> %a2, <4 x double> *%a3) { ; GENERIC-LABEL: test_vfmsub213pd_ymm: ; GENERIC: # %bb.0: -; GENERIC-NEXT: vfmsub213pd %ymm2, %ymm1, %ymm0 -; GENERIC-NEXT: vfmsub213pd (%rdi), %ymm1, %ymm0 +; GENERIC-NEXT: vfmsub213pd %ymm2, %ymm1, %ymm0 # sched: [5:0.50] +; GENERIC-NEXT: vfmsub213pd (%rdi), %ymm1, %ymm0 # sched: [5:0.50] ; GENERIC-NEXT: retq # sched: [1:1.00] ; ; HASWELL-LABEL: test_vfmsub213pd_ymm: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vfmsub213pd %ymm2, %ymm1, %ymm0 # sched: [5:0.50] -; HASWELL-NEXT: vfmsub213pd (%rdi), %ymm1, %ymm0 # sched: [5:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vfmsub213pd (%rdi), %ymm1, %ymm0 # sched: [12:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_vfmsub213pd_ymm: ; BROADWELL: # %bb.0: @@ -799,8 +799,8 @@ ; KNL-LABEL: test_vfmsub213pd_ymm: ; KNL: # %bb.0: ; KNL-NEXT: vfmsub213pd %ymm2, %ymm1, %ymm0 # sched: [5:0.50] -; KNL-NEXT: vfmsub213pd (%rdi), %ymm1, %ymm0 # sched: [5:0.50] -; KNL-NEXT: retq # sched: [2:1.00] +; KNL-NEXT: vfmsub213pd (%rdi), %ymm1, %ymm0 # sched: [12:0.50] +; KNL-NEXT: retq # sched: [7:1.00] ; ; SKX-LABEL: test_vfmsub213pd_ymm: ; SKX: # %bb.0: @@ -810,8 +810,8 @@ ; ; ZNVER1-LABEL: test_vfmsub213pd_ymm: ; ZNVER1: # %bb.0: -; ZNVER1-NEXT: vfmsub213pd %ymm2, %ymm1, %ymm0 -; ZNVER1-NEXT: vfmsub213pd (%rdi), %ymm1, %ymm0 +; ZNVER1-NEXT: vfmsub213pd %ymm2, %ymm1, %ymm0 # sched: [5:0.50] +; ZNVER1-NEXT: vfmsub213pd (%rdi), %ymm1, %ymm0 # sched: [5:0.50] ; ZNVER1-NEXT: retq # sched: [1:0.50] %1 = call <4 x double> @llvm.x86.fma.vfmsub.pd.256(<4 x double> %a0, <4 x double> %a1, <4 x double> %a2) %2 = load <4 x double>, <4 x double> *%a3 @@ -822,15 +822,15 @@ define <4 x float> @test_vfmsub213ps(<4 x float> %a0, <4 x float> %a1, <4 x float> %a2, <4 x float> *%a3) { ; GENERIC-LABEL: test_vfmsub213ps: ; GENERIC: # %bb.0: -; GENERIC-NEXT: vfmsub213ps %xmm2, %xmm1, %xmm0 -; GENERIC-NEXT: vfmsub213ps (%rdi), %xmm1, %xmm0 +; GENERIC-NEXT: vfmsub213ps %xmm2, %xmm1, %xmm0 # sched: [5:0.50] +; GENERIC-NEXT: vfmsub213ps (%rdi), %xmm1, %xmm0 # sched: [5:0.50] ; GENERIC-NEXT: retq # sched: [1:1.00] ; ; HASWELL-LABEL: test_vfmsub213ps: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vfmsub213ps %xmm2, %xmm1, %xmm0 # sched: [5:0.50] -; HASWELL-NEXT: vfmsub213ps (%rdi), %xmm1, %xmm0 # sched: [5:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vfmsub213ps (%rdi), %xmm1, %xmm0 # sched: [11:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_vfmsub213ps: ; BROADWELL: # %bb.0: @@ -847,8 +847,8 @@ ; KNL-LABEL: test_vfmsub213ps: ; KNL: # %bb.0: ; KNL-NEXT: vfmsub213ps %xmm2, %xmm1, %xmm0 # sched: [5:0.50] -; KNL-NEXT: vfmsub213ps (%rdi), %xmm1, %xmm0 # sched: [5:0.50] -; KNL-NEXT: retq # sched: [2:1.00] +; KNL-NEXT: vfmsub213ps (%rdi), %xmm1, %xmm0 # sched: [11:0.50] +; KNL-NEXT: retq # sched: [7:1.00] ; ; SKX-LABEL: test_vfmsub213ps: ; SKX: # %bb.0: @@ -858,8 +858,8 @@ ; ; ZNVER1-LABEL: test_vfmsub213ps: ; ZNVER1: # %bb.0: -; ZNVER1-NEXT: vfmsub213ps %xmm2, %xmm1, %xmm0 -; ZNVER1-NEXT: vfmsub213ps (%rdi), %xmm1, %xmm0 +; ZNVER1-NEXT: vfmsub213ps %xmm2, %xmm1, %xmm0 # sched: [5:0.50] +; ZNVER1-NEXT: vfmsub213ps (%rdi), %xmm1, %xmm0 # sched: [5:0.50] ; ZNVER1-NEXT: retq # sched: [1:0.50] %1 = call <4 x float> @llvm.x86.fma.vfmsub.ps(<4 x float> %a0, <4 x float> %a1, <4 x float> %a2) %2 = load <4 x float>, <4 x float> *%a3 @@ -870,15 +870,15 @@ define <8 x float> @test_vfmsub213ps_ymm(<8 x float> %a0, <8 x float> %a1, <8 x float> %a2, <8 x float> *%a3) { ; GENERIC-LABEL: test_vfmsub213ps_ymm: ; GENERIC: # %bb.0: -; GENERIC-NEXT: vfmsub213ps %ymm2, %ymm1, %ymm0 -; GENERIC-NEXT: vfmsub213ps (%rdi), %ymm1, %ymm0 +; GENERIC-NEXT: vfmsub213ps %ymm2, %ymm1, %ymm0 # sched: [5:0.50] +; GENERIC-NEXT: vfmsub213ps (%rdi), %ymm1, %ymm0 # sched: [5:0.50] ; GENERIC-NEXT: retq # sched: [1:1.00] ; ; HASWELL-LABEL: test_vfmsub213ps_ymm: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vfmsub213ps %ymm2, %ymm1, %ymm0 # sched: [5:0.50] -; HASWELL-NEXT: vfmsub213ps (%rdi), %ymm1, %ymm0 # sched: [5:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vfmsub213ps (%rdi), %ymm1, %ymm0 # sched: [12:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_vfmsub213ps_ymm: ; BROADWELL: # %bb.0: @@ -895,8 +895,8 @@ ; KNL-LABEL: test_vfmsub213ps_ymm: ; KNL: # %bb.0: ; KNL-NEXT: vfmsub213ps %ymm2, %ymm1, %ymm0 # sched: [5:0.50] -; KNL-NEXT: vfmsub213ps (%rdi), %ymm1, %ymm0 # sched: [5:0.50] -; KNL-NEXT: retq # sched: [2:1.00] +; KNL-NEXT: vfmsub213ps (%rdi), %ymm1, %ymm0 # sched: [12:0.50] +; KNL-NEXT: retq # sched: [7:1.00] ; ; SKX-LABEL: test_vfmsub213ps_ymm: ; SKX: # %bb.0: @@ -906,8 +906,8 @@ ; ; ZNVER1-LABEL: test_vfmsub213ps_ymm: ; ZNVER1: # %bb.0: -; ZNVER1-NEXT: vfmsub213ps %ymm2, %ymm1, %ymm0 -; ZNVER1-NEXT: vfmsub213ps (%rdi), %ymm1, %ymm0 +; ZNVER1-NEXT: vfmsub213ps %ymm2, %ymm1, %ymm0 # sched: [5:0.50] +; ZNVER1-NEXT: vfmsub213ps (%rdi), %ymm1, %ymm0 # sched: [5:0.50] ; ZNVER1-NEXT: retq # sched: [1:0.50] %1 = call <8 x float> @llvm.x86.fma.vfmsub.ps.256(<8 x float> %a0, <8 x float> %a1, <8 x float> %a2) %2 = load <8 x float>, <8 x float> *%a3 @@ -918,15 +918,15 @@ define <2 x double> @test_vfmsub213sd(<2 x double> %a0, <2 x double> %a1, <2 x double> %a2, <2 x double> *%a3) { ; GENERIC-LABEL: test_vfmsub213sd: ; GENERIC: # %bb.0: -; GENERIC-NEXT: vfmsub213sd %xmm2, %xmm1, %xmm0 -; GENERIC-NEXT: vfmsub213sd (%rdi), %xmm1, %xmm0 +; GENERIC-NEXT: vfmsub213sd %xmm2, %xmm1, %xmm0 # sched: [5:0.50] +; GENERIC-NEXT: vfmsub213sd (%rdi), %xmm1, %xmm0 # sched: [5:0.50] ; GENERIC-NEXT: retq # sched: [1:1.00] ; ; HASWELL-LABEL: test_vfmsub213sd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vfmsub213sd %xmm2, %xmm1, %xmm0 # sched: [5:0.50] -; HASWELL-NEXT: vfmsub213sd (%rdi), %xmm1, %xmm0 # sched: [5:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vfmsub213sd (%rdi), %xmm1, %xmm0 # sched: [10:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_vfmsub213sd: ; BROADWELL: # %bb.0: @@ -943,8 +943,8 @@ ; KNL-LABEL: test_vfmsub213sd: ; KNL: # %bb.0: ; KNL-NEXT: vfmsub213sd %xmm2, %xmm1, %xmm0 # sched: [5:0.50] -; KNL-NEXT: vfmsub213sd (%rdi), %xmm1, %xmm0 # sched: [5:0.50] -; KNL-NEXT: retq # sched: [2:1.00] +; KNL-NEXT: vfmsub213sd (%rdi), %xmm1, %xmm0 # sched: [10:0.50] +; KNL-NEXT: retq # sched: [7:1.00] ; ; SKX-LABEL: test_vfmsub213sd: ; SKX: # %bb.0: @@ -954,8 +954,8 @@ ; ; ZNVER1-LABEL: test_vfmsub213sd: ; ZNVER1: # %bb.0: -; ZNVER1-NEXT: vfmsub213sd %xmm2, %xmm1, %xmm0 -; ZNVER1-NEXT: vfmsub213sd (%rdi), %xmm1, %xmm0 +; ZNVER1-NEXT: vfmsub213sd %xmm2, %xmm1, %xmm0 # sched: [5:0.50] +; ZNVER1-NEXT: vfmsub213sd (%rdi), %xmm1, %xmm0 # sched: [5:0.50] ; ZNVER1-NEXT: retq # sched: [1:0.50] %1 = call <2 x double> @llvm.x86.fma.vfmsub.sd(<2 x double> %a0, <2 x double> %a1, <2 x double> %a2) %2 = load <2 x double>, <2 x double> *%a3 @@ -966,15 +966,15 @@ define <4 x float> @test_vfmsub213ss(<4 x float> %a0, <4 x float> %a1, <4 x float> %a2, <4 x float> *%a3) { ; GENERIC-LABEL: test_vfmsub213ss: ; GENERIC: # %bb.0: -; GENERIC-NEXT: vfmsub213ss %xmm2, %xmm1, %xmm0 -; GENERIC-NEXT: vfmsub213ss (%rdi), %xmm1, %xmm0 +; GENERIC-NEXT: vfmsub213ss %xmm2, %xmm1, %xmm0 # sched: [5:0.50] +; GENERIC-NEXT: vfmsub213ss (%rdi), %xmm1, %xmm0 # sched: [5:0.50] ; GENERIC-NEXT: retq # sched: [1:1.00] ; ; HASWELL-LABEL: test_vfmsub213ss: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vfmsub213ss %xmm2, %xmm1, %xmm0 # sched: [5:0.50] -; HASWELL-NEXT: vfmsub213ss (%rdi), %xmm1, %xmm0 # sched: [5:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vfmsub213ss (%rdi), %xmm1, %xmm0 # sched: [10:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_vfmsub213ss: ; BROADWELL: # %bb.0: @@ -991,8 +991,8 @@ ; KNL-LABEL: test_vfmsub213ss: ; KNL: # %bb.0: ; KNL-NEXT: vfmsub213ss %xmm2, %xmm1, %xmm0 # sched: [5:0.50] -; KNL-NEXT: vfmsub213ss (%rdi), %xmm1, %xmm0 # sched: [5:0.50] -; KNL-NEXT: retq # sched: [2:1.00] +; KNL-NEXT: vfmsub213ss (%rdi), %xmm1, %xmm0 # sched: [10:0.50] +; KNL-NEXT: retq # sched: [7:1.00] ; ; SKX-LABEL: test_vfmsub213ss: ; SKX: # %bb.0: @@ -1002,8 +1002,8 @@ ; ; ZNVER1-LABEL: test_vfmsub213ss: ; ZNVER1: # %bb.0: -; ZNVER1-NEXT: vfmsub213ss %xmm2, %xmm1, %xmm0 -; ZNVER1-NEXT: vfmsub213ss (%rdi), %xmm1, %xmm0 +; ZNVER1-NEXT: vfmsub213ss %xmm2, %xmm1, %xmm0 # sched: [5:0.50] +; ZNVER1-NEXT: vfmsub213ss (%rdi), %xmm1, %xmm0 # sched: [5:0.50] ; ZNVER1-NEXT: retq # sched: [1:0.50] %1 = call <4 x float> @llvm.x86.fma.vfmsub.ss(<4 x float> %a0, <4 x float> %a1, <4 x float> %a2) %2 = load <4 x float>, <4 x float> *%a3 @@ -1026,15 +1026,15 @@ define <2 x double> @test_vfnmadd213pd(<2 x double> %a0, <2 x double> %a1, <2 x double> %a2, <2 x double> *%a3) { ; GENERIC-LABEL: test_vfnmadd213pd: ; GENERIC: # %bb.0: -; GENERIC-NEXT: vfnmadd213pd %xmm2, %xmm1, %xmm0 -; GENERIC-NEXT: vfnmadd213pd (%rdi), %xmm1, %xmm0 +; GENERIC-NEXT: vfnmadd213pd %xmm2, %xmm1, %xmm0 # sched: [5:0.50] +; GENERIC-NEXT: vfnmadd213pd (%rdi), %xmm1, %xmm0 # sched: [5:0.50] ; GENERIC-NEXT: retq # sched: [1:1.00] ; ; HASWELL-LABEL: test_vfnmadd213pd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vfnmadd213pd %xmm2, %xmm1, %xmm0 # sched: [5:0.50] -; HASWELL-NEXT: vfnmadd213pd (%rdi), %xmm1, %xmm0 # sched: [5:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vfnmadd213pd (%rdi), %xmm1, %xmm0 # sched: [11:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_vfnmadd213pd: ; BROADWELL: # %bb.0: @@ -1051,8 +1051,8 @@ ; KNL-LABEL: test_vfnmadd213pd: ; KNL: # %bb.0: ; KNL-NEXT: vfnmadd213pd %xmm2, %xmm1, %xmm0 # sched: [5:0.50] -; KNL-NEXT: vfnmadd213pd (%rdi), %xmm1, %xmm0 # sched: [5:0.50] -; KNL-NEXT: retq # sched: [2:1.00] +; KNL-NEXT: vfnmadd213pd (%rdi), %xmm1, %xmm0 # sched: [11:0.50] +; KNL-NEXT: retq # sched: [7:1.00] ; ; SKX-LABEL: test_vfnmadd213pd: ; SKX: # %bb.0: @@ -1062,8 +1062,8 @@ ; ; ZNVER1-LABEL: test_vfnmadd213pd: ; ZNVER1: # %bb.0: -; ZNVER1-NEXT: vfnmadd213pd %xmm2, %xmm1, %xmm0 -; ZNVER1-NEXT: vfnmadd213pd (%rdi), %xmm1, %xmm0 +; ZNVER1-NEXT: vfnmadd213pd %xmm2, %xmm1, %xmm0 # sched: [5:0.50] +; ZNVER1-NEXT: vfnmadd213pd (%rdi), %xmm1, %xmm0 # sched: [5:0.50] ; ZNVER1-NEXT: retq # sched: [1:0.50] %1 = call <2 x double> @llvm.x86.fma.vfnmadd.pd(<2 x double> %a0, <2 x double> %a1, <2 x double> %a2) %2 = load <2 x double>, <2 x double> *%a3 @@ -1074,15 +1074,15 @@ define <4 x double> @test_vfnmadd213pd_ymm(<4 x double> %a0, <4 x double> %a1, <4 x double> %a2, <4 x double> *%a3) { ; GENERIC-LABEL: test_vfnmadd213pd_ymm: ; GENERIC: # %bb.0: -; GENERIC-NEXT: vfnmadd213pd %ymm2, %ymm1, %ymm0 -; GENERIC-NEXT: vfnmadd213pd (%rdi), %ymm1, %ymm0 +; GENERIC-NEXT: vfnmadd213pd %ymm2, %ymm1, %ymm0 # sched: [5:0.50] +; GENERIC-NEXT: vfnmadd213pd (%rdi), %ymm1, %ymm0 # sched: [5:0.50] ; GENERIC-NEXT: retq # sched: [1:1.00] ; ; HASWELL-LABEL: test_vfnmadd213pd_ymm: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vfnmadd213pd %ymm2, %ymm1, %ymm0 # sched: [5:0.50] -; HASWELL-NEXT: vfnmadd213pd (%rdi), %ymm1, %ymm0 # sched: [5:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vfnmadd213pd (%rdi), %ymm1, %ymm0 # sched: [12:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_vfnmadd213pd_ymm: ; BROADWELL: # %bb.0: @@ -1099,8 +1099,8 @@ ; KNL-LABEL: test_vfnmadd213pd_ymm: ; KNL: # %bb.0: ; KNL-NEXT: vfnmadd213pd %ymm2, %ymm1, %ymm0 # sched: [5:0.50] -; KNL-NEXT: vfnmadd213pd (%rdi), %ymm1, %ymm0 # sched: [5:0.50] -; KNL-NEXT: retq # sched: [2:1.00] +; KNL-NEXT: vfnmadd213pd (%rdi), %ymm1, %ymm0 # sched: [12:0.50] +; KNL-NEXT: retq # sched: [7:1.00] ; ; SKX-LABEL: test_vfnmadd213pd_ymm: ; SKX: # %bb.0: @@ -1110,8 +1110,8 @@ ; ; ZNVER1-LABEL: test_vfnmadd213pd_ymm: ; ZNVER1: # %bb.0: -; ZNVER1-NEXT: vfnmadd213pd %ymm2, %ymm1, %ymm0 -; ZNVER1-NEXT: vfnmadd213pd (%rdi), %ymm1, %ymm0 +; ZNVER1-NEXT: vfnmadd213pd %ymm2, %ymm1, %ymm0 # sched: [5:0.50] +; ZNVER1-NEXT: vfnmadd213pd (%rdi), %ymm1, %ymm0 # sched: [5:0.50] ; ZNVER1-NEXT: retq # sched: [1:0.50] %1 = call <4 x double> @llvm.x86.fma.vfnmadd.pd.256(<4 x double> %a0, <4 x double> %a1, <4 x double> %a2) %2 = load <4 x double>, <4 x double> *%a3 @@ -1122,15 +1122,15 @@ define <4 x float> @test_vfnmadd213ps(<4 x float> %a0, <4 x float> %a1, <4 x float> %a2, <4 x float> *%a3) { ; GENERIC-LABEL: test_vfnmadd213ps: ; GENERIC: # %bb.0: -; GENERIC-NEXT: vfnmadd213ps %xmm2, %xmm1, %xmm0 -; GENERIC-NEXT: vfnmadd213ps (%rdi), %xmm1, %xmm0 +; GENERIC-NEXT: vfnmadd213ps %xmm2, %xmm1, %xmm0 # sched: [5:0.50] +; GENERIC-NEXT: vfnmadd213ps (%rdi), %xmm1, %xmm0 # sched: [5:0.50] ; GENERIC-NEXT: retq # sched: [1:1.00] ; ; HASWELL-LABEL: test_vfnmadd213ps: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vfnmadd213ps %xmm2, %xmm1, %xmm0 # sched: [5:0.50] -; HASWELL-NEXT: vfnmadd213ps (%rdi), %xmm1, %xmm0 # sched: [5:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vfnmadd213ps (%rdi), %xmm1, %xmm0 # sched: [11:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_vfnmadd213ps: ; BROADWELL: # %bb.0: @@ -1147,8 +1147,8 @@ ; KNL-LABEL: test_vfnmadd213ps: ; KNL: # %bb.0: ; KNL-NEXT: vfnmadd213ps %xmm2, %xmm1, %xmm0 # sched: [5:0.50] -; KNL-NEXT: vfnmadd213ps (%rdi), %xmm1, %xmm0 # sched: [5:0.50] -; KNL-NEXT: retq # sched: [2:1.00] +; KNL-NEXT: vfnmadd213ps (%rdi), %xmm1, %xmm0 # sched: [11:0.50] +; KNL-NEXT: retq # sched: [7:1.00] ; ; SKX-LABEL: test_vfnmadd213ps: ; SKX: # %bb.0: @@ -1158,8 +1158,8 @@ ; ; ZNVER1-LABEL: test_vfnmadd213ps: ; ZNVER1: # %bb.0: -; ZNVER1-NEXT: vfnmadd213ps %xmm2, %xmm1, %xmm0 -; ZNVER1-NEXT: vfnmadd213ps (%rdi), %xmm1, %xmm0 +; ZNVER1-NEXT: vfnmadd213ps %xmm2, %xmm1, %xmm0 # sched: [5:0.50] +; ZNVER1-NEXT: vfnmadd213ps (%rdi), %xmm1, %xmm0 # sched: [5:0.50] ; ZNVER1-NEXT: retq # sched: [1:0.50] %1 = call <4 x float> @llvm.x86.fma.vfnmadd.ps(<4 x float> %a0, <4 x float> %a1, <4 x float> %a2) %2 = load <4 x float>, <4 x float> *%a3 @@ -1170,15 +1170,15 @@ define <8 x float> @test_vfnmadd213ps_ymm(<8 x float> %a0, <8 x float> %a1, <8 x float> %a2, <8 x float> *%a3) { ; GENERIC-LABEL: test_vfnmadd213ps_ymm: ; GENERIC: # %bb.0: -; GENERIC-NEXT: vfnmadd213ps %ymm2, %ymm1, %ymm0 -; GENERIC-NEXT: vfnmadd213ps (%rdi), %ymm1, %ymm0 +; GENERIC-NEXT: vfnmadd213ps %ymm2, %ymm1, %ymm0 # sched: [5:0.50] +; GENERIC-NEXT: vfnmadd213ps (%rdi), %ymm1, %ymm0 # sched: [5:0.50] ; GENERIC-NEXT: retq # sched: [1:1.00] ; ; HASWELL-LABEL: test_vfnmadd213ps_ymm: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vfnmadd213ps %ymm2, %ymm1, %ymm0 # sched: [5:0.50] -; HASWELL-NEXT: vfnmadd213ps (%rdi), %ymm1, %ymm0 # sched: [5:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vfnmadd213ps (%rdi), %ymm1, %ymm0 # sched: [12:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_vfnmadd213ps_ymm: ; BROADWELL: # %bb.0: @@ -1195,8 +1195,8 @@ ; KNL-LABEL: test_vfnmadd213ps_ymm: ; KNL: # %bb.0: ; KNL-NEXT: vfnmadd213ps %ymm2, %ymm1, %ymm0 # sched: [5:0.50] -; KNL-NEXT: vfnmadd213ps (%rdi), %ymm1, %ymm0 # sched: [5:0.50] -; KNL-NEXT: retq # sched: [2:1.00] +; KNL-NEXT: vfnmadd213ps (%rdi), %ymm1, %ymm0 # sched: [12:0.50] +; KNL-NEXT: retq # sched: [7:1.00] ; ; SKX-LABEL: test_vfnmadd213ps_ymm: ; SKX: # %bb.0: @@ -1206,8 +1206,8 @@ ; ; ZNVER1-LABEL: test_vfnmadd213ps_ymm: ; ZNVER1: # %bb.0: -; ZNVER1-NEXT: vfnmadd213ps %ymm2, %ymm1, %ymm0 -; ZNVER1-NEXT: vfnmadd213ps (%rdi), %ymm1, %ymm0 +; ZNVER1-NEXT: vfnmadd213ps %ymm2, %ymm1, %ymm0 # sched: [5:0.50] +; ZNVER1-NEXT: vfnmadd213ps (%rdi), %ymm1, %ymm0 # sched: [5:0.50] ; ZNVER1-NEXT: retq # sched: [1:0.50] %1 = call <8 x float> @llvm.x86.fma.vfnmadd.ps.256(<8 x float> %a0, <8 x float> %a1, <8 x float> %a2) %2 = load <8 x float>, <8 x float> *%a3 @@ -1218,15 +1218,15 @@ define <2 x double> @test_vfnmadd213sd(<2 x double> %a0, <2 x double> %a1, <2 x double> %a2, <2 x double> *%a3) { ; GENERIC-LABEL: test_vfnmadd213sd: ; GENERIC: # %bb.0: -; GENERIC-NEXT: vfnmadd213sd %xmm2, %xmm1, %xmm0 -; GENERIC-NEXT: vfnmadd213sd (%rdi), %xmm1, %xmm0 +; GENERIC-NEXT: vfnmadd213sd %xmm2, %xmm1, %xmm0 # sched: [5:0.50] +; GENERIC-NEXT: vfnmadd213sd (%rdi), %xmm1, %xmm0 # sched: [5:0.50] ; GENERIC-NEXT: retq # sched: [1:1.00] ; ; HASWELL-LABEL: test_vfnmadd213sd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vfnmadd213sd %xmm2, %xmm1, %xmm0 # sched: [5:0.50] -; HASWELL-NEXT: vfnmadd213sd (%rdi), %xmm1, %xmm0 # sched: [5:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vfnmadd213sd (%rdi), %xmm1, %xmm0 # sched: [10:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_vfnmadd213sd: ; BROADWELL: # %bb.0: @@ -1243,8 +1243,8 @@ ; KNL-LABEL: test_vfnmadd213sd: ; KNL: # %bb.0: ; KNL-NEXT: vfnmadd213sd %xmm2, %xmm1, %xmm0 # sched: [5:0.50] -; KNL-NEXT: vfnmadd213sd (%rdi), %xmm1, %xmm0 # sched: [5:0.50] -; KNL-NEXT: retq # sched: [2:1.00] +; KNL-NEXT: vfnmadd213sd (%rdi), %xmm1, %xmm0 # sched: [10:0.50] +; KNL-NEXT: retq # sched: [7:1.00] ; ; SKX-LABEL: test_vfnmadd213sd: ; SKX: # %bb.0: @@ -1254,8 +1254,8 @@ ; ; ZNVER1-LABEL: test_vfnmadd213sd: ; ZNVER1: # %bb.0: -; ZNVER1-NEXT: vfnmadd213sd %xmm2, %xmm1, %xmm0 -; ZNVER1-NEXT: vfnmadd213sd (%rdi), %xmm1, %xmm0 +; ZNVER1-NEXT: vfnmadd213sd %xmm2, %xmm1, %xmm0 # sched: [5:0.50] +; ZNVER1-NEXT: vfnmadd213sd (%rdi), %xmm1, %xmm0 # sched: [5:0.50] ; ZNVER1-NEXT: retq # sched: [1:0.50] %1 = call <2 x double> @llvm.x86.fma.vfnmadd.sd(<2 x double> %a0, <2 x double> %a1, <2 x double> %a2) %2 = load <2 x double>, <2 x double> *%a3 @@ -1266,15 +1266,15 @@ define <4 x float> @test_vfnmadd213ss(<4 x float> %a0, <4 x float> %a1, <4 x float> %a2, <4 x float> *%a3) { ; GENERIC-LABEL: test_vfnmadd213ss: ; GENERIC: # %bb.0: -; GENERIC-NEXT: vfnmadd213ss %xmm2, %xmm1, %xmm0 -; GENERIC-NEXT: vfnmadd213ss (%rdi), %xmm1, %xmm0 +; GENERIC-NEXT: vfnmadd213ss %xmm2, %xmm1, %xmm0 # sched: [5:0.50] +; GENERIC-NEXT: vfnmadd213ss (%rdi), %xmm1, %xmm0 # sched: [5:0.50] ; GENERIC-NEXT: retq # sched: [1:1.00] ; ; HASWELL-LABEL: test_vfnmadd213ss: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vfnmadd213ss %xmm2, %xmm1, %xmm0 # sched: [5:0.50] -; HASWELL-NEXT: vfnmadd213ss (%rdi), %xmm1, %xmm0 # sched: [5:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vfnmadd213ss (%rdi), %xmm1, %xmm0 # sched: [10:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_vfnmadd213ss: ; BROADWELL: # %bb.0: @@ -1291,8 +1291,8 @@ ; KNL-LABEL: test_vfnmadd213ss: ; KNL: # %bb.0: ; KNL-NEXT: vfnmadd213ss %xmm2, %xmm1, %xmm0 # sched: [5:0.50] -; KNL-NEXT: vfnmadd213ss (%rdi), %xmm1, %xmm0 # sched: [5:0.50] -; KNL-NEXT: retq # sched: [2:1.00] +; KNL-NEXT: vfnmadd213ss (%rdi), %xmm1, %xmm0 # sched: [10:0.50] +; KNL-NEXT: retq # sched: [7:1.00] ; ; SKX-LABEL: test_vfnmadd213ss: ; SKX: # %bb.0: @@ -1302,8 +1302,8 @@ ; ; ZNVER1-LABEL: test_vfnmadd213ss: ; ZNVER1: # %bb.0: -; ZNVER1-NEXT: vfnmadd213ss %xmm2, %xmm1, %xmm0 -; ZNVER1-NEXT: vfnmadd213ss (%rdi), %xmm1, %xmm0 +; ZNVER1-NEXT: vfnmadd213ss %xmm2, %xmm1, %xmm0 # sched: [5:0.50] +; ZNVER1-NEXT: vfnmadd213ss (%rdi), %xmm1, %xmm0 # sched: [5:0.50] ; ZNVER1-NEXT: retq # sched: [1:0.50] %1 = call <4 x float> @llvm.x86.fma.vfnmadd.ss(<4 x float> %a0, <4 x float> %a1, <4 x float> %a2) %2 = load <4 x float>, <4 x float> *%a3 @@ -1326,15 +1326,15 @@ define <2 x double> @test_vfnmsub213pd(<2 x double> %a0, <2 x double> %a1, <2 x double> %a2, <2 x double> *%a3) { ; GENERIC-LABEL: test_vfnmsub213pd: ; GENERIC: # %bb.0: -; GENERIC-NEXT: vfnmsub213pd %xmm2, %xmm1, %xmm0 -; GENERIC-NEXT: vfnmsub213pd (%rdi), %xmm1, %xmm0 +; GENERIC-NEXT: vfnmsub213pd %xmm2, %xmm1, %xmm0 # sched: [5:0.50] +; GENERIC-NEXT: vfnmsub213pd (%rdi), %xmm1, %xmm0 # sched: [5:0.50] ; GENERIC-NEXT: retq # sched: [1:1.00] ; ; HASWELL-LABEL: test_vfnmsub213pd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vfnmsub213pd %xmm2, %xmm1, %xmm0 # sched: [5:0.50] -; HASWELL-NEXT: vfnmsub213pd (%rdi), %xmm1, %xmm0 # sched: [5:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vfnmsub213pd (%rdi), %xmm1, %xmm0 # sched: [11:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_vfnmsub213pd: ; BROADWELL: # %bb.0: @@ -1351,8 +1351,8 @@ ; KNL-LABEL: test_vfnmsub213pd: ; KNL: # %bb.0: ; KNL-NEXT: vfnmsub213pd %xmm2, %xmm1, %xmm0 # sched: [5:0.50] -; KNL-NEXT: vfnmsub213pd (%rdi), %xmm1, %xmm0 # sched: [5:0.50] -; KNL-NEXT: retq # sched: [2:1.00] +; KNL-NEXT: vfnmsub213pd (%rdi), %xmm1, %xmm0 # sched: [11:0.50] +; KNL-NEXT: retq # sched: [7:1.00] ; ; SKX-LABEL: test_vfnmsub213pd: ; SKX: # %bb.0: @@ -1362,8 +1362,8 @@ ; ; ZNVER1-LABEL: test_vfnmsub213pd: ; ZNVER1: # %bb.0: -; ZNVER1-NEXT: vfnmsub213pd %xmm2, %xmm1, %xmm0 -; ZNVER1-NEXT: vfnmsub213pd (%rdi), %xmm1, %xmm0 +; ZNVER1-NEXT: vfnmsub213pd %xmm2, %xmm1, %xmm0 # sched: [5:0.50] +; ZNVER1-NEXT: vfnmsub213pd (%rdi), %xmm1, %xmm0 # sched: [5:0.50] ; ZNVER1-NEXT: retq # sched: [1:0.50] %1 = call <2 x double> @llvm.x86.fma.vfnmsub.pd(<2 x double> %a0, <2 x double> %a1, <2 x double> %a2) %2 = load <2 x double>, <2 x double> *%a3 @@ -1374,15 +1374,15 @@ define <4 x double> @test_vfnmsub213pd_ymm(<4 x double> %a0, <4 x double> %a1, <4 x double> %a2, <4 x double> *%a3) { ; GENERIC-LABEL: test_vfnmsub213pd_ymm: ; GENERIC: # %bb.0: -; GENERIC-NEXT: vfnmsub213pd %ymm2, %ymm1, %ymm0 -; GENERIC-NEXT: vfnmsub213pd (%rdi), %ymm1, %ymm0 +; GENERIC-NEXT: vfnmsub213pd %ymm2, %ymm1, %ymm0 # sched: [5:0.50] +; GENERIC-NEXT: vfnmsub213pd (%rdi), %ymm1, %ymm0 # sched: [5:0.50] ; GENERIC-NEXT: retq # sched: [1:1.00] ; ; HASWELL-LABEL: test_vfnmsub213pd_ymm: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vfnmsub213pd %ymm2, %ymm1, %ymm0 # sched: [5:0.50] -; HASWELL-NEXT: vfnmsub213pd (%rdi), %ymm1, %ymm0 # sched: [5:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vfnmsub213pd (%rdi), %ymm1, %ymm0 # sched: [12:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_vfnmsub213pd_ymm: ; BROADWELL: # %bb.0: @@ -1399,8 +1399,8 @@ ; KNL-LABEL: test_vfnmsub213pd_ymm: ; KNL: # %bb.0: ; KNL-NEXT: vfnmsub213pd %ymm2, %ymm1, %ymm0 # sched: [5:0.50] -; KNL-NEXT: vfnmsub213pd (%rdi), %ymm1, %ymm0 # sched: [5:0.50] -; KNL-NEXT: retq # sched: [2:1.00] +; KNL-NEXT: vfnmsub213pd (%rdi), %ymm1, %ymm0 # sched: [12:0.50] +; KNL-NEXT: retq # sched: [7:1.00] ; ; SKX-LABEL: test_vfnmsub213pd_ymm: ; SKX: # %bb.0: @@ -1410,8 +1410,8 @@ ; ; ZNVER1-LABEL: test_vfnmsub213pd_ymm: ; ZNVER1: # %bb.0: -; ZNVER1-NEXT: vfnmsub213pd %ymm2, %ymm1, %ymm0 -; ZNVER1-NEXT: vfnmsub213pd (%rdi), %ymm1, %ymm0 +; ZNVER1-NEXT: vfnmsub213pd %ymm2, %ymm1, %ymm0 # sched: [5:0.50] +; ZNVER1-NEXT: vfnmsub213pd (%rdi), %ymm1, %ymm0 # sched: [5:0.50] ; ZNVER1-NEXT: retq # sched: [1:0.50] %1 = call <4 x double> @llvm.x86.fma.vfnmsub.pd.256(<4 x double> %a0, <4 x double> %a1, <4 x double> %a2) %2 = load <4 x double>, <4 x double> *%a3 @@ -1422,15 +1422,15 @@ define <4 x float> @test_vfnmsub213ps(<4 x float> %a0, <4 x float> %a1, <4 x float> %a2, <4 x float> *%a3) { ; GENERIC-LABEL: test_vfnmsub213ps: ; GENERIC: # %bb.0: -; GENERIC-NEXT: vfnmsub213ps %xmm2, %xmm1, %xmm0 -; GENERIC-NEXT: vfnmsub213ps (%rdi), %xmm1, %xmm0 +; GENERIC-NEXT: vfnmsub213ps %xmm2, %xmm1, %xmm0 # sched: [5:0.50] +; GENERIC-NEXT: vfnmsub213ps (%rdi), %xmm1, %xmm0 # sched: [5:0.50] ; GENERIC-NEXT: retq # sched: [1:1.00] ; ; HASWELL-LABEL: test_vfnmsub213ps: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vfnmsub213ps %xmm2, %xmm1, %xmm0 # sched: [5:0.50] -; HASWELL-NEXT: vfnmsub213ps (%rdi), %xmm1, %xmm0 # sched: [5:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vfnmsub213ps (%rdi), %xmm1, %xmm0 # sched: [11:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_vfnmsub213ps: ; BROADWELL: # %bb.0: @@ -1447,8 +1447,8 @@ ; KNL-LABEL: test_vfnmsub213ps: ; KNL: # %bb.0: ; KNL-NEXT: vfnmsub213ps %xmm2, %xmm1, %xmm0 # sched: [5:0.50] -; KNL-NEXT: vfnmsub213ps (%rdi), %xmm1, %xmm0 # sched: [5:0.50] -; KNL-NEXT: retq # sched: [2:1.00] +; KNL-NEXT: vfnmsub213ps (%rdi), %xmm1, %xmm0 # sched: [11:0.50] +; KNL-NEXT: retq # sched: [7:1.00] ; ; SKX-LABEL: test_vfnmsub213ps: ; SKX: # %bb.0: @@ -1458,8 +1458,8 @@ ; ; ZNVER1-LABEL: test_vfnmsub213ps: ; ZNVER1: # %bb.0: -; ZNVER1-NEXT: vfnmsub213ps %xmm2, %xmm1, %xmm0 -; ZNVER1-NEXT: vfnmsub213ps (%rdi), %xmm1, %xmm0 +; ZNVER1-NEXT: vfnmsub213ps %xmm2, %xmm1, %xmm0 # sched: [5:0.50] +; ZNVER1-NEXT: vfnmsub213ps (%rdi), %xmm1, %xmm0 # sched: [5:0.50] ; ZNVER1-NEXT: retq # sched: [1:0.50] %1 = call <4 x float> @llvm.x86.fma.vfnmsub.ps(<4 x float> %a0, <4 x float> %a1, <4 x float> %a2) %2 = load <4 x float>, <4 x float> *%a3 @@ -1470,15 +1470,15 @@ define <8 x float> @test_vfnmsub213ps_ymm(<8 x float> %a0, <8 x float> %a1, <8 x float> %a2, <8 x float> *%a3) { ; GENERIC-LABEL: test_vfnmsub213ps_ymm: ; GENERIC: # %bb.0: -; GENERIC-NEXT: vfnmsub213ps %ymm2, %ymm1, %ymm0 -; GENERIC-NEXT: vfnmsub213ps (%rdi), %ymm1, %ymm0 +; GENERIC-NEXT: vfnmsub213ps %ymm2, %ymm1, %ymm0 # sched: [5:0.50] +; GENERIC-NEXT: vfnmsub213ps (%rdi), %ymm1, %ymm0 # sched: [5:0.50] ; GENERIC-NEXT: retq # sched: [1:1.00] ; ; HASWELL-LABEL: test_vfnmsub213ps_ymm: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vfnmsub213ps %ymm2, %ymm1, %ymm0 # sched: [5:0.50] -; HASWELL-NEXT: vfnmsub213ps (%rdi), %ymm1, %ymm0 # sched: [5:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vfnmsub213ps (%rdi), %ymm1, %ymm0 # sched: [12:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_vfnmsub213ps_ymm: ; BROADWELL: # %bb.0: @@ -1495,8 +1495,8 @@ ; KNL-LABEL: test_vfnmsub213ps_ymm: ; KNL: # %bb.0: ; KNL-NEXT: vfnmsub213ps %ymm2, %ymm1, %ymm0 # sched: [5:0.50] -; KNL-NEXT: vfnmsub213ps (%rdi), %ymm1, %ymm0 # sched: [5:0.50] -; KNL-NEXT: retq # sched: [2:1.00] +; KNL-NEXT: vfnmsub213ps (%rdi), %ymm1, %ymm0 # sched: [12:0.50] +; KNL-NEXT: retq # sched: [7:1.00] ; ; SKX-LABEL: test_vfnmsub213ps_ymm: ; SKX: # %bb.0: @@ -1506,8 +1506,8 @@ ; ; ZNVER1-LABEL: test_vfnmsub213ps_ymm: ; ZNVER1: # %bb.0: -; ZNVER1-NEXT: vfnmsub213ps %ymm2, %ymm1, %ymm0 -; ZNVER1-NEXT: vfnmsub213ps (%rdi), %ymm1, %ymm0 +; ZNVER1-NEXT: vfnmsub213ps %ymm2, %ymm1, %ymm0 # sched: [5:0.50] +; ZNVER1-NEXT: vfnmsub213ps (%rdi), %ymm1, %ymm0 # sched: [5:0.50] ; ZNVER1-NEXT: retq # sched: [1:0.50] %1 = call <8 x float> @llvm.x86.fma.vfnmsub.ps.256(<8 x float> %a0, <8 x float> %a1, <8 x float> %a2) %2 = load <8 x float>, <8 x float> *%a3 @@ -1518,15 +1518,15 @@ define <2 x double> @test_vfnmsub213sd(<2 x double> %a0, <2 x double> %a1, <2 x double> %a2, <2 x double> *%a3) { ; GENERIC-LABEL: test_vfnmsub213sd: ; GENERIC: # %bb.0: -; GENERIC-NEXT: vfnmsub213sd %xmm2, %xmm1, %xmm0 -; GENERIC-NEXT: vfnmsub213sd (%rdi), %xmm1, %xmm0 +; GENERIC-NEXT: vfnmsub213sd %xmm2, %xmm1, %xmm0 # sched: [5:0.50] +; GENERIC-NEXT: vfnmsub213sd (%rdi), %xmm1, %xmm0 # sched: [5:0.50] ; GENERIC-NEXT: retq # sched: [1:1.00] ; ; HASWELL-LABEL: test_vfnmsub213sd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vfnmsub213sd %xmm2, %xmm1, %xmm0 # sched: [5:0.50] -; HASWELL-NEXT: vfnmsub213sd (%rdi), %xmm1, %xmm0 # sched: [5:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vfnmsub213sd (%rdi), %xmm1, %xmm0 # sched: [10:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_vfnmsub213sd: ; BROADWELL: # %bb.0: @@ -1543,8 +1543,8 @@ ; KNL-LABEL: test_vfnmsub213sd: ; KNL: # %bb.0: ; KNL-NEXT: vfnmsub213sd %xmm2, %xmm1, %xmm0 # sched: [5:0.50] -; KNL-NEXT: vfnmsub213sd (%rdi), %xmm1, %xmm0 # sched: [5:0.50] -; KNL-NEXT: retq # sched: [2:1.00] +; KNL-NEXT: vfnmsub213sd (%rdi), %xmm1, %xmm0 # sched: [10:0.50] +; KNL-NEXT: retq # sched: [7:1.00] ; ; SKX-LABEL: test_vfnmsub213sd: ; SKX: # %bb.0: @@ -1554,8 +1554,8 @@ ; ; ZNVER1-LABEL: test_vfnmsub213sd: ; ZNVER1: # %bb.0: -; ZNVER1-NEXT: vfnmsub213sd %xmm2, %xmm1, %xmm0 -; ZNVER1-NEXT: vfnmsub213sd (%rdi), %xmm1, %xmm0 +; ZNVER1-NEXT: vfnmsub213sd %xmm2, %xmm1, %xmm0 # sched: [5:0.50] +; ZNVER1-NEXT: vfnmsub213sd (%rdi), %xmm1, %xmm0 # sched: [5:0.50] ; ZNVER1-NEXT: retq # sched: [1:0.50] %1 = call <2 x double> @llvm.x86.fma.vfnmsub.sd(<2 x double> %a0, <2 x double> %a1, <2 x double> %a2) %2 = load <2 x double>, <2 x double> *%a3 @@ -1566,15 +1566,15 @@ define <4 x float> @test_vfnmsub213ss(<4 x float> %a0, <4 x float> %a1, <4 x float> %a2, <4 x float> *%a3) { ; GENERIC-LABEL: test_vfnmsub213ss: ; GENERIC: # %bb.0: -; GENERIC-NEXT: vfnmsub213ss %xmm2, %xmm1, %xmm0 -; GENERIC-NEXT: vfnmsub213ss (%rdi), %xmm1, %xmm0 +; GENERIC-NEXT: vfnmsub213ss %xmm2, %xmm1, %xmm0 # sched: [5:0.50] +; GENERIC-NEXT: vfnmsub213ss (%rdi), %xmm1, %xmm0 # sched: [5:0.50] ; GENERIC-NEXT: retq # sched: [1:1.00] ; ; HASWELL-LABEL: test_vfnmsub213ss: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vfnmsub213ss %xmm2, %xmm1, %xmm0 # sched: [5:0.50] -; HASWELL-NEXT: vfnmsub213ss (%rdi), %xmm1, %xmm0 # sched: [5:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vfnmsub213ss (%rdi), %xmm1, %xmm0 # sched: [10:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_vfnmsub213ss: ; BROADWELL: # %bb.0: @@ -1591,8 +1591,8 @@ ; KNL-LABEL: test_vfnmsub213ss: ; KNL: # %bb.0: ; KNL-NEXT: vfnmsub213ss %xmm2, %xmm1, %xmm0 # sched: [5:0.50] -; KNL-NEXT: vfnmsub213ss (%rdi), %xmm1, %xmm0 # sched: [5:0.50] -; KNL-NEXT: retq # sched: [2:1.00] +; KNL-NEXT: vfnmsub213ss (%rdi), %xmm1, %xmm0 # sched: [10:0.50] +; KNL-NEXT: retq # sched: [7:1.00] ; ; SKX-LABEL: test_vfnmsub213ss: ; SKX: # %bb.0: @@ -1602,8 +1602,8 @@ ; ; ZNVER1-LABEL: test_vfnmsub213ss: ; ZNVER1: # %bb.0: -; ZNVER1-NEXT: vfnmsub213ss %xmm2, %xmm1, %xmm0 -; ZNVER1-NEXT: vfnmsub213ss (%rdi), %xmm1, %xmm0 +; ZNVER1-NEXT: vfnmsub213ss %xmm2, %xmm1, %xmm0 # sched: [5:0.50] +; ZNVER1-NEXT: vfnmsub213ss (%rdi), %xmm1, %xmm0 # sched: [5:0.50] ; ZNVER1-NEXT: retq # sched: [1:0.50] %1 = call <4 x float> @llvm.x86.fma.vfnmsub.ss(<4 x float> %a0, <4 x float> %a1, <4 x float> %a2) %2 = load <4 x float>, <4 x float> *%a3 Index: test/CodeGen/X86/lea32-schedule.ll =================================================================== --- test/CodeGen/X86/lea32-schedule.ll +++ test/CodeGen/X86/lea32-schedule.ll @@ -46,7 +46,7 @@ ; HASWELL: # %bb.0: ; HASWELL-NEXT: # kill: %edi %edi %rdi ; HASWELL-NEXT: leal -24(%rdi), %eax # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_lea_offset: ; BROADWELL: # %bb.0: @@ -110,7 +110,7 @@ ; HASWELL: # %bb.0: ; HASWELL-NEXT: # kill: %edi %edi %rdi ; HASWELL-NEXT: leal 1024(%rdi), %eax # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_lea_offset_big: ; BROADWELL: # %bb.0: @@ -180,7 +180,7 @@ ; HASWELL-NEXT: # kill: %esi %esi %rsi ; HASWELL-NEXT: # kill: %edi %edi %rdi ; HASWELL-NEXT: leal (%rdi,%rsi), %eax # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_lea_add: ; BROADWELL: # %bb.0: @@ -256,7 +256,7 @@ ; HASWELL-NEXT: # kill: %edi %edi %rdi ; HASWELL-NEXT: leal (%rdi,%rsi), %eax # sched: [1:0.50] ; HASWELL-NEXT: addl $16, %eax # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_lea_add_offset: ; BROADWELL: # %bb.0: @@ -338,7 +338,7 @@ ; HASWELL-NEXT: leal (%rdi,%rsi), %eax # sched: [1:0.50] ; HASWELL-NEXT: addl $-4096, %eax # imm = 0xF000 ; HASWELL-NEXT: # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_lea_add_offset_big: ; BROADWELL: # %bb.0: @@ -411,7 +411,7 @@ ; HASWELL: # %bb.0: ; HASWELL-NEXT: # kill: %edi %edi %rdi ; HASWELL-NEXT: leal (%rdi,%rdi,2), %eax # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_lea_mul: ; BROADWELL: # %bb.0: @@ -478,7 +478,7 @@ ; HASWELL-NEXT: # kill: %edi %edi %rdi ; HASWELL-NEXT: leal (%rdi,%rdi,2), %eax # sched: [1:0.50] ; HASWELL-NEXT: addl $-32, %eax # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_lea_mul_offset: ; BROADWELL: # %bb.0: @@ -551,7 +551,7 @@ ; HASWELL-NEXT: leal (%rdi,%rdi,8), %eax # sched: [1:0.50] ; HASWELL-NEXT: addl $10000, %eax # imm = 0x2710 ; HASWELL-NEXT: # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_lea_mul_offset_big: ; BROADWELL: # %bb.0: @@ -625,7 +625,7 @@ ; HASWELL-NEXT: # kill: %esi %esi %rsi ; HASWELL-NEXT: # kill: %edi %edi %rdi ; HASWELL-NEXT: leal (%rdi,%rsi,2), %eax # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_lea_add_scale: ; BROADWELL: # %bb.0: @@ -702,7 +702,7 @@ ; HASWELL-NEXT: # kill: %edi %edi %rdi ; HASWELL-NEXT: leal (%rdi,%rsi,4), %eax # sched: [1:0.50] ; HASWELL-NEXT: addl $96, %eax # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_lea_add_scale_offset: ; BROADWELL: # %bb.0: @@ -785,7 +785,7 @@ ; HASWELL-NEXT: leal (%rdi,%rsi,8), %eax # sched: [1:0.50] ; HASWELL-NEXT: addl $-1200, %eax # imm = 0xFB50 ; HASWELL-NEXT: # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_lea_add_scale_offset_big: ; BROADWELL: # %bb.0: Index: test/CodeGen/X86/lea64-schedule.ll =================================================================== --- test/CodeGen/X86/lea64-schedule.ll +++ test/CodeGen/X86/lea64-schedule.ll @@ -41,7 +41,7 @@ ; HASWELL-LABEL: test_lea_offset: ; HASWELL: # %bb.0: ; HASWELL-NEXT: leaq -24(%rdi), %rax # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_lea_offset: ; BROADWELL: # %bb.0: @@ -96,7 +96,7 @@ ; HASWELL-LABEL: test_lea_offset_big: ; HASWELL: # %bb.0: ; HASWELL-NEXT: leaq 1024(%rdi), %rax # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_lea_offset_big: ; BROADWELL: # %bb.0: @@ -152,7 +152,7 @@ ; HASWELL-LABEL: test_lea_add: ; HASWELL: # %bb.0: ; HASWELL-NEXT: leaq (%rdi,%rsi), %rax # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_lea_add: ; BROADWELL: # %bb.0: @@ -210,7 +210,7 @@ ; HASWELL: # %bb.0: ; HASWELL-NEXT: leaq (%rdi,%rsi), %rax # sched: [1:0.50] ; HASWELL-NEXT: addq $16, %rax # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_lea_add_offset: ; BROADWELL: # %bb.0: @@ -274,7 +274,7 @@ ; HASWELL-NEXT: leaq (%rdi,%rsi), %rax # sched: [1:0.50] ; HASWELL-NEXT: addq $-4096, %rax # imm = 0xF000 ; HASWELL-NEXT: # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_lea_add_offset_big: ; BROADWELL: # %bb.0: @@ -334,7 +334,7 @@ ; HASWELL-LABEL: test_lea_mul: ; HASWELL: # %bb.0: ; HASWELL-NEXT: leaq (%rdi,%rdi,2), %rax # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_lea_mul: ; BROADWELL: # %bb.0: @@ -392,7 +392,7 @@ ; HASWELL: # %bb.0: ; HASWELL-NEXT: leaq (%rdi,%rdi,2), %rax # sched: [1:0.50] ; HASWELL-NEXT: addq $-32, %rax # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_lea_mul_offset: ; BROADWELL: # %bb.0: @@ -456,7 +456,7 @@ ; HASWELL-NEXT: leaq (%rdi,%rdi,8), %rax # sched: [1:0.50] ; HASWELL-NEXT: addq $10000, %rax # imm = 0x2710 ; HASWELL-NEXT: # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_lea_mul_offset_big: ; BROADWELL: # %bb.0: @@ -516,7 +516,7 @@ ; HASWELL-LABEL: test_lea_add_scale: ; HASWELL: # %bb.0: ; HASWELL-NEXT: leaq (%rdi,%rsi,2), %rax # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_lea_add_scale: ; BROADWELL: # %bb.0: @@ -575,7 +575,7 @@ ; HASWELL: # %bb.0: ; HASWELL-NEXT: leaq (%rdi,%rsi,4), %rax # sched: [1:0.50] ; HASWELL-NEXT: addq $96, %rax # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_lea_add_scale_offset: ; BROADWELL: # %bb.0: @@ -640,7 +640,7 @@ ; HASWELL-NEXT: leaq (%rdi,%rsi,8), %rax # sched: [1:0.50] ; HASWELL-NEXT: addq $-1200, %rax # imm = 0xFB50 ; HASWELL-NEXT: # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_lea_add_scale_offset_big: ; BROADWELL: # %bb.0: Index: test/CodeGen/X86/lzcnt-schedule.ll =================================================================== --- test/CodeGen/X86/lzcnt-schedule.ll +++ test/CodeGen/X86/lzcnt-schedule.ll @@ -18,11 +18,11 @@ ; ; HASWELL-LABEL: test_ctlz_i16: ; HASWELL: # %bb.0: -; HASWELL-NEXT: lzcntw (%rsi), %cx # sched: [3:1.00] +; HASWELL-NEXT: lzcntw (%rsi), %cx # sched: [8:1.00] ; HASWELL-NEXT: lzcntw %di, %ax # sched: [3:1.00] ; HASWELL-NEXT: orl %ecx, %eax # sched: [1:0.25] ; HASWELL-NEXT: # kill: %ax %ax %eax -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_ctlz_i16: ; BROADWELL: # %bb.0: @@ -73,10 +73,10 @@ ; ; HASWELL-LABEL: test_ctlz_i32: ; HASWELL: # %bb.0: -; HASWELL-NEXT: lzcntl (%rsi), %ecx # sched: [3:1.00] +; HASWELL-NEXT: lzcntl (%rsi), %ecx # sched: [8:1.00] ; HASWELL-NEXT: lzcntl %edi, %eax # sched: [3:1.00] ; HASWELL-NEXT: orl %ecx, %eax # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_ctlz_i32: ; BROADWELL: # %bb.0: @@ -123,10 +123,10 @@ ; ; HASWELL-LABEL: test_ctlz_i64: ; HASWELL: # %bb.0: -; HASWELL-NEXT: lzcntq (%rsi), %rcx # sched: [3:1.00] +; HASWELL-NEXT: lzcntq (%rsi), %rcx # sched: [8:1.00] ; HASWELL-NEXT: lzcntq %rdi, %rax # sched: [3:1.00] ; HASWELL-NEXT: orq %rcx, %rax # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_ctlz_i64: ; BROADWELL: # %bb.0: Index: test/CodeGen/X86/mmx-schedule.ll =================================================================== --- test/CodeGen/X86/mmx-schedule.ll +++ test/CodeGen/X86/mmx-schedule.ll @@ -46,11 +46,11 @@ ; ; HASWELL-LABEL: test_cvtpd2pi: ; HASWELL: # %bb.0: -; HASWELL-NEXT: cvtpd2pi (%rdi), %mm0 # sched: [4:1.00] +; HASWELL-NEXT: cvtpd2pi (%rdi), %mm0 # sched: [10:1.00] ; HASWELL-NEXT: cvtpd2pi %xmm0, %mm1 # sched: [4:1.00] ; HASWELL-NEXT: por %mm1, %mm0 # sched: [1:0.33] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_cvtpd2pi: ; BROADWELL: # %bb.0: @@ -132,9 +132,9 @@ ; HASWELL-LABEL: test_cvtpi2pd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: cvtpi2pd %mm0, %xmm0 # sched: [4:1.00] -; HASWELL-NEXT: cvtpi2pd (%rdi), %xmm1 # sched: [4:1.00] +; HASWELL-NEXT: cvtpi2pd (%rdi), %xmm1 # sched: [9:1.00] ; HASWELL-NEXT: vaddpd %xmm1, %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_cvtpi2pd: ; BROADWELL: # %bb.0: @@ -210,9 +210,9 @@ ; HASWELL-LABEL: test_cvtpi2ps: ; HASWELL: # %bb.0: ; HASWELL-NEXT: cvtpi2ps %mm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: cvtpi2ps (%rdi), %xmm1 # sched: [3:1.00] +; HASWELL-NEXT: cvtpi2ps (%rdi), %xmm1 # sched: [8:1.00] ; HASWELL-NEXT: vaddps %xmm1, %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_cvtpi2ps: ; BROADWELL: # %bb.0: @@ -292,10 +292,10 @@ ; HASWELL-LABEL: test_cvtps2pi: ; HASWELL: # %bb.0: ; HASWELL-NEXT: cvtps2pi %xmm0, %mm0 # sched: [4:1.00] -; HASWELL-NEXT: cvtps2pi (%rdi), %mm1 # sched: [3:1.00] +; HASWELL-NEXT: cvtps2pi (%rdi), %mm1 # sched: [8:1.00] ; HASWELL-NEXT: por %mm0, %mm1 # sched: [1:0.33] ; HASWELL-NEXT: movd %mm1, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_cvtps2pi: ; BROADWELL: # %bb.0: @@ -380,11 +380,11 @@ ; ; HASWELL-LABEL: test_cvttpd2pi: ; HASWELL: # %bb.0: -; HASWELL-NEXT: cvttpd2pi (%rdi), %mm0 # sched: [4:1.00] +; HASWELL-NEXT: cvttpd2pi (%rdi), %mm0 # sched: [10:1.00] ; HASWELL-NEXT: cvttpd2pi %xmm0, %mm1 # sched: [4:1.00] ; HASWELL-NEXT: por %mm1, %mm0 # sched: [1:0.33] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_cvttpd2pi: ; BROADWELL: # %bb.0: @@ -470,10 +470,10 @@ ; HASWELL-LABEL: test_cvttps2pi: ; HASWELL: # %bb.0: ; HASWELL-NEXT: cvttps2pi %xmm0, %mm0 # sched: [4:1.00] -; HASWELL-NEXT: cvttps2pi (%rdi), %mm1 # sched: [3:1.00] +; HASWELL-NEXT: cvttps2pi (%rdi), %mm1 # sched: [8:1.00] ; HASWELL-NEXT: por %mm0, %mm1 # sched: [1:0.33] ; HASWELL-NEXT: movd %mm1, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_cvttps2pi: ; BROADWELL: # %bb.0: @@ -547,7 +547,7 @@ ; HASWELL-LABEL: test_emms: ; HASWELL: # %bb.0: ; HASWELL-NEXT: emms # sched: [31:10.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_emms: ; BROADWELL: # %bb.0: @@ -602,7 +602,7 @@ ; HASWELL-LABEL: test_maskmovq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: maskmovq %mm1, %mm0 # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_maskmovq: ; BROADWELL: # %bb.0: @@ -694,15 +694,15 @@ ; HASWELL: # %bb.0: ; HASWELL-NEXT: vmovd %edi, %xmm0 # sched: [1:1.00] ; HASWELL-NEXT: vmovq %xmm0, -{{[0-9]+}}(%rsp) # sched: [1:1.00] -; HASWELL-NEXT: movq -{{[0-9]+}}(%rsp), %mm1 # sched: [1:0.50] -; HASWELL-NEXT: vmovss {{.*#+}} xmm0 = mem[0],zero,zero,zero sched: [1:0.50] +; HASWELL-NEXT: movq -{{[0-9]+}}(%rsp), %mm1 # sched: [5:0.50] +; HASWELL-NEXT: vmovss {{.*#+}} xmm0 = mem[0],zero,zero,zero sched: [5:0.50] ; HASWELL-NEXT: vmovlps %xmm0, -{{[0-9]+}}(%rsp) # sched: [1:1.00] -; HASWELL-NEXT: paddd -{{[0-9]+}}(%rsp), %mm1 # sched: [1:0.50] +; HASWELL-NEXT: paddd -{{[0-9]+}}(%rsp), %mm1 # sched: [6:0.50] ; HASWELL-NEXT: paddd %mm1, %mm0 # sched: [1:0.50] ; HASWELL-NEXT: movd %mm1, %ecx # sched: [1:1.00] ; HASWELL-NEXT: movd %mm0, %eax # sched: [1:1.00] ; HASWELL-NEXT: movl %ecx, (%rsi) # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_movd: ; BROADWELL: # %bb.0: @@ -822,7 +822,7 @@ ; HASWELL-NEXT: movdq2q %xmm0, %mm0 # sched: [2:0.67] ; HASWELL-NEXT: paddd %mm0, %mm0 # sched: [1:0.50] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_movdq2q: ; BROADWELL: # %bb.0: @@ -889,7 +889,7 @@ ; HASWELL-LABEL: test_movntq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: movntq %mm0, (%rdi) # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_movntq: ; BROADWELL: # %bb.0: @@ -953,10 +953,10 @@ ; ; HASWELL-LABEL: test_movq: ; HASWELL: # %bb.0: -; HASWELL-NEXT: movq (%rdi), %mm0 # sched: [1:0.50] +; HASWELL-NEXT: movq (%rdi), %mm0 # sched: [5:0.50] ; HASWELL-NEXT: paddd %mm0, %mm0 # sched: [1:0.50] ; HASWELL-NEXT: movq %mm0, (%rdi) # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_movq: ; BROADWELL: # %bb.0: @@ -1024,7 +1024,7 @@ ; HASWELL-LABEL: test_movq2dq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: movq2dq %mm0, %xmm0 # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_movq2dq: ; BROADWELL: # %bb.0: @@ -1086,10 +1086,10 @@ ; ; HASWELL-LABEL: test_pabsb: ; HASWELL: # %bb.0: -; HASWELL-NEXT: pabsb (%rdi), %mm0 # sched: [1:0.50] +; HASWELL-NEXT: pabsb (%rdi), %mm0 # sched: [6:0.50] ; HASWELL-NEXT: pabsb %mm0, %mm0 # sched: [1:0.50] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pabsb: ; BROADWELL: # %bb.0: @@ -1164,10 +1164,10 @@ ; ; HASWELL-LABEL: test_pabsd: ; HASWELL: # %bb.0: -; HASWELL-NEXT: pabsd (%rdi), %mm0 # sched: [1:0.50] +; HASWELL-NEXT: pabsd (%rdi), %mm0 # sched: [6:0.50] ; HASWELL-NEXT: pabsd %mm0, %mm0 # sched: [1:0.50] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pabsd: ; BROADWELL: # %bb.0: @@ -1242,10 +1242,10 @@ ; ; HASWELL-LABEL: test_pabsw: ; HASWELL: # %bb.0: -; HASWELL-NEXT: pabsw (%rdi), %mm0 # sched: [1:0.50] +; HASWELL-NEXT: pabsw (%rdi), %mm0 # sched: [6:0.50] ; HASWELL-NEXT: pabsw %mm0, %mm0 # sched: [1:0.50] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pabsw: ; BROADWELL: # %bb.0: @@ -1321,9 +1321,9 @@ ; HASWELL-LABEL: test_packssdw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: packssdw %mm1, %mm0 # sched: [3:2.00] -; HASWELL-NEXT: packssdw (%rdi), %mm0 # sched: [2:2.00] +; HASWELL-NEXT: packssdw (%rdi), %mm0 # sched: [7:2.00] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_packssdw: ; BROADWELL: # %bb.0: @@ -1399,9 +1399,9 @@ ; HASWELL-LABEL: test_packsswb: ; HASWELL: # %bb.0: ; HASWELL-NEXT: packsswb %mm1, %mm0 # sched: [3:2.00] -; HASWELL-NEXT: packsswb (%rdi), %mm0 # sched: [2:2.00] +; HASWELL-NEXT: packsswb (%rdi), %mm0 # sched: [7:2.00] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_packsswb: ; BROADWELL: # %bb.0: @@ -1477,9 +1477,9 @@ ; HASWELL-LABEL: test_packuswb: ; HASWELL: # %bb.0: ; HASWELL-NEXT: packuswb %mm1, %mm0 # sched: [3:2.00] -; HASWELL-NEXT: packuswb (%rdi), %mm0 # sched: [2:2.00] +; HASWELL-NEXT: packuswb (%rdi), %mm0 # sched: [7:2.00] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_packuswb: ; BROADWELL: # %bb.0: @@ -1555,9 +1555,9 @@ ; HASWELL-LABEL: test_paddb: ; HASWELL: # %bb.0: ; HASWELL-NEXT: paddb %mm1, %mm0 # sched: [1:0.50] -; HASWELL-NEXT: paddb (%rdi), %mm0 # sched: [1:0.50] +; HASWELL-NEXT: paddb (%rdi), %mm0 # sched: [6:0.50] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_paddb: ; BROADWELL: # %bb.0: @@ -1633,9 +1633,9 @@ ; HASWELL-LABEL: test_paddd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: paddd %mm1, %mm0 # sched: [1:0.50] -; HASWELL-NEXT: paddd (%rdi), %mm0 # sched: [1:0.50] +; HASWELL-NEXT: paddd (%rdi), %mm0 # sched: [6:0.50] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_paddd: ; BROADWELL: # %bb.0: @@ -1711,9 +1711,9 @@ ; HASWELL-LABEL: test_paddq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: paddq %mm1, %mm0 # sched: [1:0.50] -; HASWELL-NEXT: paddq (%rdi), %mm0 # sched: [1:0.50] +; HASWELL-NEXT: paddq (%rdi), %mm0 # sched: [6:0.50] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_paddq: ; BROADWELL: # %bb.0: @@ -1789,9 +1789,9 @@ ; HASWELL-LABEL: test_paddsb: ; HASWELL: # %bb.0: ; HASWELL-NEXT: paddsb %mm1, %mm0 # sched: [1:0.50] -; HASWELL-NEXT: paddsb (%rdi), %mm0 # sched: [1:0.50] +; HASWELL-NEXT: paddsb (%rdi), %mm0 # sched: [6:0.50] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_paddsb: ; BROADWELL: # %bb.0: @@ -1867,9 +1867,9 @@ ; HASWELL-LABEL: test_paddsw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: paddsw %mm1, %mm0 # sched: [1:0.50] -; HASWELL-NEXT: paddsw (%rdi), %mm0 # sched: [1:0.50] +; HASWELL-NEXT: paddsw (%rdi), %mm0 # sched: [6:0.50] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_paddsw: ; BROADWELL: # %bb.0: @@ -1945,9 +1945,9 @@ ; HASWELL-LABEL: test_paddusb: ; HASWELL: # %bb.0: ; HASWELL-NEXT: paddusb %mm1, %mm0 # sched: [1:0.50] -; HASWELL-NEXT: paddusb (%rdi), %mm0 # sched: [1:0.50] +; HASWELL-NEXT: paddusb (%rdi), %mm0 # sched: [6:0.50] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_paddusb: ; BROADWELL: # %bb.0: @@ -2023,9 +2023,9 @@ ; HASWELL-LABEL: test_paddusw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: paddusw %mm1, %mm0 # sched: [1:0.50] -; HASWELL-NEXT: paddusw (%rdi), %mm0 # sched: [1:0.50] +; HASWELL-NEXT: paddusw (%rdi), %mm0 # sched: [6:0.50] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_paddusw: ; BROADWELL: # %bb.0: @@ -2101,9 +2101,9 @@ ; HASWELL-LABEL: test_paddw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: paddw %mm1, %mm0 # sched: [1:0.50] -; HASWELL-NEXT: paddw (%rdi), %mm0 # sched: [1:0.50] +; HASWELL-NEXT: paddw (%rdi), %mm0 # sched: [6:0.50] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_paddw: ; BROADWELL: # %bb.0: @@ -2179,9 +2179,9 @@ ; HASWELL-LABEL: test_palignr: ; HASWELL: # %bb.0: ; HASWELL-NEXT: palignr $1, %mm1, %mm0 # sched: [1:1.00] -; HASWELL-NEXT: palignr $1, (%rdi), %mm0 # sched: [1:1.00] +; HASWELL-NEXT: palignr $1, (%rdi), %mm0 # sched: [6:1.00] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_palignr: ; BROADWELL: # %bb.0: @@ -2257,9 +2257,9 @@ ; HASWELL-LABEL: test_pand: ; HASWELL: # %bb.0: ; HASWELL-NEXT: pand %mm1, %mm0 # sched: [1:0.33] -; HASWELL-NEXT: pand (%rdi), %mm0 # sched: [1:0.50] +; HASWELL-NEXT: pand (%rdi), %mm0 # sched: [6:0.50] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pand: ; BROADWELL: # %bb.0: @@ -2335,9 +2335,9 @@ ; HASWELL-LABEL: test_pandn: ; HASWELL: # %bb.0: ; HASWELL-NEXT: pandn %mm1, %mm0 # sched: [1:0.33] -; HASWELL-NEXT: pandn (%rdi), %mm0 # sched: [1:0.50] +; HASWELL-NEXT: pandn (%rdi), %mm0 # sched: [6:0.50] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pandn: ; BROADWELL: # %bb.0: @@ -2413,9 +2413,9 @@ ; HASWELL-LABEL: test_pavgb: ; HASWELL: # %bb.0: ; HASWELL-NEXT: pavgb %mm1, %mm0 # sched: [1:0.50] -; HASWELL-NEXT: pavgb (%rdi), %mm0 # sched: [1:0.50] +; HASWELL-NEXT: pavgb (%rdi), %mm0 # sched: [6:0.50] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pavgb: ; BROADWELL: # %bb.0: @@ -2491,9 +2491,9 @@ ; HASWELL-LABEL: test_pavgw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: pavgw %mm1, %mm0 # sched: [1:0.50] -; HASWELL-NEXT: pavgw (%rdi), %mm0 # sched: [1:0.50] +; HASWELL-NEXT: pavgw (%rdi), %mm0 # sched: [6:0.50] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pavgw: ; BROADWELL: # %bb.0: @@ -2569,9 +2569,9 @@ ; HASWELL-LABEL: test_pcmpeqb: ; HASWELL: # %bb.0: ; HASWELL-NEXT: pcmpeqb %mm1, %mm0 # sched: [1:0.50] -; HASWELL-NEXT: pcmpeqb (%rdi), %mm0 # sched: [1:0.50] +; HASWELL-NEXT: pcmpeqb (%rdi), %mm0 # sched: [6:0.50] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pcmpeqb: ; BROADWELL: # %bb.0: @@ -2647,9 +2647,9 @@ ; HASWELL-LABEL: test_pcmpeqd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: pcmpeqd %mm1, %mm0 # sched: [1:0.50] -; HASWELL-NEXT: pcmpeqd (%rdi), %mm0 # sched: [1:0.50] +; HASWELL-NEXT: pcmpeqd (%rdi), %mm0 # sched: [6:0.50] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pcmpeqd: ; BROADWELL: # %bb.0: @@ -2725,9 +2725,9 @@ ; HASWELL-LABEL: test_pcmpeqw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: pcmpeqw %mm1, %mm0 # sched: [1:0.50] -; HASWELL-NEXT: pcmpeqw (%rdi), %mm0 # sched: [1:0.50] +; HASWELL-NEXT: pcmpeqw (%rdi), %mm0 # sched: [6:0.50] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pcmpeqw: ; BROADWELL: # %bb.0: @@ -2803,9 +2803,9 @@ ; HASWELL-LABEL: test_pcmpgtb: ; HASWELL: # %bb.0: ; HASWELL-NEXT: pcmpgtb %mm1, %mm0 # sched: [1:0.50] -; HASWELL-NEXT: pcmpgtb (%rdi), %mm0 # sched: [1:0.50] +; HASWELL-NEXT: pcmpgtb (%rdi), %mm0 # sched: [6:0.50] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pcmpgtb: ; BROADWELL: # %bb.0: @@ -2881,9 +2881,9 @@ ; HASWELL-LABEL: test_pcmpgtd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: pcmpgtd %mm1, %mm0 # sched: [1:0.50] -; HASWELL-NEXT: pcmpgtd (%rdi), %mm0 # sched: [1:0.50] +; HASWELL-NEXT: pcmpgtd (%rdi), %mm0 # sched: [6:0.50] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pcmpgtd: ; BROADWELL: # %bb.0: @@ -2959,9 +2959,9 @@ ; HASWELL-LABEL: test_pcmpgtw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: pcmpgtw %mm1, %mm0 # sched: [1:0.50] -; HASWELL-NEXT: pcmpgtw (%rdi), %mm0 # sched: [1:0.50] +; HASWELL-NEXT: pcmpgtw (%rdi), %mm0 # sched: [6:0.50] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pcmpgtw: ; BROADWELL: # %bb.0: @@ -3029,7 +3029,7 @@ ; HASWELL-LABEL: test_pextrw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: pextrw $0, %mm0, %eax # sched: [2:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pextrw: ; BROADWELL: # %bb.0: @@ -3092,9 +3092,9 @@ ; HASWELL-LABEL: test_phaddd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: phaddd %mm1, %mm0 # sched: [3:2.00] -; HASWELL-NEXT: phaddd (%rdi), %mm0 # sched: [3:2.00] +; HASWELL-NEXT: phaddd (%rdi), %mm0 # sched: [8:2.00] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_phaddd: ; BROADWELL: # %bb.0: @@ -3170,9 +3170,9 @@ ; HASWELL-LABEL: test_phaddsw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: phaddsw %mm1, %mm0 # sched: [3:2.00] -; HASWELL-NEXT: phaddsw (%rdi), %mm0 # sched: [3:2.00] +; HASWELL-NEXT: phaddsw (%rdi), %mm0 # sched: [8:2.00] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_phaddsw: ; BROADWELL: # %bb.0: @@ -3248,9 +3248,9 @@ ; HASWELL-LABEL: test_phaddw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: phaddw %mm1, %mm0 # sched: [3:2.00] -; HASWELL-NEXT: phaddw (%rdi), %mm0 # sched: [3:2.00] +; HASWELL-NEXT: phaddw (%rdi), %mm0 # sched: [8:2.00] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_phaddw: ; BROADWELL: # %bb.0: @@ -3326,9 +3326,9 @@ ; HASWELL-LABEL: test_phsubd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: phsubd %mm1, %mm0 # sched: [3:2.00] -; HASWELL-NEXT: phsubd (%rdi), %mm0 # sched: [3:2.00] +; HASWELL-NEXT: phsubd (%rdi), %mm0 # sched: [8:2.00] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_phsubd: ; BROADWELL: # %bb.0: @@ -3404,9 +3404,9 @@ ; HASWELL-LABEL: test_phsubsw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: phsubsw %mm1, %mm0 # sched: [3:2.00] -; HASWELL-NEXT: phsubsw (%rdi), %mm0 # sched: [3:2.00] +; HASWELL-NEXT: phsubsw (%rdi), %mm0 # sched: [8:2.00] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_phsubsw: ; BROADWELL: # %bb.0: @@ -3482,9 +3482,9 @@ ; HASWELL-LABEL: test_phsubw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: phsubw %mm1, %mm0 # sched: [3:2.00] -; HASWELL-NEXT: phsubw (%rdi), %mm0 # sched: [3:2.00] +; HASWELL-NEXT: phsubw (%rdi), %mm0 # sched: [8:2.00] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_phsubw: ; BROADWELL: # %bb.0: @@ -3564,10 +3564,10 @@ ; HASWELL-LABEL: test_pinsrw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: pinsrw $0, %edi, %mm0 # sched: [2:2.00] -; HASWELL-NEXT: movswl (%rsi), %eax # sched: [4:0.50] +; HASWELL-NEXT: movswl (%rsi), %eax # sched: [5:0.50] ; HASWELL-NEXT: pinsrw $1, %eax, %mm0 # sched: [2:2.00] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pinsrw: ; BROADWELL: # %bb.0: @@ -3649,9 +3649,9 @@ ; HASWELL-LABEL: test_pmaddwd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: pmaddwd %mm1, %mm0 # sched: [5:1.00] -; HASWELL-NEXT: pmaddwd (%rdi), %mm0 # sched: [5:1.00] +; HASWELL-NEXT: pmaddwd (%rdi), %mm0 # sched: [10:1.00] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmaddwd: ; BROADWELL: # %bb.0: @@ -3727,9 +3727,9 @@ ; HASWELL-LABEL: test_pmaddubsw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: pmaddubsw %mm1, %mm0 # sched: [5:1.00] -; HASWELL-NEXT: pmaddubsw (%rdi), %mm0 # sched: [5:1.00] +; HASWELL-NEXT: pmaddubsw (%rdi), %mm0 # sched: [10:1.00] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmaddubsw: ; BROADWELL: # %bb.0: @@ -3805,9 +3805,9 @@ ; HASWELL-LABEL: test_pmaxsw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: pmaxsw %mm1, %mm0 # sched: [1:0.50] -; HASWELL-NEXT: pmaxsw (%rdi), %mm0 # sched: [1:0.50] +; HASWELL-NEXT: pmaxsw (%rdi), %mm0 # sched: [6:0.50] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmaxsw: ; BROADWELL: # %bb.0: @@ -3883,9 +3883,9 @@ ; HASWELL-LABEL: test_pmaxub: ; HASWELL: # %bb.0: ; HASWELL-NEXT: pmaxub %mm1, %mm0 # sched: [1:0.50] -; HASWELL-NEXT: pmaxub (%rdi), %mm0 # sched: [1:0.50] +; HASWELL-NEXT: pmaxub (%rdi), %mm0 # sched: [6:0.50] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmaxub: ; BROADWELL: # %bb.0: @@ -3961,9 +3961,9 @@ ; HASWELL-LABEL: test_pminsw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: pminsw %mm1, %mm0 # sched: [1:0.50] -; HASWELL-NEXT: pminsw (%rdi), %mm0 # sched: [1:0.50] +; HASWELL-NEXT: pminsw (%rdi), %mm0 # sched: [6:0.50] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pminsw: ; BROADWELL: # %bb.0: @@ -4039,9 +4039,9 @@ ; HASWELL-LABEL: test_pminub: ; HASWELL: # %bb.0: ; HASWELL-NEXT: pminub %mm1, %mm0 # sched: [1:0.50] -; HASWELL-NEXT: pminub (%rdi), %mm0 # sched: [1:0.50] +; HASWELL-NEXT: pminub (%rdi), %mm0 # sched: [6:0.50] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pminub: ; BROADWELL: # %bb.0: @@ -4108,8 +4108,8 @@ ; ; HASWELL-LABEL: test_pmovmskb: ; HASWELL: # %bb.0: -; HASWELL-NEXT: pmovmskb %mm0, %eax # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: pmovmskb %mm0, %eax # sched: [1:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmovmskb: ; BROADWELL: # %bb.0: @@ -4172,9 +4172,9 @@ ; HASWELL-LABEL: test_pmulhrsw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: pmulhrsw %mm1, %mm0 # sched: [5:1.00] -; HASWELL-NEXT: pmulhrsw (%rdi), %mm0 # sched: [5:1.00] +; HASWELL-NEXT: pmulhrsw (%rdi), %mm0 # sched: [10:1.00] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmulhrsw: ; BROADWELL: # %bb.0: @@ -4250,9 +4250,9 @@ ; HASWELL-LABEL: test_pmulhw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: pmulhw %mm1, %mm0 # sched: [5:1.00] -; HASWELL-NEXT: pmulhw (%rdi), %mm0 # sched: [5:1.00] +; HASWELL-NEXT: pmulhw (%rdi), %mm0 # sched: [10:1.00] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmulhw: ; BROADWELL: # %bb.0: @@ -4328,9 +4328,9 @@ ; HASWELL-LABEL: test_pmulhuw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: pmulhuw %mm1, %mm0 # sched: [5:1.00] -; HASWELL-NEXT: pmulhuw (%rdi), %mm0 # sched: [5:1.00] +; HASWELL-NEXT: pmulhuw (%rdi), %mm0 # sched: [10:1.00] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmulhuw: ; BROADWELL: # %bb.0: @@ -4406,9 +4406,9 @@ ; HASWELL-LABEL: test_pmullw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: pmullw %mm1, %mm0 # sched: [5:1.00] -; HASWELL-NEXT: pmullw (%rdi), %mm0 # sched: [5:1.00] +; HASWELL-NEXT: pmullw (%rdi), %mm0 # sched: [10:1.00] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmullw: ; BROADWELL: # %bb.0: @@ -4484,9 +4484,9 @@ ; HASWELL-LABEL: test_pmuludq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: pmuludq %mm1, %mm0 # sched: [5:1.00] -; HASWELL-NEXT: pmuludq (%rdi), %mm0 # sched: [5:1.00] +; HASWELL-NEXT: pmuludq (%rdi), %mm0 # sched: [10:1.00] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmuludq: ; BROADWELL: # %bb.0: @@ -4562,9 +4562,9 @@ ; HASWELL-LABEL: test_por: ; HASWELL: # %bb.0: ; HASWELL-NEXT: por %mm1, %mm0 # sched: [1:0.33] -; HASWELL-NEXT: por (%rdi), %mm0 # sched: [1:0.50] +; HASWELL-NEXT: por (%rdi), %mm0 # sched: [6:0.50] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_por: ; BROADWELL: # %bb.0: @@ -4640,9 +4640,9 @@ ; HASWELL-LABEL: test_psadbw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: psadbw %mm1, %mm0 # sched: [5:1.00] -; HASWELL-NEXT: psadbw (%rdi), %mm0 # sched: [5:1.00] +; HASWELL-NEXT: psadbw (%rdi), %mm0 # sched: [10:1.00] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_psadbw: ; BROADWELL: # %bb.0: @@ -4718,9 +4718,9 @@ ; HASWELL-LABEL: test_pshufb: ; HASWELL: # %bb.0: ; HASWELL-NEXT: pshufb %mm1, %mm0 # sched: [1:1.00] -; HASWELL-NEXT: pshufb (%rdi), %mm0 # sched: [1:1.00] +; HASWELL-NEXT: pshufb (%rdi), %mm0 # sched: [6:1.00] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pshufb: ; BROADWELL: # %bb.0: @@ -4795,10 +4795,10 @@ ; ; HASWELL-LABEL: test_pshufw: ; HASWELL: # %bb.0: -; HASWELL-NEXT: pshufw $0, (%rdi), %mm0 # mm0 = mem[0,0,0,0] sched: [1:1.00] +; HASWELL-NEXT: pshufw $0, (%rdi), %mm0 # mm0 = mem[0,0,0,0] sched: [6:1.00] ; HASWELL-NEXT: pshufw $0, %mm0, %mm0 # mm0 = mm0[0,0,0,0] sched: [1:1.00] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pshufw: ; BROADWELL: # %bb.0: @@ -4874,9 +4874,9 @@ ; HASWELL-LABEL: test_psignb: ; HASWELL: # %bb.0: ; HASWELL-NEXT: psignb %mm1, %mm0 # sched: [1:0.50] -; HASWELL-NEXT: psignb (%rdi), %mm0 # sched: [1:0.50] +; HASWELL-NEXT: psignb (%rdi), %mm0 # sched: [6:0.50] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_psignb: ; BROADWELL: # %bb.0: @@ -4952,9 +4952,9 @@ ; HASWELL-LABEL: test_psignd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: psignd %mm1, %mm0 # sched: [1:0.50] -; HASWELL-NEXT: psignd (%rdi), %mm0 # sched: [1:0.50] +; HASWELL-NEXT: psignd (%rdi), %mm0 # sched: [6:0.50] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_psignd: ; BROADWELL: # %bb.0: @@ -5030,9 +5030,9 @@ ; HASWELL-LABEL: test_psignw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: psignw %mm1, %mm0 # sched: [1:0.50] -; HASWELL-NEXT: psignw (%rdi), %mm0 # sched: [1:0.50] +; HASWELL-NEXT: psignw (%rdi), %mm0 # sched: [6:0.50] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_psignw: ; BROADWELL: # %bb.0: @@ -5112,10 +5112,10 @@ ; HASWELL-LABEL: test_pslld: ; HASWELL: # %bb.0: ; HASWELL-NEXT: pslld %mm1, %mm0 # sched: [1:1.00] -; HASWELL-NEXT: pslld (%rdi), %mm0 # sched: [1:1.00] +; HASWELL-NEXT: pslld (%rdi), %mm0 # sched: [6:1.00] ; HASWELL-NEXT: pslld $7, %mm0 # sched: [1:1.00] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pslld: ; BROADWELL: # %bb.0: @@ -5202,10 +5202,10 @@ ; HASWELL-LABEL: test_psllq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: psllq %mm1, %mm0 # sched: [1:1.00] -; HASWELL-NEXT: psllq (%rdi), %mm0 # sched: [1:1.00] +; HASWELL-NEXT: psllq (%rdi), %mm0 # sched: [6:1.00] ; HASWELL-NEXT: psllq $7, %mm0 # sched: [1:1.00] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_psllq: ; BROADWELL: # %bb.0: @@ -5292,10 +5292,10 @@ ; HASWELL-LABEL: test_psllw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: psllw %mm1, %mm0 # sched: [1:1.00] -; HASWELL-NEXT: psllw (%rdi), %mm0 # sched: [1:1.00] +; HASWELL-NEXT: psllw (%rdi), %mm0 # sched: [6:1.00] ; HASWELL-NEXT: psllw $7, %mm0 # sched: [1:1.00] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_psllw: ; BROADWELL: # %bb.0: @@ -5382,10 +5382,10 @@ ; HASWELL-LABEL: test_psrad: ; HASWELL: # %bb.0: ; HASWELL-NEXT: psrad %mm1, %mm0 # sched: [1:1.00] -; HASWELL-NEXT: psrad (%rdi), %mm0 # sched: [1:1.00] +; HASWELL-NEXT: psrad (%rdi), %mm0 # sched: [6:1.00] ; HASWELL-NEXT: psrad $7, %mm0 # sched: [1:1.00] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_psrad: ; BROADWELL: # %bb.0: @@ -5472,10 +5472,10 @@ ; HASWELL-LABEL: test_psraw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: psraw %mm1, %mm0 # sched: [1:1.00] -; HASWELL-NEXT: psraw (%rdi), %mm0 # sched: [1:1.00] +; HASWELL-NEXT: psraw (%rdi), %mm0 # sched: [6:1.00] ; HASWELL-NEXT: psraw $7, %mm0 # sched: [1:1.00] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_psraw: ; BROADWELL: # %bb.0: @@ -5562,10 +5562,10 @@ ; HASWELL-LABEL: test_psrld: ; HASWELL: # %bb.0: ; HASWELL-NEXT: psrld %mm1, %mm0 # sched: [1:1.00] -; HASWELL-NEXT: psrld (%rdi), %mm0 # sched: [1:1.00] +; HASWELL-NEXT: psrld (%rdi), %mm0 # sched: [6:1.00] ; HASWELL-NEXT: psrld $7, %mm0 # sched: [1:1.00] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_psrld: ; BROADWELL: # %bb.0: @@ -5652,10 +5652,10 @@ ; HASWELL-LABEL: test_psrlq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: psrlq %mm1, %mm0 # sched: [1:1.00] -; HASWELL-NEXT: psrlq (%rdi), %mm0 # sched: [1:1.00] +; HASWELL-NEXT: psrlq (%rdi), %mm0 # sched: [6:1.00] ; HASWELL-NEXT: psrlq $7, %mm0 # sched: [1:1.00] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_psrlq: ; BROADWELL: # %bb.0: @@ -5742,10 +5742,10 @@ ; HASWELL-LABEL: test_psrlw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: psrlw %mm1, %mm0 # sched: [1:1.00] -; HASWELL-NEXT: psrlw (%rdi), %mm0 # sched: [1:1.00] +; HASWELL-NEXT: psrlw (%rdi), %mm0 # sched: [6:1.00] ; HASWELL-NEXT: psrlw $7, %mm0 # sched: [1:1.00] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_psrlw: ; BROADWELL: # %bb.0: @@ -5828,9 +5828,9 @@ ; HASWELL-LABEL: test_psubb: ; HASWELL: # %bb.0: ; HASWELL-NEXT: psubb %mm1, %mm0 # sched: [1:0.50] -; HASWELL-NEXT: psubb (%rdi), %mm0 # sched: [1:0.50] +; HASWELL-NEXT: psubb (%rdi), %mm0 # sched: [6:0.50] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_psubb: ; BROADWELL: # %bb.0: @@ -5906,9 +5906,9 @@ ; HASWELL-LABEL: test_psubd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: psubd %mm1, %mm0 # sched: [1:0.50] -; HASWELL-NEXT: psubd (%rdi), %mm0 # sched: [1:0.50] +; HASWELL-NEXT: psubd (%rdi), %mm0 # sched: [6:0.50] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_psubd: ; BROADWELL: # %bb.0: @@ -5984,9 +5984,9 @@ ; HASWELL-LABEL: test_psubq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: psubq %mm1, %mm0 # sched: [1:0.50] -; HASWELL-NEXT: psubq (%rdi), %mm0 # sched: [1:0.50] +; HASWELL-NEXT: psubq (%rdi), %mm0 # sched: [6:0.50] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_psubq: ; BROADWELL: # %bb.0: @@ -6062,9 +6062,9 @@ ; HASWELL-LABEL: test_psubsb: ; HASWELL: # %bb.0: ; HASWELL-NEXT: psubsb %mm1, %mm0 # sched: [1:0.50] -; HASWELL-NEXT: psubsb (%rdi), %mm0 # sched: [1:0.50] +; HASWELL-NEXT: psubsb (%rdi), %mm0 # sched: [6:0.50] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_psubsb: ; BROADWELL: # %bb.0: @@ -6140,9 +6140,9 @@ ; HASWELL-LABEL: test_psubsw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: psubsw %mm1, %mm0 # sched: [1:0.50] -; HASWELL-NEXT: psubsw (%rdi), %mm0 # sched: [1:0.50] +; HASWELL-NEXT: psubsw (%rdi), %mm0 # sched: [6:0.50] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_psubsw: ; BROADWELL: # %bb.0: @@ -6218,9 +6218,9 @@ ; HASWELL-LABEL: test_psubusb: ; HASWELL: # %bb.0: ; HASWELL-NEXT: psubusb %mm1, %mm0 # sched: [1:0.50] -; HASWELL-NEXT: psubusb (%rdi), %mm0 # sched: [1:0.50] +; HASWELL-NEXT: psubusb (%rdi), %mm0 # sched: [6:0.50] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_psubusb: ; BROADWELL: # %bb.0: @@ -6296,9 +6296,9 @@ ; HASWELL-LABEL: test_psubusw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: psubusw %mm1, %mm0 # sched: [1:0.50] -; HASWELL-NEXT: psubusw (%rdi), %mm0 # sched: [1:0.50] +; HASWELL-NEXT: psubusw (%rdi), %mm0 # sched: [6:0.50] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_psubusw: ; BROADWELL: # %bb.0: @@ -6374,9 +6374,9 @@ ; HASWELL-LABEL: test_psubw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: psubw %mm1, %mm0 # sched: [1:0.50] -; HASWELL-NEXT: psubw (%rdi), %mm0 # sched: [1:0.50] +; HASWELL-NEXT: psubw (%rdi), %mm0 # sched: [6:0.50] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_psubw: ; BROADWELL: # %bb.0: @@ -6452,9 +6452,9 @@ ; HASWELL-LABEL: test_punpckhbw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: punpckhbw %mm1, %mm0 # mm0 = mm0[4],mm1[4],mm0[5],mm1[5],mm0[6],mm1[6],mm0[7],mm1[7] sched: [1:1.00] -; HASWELL-NEXT: punpckhbw (%rdi), %mm0 # mm0 = mm0[4],mem[4],mm0[5],mem[5],mm0[6],mem[6],mm0[7],mem[7] sched: [1:1.00] +; HASWELL-NEXT: punpckhbw (%rdi), %mm0 # mm0 = mm0[4],mem[4],mm0[5],mem[5],mm0[6],mem[6],mm0[7],mem[7] sched: [6:1.00] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_punpckhbw: ; BROADWELL: # %bb.0: @@ -6530,9 +6530,9 @@ ; HASWELL-LABEL: test_punpckhdq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: punpckhdq %mm1, %mm0 # mm0 = mm0[1],mm1[1] sched: [1:1.00] -; HASWELL-NEXT: punpckhdq (%rdi), %mm0 # mm0 = mm0[1],mem[1] sched: [1:1.00] +; HASWELL-NEXT: punpckhdq (%rdi), %mm0 # mm0 = mm0[1],mem[1] sched: [6:1.00] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_punpckhdq: ; BROADWELL: # %bb.0: @@ -6608,9 +6608,9 @@ ; HASWELL-LABEL: test_punpckhwd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: punpckhwd %mm1, %mm0 # mm0 = mm0[2],mm1[2],mm0[3],mm1[3] sched: [1:1.00] -; HASWELL-NEXT: punpckhwd (%rdi), %mm0 # mm0 = mm0[2],mem[2],mm0[3],mem[3] sched: [1:1.00] +; HASWELL-NEXT: punpckhwd (%rdi), %mm0 # mm0 = mm0[2],mem[2],mm0[3],mem[3] sched: [6:1.00] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_punpckhwd: ; BROADWELL: # %bb.0: @@ -6686,9 +6686,9 @@ ; HASWELL-LABEL: test_punpcklbw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: punpcklbw %mm1, %mm0 # mm0 = mm0[0],mm1[0],mm0[1],mm1[1],mm0[2],mm1[2],mm0[3],mm1[3] sched: [1:1.00] -; HASWELL-NEXT: punpcklbw (%rdi), %mm0 # mm0 = mm0[0],mem[0],mm0[1],mem[1],mm0[2],mem[2],mm0[3],mem[3] sched: [1:1.00] +; HASWELL-NEXT: punpcklbw (%rdi), %mm0 # mm0 = mm0[0],mem[0],mm0[1],mem[1],mm0[2],mem[2],mm0[3],mem[3] sched: [6:1.00] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_punpcklbw: ; BROADWELL: # %bb.0: @@ -6764,9 +6764,9 @@ ; HASWELL-LABEL: test_punpckldq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: punpckldq %mm1, %mm0 # mm0 = mm0[0],mm1[0] sched: [1:1.00] -; HASWELL-NEXT: punpckldq (%rdi), %mm0 # mm0 = mm0[0],mem[0] sched: [1:1.00] +; HASWELL-NEXT: punpckldq (%rdi), %mm0 # mm0 = mm0[0],mem[0] sched: [6:1.00] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_punpckldq: ; BROADWELL: # %bb.0: @@ -6842,9 +6842,9 @@ ; HASWELL-LABEL: test_punpcklwd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: punpcklwd %mm1, %mm0 # mm0 = mm0[0],mm1[0],mm0[1],mm1[1] sched: [1:1.00] -; HASWELL-NEXT: punpcklwd (%rdi), %mm0 # mm0 = mm0[0],mem[0],mm0[1],mem[1] sched: [1:1.00] +; HASWELL-NEXT: punpcklwd (%rdi), %mm0 # mm0 = mm0[0],mem[0],mm0[1],mem[1] sched: [6:1.00] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_punpcklwd: ; BROADWELL: # %bb.0: @@ -6920,9 +6920,9 @@ ; HASWELL-LABEL: test_pxor: ; HASWELL: # %bb.0: ; HASWELL-NEXT: pxor %mm1, %mm0 # sched: [1:0.33] -; HASWELL-NEXT: pxor (%rdi), %mm0 # sched: [1:0.50] +; HASWELL-NEXT: pxor (%rdi), %mm0 # sched: [6:0.50] ; HASWELL-NEXT: movd %mm0, %rax # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pxor: ; BROADWELL: # %bb.0: Index: test/CodeGen/X86/movbe-schedule.ll =================================================================== --- test/CodeGen/X86/movbe-schedule.ll +++ test/CodeGen/X86/movbe-schedule.ll @@ -34,9 +34,9 @@ ; ; HASWELL-LABEL: test_movbe_i16: ; HASWELL: # %bb.0: -; HASWELL-NEXT: movbew (%rdi), %ax # sched: [1:0.50] -; HASWELL-NEXT: movbew %si, (%rdx) # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: movbew (%rdi), %ax # sched: [6:0.50] +; HASWELL-NEXT: movbew %si, (%rdx) # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_movbe_i16: ; BROADWELL: # %bb.0: @@ -94,9 +94,9 @@ ; ; HASWELL-LABEL: test_movbe_i32: ; HASWELL: # %bb.0: -; HASWELL-NEXT: movbel (%rdi), %eax # sched: [1:0.50] -; HASWELL-NEXT: movbel %esi, (%rdx) # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: movbel (%rdi), %eax # sched: [6:0.50] +; HASWELL-NEXT: movbel %esi, (%rdx) # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_movbe_i32: ; BROADWELL: # %bb.0: @@ -154,9 +154,9 @@ ; ; HASWELL-LABEL: test_movbe_i64: ; HASWELL: # %bb.0: -; HASWELL-NEXT: movbeq (%rdi), %rax # sched: [1:0.50] -; HASWELL-NEXT: movbeq %rsi, (%rdx) # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: movbeq (%rdi), %rax # sched: [6:0.50] +; HASWELL-NEXT: movbeq %rsi, (%rdx) # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_movbe_i64: ; BROADWELL: # %bb.0: Index: test/CodeGen/X86/mul-constant-i32.ll =================================================================== --- test/CodeGen/X86/mul-constant-i32.ll +++ test/CodeGen/X86/mul-constant-i32.ll @@ -17,7 +17,7 @@ ; X64-HSW-LABEL: test_mul_by_1: ; X64-HSW: # %bb.0: ; X64-HSW-NEXT: movl %edi, %eax # sched: [1:0.25] -; X64-HSW-NEXT: retq # sched: [2:1.00] +; X64-HSW-NEXT: retq # sched: [7:1.00] ; ; X64-JAG-LABEL: test_mul_by_1: ; X64-JAG: # %bb.0: @@ -32,7 +32,7 @@ ; HSW-NOOPT-LABEL: test_mul_by_1: ; HSW-NOOPT: # %bb.0: ; HSW-NOOPT-NEXT: movl %edi, %eax # sched: [1:0.25] -; HSW-NOOPT-NEXT: retq # sched: [2:1.00] +; HSW-NOOPT-NEXT: retq # sched: [7:1.00] ; ; JAG-NOOPT-LABEL: test_mul_by_1: ; JAG-NOOPT: # %bb.0: @@ -63,7 +63,7 @@ ; X64-HSW: # %bb.0: ; X64-HSW-NEXT: # kill: %edi %edi %rdi ; X64-HSW-NEXT: leal (%rdi,%rdi), %eax # sched: [1:0.50] -; X64-HSW-NEXT: retq # sched: [2:1.00] +; X64-HSW-NEXT: retq # sched: [7:1.00] ; ; X64-JAG-LABEL: test_mul_by_2: ; X64-JAG: # %bb.0: @@ -81,7 +81,7 @@ ; HSW-NOOPT: # %bb.0: ; HSW-NOOPT-NEXT: # kill: %edi %edi %rdi ; HSW-NOOPT-NEXT: leal (%rdi,%rdi), %eax # sched: [1:0.50] -; HSW-NOOPT-NEXT: retq # sched: [2:1.00] +; HSW-NOOPT-NEXT: retq # sched: [7:1.00] ; ; JAG-NOOPT-LABEL: test_mul_by_2: ; JAG-NOOPT: # %bb.0: @@ -114,7 +114,7 @@ ; X64-HSW: # %bb.0: ; X64-HSW-NEXT: # kill: %edi %edi %rdi ; X64-HSW-NEXT: leal (%rdi,%rdi,2), %eax # sched: [1:0.50] -; X64-HSW-NEXT: retq # sched: [2:1.00] +; X64-HSW-NEXT: retq # sched: [7:1.00] ; ; X64-JAG-LABEL: test_mul_by_3: ; X64-JAG: # %bb.0: @@ -131,7 +131,7 @@ ; HSW-NOOPT: # %bb.0: ; HSW-NOOPT-NEXT: # kill: %edi %edi %rdi ; HSW-NOOPT-NEXT: leal (%rdi,%rdi,2), %eax # sched: [1:0.50] -; HSW-NOOPT-NEXT: retq # sched: [2:1.00] +; HSW-NOOPT-NEXT: retq # sched: [7:1.00] ; ; JAG-NOOPT-LABEL: test_mul_by_3: ; JAG-NOOPT: # %bb.0: @@ -165,7 +165,7 @@ ; X64-HSW: # %bb.0: ; X64-HSW-NEXT: # kill: %edi %edi %rdi ; X64-HSW-NEXT: leal (,%rdi,4), %eax # sched: [1:0.50] -; X64-HSW-NEXT: retq # sched: [2:1.00] +; X64-HSW-NEXT: retq # sched: [7:1.00] ; ; X64-JAG-LABEL: test_mul_by_4: ; X64-JAG: # %bb.0: @@ -183,7 +183,7 @@ ; HSW-NOOPT: # %bb.0: ; HSW-NOOPT-NEXT: # kill: %edi %edi %rdi ; HSW-NOOPT-NEXT: leal (,%rdi,4), %eax # sched: [1:0.50] -; HSW-NOOPT-NEXT: retq # sched: [2:1.00] +; HSW-NOOPT-NEXT: retq # sched: [7:1.00] ; ; JAG-NOOPT-LABEL: test_mul_by_4: ; JAG-NOOPT: # %bb.0: @@ -216,7 +216,7 @@ ; X64-HSW: # %bb.0: ; X64-HSW-NEXT: # kill: %edi %edi %rdi ; X64-HSW-NEXT: leal (%rdi,%rdi,4), %eax # sched: [1:0.50] -; X64-HSW-NEXT: retq # sched: [2:1.00] +; X64-HSW-NEXT: retq # sched: [7:1.00] ; ; X64-JAG-LABEL: test_mul_by_5: ; X64-JAG: # %bb.0: @@ -233,7 +233,7 @@ ; HSW-NOOPT: # %bb.0: ; HSW-NOOPT-NEXT: # kill: %edi %edi %rdi ; HSW-NOOPT-NEXT: leal (%rdi,%rdi,4), %eax # sched: [1:0.50] -; HSW-NOOPT-NEXT: retq # sched: [2:1.00] +; HSW-NOOPT-NEXT: retq # sched: [7:1.00] ; ; JAG-NOOPT-LABEL: test_mul_by_5: ; JAG-NOOPT: # %bb.0: @@ -269,7 +269,7 @@ ; X64-HSW-NEXT: # kill: %edi %edi %rdi ; X64-HSW-NEXT: addl %edi, %edi # sched: [1:0.25] ; X64-HSW-NEXT: leal (%rdi,%rdi,2), %eax # sched: [1:0.50] -; X64-HSW-NEXT: retq # sched: [2:1.00] +; X64-HSW-NEXT: retq # sched: [7:1.00] ; ; X64-JAG-LABEL: test_mul_by_6: ; X64-JAG: # %bb.0: @@ -286,7 +286,7 @@ ; HSW-NOOPT-LABEL: test_mul_by_6: ; HSW-NOOPT: # %bb.0: ; HSW-NOOPT-NEXT: imull $6, %edi, %eax # sched: [3:1.00] -; HSW-NOOPT-NEXT: retq # sched: [2:1.00] +; HSW-NOOPT-NEXT: retq # sched: [7:1.00] ; ; JAG-NOOPT-LABEL: test_mul_by_6: ; JAG-NOOPT: # %bb.0: @@ -321,7 +321,7 @@ ; X64-HSW-NEXT: # kill: %edi %edi %rdi ; X64-HSW-NEXT: leal (,%rdi,8), %eax # sched: [1:0.50] ; X64-HSW-NEXT: subl %edi, %eax # sched: [1:0.25] -; X64-HSW-NEXT: retq # sched: [2:1.00] +; X64-HSW-NEXT: retq # sched: [7:1.00] ; ; X64-JAG-LABEL: test_mul_by_7: ; X64-JAG: # %bb.0: @@ -338,7 +338,7 @@ ; HSW-NOOPT-LABEL: test_mul_by_7: ; HSW-NOOPT: # %bb.0: ; HSW-NOOPT-NEXT: imull $7, %edi, %eax # sched: [3:1.00] -; HSW-NOOPT-NEXT: retq # sched: [2:1.00] +; HSW-NOOPT-NEXT: retq # sched: [7:1.00] ; ; JAG-NOOPT-LABEL: test_mul_by_7: ; JAG-NOOPT: # %bb.0: @@ -371,7 +371,7 @@ ; X64-HSW: # %bb.0: ; X64-HSW-NEXT: # kill: %edi %edi %rdi ; X64-HSW-NEXT: leal (,%rdi,8), %eax # sched: [1:0.50] -; X64-HSW-NEXT: retq # sched: [2:1.00] +; X64-HSW-NEXT: retq # sched: [7:1.00] ; ; X64-JAG-LABEL: test_mul_by_8: ; X64-JAG: # %bb.0: @@ -389,7 +389,7 @@ ; HSW-NOOPT: # %bb.0: ; HSW-NOOPT-NEXT: # kill: %edi %edi %rdi ; HSW-NOOPT-NEXT: leal (,%rdi,8), %eax # sched: [1:0.50] -; HSW-NOOPT-NEXT: retq # sched: [2:1.00] +; HSW-NOOPT-NEXT: retq # sched: [7:1.00] ; ; JAG-NOOPT-LABEL: test_mul_by_8: ; JAG-NOOPT: # %bb.0: @@ -422,7 +422,7 @@ ; X64-HSW: # %bb.0: ; X64-HSW-NEXT: # kill: %edi %edi %rdi ; X64-HSW-NEXT: leal (%rdi,%rdi,8), %eax # sched: [1:0.50] -; X64-HSW-NEXT: retq # sched: [2:1.00] +; X64-HSW-NEXT: retq # sched: [7:1.00] ; ; X64-JAG-LABEL: test_mul_by_9: ; X64-JAG: # %bb.0: @@ -439,7 +439,7 @@ ; HSW-NOOPT: # %bb.0: ; HSW-NOOPT-NEXT: # kill: %edi %edi %rdi ; HSW-NOOPT-NEXT: leal (%rdi,%rdi,8), %eax # sched: [1:0.50] -; HSW-NOOPT-NEXT: retq # sched: [2:1.00] +; HSW-NOOPT-NEXT: retq # sched: [7:1.00] ; ; JAG-NOOPT-LABEL: test_mul_by_9: ; JAG-NOOPT: # %bb.0: @@ -475,7 +475,7 @@ ; X64-HSW-NEXT: # kill: %edi %edi %rdi ; X64-HSW-NEXT: addl %edi, %edi # sched: [1:0.25] ; X64-HSW-NEXT: leal (%rdi,%rdi,4), %eax # sched: [1:0.50] -; X64-HSW-NEXT: retq # sched: [2:1.00] +; X64-HSW-NEXT: retq # sched: [7:1.00] ; ; X64-JAG-LABEL: test_mul_by_10: ; X64-JAG: # %bb.0: @@ -492,7 +492,7 @@ ; HSW-NOOPT-LABEL: test_mul_by_10: ; HSW-NOOPT: # %bb.0: ; HSW-NOOPT-NEXT: imull $10, %edi, %eax # sched: [3:1.00] -; HSW-NOOPT-NEXT: retq # sched: [2:1.00] +; HSW-NOOPT-NEXT: retq # sched: [7:1.00] ; ; JAG-NOOPT-LABEL: test_mul_by_10: ; JAG-NOOPT: # %bb.0: @@ -527,7 +527,7 @@ ; X64-HSW-NEXT: # kill: %edi %edi %rdi ; X64-HSW-NEXT: leal (%rdi,%rdi,4), %eax # sched: [1:0.50] ; X64-HSW-NEXT: leal (%rdi,%rax,2), %eax # sched: [1:0.50] -; X64-HSW-NEXT: retq # sched: [2:1.00] +; X64-HSW-NEXT: retq # sched: [7:1.00] ; ; X64-JAG-LABEL: test_mul_by_11: ; X64-JAG: # %bb.0: @@ -544,7 +544,7 @@ ; HSW-NOOPT-LABEL: test_mul_by_11: ; HSW-NOOPT: # %bb.0: ; HSW-NOOPT-NEXT: imull $11, %edi, %eax # sched: [3:1.00] -; HSW-NOOPT-NEXT: retq # sched: [2:1.00] +; HSW-NOOPT-NEXT: retq # sched: [7:1.00] ; ; JAG-NOOPT-LABEL: test_mul_by_11: ; JAG-NOOPT: # %bb.0: @@ -577,7 +577,7 @@ ; X64-HSW-NEXT: # kill: %edi %edi %rdi ; X64-HSW-NEXT: shll $2, %edi # sched: [1:0.50] ; X64-HSW-NEXT: leal (%rdi,%rdi,2), %eax # sched: [1:0.50] -; X64-HSW-NEXT: retq # sched: [2:1.00] +; X64-HSW-NEXT: retq # sched: [7:1.00] ; ; X64-JAG-LABEL: test_mul_by_12: ; X64-JAG: # %bb.0: @@ -594,7 +594,7 @@ ; HSW-NOOPT-LABEL: test_mul_by_12: ; HSW-NOOPT: # %bb.0: ; HSW-NOOPT-NEXT: imull $12, %edi, %eax # sched: [3:1.00] -; HSW-NOOPT-NEXT: retq # sched: [2:1.00] +; HSW-NOOPT-NEXT: retq # sched: [7:1.00] ; ; JAG-NOOPT-LABEL: test_mul_by_12: ; JAG-NOOPT: # %bb.0: @@ -629,7 +629,7 @@ ; X64-HSW-NEXT: # kill: %edi %edi %rdi ; X64-HSW-NEXT: leal (%rdi,%rdi,2), %eax # sched: [1:0.50] ; X64-HSW-NEXT: leal (%rdi,%rax,4), %eax # sched: [1:0.50] -; X64-HSW-NEXT: retq # sched: [2:1.00] +; X64-HSW-NEXT: retq # sched: [7:1.00] ; ; X64-JAG-LABEL: test_mul_by_13: ; X64-JAG: # %bb.0: @@ -646,7 +646,7 @@ ; HSW-NOOPT-LABEL: test_mul_by_13: ; HSW-NOOPT: # %bb.0: ; HSW-NOOPT-NEXT: imull $13, %edi, %eax # sched: [3:1.00] -; HSW-NOOPT-NEXT: retq # sched: [2:1.00] +; HSW-NOOPT-NEXT: retq # sched: [7:1.00] ; ; JAG-NOOPT-LABEL: test_mul_by_13: ; JAG-NOOPT: # %bb.0: @@ -681,7 +681,7 @@ ; X64-HSW-NEXT: leal (%rdi,%rdi,2), %eax # sched: [1:0.50] ; X64-HSW-NEXT: leal (%rdi,%rax,4), %eax # sched: [1:0.50] ; X64-HSW-NEXT: addl %edi, %eax # sched: [1:0.25] -; X64-HSW-NEXT: retq # sched: [2:1.00] +; X64-HSW-NEXT: retq # sched: [7:1.00] ; ; X64-JAG-LABEL: test_mul_by_14: ; X64-JAG: # %bb.0: @@ -699,7 +699,7 @@ ; HSW-NOOPT-LABEL: test_mul_by_14: ; HSW-NOOPT: # %bb.0: ; HSW-NOOPT-NEXT: imull $14, %edi, %eax # sched: [3:1.00] -; HSW-NOOPT-NEXT: retq # sched: [2:1.00] +; HSW-NOOPT-NEXT: retq # sched: [7:1.00] ; ; JAG-NOOPT-LABEL: test_mul_by_14: ; JAG-NOOPT: # %bb.0: @@ -732,7 +732,7 @@ ; X64-HSW-NEXT: # kill: %edi %edi %rdi ; X64-HSW-NEXT: leal (%rdi,%rdi,4), %eax # sched: [1:0.50] ; X64-HSW-NEXT: leal (%rax,%rax,2), %eax # sched: [1:0.50] -; X64-HSW-NEXT: retq # sched: [2:1.00] +; X64-HSW-NEXT: retq # sched: [7:1.00] ; ; X64-JAG-LABEL: test_mul_by_15: ; X64-JAG: # %bb.0: @@ -749,7 +749,7 @@ ; HSW-NOOPT-LABEL: test_mul_by_15: ; HSW-NOOPT: # %bb.0: ; HSW-NOOPT-NEXT: imull $15, %edi, %eax # sched: [3:1.00] -; HSW-NOOPT-NEXT: retq # sched: [2:1.00] +; HSW-NOOPT-NEXT: retq # sched: [7:1.00] ; ; JAG-NOOPT-LABEL: test_mul_by_15: ; JAG-NOOPT: # %bb.0: @@ -782,7 +782,7 @@ ; X64-HSW: # %bb.0: ; X64-HSW-NEXT: shll $4, %edi # sched: [1:0.50] ; X64-HSW-NEXT: movl %edi, %eax # sched: [1:0.25] -; X64-HSW-NEXT: retq # sched: [2:1.00] +; X64-HSW-NEXT: retq # sched: [7:1.00] ; ; X64-JAG-LABEL: test_mul_by_16: ; X64-JAG: # %bb.0: @@ -800,7 +800,7 @@ ; HSW-NOOPT: # %bb.0: ; HSW-NOOPT-NEXT: shll $4, %edi # sched: [1:0.50] ; HSW-NOOPT-NEXT: movl %edi, %eax # sched: [1:0.25] -; HSW-NOOPT-NEXT: retq # sched: [2:1.00] +; HSW-NOOPT-NEXT: retq # sched: [7:1.00] ; ; JAG-NOOPT-LABEL: test_mul_by_16: ; JAG-NOOPT: # %bb.0: @@ -838,7 +838,7 @@ ; X64-HSW-NEXT: movl %edi, %eax # sched: [1:0.25] ; X64-HSW-NEXT: shll $4, %eax # sched: [1:0.50] ; X64-HSW-NEXT: leal (%rax,%rdi), %eax # sched: [1:0.50] -; X64-HSW-NEXT: retq # sched: [2:1.00] +; X64-HSW-NEXT: retq # sched: [7:1.00] ; ; X64-JAG-LABEL: test_mul_by_17: ; X64-JAG: # %bb.0: @@ -856,7 +856,7 @@ ; HSW-NOOPT-LABEL: test_mul_by_17: ; HSW-NOOPT: # %bb.0: ; HSW-NOOPT-NEXT: imull $17, %edi, %eax # sched: [3:1.00] -; HSW-NOOPT-NEXT: retq # sched: [2:1.00] +; HSW-NOOPT-NEXT: retq # sched: [7:1.00] ; ; JAG-NOOPT-LABEL: test_mul_by_17: ; JAG-NOOPT: # %bb.0: @@ -892,7 +892,7 @@ ; X64-HSW-NEXT: # kill: %edi %edi %rdi ; X64-HSW-NEXT: addl %edi, %edi # sched: [1:0.25] ; X64-HSW-NEXT: leal (%rdi,%rdi,8), %eax # sched: [1:0.50] -; X64-HSW-NEXT: retq # sched: [2:1.00] +; X64-HSW-NEXT: retq # sched: [7:1.00] ; ; X64-JAG-LABEL: test_mul_by_18: ; X64-JAG: # %bb.0: @@ -909,7 +909,7 @@ ; HSW-NOOPT-LABEL: test_mul_by_18: ; HSW-NOOPT: # %bb.0: ; HSW-NOOPT-NEXT: imull $18, %edi, %eax # sched: [3:1.00] -; HSW-NOOPT-NEXT: retq # sched: [2:1.00] +; HSW-NOOPT-NEXT: retq # sched: [7:1.00] ; ; JAG-NOOPT-LABEL: test_mul_by_18: ; JAG-NOOPT: # %bb.0: @@ -946,7 +946,7 @@ ; X64-HSW-NEXT: leal (%rdi,%rdi,4), %eax # sched: [1:0.50] ; X64-HSW-NEXT: shll $2, %eax # sched: [1:0.50] ; X64-HSW-NEXT: subl %edi, %eax # sched: [1:0.25] -; X64-HSW-NEXT: retq # sched: [2:1.00] +; X64-HSW-NEXT: retq # sched: [7:1.00] ; ; X64-JAG-LABEL: test_mul_by_19: ; X64-JAG: # %bb.0: @@ -964,7 +964,7 @@ ; HSW-NOOPT-LABEL: test_mul_by_19: ; HSW-NOOPT: # %bb.0: ; HSW-NOOPT-NEXT: imull $19, %edi, %eax # sched: [3:1.00] -; HSW-NOOPT-NEXT: retq # sched: [2:1.00] +; HSW-NOOPT-NEXT: retq # sched: [7:1.00] ; ; JAG-NOOPT-LABEL: test_mul_by_19: ; JAG-NOOPT: # %bb.0: @@ -997,7 +997,7 @@ ; X64-HSW-NEXT: # kill: %edi %edi %rdi ; X64-HSW-NEXT: shll $2, %edi # sched: [1:0.50] ; X64-HSW-NEXT: leal (%rdi,%rdi,4), %eax # sched: [1:0.50] -; X64-HSW-NEXT: retq # sched: [2:1.00] +; X64-HSW-NEXT: retq # sched: [7:1.00] ; ; X64-JAG-LABEL: test_mul_by_20: ; X64-JAG: # %bb.0: @@ -1014,7 +1014,7 @@ ; HSW-NOOPT-LABEL: test_mul_by_20: ; HSW-NOOPT: # %bb.0: ; HSW-NOOPT-NEXT: imull $20, %edi, %eax # sched: [3:1.00] -; HSW-NOOPT-NEXT: retq # sched: [2:1.00] +; HSW-NOOPT-NEXT: retq # sched: [7:1.00] ; ; JAG-NOOPT-LABEL: test_mul_by_20: ; JAG-NOOPT: # %bb.0: @@ -1049,7 +1049,7 @@ ; X64-HSW-NEXT: # kill: %edi %edi %rdi ; X64-HSW-NEXT: leal (%rdi,%rdi,4), %eax # sched: [1:0.50] ; X64-HSW-NEXT: leal (%rdi,%rax,4), %eax # sched: [1:0.50] -; X64-HSW-NEXT: retq # sched: [2:1.00] +; X64-HSW-NEXT: retq # sched: [7:1.00] ; ; X64-JAG-LABEL: test_mul_by_21: ; X64-JAG: # %bb.0: @@ -1066,7 +1066,7 @@ ; HSW-NOOPT-LABEL: test_mul_by_21: ; HSW-NOOPT: # %bb.0: ; HSW-NOOPT-NEXT: imull $21, %edi, %eax # sched: [3:1.00] -; HSW-NOOPT-NEXT: retq # sched: [2:1.00] +; HSW-NOOPT-NEXT: retq # sched: [7:1.00] ; ; JAG-NOOPT-LABEL: test_mul_by_21: ; JAG-NOOPT: # %bb.0: @@ -1101,7 +1101,7 @@ ; X64-HSW-NEXT: leal (%rdi,%rdi,4), %eax # sched: [1:0.50] ; X64-HSW-NEXT: leal (%rdi,%rax,4), %eax # sched: [1:0.50] ; X64-HSW-NEXT: addl %edi, %eax # sched: [1:0.25] -; X64-HSW-NEXT: retq # sched: [2:1.00] +; X64-HSW-NEXT: retq # sched: [7:1.00] ; ; X64-JAG-LABEL: test_mul_by_22: ; X64-JAG: # %bb.0: @@ -1119,7 +1119,7 @@ ; HSW-NOOPT-LABEL: test_mul_by_22: ; HSW-NOOPT: # %bb.0: ; HSW-NOOPT-NEXT: imull $22, %edi, %eax # sched: [3:1.00] -; HSW-NOOPT-NEXT: retq # sched: [2:1.00] +; HSW-NOOPT-NEXT: retq # sched: [7:1.00] ; ; JAG-NOOPT-LABEL: test_mul_by_22: ; JAG-NOOPT: # %bb.0: @@ -1154,7 +1154,7 @@ ; X64-HSW-NEXT: leal (%rdi,%rdi,2), %eax # sched: [1:0.50] ; X64-HSW-NEXT: shll $3, %eax # sched: [1:0.50] ; X64-HSW-NEXT: subl %edi, %eax # sched: [1:0.25] -; X64-HSW-NEXT: retq # sched: [2:1.00] +; X64-HSW-NEXT: retq # sched: [7:1.00] ; ; X64-JAG-LABEL: test_mul_by_23: ; X64-JAG: # %bb.0: @@ -1172,7 +1172,7 @@ ; HSW-NOOPT-LABEL: test_mul_by_23: ; HSW-NOOPT: # %bb.0: ; HSW-NOOPT-NEXT: imull $23, %edi, %eax # sched: [3:1.00] -; HSW-NOOPT-NEXT: retq # sched: [2:1.00] +; HSW-NOOPT-NEXT: retq # sched: [7:1.00] ; ; JAG-NOOPT-LABEL: test_mul_by_23: ; JAG-NOOPT: # %bb.0: @@ -1205,7 +1205,7 @@ ; X64-HSW-NEXT: # kill: %edi %edi %rdi ; X64-HSW-NEXT: shll $3, %edi # sched: [1:0.50] ; X64-HSW-NEXT: leal (%rdi,%rdi,2), %eax # sched: [1:0.50] -; X64-HSW-NEXT: retq # sched: [2:1.00] +; X64-HSW-NEXT: retq # sched: [7:1.00] ; ; X64-JAG-LABEL: test_mul_by_24: ; X64-JAG: # %bb.0: @@ -1222,7 +1222,7 @@ ; HSW-NOOPT-LABEL: test_mul_by_24: ; HSW-NOOPT: # %bb.0: ; HSW-NOOPT-NEXT: imull $24, %edi, %eax # sched: [3:1.00] -; HSW-NOOPT-NEXT: retq # sched: [2:1.00] +; HSW-NOOPT-NEXT: retq # sched: [7:1.00] ; ; JAG-NOOPT-LABEL: test_mul_by_24: ; JAG-NOOPT: # %bb.0: @@ -1257,7 +1257,7 @@ ; X64-HSW-NEXT: # kill: %edi %edi %rdi ; X64-HSW-NEXT: leal (%rdi,%rdi,4), %eax # sched: [1:0.50] ; X64-HSW-NEXT: leal (%rax,%rax,4), %eax # sched: [1:0.50] -; X64-HSW-NEXT: retq # sched: [2:1.00] +; X64-HSW-NEXT: retq # sched: [7:1.00] ; ; X64-JAG-LABEL: test_mul_by_25: ; X64-JAG: # %bb.0: @@ -1274,7 +1274,7 @@ ; HSW-NOOPT-LABEL: test_mul_by_25: ; HSW-NOOPT: # %bb.0: ; HSW-NOOPT-NEXT: imull $25, %edi, %eax # sched: [3:1.00] -; HSW-NOOPT-NEXT: retq # sched: [2:1.00] +; HSW-NOOPT-NEXT: retq # sched: [7:1.00] ; ; JAG-NOOPT-LABEL: test_mul_by_25: ; JAG-NOOPT: # %bb.0: @@ -1311,7 +1311,7 @@ ; X64-HSW-NEXT: leal (%rdi,%rdi,8), %eax # sched: [1:0.50] ; X64-HSW-NEXT: leal (%rax,%rax,2), %eax # sched: [1:0.50] ; X64-HSW-NEXT: subl %edi, %eax # sched: [1:0.25] -; X64-HSW-NEXT: retq # sched: [2:1.00] +; X64-HSW-NEXT: retq # sched: [7:1.00] ; ; X64-JAG-LABEL: test_mul_by_26: ; X64-JAG: # %bb.0: @@ -1329,7 +1329,7 @@ ; HSW-NOOPT-LABEL: test_mul_by_26: ; HSW-NOOPT: # %bb.0: ; HSW-NOOPT-NEXT: imull $26, %edi, %eax # sched: [3:1.00] -; HSW-NOOPT-NEXT: retq # sched: [2:1.00] +; HSW-NOOPT-NEXT: retq # sched: [7:1.00] ; ; JAG-NOOPT-LABEL: test_mul_by_26: ; JAG-NOOPT: # %bb.0: @@ -1362,7 +1362,7 @@ ; X64-HSW-NEXT: # kill: %edi %edi %rdi ; X64-HSW-NEXT: leal (%rdi,%rdi,8), %eax # sched: [1:0.50] ; X64-HSW-NEXT: leal (%rax,%rax,2), %eax # sched: [1:0.50] -; X64-HSW-NEXT: retq # sched: [2:1.00] +; X64-HSW-NEXT: retq # sched: [7:1.00] ; ; X64-JAG-LABEL: test_mul_by_27: ; X64-JAG: # %bb.0: @@ -1379,7 +1379,7 @@ ; HSW-NOOPT-LABEL: test_mul_by_27: ; HSW-NOOPT: # %bb.0: ; HSW-NOOPT-NEXT: imull $27, %edi, %eax # sched: [3:1.00] -; HSW-NOOPT-NEXT: retq # sched: [2:1.00] +; HSW-NOOPT-NEXT: retq # sched: [7:1.00] ; ; JAG-NOOPT-LABEL: test_mul_by_27: ; JAG-NOOPT: # %bb.0: @@ -1416,7 +1416,7 @@ ; X64-HSW-NEXT: leal (%rdi,%rdi,8), %eax # sched: [1:0.50] ; X64-HSW-NEXT: leal (%rax,%rax,2), %eax # sched: [1:0.50] ; X64-HSW-NEXT: addl %edi, %eax # sched: [1:0.25] -; X64-HSW-NEXT: retq # sched: [2:1.00] +; X64-HSW-NEXT: retq # sched: [7:1.00] ; ; X64-JAG-LABEL: test_mul_by_28: ; X64-JAG: # %bb.0: @@ -1434,7 +1434,7 @@ ; HSW-NOOPT-LABEL: test_mul_by_28: ; HSW-NOOPT: # %bb.0: ; HSW-NOOPT-NEXT: imull $28, %edi, %eax # sched: [3:1.00] -; HSW-NOOPT-NEXT: retq # sched: [2:1.00] +; HSW-NOOPT-NEXT: retq # sched: [7:1.00] ; ; JAG-NOOPT-LABEL: test_mul_by_28: ; JAG-NOOPT: # %bb.0: @@ -1471,7 +1471,7 @@ ; X64-HSW-NEXT: leal (%rax,%rax,2), %eax # sched: [1:0.50] ; X64-HSW-NEXT: addl %edi, %eax # sched: [1:0.25] ; X64-HSW-NEXT: addl %edi, %eax # sched: [1:0.25] -; X64-HSW-NEXT: retq # sched: [2:1.00] +; X64-HSW-NEXT: retq # sched: [7:1.00] ; ; X64-JAG-LABEL: test_mul_by_29: ; X64-JAG: # %bb.0: @@ -1490,7 +1490,7 @@ ; HSW-NOOPT-LABEL: test_mul_by_29: ; HSW-NOOPT: # %bb.0: ; HSW-NOOPT-NEXT: imull $29, %edi, %eax # sched: [3:1.00] -; HSW-NOOPT-NEXT: retq # sched: [2:1.00] +; HSW-NOOPT-NEXT: retq # sched: [7:1.00] ; ; JAG-NOOPT-LABEL: test_mul_by_29: ; JAG-NOOPT: # %bb.0: @@ -1526,7 +1526,7 @@ ; X64-HSW-NEXT: shll $5, %eax # sched: [1:0.50] ; X64-HSW-NEXT: subl %edi, %eax # sched: [1:0.25] ; X64-HSW-NEXT: subl %edi, %eax # sched: [1:0.25] -; X64-HSW-NEXT: retq # sched: [2:1.00] +; X64-HSW-NEXT: retq # sched: [7:1.00] ; ; X64-JAG-LABEL: test_mul_by_30: ; X64-JAG: # %bb.0: @@ -1544,7 +1544,7 @@ ; HSW-NOOPT-LABEL: test_mul_by_30: ; HSW-NOOPT: # %bb.0: ; HSW-NOOPT-NEXT: imull $30, %edi, %eax # sched: [3:1.00] -; HSW-NOOPT-NEXT: retq # sched: [2:1.00] +; HSW-NOOPT-NEXT: retq # sched: [7:1.00] ; ; JAG-NOOPT-LABEL: test_mul_by_30: ; JAG-NOOPT: # %bb.0: @@ -1578,7 +1578,7 @@ ; X64-HSW-NEXT: movl %edi, %eax # sched: [1:0.25] ; X64-HSW-NEXT: shll $5, %eax # sched: [1:0.50] ; X64-HSW-NEXT: subl %edi, %eax # sched: [1:0.25] -; X64-HSW-NEXT: retq # sched: [2:1.00] +; X64-HSW-NEXT: retq # sched: [7:1.00] ; ; X64-JAG-LABEL: test_mul_by_31: ; X64-JAG: # %bb.0: @@ -1595,7 +1595,7 @@ ; HSW-NOOPT-LABEL: test_mul_by_31: ; HSW-NOOPT: # %bb.0: ; HSW-NOOPT-NEXT: imull $31, %edi, %eax # sched: [3:1.00] -; HSW-NOOPT-NEXT: retq # sched: [2:1.00] +; HSW-NOOPT-NEXT: retq # sched: [7:1.00] ; ; JAG-NOOPT-LABEL: test_mul_by_31: ; JAG-NOOPT: # %bb.0: @@ -1628,7 +1628,7 @@ ; X64-HSW: # %bb.0: ; X64-HSW-NEXT: shll $5, %edi # sched: [1:0.50] ; X64-HSW-NEXT: movl %edi, %eax # sched: [1:0.25] -; X64-HSW-NEXT: retq # sched: [2:1.00] +; X64-HSW-NEXT: retq # sched: [7:1.00] ; ; X64-JAG-LABEL: test_mul_by_32: ; X64-JAG: # %bb.0: @@ -1646,7 +1646,7 @@ ; HSW-NOOPT: # %bb.0: ; HSW-NOOPT-NEXT: shll $5, %edi # sched: [1:0.50] ; HSW-NOOPT-NEXT: movl %edi, %eax # sched: [1:0.25] -; HSW-NOOPT-NEXT: retq # sched: [2:1.00] +; HSW-NOOPT-NEXT: retq # sched: [7:1.00] ; ; JAG-NOOPT-LABEL: test_mul_by_32: ; JAG-NOOPT: # %bb.0: @@ -1687,7 +1687,7 @@ ; X64-HSW-NEXT: leal (%rdi,%rdi,4), %eax # sched: [1:0.50] ; X64-HSW-NEXT: addl $2, %eax # sched: [1:0.25] ; X64-HSW-NEXT: imull %ecx, %eax # sched: [4:1.00] -; X64-HSW-NEXT: retq # sched: [2:1.00] +; X64-HSW-NEXT: retq # sched: [7:1.00] ; ; X64-JAG-LABEL: test_mul_spec: ; X64-JAG: # %bb.0: @@ -1713,7 +1713,7 @@ ; HSW-NOOPT-NEXT: leal (%rdi,%rdi,4), %eax # sched: [1:0.50] ; HSW-NOOPT-NEXT: addl $2, %eax # sched: [1:0.25] ; HSW-NOOPT-NEXT: imull %ecx, %eax # sched: [4:1.00] -; HSW-NOOPT-NEXT: retq # sched: [2:1.00] +; HSW-NOOPT-NEXT: retq # sched: [7:1.00] ; ; JAG-NOOPT-LABEL: test_mul_spec: ; JAG-NOOPT: # %bb.0: Index: test/CodeGen/X86/mul-constant-i64.ll =================================================================== --- test/CodeGen/X86/mul-constant-i64.ll +++ test/CodeGen/X86/mul-constant-i64.ll @@ -18,7 +18,7 @@ ; X64-HSW-LABEL: test_mul_by_1: ; X64-HSW: # %bb.0: ; X64-HSW-NEXT: movq %rdi, %rax # sched: [1:0.25] -; X64-HSW-NEXT: retq # sched: [2:1.00] +; X64-HSW-NEXT: retq # sched: [7:1.00] ; ; X64-JAG-LABEL: test_mul_by_1: ; X64-JAG: # %bb.0: @@ -34,7 +34,7 @@ ; HSW-NOOPT-LABEL: test_mul_by_1: ; HSW-NOOPT: # %bb.0: ; HSW-NOOPT-NEXT: movq %rdi, %rax # sched: [1:0.25] -; HSW-NOOPT-NEXT: retq # sched: [2:1.00] +; HSW-NOOPT-NEXT: retq # sched: [7:1.00] ; ; JAG-NOOPT-LABEL: test_mul_by_1: ; JAG-NOOPT: # %bb.0: @@ -66,7 +66,7 @@ ; X64-HSW-LABEL: test_mul_by_2: ; X64-HSW: # %bb.0: ; X64-HSW-NEXT: leaq (%rdi,%rdi), %rax # sched: [1:0.50] -; X64-HSW-NEXT: retq # sched: [2:1.00] +; X64-HSW-NEXT: retq # sched: [7:1.00] ; ; X64-JAG-LABEL: test_mul_by_2: ; X64-JAG: # %bb.0: @@ -84,7 +84,7 @@ ; HSW-NOOPT-LABEL: test_mul_by_2: ; HSW-NOOPT: # %bb.0: ; HSW-NOOPT-NEXT: leaq (%rdi,%rdi), %rax # sched: [1:0.50] -; HSW-NOOPT-NEXT: retq # sched: [2:1.00] +; HSW-NOOPT-NEXT: retq # sched: [7:1.00] ; ; JAG-NOOPT-LABEL: test_mul_by_2: ; JAG-NOOPT: # %bb.0: @@ -116,7 +116,7 @@ ; X64-HSW-LABEL: test_mul_by_3: ; X64-HSW: # %bb.0: ; X64-HSW-NEXT: leaq (%rdi,%rdi,2), %rax # sched: [1:0.50] -; X64-HSW-NEXT: retq # sched: [2:1.00] +; X64-HSW-NEXT: retq # sched: [7:1.00] ; ; X64-JAG-LABEL: test_mul_by_3: ; X64-JAG: # %bb.0: @@ -134,7 +134,7 @@ ; HSW-NOOPT-LABEL: test_mul_by_3: ; HSW-NOOPT: # %bb.0: ; HSW-NOOPT-NEXT: leaq (%rdi,%rdi,2), %rax # sched: [1:0.50] -; HSW-NOOPT-NEXT: retq # sched: [2:1.00] +; HSW-NOOPT-NEXT: retq # sched: [7:1.00] ; ; JAG-NOOPT-LABEL: test_mul_by_3: ; JAG-NOOPT: # %bb.0: @@ -166,7 +166,7 @@ ; X64-HSW-LABEL: test_mul_by_4: ; X64-HSW: # %bb.0: ; X64-HSW-NEXT: leaq (,%rdi,4), %rax # sched: [1:0.50] -; X64-HSW-NEXT: retq # sched: [2:1.00] +; X64-HSW-NEXT: retq # sched: [7:1.00] ; ; X64-JAG-LABEL: test_mul_by_4: ; X64-JAG: # %bb.0: @@ -184,7 +184,7 @@ ; HSW-NOOPT-LABEL: test_mul_by_4: ; HSW-NOOPT: # %bb.0: ; HSW-NOOPT-NEXT: leaq (,%rdi,4), %rax # sched: [1:0.50] -; HSW-NOOPT-NEXT: retq # sched: [2:1.00] +; HSW-NOOPT-NEXT: retq # sched: [7:1.00] ; ; JAG-NOOPT-LABEL: test_mul_by_4: ; JAG-NOOPT: # %bb.0: @@ -216,7 +216,7 @@ ; X64-HSW-LABEL: test_mul_by_5: ; X64-HSW: # %bb.0: ; X64-HSW-NEXT: leaq (%rdi,%rdi,4), %rax # sched: [1:0.50] -; X64-HSW-NEXT: retq # sched: [2:1.00] +; X64-HSW-NEXT: retq # sched: [7:1.00] ; ; X64-JAG-LABEL: test_mul_by_5: ; X64-JAG: # %bb.0: @@ -234,7 +234,7 @@ ; HSW-NOOPT-LABEL: test_mul_by_5: ; HSW-NOOPT: # %bb.0: ; HSW-NOOPT-NEXT: leaq (%rdi,%rdi,4), %rax # sched: [1:0.50] -; HSW-NOOPT-NEXT: retq # sched: [2:1.00] +; HSW-NOOPT-NEXT: retq # sched: [7:1.00] ; ; JAG-NOOPT-LABEL: test_mul_by_5: ; JAG-NOOPT: # %bb.0: @@ -268,7 +268,7 @@ ; X64-HSW: # %bb.0: ; X64-HSW-NEXT: addq %rdi, %rdi # sched: [1:0.25] ; X64-HSW-NEXT: leaq (%rdi,%rdi,2), %rax # sched: [1:0.50] -; X64-HSW-NEXT: retq # sched: [2:1.00] +; X64-HSW-NEXT: retq # sched: [7:1.00] ; ; X64-JAG-LABEL: test_mul_by_6: ; X64-JAG: # %bb.0: @@ -287,7 +287,7 @@ ; HSW-NOOPT-LABEL: test_mul_by_6: ; HSW-NOOPT: # %bb.0: ; HSW-NOOPT-NEXT: imulq $6, %rdi, %rax # sched: [3:1.00] -; HSW-NOOPT-NEXT: retq # sched: [2:1.00] +; HSW-NOOPT-NEXT: retq # sched: [7:1.00] ; ; JAG-NOOPT-LABEL: test_mul_by_6: ; JAG-NOOPT: # %bb.0: @@ -323,7 +323,7 @@ ; X64-HSW: # %bb.0: ; X64-HSW-NEXT: leaq (,%rdi,8), %rax # sched: [1:0.50] ; X64-HSW-NEXT: subq %rdi, %rax # sched: [1:0.25] -; X64-HSW-NEXT: retq # sched: [2:1.00] +; X64-HSW-NEXT: retq # sched: [7:1.00] ; ; X64-JAG-LABEL: test_mul_by_7: ; X64-JAG: # %bb.0: @@ -342,7 +342,7 @@ ; HSW-NOOPT-LABEL: test_mul_by_7: ; HSW-NOOPT: # %bb.0: ; HSW-NOOPT-NEXT: imulq $7, %rdi, %rax # sched: [3:1.00] -; HSW-NOOPT-NEXT: retq # sched: [2:1.00] +; HSW-NOOPT-NEXT: retq # sched: [7:1.00] ; ; JAG-NOOPT-LABEL: test_mul_by_7: ; JAG-NOOPT: # %bb.0: @@ -375,7 +375,7 @@ ; X64-HSW-LABEL: test_mul_by_8: ; X64-HSW: # %bb.0: ; X64-HSW-NEXT: leaq (,%rdi,8), %rax # sched: [1:0.50] -; X64-HSW-NEXT: retq # sched: [2:1.00] +; X64-HSW-NEXT: retq # sched: [7:1.00] ; ; X64-JAG-LABEL: test_mul_by_8: ; X64-JAG: # %bb.0: @@ -393,7 +393,7 @@ ; HSW-NOOPT-LABEL: test_mul_by_8: ; HSW-NOOPT: # %bb.0: ; HSW-NOOPT-NEXT: leaq (,%rdi,8), %rax # sched: [1:0.50] -; HSW-NOOPT-NEXT: retq # sched: [2:1.00] +; HSW-NOOPT-NEXT: retq # sched: [7:1.00] ; ; JAG-NOOPT-LABEL: test_mul_by_8: ; JAG-NOOPT: # %bb.0: @@ -425,7 +425,7 @@ ; X64-HSW-LABEL: test_mul_by_9: ; X64-HSW: # %bb.0: ; X64-HSW-NEXT: leaq (%rdi,%rdi,8), %rax # sched: [1:0.50] -; X64-HSW-NEXT: retq # sched: [2:1.00] +; X64-HSW-NEXT: retq # sched: [7:1.00] ; ; X64-JAG-LABEL: test_mul_by_9: ; X64-JAG: # %bb.0: @@ -443,7 +443,7 @@ ; HSW-NOOPT-LABEL: test_mul_by_9: ; HSW-NOOPT: # %bb.0: ; HSW-NOOPT-NEXT: leaq (%rdi,%rdi,8), %rax # sched: [1:0.50] -; HSW-NOOPT-NEXT: retq # sched: [2:1.00] +; HSW-NOOPT-NEXT: retq # sched: [7:1.00] ; ; JAG-NOOPT-LABEL: test_mul_by_9: ; JAG-NOOPT: # %bb.0: @@ -477,7 +477,7 @@ ; X64-HSW: # %bb.0: ; X64-HSW-NEXT: addq %rdi, %rdi # sched: [1:0.25] ; X64-HSW-NEXT: leaq (%rdi,%rdi,4), %rax # sched: [1:0.50] -; X64-HSW-NEXT: retq # sched: [2:1.00] +; X64-HSW-NEXT: retq # sched: [7:1.00] ; ; X64-JAG-LABEL: test_mul_by_10: ; X64-JAG: # %bb.0: @@ -496,7 +496,7 @@ ; HSW-NOOPT-LABEL: test_mul_by_10: ; HSW-NOOPT: # %bb.0: ; HSW-NOOPT-NEXT: imulq $10, %rdi, %rax # sched: [3:1.00] -; HSW-NOOPT-NEXT: retq # sched: [2:1.00] +; HSW-NOOPT-NEXT: retq # sched: [7:1.00] ; ; JAG-NOOPT-LABEL: test_mul_by_10: ; JAG-NOOPT: # %bb.0: @@ -532,7 +532,7 @@ ; X64-HSW: # %bb.0: ; X64-HSW-NEXT: leaq (%rdi,%rdi,4), %rax # sched: [1:0.50] ; X64-HSW-NEXT: leaq (%rdi,%rax,2), %rax # sched: [1:0.50] -; X64-HSW-NEXT: retq # sched: [2:1.00] +; X64-HSW-NEXT: retq # sched: [7:1.00] ; ; X64-JAG-LABEL: test_mul_by_11: ; X64-JAG: # %bb.0: @@ -551,7 +551,7 @@ ; HSW-NOOPT-LABEL: test_mul_by_11: ; HSW-NOOPT: # %bb.0: ; HSW-NOOPT-NEXT: imulq $11, %rdi, %rax # sched: [3:1.00] -; HSW-NOOPT-NEXT: retq # sched: [2:1.00] +; HSW-NOOPT-NEXT: retq # sched: [7:1.00] ; ; JAG-NOOPT-LABEL: test_mul_by_11: ; JAG-NOOPT: # %bb.0: @@ -585,7 +585,7 @@ ; X64-HSW: # %bb.0: ; X64-HSW-NEXT: shlq $2, %rdi # sched: [1:0.50] ; X64-HSW-NEXT: leaq (%rdi,%rdi,2), %rax # sched: [1:0.50] -; X64-HSW-NEXT: retq # sched: [2:1.00] +; X64-HSW-NEXT: retq # sched: [7:1.00] ; ; X64-JAG-LABEL: test_mul_by_12: ; X64-JAG: # %bb.0: @@ -604,7 +604,7 @@ ; HSW-NOOPT-LABEL: test_mul_by_12: ; HSW-NOOPT: # %bb.0: ; HSW-NOOPT-NEXT: imulq $12, %rdi, %rax # sched: [3:1.00] -; HSW-NOOPT-NEXT: retq # sched: [2:1.00] +; HSW-NOOPT-NEXT: retq # sched: [7:1.00] ; ; JAG-NOOPT-LABEL: test_mul_by_12: ; JAG-NOOPT: # %bb.0: @@ -640,7 +640,7 @@ ; X64-HSW: # %bb.0: ; X64-HSW-NEXT: leaq (%rdi,%rdi,2), %rax # sched: [1:0.50] ; X64-HSW-NEXT: leaq (%rdi,%rax,4), %rax # sched: [1:0.50] -; X64-HSW-NEXT: retq # sched: [2:1.00] +; X64-HSW-NEXT: retq # sched: [7:1.00] ; ; X64-JAG-LABEL: test_mul_by_13: ; X64-JAG: # %bb.0: @@ -659,7 +659,7 @@ ; HSW-NOOPT-LABEL: test_mul_by_13: ; HSW-NOOPT: # %bb.0: ; HSW-NOOPT-NEXT: imulq $13, %rdi, %rax # sched: [3:1.00] -; HSW-NOOPT-NEXT: retq # sched: [2:1.00] +; HSW-NOOPT-NEXT: retq # sched: [7:1.00] ; ; JAG-NOOPT-LABEL: test_mul_by_13: ; JAG-NOOPT: # %bb.0: @@ -696,7 +696,7 @@ ; X64-HSW-NEXT: leaq (%rdi,%rdi,2), %rax # sched: [1:0.50] ; X64-HSW-NEXT: leaq (%rdi,%rax,4), %rax # sched: [1:0.50] ; X64-HSW-NEXT: addq %rdi, %rax # sched: [1:0.25] -; X64-HSW-NEXT: retq # sched: [2:1.00] +; X64-HSW-NEXT: retq # sched: [7:1.00] ; ; X64-JAG-LABEL: test_mul_by_14: ; X64-JAG: # %bb.0: @@ -716,7 +716,7 @@ ; HSW-NOOPT-LABEL: test_mul_by_14: ; HSW-NOOPT: # %bb.0: ; HSW-NOOPT-NEXT: imulq $14, %rdi, %rax # sched: [3:1.00] -; HSW-NOOPT-NEXT: retq # sched: [2:1.00] +; HSW-NOOPT-NEXT: retq # sched: [7:1.00] ; ; JAG-NOOPT-LABEL: test_mul_by_14: ; JAG-NOOPT: # %bb.0: @@ -751,7 +751,7 @@ ; X64-HSW: # %bb.0: ; X64-HSW-NEXT: leaq (%rdi,%rdi,4), %rax # sched: [1:0.50] ; X64-HSW-NEXT: leaq (%rax,%rax,2), %rax # sched: [1:0.50] -; X64-HSW-NEXT: retq # sched: [2:1.00] +; X64-HSW-NEXT: retq # sched: [7:1.00] ; ; X64-JAG-LABEL: test_mul_by_15: ; X64-JAG: # %bb.0: @@ -770,7 +770,7 @@ ; HSW-NOOPT-LABEL: test_mul_by_15: ; HSW-NOOPT: # %bb.0: ; HSW-NOOPT-NEXT: imulq $15, %rdi, %rax # sched: [3:1.00] -; HSW-NOOPT-NEXT: retq # sched: [2:1.00] +; HSW-NOOPT-NEXT: retq # sched: [7:1.00] ; ; JAG-NOOPT-LABEL: test_mul_by_15: ; JAG-NOOPT: # %bb.0: @@ -804,7 +804,7 @@ ; X64-HSW: # %bb.0: ; X64-HSW-NEXT: shlq $4, %rdi # sched: [1:0.50] ; X64-HSW-NEXT: movq %rdi, %rax # sched: [1:0.25] -; X64-HSW-NEXT: retq # sched: [2:1.00] +; X64-HSW-NEXT: retq # sched: [7:1.00] ; ; X64-JAG-LABEL: test_mul_by_16: ; X64-JAG: # %bb.0: @@ -824,7 +824,7 @@ ; HSW-NOOPT: # %bb.0: ; HSW-NOOPT-NEXT: shlq $4, %rdi # sched: [1:0.50] ; HSW-NOOPT-NEXT: movq %rdi, %rax # sched: [1:0.25] -; HSW-NOOPT-NEXT: retq # sched: [2:1.00] +; HSW-NOOPT-NEXT: retq # sched: [7:1.00] ; ; JAG-NOOPT-LABEL: test_mul_by_16: ; JAG-NOOPT: # %bb.0: @@ -864,7 +864,7 @@ ; X64-HSW-NEXT: movq %rdi, %rax # sched: [1:0.25] ; X64-HSW-NEXT: shlq $4, %rax # sched: [1:0.50] ; X64-HSW-NEXT: leaq (%rax,%rdi), %rax # sched: [1:0.50] -; X64-HSW-NEXT: retq # sched: [2:1.00] +; X64-HSW-NEXT: retq # sched: [7:1.00] ; ; X64-JAG-LABEL: test_mul_by_17: ; X64-JAG: # %bb.0: @@ -884,7 +884,7 @@ ; HSW-NOOPT-LABEL: test_mul_by_17: ; HSW-NOOPT: # %bb.0: ; HSW-NOOPT-NEXT: imulq $17, %rdi, %rax # sched: [3:1.00] -; HSW-NOOPT-NEXT: retq # sched: [2:1.00] +; HSW-NOOPT-NEXT: retq # sched: [7:1.00] ; ; JAG-NOOPT-LABEL: test_mul_by_17: ; JAG-NOOPT: # %bb.0: @@ -920,7 +920,7 @@ ; X64-HSW: # %bb.0: ; X64-HSW-NEXT: addq %rdi, %rdi # sched: [1:0.25] ; X64-HSW-NEXT: leaq (%rdi,%rdi,8), %rax # sched: [1:0.50] -; X64-HSW-NEXT: retq # sched: [2:1.00] +; X64-HSW-NEXT: retq # sched: [7:1.00] ; ; X64-JAG-LABEL: test_mul_by_18: ; X64-JAG: # %bb.0: @@ -939,7 +939,7 @@ ; HSW-NOOPT-LABEL: test_mul_by_18: ; HSW-NOOPT: # %bb.0: ; HSW-NOOPT-NEXT: imulq $18, %rdi, %rax # sched: [3:1.00] -; HSW-NOOPT-NEXT: retq # sched: [2:1.00] +; HSW-NOOPT-NEXT: retq # sched: [7:1.00] ; ; JAG-NOOPT-LABEL: test_mul_by_18: ; JAG-NOOPT: # %bb.0: @@ -977,7 +977,7 @@ ; X64-HSW-NEXT: leaq (%rdi,%rdi,4), %rax # sched: [1:0.50] ; X64-HSW-NEXT: shlq $2, %rax # sched: [1:0.50] ; X64-HSW-NEXT: subq %rdi, %rax # sched: [1:0.25] -; X64-HSW-NEXT: retq # sched: [2:1.00] +; X64-HSW-NEXT: retq # sched: [7:1.00] ; ; X64-JAG-LABEL: test_mul_by_19: ; X64-JAG: # %bb.0: @@ -997,7 +997,7 @@ ; HSW-NOOPT-LABEL: test_mul_by_19: ; HSW-NOOPT: # %bb.0: ; HSW-NOOPT-NEXT: imulq $19, %rdi, %rax # sched: [3:1.00] -; HSW-NOOPT-NEXT: retq # sched: [2:1.00] +; HSW-NOOPT-NEXT: retq # sched: [7:1.00] ; ; JAG-NOOPT-LABEL: test_mul_by_19: ; JAG-NOOPT: # %bb.0: @@ -1031,7 +1031,7 @@ ; X64-HSW: # %bb.0: ; X64-HSW-NEXT: shlq $2, %rdi # sched: [1:0.50] ; X64-HSW-NEXT: leaq (%rdi,%rdi,4), %rax # sched: [1:0.50] -; X64-HSW-NEXT: retq # sched: [2:1.00] +; X64-HSW-NEXT: retq # sched: [7:1.00] ; ; X64-JAG-LABEL: test_mul_by_20: ; X64-JAG: # %bb.0: @@ -1050,7 +1050,7 @@ ; HSW-NOOPT-LABEL: test_mul_by_20: ; HSW-NOOPT: # %bb.0: ; HSW-NOOPT-NEXT: imulq $20, %rdi, %rax # sched: [3:1.00] -; HSW-NOOPT-NEXT: retq # sched: [2:1.00] +; HSW-NOOPT-NEXT: retq # sched: [7:1.00] ; ; JAG-NOOPT-LABEL: test_mul_by_20: ; JAG-NOOPT: # %bb.0: @@ -1086,7 +1086,7 @@ ; X64-HSW: # %bb.0: ; X64-HSW-NEXT: leaq (%rdi,%rdi,4), %rax # sched: [1:0.50] ; X64-HSW-NEXT: leaq (%rdi,%rax,4), %rax # sched: [1:0.50] -; X64-HSW-NEXT: retq # sched: [2:1.00] +; X64-HSW-NEXT: retq # sched: [7:1.00] ; ; X64-JAG-LABEL: test_mul_by_21: ; X64-JAG: # %bb.0: @@ -1105,7 +1105,7 @@ ; HSW-NOOPT-LABEL: test_mul_by_21: ; HSW-NOOPT: # %bb.0: ; HSW-NOOPT-NEXT: imulq $21, %rdi, %rax # sched: [3:1.00] -; HSW-NOOPT-NEXT: retq # sched: [2:1.00] +; HSW-NOOPT-NEXT: retq # sched: [7:1.00] ; ; JAG-NOOPT-LABEL: test_mul_by_21: ; JAG-NOOPT: # %bb.0: @@ -1142,7 +1142,7 @@ ; X64-HSW-NEXT: leaq (%rdi,%rdi,4), %rax # sched: [1:0.50] ; X64-HSW-NEXT: leaq (%rdi,%rax,4), %rax # sched: [1:0.50] ; X64-HSW-NEXT: addq %rdi, %rax # sched: [1:0.25] -; X64-HSW-NEXT: retq # sched: [2:1.00] +; X64-HSW-NEXT: retq # sched: [7:1.00] ; ; X64-JAG-LABEL: test_mul_by_22: ; X64-JAG: # %bb.0: @@ -1162,7 +1162,7 @@ ; HSW-NOOPT-LABEL: test_mul_by_22: ; HSW-NOOPT: # %bb.0: ; HSW-NOOPT-NEXT: imulq $22, %rdi, %rax # sched: [3:1.00] -; HSW-NOOPT-NEXT: retq # sched: [2:1.00] +; HSW-NOOPT-NEXT: retq # sched: [7:1.00] ; ; JAG-NOOPT-LABEL: test_mul_by_22: ; JAG-NOOPT: # %bb.0: @@ -1199,7 +1199,7 @@ ; X64-HSW-NEXT: leaq (%rdi,%rdi,2), %rax # sched: [1:0.50] ; X64-HSW-NEXT: shlq $3, %rax # sched: [1:0.50] ; X64-HSW-NEXT: subq %rdi, %rax # sched: [1:0.25] -; X64-HSW-NEXT: retq # sched: [2:1.00] +; X64-HSW-NEXT: retq # sched: [7:1.00] ; ; X64-JAG-LABEL: test_mul_by_23: ; X64-JAG: # %bb.0: @@ -1219,7 +1219,7 @@ ; HSW-NOOPT-LABEL: test_mul_by_23: ; HSW-NOOPT: # %bb.0: ; HSW-NOOPT-NEXT: imulq $23, %rdi, %rax # sched: [3:1.00] -; HSW-NOOPT-NEXT: retq # sched: [2:1.00] +; HSW-NOOPT-NEXT: retq # sched: [7:1.00] ; ; JAG-NOOPT-LABEL: test_mul_by_23: ; JAG-NOOPT: # %bb.0: @@ -1253,7 +1253,7 @@ ; X64-HSW: # %bb.0: ; X64-HSW-NEXT: shlq $3, %rdi # sched: [1:0.50] ; X64-HSW-NEXT: leaq (%rdi,%rdi,2), %rax # sched: [1:0.50] -; X64-HSW-NEXT: retq # sched: [2:1.00] +; X64-HSW-NEXT: retq # sched: [7:1.00] ; ; X64-JAG-LABEL: test_mul_by_24: ; X64-JAG: # %bb.0: @@ -1272,7 +1272,7 @@ ; HSW-NOOPT-LABEL: test_mul_by_24: ; HSW-NOOPT: # %bb.0: ; HSW-NOOPT-NEXT: imulq $24, %rdi, %rax # sched: [3:1.00] -; HSW-NOOPT-NEXT: retq # sched: [2:1.00] +; HSW-NOOPT-NEXT: retq # sched: [7:1.00] ; ; JAG-NOOPT-LABEL: test_mul_by_24: ; JAG-NOOPT: # %bb.0: @@ -1308,7 +1308,7 @@ ; X64-HSW: # %bb.0: ; X64-HSW-NEXT: leaq (%rdi,%rdi,4), %rax # sched: [1:0.50] ; X64-HSW-NEXT: leaq (%rax,%rax,4), %rax # sched: [1:0.50] -; X64-HSW-NEXT: retq # sched: [2:1.00] +; X64-HSW-NEXT: retq # sched: [7:1.00] ; ; X64-JAG-LABEL: test_mul_by_25: ; X64-JAG: # %bb.0: @@ -1327,7 +1327,7 @@ ; HSW-NOOPT-LABEL: test_mul_by_25: ; HSW-NOOPT: # %bb.0: ; HSW-NOOPT-NEXT: imulq $25, %rdi, %rax # sched: [3:1.00] -; HSW-NOOPT-NEXT: retq # sched: [2:1.00] +; HSW-NOOPT-NEXT: retq # sched: [7:1.00] ; ; JAG-NOOPT-LABEL: test_mul_by_25: ; JAG-NOOPT: # %bb.0: @@ -1365,7 +1365,7 @@ ; X64-HSW-NEXT: leaq (%rdi,%rdi,8), %rax # sched: [1:0.50] ; X64-HSW-NEXT: leaq (%rax,%rax,2), %rax # sched: [1:0.50] ; X64-HSW-NEXT: subq %rdi, %rax # sched: [1:0.25] -; X64-HSW-NEXT: retq # sched: [2:1.00] +; X64-HSW-NEXT: retq # sched: [7:1.00] ; ; X64-JAG-LABEL: test_mul_by_26: ; X64-JAG: # %bb.0: @@ -1385,7 +1385,7 @@ ; HSW-NOOPT-LABEL: test_mul_by_26: ; HSW-NOOPT: # %bb.0: ; HSW-NOOPT-NEXT: imulq $26, %rdi, %rax # sched: [3:1.00] -; HSW-NOOPT-NEXT: retq # sched: [2:1.00] +; HSW-NOOPT-NEXT: retq # sched: [7:1.00] ; ; JAG-NOOPT-LABEL: test_mul_by_26: ; JAG-NOOPT: # %bb.0: @@ -1420,7 +1420,7 @@ ; X64-HSW: # %bb.0: ; X64-HSW-NEXT: leaq (%rdi,%rdi,8), %rax # sched: [1:0.50] ; X64-HSW-NEXT: leaq (%rax,%rax,2), %rax # sched: [1:0.50] -; X64-HSW-NEXT: retq # sched: [2:1.00] +; X64-HSW-NEXT: retq # sched: [7:1.00] ; ; X64-JAG-LABEL: test_mul_by_27: ; X64-JAG: # %bb.0: @@ -1439,7 +1439,7 @@ ; HSW-NOOPT-LABEL: test_mul_by_27: ; HSW-NOOPT: # %bb.0: ; HSW-NOOPT-NEXT: imulq $27, %rdi, %rax # sched: [3:1.00] -; HSW-NOOPT-NEXT: retq # sched: [2:1.00] +; HSW-NOOPT-NEXT: retq # sched: [7:1.00] ; ; JAG-NOOPT-LABEL: test_mul_by_27: ; JAG-NOOPT: # %bb.0: @@ -1477,7 +1477,7 @@ ; X64-HSW-NEXT: leaq (%rdi,%rdi,8), %rax # sched: [1:0.50] ; X64-HSW-NEXT: leaq (%rax,%rax,2), %rax # sched: [1:0.50] ; X64-HSW-NEXT: addq %rdi, %rax # sched: [1:0.25] -; X64-HSW-NEXT: retq # sched: [2:1.00] +; X64-HSW-NEXT: retq # sched: [7:1.00] ; ; X64-JAG-LABEL: test_mul_by_28: ; X64-JAG: # %bb.0: @@ -1497,7 +1497,7 @@ ; HSW-NOOPT-LABEL: test_mul_by_28: ; HSW-NOOPT: # %bb.0: ; HSW-NOOPT-NEXT: imulq $28, %rdi, %rax # sched: [3:1.00] -; HSW-NOOPT-NEXT: retq # sched: [2:1.00] +; HSW-NOOPT-NEXT: retq # sched: [7:1.00] ; ; JAG-NOOPT-LABEL: test_mul_by_28: ; JAG-NOOPT: # %bb.0: @@ -1536,7 +1536,7 @@ ; X64-HSW-NEXT: leaq (%rax,%rax,2), %rax # sched: [1:0.50] ; X64-HSW-NEXT: addq %rdi, %rax # sched: [1:0.25] ; X64-HSW-NEXT: addq %rdi, %rax # sched: [1:0.25] -; X64-HSW-NEXT: retq # sched: [2:1.00] +; X64-HSW-NEXT: retq # sched: [7:1.00] ; ; X64-JAG-LABEL: test_mul_by_29: ; X64-JAG: # %bb.0: @@ -1557,7 +1557,7 @@ ; HSW-NOOPT-LABEL: test_mul_by_29: ; HSW-NOOPT: # %bb.0: ; HSW-NOOPT-NEXT: imulq $29, %rdi, %rax # sched: [3:1.00] -; HSW-NOOPT-NEXT: retq # sched: [2:1.00] +; HSW-NOOPT-NEXT: retq # sched: [7:1.00] ; ; JAG-NOOPT-LABEL: test_mul_by_29: ; JAG-NOOPT: # %bb.0: @@ -1596,7 +1596,7 @@ ; X64-HSW-NEXT: shlq $5, %rax # sched: [1:0.50] ; X64-HSW-NEXT: subq %rdi, %rax # sched: [1:0.25] ; X64-HSW-NEXT: subq %rdi, %rax # sched: [1:0.25] -; X64-HSW-NEXT: retq # sched: [2:1.00] +; X64-HSW-NEXT: retq # sched: [7:1.00] ; ; X64-JAG-LABEL: test_mul_by_30: ; X64-JAG: # %bb.0: @@ -1617,7 +1617,7 @@ ; HSW-NOOPT-LABEL: test_mul_by_30: ; HSW-NOOPT: # %bb.0: ; HSW-NOOPT-NEXT: imulq $30, %rdi, %rax # sched: [3:1.00] -; HSW-NOOPT-NEXT: retq # sched: [2:1.00] +; HSW-NOOPT-NEXT: retq # sched: [7:1.00] ; ; JAG-NOOPT-LABEL: test_mul_by_30: ; JAG-NOOPT: # %bb.0: @@ -1654,7 +1654,7 @@ ; X64-HSW-NEXT: movq %rdi, %rax # sched: [1:0.25] ; X64-HSW-NEXT: shlq $5, %rax # sched: [1:0.50] ; X64-HSW-NEXT: subq %rdi, %rax # sched: [1:0.25] -; X64-HSW-NEXT: retq # sched: [2:1.00] +; X64-HSW-NEXT: retq # sched: [7:1.00] ; ; X64-JAG-LABEL: test_mul_by_31: ; X64-JAG: # %bb.0: @@ -1674,7 +1674,7 @@ ; HSW-NOOPT-LABEL: test_mul_by_31: ; HSW-NOOPT: # %bb.0: ; HSW-NOOPT-NEXT: imulq $31, %rdi, %rax # sched: [3:1.00] -; HSW-NOOPT-NEXT: retq # sched: [2:1.00] +; HSW-NOOPT-NEXT: retq # sched: [7:1.00] ; ; JAG-NOOPT-LABEL: test_mul_by_31: ; JAG-NOOPT: # %bb.0: @@ -1709,7 +1709,7 @@ ; X64-HSW: # %bb.0: ; X64-HSW-NEXT: shlq $5, %rdi # sched: [1:0.50] ; X64-HSW-NEXT: movq %rdi, %rax # sched: [1:0.25] -; X64-HSW-NEXT: retq # sched: [2:1.00] +; X64-HSW-NEXT: retq # sched: [7:1.00] ; ; X64-JAG-LABEL: test_mul_by_32: ; X64-JAG: # %bb.0: @@ -1729,7 +1729,7 @@ ; HSW-NOOPT: # %bb.0: ; HSW-NOOPT-NEXT: shlq $5, %rdi # sched: [1:0.50] ; HSW-NOOPT-NEXT: movq %rdi, %rax # sched: [1:0.25] -; HSW-NOOPT-NEXT: retq # sched: [2:1.00] +; HSW-NOOPT-NEXT: retq # sched: [7:1.00] ; ; JAG-NOOPT-LABEL: test_mul_by_32: ; JAG-NOOPT: # %bb.0: @@ -1793,7 +1793,7 @@ ; X64-HSW-NEXT: leaq (%rdi,%rdi,4), %rax # sched: [1:0.50] ; X64-HSW-NEXT: addq $2, %rax # sched: [1:0.25] ; X64-HSW-NEXT: imulq %rcx, %rax # sched: [4:1.00] -; X64-HSW-NEXT: retq # sched: [2:1.00] +; X64-HSW-NEXT: retq # sched: [7:1.00] ; ; X64-JAG-LABEL: test_mul_spec: ; X64-JAG: # %bb.0: @@ -1841,7 +1841,7 @@ ; HSW-NOOPT-NEXT: leaq (%rdi,%rdi,4), %rax # sched: [1:0.50] ; HSW-NOOPT-NEXT: addq $2, %rax # sched: [1:0.25] ; HSW-NOOPT-NEXT: imulq %rcx, %rax # sched: [4:1.00] -; HSW-NOOPT-NEXT: retq # sched: [2:1.00] +; HSW-NOOPT-NEXT: retq # sched: [7:1.00] ; ; JAG-NOOPT-LABEL: test_mul_spec: ; JAG-NOOPT: # %bb.0: Index: test/CodeGen/X86/popcnt-schedule.ll =================================================================== --- test/CodeGen/X86/popcnt-schedule.ll +++ test/CodeGen/X86/popcnt-schedule.ll @@ -38,11 +38,11 @@ ; ; HASWELL-LABEL: test_ctpop_i16: ; HASWELL: # %bb.0: -; HASWELL-NEXT: popcntw (%rsi), %cx # sched: [3:1.00] +; HASWELL-NEXT: popcntw (%rsi), %cx # sched: [8:1.00] ; HASWELL-NEXT: popcntw %di, %ax # sched: [3:1.00] ; HASWELL-NEXT: orl %ecx, %eax # sched: [1:0.25] ; HASWELL-NEXT: # kill: %ax %ax %eax -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_ctpop_i16: ; BROADWELL: # %bb.0: @@ -107,10 +107,10 @@ ; ; HASWELL-LABEL: test_ctpop_i32: ; HASWELL: # %bb.0: -; HASWELL-NEXT: popcntl (%rsi), %ecx # sched: [3:1.00] +; HASWELL-NEXT: popcntl (%rsi), %ecx # sched: [8:1.00] ; HASWELL-NEXT: popcntl %edi, %eax # sched: [3:1.00] ; HASWELL-NEXT: orl %ecx, %eax # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_ctpop_i32: ; BROADWELL: # %bb.0: @@ -171,10 +171,10 @@ ; ; HASWELL-LABEL: test_ctpop_i64: ; HASWELL: # %bb.0: -; HASWELL-NEXT: popcntq (%rsi), %rcx # sched: [3:1.00] +; HASWELL-NEXT: popcntq (%rsi), %rcx # sched: [8:1.00] ; HASWELL-NEXT: popcntq %rdi, %rax # sched: [3:1.00] ; HASWELL-NEXT: orq %rcx, %rax # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_ctpop_i64: ; BROADWELL: # %bb.0: Index: test/CodeGen/X86/recip-fastmath.ll =================================================================== --- test/CodeGen/X86/recip-fastmath.ll +++ test/CodeGen/X86/recip-fastmath.ll @@ -51,9 +51,9 @@ ; ; HASWELL-LABEL: f32_no_estimate: ; HASWELL: # %bb.0: -; HASWELL-NEXT: vmovss {{.*#+}} xmm1 = mem[0],zero,zero,zero sched: [1:0.50] +; HASWELL-NEXT: vmovss {{.*#+}} xmm1 = mem[0],zero,zero,zero sched: [5:0.50] ; HASWELL-NEXT: vdivss %xmm0, %xmm1, %xmm0 # sched: [13:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; HASWELL-NO-FMA-LABEL: f32_no_estimate: ; HASWELL-NO-FMA: # %bb.0: @@ -63,9 +63,9 @@ ; ; KNL-LABEL: f32_no_estimate: ; KNL: # %bb.0: -; KNL-NEXT: vmovss {{.*#+}} xmm1 = mem[0],zero,zero,zero sched: [1:0.50] +; KNL-NEXT: vmovss {{.*#+}} xmm1 = mem[0],zero,zero,zero sched: [5:0.50] ; KNL-NEXT: vdivss %xmm0, %xmm1, %xmm0 # sched: [13:1.00] -; KNL-NEXT: retq # sched: [2:1.00] +; KNL-NEXT: retq # sched: [7:1.00] ; ; SKX-LABEL: f32_no_estimate: ; SKX: # %bb.0: @@ -128,9 +128,9 @@ ; HASWELL-LABEL: f32_one_step: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vrcpss %xmm0, %xmm0, %xmm1 # sched: [5:1.00] -; HASWELL-NEXT: vfnmadd213ss {{.*}}(%rip), %xmm1, %xmm0 # sched: [5:0.50] +; HASWELL-NEXT: vfnmadd213ss {{.*}}(%rip), %xmm1, %xmm0 # sched: [10:0.50] ; HASWELL-NEXT: vfmadd132ss %xmm1, %xmm1, %xmm0 # sched: [5:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; HASWELL-NO-FMA-LABEL: f32_one_step: ; HASWELL-NO-FMA: # %bb.0: @@ -145,9 +145,9 @@ ; KNL-LABEL: f32_one_step: ; KNL: # %bb.0: ; KNL-NEXT: vrcpss %xmm0, %xmm0, %xmm1 # sched: [5:1.00] -; KNL-NEXT: vfnmadd213ss {{.*}}(%rip), %xmm1, %xmm0 # sched: [5:0.50] +; KNL-NEXT: vfnmadd213ss {{.*}}(%rip), %xmm1, %xmm0 # sched: [10:0.50] ; KNL-NEXT: vfmadd132ss %xmm1, %xmm1, %xmm0 # sched: [5:0.50] -; KNL-NEXT: retq # sched: [2:1.00] +; KNL-NEXT: retq # sched: [7:1.00] ; ; SKX-LABEL: f32_one_step: ; SKX: # %bb.0: @@ -233,13 +233,13 @@ ; HASWELL-LABEL: f32_two_step: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vrcpss %xmm0, %xmm0, %xmm1 # sched: [5:1.00] -; HASWELL-NEXT: vmovss {{.*#+}} xmm2 = mem[0],zero,zero,zero sched: [1:0.50] +; HASWELL-NEXT: vmovss {{.*#+}} xmm2 = mem[0],zero,zero,zero sched: [5:0.50] ; HASWELL-NEXT: vmovaps %xmm1, %xmm3 # sched: [1:1.00] ; HASWELL-NEXT: vfnmadd213ss %xmm2, %xmm0, %xmm3 # sched: [5:0.50] ; HASWELL-NEXT: vfmadd132ss %xmm1, %xmm1, %xmm3 # sched: [5:0.50] ; HASWELL-NEXT: vfnmadd213ss %xmm2, %xmm3, %xmm0 # sched: [5:0.50] ; HASWELL-NEXT: vfmadd132ss %xmm3, %xmm3, %xmm0 # sched: [5:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; HASWELL-NO-FMA-LABEL: f32_two_step: ; HASWELL-NO-FMA: # %bb.0: @@ -258,13 +258,13 @@ ; KNL-LABEL: f32_two_step: ; KNL: # %bb.0: ; KNL-NEXT: vrcpss %xmm0, %xmm0, %xmm1 # sched: [5:1.00] -; KNL-NEXT: vmovss {{.*#+}} xmm2 = mem[0],zero,zero,zero sched: [1:0.50] +; KNL-NEXT: vmovss {{.*#+}} xmm2 = mem[0],zero,zero,zero sched: [5:0.50] ; KNL-NEXT: vmovaps %xmm1, %xmm3 # sched: [1:1.00] ; KNL-NEXT: vfnmadd213ss %xmm2, %xmm0, %xmm3 # sched: [5:0.50] ; KNL-NEXT: vfmadd132ss %xmm1, %xmm1, %xmm3 # sched: [5:0.50] ; KNL-NEXT: vfnmadd213ss %xmm2, %xmm3, %xmm0 # sched: [5:0.50] ; KNL-NEXT: vfmadd132ss %xmm3, %xmm3, %xmm0 # sched: [5:0.50] -; KNL-NEXT: retq # sched: [2:1.00] +; KNL-NEXT: retq # sched: [7:1.00] ; ; SKX-LABEL: f32_two_step: ; SKX: # %bb.0: @@ -314,9 +314,9 @@ ; ; HASWELL-LABEL: v4f32_no_estimate: ; HASWELL: # %bb.0: -; HASWELL-NEXT: vbroadcastss {{.*#+}} xmm1 = [1,1,1,1] sched: [1:0.50] +; HASWELL-NEXT: vbroadcastss {{.*#+}} xmm1 = [1,1,1,1] sched: [6:0.50] ; HASWELL-NEXT: vdivps %xmm0, %xmm1, %xmm0 # sched: [13:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; HASWELL-NO-FMA-LABEL: v4f32_no_estimate: ; HASWELL-NO-FMA: # %bb.0: @@ -326,9 +326,9 @@ ; ; KNL-LABEL: v4f32_no_estimate: ; KNL: # %bb.0: -; KNL-NEXT: vbroadcastss {{.*#+}} xmm1 = [1,1,1,1] sched: [1:0.50] +; KNL-NEXT: vbroadcastss {{.*#+}} xmm1 = [1,1,1,1] sched: [6:0.50] ; KNL-NEXT: vdivps %xmm0, %xmm1, %xmm0 # sched: [13:1.00] -; KNL-NEXT: retq # sched: [2:1.00] +; KNL-NEXT: retq # sched: [7:1.00] ; ; SKX-LABEL: v4f32_no_estimate: ; SKX: # %bb.0: @@ -391,10 +391,10 @@ ; HASWELL-LABEL: v4f32_one_step: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vrcpps %xmm0, %xmm1 # sched: [5:1.00] -; HASWELL-NEXT: vbroadcastss {{.*#+}} xmm2 = [1,1,1,1] sched: [1:0.50] +; HASWELL-NEXT: vbroadcastss {{.*#+}} xmm2 = [1,1,1,1] sched: [6:0.50] ; HASWELL-NEXT: vfnmadd213ps %xmm2, %xmm1, %xmm0 # sched: [5:0.50] ; HASWELL-NEXT: vfmadd132ps %xmm1, %xmm1, %xmm0 # sched: [5:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; HASWELL-NO-FMA-LABEL: v4f32_one_step: ; HASWELL-NO-FMA: # %bb.0: @@ -409,10 +409,10 @@ ; KNL-LABEL: v4f32_one_step: ; KNL: # %bb.0: ; KNL-NEXT: vrcpps %xmm0, %xmm1 # sched: [5:1.00] -; KNL-NEXT: vbroadcastss {{.*#+}} xmm2 = [1,1,1,1] sched: [1:0.50] +; KNL-NEXT: vbroadcastss {{.*#+}} xmm2 = [1,1,1,1] sched: [6:0.50] ; KNL-NEXT: vfnmadd213ps %xmm2, %xmm1, %xmm0 # sched: [5:0.50] ; KNL-NEXT: vfmadd132ps %xmm1, %xmm1, %xmm0 # sched: [5:0.50] -; KNL-NEXT: retq # sched: [2:1.00] +; KNL-NEXT: retq # sched: [7:1.00] ; ; SKX-LABEL: v4f32_one_step: ; SKX: # %bb.0: @@ -498,13 +498,13 @@ ; HASWELL-LABEL: v4f32_two_step: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vrcpps %xmm0, %xmm1 # sched: [5:1.00] -; HASWELL-NEXT: vbroadcastss {{.*#+}} xmm2 = [1,1,1,1] sched: [1:0.50] +; HASWELL-NEXT: vbroadcastss {{.*#+}} xmm2 = [1,1,1,1] sched: [6:0.50] ; HASWELL-NEXT: vmovaps %xmm1, %xmm3 # sched: [1:1.00] ; HASWELL-NEXT: vfnmadd213ps %xmm2, %xmm0, %xmm3 # sched: [5:0.50] ; HASWELL-NEXT: vfmadd132ps %xmm1, %xmm1, %xmm3 # sched: [5:0.50] ; HASWELL-NEXT: vfnmadd213ps %xmm2, %xmm3, %xmm0 # sched: [5:0.50] ; HASWELL-NEXT: vfmadd132ps %xmm3, %xmm3, %xmm0 # sched: [5:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; HASWELL-NO-FMA-LABEL: v4f32_two_step: ; HASWELL-NO-FMA: # %bb.0: @@ -523,13 +523,13 @@ ; KNL-LABEL: v4f32_two_step: ; KNL: # %bb.0: ; KNL-NEXT: vrcpps %xmm0, %xmm1 # sched: [5:1.00] -; KNL-NEXT: vbroadcastss {{.*#+}} xmm2 = [1,1,1,1] sched: [1:0.50] +; KNL-NEXT: vbroadcastss {{.*#+}} xmm2 = [1,1,1,1] sched: [6:0.50] ; KNL-NEXT: vmovaps %xmm1, %xmm3 # sched: [1:1.00] ; KNL-NEXT: vfnmadd213ps %xmm2, %xmm0, %xmm3 # sched: [5:0.50] ; KNL-NEXT: vfmadd132ps %xmm1, %xmm1, %xmm3 # sched: [5:0.50] ; KNL-NEXT: vfnmadd213ps %xmm2, %xmm3, %xmm0 # sched: [5:0.50] ; KNL-NEXT: vfmadd132ps %xmm3, %xmm3, %xmm0 # sched: [5:0.50] -; KNL-NEXT: retq # sched: [2:1.00] +; KNL-NEXT: retq # sched: [7:1.00] ; ; SKX-LABEL: v4f32_two_step: ; SKX: # %bb.0: @@ -582,9 +582,9 @@ ; ; HASWELL-LABEL: v8f32_no_estimate: ; HASWELL: # %bb.0: -; HASWELL-NEXT: vbroadcastss {{.*#+}} ymm1 = [1,1,1,1,1,1,1,1] sched: [1:0.50] +; HASWELL-NEXT: vbroadcastss {{.*#+}} ymm1 = [1,1,1,1,1,1,1,1] sched: [7:0.50] ; HASWELL-NEXT: vdivps %ymm0, %ymm1, %ymm0 # sched: [21:2.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; HASWELL-NO-FMA-LABEL: v8f32_no_estimate: ; HASWELL-NO-FMA: # %bb.0: @@ -594,9 +594,9 @@ ; ; KNL-LABEL: v8f32_no_estimate: ; KNL: # %bb.0: -; KNL-NEXT: vbroadcastss {{.*#+}} ymm1 = [1,1,1,1,1,1,1,1] sched: [1:0.50] +; KNL-NEXT: vbroadcastss {{.*#+}} ymm1 = [1,1,1,1,1,1,1,1] sched: [7:0.50] ; KNL-NEXT: vdivps %ymm0, %ymm1, %ymm0 # sched: [21:2.00] -; KNL-NEXT: retq # sched: [2:1.00] +; KNL-NEXT: retq # sched: [7:1.00] ; ; SKX-LABEL: v8f32_no_estimate: ; SKX: # %bb.0: @@ -666,10 +666,10 @@ ; HASWELL-LABEL: v8f32_one_step: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vrcpps %ymm0, %ymm1 # sched: [11:2.00] -; HASWELL-NEXT: vbroadcastss {{.*#+}} ymm2 = [1,1,1,1,1,1,1,1] sched: [1:0.50] +; HASWELL-NEXT: vbroadcastss {{.*#+}} ymm2 = [1,1,1,1,1,1,1,1] sched: [7:0.50] ; HASWELL-NEXT: vfnmadd213ps %ymm2, %ymm1, %ymm0 # sched: [5:0.50] ; HASWELL-NEXT: vfmadd132ps %ymm1, %ymm1, %ymm0 # sched: [5:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; HASWELL-NO-FMA-LABEL: v8f32_one_step: ; HASWELL-NO-FMA: # %bb.0: @@ -684,10 +684,10 @@ ; KNL-LABEL: v8f32_one_step: ; KNL: # %bb.0: ; KNL-NEXT: vrcpps %ymm0, %ymm1 # sched: [11:2.00] -; KNL-NEXT: vbroadcastss {{.*#+}} ymm2 = [1,1,1,1,1,1,1,1] sched: [1:0.50] +; KNL-NEXT: vbroadcastss {{.*#+}} ymm2 = [1,1,1,1,1,1,1,1] sched: [7:0.50] ; KNL-NEXT: vfnmadd213ps %ymm2, %ymm1, %ymm0 # sched: [5:0.50] ; KNL-NEXT: vfmadd132ps %ymm1, %ymm1, %ymm0 # sched: [5:0.50] -; KNL-NEXT: retq # sched: [2:1.00] +; KNL-NEXT: retq # sched: [7:1.00] ; ; SKX-LABEL: v8f32_one_step: ; SKX: # %bb.0: @@ -786,13 +786,13 @@ ; HASWELL-LABEL: v8f32_two_step: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vrcpps %ymm0, %ymm1 # sched: [11:2.00] -; HASWELL-NEXT: vbroadcastss {{.*#+}} ymm2 = [1,1,1,1,1,1,1,1] sched: [1:0.50] +; HASWELL-NEXT: vbroadcastss {{.*#+}} ymm2 = [1,1,1,1,1,1,1,1] sched: [7:0.50] ; HASWELL-NEXT: vmovaps %ymm1, %ymm3 # sched: [1:1.00] ; HASWELL-NEXT: vfnmadd213ps %ymm2, %ymm0, %ymm3 # sched: [5:0.50] ; HASWELL-NEXT: vfmadd132ps %ymm1, %ymm1, %ymm3 # sched: [5:0.50] ; HASWELL-NEXT: vfnmadd213ps %ymm2, %ymm3, %ymm0 # sched: [5:0.50] ; HASWELL-NEXT: vfmadd132ps %ymm3, %ymm3, %ymm0 # sched: [5:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; HASWELL-NO-FMA-LABEL: v8f32_two_step: ; HASWELL-NO-FMA: # %bb.0: @@ -811,13 +811,13 @@ ; KNL-LABEL: v8f32_two_step: ; KNL: # %bb.0: ; KNL-NEXT: vrcpps %ymm0, %ymm1 # sched: [11:2.00] -; KNL-NEXT: vbroadcastss {{.*#+}} ymm2 = [1,1,1,1,1,1,1,1] sched: [1:0.50] +; KNL-NEXT: vbroadcastss {{.*#+}} ymm2 = [1,1,1,1,1,1,1,1] sched: [7:0.50] ; KNL-NEXT: vmovaps %ymm1, %ymm3 # sched: [1:1.00] ; KNL-NEXT: vfnmadd213ps %ymm2, %ymm0, %ymm3 # sched: [5:0.50] ; KNL-NEXT: vfmadd132ps %ymm1, %ymm1, %ymm3 # sched: [5:0.50] ; KNL-NEXT: vfnmadd213ps %ymm2, %ymm3, %ymm0 # sched: [5:0.50] ; KNL-NEXT: vfmadd132ps %ymm3, %ymm3, %ymm0 # sched: [5:0.50] -; KNL-NEXT: retq # sched: [2:1.00] +; KNL-NEXT: retq # sched: [7:1.00] ; ; SKX-LABEL: v8f32_two_step: ; SKX: # %bb.0: Index: test/CodeGen/X86/recip-fastmath2.ll =================================================================== --- test/CodeGen/X86/recip-fastmath2.ll +++ test/CodeGen/X86/recip-fastmath2.ll @@ -45,20 +45,20 @@ ; HASWELL-LABEL: f32_no_step_2: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vrcpss %xmm0, %xmm0, %xmm0 # sched: [5:1.00] -; HASWELL-NEXT: vmulss {{.*}}(%rip), %xmm0, %xmm0 # sched: [5:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vmulss {{.*}}(%rip), %xmm0, %xmm0 # sched: [10:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; HASWELL-NO-FMA-LABEL: f32_no_step_2: ; HASWELL-NO-FMA: # %bb.0: ; HASWELL-NO-FMA-NEXT: vrcpss %xmm0, %xmm0, %xmm0 # sched: [5:1.00] -; HASWELL-NO-FMA-NEXT: vmulss {{.*}}(%rip), %xmm0, %xmm0 # sched: [5:0.50] -; HASWELL-NO-FMA-NEXT: retq # sched: [2:1.00] +; HASWELL-NO-FMA-NEXT: vmulss {{.*}}(%rip), %xmm0, %xmm0 # sched: [10:0.50] +; HASWELL-NO-FMA-NEXT: retq # sched: [7:1.00] ; ; KNL-LABEL: f32_no_step_2: ; KNL: # %bb.0: ; KNL-NEXT: vrcpss %xmm0, %xmm0, %xmm0 # sched: [5:1.00] -; KNL-NEXT: vmulss {{.*}}(%rip), %xmm0, %xmm0 # sched: [5:0.50] -; KNL-NEXT: retq # sched: [2:1.00] +; KNL-NEXT: vmulss {{.*}}(%rip), %xmm0, %xmm0 # sched: [10:0.50] +; KNL-NEXT: retq # sched: [7:1.00] ; ; SKX-LABEL: f32_no_step_2: ; SKX: # %bb.0: @@ -126,29 +126,29 @@ ; HASWELL-LABEL: f32_one_step_2: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vrcpss %xmm0, %xmm0, %xmm1 # sched: [5:1.00] -; HASWELL-NEXT: vfnmadd213ss {{.*}}(%rip), %xmm1, %xmm0 # sched: [5:0.50] +; HASWELL-NEXT: vfnmadd213ss {{.*}}(%rip), %xmm1, %xmm0 # sched: [10:0.50] ; HASWELL-NEXT: vfmadd132ss %xmm1, %xmm1, %xmm0 # sched: [5:0.50] -; HASWELL-NEXT: vmulss {{.*}}(%rip), %xmm0, %xmm0 # sched: [5:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vmulss {{.*}}(%rip), %xmm0, %xmm0 # sched: [10:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; HASWELL-NO-FMA-LABEL: f32_one_step_2: ; HASWELL-NO-FMA: # %bb.0: ; HASWELL-NO-FMA-NEXT: vrcpss %xmm0, %xmm0, %xmm1 # sched: [5:1.00] ; HASWELL-NO-FMA-NEXT: vmulss %xmm1, %xmm0, %xmm0 # sched: [5:0.50] -; HASWELL-NO-FMA-NEXT: vmovss {{.*#+}} xmm2 = mem[0],zero,zero,zero sched: [1:0.50] +; HASWELL-NO-FMA-NEXT: vmovss {{.*#+}} xmm2 = mem[0],zero,zero,zero sched: [5:0.50] ; HASWELL-NO-FMA-NEXT: vsubss %xmm0, %xmm2, %xmm0 # sched: [3:1.00] ; HASWELL-NO-FMA-NEXT: vmulss %xmm0, %xmm1, %xmm0 # sched: [5:0.50] ; HASWELL-NO-FMA-NEXT: vaddss %xmm0, %xmm1, %xmm0 # sched: [3:1.00] -; HASWELL-NO-FMA-NEXT: vmulss {{.*}}(%rip), %xmm0, %xmm0 # sched: [5:0.50] -; HASWELL-NO-FMA-NEXT: retq # sched: [2:1.00] +; HASWELL-NO-FMA-NEXT: vmulss {{.*}}(%rip), %xmm0, %xmm0 # sched: [10:0.50] +; HASWELL-NO-FMA-NEXT: retq # sched: [7:1.00] ; ; KNL-LABEL: f32_one_step_2: ; KNL: # %bb.0: ; KNL-NEXT: vrcpss %xmm0, %xmm0, %xmm1 # sched: [5:1.00] -; KNL-NEXT: vfnmadd213ss {{.*}}(%rip), %xmm1, %xmm0 # sched: [5:0.50] +; KNL-NEXT: vfnmadd213ss {{.*}}(%rip), %xmm1, %xmm0 # sched: [10:0.50] ; KNL-NEXT: vfmadd132ss %xmm1, %xmm1, %xmm0 # sched: [5:0.50] -; KNL-NEXT: vmulss {{.*}}(%rip), %xmm0, %xmm0 # sched: [5:0.50] -; KNL-NEXT: retq # sched: [2:1.00] +; KNL-NEXT: vmulss {{.*}}(%rip), %xmm0, %xmm0 # sched: [10:0.50] +; KNL-NEXT: retq # sched: [7:1.00] ; ; SKX-LABEL: f32_one_step_2: ; SKX: # %bb.0: @@ -223,32 +223,32 @@ ; HASWELL-LABEL: f32_one_step_2_divs: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vrcpss %xmm0, %xmm0, %xmm1 # sched: [5:1.00] -; HASWELL-NEXT: vfnmadd213ss {{.*}}(%rip), %xmm1, %xmm0 # sched: [5:0.50] +; HASWELL-NEXT: vfnmadd213ss {{.*}}(%rip), %xmm1, %xmm0 # sched: [10:0.50] ; HASWELL-NEXT: vfmadd132ss %xmm1, %xmm1, %xmm0 # sched: [5:0.50] -; HASWELL-NEXT: vmulss {{.*}}(%rip), %xmm0, %xmm1 # sched: [5:0.50] +; HASWELL-NEXT: vmulss {{.*}}(%rip), %xmm0, %xmm1 # sched: [10:0.50] ; HASWELL-NEXT: vmulss %xmm0, %xmm1, %xmm0 # sched: [5:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; HASWELL-NO-FMA-LABEL: f32_one_step_2_divs: ; HASWELL-NO-FMA: # %bb.0: ; HASWELL-NO-FMA-NEXT: vrcpss %xmm0, %xmm0, %xmm1 # sched: [5:1.00] ; HASWELL-NO-FMA-NEXT: vmulss %xmm1, %xmm0, %xmm0 # sched: [5:0.50] -; HASWELL-NO-FMA-NEXT: vmovss {{.*#+}} xmm2 = mem[0],zero,zero,zero sched: [1:0.50] +; HASWELL-NO-FMA-NEXT: vmovss {{.*#+}} xmm2 = mem[0],zero,zero,zero sched: [5:0.50] ; HASWELL-NO-FMA-NEXT: vsubss %xmm0, %xmm2, %xmm0 # sched: [3:1.00] ; HASWELL-NO-FMA-NEXT: vmulss %xmm0, %xmm1, %xmm0 # sched: [5:0.50] ; HASWELL-NO-FMA-NEXT: vaddss %xmm0, %xmm1, %xmm0 # sched: [3:1.00] -; HASWELL-NO-FMA-NEXT: vmulss {{.*}}(%rip), %xmm0, %xmm1 # sched: [5:0.50] +; HASWELL-NO-FMA-NEXT: vmulss {{.*}}(%rip), %xmm0, %xmm1 # sched: [10:0.50] ; HASWELL-NO-FMA-NEXT: vmulss %xmm0, %xmm1, %xmm0 # sched: [5:0.50] -; HASWELL-NO-FMA-NEXT: retq # sched: [2:1.00] +; HASWELL-NO-FMA-NEXT: retq # sched: [7:1.00] ; ; KNL-LABEL: f32_one_step_2_divs: ; KNL: # %bb.0: ; KNL-NEXT: vrcpss %xmm0, %xmm0, %xmm1 # sched: [5:1.00] -; KNL-NEXT: vfnmadd213ss {{.*}}(%rip), %xmm1, %xmm0 # sched: [5:0.50] +; KNL-NEXT: vfnmadd213ss {{.*}}(%rip), %xmm1, %xmm0 # sched: [10:0.50] ; KNL-NEXT: vfmadd132ss %xmm1, %xmm1, %xmm0 # sched: [5:0.50] -; KNL-NEXT: vmulss {{.*}}(%rip), %xmm0, %xmm1 # sched: [5:0.50] +; KNL-NEXT: vmulss {{.*}}(%rip), %xmm0, %xmm1 # sched: [10:0.50] ; KNL-NEXT: vmulss %xmm0, %xmm1, %xmm0 # sched: [5:0.50] -; KNL-NEXT: retq # sched: [2:1.00] +; KNL-NEXT: retq # sched: [7:1.00] ; ; SKX-LABEL: f32_one_step_2_divs: ; SKX: # %bb.0: @@ -342,20 +342,20 @@ ; HASWELL-LABEL: f32_two_step_2: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vrcpss %xmm0, %xmm0, %xmm1 # sched: [5:1.00] -; HASWELL-NEXT: vmovss {{.*#+}} xmm2 = mem[0],zero,zero,zero sched: [1:0.50] +; HASWELL-NEXT: vmovss {{.*#+}} xmm2 = mem[0],zero,zero,zero sched: [5:0.50] ; HASWELL-NEXT: vmovaps %xmm1, %xmm3 # sched: [1:1.00] ; HASWELL-NEXT: vfnmadd213ss %xmm2, %xmm0, %xmm3 # sched: [5:0.50] ; HASWELL-NEXT: vfmadd132ss %xmm1, %xmm1, %xmm3 # sched: [5:0.50] ; HASWELL-NEXT: vfnmadd213ss %xmm2, %xmm3, %xmm0 # sched: [5:0.50] ; HASWELL-NEXT: vfmadd132ss %xmm3, %xmm3, %xmm0 # sched: [5:0.50] -; HASWELL-NEXT: vmulss {{.*}}(%rip), %xmm0, %xmm0 # sched: [5:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vmulss {{.*}}(%rip), %xmm0, %xmm0 # sched: [10:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; HASWELL-NO-FMA-LABEL: f32_two_step_2: ; HASWELL-NO-FMA: # %bb.0: ; HASWELL-NO-FMA-NEXT: vrcpss %xmm0, %xmm0, %xmm1 # sched: [5:1.00] ; HASWELL-NO-FMA-NEXT: vmulss %xmm1, %xmm0, %xmm2 # sched: [5:0.50] -; HASWELL-NO-FMA-NEXT: vmovss {{.*#+}} xmm3 = mem[0],zero,zero,zero sched: [1:0.50] +; HASWELL-NO-FMA-NEXT: vmovss {{.*#+}} xmm3 = mem[0],zero,zero,zero sched: [5:0.50] ; HASWELL-NO-FMA-NEXT: vsubss %xmm2, %xmm3, %xmm2 # sched: [3:1.00] ; HASWELL-NO-FMA-NEXT: vmulss %xmm2, %xmm1, %xmm2 # sched: [5:0.50] ; HASWELL-NO-FMA-NEXT: vaddss %xmm2, %xmm1, %xmm1 # sched: [3:1.00] @@ -363,20 +363,20 @@ ; HASWELL-NO-FMA-NEXT: vsubss %xmm0, %xmm3, %xmm0 # sched: [3:1.00] ; HASWELL-NO-FMA-NEXT: vmulss %xmm0, %xmm1, %xmm0 # sched: [5:0.50] ; HASWELL-NO-FMA-NEXT: vaddss %xmm0, %xmm1, %xmm0 # sched: [3:1.00] -; HASWELL-NO-FMA-NEXT: vmulss {{.*}}(%rip), %xmm0, %xmm0 # sched: [5:0.50] -; HASWELL-NO-FMA-NEXT: retq # sched: [2:1.00] +; HASWELL-NO-FMA-NEXT: vmulss {{.*}}(%rip), %xmm0, %xmm0 # sched: [10:0.50] +; HASWELL-NO-FMA-NEXT: retq # sched: [7:1.00] ; ; KNL-LABEL: f32_two_step_2: ; KNL: # %bb.0: ; KNL-NEXT: vrcpss %xmm0, %xmm0, %xmm1 # sched: [5:1.00] -; KNL-NEXT: vmovss {{.*#+}} xmm2 = mem[0],zero,zero,zero sched: [1:0.50] +; KNL-NEXT: vmovss {{.*#+}} xmm2 = mem[0],zero,zero,zero sched: [5:0.50] ; KNL-NEXT: vmovaps %xmm1, %xmm3 # sched: [1:1.00] ; KNL-NEXT: vfnmadd213ss %xmm2, %xmm0, %xmm3 # sched: [5:0.50] ; KNL-NEXT: vfmadd132ss %xmm1, %xmm1, %xmm3 # sched: [5:0.50] ; KNL-NEXT: vfnmadd213ss %xmm2, %xmm3, %xmm0 # sched: [5:0.50] ; KNL-NEXT: vfmadd132ss %xmm3, %xmm3, %xmm0 # sched: [5:0.50] -; KNL-NEXT: vmulss {{.*}}(%rip), %xmm0, %xmm0 # sched: [5:0.50] -; KNL-NEXT: retq # sched: [2:1.00] +; KNL-NEXT: vmulss {{.*}}(%rip), %xmm0, %xmm0 # sched: [10:0.50] +; KNL-NEXT: retq # sched: [7:1.00] ; ; SKX-LABEL: f32_two_step_2: ; SKX: # %bb.0: @@ -450,31 +450,31 @@ ; HASWELL-LABEL: v4f32_one_step2: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vrcpps %xmm0, %xmm1 # sched: [5:1.00] -; HASWELL-NEXT: vbroadcastss {{.*#+}} xmm2 = [1,1,1,1] sched: [1:0.50] +; HASWELL-NEXT: vbroadcastss {{.*#+}} xmm2 = [1,1,1,1] sched: [6:0.50] ; HASWELL-NEXT: vfnmadd213ps %xmm2, %xmm1, %xmm0 # sched: [5:0.50] ; HASWELL-NEXT: vfmadd132ps %xmm1, %xmm1, %xmm0 # sched: [5:0.50] -; HASWELL-NEXT: vmulps {{.*}}(%rip), %xmm0, %xmm0 # sched: [5:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vmulps {{.*}}(%rip), %xmm0, %xmm0 # sched: [11:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; HASWELL-NO-FMA-LABEL: v4f32_one_step2: ; HASWELL-NO-FMA: # %bb.0: ; HASWELL-NO-FMA-NEXT: vrcpps %xmm0, %xmm1 # sched: [5:1.00] ; HASWELL-NO-FMA-NEXT: vmulps %xmm1, %xmm0, %xmm0 # sched: [5:0.50] -; HASWELL-NO-FMA-NEXT: vbroadcastss {{.*#+}} xmm2 = [1,1,1,1] sched: [1:0.50] +; HASWELL-NO-FMA-NEXT: vbroadcastss {{.*#+}} xmm2 = [1,1,1,1] sched: [6:0.50] ; HASWELL-NO-FMA-NEXT: vsubps %xmm0, %xmm2, %xmm0 # sched: [3:1.00] ; HASWELL-NO-FMA-NEXT: vmulps %xmm0, %xmm1, %xmm0 # sched: [5:0.50] ; HASWELL-NO-FMA-NEXT: vaddps %xmm0, %xmm1, %xmm0 # sched: [3:1.00] -; HASWELL-NO-FMA-NEXT: vmulps {{.*}}(%rip), %xmm0, %xmm0 # sched: [5:0.50] -; HASWELL-NO-FMA-NEXT: retq # sched: [2:1.00] +; HASWELL-NO-FMA-NEXT: vmulps {{.*}}(%rip), %xmm0, %xmm0 # sched: [11:0.50] +; HASWELL-NO-FMA-NEXT: retq # sched: [7:1.00] ; ; KNL-LABEL: v4f32_one_step2: ; KNL: # %bb.0: ; KNL-NEXT: vrcpps %xmm0, %xmm1 # sched: [5:1.00] -; KNL-NEXT: vbroadcastss {{.*#+}} xmm2 = [1,1,1,1] sched: [1:0.50] +; KNL-NEXT: vbroadcastss {{.*#+}} xmm2 = [1,1,1,1] sched: [6:0.50] ; KNL-NEXT: vfnmadd213ps %xmm2, %xmm1, %xmm0 # sched: [5:0.50] ; KNL-NEXT: vfmadd132ps %xmm1, %xmm1, %xmm0 # sched: [5:0.50] -; KNL-NEXT: vmulps {{.*}}(%rip), %xmm0, %xmm0 # sched: [5:0.50] -; KNL-NEXT: retq # sched: [2:1.00] +; KNL-NEXT: vmulps {{.*}}(%rip), %xmm0, %xmm0 # sched: [11:0.50] +; KNL-NEXT: retq # sched: [7:1.00] ; ; SKX-LABEL: v4f32_one_step2: ; SKX: # %bb.0: @@ -549,34 +549,34 @@ ; HASWELL-LABEL: v4f32_one_step_2_divs: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vrcpps %xmm0, %xmm1 # sched: [5:1.00] -; HASWELL-NEXT: vbroadcastss {{.*#+}} xmm2 = [1,1,1,1] sched: [1:0.50] +; HASWELL-NEXT: vbroadcastss {{.*#+}} xmm2 = [1,1,1,1] sched: [6:0.50] ; HASWELL-NEXT: vfnmadd213ps %xmm2, %xmm1, %xmm0 # sched: [5:0.50] ; HASWELL-NEXT: vfmadd132ps %xmm1, %xmm1, %xmm0 # sched: [5:0.50] -; HASWELL-NEXT: vmulps {{.*}}(%rip), %xmm0, %xmm1 # sched: [5:0.50] +; HASWELL-NEXT: vmulps {{.*}}(%rip), %xmm0, %xmm1 # sched: [11:0.50] ; HASWELL-NEXT: vmulps %xmm0, %xmm1, %xmm0 # sched: [5:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; HASWELL-NO-FMA-LABEL: v4f32_one_step_2_divs: ; HASWELL-NO-FMA: # %bb.0: ; HASWELL-NO-FMA-NEXT: vrcpps %xmm0, %xmm1 # sched: [5:1.00] ; HASWELL-NO-FMA-NEXT: vmulps %xmm1, %xmm0, %xmm0 # sched: [5:0.50] -; HASWELL-NO-FMA-NEXT: vbroadcastss {{.*#+}} xmm2 = [1,1,1,1] sched: [1:0.50] +; HASWELL-NO-FMA-NEXT: vbroadcastss {{.*#+}} xmm2 = [1,1,1,1] sched: [6:0.50] ; HASWELL-NO-FMA-NEXT: vsubps %xmm0, %xmm2, %xmm0 # sched: [3:1.00] ; HASWELL-NO-FMA-NEXT: vmulps %xmm0, %xmm1, %xmm0 # sched: [5:0.50] ; HASWELL-NO-FMA-NEXT: vaddps %xmm0, %xmm1, %xmm0 # sched: [3:1.00] -; HASWELL-NO-FMA-NEXT: vmulps {{.*}}(%rip), %xmm0, %xmm1 # sched: [5:0.50] +; HASWELL-NO-FMA-NEXT: vmulps {{.*}}(%rip), %xmm0, %xmm1 # sched: [11:0.50] ; HASWELL-NO-FMA-NEXT: vmulps %xmm0, %xmm1, %xmm0 # sched: [5:0.50] -; HASWELL-NO-FMA-NEXT: retq # sched: [2:1.00] +; HASWELL-NO-FMA-NEXT: retq # sched: [7:1.00] ; ; KNL-LABEL: v4f32_one_step_2_divs: ; KNL: # %bb.0: ; KNL-NEXT: vrcpps %xmm0, %xmm1 # sched: [5:1.00] -; KNL-NEXT: vbroadcastss {{.*#+}} xmm2 = [1,1,1,1] sched: [1:0.50] +; KNL-NEXT: vbroadcastss {{.*#+}} xmm2 = [1,1,1,1] sched: [6:0.50] ; KNL-NEXT: vfnmadd213ps %xmm2, %xmm1, %xmm0 # sched: [5:0.50] ; KNL-NEXT: vfmadd132ps %xmm1, %xmm1, %xmm0 # sched: [5:0.50] -; KNL-NEXT: vmulps {{.*}}(%rip), %xmm0, %xmm1 # sched: [5:0.50] +; KNL-NEXT: vmulps {{.*}}(%rip), %xmm0, %xmm1 # sched: [11:0.50] ; KNL-NEXT: vmulps %xmm0, %xmm1, %xmm0 # sched: [5:0.50] -; KNL-NEXT: retq # sched: [2:1.00] +; KNL-NEXT: retq # sched: [7:1.00] ; ; SKX-LABEL: v4f32_one_step_2_divs: ; SKX: # %bb.0: @@ -670,20 +670,20 @@ ; HASWELL-LABEL: v4f32_two_step2: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vrcpps %xmm0, %xmm1 # sched: [5:1.00] -; HASWELL-NEXT: vbroadcastss {{.*#+}} xmm2 = [1,1,1,1] sched: [1:0.50] +; HASWELL-NEXT: vbroadcastss {{.*#+}} xmm2 = [1,1,1,1] sched: [6:0.50] ; HASWELL-NEXT: vmovaps %xmm1, %xmm3 # sched: [1:1.00] ; HASWELL-NEXT: vfnmadd213ps %xmm2, %xmm0, %xmm3 # sched: [5:0.50] ; HASWELL-NEXT: vfmadd132ps %xmm1, %xmm1, %xmm3 # sched: [5:0.50] ; HASWELL-NEXT: vfnmadd213ps %xmm2, %xmm3, %xmm0 # sched: [5:0.50] ; HASWELL-NEXT: vfmadd132ps %xmm3, %xmm3, %xmm0 # sched: [5:0.50] -; HASWELL-NEXT: vmulps {{.*}}(%rip), %xmm0, %xmm0 # sched: [5:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vmulps {{.*}}(%rip), %xmm0, %xmm0 # sched: [11:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; HASWELL-NO-FMA-LABEL: v4f32_two_step2: ; HASWELL-NO-FMA: # %bb.0: ; HASWELL-NO-FMA-NEXT: vrcpps %xmm0, %xmm1 # sched: [5:1.00] ; HASWELL-NO-FMA-NEXT: vmulps %xmm1, %xmm0, %xmm2 # sched: [5:0.50] -; HASWELL-NO-FMA-NEXT: vbroadcastss {{.*#+}} xmm3 = [1,1,1,1] sched: [1:0.50] +; HASWELL-NO-FMA-NEXT: vbroadcastss {{.*#+}} xmm3 = [1,1,1,1] sched: [6:0.50] ; HASWELL-NO-FMA-NEXT: vsubps %xmm2, %xmm3, %xmm2 # sched: [3:1.00] ; HASWELL-NO-FMA-NEXT: vmulps %xmm2, %xmm1, %xmm2 # sched: [5:0.50] ; HASWELL-NO-FMA-NEXT: vaddps %xmm2, %xmm1, %xmm1 # sched: [3:1.00] @@ -691,20 +691,20 @@ ; HASWELL-NO-FMA-NEXT: vsubps %xmm0, %xmm3, %xmm0 # sched: [3:1.00] ; HASWELL-NO-FMA-NEXT: vmulps %xmm0, %xmm1, %xmm0 # sched: [5:0.50] ; HASWELL-NO-FMA-NEXT: vaddps %xmm0, %xmm1, %xmm0 # sched: [3:1.00] -; HASWELL-NO-FMA-NEXT: vmulps {{.*}}(%rip), %xmm0, %xmm0 # sched: [5:0.50] -; HASWELL-NO-FMA-NEXT: retq # sched: [2:1.00] +; HASWELL-NO-FMA-NEXT: vmulps {{.*}}(%rip), %xmm0, %xmm0 # sched: [11:0.50] +; HASWELL-NO-FMA-NEXT: retq # sched: [7:1.00] ; ; KNL-LABEL: v4f32_two_step2: ; KNL: # %bb.0: ; KNL-NEXT: vrcpps %xmm0, %xmm1 # sched: [5:1.00] -; KNL-NEXT: vbroadcastss {{.*#+}} xmm2 = [1,1,1,1] sched: [1:0.50] +; KNL-NEXT: vbroadcastss {{.*#+}} xmm2 = [1,1,1,1] sched: [6:0.50] ; KNL-NEXT: vmovaps %xmm1, %xmm3 # sched: [1:1.00] ; KNL-NEXT: vfnmadd213ps %xmm2, %xmm0, %xmm3 # sched: [5:0.50] ; KNL-NEXT: vfmadd132ps %xmm1, %xmm1, %xmm3 # sched: [5:0.50] ; KNL-NEXT: vfnmadd213ps %xmm2, %xmm3, %xmm0 # sched: [5:0.50] ; KNL-NEXT: vfmadd132ps %xmm3, %xmm3, %xmm0 # sched: [5:0.50] -; KNL-NEXT: vmulps {{.*}}(%rip), %xmm0, %xmm0 # sched: [5:0.50] -; KNL-NEXT: retq # sched: [2:1.00] +; KNL-NEXT: vmulps {{.*}}(%rip), %xmm0, %xmm0 # sched: [11:0.50] +; KNL-NEXT: retq # sched: [7:1.00] ; ; SKX-LABEL: v4f32_two_step2: ; SKX: # %bb.0: @@ -786,31 +786,31 @@ ; HASWELL-LABEL: v8f32_one_step2: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vrcpps %ymm0, %ymm1 # sched: [11:2.00] -; HASWELL-NEXT: vbroadcastss {{.*#+}} ymm2 = [1,1,1,1,1,1,1,1] sched: [1:0.50] +; HASWELL-NEXT: vbroadcastss {{.*#+}} ymm2 = [1,1,1,1,1,1,1,1] sched: [7:0.50] ; HASWELL-NEXT: vfnmadd213ps %ymm2, %ymm1, %ymm0 # sched: [5:0.50] ; HASWELL-NEXT: vfmadd132ps %ymm1, %ymm1, %ymm0 # sched: [5:0.50] -; HASWELL-NEXT: vmulps {{.*}}(%rip), %ymm0, %ymm0 # sched: [5:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vmulps {{.*}}(%rip), %ymm0, %ymm0 # sched: [12:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; HASWELL-NO-FMA-LABEL: v8f32_one_step2: ; HASWELL-NO-FMA: # %bb.0: ; HASWELL-NO-FMA-NEXT: vrcpps %ymm0, %ymm1 # sched: [11:2.00] ; HASWELL-NO-FMA-NEXT: vmulps %ymm1, %ymm0, %ymm0 # sched: [5:0.50] -; HASWELL-NO-FMA-NEXT: vbroadcastss {{.*#+}} ymm2 = [1,1,1,1,1,1,1,1] sched: [1:0.50] +; HASWELL-NO-FMA-NEXT: vbroadcastss {{.*#+}} ymm2 = [1,1,1,1,1,1,1,1] sched: [7:0.50] ; HASWELL-NO-FMA-NEXT: vsubps %ymm0, %ymm2, %ymm0 # sched: [3:1.00] ; HASWELL-NO-FMA-NEXT: vmulps %ymm0, %ymm1, %ymm0 # sched: [5:0.50] ; HASWELL-NO-FMA-NEXT: vaddps %ymm0, %ymm1, %ymm0 # sched: [3:1.00] -; HASWELL-NO-FMA-NEXT: vmulps {{.*}}(%rip), %ymm0, %ymm0 # sched: [5:0.50] -; HASWELL-NO-FMA-NEXT: retq # sched: [2:1.00] +; HASWELL-NO-FMA-NEXT: vmulps {{.*}}(%rip), %ymm0, %ymm0 # sched: [12:0.50] +; HASWELL-NO-FMA-NEXT: retq # sched: [7:1.00] ; ; KNL-LABEL: v8f32_one_step2: ; KNL: # %bb.0: ; KNL-NEXT: vrcpps %ymm0, %ymm1 # sched: [11:2.00] -; KNL-NEXT: vbroadcastss {{.*#+}} ymm2 = [1,1,1,1,1,1,1,1] sched: [1:0.50] +; KNL-NEXT: vbroadcastss {{.*#+}} ymm2 = [1,1,1,1,1,1,1,1] sched: [7:0.50] ; KNL-NEXT: vfnmadd213ps %ymm2, %ymm1, %ymm0 # sched: [5:0.50] ; KNL-NEXT: vfmadd132ps %ymm1, %ymm1, %ymm0 # sched: [5:0.50] -; KNL-NEXT: vmulps {{.*}}(%rip), %ymm0, %ymm0 # sched: [5:0.50] -; KNL-NEXT: retq # sched: [2:1.00] +; KNL-NEXT: vmulps {{.*}}(%rip), %ymm0, %ymm0 # sched: [12:0.50] +; KNL-NEXT: retq # sched: [7:1.00] ; ; SKX-LABEL: v8f32_one_step2: ; SKX: # %bb.0: @@ -894,34 +894,34 @@ ; HASWELL-LABEL: v8f32_one_step_2_divs: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vrcpps %ymm0, %ymm1 # sched: [11:2.00] -; HASWELL-NEXT: vbroadcastss {{.*#+}} ymm2 = [1,1,1,1,1,1,1,1] sched: [1:0.50] +; HASWELL-NEXT: vbroadcastss {{.*#+}} ymm2 = [1,1,1,1,1,1,1,1] sched: [7:0.50] ; HASWELL-NEXT: vfnmadd213ps %ymm2, %ymm1, %ymm0 # sched: [5:0.50] ; HASWELL-NEXT: vfmadd132ps %ymm1, %ymm1, %ymm0 # sched: [5:0.50] -; HASWELL-NEXT: vmulps {{.*}}(%rip), %ymm0, %ymm1 # sched: [5:0.50] +; HASWELL-NEXT: vmulps {{.*}}(%rip), %ymm0, %ymm1 # sched: [12:0.50] ; HASWELL-NEXT: vmulps %ymm0, %ymm1, %ymm0 # sched: [5:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; HASWELL-NO-FMA-LABEL: v8f32_one_step_2_divs: ; HASWELL-NO-FMA: # %bb.0: ; HASWELL-NO-FMA-NEXT: vrcpps %ymm0, %ymm1 # sched: [11:2.00] ; HASWELL-NO-FMA-NEXT: vmulps %ymm1, %ymm0, %ymm0 # sched: [5:0.50] -; HASWELL-NO-FMA-NEXT: vbroadcastss {{.*#+}} ymm2 = [1,1,1,1,1,1,1,1] sched: [1:0.50] +; HASWELL-NO-FMA-NEXT: vbroadcastss {{.*#+}} ymm2 = [1,1,1,1,1,1,1,1] sched: [7:0.50] ; HASWELL-NO-FMA-NEXT: vsubps %ymm0, %ymm2, %ymm0 # sched: [3:1.00] ; HASWELL-NO-FMA-NEXT: vmulps %ymm0, %ymm1, %ymm0 # sched: [5:0.50] ; HASWELL-NO-FMA-NEXT: vaddps %ymm0, %ymm1, %ymm0 # sched: [3:1.00] -; HASWELL-NO-FMA-NEXT: vmulps {{.*}}(%rip), %ymm0, %ymm1 # sched: [5:0.50] +; HASWELL-NO-FMA-NEXT: vmulps {{.*}}(%rip), %ymm0, %ymm1 # sched: [12:0.50] ; HASWELL-NO-FMA-NEXT: vmulps %ymm0, %ymm1, %ymm0 # sched: [5:0.50] -; HASWELL-NO-FMA-NEXT: retq # sched: [2:1.00] +; HASWELL-NO-FMA-NEXT: retq # sched: [7:1.00] ; ; KNL-LABEL: v8f32_one_step_2_divs: ; KNL: # %bb.0: ; KNL-NEXT: vrcpps %ymm0, %ymm1 # sched: [11:2.00] -; KNL-NEXT: vbroadcastss {{.*#+}} ymm2 = [1,1,1,1,1,1,1,1] sched: [1:0.50] +; KNL-NEXT: vbroadcastss {{.*#+}} ymm2 = [1,1,1,1,1,1,1,1] sched: [7:0.50] ; KNL-NEXT: vfnmadd213ps %ymm2, %ymm1, %ymm0 # sched: [5:0.50] ; KNL-NEXT: vfmadd132ps %ymm1, %ymm1, %ymm0 # sched: [5:0.50] -; KNL-NEXT: vmulps {{.*}}(%rip), %ymm0, %ymm1 # sched: [5:0.50] +; KNL-NEXT: vmulps {{.*}}(%rip), %ymm0, %ymm1 # sched: [12:0.50] ; KNL-NEXT: vmulps %ymm0, %ymm1, %ymm0 # sched: [5:0.50] -; KNL-NEXT: retq # sched: [2:1.00] +; KNL-NEXT: retq # sched: [7:1.00] ; ; SKX-LABEL: v8f32_one_step_2_divs: ; SKX: # %bb.0: @@ -1029,20 +1029,20 @@ ; HASWELL-LABEL: v8f32_two_step2: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vrcpps %ymm0, %ymm1 # sched: [11:2.00] -; HASWELL-NEXT: vbroadcastss {{.*#+}} ymm2 = [1,1,1,1,1,1,1,1] sched: [1:0.50] +; HASWELL-NEXT: vbroadcastss {{.*#+}} ymm2 = [1,1,1,1,1,1,1,1] sched: [7:0.50] ; HASWELL-NEXT: vmovaps %ymm1, %ymm3 # sched: [1:1.00] ; HASWELL-NEXT: vfnmadd213ps %ymm2, %ymm0, %ymm3 # sched: [5:0.50] ; HASWELL-NEXT: vfmadd132ps %ymm1, %ymm1, %ymm3 # sched: [5:0.50] ; HASWELL-NEXT: vfnmadd213ps %ymm2, %ymm3, %ymm0 # sched: [5:0.50] ; HASWELL-NEXT: vfmadd132ps %ymm3, %ymm3, %ymm0 # sched: [5:0.50] -; HASWELL-NEXT: vmulps {{.*}}(%rip), %ymm0, %ymm0 # sched: [5:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vmulps {{.*}}(%rip), %ymm0, %ymm0 # sched: [12:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; HASWELL-NO-FMA-LABEL: v8f32_two_step2: ; HASWELL-NO-FMA: # %bb.0: ; HASWELL-NO-FMA-NEXT: vrcpps %ymm0, %ymm1 # sched: [11:2.00] ; HASWELL-NO-FMA-NEXT: vmulps %ymm1, %ymm0, %ymm2 # sched: [5:0.50] -; HASWELL-NO-FMA-NEXT: vbroadcastss {{.*#+}} ymm3 = [1,1,1,1,1,1,1,1] sched: [1:0.50] +; HASWELL-NO-FMA-NEXT: vbroadcastss {{.*#+}} ymm3 = [1,1,1,1,1,1,1,1] sched: [7:0.50] ; HASWELL-NO-FMA-NEXT: vsubps %ymm2, %ymm3, %ymm2 # sched: [3:1.00] ; HASWELL-NO-FMA-NEXT: vmulps %ymm2, %ymm1, %ymm2 # sched: [5:0.50] ; HASWELL-NO-FMA-NEXT: vaddps %ymm2, %ymm1, %ymm1 # sched: [3:1.00] @@ -1050,20 +1050,20 @@ ; HASWELL-NO-FMA-NEXT: vsubps %ymm0, %ymm3, %ymm0 # sched: [3:1.00] ; HASWELL-NO-FMA-NEXT: vmulps %ymm0, %ymm1, %ymm0 # sched: [5:0.50] ; HASWELL-NO-FMA-NEXT: vaddps %ymm0, %ymm1, %ymm0 # sched: [3:1.00] -; HASWELL-NO-FMA-NEXT: vmulps {{.*}}(%rip), %ymm0, %ymm0 # sched: [5:0.50] -; HASWELL-NO-FMA-NEXT: retq # sched: [2:1.00] +; HASWELL-NO-FMA-NEXT: vmulps {{.*}}(%rip), %ymm0, %ymm0 # sched: [12:0.50] +; HASWELL-NO-FMA-NEXT: retq # sched: [7:1.00] ; ; KNL-LABEL: v8f32_two_step2: ; KNL: # %bb.0: ; KNL-NEXT: vrcpps %ymm0, %ymm1 # sched: [11:2.00] -; KNL-NEXT: vbroadcastss {{.*#+}} ymm2 = [1,1,1,1,1,1,1,1] sched: [1:0.50] +; KNL-NEXT: vbroadcastss {{.*#+}} ymm2 = [1,1,1,1,1,1,1,1] sched: [7:0.50] ; KNL-NEXT: vmovaps %ymm1, %ymm3 # sched: [1:1.00] ; KNL-NEXT: vfnmadd213ps %ymm2, %ymm0, %ymm3 # sched: [5:0.50] ; KNL-NEXT: vfmadd132ps %ymm1, %ymm1, %ymm3 # sched: [5:0.50] ; KNL-NEXT: vfnmadd213ps %ymm2, %ymm3, %ymm0 # sched: [5:0.50] ; KNL-NEXT: vfmadd132ps %ymm3, %ymm3, %ymm0 # sched: [5:0.50] -; KNL-NEXT: vmulps {{.*}}(%rip), %ymm0, %ymm0 # sched: [5:0.50] -; KNL-NEXT: retq # sched: [2:1.00] +; KNL-NEXT: vmulps {{.*}}(%rip), %ymm0, %ymm0 # sched: [12:0.50] +; KNL-NEXT: retq # sched: [7:1.00] ; ; SKX-LABEL: v8f32_two_step2: ; SKX: # %bb.0: @@ -1110,17 +1110,17 @@ ; HASWELL-LABEL: v8f32_no_step: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vrcpps %ymm0, %ymm0 # sched: [11:2.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; HASWELL-NO-FMA-LABEL: v8f32_no_step: ; HASWELL-NO-FMA: # %bb.0: ; HASWELL-NO-FMA-NEXT: vrcpps %ymm0, %ymm0 # sched: [11:2.00] -; HASWELL-NO-FMA-NEXT: retq # sched: [2:1.00] +; HASWELL-NO-FMA-NEXT: retq # sched: [7:1.00] ; ; KNL-LABEL: v8f32_no_step: ; KNL: # %bb.0: ; KNL-NEXT: vrcpps %ymm0, %ymm0 # sched: [11:2.00] -; KNL-NEXT: retq # sched: [2:1.00] +; KNL-NEXT: retq # sched: [7:1.00] ; ; SKX-LABEL: v8f32_no_step: ; SKX: # %bb.0: @@ -1166,20 +1166,20 @@ ; HASWELL-LABEL: v8f32_no_step2: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vrcpps %ymm0, %ymm0 # sched: [11:2.00] -; HASWELL-NEXT: vmulps {{.*}}(%rip), %ymm0, %ymm0 # sched: [5:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vmulps {{.*}}(%rip), %ymm0, %ymm0 # sched: [12:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; HASWELL-NO-FMA-LABEL: v8f32_no_step2: ; HASWELL-NO-FMA: # %bb.0: ; HASWELL-NO-FMA-NEXT: vrcpps %ymm0, %ymm0 # sched: [11:2.00] -; HASWELL-NO-FMA-NEXT: vmulps {{.*}}(%rip), %ymm0, %ymm0 # sched: [5:0.50] -; HASWELL-NO-FMA-NEXT: retq # sched: [2:1.00] +; HASWELL-NO-FMA-NEXT: vmulps {{.*}}(%rip), %ymm0, %ymm0 # sched: [12:0.50] +; HASWELL-NO-FMA-NEXT: retq # sched: [7:1.00] ; ; KNL-LABEL: v8f32_no_step2: ; KNL: # %bb.0: ; KNL-NEXT: vrcpps %ymm0, %ymm0 # sched: [11:2.00] -; KNL-NEXT: vmulps {{.*}}(%rip), %ymm0, %ymm0 # sched: [5:0.50] -; KNL-NEXT: retq # sched: [2:1.00] +; KNL-NEXT: vmulps {{.*}}(%rip), %ymm0, %ymm0 # sched: [12:0.50] +; KNL-NEXT: retq # sched: [7:1.00] ; ; SKX-LABEL: v8f32_no_step2: ; SKX: # %bb.0: Index: test/CodeGen/X86/schedule-x86_32.ll =================================================================== --- test/CodeGen/X86/schedule-x86_32.ll +++ test/CodeGen/X86/schedule-x86_32.ll @@ -46,11 +46,11 @@ ; ; HASWELL-LABEL: test_aaa: ; HASWELL: # %bb.0: -; HASWELL-NEXT: movb {{[0-9]+}}(%esp), %al # sched: [1:0.50] +; HASWELL-NEXT: movb {{[0-9]+}}(%esp), %al # sched: [5:0.50] ; HASWELL-NEXT: #APP ; HASWELL-NEXT: aaa # sched: [100:0.25] ; HASWELL-NEXT: #NO_APP -; HASWELL-NEXT: retl # sched: [5:0.50] +; HASWELL-NEXT: retl # sched: [7:1.00] ; ; BROADWELL-LABEL: test_aaa: ; BROADWELL: # %bb.0: @@ -130,11 +130,11 @@ ; ; HASWELL-LABEL: test_aad: ; HASWELL: # %bb.0: -; HASWELL-NEXT: movzwl {{[0-9]+}}(%esp), %eax # sched: [4:0.50] +; HASWELL-NEXT: movzwl {{[0-9]+}}(%esp), %eax # sched: [5:0.50] ; HASWELL-NEXT: #APP ; HASWELL-NEXT: aad # sched: [100:0.25] ; HASWELL-NEXT: #NO_APP -; HASWELL-NEXT: retl # sched: [5:0.50] +; HASWELL-NEXT: retl # sched: [7:1.00] ; ; BROADWELL-LABEL: test_aad: ; BROADWELL: # %bb.0: @@ -214,11 +214,11 @@ ; ; HASWELL-LABEL: test_aam: ; HASWELL: # %bb.0: -; HASWELL-NEXT: movb {{[0-9]+}}(%esp), %al # sched: [1:0.50] +; HASWELL-NEXT: movb {{[0-9]+}}(%esp), %al # sched: [5:0.50] ; HASWELL-NEXT: #APP ; HASWELL-NEXT: aam # sched: [100:0.25] ; HASWELL-NEXT: #NO_APP -; HASWELL-NEXT: retl # sched: [5:0.50] +; HASWELL-NEXT: retl # sched: [7:1.00] ; ; BROADWELL-LABEL: test_aam: ; BROADWELL: # %bb.0: @@ -298,11 +298,11 @@ ; ; HASWELL-LABEL: test_aas: ; HASWELL: # %bb.0: -; HASWELL-NEXT: movb {{[0-9]+}}(%esp), %al # sched: [1:0.50] +; HASWELL-NEXT: movb {{[0-9]+}}(%esp), %al # sched: [5:0.50] ; HASWELL-NEXT: #APP ; HASWELL-NEXT: aas # sched: [100:0.25] ; HASWELL-NEXT: #NO_APP -; HASWELL-NEXT: retl # sched: [5:0.50] +; HASWELL-NEXT: retl # sched: [7:1.00] ; ; BROADWELL-LABEL: test_aas: ; BROADWELL: # %bb.0: @@ -384,11 +384,11 @@ ; ; HASWELL-LABEL: test_daa: ; HASWELL: # %bb.0: -; HASWELL-NEXT: movb {{[0-9]+}}(%esp), %al # sched: [1:0.50] +; HASWELL-NEXT: movb {{[0-9]+}}(%esp), %al # sched: [5:0.50] ; HASWELL-NEXT: #APP ; HASWELL-NEXT: daa # sched: [100:0.25] ; HASWELL-NEXT: #NO_APP -; HASWELL-NEXT: retl # sched: [5:0.50] +; HASWELL-NEXT: retl # sched: [7:1.00] ; ; BROADWELL-LABEL: test_daa: ; BROADWELL: # %bb.0: @@ -468,11 +468,11 @@ ; ; HASWELL-LABEL: test_das: ; HASWELL: # %bb.0: -; HASWELL-NEXT: movb {{[0-9]+}}(%esp), %al # sched: [1:0.50] +; HASWELL-NEXT: movb {{[0-9]+}}(%esp), %al # sched: [5:0.50] ; HASWELL-NEXT: #APP ; HASWELL-NEXT: das # sched: [100:0.25] ; HASWELL-NEXT: #NO_APP -; HASWELL-NEXT: retl # sched: [5:0.50] +; HASWELL-NEXT: retl # sched: [7:1.00] ; ; BROADWELL-LABEL: test_das: ; BROADWELL: # %bb.0: Index: test/CodeGen/X86/schedule-x86_64.ll =================================================================== --- test/CodeGen/X86/schedule-x86_64.ll +++ test/CodeGen/X86/schedule-x86_64.ll @@ -60,11 +60,11 @@ ; HASWELL: # %bb.0: ; HASWELL-NEXT: #APP ; HASWELL-NEXT: bsfw %di, %ax # sched: [3:1.00] -; HASWELL-NEXT: bsfw (%rsi), %cx # sched: [3:1.00] +; HASWELL-NEXT: bsfw (%rsi), %cx # sched: [8:1.00] ; HASWELL-NEXT: #NO_APP ; HASWELL-NEXT: orl %ecx, %eax # sched: [1:0.25] ; HASWELL-NEXT: # kill: %ax %ax %eax -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_bsf16: ; BROADWELL: # %bb.0: @@ -162,10 +162,10 @@ ; HASWELL: # %bb.0: ; HASWELL-NEXT: #APP ; HASWELL-NEXT: bsfl %edi, %eax # sched: [3:1.00] -; HASWELL-NEXT: bsfl (%rsi), %ecx # sched: [3:1.00] +; HASWELL-NEXT: bsfl (%rsi), %ecx # sched: [8:1.00] ; HASWELL-NEXT: #NO_APP ; HASWELL-NEXT: orl %ecx, %eax # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_bsf32: ; BROADWELL: # %bb.0: @@ -258,10 +258,10 @@ ; HASWELL: # %bb.0: ; HASWELL-NEXT: #APP ; HASWELL-NEXT: bsfq %rdi, %rax # sched: [3:1.00] -; HASWELL-NEXT: bsfq (%rsi), %rcx # sched: [3:1.00] +; HASWELL-NEXT: bsfq (%rsi), %rcx # sched: [8:1.00] ; HASWELL-NEXT: #NO_APP ; HASWELL-NEXT: orq %rcx, %rax # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_bsf64: ; BROADWELL: # %bb.0: @@ -359,11 +359,11 @@ ; HASWELL: # %bb.0: ; HASWELL-NEXT: #APP ; HASWELL-NEXT: bsrw %di, %ax # sched: [3:1.00] -; HASWELL-NEXT: bsrw (%rsi), %cx # sched: [3:1.00] +; HASWELL-NEXT: bsrw (%rsi), %cx # sched: [8:1.00] ; HASWELL-NEXT: #NO_APP ; HASWELL-NEXT: orl %ecx, %eax # sched: [1:0.25] ; HASWELL-NEXT: # kill: %ax %ax %eax -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_bsr16: ; BROADWELL: # %bb.0: @@ -461,10 +461,10 @@ ; HASWELL: # %bb.0: ; HASWELL-NEXT: #APP ; HASWELL-NEXT: bsrl %edi, %eax # sched: [3:1.00] -; HASWELL-NEXT: bsrl (%rsi), %ecx # sched: [3:1.00] +; HASWELL-NEXT: bsrl (%rsi), %ecx # sched: [8:1.00] ; HASWELL-NEXT: #NO_APP ; HASWELL-NEXT: orl %ecx, %eax # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_bsr32: ; BROADWELL: # %bb.0: @@ -557,10 +557,10 @@ ; HASWELL: # %bb.0: ; HASWELL-NEXT: #APP ; HASWELL-NEXT: bsrq %rdi, %rax # sched: [3:1.00] -; HASWELL-NEXT: bsrq (%rsi), %rcx # sched: [3:1.00] +; HASWELL-NEXT: bsrq (%rsi), %rcx # sched: [8:1.00] ; HASWELL-NEXT: #NO_APP ; HASWELL-NEXT: orq %rcx, %rax # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_bsr64: ; BROADWELL: # %bb.0: @@ -642,7 +642,7 @@ ; HASWELL: # %bb.0: ; HASWELL-NEXT: bswapl %edi # sched: [2:0.50] ; HASWELL-NEXT: movl %edi, %eax # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_bswap32: ; BROADWELL: # %bb.0: @@ -705,7 +705,7 @@ ; HASWELL: # %bb.0: ; HASWELL-NEXT: bswapq %rdi # sched: [2:0.50] ; HASWELL-NEXT: movq %rdi, %rax # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_bswap64: ; BROADWELL: # %bb.0: @@ -806,7 +806,7 @@ ; HASWELL-NEXT: cwtd # sched: [2:0.50] ; HASWELL-NEXT: cwtl # sched: [1:0.25] ; HASWELL-NEXT: #NO_APP -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_cbw_cdq_cdqe_cqo_cwd_cwde: ; BROADWELL: # %bb.0: @@ -915,7 +915,7 @@ ; HASWELL-NEXT: cld # sched: [3:1.00] ; HASWELL-NEXT: cmc # sched: [1:0.25] ; HASWELL-NEXT: #NO_APP -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_clc_cld_cmc: ; BROADWELL: # %bb.0: @@ -1012,7 +1012,7 @@ ; HASWELL-NEXT: #APP ; HASWELL-NEXT: cpuid # sched: [18:2.00] ; HASWELL-NEXT: #NO_APP -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_cpuid: ; BROADWELL: # %bb.0: @@ -1111,7 +1111,7 @@ ; HASWELL-NEXT: invlpg (%rdi) # sched: [100:0.25] ; HASWELL-NEXT: invlpga %ecx, %rax # sched: [100:0.25] ; HASWELL-NEXT: #NO_APP -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_invlpg_invlpga: ; BROADWELL: # %bb.0: @@ -1321,14 +1321,14 @@ ; HASWELL-NEXT: #APP ; HASWELL-NEXT: shldw %cl, %si, %di # sched: [6:1.00] ; HASWELL-NEXT: shrdw %cl, %si, %di # sched: [6:1.00] -; HASWELL-NEXT: shldw %cl, %si, (%rdx) # sched: [6:1.00] -; HASWELL-NEXT: shrdw %cl, %si, (%rdx) # sched: [6:1.00] +; HASWELL-NEXT: shldw %cl, %si, (%rdx) # sched: [12:1.00] +; HASWELL-NEXT: shrdw %cl, %si, (%rdx) # sched: [12:1.00] ; HASWELL-NEXT: shldw $7, %si, %di # sched: [3:1.00] ; HASWELL-NEXT: shrdw $7, %si, %di # sched: [3:1.00] -; HASWELL-NEXT: shldw $7, %si, (%rdx) # sched: [4:1.00] -; HASWELL-NEXT: shrdw $7, %si, (%rdx) # sched: [4:1.00] +; HASWELL-NEXT: shldw $7, %si, (%rdx) # sched: [10:1.00] +; HASWELL-NEXT: shrdw $7, %si, (%rdx) # sched: [10:1.00] ; HASWELL-NEXT: #NO_APP -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_shld_shrd_16: ; BROADWELL: # %bb.0: @@ -1464,14 +1464,14 @@ ; HASWELL-NEXT: #APP ; HASWELL-NEXT: shldl %cl, %esi, %edi # sched: [6:1.00] ; HASWELL-NEXT: shrdl %cl, %esi, %edi # sched: [6:1.00] -; HASWELL-NEXT: shldl %cl, %esi, (%rdx) # sched: [6:1.00] -; HASWELL-NEXT: shrdl %cl, %esi, (%rdx) # sched: [6:1.00] +; HASWELL-NEXT: shldl %cl, %esi, (%rdx) # sched: [12:1.00] +; HASWELL-NEXT: shrdl %cl, %esi, (%rdx) # sched: [12:1.00] ; HASWELL-NEXT: shldl $7, %esi, %edi # sched: [3:1.00] ; HASWELL-NEXT: shrdl $7, %esi, %edi # sched: [3:1.00] -; HASWELL-NEXT: shldl $7, %esi, (%rdx) # sched: [4:1.00] -; HASWELL-NEXT: shrdl $7, %esi, (%rdx) # sched: [4:1.00] +; HASWELL-NEXT: shldl $7, %esi, (%rdx) # sched: [10:1.00] +; HASWELL-NEXT: shrdl $7, %esi, (%rdx) # sched: [10:1.00] ; HASWELL-NEXT: #NO_APP -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_shld_shrd_32: ; BROADWELL: # %bb.0: @@ -1607,14 +1607,14 @@ ; HASWELL-NEXT: #APP ; HASWELL-NEXT: shldq %cl, %rsi, %rdi # sched: [6:1.00] ; HASWELL-NEXT: shrdq %cl, %rsi, %rdi # sched: [6:1.00] -; HASWELL-NEXT: shldq %cl, %rsi, (%rdx) # sched: [6:1.00] -; HASWELL-NEXT: shrdq %cl, %rsi, (%rdx) # sched: [6:1.00] +; HASWELL-NEXT: shldq %cl, %rsi, (%rdx) # sched: [12:1.00] +; HASWELL-NEXT: shrdq %cl, %rsi, (%rdx) # sched: [12:1.00] ; HASWELL-NEXT: shldq $7, %rsi, %rdi # sched: [3:1.00] ; HASWELL-NEXT: shrdq $7, %rsi, %rdi # sched: [3:1.00] -; HASWELL-NEXT: shldq $7, %rsi, (%rdx) # sched: [4:1.00] -; HASWELL-NEXT: shrdq $7, %rsi, (%rdx) # sched: [4:1.00] +; HASWELL-NEXT: shldq $7, %rsi, (%rdx) # sched: [10:1.00] +; HASWELL-NEXT: shrdq $7, %rsi, (%rdx) # sched: [10:1.00] ; HASWELL-NEXT: #NO_APP -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_shld_shrd_64: ; BROADWELL: # %bb.0: Index: test/CodeGen/X86/sse-schedule.ll =================================================================== --- test/CodeGen/X86/sse-schedule.ll +++ test/CodeGen/X86/sse-schedule.ll @@ -39,8 +39,8 @@ ; HASWELL-LABEL: test_addps: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vaddps %xmm1, %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: vaddps (%rdi), %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vaddps (%rdi), %xmm0, %xmm0 # sched: [9:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_addps: ; BROADWELL: # %bb.0: @@ -105,8 +105,8 @@ ; HASWELL-LABEL: test_addss: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vaddss %xmm1, %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: vaddss (%rdi), %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vaddss (%rdi), %xmm0, %xmm0 # sched: [8:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_addss: ; BROADWELL: # %bb.0: @@ -175,8 +175,8 @@ ; HASWELL-LABEL: test_andps: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vandps %xmm1, %xmm0, %xmm0 # sched: [1:1.00] -; HASWELL-NEXT: vandps (%rdi), %xmm0, %xmm0 # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vandps (%rdi), %xmm0, %xmm0 # sched: [7:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_andps: ; BROADWELL: # %bb.0: @@ -249,8 +249,8 @@ ; HASWELL-LABEL: test_andnotps: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vandnps %xmm1, %xmm0, %xmm0 # sched: [1:1.00] -; HASWELL-NEXT: vandnps (%rdi), %xmm0, %xmm0 # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vandnps (%rdi), %xmm0, %xmm0 # sched: [7:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_andnotps: ; BROADWELL: # %bb.0: @@ -325,9 +325,9 @@ ; HASWELL-LABEL: test_cmpps: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vcmpeqps %xmm1, %xmm0, %xmm1 # sched: [3:1.00] -; HASWELL-NEXT: vcmpeqps (%rdi), %xmm0, %xmm0 # sched: [3:1.00] +; HASWELL-NEXT: vcmpeqps (%rdi), %xmm0, %xmm0 # sched: [9:1.00] ; HASWELL-NEXT: vorps %xmm0, %xmm1, %xmm0 # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_cmpps: ; BROADWELL: # %bb.0: @@ -401,8 +401,8 @@ ; HASWELL-LABEL: test_cmpss: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vcmpeqss %xmm1, %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: vcmpeqss (%rdi), %xmm0, %xmm0 # sched: [7:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vcmpeqss (%rdi), %xmm0, %xmm0 # sched: [8:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_cmpss: ; BROADWELL: # %bb.0: @@ -507,13 +507,13 @@ ; HASWELL-NEXT: setnp %al # sched: [1:0.50] ; HASWELL-NEXT: sete %cl # sched: [1:0.50] ; HASWELL-NEXT: andb %al, %cl # sched: [1:0.25] -; HASWELL-NEXT: vcomiss (%rdi), %xmm0 # sched: [7:1.00] +; HASWELL-NEXT: vcomiss (%rdi), %xmm0 # sched: [8:1.00] ; HASWELL-NEXT: setnp %al # sched: [1:0.50] ; HASWELL-NEXT: sete %dl # sched: [1:0.50] ; HASWELL-NEXT: andb %al, %dl # sched: [1:0.25] ; HASWELL-NEXT: orb %cl, %dl # sched: [1:0.25] ; HASWELL-NEXT: movzbl %dl, %eax # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_comiss: ; BROADWELL: # %bb.0: @@ -624,9 +624,9 @@ ; HASWELL-LABEL: test_cvtsi2ss: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vcvtsi2ssl %edi, %xmm0, %xmm0 # sched: [4:1.00] -; HASWELL-NEXT: vcvtsi2ssl (%rsi), %xmm1, %xmm1 # sched: [8:1.00] +; HASWELL-NEXT: vcvtsi2ssl (%rsi), %xmm1, %xmm1 # sched: [9:1.00] ; HASWELL-NEXT: vaddss %xmm1, %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_cvtsi2ss: ; BROADWELL: # %bb.0: @@ -701,9 +701,9 @@ ; HASWELL-LABEL: test_cvtsi2ssq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vcvtsi2ssq %rdi, %xmm0, %xmm0 # sched: [5:2.00] -; HASWELL-NEXT: vcvtsi2ssq (%rsi), %xmm1, %xmm1 # sched: [8:1.00] +; HASWELL-NEXT: vcvtsi2ssq (%rsi), %xmm1, %xmm1 # sched: [9:1.00] ; HASWELL-NEXT: vaddss %xmm1, %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_cvtsi2ssq: ; BROADWELL: # %bb.0: @@ -778,9 +778,9 @@ ; HASWELL-LABEL: test_cvtss2si: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vcvtss2si %xmm0, %ecx # sched: [4:1.00] -; HASWELL-NEXT: vcvtss2si (%rdi), %eax # sched: [4:1.00] +; HASWELL-NEXT: vcvtss2si (%rdi), %eax # sched: [9:1.00] ; HASWELL-NEXT: addl %ecx, %eax # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_cvtss2si: ; BROADWELL: # %bb.0: @@ -858,9 +858,9 @@ ; HASWELL-LABEL: test_cvtss2siq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vcvtss2si %xmm0, %rcx # sched: [4:1.00] -; HASWELL-NEXT: vcvtss2si (%rdi), %rax # sched: [4:1.00] +; HASWELL-NEXT: vcvtss2si (%rdi), %rax # sched: [9:1.00] ; HASWELL-NEXT: addq %rcx, %rax # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_cvtss2siq: ; BROADWELL: # %bb.0: @@ -938,9 +938,9 @@ ; HASWELL-LABEL: test_cvttss2si: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vcvttss2si %xmm0, %ecx # sched: [4:1.00] -; HASWELL-NEXT: vcvttss2si (%rdi), %eax # sched: [4:1.00] +; HASWELL-NEXT: vcvttss2si (%rdi), %eax # sched: [9:1.00] ; HASWELL-NEXT: addl %ecx, %eax # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_cvttss2si: ; BROADWELL: # %bb.0: @@ -1015,9 +1015,9 @@ ; HASWELL-LABEL: test_cvttss2siq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vcvttss2si %xmm0, %rcx # sched: [4:1.00] -; HASWELL-NEXT: vcvttss2si (%rdi), %rax # sched: [4:1.00] +; HASWELL-NEXT: vcvttss2si (%rdi), %rax # sched: [9:1.00] ; HASWELL-NEXT: addq %rcx, %rax # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_cvttss2siq: ; BROADWELL: # %bb.0: @@ -1088,8 +1088,8 @@ ; HASWELL-LABEL: test_divps: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vdivps %xmm1, %xmm0, %xmm0 # sched: [13:1.00] -; HASWELL-NEXT: vdivps (%rdi), %xmm0, %xmm0 # sched: [13:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vdivps (%rdi), %xmm0, %xmm0 # sched: [19:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_divps: ; BROADWELL: # %bb.0: @@ -1154,8 +1154,8 @@ ; HASWELL-LABEL: test_divss: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vdivss %xmm1, %xmm0, %xmm0 # sched: [13:1.00] -; HASWELL-NEXT: vdivss (%rdi), %xmm0, %xmm0 # sched: [13:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vdivss (%rdi), %xmm0, %xmm0 # sched: [18:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_divss: ; BROADWELL: # %bb.0: @@ -1220,8 +1220,8 @@ ; HASWELL-LABEL: test_ldmxcsr: ; HASWELL: # %bb.0: ; HASWELL-NEXT: movl %edi, -{{[0-9]+}}(%rsp) # sched: [1:1.00] -; HASWELL-NEXT: vldmxcsr -{{[0-9]+}}(%rsp) # sched: [2:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vldmxcsr -{{[0-9]+}}(%rsp) # sched: [7:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_ldmxcsr: ; BROADWELL: # %bb.0: @@ -1288,8 +1288,8 @@ ; HASWELL-LABEL: test_maxps: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vmaxps %xmm1, %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: vmaxps (%rdi), %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vmaxps (%rdi), %xmm0, %xmm0 # sched: [9:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_maxps: ; BROADWELL: # %bb.0: @@ -1355,8 +1355,8 @@ ; HASWELL-LABEL: test_maxss: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vmaxss %xmm1, %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: vmaxss (%rdi), %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vmaxss (%rdi), %xmm0, %xmm0 # sched: [8:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_maxss: ; BROADWELL: # %bb.0: @@ -1422,8 +1422,8 @@ ; HASWELL-LABEL: test_minps: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vminps %xmm1, %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: vminps (%rdi), %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vminps (%rdi), %xmm0, %xmm0 # sched: [9:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_minps: ; BROADWELL: # %bb.0: @@ -1489,8 +1489,8 @@ ; HASWELL-LABEL: test_minss: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vminss %xmm1, %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: vminss (%rdi), %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vminss (%rdi), %xmm0, %xmm0 # sched: [8:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_minss: ; BROADWELL: # %bb.0: @@ -1559,10 +1559,10 @@ ; ; HASWELL-LABEL: test_movaps: ; HASWELL: # %bb.0: -; HASWELL-NEXT: vmovaps (%rdi), %xmm0 # sched: [1:0.50] +; HASWELL-NEXT: vmovaps (%rdi), %xmm0 # sched: [6:0.50] ; HASWELL-NEXT: vaddps %xmm0, %xmm0, %xmm0 # sched: [3:1.00] ; HASWELL-NEXT: vmovaps %xmm0, (%rsi) # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_movaps: ; BROADWELL: # %bb.0: @@ -1636,7 +1636,7 @@ ; HASWELL-LABEL: test_movhlps: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vunpckhpd {{.*#+}} xmm0 = xmm1[1],xmm0[1] sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_movhlps: ; BROADWELL: # %bb.0: @@ -1701,10 +1701,10 @@ ; ; HASWELL-LABEL: test_movhps: ; HASWELL: # %bb.0: -; HASWELL-NEXT: vmovhpd {{.*#+}} xmm1 = xmm1[0],mem[0] sched: [1:1.00] +; HASWELL-NEXT: vmovhpd {{.*#+}} xmm1 = xmm1[0],mem[0] sched: [6:1.00] ; HASWELL-NEXT: vaddps %xmm1, %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: vpextrq $1, %xmm0, (%rdi) # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpextrq $1, %xmm0, (%rdi) # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_movhps: ; BROADWELL: # %bb.0: @@ -1781,7 +1781,7 @@ ; HASWELL: # %bb.0: ; HASWELL-NEXT: vmovlhps {{.*#+}} xmm0 = xmm0[0],xmm1[0] sched: [1:1.00] ; HASWELL-NEXT: vaddps %xmm0, %xmm1, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_movlhps: ; BROADWELL: # %bb.0: @@ -1848,10 +1848,10 @@ ; ; HASWELL-LABEL: test_movlps: ; HASWELL: # %bb.0: -; HASWELL-NEXT: vmovlpd {{.*#+}} xmm1 = mem[0],xmm1[1] sched: [1:1.00] +; HASWELL-NEXT: vmovlpd {{.*#+}} xmm1 = mem[0],xmm1[1] sched: [6:1.00] ; HASWELL-NEXT: vaddps %xmm1, %xmm0, %xmm0 # sched: [3:1.00] ; HASWELL-NEXT: vmovlps %xmm0, (%rdi) # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_movlps: ; BROADWELL: # %bb.0: @@ -1923,7 +1923,7 @@ ; HASWELL-LABEL: test_movmskps: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vmovmskps %xmm0, %eax # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_movmskps: ; BROADWELL: # %bb.0: @@ -1984,7 +1984,7 @@ ; HASWELL-LABEL: test_movntps: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vmovntps %xmm0, (%rdi) # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_movntps: ; BROADWELL: # %bb.0: @@ -2045,10 +2045,10 @@ ; ; HASWELL-LABEL: test_movss_mem: ; HASWELL: # %bb.0: -; HASWELL-NEXT: vmovss {{.*#+}} xmm0 = mem[0],zero,zero,zero sched: [1:0.50] +; HASWELL-NEXT: vmovss {{.*#+}} xmm0 = mem[0],zero,zero,zero sched: [5:0.50] ; HASWELL-NEXT: vaddss %xmm0, %xmm0, %xmm0 # sched: [3:1.00] ; HASWELL-NEXT: vmovss %xmm0, (%rsi) # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_movss_mem: ; BROADWELL: # %bb.0: @@ -2120,7 +2120,7 @@ ; HASWELL-LABEL: test_movss_reg: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vblendps {{.*#+}} xmm0 = xmm1[0],xmm0[1,2,3] sched: [1:0.33] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_movss_reg: ; BROADWELL: # %bb.0: @@ -2181,10 +2181,10 @@ ; ; HASWELL-LABEL: test_movups: ; HASWELL: # %bb.0: -; HASWELL-NEXT: vmovups (%rdi), %xmm0 # sched: [1:0.50] +; HASWELL-NEXT: vmovups (%rdi), %xmm0 # sched: [6:0.50] ; HASWELL-NEXT: vaddps %xmm0, %xmm0, %xmm0 # sched: [3:1.00] ; HASWELL-NEXT: vmovups %xmm0, (%rsi) # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_movups: ; BROADWELL: # %bb.0: @@ -2254,8 +2254,8 @@ ; HASWELL-LABEL: test_mulps: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vmulps %xmm1, %xmm0, %xmm0 # sched: [5:0.50] -; HASWELL-NEXT: vmulps (%rdi), %xmm0, %xmm0 # sched: [5:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vmulps (%rdi), %xmm0, %xmm0 # sched: [11:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_mulps: ; BROADWELL: # %bb.0: @@ -2320,8 +2320,8 @@ ; HASWELL-LABEL: test_mulss: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vmulss %xmm1, %xmm0, %xmm0 # sched: [5:0.50] -; HASWELL-NEXT: vmulss (%rdi), %xmm0, %xmm0 # sched: [5:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vmulss (%rdi), %xmm0, %xmm0 # sched: [10:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_mulss: ; BROADWELL: # %bb.0: @@ -2390,8 +2390,8 @@ ; HASWELL-LABEL: test_orps: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vorps %xmm1, %xmm0, %xmm0 # sched: [1:1.00] -; HASWELL-NEXT: vorps (%rdi), %xmm0, %xmm0 # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vorps (%rdi), %xmm0, %xmm0 # sched: [7:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_orps: ; BROADWELL: # %bb.0: @@ -2461,8 +2461,8 @@ ; ; HASWELL-LABEL: test_prefetchnta: ; HASWELL: # %bb.0: -; HASWELL-NEXT: prefetchnta (%rdi) # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: prefetchnta (%rdi) # sched: [5:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_prefetchnta: ; BROADWELL: # %bb.0: @@ -2527,9 +2527,9 @@ ; HASWELL-LABEL: test_rcpps: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vrcpps %xmm0, %xmm0 # sched: [5:1.00] -; HASWELL-NEXT: vrcpps (%rdi), %xmm1 # sched: [5:1.00] +; HASWELL-NEXT: vrcpps (%rdi), %xmm1 # sched: [11:1.00] ; HASWELL-NEXT: vaddps %xmm1, %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_rcpps: ; BROADWELL: # %bb.0: @@ -2611,10 +2611,10 @@ ; HASWELL-LABEL: test_rcpss: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vrcpss %xmm0, %xmm0, %xmm0 # sched: [5:1.00] -; HASWELL-NEXT: vmovss {{.*#+}} xmm1 = mem[0],zero,zero,zero sched: [1:0.50] +; HASWELL-NEXT: vmovss {{.*#+}} xmm1 = mem[0],zero,zero,zero sched: [5:0.50] ; HASWELL-NEXT: vrcpss %xmm1, %xmm1, %xmm1 # sched: [5:1.00] ; HASWELL-NEXT: vaddps %xmm1, %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_rcpss: ; BROADWELL: # %bb.0: @@ -2699,9 +2699,9 @@ ; HASWELL-LABEL: test_rsqrtps: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vrsqrtps %xmm0, %xmm0 # sched: [5:1.00] -; HASWELL-NEXT: vrsqrtps (%rdi), %xmm1 # sched: [5:1.00] +; HASWELL-NEXT: vrsqrtps (%rdi), %xmm1 # sched: [11:1.00] ; HASWELL-NEXT: vaddps %xmm1, %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_rsqrtps: ; BROADWELL: # %bb.0: @@ -2783,10 +2783,10 @@ ; HASWELL-LABEL: test_rsqrtss: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vrsqrtss %xmm0, %xmm0, %xmm0 # sched: [5:1.00] -; HASWELL-NEXT: vmovss {{.*#+}} xmm1 = mem[0],zero,zero,zero sched: [1:0.50] +; HASWELL-NEXT: vmovss {{.*#+}} xmm1 = mem[0],zero,zero,zero sched: [5:0.50] ; HASWELL-NEXT: vrsqrtss %xmm1, %xmm1, %xmm1 # sched: [5:1.00] ; HASWELL-NEXT: vaddps %xmm1, %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_rsqrtss: ; BROADWELL: # %bb.0: @@ -2866,8 +2866,8 @@ ; ; HASWELL-LABEL: test_sfence: ; HASWELL: # %bb.0: -; HASWELL-NEXT: sfence # sched: [1:0.33] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: sfence # sched: [2:0.33] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_sfence: ; BROADWELL: # %bb.0: @@ -2930,8 +2930,8 @@ ; HASWELL-LABEL: test_shufps: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vshufps {{.*#+}} xmm0 = xmm0[0,0],xmm1[0,0] sched: [1:1.00] -; HASWELL-NEXT: vshufps {{.*#+}} xmm0 = xmm0[0,3],mem[0,0] sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vshufps {{.*#+}} xmm0 = xmm0[0,3],mem[0,0] sched: [7:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_shufps: ; BROADWELL: # %bb.0: @@ -3001,9 +3001,9 @@ ; HASWELL-LABEL: test_sqrtps: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vsqrtps %xmm0, %xmm0 # sched: [14:1.00] -; HASWELL-NEXT: vsqrtps (%rdi), %xmm1 # sched: [14:1.00] +; HASWELL-NEXT: vsqrtps (%rdi), %xmm1 # sched: [20:1.00] ; HASWELL-NEXT: vaddps %xmm1, %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_sqrtps: ; BROADWELL: # %bb.0: @@ -3085,10 +3085,10 @@ ; HASWELL-LABEL: test_sqrtss: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vsqrtss %xmm0, %xmm0, %xmm0 # sched: [14:1.00] -; HASWELL-NEXT: vmovaps (%rdi), %xmm1 # sched: [1:0.50] +; HASWELL-NEXT: vmovaps (%rdi), %xmm1 # sched: [6:0.50] ; HASWELL-NEXT: vsqrtss %xmm1, %xmm1, %xmm1 # sched: [14:1.00] ; HASWELL-NEXT: vaddps %xmm1, %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_sqrtss: ; BROADWELL: # %bb.0: @@ -3164,9 +3164,9 @@ ; ; HASWELL-LABEL: test_stmxcsr: ; HASWELL: # %bb.0: -; HASWELL-NEXT: vstmxcsr -{{[0-9]+}}(%rsp) # sched: [1:1.00] -; HASWELL-NEXT: movl -{{[0-9]+}}(%rsp), %eax # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vstmxcsr -{{[0-9]+}}(%rsp) # sched: [2:1.00] +; HASWELL-NEXT: movl -{{[0-9]+}}(%rsp), %eax # sched: [5:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_stmxcsr: ; BROADWELL: # %bb.0: @@ -3233,8 +3233,8 @@ ; HASWELL-LABEL: test_subps: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vsubps %xmm1, %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: vsubps (%rdi), %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vsubps (%rdi), %xmm0, %xmm0 # sched: [9:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_subps: ; BROADWELL: # %bb.0: @@ -3299,8 +3299,8 @@ ; HASWELL-LABEL: test_subss: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vsubss %xmm1, %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: vsubss (%rdi), %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vsubss (%rdi), %xmm0, %xmm0 # sched: [8:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_subss: ; BROADWELL: # %bb.0: @@ -3400,13 +3400,13 @@ ; HASWELL-NEXT: setnp %al # sched: [1:0.50] ; HASWELL-NEXT: sete %cl # sched: [1:0.50] ; HASWELL-NEXT: andb %al, %cl # sched: [1:0.25] -; HASWELL-NEXT: vucomiss (%rdi), %xmm0 # sched: [7:1.00] +; HASWELL-NEXT: vucomiss (%rdi), %xmm0 # sched: [8:1.00] ; HASWELL-NEXT: setnp %al # sched: [1:0.50] ; HASWELL-NEXT: sete %dl # sched: [1:0.50] ; HASWELL-NEXT: andb %al, %dl # sched: [1:0.25] ; HASWELL-NEXT: orb %cl, %dl # sched: [1:0.25] ; HASWELL-NEXT: movzbl %dl, %eax # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_ucomiss: ; BROADWELL: # %bb.0: @@ -3517,8 +3517,8 @@ ; HASWELL-LABEL: test_unpckhps: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vunpckhps {{.*#+}} xmm0 = xmm0[2],xmm1[2],xmm0[3],xmm1[3] sched: [1:1.00] -; HASWELL-NEXT: vunpckhps {{.*#+}} xmm0 = xmm0[2],mem[2],xmm0[3],mem[3] sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vunpckhps {{.*#+}} xmm0 = xmm0[2],mem[2],xmm0[3],mem[3] sched: [7:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_unpckhps: ; BROADWELL: # %bb.0: @@ -3587,8 +3587,8 @@ ; HASWELL-LABEL: test_unpcklps: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vunpcklps {{.*#+}} xmm0 = xmm0[0],xmm1[0],xmm0[1],xmm1[1] sched: [1:1.00] -; HASWELL-NEXT: vunpcklps {{.*#+}} xmm0 = xmm0[0],mem[0],xmm0[1],mem[1] sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vunpcklps {{.*#+}} xmm0 = xmm0[0],mem[0],xmm0[1],mem[1] sched: [7:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_unpcklps: ; BROADWELL: # %bb.0: @@ -3657,8 +3657,8 @@ ; HASWELL-LABEL: test_xorps: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vxorps %xmm1, %xmm0, %xmm0 # sched: [1:1.00] -; HASWELL-NEXT: vxorps (%rdi), %xmm0, %xmm0 # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vxorps (%rdi), %xmm0, %xmm0 # sched: [7:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_xorps: ; BROADWELL: # %bb.0: Index: test/CodeGen/X86/sse2-schedule.ll =================================================================== --- test/CodeGen/X86/sse2-schedule.ll +++ test/CodeGen/X86/sse2-schedule.ll @@ -39,8 +39,8 @@ ; HASWELL-LABEL: test_addpd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vaddpd %xmm1, %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: vaddpd (%rdi), %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vaddpd (%rdi), %xmm0, %xmm0 # sched: [9:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_addpd: ; BROADWELL: # %bb.0: @@ -105,8 +105,8 @@ ; HASWELL-LABEL: test_addsd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vaddsd %xmm1, %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: vaddsd (%rdi), %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vaddsd (%rdi), %xmm0, %xmm0 # sched: [8:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_addsd: ; BROADWELL: # %bb.0: @@ -175,9 +175,9 @@ ; HASWELL-LABEL: test_andpd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vandpd %xmm1, %xmm0, %xmm0 # sched: [1:1.00] -; HASWELL-NEXT: vandpd (%rdi), %xmm0, %xmm0 # sched: [1:1.00] +; HASWELL-NEXT: vandpd (%rdi), %xmm0, %xmm0 # sched: [7:1.00] ; HASWELL-NEXT: vaddpd %xmm0, %xmm1, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_andpd: ; BROADWELL: # %bb.0: @@ -256,9 +256,9 @@ ; HASWELL-LABEL: test_andnotpd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vandnpd %xmm1, %xmm0, %xmm0 # sched: [1:1.00] -; HASWELL-NEXT: vandnpd (%rdi), %xmm0, %xmm0 # sched: [1:1.00] +; HASWELL-NEXT: vandnpd (%rdi), %xmm0, %xmm0 # sched: [7:1.00] ; HASWELL-NEXT: vaddpd %xmm0, %xmm1, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_andnotpd: ; BROADWELL: # %bb.0: @@ -337,7 +337,7 @@ ; HASWELL-LABEL: test_clflush: ; HASWELL: # %bb.0: ; HASWELL-NEXT: clflush (%rdi) # sched: [2:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_clflush: ; BROADWELL: # %bb.0: @@ -400,9 +400,9 @@ ; HASWELL-LABEL: test_cmppd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vcmpeqpd %xmm1, %xmm0, %xmm1 # sched: [3:1.00] -; HASWELL-NEXT: vcmpeqpd (%rdi), %xmm0, %xmm0 # sched: [3:1.00] +; HASWELL-NEXT: vcmpeqpd (%rdi), %xmm0, %xmm0 # sched: [9:1.00] ; HASWELL-NEXT: vorpd %xmm0, %xmm1, %xmm0 # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_cmppd: ; BROADWELL: # %bb.0: @@ -476,8 +476,8 @@ ; HASWELL-LABEL: test_cmpsd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vcmpeqsd %xmm1, %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: vcmpeqsd (%rdi), %xmm0, %xmm0 # sched: [7:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vcmpeqsd (%rdi), %xmm0, %xmm0 # sched: [8:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_cmpsd: ; BROADWELL: # %bb.0: @@ -582,13 +582,13 @@ ; HASWELL-NEXT: setnp %al # sched: [1:0.50] ; HASWELL-NEXT: sete %cl # sched: [1:0.50] ; HASWELL-NEXT: andb %al, %cl # sched: [1:0.25] -; HASWELL-NEXT: vcomisd (%rdi), %xmm0 # sched: [7:1.00] +; HASWELL-NEXT: vcomisd (%rdi), %xmm0 # sched: [8:1.00] ; HASWELL-NEXT: setnp %al # sched: [1:0.50] ; HASWELL-NEXT: sete %dl # sched: [1:0.50] ; HASWELL-NEXT: andb %al, %dl # sched: [1:0.25] ; HASWELL-NEXT: orb %cl, %dl # sched: [1:0.25] ; HASWELL-NEXT: movzbl %dl, %eax # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_comisd: ; BROADWELL: # %bb.0: @@ -699,9 +699,9 @@ ; HASWELL-LABEL: test_cvtdq2pd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vcvtdq2pd %xmm0, %xmm0 # sched: [4:1.00] -; HASWELL-NEXT: vcvtdq2pd (%rdi), %xmm1 # sched: [4:1.00] +; HASWELL-NEXT: vcvtdq2pd (%rdi), %xmm1 # sched: [10:1.00] ; HASWELL-NEXT: vaddpd %xmm1, %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_cvtdq2pd: ; BROADWELL: # %bb.0: @@ -779,9 +779,9 @@ ; HASWELL-LABEL: test_cvtdq2ps: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vcvtdq2ps %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: vcvtdq2ps (%rdi), %xmm1 # sched: [3:1.00] +; HASWELL-NEXT: vcvtdq2ps (%rdi), %xmm1 # sched: [9:1.00] ; HASWELL-NEXT: vaddps %xmm1, %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_cvtdq2ps: ; BROADWELL: # %bb.0: @@ -857,9 +857,9 @@ ; HASWELL-LABEL: test_cvtpd2dq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vcvtpd2dq %xmm0, %xmm0 # sched: [4:1.00] -; HASWELL-NEXT: vcvtpd2dqx (%rdi), %xmm1 # sched: [7:1.00] +; HASWELL-NEXT: vcvtpd2dqx (%rdi), %xmm1 # sched: [8:1.00] ; HASWELL-NEXT: vpaddd %xmm1, %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_cvtpd2dq: ; BROADWELL: # %bb.0: @@ -936,9 +936,9 @@ ; HASWELL-LABEL: test_cvtpd2ps: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vcvtpd2ps %xmm0, %xmm0 # sched: [4:1.00] -; HASWELL-NEXT: vcvtpd2psx (%rdi), %xmm1 # sched: [7:1.00] +; HASWELL-NEXT: vcvtpd2psx (%rdi), %xmm1 # sched: [8:1.00] ; HASWELL-NEXT: vaddps %xmm1, %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_cvtpd2ps: ; BROADWELL: # %bb.0: @@ -1015,9 +1015,9 @@ ; HASWELL-LABEL: test_cvtps2dq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vcvtps2dq %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: vcvtps2dq (%rdi), %xmm1 # sched: [3:1.00] +; HASWELL-NEXT: vcvtps2dq (%rdi), %xmm1 # sched: [9:1.00] ; HASWELL-NEXT: vpaddd %xmm1, %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_cvtps2dq: ; BROADWELL: # %bb.0: @@ -1094,9 +1094,9 @@ ; HASWELL-LABEL: test_cvtps2pd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vcvtps2pd %xmm0, %xmm0 # sched: [2:1.00] -; HASWELL-NEXT: vcvtps2pd (%rdi), %xmm1 # sched: [1:1.00] +; HASWELL-NEXT: vcvtps2pd (%rdi), %xmm1 # sched: [6:1.00] ; HASWELL-NEXT: vaddpd %xmm1, %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_cvtps2pd: ; BROADWELL: # %bb.0: @@ -1173,9 +1173,9 @@ ; HASWELL-LABEL: test_cvtsd2si: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vcvtsd2si %xmm0, %ecx # sched: [4:1.00] -; HASWELL-NEXT: vcvtsd2si (%rdi), %eax # sched: [4:1.00] +; HASWELL-NEXT: vcvtsd2si (%rdi), %eax # sched: [9:1.00] ; HASWELL-NEXT: addl %ecx, %eax # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_cvtsd2si: ; BROADWELL: # %bb.0: @@ -1253,9 +1253,9 @@ ; HASWELL-LABEL: test_cvtsd2siq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vcvtsd2si %xmm0, %rcx # sched: [4:1.00] -; HASWELL-NEXT: vcvtsd2si (%rdi), %rax # sched: [4:1.00] +; HASWELL-NEXT: vcvtsd2si (%rdi), %rax # sched: [9:1.00] ; HASWELL-NEXT: addq %rcx, %rax # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_cvtsd2siq: ; BROADWELL: # %bb.0: @@ -1338,10 +1338,10 @@ ; HASWELL-LABEL: test_cvtsd2ss: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vcvtsd2ss %xmm0, %xmm0, %xmm0 # sched: [4:1.00] -; HASWELL-NEXT: vmovsd {{.*#+}} xmm1 = mem[0],zero sched: [1:0.50] +; HASWELL-NEXT: vmovsd {{.*#+}} xmm1 = mem[0],zero sched: [5:0.50] ; HASWELL-NEXT: vcvtsd2ss %xmm1, %xmm1, %xmm1 # sched: [4:1.00] ; HASWELL-NEXT: vaddss %xmm1, %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_cvtsd2ss: ; BROADWELL: # %bb.0: @@ -1421,9 +1421,9 @@ ; HASWELL-LABEL: test_cvtsi2sd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vcvtsi2sdl %edi, %xmm0, %xmm0 # sched: [4:1.00] -; HASWELL-NEXT: vcvtsi2sdl (%rsi), %xmm1, %xmm1 # sched: [8:1.00] +; HASWELL-NEXT: vcvtsi2sdl (%rsi), %xmm1, %xmm1 # sched: [9:1.00] ; HASWELL-NEXT: vaddsd %xmm1, %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_cvtsi2sd: ; BROADWELL: # %bb.0: @@ -1498,9 +1498,9 @@ ; HASWELL-LABEL: test_cvtsi2sdq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vcvtsi2sdq %rdi, %xmm0, %xmm0 # sched: [4:1.00] -; HASWELL-NEXT: vcvtsi2sdq (%rsi), %xmm1, %xmm1 # sched: [8:1.00] +; HASWELL-NEXT: vcvtsi2sdq (%rsi), %xmm1, %xmm1 # sched: [9:1.00] ; HASWELL-NEXT: vaddsd %xmm1, %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_cvtsi2sdq: ; BROADWELL: # %bb.0: @@ -1582,10 +1582,10 @@ ; HASWELL-LABEL: test_cvtss2sd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vcvtss2sd %xmm0, %xmm0, %xmm0 # sched: [2:1.00] -; HASWELL-NEXT: vmovss {{.*#+}} xmm1 = mem[0],zero,zero,zero sched: [1:0.50] +; HASWELL-NEXT: vmovss {{.*#+}} xmm1 = mem[0],zero,zero,zero sched: [5:0.50] ; HASWELL-NEXT: vcvtss2sd %xmm1, %xmm1, %xmm1 # sched: [2:1.00] ; HASWELL-NEXT: vaddsd %xmm1, %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_cvtss2sd: ; BROADWELL: # %bb.0: @@ -1666,9 +1666,9 @@ ; HASWELL-LABEL: test_cvttpd2dq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vcvttpd2dq %xmm0, %xmm0 # sched: [4:1.00] -; HASWELL-NEXT: vcvttpd2dqx (%rdi), %xmm1 # sched: [7:1.00] +; HASWELL-NEXT: vcvttpd2dqx (%rdi), %xmm1 # sched: [8:1.00] ; HASWELL-NEXT: vpaddd %xmm1, %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_cvttpd2dq: ; BROADWELL: # %bb.0: @@ -1746,9 +1746,9 @@ ; HASWELL-LABEL: test_cvttps2dq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vcvttps2dq %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: vcvttps2dq (%rdi), %xmm1 # sched: [3:1.00] +; HASWELL-NEXT: vcvttps2dq (%rdi), %xmm1 # sched: [9:1.00] ; HASWELL-NEXT: vpaddd %xmm1, %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_cvttps2dq: ; BROADWELL: # %bb.0: @@ -1823,9 +1823,9 @@ ; HASWELL-LABEL: test_cvttsd2si: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vcvttsd2si %xmm0, %ecx # sched: [4:1.00] -; HASWELL-NEXT: vcvttsd2si (%rdi), %eax # sched: [4:1.00] +; HASWELL-NEXT: vcvttsd2si (%rdi), %eax # sched: [9:1.00] ; HASWELL-NEXT: addl %ecx, %eax # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_cvttsd2si: ; BROADWELL: # %bb.0: @@ -1900,9 +1900,9 @@ ; HASWELL-LABEL: test_cvttsd2siq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vcvttsd2si %xmm0, %rcx # sched: [4:1.00] -; HASWELL-NEXT: vcvttsd2si (%rdi), %rax # sched: [4:1.00] +; HASWELL-NEXT: vcvttsd2si (%rdi), %rax # sched: [9:1.00] ; HASWELL-NEXT: addq %rcx, %rax # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_cvttsd2siq: ; BROADWELL: # %bb.0: @@ -1973,8 +1973,8 @@ ; HASWELL-LABEL: test_divpd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vdivpd %xmm1, %xmm0, %xmm0 # sched: [20:1.00] -; HASWELL-NEXT: vdivpd (%rdi), %xmm0, %xmm0 # sched: [20:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vdivpd (%rdi), %xmm0, %xmm0 # sched: [26:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_divpd: ; BROADWELL: # %bb.0: @@ -2039,8 +2039,8 @@ ; HASWELL-LABEL: test_divsd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vdivsd %xmm1, %xmm0, %xmm0 # sched: [20:1.00] -; HASWELL-NEXT: vdivsd (%rdi), %xmm0, %xmm0 # sched: [20:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vdivsd (%rdi), %xmm0, %xmm0 # sched: [25:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_divsd: ; BROADWELL: # %bb.0: @@ -2107,7 +2107,7 @@ ; HASWELL-LABEL: test_lfence: ; HASWELL: # %bb.0: ; HASWELL-NEXT: lfence # sched: [2:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_lfence: ; BROADWELL: # %bb.0: @@ -2168,7 +2168,7 @@ ; HASWELL-LABEL: test_mfence: ; HASWELL: # %bb.0: ; HASWELL-NEXT: mfence # sched: [2:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_mfence: ; BROADWELL: # %bb.0: @@ -2227,7 +2227,7 @@ ; HASWELL-LABEL: test_maskmovdqu: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vmaskmovdqu %xmm1, %xmm0 # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_maskmovdqu: ; BROADWELL: # %bb.0: @@ -2286,8 +2286,8 @@ ; HASWELL-LABEL: test_maxpd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vmaxpd %xmm1, %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: vmaxpd (%rdi), %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vmaxpd (%rdi), %xmm0, %xmm0 # sched: [9:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_maxpd: ; BROADWELL: # %bb.0: @@ -2353,8 +2353,8 @@ ; HASWELL-LABEL: test_maxsd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vmaxsd %xmm1, %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: vmaxsd (%rdi), %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vmaxsd (%rdi), %xmm0, %xmm0 # sched: [8:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_maxsd: ; BROADWELL: # %bb.0: @@ -2420,8 +2420,8 @@ ; HASWELL-LABEL: test_minpd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vminpd %xmm1, %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: vminpd (%rdi), %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vminpd (%rdi), %xmm0, %xmm0 # sched: [9:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_minpd: ; BROADWELL: # %bb.0: @@ -2487,8 +2487,8 @@ ; HASWELL-LABEL: test_minsd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vminsd %xmm1, %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: vminsd (%rdi), %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vminsd (%rdi), %xmm0, %xmm0 # sched: [8:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_minsd: ; BROADWELL: # %bb.0: @@ -2557,10 +2557,10 @@ ; ; HASWELL-LABEL: test_movapd: ; HASWELL: # %bb.0: -; HASWELL-NEXT: vmovapd (%rdi), %xmm0 # sched: [1:0.50] +; HASWELL-NEXT: vmovapd (%rdi), %xmm0 # sched: [6:0.50] ; HASWELL-NEXT: vaddpd %xmm0, %xmm0, %xmm0 # sched: [3:1.00] ; HASWELL-NEXT: vmovapd %xmm0, (%rsi) # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_movapd: ; BROADWELL: # %bb.0: @@ -2633,10 +2633,10 @@ ; ; HASWELL-LABEL: test_movdqa: ; HASWELL: # %bb.0: -; HASWELL-NEXT: vmovdqa (%rdi), %xmm0 # sched: [1:0.50] +; HASWELL-NEXT: vmovdqa (%rdi), %xmm0 # sched: [6:0.50] ; HASWELL-NEXT: vpaddq %xmm0, %xmm0, %xmm0 # sched: [1:0.50] ; HASWELL-NEXT: vmovdqa %xmm0, (%rsi) # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_movdqa: ; BROADWELL: # %bb.0: @@ -2709,10 +2709,10 @@ ; ; HASWELL-LABEL: test_movdqu: ; HASWELL: # %bb.0: -; HASWELL-NEXT: vmovdqu (%rdi), %xmm0 # sched: [1:0.50] +; HASWELL-NEXT: vmovdqu (%rdi), %xmm0 # sched: [6:0.50] ; HASWELL-NEXT: vpaddq %xmm0, %xmm0, %xmm0 # sched: [1:0.50] ; HASWELL-NEXT: vmovdqu %xmm0, (%rsi) # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_movdqu: ; BROADWELL: # %bb.0: @@ -2798,12 +2798,12 @@ ; HASWELL-LABEL: test_movd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vmovd %edi, %xmm1 # sched: [1:1.00] -; HASWELL-NEXT: vmovd {{.*#+}} xmm2 = mem[0],zero,zero,zero sched: [1:0.50] +; HASWELL-NEXT: vmovd {{.*#+}} xmm2 = mem[0],zero,zero,zero sched: [5:0.50] ; HASWELL-NEXT: vpaddd %xmm1, %xmm0, %xmm1 # sched: [1:0.50] ; HASWELL-NEXT: vpaddd %xmm2, %xmm0, %xmm0 # sched: [1:0.50] ; HASWELL-NEXT: vmovd %xmm0, %eax # sched: [1:1.00] ; HASWELL-NEXT: vmovd %xmm1, (%rsi) # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_movd: ; BROADWELL: # %bb.0: @@ -2909,12 +2909,12 @@ ; HASWELL-LABEL: test_movd_64: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vmovq %rdi, %xmm1 # sched: [1:1.00] -; HASWELL-NEXT: vmovq {{.*#+}} xmm2 = mem[0],zero sched: [1:0.50] +; HASWELL-NEXT: vmovq {{.*#+}} xmm2 = mem[0],zero sched: [5:0.50] ; HASWELL-NEXT: vpaddq %xmm1, %xmm0, %xmm1 # sched: [1:0.50] ; HASWELL-NEXT: vpaddq %xmm2, %xmm0, %xmm0 # sched: [1:0.50] ; HASWELL-NEXT: vmovq %xmm0, %rax # sched: [1:1.00] ; HASWELL-NEXT: vmovq %xmm1, (%rsi) # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_movd_64: ; BROADWELL: # %bb.0: @@ -3007,10 +3007,10 @@ ; ; HASWELL-LABEL: test_movhpd: ; HASWELL: # %bb.0: -; HASWELL-NEXT: vmovhpd {{.*#+}} xmm1 = xmm1[0],mem[0] sched: [1:1.00] +; HASWELL-NEXT: vmovhpd {{.*#+}} xmm1 = xmm1[0],mem[0] sched: [6:1.00] ; HASWELL-NEXT: vaddpd %xmm1, %xmm0, %xmm0 # sched: [3:1.00] ; HASWELL-NEXT: vmovhpd %xmm0, (%rdi) # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_movhpd: ; BROADWELL: # %bb.0: @@ -3086,10 +3086,10 @@ ; ; HASWELL-LABEL: test_movlpd: ; HASWELL: # %bb.0: -; HASWELL-NEXT: vmovlpd {{.*#+}} xmm1 = mem[0],xmm1[1] sched: [1:1.00] +; HASWELL-NEXT: vmovlpd {{.*#+}} xmm1 = mem[0],xmm1[1] sched: [6:1.00] ; HASWELL-NEXT: vaddpd %xmm1, %xmm0, %xmm0 # sched: [3:1.00] ; HASWELL-NEXT: vmovlpd %xmm0, (%rdi) # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_movlpd: ; BROADWELL: # %bb.0: @@ -3160,7 +3160,7 @@ ; HASWELL-LABEL: test_movmskpd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vmovmskpd %xmm0, %eax # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_movmskpd: ; BROADWELL: # %bb.0: @@ -3222,7 +3222,7 @@ ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpaddq %xmm0, %xmm0, %xmm0 # sched: [1:0.50] ; HASWELL-NEXT: vmovntdq %xmm0, (%rdi) # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_movntdqa: ; BROADWELL: # %bb.0: @@ -3287,7 +3287,7 @@ ; HASWELL: # %bb.0: ; HASWELL-NEXT: vaddpd %xmm0, %xmm0, %xmm0 # sched: [3:1.00] ; HASWELL-NEXT: vmovntpd %xmm0, (%rdi) # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_movntpd: ; BROADWELL: # %bb.0: @@ -3354,10 +3354,10 @@ ; ; HASWELL-LABEL: test_movq_mem: ; HASWELL: # %bb.0: -; HASWELL-NEXT: vmovq {{.*#+}} xmm1 = mem[0],zero sched: [1:0.50] +; HASWELL-NEXT: vmovq {{.*#+}} xmm1 = mem[0],zero sched: [5:0.50] ; HASWELL-NEXT: vpaddq %xmm1, %xmm0, %xmm0 # sched: [1:0.50] ; HASWELL-NEXT: vmovq %xmm0, (%rdi) # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_movq_mem: ; BROADWELL: # %bb.0: @@ -3432,7 +3432,7 @@ ; HASWELL: # %bb.0: ; HASWELL-NEXT: vmovq {{.*#+}} xmm0 = xmm0[0],zero sched: [1:0.33] ; HASWELL-NEXT: vpaddq %xmm0, %xmm1, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_movq_reg: ; BROADWELL: # %bb.0: @@ -3499,10 +3499,10 @@ ; ; HASWELL-LABEL: test_movsd_mem: ; HASWELL: # %bb.0: -; HASWELL-NEXT: vmovsd {{.*#+}} xmm0 = mem[0],zero sched: [1:0.50] +; HASWELL-NEXT: vmovsd {{.*#+}} xmm0 = mem[0],zero sched: [5:0.50] ; HASWELL-NEXT: vaddsd %xmm0, %xmm0, %xmm0 # sched: [3:1.00] ; HASWELL-NEXT: vmovsd %xmm0, (%rsi) # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_movsd_mem: ; BROADWELL: # %bb.0: @@ -3575,7 +3575,7 @@ ; HASWELL-LABEL: test_movsd_reg: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vmovlhps {{.*#+}} xmm0 = xmm1[0],xmm0[0] sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_movsd_reg: ; BROADWELL: # %bb.0: @@ -3636,10 +3636,10 @@ ; ; HASWELL-LABEL: test_movupd: ; HASWELL: # %bb.0: -; HASWELL-NEXT: vmovupd (%rdi), %xmm0 # sched: [1:0.50] +; HASWELL-NEXT: vmovupd (%rdi), %xmm0 # sched: [6:0.50] ; HASWELL-NEXT: vaddpd %xmm0, %xmm0, %xmm0 # sched: [3:1.00] ; HASWELL-NEXT: vmovupd %xmm0, (%rsi) # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_movupd: ; BROADWELL: # %bb.0: @@ -3709,8 +3709,8 @@ ; HASWELL-LABEL: test_mulpd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vmulpd %xmm1, %xmm0, %xmm0 # sched: [5:0.50] -; HASWELL-NEXT: vmulpd (%rdi), %xmm0, %xmm0 # sched: [5:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vmulpd (%rdi), %xmm0, %xmm0 # sched: [11:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_mulpd: ; BROADWELL: # %bb.0: @@ -3775,8 +3775,8 @@ ; HASWELL-LABEL: test_mulsd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vmulsd %xmm1, %xmm0, %xmm0 # sched: [5:0.50] -; HASWELL-NEXT: vmulsd (%rdi), %xmm0, %xmm0 # sched: [5:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vmulsd (%rdi), %xmm0, %xmm0 # sched: [10:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_mulsd: ; BROADWELL: # %bb.0: @@ -3845,9 +3845,9 @@ ; HASWELL-LABEL: test_orpd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vorpd %xmm1, %xmm0, %xmm0 # sched: [1:1.00] -; HASWELL-NEXT: vorpd (%rdi), %xmm0, %xmm0 # sched: [1:1.00] +; HASWELL-NEXT: vorpd (%rdi), %xmm0, %xmm0 # sched: [7:1.00] ; HASWELL-NEXT: vaddpd %xmm0, %xmm1, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_orpd: ; BROADWELL: # %bb.0: @@ -3926,8 +3926,8 @@ ; HASWELL-LABEL: test_packssdw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpackssdw %xmm1, %xmm0, %xmm0 # sched: [1:1.00] -; HASWELL-NEXT: vpackssdw (%rdi), %xmm0, %xmm0 # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpackssdw (%rdi), %xmm0, %xmm0 # sched: [7:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_packssdw: ; BROADWELL: # %bb.0: @@ -3998,8 +3998,8 @@ ; HASWELL-LABEL: test_packsswb: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpacksswb %xmm1, %xmm0, %xmm0 # sched: [1:1.00] -; HASWELL-NEXT: vpacksswb (%rdi), %xmm0, %xmm0 # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpacksswb (%rdi), %xmm0, %xmm0 # sched: [7:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_packsswb: ; BROADWELL: # %bb.0: @@ -4070,8 +4070,8 @@ ; HASWELL-LABEL: test_packuswb: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpackuswb %xmm1, %xmm0, %xmm0 # sched: [1:1.00] -; HASWELL-NEXT: vpackuswb (%rdi), %xmm0, %xmm0 # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpackuswb (%rdi), %xmm0, %xmm0 # sched: [7:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_packuswb: ; BROADWELL: # %bb.0: @@ -4142,8 +4142,8 @@ ; HASWELL-LABEL: test_paddb: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpaddb %xmm1, %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: vpaddb (%rdi), %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpaddb (%rdi), %xmm0, %xmm0 # sched: [7:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_paddb: ; BROADWELL: # %bb.0: @@ -4212,8 +4212,8 @@ ; HASWELL-LABEL: test_paddd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpaddd %xmm1, %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: vpaddd (%rdi), %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpaddd (%rdi), %xmm0, %xmm0 # sched: [7:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_paddd: ; BROADWELL: # %bb.0: @@ -4278,8 +4278,8 @@ ; HASWELL-LABEL: test_paddq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpaddq %xmm1, %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: vpaddq (%rdi), %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpaddq (%rdi), %xmm0, %xmm0 # sched: [7:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_paddq: ; BROADWELL: # %bb.0: @@ -4348,8 +4348,8 @@ ; HASWELL-LABEL: test_paddsb: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpaddsb %xmm1, %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: vpaddsb (%rdi), %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpaddsb (%rdi), %xmm0, %xmm0 # sched: [7:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_paddsb: ; BROADWELL: # %bb.0: @@ -4419,8 +4419,8 @@ ; HASWELL-LABEL: test_paddsw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpaddsw %xmm1, %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: vpaddsw (%rdi), %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpaddsw (%rdi), %xmm0, %xmm0 # sched: [7:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_paddsw: ; BROADWELL: # %bb.0: @@ -4490,8 +4490,8 @@ ; HASWELL-LABEL: test_paddusb: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpaddusb %xmm1, %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: vpaddusb (%rdi), %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpaddusb (%rdi), %xmm0, %xmm0 # sched: [7:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_paddusb: ; BROADWELL: # %bb.0: @@ -4561,8 +4561,8 @@ ; HASWELL-LABEL: test_paddusw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpaddusw %xmm1, %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: vpaddusw (%rdi), %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpaddusw (%rdi), %xmm0, %xmm0 # sched: [7:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_paddusw: ; BROADWELL: # %bb.0: @@ -4632,8 +4632,8 @@ ; HASWELL-LABEL: test_paddw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpaddw %xmm1, %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: vpaddw (%rdi), %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpaddw (%rdi), %xmm0, %xmm0 # sched: [7:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_paddw: ; BROADWELL: # %bb.0: @@ -4702,9 +4702,9 @@ ; HASWELL-LABEL: test_pand: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpand %xmm1, %xmm0, %xmm0 # sched: [1:0.33] -; HASWELL-NEXT: vpand (%rdi), %xmm0, %xmm0 # sched: [1:0.50] +; HASWELL-NEXT: vpand (%rdi), %xmm0, %xmm0 # sched: [7:0.50] ; HASWELL-NEXT: vpaddq %xmm1, %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pand: ; BROADWELL: # %bb.0: @@ -4785,9 +4785,9 @@ ; HASWELL-LABEL: test_pandn: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpandn %xmm1, %xmm0, %xmm0 # sched: [1:0.33] -; HASWELL-NEXT: vpandn (%rdi), %xmm0, %xmm1 # sched: [1:0.50] +; HASWELL-NEXT: vpandn (%rdi), %xmm0, %xmm1 # sched: [7:0.50] ; HASWELL-NEXT: vpaddq %xmm1, %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pandn: ; BROADWELL: # %bb.0: @@ -4864,8 +4864,8 @@ ; HASWELL-LABEL: test_pavgb: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpavgb %xmm1, %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: vpavgb (%rdi), %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpavgb (%rdi), %xmm0, %xmm0 # sched: [7:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pavgb: ; BROADWELL: # %bb.0: @@ -4944,8 +4944,8 @@ ; HASWELL-LABEL: test_pavgw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpavgw %xmm1, %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: vpavgw (%rdi), %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpavgw (%rdi), %xmm0, %xmm0 # sched: [7:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pavgw: ; BROADWELL: # %bb.0: @@ -5026,9 +5026,9 @@ ; HASWELL-LABEL: test_pcmpeqb: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpcmpeqb %xmm1, %xmm0, %xmm1 # sched: [1:0.50] -; HASWELL-NEXT: vpcmpeqb (%rdi), %xmm0, %xmm0 # sched: [1:0.50] +; HASWELL-NEXT: vpcmpeqb (%rdi), %xmm0, %xmm0 # sched: [7:0.50] ; HASWELL-NEXT: vpor %xmm0, %xmm1, %xmm0 # sched: [1:0.33] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pcmpeqb: ; BROADWELL: # %bb.0: @@ -5107,9 +5107,9 @@ ; HASWELL-LABEL: test_pcmpeqd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpcmpeqd %xmm1, %xmm0, %xmm1 # sched: [1:0.50] -; HASWELL-NEXT: vpcmpeqd (%rdi), %xmm0, %xmm0 # sched: [1:0.50] +; HASWELL-NEXT: vpcmpeqd (%rdi), %xmm0, %xmm0 # sched: [7:0.50] ; HASWELL-NEXT: vpor %xmm0, %xmm1, %xmm0 # sched: [1:0.33] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pcmpeqd: ; BROADWELL: # %bb.0: @@ -5188,9 +5188,9 @@ ; HASWELL-LABEL: test_pcmpeqw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpcmpeqw %xmm1, %xmm0, %xmm1 # sched: [1:0.50] -; HASWELL-NEXT: vpcmpeqw (%rdi), %xmm0, %xmm0 # sched: [1:0.50] +; HASWELL-NEXT: vpcmpeqw (%rdi), %xmm0, %xmm0 # sched: [7:0.50] ; HASWELL-NEXT: vpor %xmm0, %xmm1, %xmm0 # sched: [1:0.33] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pcmpeqw: ; BROADWELL: # %bb.0: @@ -5270,9 +5270,9 @@ ; HASWELL-LABEL: test_pcmpgtb: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpcmpgtb %xmm1, %xmm0, %xmm1 # sched: [1:0.50] -; HASWELL-NEXT: vpcmpgtb (%rdi), %xmm0, %xmm0 # sched: [1:0.50] +; HASWELL-NEXT: vpcmpgtb (%rdi), %xmm0, %xmm0 # sched: [7:0.50] ; HASWELL-NEXT: vpor %xmm0, %xmm1, %xmm0 # sched: [1:0.33] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pcmpgtb: ; BROADWELL: # %bb.0: @@ -5352,9 +5352,9 @@ ; HASWELL-LABEL: test_pcmpgtd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpcmpgtd %xmm1, %xmm0, %xmm1 # sched: [1:0.50] -; HASWELL-NEXT: vpcmpeqd (%rdi), %xmm0, %xmm0 # sched: [1:0.50] +; HASWELL-NEXT: vpcmpeqd (%rdi), %xmm0, %xmm0 # sched: [7:0.50] ; HASWELL-NEXT: vpor %xmm0, %xmm1, %xmm0 # sched: [1:0.33] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pcmpgtd: ; BROADWELL: # %bb.0: @@ -5434,9 +5434,9 @@ ; HASWELL-LABEL: test_pcmpgtw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpcmpgtw %xmm1, %xmm0, %xmm1 # sched: [1:0.50] -; HASWELL-NEXT: vpcmpgtw (%rdi), %xmm0, %xmm0 # sched: [1:0.50] +; HASWELL-NEXT: vpcmpgtw (%rdi), %xmm0, %xmm0 # sched: [7:0.50] ; HASWELL-NEXT: vpor %xmm0, %xmm1, %xmm0 # sched: [1:0.33] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pcmpgtw: ; BROADWELL: # %bb.0: @@ -5510,7 +5510,7 @@ ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpextrw $6, %xmm0, %eax # sched: [2:1.00] ; HASWELL-NEXT: # kill: %ax %ax %eax -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pextrw: ; BROADWELL: # %bb.0: @@ -5577,8 +5577,8 @@ ; HASWELL-LABEL: test_pinsrw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpinsrw $1, %edi, %xmm0, %xmm0 # sched: [2:2.00] -; HASWELL-NEXT: vpinsrw $3, (%rsi), %xmm0, %xmm0 # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpinsrw $3, (%rsi), %xmm0, %xmm0 # sched: [6:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pinsrw: ; BROADWELL: # %bb.0: @@ -5651,8 +5651,8 @@ ; HASWELL-LABEL: test_pmaddwd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpmaddwd %xmm1, %xmm0, %xmm0 # sched: [5:1.00] -; HASWELL-NEXT: vpmaddwd (%rdi), %xmm0, %xmm0 # sched: [5:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpmaddwd (%rdi), %xmm0, %xmm0 # sched: [11:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmaddwd: ; BROADWELL: # %bb.0: @@ -5723,8 +5723,8 @@ ; HASWELL-LABEL: test_pmaxsw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpmaxsw %xmm1, %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: vpmaxsw (%rdi), %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpmaxsw (%rdi), %xmm0, %xmm0 # sched: [7:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmaxsw: ; BROADWELL: # %bb.0: @@ -5794,8 +5794,8 @@ ; HASWELL-LABEL: test_pmaxub: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpmaxub %xmm1, %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: vpmaxub (%rdi), %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpmaxub (%rdi), %xmm0, %xmm0 # sched: [7:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmaxub: ; BROADWELL: # %bb.0: @@ -5865,8 +5865,8 @@ ; HASWELL-LABEL: test_pminsw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpminsw %xmm1, %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: vpminsw (%rdi), %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpminsw (%rdi), %xmm0, %xmm0 # sched: [7:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pminsw: ; BROADWELL: # %bb.0: @@ -5936,8 +5936,8 @@ ; HASWELL-LABEL: test_pminub: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpminub %xmm1, %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: vpminub (%rdi), %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpminub (%rdi), %xmm0, %xmm0 # sched: [7:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pminub: ; BROADWELL: # %bb.0: @@ -6001,7 +6001,7 @@ ; HASWELL-LABEL: test_pmovmskb: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpmovmskb %xmm0, %eax # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmovmskb: ; BROADWELL: # %bb.0: @@ -6060,8 +6060,8 @@ ; HASWELL-LABEL: test_pmulhuw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpmulhuw %xmm1, %xmm0, %xmm0 # sched: [5:1.00] -; HASWELL-NEXT: vpmulhuw (%rdi), %xmm0, %xmm0 # sched: [5:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpmulhuw (%rdi), %xmm0, %xmm0 # sched: [11:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmulhuw: ; BROADWELL: # %bb.0: @@ -6127,8 +6127,8 @@ ; HASWELL-LABEL: test_pmulhw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpmulhw %xmm1, %xmm0, %xmm0 # sched: [5:1.00] -; HASWELL-NEXT: vpmulhw (%rdi), %xmm0, %xmm0 # sched: [5:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpmulhw (%rdi), %xmm0, %xmm0 # sched: [11:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmulhw: ; BROADWELL: # %bb.0: @@ -6194,8 +6194,8 @@ ; HASWELL-LABEL: test_pmullw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpmullw %xmm1, %xmm0, %xmm0 # sched: [5:1.00] -; HASWELL-NEXT: vpmullw (%rdi), %xmm0, %xmm0 # sched: [5:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpmullw (%rdi), %xmm0, %xmm0 # sched: [11:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmullw: ; BROADWELL: # %bb.0: @@ -6268,8 +6268,8 @@ ; HASWELL-LABEL: test_pmuludq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpmuludq %xmm1, %xmm0, %xmm0 # sched: [5:1.00] -; HASWELL-NEXT: vpmuludq (%rdi), %xmm0, %xmm0 # sched: [5:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpmuludq (%rdi), %xmm0, %xmm0 # sched: [11:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmuludq: ; BROADWELL: # %bb.0: @@ -6340,9 +6340,9 @@ ; HASWELL-LABEL: test_por: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpor %xmm1, %xmm0, %xmm0 # sched: [1:0.33] -; HASWELL-NEXT: vpor (%rdi), %xmm0, %xmm0 # sched: [1:0.50] +; HASWELL-NEXT: vpor (%rdi), %xmm0, %xmm0 # sched: [7:0.50] ; HASWELL-NEXT: vpaddq %xmm1, %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_por: ; BROADWELL: # %bb.0: @@ -6421,8 +6421,8 @@ ; HASWELL-LABEL: test_psadbw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpsadbw %xmm1, %xmm0, %xmm0 # sched: [5:1.00] -; HASWELL-NEXT: vpsadbw (%rdi), %xmm0, %xmm0 # sched: [5:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpsadbw (%rdi), %xmm0, %xmm0 # sched: [11:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_psadbw: ; BROADWELL: # %bb.0: @@ -6495,9 +6495,9 @@ ; HASWELL-LABEL: test_pshufd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpshufd {{.*#+}} xmm0 = xmm0[1,0,3,2] sched: [1:1.00] -; HASWELL-NEXT: vpshufd {{.*#+}} xmm1 = mem[3,2,1,0] sched: [1:1.00] +; HASWELL-NEXT: vpshufd {{.*#+}} xmm1 = mem[3,2,1,0] sched: [7:1.00] ; HASWELL-NEXT: vpaddd %xmm1, %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pshufd: ; BROADWELL: # %bb.0: @@ -6574,9 +6574,9 @@ ; HASWELL-LABEL: test_pshufhw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpshufhw {{.*#+}} xmm0 = xmm0[0,1,2,3,5,4,7,6] sched: [1:1.00] -; HASWELL-NEXT: vpshufhw {{.*#+}} xmm1 = mem[0,1,2,3,7,6,5,4] sched: [1:1.00] +; HASWELL-NEXT: vpshufhw {{.*#+}} xmm1 = mem[0,1,2,3,7,6,5,4] sched: [7:1.00] ; HASWELL-NEXT: vpaddw %xmm1, %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pshufhw: ; BROADWELL: # %bb.0: @@ -6653,9 +6653,9 @@ ; HASWELL-LABEL: test_pshuflw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpshuflw {{.*#+}} xmm0 = xmm0[1,0,3,2,4,5,6,7] sched: [1:1.00] -; HASWELL-NEXT: vpshuflw {{.*#+}} xmm1 = mem[3,2,1,0,4,5,6,7] sched: [1:1.00] +; HASWELL-NEXT: vpshuflw {{.*#+}} xmm1 = mem[3,2,1,0,4,5,6,7] sched: [7:1.00] ; HASWELL-NEXT: vpaddw %xmm1, %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pshuflw: ; BROADWELL: # %bb.0: @@ -6730,9 +6730,9 @@ ; HASWELL-LABEL: test_pslld: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpslld %xmm1, %xmm0, %xmm0 # sched: [2:1.00] -; HASWELL-NEXT: vpslld (%rdi), %xmm0, %xmm0 # sched: [2:1.00] +; HASWELL-NEXT: vpslld (%rdi), %xmm0, %xmm0 # sched: [8:1.00] ; HASWELL-NEXT: vpslld $2, %xmm0, %xmm0 # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pslld: ; BROADWELL: # %bb.0: @@ -6807,7 +6807,7 @@ ; HASWELL-LABEL: test_pslldq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpslldq {{.*#+}} xmm0 = zero,zero,zero,zero,xmm0[0,1,2,3,4,5,6,7,8,9,10,11] sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pslldq: ; BROADWELL: # %bb.0: @@ -6869,9 +6869,9 @@ ; HASWELL-LABEL: test_psllq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpsllq %xmm1, %xmm0, %xmm0 # sched: [2:1.00] -; HASWELL-NEXT: vpsllq (%rdi), %xmm0, %xmm0 # sched: [2:1.00] +; HASWELL-NEXT: vpsllq (%rdi), %xmm0, %xmm0 # sched: [8:1.00] ; HASWELL-NEXT: vpsllq $2, %xmm0, %xmm0 # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_psllq: ; BROADWELL: # %bb.0: @@ -6948,9 +6948,9 @@ ; HASWELL-LABEL: test_psllw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpsllw %xmm1, %xmm0, %xmm0 # sched: [2:1.00] -; HASWELL-NEXT: vpsllw (%rdi), %xmm0, %xmm0 # sched: [2:1.00] +; HASWELL-NEXT: vpsllw (%rdi), %xmm0, %xmm0 # sched: [8:1.00] ; HASWELL-NEXT: vpsllw $2, %xmm0, %xmm0 # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_psllw: ; BROADWELL: # %bb.0: @@ -7027,9 +7027,9 @@ ; HASWELL-LABEL: test_psrad: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpsrad %xmm1, %xmm0, %xmm0 # sched: [2:1.00] -; HASWELL-NEXT: vpsrad (%rdi), %xmm0, %xmm0 # sched: [2:1.00] +; HASWELL-NEXT: vpsrad (%rdi), %xmm0, %xmm0 # sched: [8:1.00] ; HASWELL-NEXT: vpsrad $2, %xmm0, %xmm0 # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_psrad: ; BROADWELL: # %bb.0: @@ -7106,9 +7106,9 @@ ; HASWELL-LABEL: test_psraw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpsraw %xmm1, %xmm0, %xmm0 # sched: [2:1.00] -; HASWELL-NEXT: vpsraw (%rdi), %xmm0, %xmm0 # sched: [2:1.00] +; HASWELL-NEXT: vpsraw (%rdi), %xmm0, %xmm0 # sched: [8:1.00] ; HASWELL-NEXT: vpsraw $2, %xmm0, %xmm0 # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_psraw: ; BROADWELL: # %bb.0: @@ -7185,9 +7185,9 @@ ; HASWELL-LABEL: test_psrld: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpsrld %xmm1, %xmm0, %xmm0 # sched: [2:1.00] -; HASWELL-NEXT: vpsrld (%rdi), %xmm0, %xmm0 # sched: [2:1.00] +; HASWELL-NEXT: vpsrld (%rdi), %xmm0, %xmm0 # sched: [8:1.00] ; HASWELL-NEXT: vpsrld $2, %xmm0, %xmm0 # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_psrld: ; BROADWELL: # %bb.0: @@ -7262,7 +7262,7 @@ ; HASWELL-LABEL: test_psrldq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpsrldq {{.*#+}} xmm0 = xmm0[4,5,6,7,8,9,10,11,12,13,14,15],zero,zero,zero,zero sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_psrldq: ; BROADWELL: # %bb.0: @@ -7324,9 +7324,9 @@ ; HASWELL-LABEL: test_psrlq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpsrlq %xmm1, %xmm0, %xmm0 # sched: [2:1.00] -; HASWELL-NEXT: vpsrlq (%rdi), %xmm0, %xmm0 # sched: [2:1.00] +; HASWELL-NEXT: vpsrlq (%rdi), %xmm0, %xmm0 # sched: [8:1.00] ; HASWELL-NEXT: vpsrlq $2, %xmm0, %xmm0 # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_psrlq: ; BROADWELL: # %bb.0: @@ -7403,9 +7403,9 @@ ; HASWELL-LABEL: test_psrlw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpsrlw %xmm1, %xmm0, %xmm0 # sched: [2:1.00] -; HASWELL-NEXT: vpsrlw (%rdi), %xmm0, %xmm0 # sched: [2:1.00] +; HASWELL-NEXT: vpsrlw (%rdi), %xmm0, %xmm0 # sched: [8:1.00] ; HASWELL-NEXT: vpsrlw $2, %xmm0, %xmm0 # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_psrlw: ; BROADWELL: # %bb.0: @@ -7482,8 +7482,8 @@ ; HASWELL-LABEL: test_psubb: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpsubb %xmm1, %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: vpsubb (%rdi), %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpsubb (%rdi), %xmm0, %xmm0 # sched: [7:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_psubb: ; BROADWELL: # %bb.0: @@ -7552,8 +7552,8 @@ ; HASWELL-LABEL: test_psubd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpsubd %xmm1, %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: vpsubd (%rdi), %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpsubd (%rdi), %xmm0, %xmm0 # sched: [7:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_psubd: ; BROADWELL: # %bb.0: @@ -7618,8 +7618,8 @@ ; HASWELL-LABEL: test_psubq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpsubq %xmm1, %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: vpsubq (%rdi), %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpsubq (%rdi), %xmm0, %xmm0 # sched: [7:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_psubq: ; BROADWELL: # %bb.0: @@ -7688,8 +7688,8 @@ ; HASWELL-LABEL: test_psubsb: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpsubsb %xmm1, %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: vpsubsb (%rdi), %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpsubsb (%rdi), %xmm0, %xmm0 # sched: [7:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_psubsb: ; BROADWELL: # %bb.0: @@ -7759,8 +7759,8 @@ ; HASWELL-LABEL: test_psubsw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpsubsw %xmm1, %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: vpsubsw (%rdi), %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpsubsw (%rdi), %xmm0, %xmm0 # sched: [7:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_psubsw: ; BROADWELL: # %bb.0: @@ -7830,8 +7830,8 @@ ; HASWELL-LABEL: test_psubusb: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpsubusb %xmm1, %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: vpsubusb (%rdi), %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpsubusb (%rdi), %xmm0, %xmm0 # sched: [7:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_psubusb: ; BROADWELL: # %bb.0: @@ -7901,8 +7901,8 @@ ; HASWELL-LABEL: test_psubusw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpsubusw %xmm1, %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: vpsubusw (%rdi), %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpsubusw (%rdi), %xmm0, %xmm0 # sched: [7:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_psubusw: ; BROADWELL: # %bb.0: @@ -7972,8 +7972,8 @@ ; HASWELL-LABEL: test_psubw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpsubw %xmm1, %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: vpsubw (%rdi), %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpsubw (%rdi), %xmm0, %xmm0 # sched: [7:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_psubw: ; BROADWELL: # %bb.0: @@ -8042,8 +8042,8 @@ ; HASWELL-LABEL: test_punpckhbw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpunpckhbw {{.*#+}} xmm0 = xmm0[8],xmm1[8],xmm0[9],xmm1[9],xmm0[10],xmm1[10],xmm0[11],xmm1[11],xmm0[12],xmm1[12],xmm0[13],xmm1[13],xmm0[14],xmm1[14],xmm0[15],xmm1[15] sched: [1:1.00] -; HASWELL-NEXT: vpunpckhbw {{.*#+}} xmm0 = xmm0[8],mem[8],xmm0[9],mem[9],xmm0[10],mem[10],xmm0[11],mem[11],xmm0[12],mem[12],xmm0[13],mem[13],xmm0[14],mem[14],xmm0[15],mem[15] sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpunpckhbw {{.*#+}} xmm0 = xmm0[8],mem[8],xmm0[9],mem[9],xmm0[10],mem[10],xmm0[11],mem[11],xmm0[12],mem[12],xmm0[13],mem[13],xmm0[14],mem[14],xmm0[15],mem[15] sched: [7:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_punpckhbw: ; BROADWELL: # %bb.0: @@ -8114,9 +8114,9 @@ ; HASWELL-LABEL: test_punpckhdq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpunpckhdq {{.*#+}} xmm0 = xmm0[2],xmm1[2],xmm0[3],xmm1[3] sched: [1:1.00] -; HASWELL-NEXT: vpunpckhdq {{.*#+}} xmm1 = xmm1[2],mem[2],xmm1[3],mem[3] sched: [1:1.00] +; HASWELL-NEXT: vpunpckhdq {{.*#+}} xmm1 = xmm1[2],mem[2],xmm1[3],mem[3] sched: [7:1.00] ; HASWELL-NEXT: vpaddd %xmm1, %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_punpckhdq: ; BROADWELL: # %bb.0: @@ -8191,9 +8191,9 @@ ; HASWELL-LABEL: test_punpckhqdq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpunpckhqdq {{.*#+}} xmm0 = xmm0[1],xmm1[1] sched: [1:1.00] -; HASWELL-NEXT: vpunpckhqdq {{.*#+}} xmm1 = xmm1[1],mem[1] sched: [1:1.00] +; HASWELL-NEXT: vpunpckhqdq {{.*#+}} xmm1 = xmm1[1],mem[1] sched: [7:1.00] ; HASWELL-NEXT: vpaddq %xmm1, %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_punpckhqdq: ; BROADWELL: # %bb.0: @@ -8268,8 +8268,8 @@ ; HASWELL-LABEL: test_punpckhwd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpunpckhwd {{.*#+}} xmm0 = xmm0[4],xmm1[4],xmm0[5],xmm1[5],xmm0[6],xmm1[6],xmm0[7],xmm1[7] sched: [1:1.00] -; HASWELL-NEXT: vpunpckhwd {{.*#+}} xmm0 = xmm0[4],mem[4],xmm0[5],mem[5],xmm0[6],mem[6],xmm0[7],mem[7] sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpunpckhwd {{.*#+}} xmm0 = xmm0[4],mem[4],xmm0[5],mem[5],xmm0[6],mem[6],xmm0[7],mem[7] sched: [7:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_punpckhwd: ; BROADWELL: # %bb.0: @@ -8338,8 +8338,8 @@ ; HASWELL-LABEL: test_punpcklbw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpunpcklbw {{.*#+}} xmm0 = xmm0[0],xmm1[0],xmm0[1],xmm1[1],xmm0[2],xmm1[2],xmm0[3],xmm1[3],xmm0[4],xmm1[4],xmm0[5],xmm1[5],xmm0[6],xmm1[6],xmm0[7],xmm1[7] sched: [1:1.00] -; HASWELL-NEXT: vpunpcklbw {{.*#+}} xmm0 = xmm0[0],mem[0],xmm0[1],mem[1],xmm0[2],mem[2],xmm0[3],mem[3],xmm0[4],mem[4],xmm0[5],mem[5],xmm0[6],mem[6],xmm0[7],mem[7] sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpunpcklbw {{.*#+}} xmm0 = xmm0[0],mem[0],xmm0[1],mem[1],xmm0[2],mem[2],xmm0[3],mem[3],xmm0[4],mem[4],xmm0[5],mem[5],xmm0[6],mem[6],xmm0[7],mem[7] sched: [7:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_punpcklbw: ; BROADWELL: # %bb.0: @@ -8410,9 +8410,9 @@ ; HASWELL-LABEL: test_punpckldq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpunpckldq {{.*#+}} xmm0 = xmm0[0],xmm1[0],xmm0[1],xmm1[1] sched: [1:1.00] -; HASWELL-NEXT: vpunpckldq {{.*#+}} xmm1 = xmm1[0],mem[0],xmm1[1],mem[1] sched: [1:1.00] +; HASWELL-NEXT: vpunpckldq {{.*#+}} xmm1 = xmm1[0],mem[0],xmm1[1],mem[1] sched: [7:1.00] ; HASWELL-NEXT: vpaddd %xmm1, %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_punpckldq: ; BROADWELL: # %bb.0: @@ -8487,9 +8487,9 @@ ; HASWELL-LABEL: test_punpcklqdq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpunpcklqdq {{.*#+}} xmm0 = xmm0[0],xmm1[0] sched: [1:1.00] -; HASWELL-NEXT: vpunpcklqdq {{.*#+}} xmm1 = xmm1[0],mem[0] sched: [1:1.00] +; HASWELL-NEXT: vpunpcklqdq {{.*#+}} xmm1 = xmm1[0],mem[0] sched: [7:1.00] ; HASWELL-NEXT: vpaddq %xmm1, %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_punpcklqdq: ; BROADWELL: # %bb.0: @@ -8564,8 +8564,8 @@ ; HASWELL-LABEL: test_punpcklwd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpunpcklwd {{.*#+}} xmm0 = xmm0[0],xmm1[0],xmm0[1],xmm1[1],xmm0[2],xmm1[2],xmm0[3],xmm1[3] sched: [1:1.00] -; HASWELL-NEXT: vpunpcklwd {{.*#+}} xmm0 = xmm0[0],mem[0],xmm0[1],mem[1],xmm0[2],mem[2],xmm0[3],mem[3] sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpunpcklwd {{.*#+}} xmm0 = xmm0[0],mem[0],xmm0[1],mem[1],xmm0[2],mem[2],xmm0[3],mem[3] sched: [7:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_punpcklwd: ; BROADWELL: # %bb.0: @@ -8634,9 +8634,9 @@ ; HASWELL-LABEL: test_pxor: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpxor %xmm1, %xmm0, %xmm0 # sched: [1:0.33] -; HASWELL-NEXT: vpxor (%rdi), %xmm0, %xmm0 # sched: [1:0.50] +; HASWELL-NEXT: vpxor (%rdi), %xmm0, %xmm0 # sched: [7:0.50] ; HASWELL-NEXT: vpaddq %xmm1, %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pxor: ; BROADWELL: # %bb.0: @@ -8711,9 +8711,9 @@ ; HASWELL-LABEL: test_shufpd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vshufpd {{.*#+}} xmm0 = xmm0[1],xmm1[0] sched: [1:1.00] -; HASWELL-NEXT: vshufpd {{.*#+}} xmm1 = xmm1[1],mem[0] sched: [1:1.00] +; HASWELL-NEXT: vshufpd {{.*#+}} xmm1 = xmm1[1],mem[0] sched: [7:1.00] ; HASWELL-NEXT: vaddpd %xmm1, %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_shufpd: ; BROADWELL: # %bb.0: @@ -8789,9 +8789,9 @@ ; HASWELL-LABEL: test_sqrtpd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vsqrtpd %xmm0, %xmm0 # sched: [21:1.00] -; HASWELL-NEXT: vsqrtpd (%rdi), %xmm1 # sched: [21:1.00] +; HASWELL-NEXT: vsqrtpd (%rdi), %xmm1 # sched: [27:1.00] ; HASWELL-NEXT: vaddpd %xmm1, %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_sqrtpd: ; BROADWELL: # %bb.0: @@ -8873,10 +8873,10 @@ ; HASWELL-LABEL: test_sqrtsd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vsqrtsd %xmm0, %xmm0, %xmm0 # sched: [21:1.00] -; HASWELL-NEXT: vmovapd (%rdi), %xmm1 # sched: [1:0.50] +; HASWELL-NEXT: vmovapd (%rdi), %xmm1 # sched: [6:0.50] ; HASWELL-NEXT: vsqrtsd %xmm1, %xmm1, %xmm1 # sched: [21:1.00] ; HASWELL-NEXT: vaddpd %xmm1, %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_sqrtsd: ; BROADWELL: # %bb.0: @@ -8953,8 +8953,8 @@ ; HASWELL-LABEL: test_subpd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vsubpd %xmm1, %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: vsubpd (%rdi), %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vsubpd (%rdi), %xmm0, %xmm0 # sched: [9:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_subpd: ; BROADWELL: # %bb.0: @@ -9019,8 +9019,8 @@ ; HASWELL-LABEL: test_subsd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vsubsd %xmm1, %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: vsubsd (%rdi), %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vsubsd (%rdi), %xmm0, %xmm0 # sched: [8:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_subsd: ; BROADWELL: # %bb.0: @@ -9120,13 +9120,13 @@ ; HASWELL-NEXT: setnp %al # sched: [1:0.50] ; HASWELL-NEXT: sete %cl # sched: [1:0.50] ; HASWELL-NEXT: andb %al, %cl # sched: [1:0.25] -; HASWELL-NEXT: vucomisd (%rdi), %xmm0 # sched: [7:1.00] +; HASWELL-NEXT: vucomisd (%rdi), %xmm0 # sched: [8:1.00] ; HASWELL-NEXT: setnp %al # sched: [1:0.50] ; HASWELL-NEXT: sete %dl # sched: [1:0.50] ; HASWELL-NEXT: andb %al, %dl # sched: [1:0.25] ; HASWELL-NEXT: orb %cl, %dl # sched: [1:0.25] ; HASWELL-NEXT: movzbl %dl, %eax # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_ucomisd: ; BROADWELL: # %bb.0: @@ -9237,9 +9237,9 @@ ; HASWELL-LABEL: test_unpckhpd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vunpckhpd {{.*#+}} xmm0 = xmm0[1],xmm1[1] sched: [1:1.00] -; HASWELL-NEXT: vunpckhpd {{.*#+}} xmm1 = xmm1[1],mem[1] sched: [1:1.00] +; HASWELL-NEXT: vunpckhpd {{.*#+}} xmm1 = xmm1[1],mem[1] sched: [7:1.00] ; HASWELL-NEXT: vaddpd %xmm1, %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_unpckhpd: ; BROADWELL: # %bb.0: @@ -9320,9 +9320,9 @@ ; HASWELL-LABEL: test_unpcklpd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vunpcklpd {{.*#+}} xmm0 = xmm0[0],xmm1[0] sched: [1:1.00] -; HASWELL-NEXT: vunpcklpd {{.*#+}} xmm1 = xmm0[0],mem[0] sched: [1:1.00] +; HASWELL-NEXT: vunpcklpd {{.*#+}} xmm1 = xmm0[0],mem[0] sched: [7:1.00] ; HASWELL-NEXT: vaddpd %xmm1, %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_unpcklpd: ; BROADWELL: # %bb.0: @@ -9397,9 +9397,9 @@ ; HASWELL-LABEL: test_xorpd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vxorpd %xmm1, %xmm0, %xmm0 # sched: [1:1.00] -; HASWELL-NEXT: vxorpd (%rdi), %xmm0, %xmm0 # sched: [1:1.00] +; HASWELL-NEXT: vxorpd (%rdi), %xmm0, %xmm0 # sched: [7:1.00] ; HASWELL-NEXT: vaddpd %xmm0, %xmm1, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_xorpd: ; BROADWELL: # %bb.0: Index: test/CodeGen/X86/sse3-schedule.ll =================================================================== --- test/CodeGen/X86/sse3-schedule.ll +++ test/CodeGen/X86/sse3-schedule.ll @@ -39,8 +39,8 @@ ; HASWELL-LABEL: test_addsubpd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vaddsubpd %xmm1, %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: vaddsubpd (%rdi), %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vaddsubpd (%rdi), %xmm0, %xmm0 # sched: [9:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_addsubpd: ; BROADWELL: # %bb.0: @@ -106,8 +106,8 @@ ; HASWELL-LABEL: test_addsubps: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vaddsubps %xmm1, %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: vaddsubps (%rdi), %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vaddsubps (%rdi), %xmm0, %xmm0 # sched: [9:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_addsubps: ; BROADWELL: # %bb.0: @@ -173,8 +173,8 @@ ; HASWELL-LABEL: test_haddpd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vhaddpd %xmm1, %xmm0, %xmm0 # sched: [5:2.00] -; HASWELL-NEXT: vhaddpd (%rdi), %xmm0, %xmm0 # sched: [5:2.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vhaddpd (%rdi), %xmm0, %xmm0 # sched: [11:2.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_haddpd: ; BROADWELL: # %bb.0: @@ -240,8 +240,8 @@ ; HASWELL-LABEL: test_haddps: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vhaddps %xmm1, %xmm0, %xmm0 # sched: [5:2.00] -; HASWELL-NEXT: vhaddps (%rdi), %xmm0, %xmm0 # sched: [5:2.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vhaddps (%rdi), %xmm0, %xmm0 # sched: [11:2.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_haddps: ; BROADWELL: # %bb.0: @@ -307,8 +307,8 @@ ; HASWELL-LABEL: test_hsubpd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vhsubpd %xmm1, %xmm0, %xmm0 # sched: [5:2.00] -; HASWELL-NEXT: vhsubpd (%rdi), %xmm0, %xmm0 # sched: [5:2.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vhsubpd (%rdi), %xmm0, %xmm0 # sched: [11:2.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_hsubpd: ; BROADWELL: # %bb.0: @@ -374,8 +374,8 @@ ; HASWELL-LABEL: test_hsubps: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vhsubps %xmm1, %xmm0, %xmm0 # sched: [5:2.00] -; HASWELL-NEXT: vhsubps (%rdi), %xmm0, %xmm0 # sched: [5:2.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vhsubps (%rdi), %xmm0, %xmm0 # sched: [11:2.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_hsubps: ; BROADWELL: # %bb.0: @@ -438,8 +438,8 @@ ; ; HASWELL-LABEL: test_lddqu: ; HASWELL: # %bb.0: -; HASWELL-NEXT: vlddqu (%rdi), %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vlddqu (%rdi), %xmm0 # sched: [6:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_lddqu: ; BROADWELL: # %bb.0: @@ -504,7 +504,7 @@ ; HASWELL-NEXT: leaq (%rdi), %rax # sched: [1:0.50] ; HASWELL-NEXT: movl %esi, %ecx # sched: [1:0.25] ; HASWELL-NEXT: monitor # sched: [100:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_monitor: ; BROADWELL: # %bb.0: @@ -578,9 +578,9 @@ ; HASWELL-LABEL: test_movddup: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vmovddup {{.*#+}} xmm0 = xmm0[0,0] sched: [1:1.00] -; HASWELL-NEXT: vmovddup {{.*#+}} xmm1 = mem[0,0] sched: [1:0.50] +; HASWELL-NEXT: vmovddup {{.*#+}} xmm1 = mem[0,0] sched: [5:0.50] ; HASWELL-NEXT: vsubpd %xmm0, %xmm1, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_movddup: ; BROADWELL: # %bb.0: @@ -656,9 +656,9 @@ ; HASWELL-LABEL: test_movshdup: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vmovshdup {{.*#+}} xmm0 = xmm0[1,1,3,3] sched: [1:1.00] -; HASWELL-NEXT: vmovshdup {{.*#+}} xmm1 = mem[1,1,3,3] sched: [1:0.50] +; HASWELL-NEXT: vmovshdup {{.*#+}} xmm1 = mem[1,1,3,3] sched: [6:0.50] ; HASWELL-NEXT: vaddps %xmm1, %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_movshdup: ; BROADWELL: # %bb.0: @@ -734,9 +734,9 @@ ; HASWELL-LABEL: test_movsldup: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vmovsldup {{.*#+}} xmm0 = xmm0[0,0,2,2] sched: [1:1.00] -; HASWELL-NEXT: vmovsldup {{.*#+}} xmm1 = mem[0,0,2,2] sched: [1:0.50] +; HASWELL-NEXT: vmovsldup {{.*#+}} xmm1 = mem[0,0,2,2] sched: [6:0.50] ; HASWELL-NEXT: vaddps %xmm1, %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_movsldup: ; BROADWELL: # %bb.0: @@ -813,7 +813,7 @@ ; HASWELL-NEXT: movl %edi, %ecx # sched: [1:0.25] ; HASWELL-NEXT: movl %esi, %eax # sched: [1:0.25] ; HASWELL-NEXT: mwait # sched: [20:2.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_mwait: ; BROADWELL: # %bb.0: Index: test/CodeGen/X86/sse41-schedule.ll =================================================================== --- test/CodeGen/X86/sse41-schedule.ll +++ test/CodeGen/X86/sse41-schedule.ll @@ -36,8 +36,8 @@ ; HASWELL: # %bb.0: ; HASWELL-NEXT: vblendpd {{.*#+}} xmm0 = xmm0[0],xmm1[1] sched: [1:0.33] ; HASWELL-NEXT: vaddpd %xmm0, %xmm1, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: vblendpd {{.*#+}} xmm0 = xmm0[0],mem[1] sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vblendpd {{.*#+}} xmm0 = xmm0[0],mem[1] sched: [7:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_blendpd: ; BROADWELL: # %bb.0: @@ -103,8 +103,8 @@ ; HASWELL-LABEL: test_blendps: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vblendps {{.*#+}} xmm0 = xmm0[0],xmm1[1,2],xmm0[3] sched: [1:0.33] -; HASWELL-NEXT: vblendps {{.*#+}} xmm0 = xmm0[0],mem[1],xmm0[2,3] sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vblendps {{.*#+}} xmm0 = xmm0[0],mem[1],xmm0[2,3] sched: [7:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_blendps: ; BROADWELL: # %bb.0: @@ -169,8 +169,8 @@ ; HASWELL-LABEL: test_blendvpd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vblendvpd %xmm2, %xmm1, %xmm0, %xmm0 # sched: [2:2.00] -; HASWELL-NEXT: vblendvpd %xmm2, (%rdi), %xmm0, %xmm0 # sched: [2:2.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vblendvpd %xmm2, (%rdi), %xmm0, %xmm0 # sched: [8:2.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_blendvpd: ; BROADWELL: # %bb.0: @@ -236,8 +236,8 @@ ; HASWELL-LABEL: test_blendvps: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vblendvps %xmm2, %xmm1, %xmm0, %xmm0 # sched: [2:2.00] -; HASWELL-NEXT: vblendvps %xmm2, (%rdi), %xmm0, %xmm0 # sched: [2:2.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vblendvps %xmm2, (%rdi), %xmm0, %xmm0 # sched: [8:2.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_blendvps: ; BROADWELL: # %bb.0: @@ -297,8 +297,8 @@ ; HASWELL-LABEL: test_dppd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vdppd $7, %xmm1, %xmm0, %xmm0 # sched: [9:1.00] -; HASWELL-NEXT: vdppd $7, (%rdi), %xmm0, %xmm0 # sched: [9:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vdppd $7, (%rdi), %xmm0, %xmm0 # sched: [15:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_dppd: ; BROADWELL: # %bb.0: @@ -358,8 +358,8 @@ ; HASWELL-LABEL: test_dpps: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vdpps $7, %xmm1, %xmm0, %xmm0 # sched: [14:2.00] -; HASWELL-NEXT: vdpps $7, (%rdi), %xmm0, %xmm0 # sched: [14:2.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vdpps $7, (%rdi), %xmm0, %xmm0 # sched: [20:2.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_dpps: ; BROADWELL: # %bb.0: @@ -419,8 +419,8 @@ ; HASWELL-LABEL: test_extractps: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vextractps $3, %xmm0, %eax # sched: [2:1.00] -; HASWELL-NEXT: vextractps $1, %xmm0, (%rdi) # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vextractps $1, %xmm0, (%rdi) # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_extractps: ; BROADWELL: # %bb.0: @@ -481,8 +481,8 @@ ; HASWELL-LABEL: test_insertps: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vinsertps {{.*#+}} xmm0 = zero,xmm1[0],xmm0[2,3] sched: [1:1.00] -; HASWELL-NEXT: vinsertps {{.*#+}} xmm0 = xmm0[0,1,2],mem[0] sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vinsertps {{.*#+}} xmm0 = xmm0[0,1,2],mem[0] sched: [7:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_insertps: ; BROADWELL: # %bb.0: @@ -538,8 +538,8 @@ ; ; HASWELL-LABEL: test_movntdqa: ; HASWELL: # %bb.0: -; HASWELL-NEXT: vmovntdqa (%rdi), %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vmovntdqa (%rdi), %xmm0 # sched: [6:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_movntdqa: ; BROADWELL: # %bb.0: @@ -592,8 +592,8 @@ ; HASWELL-LABEL: test_mpsadbw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vmpsadbw $7, %xmm1, %xmm0, %xmm0 # sched: [7:2.00] -; HASWELL-NEXT: vmpsadbw $7, (%rdi), %xmm0, %xmm0 # sched: [7:2.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vmpsadbw $7, (%rdi), %xmm0, %xmm0 # sched: [13:2.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_mpsadbw: ; BROADWELL: # %bb.0: @@ -654,8 +654,8 @@ ; HASWELL-LABEL: test_packusdw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpackusdw %xmm1, %xmm0, %xmm0 # sched: [1:1.00] -; HASWELL-NEXT: vpackusdw (%rdi), %xmm0, %xmm0 # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpackusdw (%rdi), %xmm0, %xmm0 # sched: [7:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_packusdw: ; BROADWELL: # %bb.0: @@ -722,8 +722,8 @@ ; HASWELL-LABEL: test_pblendvb: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpblendvb %xmm2, %xmm1, %xmm0, %xmm0 # sched: [2:2.00] -; HASWELL-NEXT: vpblendvb %xmm2, (%rdi), %xmm0, %xmm0 # sched: [2:2.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpblendvb %xmm2, (%rdi), %xmm0, %xmm0 # sched: [8:2.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pblendvb: ; BROADWELL: # %bb.0: @@ -783,8 +783,8 @@ ; HASWELL-LABEL: test_pblendw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpblendw {{.*#+}} xmm0 = xmm0[0],xmm1[1],xmm0[2],xmm1[3],xmm0[4],xmm1[5],xmm0[6],xmm1[7] sched: [1:1.00] -; HASWELL-NEXT: vpblendw {{.*#+}} xmm0 = xmm0[0,1],mem[2,3],xmm0[4,5,6],mem[7] sched: [4:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpblendw {{.*#+}} xmm0 = xmm0[0,1],mem[2,3],xmm0[4,5,6],mem[7] sched: [7:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pblendw: ; BROADWELL: # %bb.0: @@ -843,8 +843,8 @@ ; HASWELL-LABEL: test_pcmpeqq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpcmpeqq %xmm1, %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: vpcmpeqq (%rdi), %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpcmpeqq (%rdi), %xmm0, %xmm0 # sched: [7:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pcmpeqq: ; BROADWELL: # %bb.0: @@ -907,8 +907,8 @@ ; HASWELL-LABEL: test_pextrb: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpextrb $3, %xmm0, %eax # sched: [2:1.00] -; HASWELL-NEXT: vpextrb $1, %xmm0, (%rdi) # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpextrb $1, %xmm0, (%rdi) # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pextrb: ; BROADWELL: # %bb.0: @@ -972,8 +972,8 @@ ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpaddd %xmm0, %xmm0, %xmm0 # sched: [1:0.50] ; HASWELL-NEXT: vpextrd $3, %xmm0, %eax # sched: [2:1.00] -; HASWELL-NEXT: vpextrd $1, %xmm0, (%rdi) # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpextrd $1, %xmm0, (%rdi) # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pextrd: ; BROADWELL: # %bb.0: @@ -1038,8 +1038,8 @@ ; HASWELL-LABEL: test_pextrq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpextrq $1, %xmm0, %rax # sched: [2:1.00] -; HASWELL-NEXT: vpextrq $1, %xmm0, (%rdi) # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpextrq $1, %xmm0, (%rdi) # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pextrq: ; BROADWELL: # %bb.0: @@ -1098,8 +1098,8 @@ ; HASWELL-LABEL: test_pextrw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpextrw $3, %xmm0, %eax # sched: [2:1.00] -; HASWELL-NEXT: vpextrw $1, %xmm0, (%rdi) # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpextrw $1, %xmm0, (%rdi) # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pextrw: ; BROADWELL: # %bb.0: @@ -1158,9 +1158,9 @@ ; ; HASWELL-LABEL: test_phminposuw: ; HASWELL: # %bb.0: -; HASWELL-NEXT: vphminposuw (%rdi), %xmm0 # sched: [5:1.00] +; HASWELL-NEXT: vphminposuw (%rdi), %xmm0 # sched: [11:1.00] ; HASWELL-NEXT: vphminposuw %xmm0, %xmm0 # sched: [5:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_phminposuw: ; BROADWELL: # %bb.0: @@ -1220,8 +1220,8 @@ ; HASWELL-LABEL: test_pinsrb: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpinsrb $1, %edi, %xmm0, %xmm0 # sched: [2:2.00] -; HASWELL-NEXT: vpinsrb $3, (%rsi), %xmm0, %xmm0 # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpinsrb $3, (%rsi), %xmm0, %xmm0 # sched: [6:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pinsrb: ; BROADWELL: # %bb.0: @@ -1280,8 +1280,8 @@ ; HASWELL-LABEL: test_pinsrd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpinsrd $1, %edi, %xmm0, %xmm0 # sched: [2:2.00] -; HASWELL-NEXT: vpinsrd $3, (%rsi), %xmm0, %xmm0 # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpinsrd $3, (%rsi), %xmm0, %xmm0 # sched: [6:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pinsrd: ; BROADWELL: # %bb.0: @@ -1343,9 +1343,9 @@ ; HASWELL-LABEL: test_pinsrq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpinsrq $1, %rdi, %xmm0, %xmm0 # sched: [2:2.00] -; HASWELL-NEXT: vpinsrq $1, (%rsi), %xmm1, %xmm1 # sched: [1:1.00] +; HASWELL-NEXT: vpinsrq $1, (%rsi), %xmm1, %xmm1 # sched: [6:1.00] ; HASWELL-NEXT: vpaddq %xmm1, %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pinsrq: ; BROADWELL: # %bb.0: @@ -1410,8 +1410,8 @@ ; HASWELL-LABEL: test_pmaxsb: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpmaxsb %xmm1, %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: vpmaxsb (%rdi), %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpmaxsb (%rdi), %xmm0, %xmm0 # sched: [7:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmaxsb: ; BROADWELL: # %bb.0: @@ -1471,8 +1471,8 @@ ; HASWELL-LABEL: test_pmaxsd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpmaxsd %xmm1, %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: vpmaxsd (%rdi), %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpmaxsd (%rdi), %xmm0, %xmm0 # sched: [7:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmaxsd: ; BROADWELL: # %bb.0: @@ -1532,8 +1532,8 @@ ; HASWELL-LABEL: test_pmaxud: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpmaxud %xmm1, %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: vpmaxud (%rdi), %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpmaxud (%rdi), %xmm0, %xmm0 # sched: [7:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmaxud: ; BROADWELL: # %bb.0: @@ -1593,8 +1593,8 @@ ; HASWELL-LABEL: test_pmaxuw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpmaxuw %xmm1, %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: vpmaxuw (%rdi), %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpmaxuw (%rdi), %xmm0, %xmm0 # sched: [7:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmaxuw: ; BROADWELL: # %bb.0: @@ -1654,8 +1654,8 @@ ; HASWELL-LABEL: test_pminsb: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpminsb %xmm1, %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: vpminsb (%rdi), %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpminsb (%rdi), %xmm0, %xmm0 # sched: [7:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pminsb: ; BROADWELL: # %bb.0: @@ -1715,8 +1715,8 @@ ; HASWELL-LABEL: test_pminsd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpminsd %xmm1, %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: vpminsd (%rdi), %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpminsd (%rdi), %xmm0, %xmm0 # sched: [7:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pminsd: ; BROADWELL: # %bb.0: @@ -1776,8 +1776,8 @@ ; HASWELL-LABEL: test_pminud: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpminud %xmm1, %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: vpminud (%rdi), %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpminud (%rdi), %xmm0, %xmm0 # sched: [7:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pminud: ; BROADWELL: # %bb.0: @@ -1837,8 +1837,8 @@ ; HASWELL-LABEL: test_pminuw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpminuw %xmm1, %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: vpminuw (%rdi), %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpminuw (%rdi), %xmm0, %xmm0 # sched: [7:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pminuw: ; BROADWELL: # %bb.0: @@ -1902,9 +1902,9 @@ ; HASWELL-LABEL: test_pmovsxbw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpmovsxbw %xmm0, %xmm0 # sched: [1:1.00] -; HASWELL-NEXT: vpmovsxbw (%rdi), %xmm1 # sched: [1:1.00] +; HASWELL-NEXT: vpmovsxbw (%rdi), %xmm1 # sched: [6:1.00] ; HASWELL-NEXT: vpaddw %xmm1, %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmovsxbw: ; BROADWELL: # %bb.0: @@ -1974,9 +1974,9 @@ ; HASWELL-LABEL: test_pmovsxbd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpmovsxbd %xmm0, %xmm0 # sched: [1:1.00] -; HASWELL-NEXT: vpmovsxbd (%rdi), %xmm1 # sched: [1:1.00] +; HASWELL-NEXT: vpmovsxbd (%rdi), %xmm1 # sched: [6:1.00] ; HASWELL-NEXT: vpaddd %xmm1, %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmovsxbd: ; BROADWELL: # %bb.0: @@ -2046,9 +2046,9 @@ ; HASWELL-LABEL: test_pmovsxbq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpmovsxbq %xmm0, %xmm0 # sched: [1:1.00] -; HASWELL-NEXT: vpmovsxbq (%rdi), %xmm1 # sched: [1:1.00] +; HASWELL-NEXT: vpmovsxbq (%rdi), %xmm1 # sched: [6:1.00] ; HASWELL-NEXT: vpaddq %xmm1, %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmovsxbq: ; BROADWELL: # %bb.0: @@ -2118,9 +2118,9 @@ ; HASWELL-LABEL: test_pmovsxdq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpmovsxdq %xmm0, %xmm0 # sched: [1:1.00] -; HASWELL-NEXT: vpmovsxdq (%rdi), %xmm1 # sched: [1:1.00] +; HASWELL-NEXT: vpmovsxdq (%rdi), %xmm1 # sched: [6:1.00] ; HASWELL-NEXT: vpaddq %xmm1, %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmovsxdq: ; BROADWELL: # %bb.0: @@ -2190,9 +2190,9 @@ ; HASWELL-LABEL: test_pmovsxwd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpmovsxwd %xmm0, %xmm0 # sched: [1:1.00] -; HASWELL-NEXT: vpmovsxwd (%rdi), %xmm1 # sched: [1:1.00] +; HASWELL-NEXT: vpmovsxwd (%rdi), %xmm1 # sched: [6:1.00] ; HASWELL-NEXT: vpaddd %xmm1, %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmovsxwd: ; BROADWELL: # %bb.0: @@ -2262,9 +2262,9 @@ ; HASWELL-LABEL: test_pmovsxwq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpmovsxwq %xmm0, %xmm0 # sched: [1:1.00] -; HASWELL-NEXT: vpmovsxwq (%rdi), %xmm1 # sched: [1:1.00] +; HASWELL-NEXT: vpmovsxwq (%rdi), %xmm1 # sched: [6:1.00] ; HASWELL-NEXT: vpaddq %xmm1, %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmovsxwq: ; BROADWELL: # %bb.0: @@ -2334,9 +2334,9 @@ ; HASWELL-LABEL: test_pmovzxbw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpmovzxbw {{.*#+}} xmm0 = xmm0[0],zero,xmm0[1],zero,xmm0[2],zero,xmm0[3],zero,xmm0[4],zero,xmm0[5],zero,xmm0[6],zero,xmm0[7],zero sched: [1:1.00] -; HASWELL-NEXT: vpmovzxbw {{.*#+}} xmm1 = mem[0],zero,mem[1],zero,mem[2],zero,mem[3],zero,mem[4],zero,mem[5],zero,mem[6],zero,mem[7],zero sched: [1:1.00] +; HASWELL-NEXT: vpmovzxbw {{.*#+}} xmm1 = mem[0],zero,mem[1],zero,mem[2],zero,mem[3],zero,mem[4],zero,mem[5],zero,mem[6],zero,mem[7],zero sched: [6:1.00] ; HASWELL-NEXT: vpaddw %xmm1, %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmovzxbw: ; BROADWELL: # %bb.0: @@ -2406,9 +2406,9 @@ ; HASWELL-LABEL: test_pmovzxbd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpmovzxbd {{.*#+}} xmm0 = xmm0[0],zero,zero,zero,xmm0[1],zero,zero,zero,xmm0[2],zero,zero,zero,xmm0[3],zero,zero,zero sched: [1:1.00] -; HASWELL-NEXT: vpmovzxbd {{.*#+}} xmm1 = mem[0],zero,zero,zero,mem[1],zero,zero,zero,mem[2],zero,zero,zero,mem[3],zero,zero,zero sched: [1:1.00] +; HASWELL-NEXT: vpmovzxbd {{.*#+}} xmm1 = mem[0],zero,zero,zero,mem[1],zero,zero,zero,mem[2],zero,zero,zero,mem[3],zero,zero,zero sched: [6:1.00] ; HASWELL-NEXT: vpaddd %xmm1, %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmovzxbd: ; BROADWELL: # %bb.0: @@ -2478,9 +2478,9 @@ ; HASWELL-LABEL: test_pmovzxbq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpmovzxbq {{.*#+}} xmm0 = xmm0[0],zero,zero,zero,zero,zero,zero,zero,xmm0[1],zero,zero,zero,zero,zero,zero,zero sched: [1:1.00] -; HASWELL-NEXT: vpmovzxbq {{.*#+}} xmm1 = mem[0],zero,zero,zero,zero,zero,zero,zero,mem[1],zero,zero,zero,zero,zero,zero,zero sched: [1:1.00] +; HASWELL-NEXT: vpmovzxbq {{.*#+}} xmm1 = mem[0],zero,zero,zero,zero,zero,zero,zero,mem[1],zero,zero,zero,zero,zero,zero,zero sched: [6:1.00] ; HASWELL-NEXT: vpaddq %xmm1, %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmovzxbq: ; BROADWELL: # %bb.0: @@ -2550,9 +2550,9 @@ ; HASWELL-LABEL: test_pmovzxdq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpmovzxdq {{.*#+}} xmm0 = xmm0[0],zero,xmm0[1],zero sched: [1:1.00] -; HASWELL-NEXT: vpmovzxdq {{.*#+}} xmm1 = mem[0],zero,mem[1],zero sched: [1:1.00] +; HASWELL-NEXT: vpmovzxdq {{.*#+}} xmm1 = mem[0],zero,mem[1],zero sched: [6:1.00] ; HASWELL-NEXT: vpaddq %xmm1, %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmovzxdq: ; BROADWELL: # %bb.0: @@ -2622,9 +2622,9 @@ ; HASWELL-LABEL: test_pmovzxwd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpmovzxwd {{.*#+}} xmm0 = xmm0[0],zero,xmm0[1],zero,xmm0[2],zero,xmm0[3],zero sched: [1:1.00] -; HASWELL-NEXT: vpmovzxwd {{.*#+}} xmm1 = mem[0],zero,mem[1],zero,mem[2],zero,mem[3],zero sched: [1:1.00] +; HASWELL-NEXT: vpmovzxwd {{.*#+}} xmm1 = mem[0],zero,mem[1],zero,mem[2],zero,mem[3],zero sched: [6:1.00] ; HASWELL-NEXT: vpaddd %xmm1, %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmovzxwd: ; BROADWELL: # %bb.0: @@ -2694,9 +2694,9 @@ ; HASWELL-LABEL: test_pmovzxwq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpmovzxwq {{.*#+}} xmm0 = xmm0[0],zero,zero,zero,xmm0[1],zero,zero,zero sched: [1:1.00] -; HASWELL-NEXT: vpmovzxwq {{.*#+}} xmm1 = mem[0],zero,zero,zero,mem[1],zero,zero,zero sched: [1:1.00] +; HASWELL-NEXT: vpmovzxwq {{.*#+}} xmm1 = mem[0],zero,zero,zero,mem[1],zero,zero,zero sched: [6:1.00] ; HASWELL-NEXT: vpaddq %xmm1, %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmovzxwq: ; BROADWELL: # %bb.0: @@ -2762,8 +2762,8 @@ ; HASWELL-LABEL: test_pmuldq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpmuldq %xmm1, %xmm0, %xmm0 # sched: [5:1.00] -; HASWELL-NEXT: vpmuldq (%rdi), %xmm0, %xmm0 # sched: [5:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpmuldq (%rdi), %xmm0, %xmm0 # sched: [11:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmuldq: ; BROADWELL: # %bb.0: @@ -2824,8 +2824,8 @@ ; HASWELL-LABEL: test_pmulld: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpmulld %xmm1, %xmm0, %xmm0 # sched: [10:2.00] -; HASWELL-NEXT: vpmulld (%rdi), %xmm0, %xmm0 # sched: [10:2.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpmulld (%rdi), %xmm0, %xmm0 # sched: [16:2.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmulld: ; BROADWELL: # %bb.0: @@ -2897,11 +2897,11 @@ ; HASWELL: # %bb.0: ; HASWELL-NEXT: vptest %xmm1, %xmm0 # sched: [2:1.00] ; HASWELL-NEXT: setb %al # sched: [1:0.50] -; HASWELL-NEXT: vptest (%rdi), %xmm0 # sched: [2:1.00] +; HASWELL-NEXT: vptest (%rdi), %xmm0 # sched: [8:1.00] ; HASWELL-NEXT: setb %cl # sched: [1:0.50] ; HASWELL-NEXT: andb %al, %cl # sched: [1:0.25] ; HASWELL-NEXT: movzbl %cl, %eax # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_ptest: ; BROADWELL: # %bb.0: @@ -2985,10 +2985,10 @@ ; ; HASWELL-LABEL: test_roundpd: ; HASWELL: # %bb.0: -; HASWELL-NEXT: vroundpd $7, %xmm0, %xmm0 # sched: [5:1.25] -; HASWELL-NEXT: vroundpd $7, (%rdi), %xmm1 # sched: [6:2.00] +; HASWELL-NEXT: vroundpd $7, %xmm0, %xmm0 # sched: [6:0.50] +; HASWELL-NEXT: vroundpd $7, (%rdi), %xmm1 # sched: [12:2.00] ; HASWELL-NEXT: vaddpd %xmm1, %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_roundpd: ; BROADWELL: # %bb.0: @@ -3057,10 +3057,10 @@ ; ; HASWELL-LABEL: test_roundps: ; HASWELL: # %bb.0: -; HASWELL-NEXT: vroundps $7, %xmm0, %xmm0 # sched: [5:1.25] -; HASWELL-NEXT: vroundps $7, (%rdi), %xmm1 # sched: [6:2.00] +; HASWELL-NEXT: vroundps $7, %xmm0, %xmm0 # sched: [6:0.50] +; HASWELL-NEXT: vroundps $7, (%rdi), %xmm1 # sched: [12:2.00] ; HASWELL-NEXT: vaddps %xmm1, %xmm0, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_roundps: ; BROADWELL: # %bb.0: @@ -3130,10 +3130,10 @@ ; ; HASWELL-LABEL: test_roundsd: ; HASWELL: # %bb.0: -; HASWELL-NEXT: vroundsd $7, %xmm1, %xmm0, %xmm1 # sched: [5:1.25] -; HASWELL-NEXT: vroundsd $7, (%rdi), %xmm0, %xmm0 # sched: [6:2.00] +; HASWELL-NEXT: vroundsd $7, %xmm1, %xmm0, %xmm1 # sched: [6:0.50] +; HASWELL-NEXT: vroundsd $7, (%rdi), %xmm0, %xmm0 # sched: [12:2.00] ; HASWELL-NEXT: vaddpd %xmm0, %xmm1, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_roundsd: ; BROADWELL: # %bb.0: @@ -3203,10 +3203,10 @@ ; ; HASWELL-LABEL: test_roundss: ; HASWELL: # %bb.0: -; HASWELL-NEXT: vroundss $7, %xmm1, %xmm0, %xmm1 # sched: [5:1.25] -; HASWELL-NEXT: vroundss $7, (%rdi), %xmm0, %xmm0 # sched: [6:2.00] +; HASWELL-NEXT: vroundss $7, %xmm1, %xmm0, %xmm1 # sched: [6:0.50] +; HASWELL-NEXT: vroundss $7, (%rdi), %xmm0, %xmm0 # sched: [12:2.00] ; HASWELL-NEXT: vaddps %xmm0, %xmm1, %xmm0 # sched: [3:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_roundss: ; BROADWELL: # %bb.0: Index: test/CodeGen/X86/sse42-schedule.ll =================================================================== --- test/CodeGen/X86/sse42-schedule.ll +++ test/CodeGen/X86/sse42-schedule.ll @@ -35,9 +35,9 @@ ; HASWELL-LABEL: crc32_32_8: ; HASWELL: # %bb.0: ; HASWELL-NEXT: crc32b %sil, %edi # sched: [3:1.00] -; HASWELL-NEXT: crc32b (%rdx), %edi # sched: [7:1.00] +; HASWELL-NEXT: crc32b (%rdx), %edi # sched: [8:1.00] ; HASWELL-NEXT: movl %edi, %eax # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: crc32_32_8: ; BROADWELL: # %bb.0: @@ -105,9 +105,9 @@ ; HASWELL-LABEL: crc32_32_16: ; HASWELL: # %bb.0: ; HASWELL-NEXT: crc32w %si, %edi # sched: [3:1.00] -; HASWELL-NEXT: crc32w (%rdx), %edi # sched: [7:1.00] +; HASWELL-NEXT: crc32w (%rdx), %edi # sched: [8:1.00] ; HASWELL-NEXT: movl %edi, %eax # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: crc32_32_16: ; BROADWELL: # %bb.0: @@ -175,9 +175,9 @@ ; HASWELL-LABEL: crc32_32_32: ; HASWELL: # %bb.0: ; HASWELL-NEXT: crc32l %esi, %edi # sched: [3:1.00] -; HASWELL-NEXT: crc32l (%rdx), %edi # sched: [7:1.00] +; HASWELL-NEXT: crc32l (%rdx), %edi # sched: [8:1.00] ; HASWELL-NEXT: movl %edi, %eax # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: crc32_32_32: ; BROADWELL: # %bb.0: @@ -245,9 +245,9 @@ ; HASWELL-LABEL: crc32_64_8: ; HASWELL: # %bb.0: ; HASWELL-NEXT: crc32b %sil, %edi # sched: [3:1.00] -; HASWELL-NEXT: crc32b (%rdx), %edi # sched: [7:1.00] +; HASWELL-NEXT: crc32b (%rdx), %edi # sched: [8:1.00] ; HASWELL-NEXT: movq %rdi, %rax # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: crc32_64_8: ; BROADWELL: # %bb.0: @@ -315,9 +315,9 @@ ; HASWELL-LABEL: crc32_64_64: ; HASWELL: # %bb.0: ; HASWELL-NEXT: crc32q %rsi, %rdi # sched: [3:1.00] -; HASWELL-NEXT: crc32q (%rdx), %rdi # sched: [7:1.00] +; HASWELL-NEXT: crc32q (%rdx), %rdi # sched: [8:1.00] ; HASWELL-NEXT: movq %rdi, %rax # sched: [1:0.25] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: crc32_64_64: ; BROADWELL: # %bb.0: @@ -408,10 +408,10 @@ ; HASWELL-NEXT: movl %ecx, %esi # sched: [1:0.25] ; HASWELL-NEXT: movl $7, %eax # sched: [1:0.25] ; HASWELL-NEXT: movl $7, %edx # sched: [1:0.25] -; HASWELL-NEXT: vpcmpestri $7, (%rdi), %xmm0 # sched: [18:4.00] +; HASWELL-NEXT: vpcmpestri $7, (%rdi), %xmm0 # sched: [24:4.00] ; HASWELL-NEXT: # kill: %ecx %ecx %rcx ; HASWELL-NEXT: leal (%rcx,%rsi), %eax # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pcmpestri: ; BROADWELL: # %bb.0: @@ -523,8 +523,8 @@ ; HASWELL-NEXT: vpcmpestrm $7, %xmm1, %xmm0 # sched: [19:4.00] ; HASWELL-NEXT: movl $7, %eax # sched: [1:0.25] ; HASWELL-NEXT: movl $7, %edx # sched: [1:0.25] -; HASWELL-NEXT: vpcmpestrm $7, (%rdi), %xmm0 # sched: [19:4.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpcmpestrm $7, (%rdi), %xmm0 # sched: [25:4.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pcmpestrm: ; BROADWELL: # %bb.0: @@ -614,10 +614,10 @@ ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpcmpistri $7, %xmm1, %xmm0 # sched: [11:3.00] ; HASWELL-NEXT: movl %ecx, %eax # sched: [1:0.25] -; HASWELL-NEXT: vpcmpistri $7, (%rdi), %xmm0 # sched: [11:3.00] +; HASWELL-NEXT: vpcmpistri $7, (%rdi), %xmm0 # sched: [17:3.00] ; HASWELL-NEXT: # kill: %ecx %ecx %rcx ; HASWELL-NEXT: leal (%rcx,%rax), %eax # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pcmpistri: ; BROADWELL: # %bb.0: @@ -693,8 +693,8 @@ ; HASWELL-LABEL: test_pcmpistrm: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpcmpistrm $7, %xmm1, %xmm0 # sched: [11:3.00] -; HASWELL-NEXT: vpcmpistrm $7, (%rdi), %xmm0 # sched: [11:3.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpcmpistrm $7, (%rdi), %xmm0 # sched: [17:3.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pcmpistrm: ; BROADWELL: # %bb.0: @@ -754,8 +754,8 @@ ; HASWELL-LABEL: test_pcmpgtq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpcmpgtq %xmm1, %xmm0, %xmm0 # sched: [5:1.00] -; HASWELL-NEXT: vpcmpgtq (%rdi), %xmm0, %xmm0 # sched: [5:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpcmpgtq (%rdi), %xmm0, %xmm0 # sched: [11:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pcmpgtq: ; BROADWELL: # %bb.0: @@ -818,8 +818,8 @@ ; HASWELL-LABEL: test_pclmulqdq: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpclmulqdq $0, %xmm1, %xmm0, %xmm0 # sched: [11:2.00] -; HASWELL-NEXT: vpclmulqdq $0, (%rdi), %xmm0, %xmm0 # sched: [11:2.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpclmulqdq $0, (%rdi), %xmm0, %xmm0 # sched: [17:2.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pclmulqdq: ; BROADWELL: # %bb.0: Index: test/CodeGen/X86/ssse3-schedule.ll =================================================================== --- test/CodeGen/X86/ssse3-schedule.ll +++ test/CodeGen/X86/ssse3-schedule.ll @@ -44,9 +44,9 @@ ; HASWELL-LABEL: test_pabsb: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpabsb %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: vpabsb (%rdi), %xmm1 # sched: [1:0.50] +; HASWELL-NEXT: vpabsb (%rdi), %xmm1 # sched: [7:0.50] ; HASWELL-NEXT: vpor %xmm1, %xmm0, %xmm0 # sched: [1:0.33] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pabsb: ; BROADWELL: # %bb.0: @@ -123,9 +123,9 @@ ; HASWELL-LABEL: test_pabsd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpabsd %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: vpabsd (%rdi), %xmm1 # sched: [1:0.50] +; HASWELL-NEXT: vpabsd (%rdi), %xmm1 # sched: [7:0.50] ; HASWELL-NEXT: vpor %xmm1, %xmm0, %xmm0 # sched: [1:0.33] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pabsd: ; BROADWELL: # %bb.0: @@ -202,9 +202,9 @@ ; HASWELL-LABEL: test_pabsw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpabsw %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: vpabsw (%rdi), %xmm1 # sched: [1:0.50] +; HASWELL-NEXT: vpabsw (%rdi), %xmm1 # sched: [7:0.50] ; HASWELL-NEXT: vpor %xmm1, %xmm0, %xmm0 # sched: [1:0.33] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pabsw: ; BROADWELL: # %bb.0: @@ -281,8 +281,8 @@ ; HASWELL-LABEL: test_palignr: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpalignr {{.*#+}} xmm0 = xmm0[6,7,8,9,10,11,12,13,14,15],xmm1[0,1,2,3,4,5] sched: [1:1.00] -; HASWELL-NEXT: vpalignr {{.*#+}} xmm0 = mem[14,15],xmm0[0,1,2,3,4,5,6,7,8,9,10,11,12,13] sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpalignr {{.*#+}} xmm0 = mem[14,15],xmm0[0,1,2,3,4,5,6,7,8,9,10,11,12,13] sched: [7:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_palignr: ; BROADWELL: # %bb.0: @@ -347,8 +347,8 @@ ; HASWELL-LABEL: test_phaddd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vphaddd %xmm1, %xmm0, %xmm0 # sched: [3:2.00] -; HASWELL-NEXT: vphaddd (%rdi), %xmm0, %xmm0 # sched: [3:2.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vphaddd (%rdi), %xmm0, %xmm0 # sched: [9:2.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_phaddd: ; BROADWELL: # %bb.0: @@ -414,8 +414,8 @@ ; HASWELL-LABEL: test_phaddsw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vphaddsw %xmm1, %xmm0, %xmm0 # sched: [3:2.00] -; HASWELL-NEXT: vphaddsw (%rdi), %xmm0, %xmm0 # sched: [3:2.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vphaddsw (%rdi), %xmm0, %xmm0 # sched: [9:2.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_phaddsw: ; BROADWELL: # %bb.0: @@ -481,8 +481,8 @@ ; HASWELL-LABEL: test_phaddw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vphaddw %xmm1, %xmm0, %xmm0 # sched: [3:2.00] -; HASWELL-NEXT: vphaddw (%rdi), %xmm0, %xmm0 # sched: [3:2.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vphaddw (%rdi), %xmm0, %xmm0 # sched: [9:2.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_phaddw: ; BROADWELL: # %bb.0: @@ -548,8 +548,8 @@ ; HASWELL-LABEL: test_phsubd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vphsubd %xmm1, %xmm0, %xmm0 # sched: [3:2.00] -; HASWELL-NEXT: vphsubd (%rdi), %xmm0, %xmm0 # sched: [3:2.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vphsubd (%rdi), %xmm0, %xmm0 # sched: [9:2.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_phsubd: ; BROADWELL: # %bb.0: @@ -615,8 +615,8 @@ ; HASWELL-LABEL: test_phsubsw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vphsubsw %xmm1, %xmm0, %xmm0 # sched: [3:2.00] -; HASWELL-NEXT: vphsubsw (%rdi), %xmm0, %xmm0 # sched: [3:2.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vphsubsw (%rdi), %xmm0, %xmm0 # sched: [9:2.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_phsubsw: ; BROADWELL: # %bb.0: @@ -682,8 +682,8 @@ ; HASWELL-LABEL: test_phsubw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vphsubw %xmm1, %xmm0, %xmm0 # sched: [3:2.00] -; HASWELL-NEXT: vphsubw (%rdi), %xmm0, %xmm0 # sched: [3:2.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vphsubw (%rdi), %xmm0, %xmm0 # sched: [9:2.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_phsubw: ; BROADWELL: # %bb.0: @@ -749,8 +749,8 @@ ; HASWELL-LABEL: test_pmaddubsw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpmaddubsw %xmm1, %xmm0, %xmm0 # sched: [5:1.00] -; HASWELL-NEXT: vpmaddubsw (%rdi), %xmm0, %xmm0 # sched: [5:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpmaddubsw (%rdi), %xmm0, %xmm0 # sched: [11:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmaddubsw: ; BROADWELL: # %bb.0: @@ -817,8 +817,8 @@ ; HASWELL-LABEL: test_pmulhrsw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpmulhrsw %xmm1, %xmm0, %xmm0 # sched: [5:1.00] -; HASWELL-NEXT: vpmulhrsw (%rdi), %xmm0, %xmm0 # sched: [5:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpmulhrsw (%rdi), %xmm0, %xmm0 # sched: [11:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pmulhrsw: ; BROADWELL: # %bb.0: @@ -884,8 +884,8 @@ ; HASWELL-LABEL: test_pshufb: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpshufb %xmm1, %xmm0, %xmm0 # sched: [1:1.00] -; HASWELL-NEXT: vpshufb (%rdi), %xmm0, %xmm0 # sched: [1:1.00] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpshufb (%rdi), %xmm0, %xmm0 # sched: [7:1.00] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_pshufb: ; BROADWELL: # %bb.0: @@ -955,8 +955,8 @@ ; HASWELL-LABEL: test_psignb: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpsignb %xmm1, %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: vpsignb (%rdi), %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpsignb (%rdi), %xmm0, %xmm0 # sched: [7:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_psignb: ; BROADWELL: # %bb.0: @@ -1026,8 +1026,8 @@ ; HASWELL-LABEL: test_psignd: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpsignd %xmm1, %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: vpsignd (%rdi), %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpsignd (%rdi), %xmm0, %xmm0 # sched: [7:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_psignd: ; BROADWELL: # %bb.0: @@ -1097,8 +1097,8 @@ ; HASWELL-LABEL: test_psignw: ; HASWELL: # %bb.0: ; HASWELL-NEXT: vpsignw %xmm1, %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: vpsignw (%rdi), %xmm0, %xmm0 # sched: [1:0.50] -; HASWELL-NEXT: retq # sched: [2:1.00] +; HASWELL-NEXT: vpsignw (%rdi), %xmm0, %xmm0 # sched: [7:0.50] +; HASWELL-NEXT: retq # sched: [7:1.00] ; ; BROADWELL-LABEL: test_psignw: ; BROADWELL: # %bb.0: Index: test/CodeGen/X86/x87-schedule.ll =================================================================== --- test/CodeGen/X86/x87-schedule.ll +++ test/CodeGen/X86/x87-schedule.ll @@ -45,7 +45,7 @@ ; HASWELL-NEXT: #APP ; HASWELL-NEXT: f2xm1 # sched: [100:0.25] ; HASWELL-NEXT: #NO_APP -; HASWELL-NEXT: retl # sched: [5:0.50] +; HASWELL-NEXT: retl # sched: [7:1.00] ; ; BROADWELL-LABEL: test_f2xm1: ; BROADWELL: # %bb.0: @@ -119,7 +119,7 @@ ; HASWELL-NEXT: #APP ; HASWELL-NEXT: fabs # sched: [1:1.00] ; HASWELL-NEXT: #NO_APP -; HASWELL-NEXT: retl # sched: [5:0.50] +; HASWELL-NEXT: retl # sched: [7:1.00] ; ; BROADWELL-LABEL: test_fabs: ; BROADWELL: # %bb.0: @@ -210,15 +210,15 @@ ; ; HASWELL-LABEL: test_fadd: ; HASWELL: # %bb.0: -; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %eax # sched: [1:0.50] -; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %ecx # sched: [1:0.50] +; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %eax # sched: [5:0.50] +; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %ecx # sched: [5:0.50] ; HASWELL-NEXT: #APP ; HASWELL-NEXT: fadd %st(0), %st(1) # sched: [3:1.00] ; HASWELL-NEXT: fadd %st(2) # sched: [3:1.00] -; HASWELL-NEXT: fadds (%ecx) # sched: [3:1.00] -; HASWELL-NEXT: faddl (%eax) # sched: [3:1.00] +; HASWELL-NEXT: fadds (%ecx) # sched: [10:1.00] +; HASWELL-NEXT: faddl (%eax) # sched: [10:1.00] ; HASWELL-NEXT: #NO_APP -; HASWELL-NEXT: retl # sched: [5:0.50] +; HASWELL-NEXT: retl # sched: [7:1.00] ; ; BROADWELL-LABEL: test_fadd: ; BROADWELL: # %bb.0: @@ -334,15 +334,15 @@ ; ; HASWELL-LABEL: test_faddp_fiadd: ; HASWELL: # %bb.0: -; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %eax # sched: [1:0.50] -; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %ecx # sched: [1:0.50] +; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %eax # sched: [5:0.50] +; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %ecx # sched: [5:0.50] ; HASWELL-NEXT: #APP ; HASWELL-NEXT: faddp %st(1) # sched: [3:1.00] ; HASWELL-NEXT: faddp %st(2) # sched: [3:1.00] -; HASWELL-NEXT: fiadds (%ecx) # sched: [6:2.00] -; HASWELL-NEXT: fiaddl (%eax) # sched: [6:2.00] +; HASWELL-NEXT: fiadds (%ecx) # sched: [13:2.00] +; HASWELL-NEXT: fiaddl (%eax) # sched: [13:2.00] ; HASWELL-NEXT: #NO_APP -; HASWELL-NEXT: retl # sched: [5:0.50] +; HASWELL-NEXT: retl # sched: [7:1.00] ; ; BROADWELL-LABEL: test_faddp_fiadd: ; BROADWELL: # %bb.0: @@ -444,7 +444,7 @@ ; HASWELL-NEXT: #APP ; HASWELL-NEXT: fchs # sched: [1:1.00] ; HASWELL-NEXT: #NO_APP -; HASWELL-NEXT: retl # sched: [5:0.50] +; HASWELL-NEXT: retl # sched: [7:1.00] ; ; BROADWELL-LABEL: test_fchs: ; BROADWELL: # %bb.0: @@ -528,7 +528,7 @@ ; HASWELL-NEXT: fnclex # sched: [1:1.25] ; HASWELL-NEXT: fnclex # sched: [1:1.25] ; HASWELL-NEXT: #NO_APP -; HASWELL-NEXT: retl # sched: [5:0.50] +; HASWELL-NEXT: retl # sched: [7:1.00] ; ; BROADWELL-LABEL: test_fclex_fnclex: ; BROADWELL: # %bb.0: @@ -647,7 +647,7 @@ ; HASWELL-NEXT: fcmovnu %st(1), %st(0) # sched: [3:1.00] ; HASWELL-NEXT: fcmovu %st(1), %st(0) # sched: [3:1.00] ; HASWELL-NEXT: #NO_APP -; HASWELL-NEXT: retl # sched: [5:0.50] +; HASWELL-NEXT: retl # sched: [7:1.00] ; ; BROADWELL-LABEL: test_fcmov: ; BROADWELL: # %bb.0: @@ -773,15 +773,15 @@ ; ; HASWELL-LABEL: test_fcom: ; HASWELL: # %bb.0: -; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %eax # sched: [1:0.50] -; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %ecx # sched: [1:0.50] +; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %eax # sched: [5:0.50] +; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %ecx # sched: [5:0.50] ; HASWELL-NEXT: #APP ; HASWELL-NEXT: fcom %st(1) # sched: [1:1.00] ; HASWELL-NEXT: fcom %st(3) # sched: [1:1.00] -; HASWELL-NEXT: fcoms (%ecx) # sched: [1:1.00] -; HASWELL-NEXT: fcoml (%eax) # sched: [1:1.00] +; HASWELL-NEXT: fcoms (%ecx) # sched: [8:1.00] +; HASWELL-NEXT: fcoml (%eax) # sched: [8:1.00] ; HASWELL-NEXT: #NO_APP -; HASWELL-NEXT: retl # sched: [5:0.50] +; HASWELL-NEXT: retl # sched: [7:1.00] ; ; BROADWELL-LABEL: test_fcom: ; BROADWELL: # %bb.0: @@ -901,16 +901,16 @@ ; ; HASWELL-LABEL: test_fcomp_fcompp: ; HASWELL: # %bb.0: -; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %eax # sched: [1:0.50] -; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %ecx # sched: [1:0.50] +; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %eax # sched: [5:0.50] +; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %ecx # sched: [5:0.50] ; HASWELL-NEXT: #APP ; HASWELL-NEXT: fcomp %st(1) # sched: [1:1.00] ; HASWELL-NEXT: fcomp %st(3) # sched: [1:1.00] -; HASWELL-NEXT: fcomps (%ecx) # sched: [1:1.00] -; HASWELL-NEXT: fcompl (%eax) # sched: [1:1.00] +; HASWELL-NEXT: fcomps (%ecx) # sched: [8:1.00] +; HASWELL-NEXT: fcompl (%eax) # sched: [8:1.00] ; HASWELL-NEXT: fcompp # sched: [1:0.50] ; HASWELL-NEXT: #NO_APP -; HASWELL-NEXT: retl # sched: [5:0.50] +; HASWELL-NEXT: retl # sched: [7:1.00] ; ; BROADWELL-LABEL: test_fcomp_fcompp: ; BROADWELL: # %bb.0: @@ -1019,7 +1019,7 @@ ; HASWELL-NEXT: fcomi %st(3) # sched: [1:0.50] ; HASWELL-NEXT: fcompi %st(3) # sched: [1:0.50] ; HASWELL-NEXT: #NO_APP -; HASWELL-NEXT: retl # sched: [5:0.50] +; HASWELL-NEXT: retl # sched: [7:1.00] ; ; BROADWELL-LABEL: test_fcomi_fcomip: ; BROADWELL: # %bb.0: @@ -1098,7 +1098,7 @@ ; HASWELL-NEXT: #APP ; HASWELL-NEXT: fcos # sched: [100:0.25] ; HASWELL-NEXT: #NO_APP -; HASWELL-NEXT: retl # sched: [5:0.50] +; HASWELL-NEXT: retl # sched: [7:1.00] ; ; BROADWELL-LABEL: test_fcos: ; BROADWELL: # %bb.0: @@ -1172,7 +1172,7 @@ ; HASWELL-NEXT: #APP ; HASWELL-NEXT: fdecstp # sched: [2:1.00] ; HASWELL-NEXT: #NO_APP -; HASWELL-NEXT: retl # sched: [5:0.50] +; HASWELL-NEXT: retl # sched: [7:1.00] ; ; BROADWELL-LABEL: test_fdecstp: ; BROADWELL: # %bb.0: @@ -1263,15 +1263,15 @@ ; ; HASWELL-LABEL: test_fdiv: ; HASWELL: # %bb.0: -; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %eax # sched: [1:0.50] -; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %ecx # sched: [1:0.50] +; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %eax # sched: [5:0.50] +; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %ecx # sched: [5:0.50] ; HASWELL-NEXT: #APP ; HASWELL-NEXT: fdiv %st(0), %st(1) # sched: [24:1.00] ; HASWELL-NEXT: fdiv %st(2) # sched: [20:1.00] -; HASWELL-NEXT: fdivs (%ecx) # sched: [24:1.00] -; HASWELL-NEXT: fdivl (%eax) # sched: [24:1.00] +; HASWELL-NEXT: fdivs (%ecx) # sched: [31:1.00] +; HASWELL-NEXT: fdivl (%eax) # sched: [31:1.00] ; HASWELL-NEXT: #NO_APP -; HASWELL-NEXT: retl # sched: [5:0.50] +; HASWELL-NEXT: retl # sched: [7:1.00] ; ; BROADWELL-LABEL: test_fdiv: ; BROADWELL: # %bb.0: @@ -1387,15 +1387,15 @@ ; ; HASWELL-LABEL: test_fdivp_fidiv: ; HASWELL: # %bb.0: -; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %eax # sched: [1:0.50] -; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %ecx # sched: [1:0.50] +; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %eax # sched: [5:0.50] +; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %ecx # sched: [5:0.50] ; HASWELL-NEXT: #APP ; HASWELL-NEXT: fdivp %st(1) # sched: [24:1.00] ; HASWELL-NEXT: fdivp %st(2) # sched: [24:1.00] -; HASWELL-NEXT: fidivs (%ecx) # sched: [27:1.00] -; HASWELL-NEXT: fidivl (%eax) # sched: [27:1.00] +; HASWELL-NEXT: fidivs (%ecx) # sched: [34:1.00] +; HASWELL-NEXT: fidivl (%eax) # sched: [34:1.00] ; HASWELL-NEXT: #NO_APP -; HASWELL-NEXT: retl # sched: [5:0.50] +; HASWELL-NEXT: retl # sched: [7:1.00] ; ; BROADWELL-LABEL: test_fdivp_fidiv: ; BROADWELL: # %bb.0: @@ -1511,15 +1511,15 @@ ; ; HASWELL-LABEL: test_fdivr: ; HASWELL: # %bb.0: -; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %eax # sched: [1:0.50] -; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %ecx # sched: [1:0.50] +; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %eax # sched: [5:0.50] +; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %ecx # sched: [5:0.50] ; HASWELL-NEXT: #APP ; HASWELL-NEXT: fdivr %st(0), %st(1) # sched: [20:1.00] ; HASWELL-NEXT: fdivr %st(2) # sched: [24:1.00] -; HASWELL-NEXT: fdivrs (%ecx) # sched: [20:1.00] -; HASWELL-NEXT: fdivrl (%eax) # sched: [20:1.00] +; HASWELL-NEXT: fdivrs (%ecx) # sched: [27:1.00] +; HASWELL-NEXT: fdivrl (%eax) # sched: [27:1.00] ; HASWELL-NEXT: #NO_APP -; HASWELL-NEXT: retl # sched: [5:0.50] +; HASWELL-NEXT: retl # sched: [7:1.00] ; ; BROADWELL-LABEL: test_fdivr: ; BROADWELL: # %bb.0: @@ -1635,15 +1635,15 @@ ; ; HASWELL-LABEL: test_fdivrp_fidivr: ; HASWELL: # %bb.0: -; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %eax # sched: [1:0.50] -; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %ecx # sched: [1:0.50] +; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %eax # sched: [5:0.50] +; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %ecx # sched: [5:0.50] ; HASWELL-NEXT: #APP ; HASWELL-NEXT: fdivrp %st(1) # sched: [20:1.00] ; HASWELL-NEXT: fdivrp %st(2) # sched: [20:1.00] -; HASWELL-NEXT: fidivrs (%ecx) # sched: [23:1.00] -; HASWELL-NEXT: fidivrl (%eax) # sched: [23:1.00] +; HASWELL-NEXT: fidivrs (%ecx) # sched: [30:1.00] +; HASWELL-NEXT: fidivrl (%eax) # sched: [30:1.00] ; HASWELL-NEXT: #NO_APP -; HASWELL-NEXT: retl # sched: [5:0.50] +; HASWELL-NEXT: retl # sched: [7:1.00] ; ; BROADWELL-LABEL: test_fdivrp_fidivr: ; BROADWELL: # %bb.0: @@ -1742,7 +1742,7 @@ ; HASWELL-NEXT: #APP ; HASWELL-NEXT: ffree %st(0) # sched: [1:0.50] ; HASWELL-NEXT: #NO_APP -; HASWELL-NEXT: retl # sched: [5:0.50] +; HASWELL-NEXT: retl # sched: [7:1.00] ; ; BROADWELL-LABEL: test_ffree: ; BROADWELL: # %bb.0: @@ -1833,15 +1833,15 @@ ; ; HASWELL-LABEL: test_ficom: ; HASWELL: # %bb.0: -; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %eax # sched: [1:0.50] -; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %ecx # sched: [1:0.50] +; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %eax # sched: [5:0.50] +; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %ecx # sched: [5:0.50] ; HASWELL-NEXT: #APP -; HASWELL-NEXT: ficoms (%ecx) # sched: [4:2.00] -; HASWELL-NEXT: ficoml (%eax) # sched: [4:2.00] -; HASWELL-NEXT: ficomps (%ecx) # sched: [4:2.00] -; HASWELL-NEXT: ficompl (%eax) # sched: [4:2.00] +; HASWELL-NEXT: ficoms (%ecx) # sched: [11:2.00] +; HASWELL-NEXT: ficoml (%eax) # sched: [11:2.00] +; HASWELL-NEXT: ficomps (%ecx) # sched: [11:2.00] +; HASWELL-NEXT: ficompl (%eax) # sched: [11:2.00] ; HASWELL-NEXT: #NO_APP -; HASWELL-NEXT: retl # sched: [5:0.50] +; HASWELL-NEXT: retl # sched: [7:1.00] ; ; BROADWELL-LABEL: test_ficom: ; BROADWELL: # %bb.0: @@ -1957,15 +1957,15 @@ ; ; HASWELL-LABEL: test_fild: ; HASWELL: # %bb.0: -; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %eax # sched: [1:0.50] -; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %ecx # sched: [1:0.50] -; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %edx # sched: [1:0.50] +; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %eax # sched: [5:0.50] +; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %ecx # sched: [5:0.50] +; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %edx # sched: [5:0.50] ; HASWELL-NEXT: #APP -; HASWELL-NEXT: filds (%edx) # sched: [3:1.00] -; HASWELL-NEXT: fildl (%ecx) # sched: [3:1.00] -; HASWELL-NEXT: fildll (%eax) # sched: [3:1.00] +; HASWELL-NEXT: filds (%edx) # sched: [10:1.00] +; HASWELL-NEXT: fildl (%ecx) # sched: [10:1.00] +; HASWELL-NEXT: fildll (%eax) # sched: [10:1.00] ; HASWELL-NEXT: #NO_APP -; HASWELL-NEXT: retl # sched: [5:0.50] +; HASWELL-NEXT: retl # sched: [7:1.00] ; ; BROADWELL-LABEL: test_fild: ; BROADWELL: # %bb.0: @@ -2064,7 +2064,7 @@ ; HASWELL-NEXT: #APP ; HASWELL-NEXT: fincstp # sched: [1:0.50] ; HASWELL-NEXT: #NO_APP -; HASWELL-NEXT: retl # sched: [5:0.50] +; HASWELL-NEXT: retl # sched: [7:1.00] ; ; BROADWELL-LABEL: test_fincstp: ; BROADWELL: # %bb.0: @@ -2148,7 +2148,7 @@ ; HASWELL-NEXT: fninit # sched: [1:?] ; HASWELL-NEXT: fninit # sched: [1:?] ; HASWELL-NEXT: #NO_APP -; HASWELL-NEXT: retl # sched: [5:0.50] +; HASWELL-NEXT: retl # sched: [7:1.00] ; ; BROADWELL-LABEL: test_finit_fninit: ; BROADWELL: # %bb.0: @@ -2266,7 +2266,7 @@ ; HASWELL-NEXT: fldpi # sched: [1:0.50] ; HASWELL-NEXT: fldz # sched: [1:0.50] ; HASWELL-NEXT: #NO_APP -; HASWELL-NEXT: retl # sched: [5:0.50] +; HASWELL-NEXT: retl # sched: [7:1.00] ; ; BROADWELL-LABEL: test_fld1_fldl2e_fldl2t_fldlg2_fldln2_fldpi_fldz: ; BROADWELL: # %bb.0: @@ -2382,15 +2382,15 @@ ; ; HASWELL-LABEL: test_fmul: ; HASWELL: # %bb.0: -; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %eax # sched: [1:0.50] -; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %ecx # sched: [1:0.50] +; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %eax # sched: [5:0.50] +; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %ecx # sched: [5:0.50] ; HASWELL-NEXT: #APP ; HASWELL-NEXT: fmul %st(0), %st(1) # sched: [5:1.00] ; HASWELL-NEXT: fmul %st(2) # sched: [5:1.00] -; HASWELL-NEXT: fmuls (%ecx) # sched: [5:1.00] -; HASWELL-NEXT: fmull (%eax) # sched: [5:1.00] +; HASWELL-NEXT: fmuls (%ecx) # sched: [12:1.00] +; HASWELL-NEXT: fmull (%eax) # sched: [12:1.00] ; HASWELL-NEXT: #NO_APP -; HASWELL-NEXT: retl # sched: [5:0.50] +; HASWELL-NEXT: retl # sched: [7:1.00] ; ; BROADWELL-LABEL: test_fmul: ; BROADWELL: # %bb.0: @@ -2506,15 +2506,15 @@ ; ; HASWELL-LABEL: test_fmulp_fimul: ; HASWELL: # %bb.0: -; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %eax # sched: [1:0.50] -; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %ecx # sched: [1:0.50] +; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %eax # sched: [5:0.50] +; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %ecx # sched: [5:0.50] ; HASWELL-NEXT: #APP ; HASWELL-NEXT: fmulp %st(1) # sched: [5:1.00] ; HASWELL-NEXT: fmulp %st(2) # sched: [5:1.00] -; HASWELL-NEXT: fimuls (%ecx) # sched: [8:1.00] -; HASWELL-NEXT: fimull (%eax) # sched: [8:1.00] +; HASWELL-NEXT: fimuls (%ecx) # sched: [15:1.00] +; HASWELL-NEXT: fimull (%eax) # sched: [15:1.00] ; HASWELL-NEXT: #NO_APP -; HASWELL-NEXT: retl # sched: [5:0.50] +; HASWELL-NEXT: retl # sched: [7:1.00] ; ; BROADWELL-LABEL: test_fmulp_fimul: ; BROADWELL: # %bb.0: @@ -2613,7 +2613,7 @@ ; HASWELL-NEXT: #APP ; HASWELL-NEXT: fnop # sched: [1:0.50] ; HASWELL-NEXT: #NO_APP -; HASWELL-NEXT: retl # sched: [5:0.50] +; HASWELL-NEXT: retl # sched: [7:1.00] ; ; BROADWELL-LABEL: test_fnop: ; BROADWELL: # %bb.0: @@ -2687,7 +2687,7 @@ ; HASWELL-NEXT: #APP ; HASWELL-NEXT: fpatan # sched: [100:0.25] ; HASWELL-NEXT: #NO_APP -; HASWELL-NEXT: retl # sched: [5:0.50] +; HASWELL-NEXT: retl # sched: [7:1.00] ; ; BROADWELL-LABEL: test_fpatan: ; BROADWELL: # %bb.0: @@ -2766,7 +2766,7 @@ ; HASWELL-NEXT: fprem # sched: [19:?] ; HASWELL-NEXT: fprem1 # sched: [19:?] ; HASWELL-NEXT: #NO_APP -; HASWELL-NEXT: retl # sched: [5:0.50] +; HASWELL-NEXT: retl # sched: [7:1.00] ; ; BROADWELL-LABEL: test_fprem_fprem1: ; BROADWELL: # %bb.0: @@ -2845,7 +2845,7 @@ ; HASWELL-NEXT: #APP ; HASWELL-NEXT: fptan # sched: [100:0.25] ; HASWELL-NEXT: #NO_APP -; HASWELL-NEXT: retl # sched: [5:0.50] +; HASWELL-NEXT: retl # sched: [7:1.00] ; ; BROADWELL-LABEL: test_fptan: ; BROADWELL: # %bb.0: @@ -2919,7 +2919,7 @@ ; HASWELL-NEXT: #APP ; HASWELL-NEXT: frndint # sched: [11:?] ; HASWELL-NEXT: #NO_APP -; HASWELL-NEXT: retl # sched: [5:0.50] +; HASWELL-NEXT: retl # sched: [7:1.00] ; ; BROADWELL-LABEL: test_frndint: ; BROADWELL: # %bb.0: @@ -2997,7 +2997,7 @@ ; HASWELL-NEXT: #APP ; HASWELL-NEXT: fscale # sched: [75:?] ; HASWELL-NEXT: #NO_APP -; HASWELL-NEXT: retl # sched: [5:0.50] +; HASWELL-NEXT: retl # sched: [7:1.00] ; ; BROADWELL-LABEL: test_fscale: ; BROADWELL: # %bb.0: @@ -3071,7 +3071,7 @@ ; HASWELL-NEXT: #APP ; HASWELL-NEXT: fsin # sched: [100:0.25] ; HASWELL-NEXT: #NO_APP -; HASWELL-NEXT: retl # sched: [5:0.50] +; HASWELL-NEXT: retl # sched: [7:1.00] ; ; BROADWELL-LABEL: test_fsin: ; BROADWELL: # %bb.0: @@ -3145,7 +3145,7 @@ ; HASWELL-NEXT: #APP ; HASWELL-NEXT: fsincos # sched: [100:0.25] ; HASWELL-NEXT: #NO_APP -; HASWELL-NEXT: retl # sched: [5:0.50] +; HASWELL-NEXT: retl # sched: [7:1.00] ; ; BROADWELL-LABEL: test_fsincos: ; BROADWELL: # %bb.0: @@ -3219,7 +3219,7 @@ ; HASWELL-NEXT: #APP ; HASWELL-NEXT: fsqrt # sched: [15:1.00] ; HASWELL-NEXT: #NO_APP -; HASWELL-NEXT: retl # sched: [5:0.50] +; HASWELL-NEXT: retl # sched: [7:1.00] ; ; BROADWELL-LABEL: test_fsqrt: ; BROADWELL: # %bb.0: @@ -3322,15 +3322,15 @@ ; ; HASWELL-LABEL: test_fsub: ; HASWELL: # %bb.0: -; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %eax # sched: [1:0.50] -; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %ecx # sched: [1:0.50] +; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %eax # sched: [5:0.50] +; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %ecx # sched: [5:0.50] ; HASWELL-NEXT: #APP ; HASWELL-NEXT: fsub %st(0), %st(1) # sched: [3:1.00] ; HASWELL-NEXT: fsub %st(2) # sched: [3:1.00] -; HASWELL-NEXT: fsubs (%ecx) # sched: [3:1.00] -; HASWELL-NEXT: fsubl (%eax) # sched: [3:1.00] +; HASWELL-NEXT: fsubs (%ecx) # sched: [10:1.00] +; HASWELL-NEXT: fsubl (%eax) # sched: [10:1.00] ; HASWELL-NEXT: #NO_APP -; HASWELL-NEXT: retl # sched: [5:0.50] +; HASWELL-NEXT: retl # sched: [7:1.00] ; ; BROADWELL-LABEL: test_fsub: ; BROADWELL: # %bb.0: @@ -3446,15 +3446,15 @@ ; ; HASWELL-LABEL: test_fsubp_fisub: ; HASWELL: # %bb.0: -; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %eax # sched: [1:0.50] -; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %ecx # sched: [1:0.50] +; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %eax # sched: [5:0.50] +; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %ecx # sched: [5:0.50] ; HASWELL-NEXT: #APP ; HASWELL-NEXT: fsubp %st(1) # sched: [3:1.00] ; HASWELL-NEXT: fsubp %st(2) # sched: [3:1.00] -; HASWELL-NEXT: fisubs (%ecx) # sched: [6:2.00] -; HASWELL-NEXT: fisubl (%eax) # sched: [6:2.00] +; HASWELL-NEXT: fisubs (%ecx) # sched: [13:2.00] +; HASWELL-NEXT: fisubl (%eax) # sched: [13:2.00] ; HASWELL-NEXT: #NO_APP -; HASWELL-NEXT: retl # sched: [5:0.50] +; HASWELL-NEXT: retl # sched: [7:1.00] ; ; BROADWELL-LABEL: test_fsubp_fisub: ; BROADWELL: # %bb.0: @@ -3570,15 +3570,15 @@ ; ; HASWELL-LABEL: test_fsubr: ; HASWELL: # %bb.0: -; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %eax # sched: [1:0.50] -; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %ecx # sched: [1:0.50] +; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %eax # sched: [5:0.50] +; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %ecx # sched: [5:0.50] ; HASWELL-NEXT: #APP ; HASWELL-NEXT: fsubr %st(0), %st(1) # sched: [3:1.00] ; HASWELL-NEXT: fsubr %st(2) # sched: [3:1.00] -; HASWELL-NEXT: fsubrs (%ecx) # sched: [3:1.00] -; HASWELL-NEXT: fsubrl (%eax) # sched: [3:1.00] +; HASWELL-NEXT: fsubrs (%ecx) # sched: [10:1.00] +; HASWELL-NEXT: fsubrl (%eax) # sched: [10:1.00] ; HASWELL-NEXT: #NO_APP -; HASWELL-NEXT: retl # sched: [5:0.50] +; HASWELL-NEXT: retl # sched: [7:1.00] ; ; BROADWELL-LABEL: test_fsubr: ; BROADWELL: # %bb.0: @@ -3694,15 +3694,15 @@ ; ; HASWELL-LABEL: test_fsubrp_fisubr: ; HASWELL: # %bb.0: -; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %eax # sched: [1:0.50] -; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %ecx # sched: [1:0.50] +; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %eax # sched: [5:0.50] +; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %ecx # sched: [5:0.50] ; HASWELL-NEXT: #APP ; HASWELL-NEXT: fsubrp %st(1) # sched: [3:1.00] ; HASWELL-NEXT: fsubrp %st(2) # sched: [3:1.00] -; HASWELL-NEXT: fisubrs (%ecx) # sched: [6:2.00] -; HASWELL-NEXT: fisubrl (%eax) # sched: [6:2.00] +; HASWELL-NEXT: fisubrs (%ecx) # sched: [13:2.00] +; HASWELL-NEXT: fisubrl (%eax) # sched: [13:2.00] ; HASWELL-NEXT: #NO_APP -; HASWELL-NEXT: retl # sched: [5:0.50] +; HASWELL-NEXT: retl # sched: [7:1.00] ; ; BROADWELL-LABEL: test_fsubrp_fisubr: ; BROADWELL: # %bb.0: @@ -3801,7 +3801,7 @@ ; HASWELL-NEXT: #APP ; HASWELL-NEXT: ftst # sched: [1:1.00] ; HASWELL-NEXT: #NO_APP -; HASWELL-NEXT: retl # sched: [5:0.50] +; HASWELL-NEXT: retl # sched: [7:1.00] ; ; BROADWELL-LABEL: test_ftst: ; BROADWELL: # %bb.0: @@ -3895,7 +3895,7 @@ ; HASWELL-NEXT: fucomp %st(3) # sched: [1:1.00] ; HASWELL-NEXT: fucompp # sched: [1:0.50] ; HASWELL-NEXT: #NO_APP -; HASWELL-NEXT: retl # sched: [5:0.50] +; HASWELL-NEXT: retl # sched: [7:1.00] ; ; BROADWELL-LABEL: test_fucom_fucomp_fucompp: ; BROADWELL: # %bb.0: @@ -3994,7 +3994,7 @@ ; HASWELL-NEXT: fucomi %st(3) # sched: [1:0.50] ; HASWELL-NEXT: fucompi %st(3) # sched: [1:0.50] ; HASWELL-NEXT: #NO_APP -; HASWELL-NEXT: retl # sched: [5:0.50] +; HASWELL-NEXT: retl # sched: [7:1.00] ; ; BROADWELL-LABEL: test_fucomi_fucomip: ; BROADWELL: # %bb.0: @@ -4073,7 +4073,7 @@ ; HASWELL-NEXT: #APP ; HASWELL-NEXT: wait # sched: [1:0.50] ; HASWELL-NEXT: #NO_APP -; HASWELL-NEXT: retl # sched: [5:0.50] +; HASWELL-NEXT: retl # sched: [7:1.00] ; ; BROADWELL-LABEL: test_fwait: ; BROADWELL: # %bb.0: @@ -4147,7 +4147,7 @@ ; HASWELL-NEXT: #APP ; HASWELL-NEXT: fxam # sched: [1:2.00] ; HASWELL-NEXT: #NO_APP -; HASWELL-NEXT: retl # sched: [5:0.50] +; HASWELL-NEXT: retl # sched: [7:1.00] ; ; BROADWELL-LABEL: test_fxam: ; BROADWELL: # %bb.0: @@ -4226,7 +4226,7 @@ ; HASWELL-NEXT: fxch %st(1) # sched: [17:4.00] ; HASWELL-NEXT: fxch %st(3) # sched: [17:4.00] ; HASWELL-NEXT: #NO_APP -; HASWELL-NEXT: retl # sched: [5:0.50] +; HASWELL-NEXT: retl # sched: [7:1.00] ; ; BROADWELL-LABEL: test_fxch: ; BROADWELL: # %bb.0: @@ -4310,12 +4310,12 @@ ; ; HASWELL-LABEL: test_fxrstor_fxsave: ; HASWELL: # %bb.0: -; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %eax # sched: [1:0.50] +; HASWELL-NEXT: movl {{[0-9]+}}(%esp), %eax # sched: [5:0.50] ; HASWELL-NEXT: #APP -; HASWELL-NEXT: fxrstor (%eax) # sched: [59:16.50] +; HASWELL-NEXT: fxrstor (%eax) # sched: [64:16.50] ; HASWELL-NEXT: fxsave (%eax) # sched: [100:0.25] ; HASWELL-NEXT: #NO_APP -; HASWELL-NEXT: retl # sched: [5:0.50] +; HASWELL-NEXT: retl # sched: [7:1.00] ; ; BROADWELL-LABEL: test_fxrstor_fxsave: ; BROADWELL: # %bb.0: @@ -4399,7 +4399,7 @@ ; HASWELL-NEXT: #APP ; HASWELL-NEXT: fxtract # sched: [15:?] ; HASWELL-NEXT: #NO_APP -; HASWELL-NEXT: retl # sched: [5:0.50] +; HASWELL-NEXT: retl # sched: [7:1.00] ; ; BROADWELL-LABEL: test_fxtract: ; BROADWELL: # %bb.0: @@ -4473,7 +4473,7 @@ ; HASWELL-NEXT: #APP ; HASWELL-NEXT: fyl2x # sched: [100:0.25] ; HASWELL-NEXT: #NO_APP -; HASWELL-NEXT: retl # sched: [5:0.50] +; HASWELL-NEXT: retl # sched: [7:1.00] ; ; BROADWELL-LABEL: test_fyl2x: ; BROADWELL: # %bb.0: @@ -4547,7 +4547,7 @@ ; HASWELL-NEXT: #APP ; HASWELL-NEXT: fyl2xp1 # sched: [100:0.25] ; HASWELL-NEXT: #NO_APP -; HASWELL-NEXT: retl # sched: [5:0.50] +; HASWELL-NEXT: retl # sched: [7:1.00] ; ; BROADWELL-LABEL: test_fyl2xp1: ; BROADWELL: # %bb.0: