//===- X86ScheduleAtom.td - X86 Atom Scheduling Definitions -*- tablegen -*-==// // // The LLVM Compiler Infrastructure // // This file is distributed under the University of Illinois Open Source // License. See LICENSE.TXT for details. // //===----------------------------------------------------------------------===// // // This file defines the schedule class data for the Intel Atom // in order (Saltwell-32nm/Bonnell-45nm) processors. // //===----------------------------------------------------------------------===// // // Scheduling information derived from the "Intel 64 and IA32 Architectures // Optimization Reference Manual", Chapter 13, Section 4. // Atom machine model. def AtomModel : SchedMachineModel { let IssueWidth = 2; // Allows 2 instructions per scheduling group. let MicroOpBufferSize = 0; // In-order execution, always hide latency. let LoadLatency = 3; // Expected cycles, may be overriden. let HighLatency = 30;// Expected, may be overriden. // On the Atom, the throughput for taken branches is 2 cycles. For small // simple loops, expand by a small factor to hide the backedge cost. let LoopMicroOpBufferSize = 10; let PostRAScheduler = 1; let CompleteModel = 0; } let SchedModel = AtomModel in { // Functional Units def AtomPort0 : ProcResource<1>; // ALU: ALU0, shift/rotate, load/store // SIMD/FP: SIMD ALU, Shuffle,SIMD/FP multiply, divide def AtomPort1 : ProcResource<1>; // ALU: ALU1, bit processing, jump, and LEA // SIMD/FP: SIMD ALU, FP Adder def AtomPort01 : ProcResGroup<[AtomPort0, AtomPort1]>; // Loads are 3 cycles, so ReadAfterLd registers needn't be available until 3 // cycles after the memory operand. def : ReadAdvance<ReadAfterLd, 3>; // Many SchedWrites are defined in pairs with and without a folded load. // Instructions with folded loads are usually micro-fused, so they only appear // as two micro-ops when dispatched by the schedulers. // This multiclass defines the resource usage for variants with and without // folded loads. multiclass AtomWriteResPair<X86FoldableSchedWrite SchedRW, list<ProcResourceKind> RRPorts, list<ProcResourceKind> RMPorts, int RRLat = 1, int RMLat = 1, list<int> RRRes = [1], list<int> RMRes = [1]> { // Register variant is using a single cycle on ExePort. def : WriteRes<SchedRW, RRPorts> { let Latency = RRLat; let ResourceCycles = RRRes; } // Memory variant also uses a cycle on JLAGU and adds 3 cycles to the // latency. def : WriteRes<SchedRW.Folded, RMPorts> { let Latency = RMLat; let ResourceCycles = RMRes; } } // A folded store needs a cycle on Port0 for the store data. def : WriteRes<WriteRMW, [AtomPort0]>; //////////////////////////////////////////////////////////////////////////////// // Arithmetic. //////////////////////////////////////////////////////////////////////////////// defm : AtomWriteResPair<WriteALU, [AtomPort01], [AtomPort0]>; defm : AtomWriteResPair<WriteADC, [AtomPort01], [AtomPort0]>; defm : AtomWriteResPair<WriteIMul, [AtomPort01], [AtomPort01], 7, 7, [7], [7]>; defm : AtomWriteResPair<WriteIMul64, [AtomPort01], [AtomPort01], 12, 12, [12], [12]>; defm : X86WriteRes<WriteBSWAP32, [AtomPort0], 1, [1], 1>; defm : X86WriteRes<WriteBSWAP64, [AtomPort0], 1, [1], 1>; defm : AtomWriteResPair<WriteDiv8, [AtomPort01], [AtomPort01], 50, 68, [50], [68]>; defm : AtomWriteResPair<WriteDiv16, [AtomPort01], [AtomPort01], 50, 50, [50], [50]>; defm : AtomWriteResPair<WriteDiv32, [AtomPort01], [AtomPort01], 50, 50, [50], [50]>; defm : AtomWriteResPair<WriteDiv64, [AtomPort01], [AtomPort01],130,130,[130],[130]>; defm : AtomWriteResPair<WriteIDiv8, [AtomPort01], [AtomPort01], 62, 62, [62], [62]>; defm : AtomWriteResPair<WriteIDiv16, [AtomPort01], [AtomPort01], 62, 62, [62], [62]>; defm : AtomWriteResPair<WriteIDiv32, [AtomPort01], [AtomPort01], 62, 62, [62], [62]>; defm : AtomWriteResPair<WriteIDiv64, [AtomPort01], [AtomPort01],130,130,[130],[130]>; defm : X86WriteResPairUnsupported<WriteCRC32>; defm : AtomWriteResPair<WriteCMOV, [AtomPort01], [AtomPort0]>; defm : AtomWriteResPair<WriteCMOV2, [AtomPort01], [AtomPort0]>; defm : X86WriteRes<WriteFCMOV, [AtomPort01], 9, [9], 1>; // x87 conditional move. def : WriteRes<WriteSETCC, [AtomPort01]>; def : WriteRes<WriteSETCCStore, [AtomPort01]> { let Latency = 2; let ResourceCycles = [2]; } def : WriteRes<WriteLAHFSAHF, [AtomPort01]> { let Latency = 2; let ResourceCycles = [2]; } def : WriteRes<WriteBitTest,[AtomPort01]>; defm : X86WriteResUnsupported<WriteIMulH>; // This is for simple LEAs with one or two input operands. def : WriteRes<WriteLEA, [AtomPort1]>; def AtomWriteIMul16Ld : SchedWriteRes<[AtomPort01]> { let Latency = 8; let ResourceCycles = [8]; } def : InstRW<[AtomWriteIMul16Ld], (instrs MUL16m, IMUL16m)>; def AtomWriteIMul32 : SchedWriteRes<[AtomPort01]> { let Latency = 6; let ResourceCycles = [6]; } def : InstRW<[AtomWriteIMul32], (instrs MUL32r, IMUL32r)>; def AtomWriteIMul64I : SchedWriteRes<[AtomPort01]> { let Latency = 14; let ResourceCycles = [14]; } def : InstRW<[AtomWriteIMul64I], (instrs IMUL64rri8, IMUL64rri32, IMUL64rmi8, IMUL64rmi32)>; // Bit counts. defm : AtomWriteResPair<WriteBSF, [AtomPort01], [AtomPort01], 16, 16, [16], [16]>; defm : AtomWriteResPair<WriteBSR, [AtomPort01], [AtomPort01], 16, 16, [16], [16]>; defm : X86WriteResPairUnsupported<WritePOPCNT>; defm : X86WriteResPairUnsupported<WriteLZCNT>; defm : X86WriteResPairUnsupported<WriteTZCNT>; // BMI1 BEXTR, BMI2 BZHI defm : X86WriteResPairUnsupported<WriteBEXTR>; defm : X86WriteResPairUnsupported<WriteBZHI>; //////////////////////////////////////////////////////////////////////////////// // Integer shifts and rotates. //////////////////////////////////////////////////////////////////////////////// defm : AtomWriteResPair<WriteShift, [AtomPort0], [AtomPort0]>; defm : X86WriteRes<WriteSHDrri, [AtomPort01], 2, [2], 1>; defm : X86WriteRes<WriteSHDrrcl,[AtomPort01], 2, [2], 1>; defm : X86WriteRes<WriteSHDmri, [AtomPort01], 4, [4], 1>; defm : X86WriteRes<WriteSHDmrcl,[AtomPort01], 4, [4], 1>; //////////////////////////////////////////////////////////////////////////////// // Loads, stores, and moves, not folded with other operations. //////////////////////////////////////////////////////////////////////////////// def : WriteRes<WriteLoad, [AtomPort0]>; def : WriteRes<WriteStore, [AtomPort0]>; def : WriteRes<WriteStoreNT, [AtomPort0]>; def : WriteRes<WriteMove, [AtomPort01]>; // Treat misc copies as a move. def : InstRW<[WriteMove], (instrs COPY)>; //////////////////////////////////////////////////////////////////////////////// // Idioms that clear a register, like xorps %xmm0, %xmm0. // These can often bypass execution ports completely. //////////////////////////////////////////////////////////////////////////////// def : WriteRes<WriteZero, []>; //////////////////////////////////////////////////////////////////////////////// // Branches don't produce values, so they have no latency, but they still // consume resources. Indirect branches can fold loads. //////////////////////////////////////////////////////////////////////////////// defm : AtomWriteResPair<WriteJump, [AtomPort1], [AtomPort1]>; //////////////////////////////////////////////////////////////////////////////// // Special case scheduling classes. //////////////////////////////////////////////////////////////////////////////// def : WriteRes<WriteSystem, [AtomPort01]> { let Latency = 100; } def : WriteRes<WriteMicrocoded, [AtomPort01]> { let Latency = 100; } def : WriteRes<WriteFence, [AtomPort0]>; // Nops don't have dependencies, so there's no actual latency, but we set this // to '1' to tell the scheduler that the nop uses an ALU slot for a cycle. def : WriteRes<WriteNop, [AtomPort01]>; //////////////////////////////////////////////////////////////////////////////// // Floating point. This covers both scalar and vector operations. //////////////////////////////////////////////////////////////////////////////// defm : X86WriteRes<WriteFLD0, [AtomPort01], 1, [1], 1>; defm : X86WriteRes<WriteFLD1, [AtomPort01], 6, [6], 1>; def : WriteRes<WriteFLoad, [AtomPort0]>; def : WriteRes<WriteFLoadX, [AtomPort0]>; defm : X86WriteResUnsupported<WriteFLoadY>; defm : X86WriteResUnsupported<WriteFMaskedLoad>; defm : X86WriteResUnsupported<WriteFMaskedLoadY>; def : WriteRes<WriteFStore, [AtomPort0]>; def : WriteRes<WriteFStoreX, [AtomPort0]>; defm : X86WriteResUnsupported<WriteFStoreY>; def : WriteRes<WriteFStoreNT, [AtomPort0]>; def : WriteRes<WriteFStoreNTX, [AtomPort0]>; defm : X86WriteResUnsupported<WriteFStoreNTY>; defm : X86WriteResUnsupported<WriteFMaskedStore>; defm : X86WriteResUnsupported<WriteFMaskedStoreY>; def : WriteRes<WriteFMove, [AtomPort01]>; def : WriteRes<WriteFMoveX, [AtomPort01]>; defm : X86WriteResUnsupported<WriteFMoveY>; defm : X86WriteRes<WriteEMMS, [AtomPort01], 5, [5], 1>; defm : AtomWriteResPair<WriteFAdd, [AtomPort0], [AtomPort0], 5, 5, [5], [5]>; defm : AtomWriteResPair<WriteFAddX, [AtomPort0], [AtomPort0], 5, 5, [5], [5]>; defm : X86WriteResPairUnsupported<WriteFAddY>; defm : X86WriteResPairUnsupported<WriteFAddZ>; defm : AtomWriteResPair<WriteFAdd64, [AtomPort0], [AtomPort0], 5, 5, [5], [5]>; defm : AtomWriteResPair<WriteFAdd64X, [AtomPort01], [AtomPort01], 6, 7, [6], [7]>; defm : X86WriteResPairUnsupported<WriteFAdd64Y>; defm : X86WriteResPairUnsupported<WriteFAdd64Z>; defm : AtomWriteResPair<WriteFCmp, [AtomPort0], [AtomPort0], 5, 5, [5], [5]>; defm : AtomWriteResPair<WriteFCmpX, [AtomPort0], [AtomPort0], 5, 5, [5], [5]>; defm : X86WriteResPairUnsupported<WriteFCmpY>; defm : X86WriteResPairUnsupported<WriteFCmpZ>; defm : AtomWriteResPair<WriteFCmp64, [AtomPort0], [AtomPort0], 5, 5, [5], [5]>; defm : AtomWriteResPair<WriteFCmp64X, [AtomPort01], [AtomPort01], 6, 7, [6], [7]>; defm : X86WriteResPairUnsupported<WriteFCmp64Y>; defm : X86WriteResPairUnsupported<WriteFCmp64Z>; defm : AtomWriteResPair<WriteFCom, [AtomPort0], [AtomPort0], 5, 5, [5], [5]>; defm : AtomWriteResPair<WriteFMul, [AtomPort0], [AtomPort0], 4, 4, [4], [4]>; defm : AtomWriteResPair<WriteFMulX, [AtomPort0], [AtomPort0], 5, 5, [5], [5]>; defm : X86WriteResPairUnsupported<WriteFMulY>; defm : X86WriteResPairUnsupported<WriteFMulZ>; defm : AtomWriteResPair<WriteFMul64, [AtomPort0], [AtomPort0], 5, 5, [5], [5]>; defm : AtomWriteResPair<WriteFMul64X, [AtomPort01], [AtomPort01], 9, 10, [9], [10]>; defm : X86WriteResPairUnsupported<WriteFMul64Y>; defm : X86WriteResPairUnsupported<WriteFMul64Z>; defm : AtomWriteResPair<WriteFRcp, [AtomPort0], [AtomPort0], 4, 4, [4], [4]>; defm : AtomWriteResPair<WriteFRcpX, [AtomPort01], [AtomPort01], 9, 10, [9], [10]>; defm : X86WriteResPairUnsupported<WriteFRcpY>; defm : X86WriteResPairUnsupported<WriteFRcpZ>; defm : AtomWriteResPair<WriteFRsqrt, [AtomPort0], [AtomPort0], 4, 4, [4], [4]>; defm : AtomWriteResPair<WriteFRsqrtX, [AtomPort01], [AtomPort01], 9, 10, [9], [10]>; defm : X86WriteResPairUnsupported<WriteFRsqrtY>; defm : X86WriteResPairUnsupported<WriteFRsqrtZ>; defm : AtomWriteResPair<WriteFDiv, [AtomPort01], [AtomPort01], 34, 34, [34], [34]>; defm : AtomWriteResPair<WriteFDivX, [AtomPort01], [AtomPort01], 70, 70, [70], [70]>; defm : X86WriteResPairUnsupported<WriteFDivY>; defm : X86WriteResPairUnsupported<WriteFDivZ>; defm : AtomWriteResPair<WriteFDiv64, [AtomPort01], [AtomPort01], 62, 62, [62], [62]>; defm : AtomWriteResPair<WriteFDiv64X, [AtomPort01], [AtomPort01],125,125,[125],[125]>; defm : X86WriteResPairUnsupported<WriteFDiv64Y>; defm : X86WriteResPairUnsupported<WriteFDiv64Z>; defm : AtomWriteResPair<WriteFSqrt, [AtomPort01], [AtomPort01], 34, 34, [34], [34]>; defm : AtomWriteResPair<WriteFSqrtX, [AtomPort01], [AtomPort01], 70, 70, [70], [70]>; defm : X86WriteResPairUnsupported<WriteFSqrtY>; defm : X86WriteResPairUnsupported<WriteFSqrtZ>; defm : AtomWriteResPair<WriteFSqrt64, [AtomPort01], [AtomPort01], 62, 62, [62], [62]>; defm : AtomWriteResPair<WriteFSqrt64X, [AtomPort01], [AtomPort01],125,125,[125],[125]>; defm : X86WriteResPairUnsupported<WriteFSqrt64Y>; defm : X86WriteResPairUnsupported<WriteFSqrt64Z>; defm : AtomWriteResPair<WriteFSqrt80, [AtomPort01], [AtomPort01], 71, 71, [71], [71]>; defm : AtomWriteResPair<WriteFSign, [AtomPort1], [AtomPort1]>; defm : AtomWriteResPair<WriteFRnd, [AtomPort0], [AtomPort0], 5, 5, [5], [5]>; defm : X86WriteResPairUnsupported<WriteFRndY>; defm : X86WriteResPairUnsupported<WriteFRndZ>; defm : AtomWriteResPair<WriteFLogic, [AtomPort01], [AtomPort0]>; defm : X86WriteResPairUnsupported<WriteFLogicY>; defm : X86WriteResPairUnsupported<WriteFLogicZ>; defm : AtomWriteResPair<WriteFTest, [AtomPort01], [AtomPort0]>; defm : X86WriteResPairUnsupported<WriteFTestY>; defm : X86WriteResPairUnsupported<WriteFTestZ>; defm : AtomWriteResPair<WriteFShuffle, [AtomPort0], [AtomPort0]>; defm : X86WriteResPairUnsupported<WriteFShuffleY>; defm : X86WriteResPairUnsupported<WriteFShuffleZ>; defm : X86WriteResPairUnsupported<WriteFVarShuffle>; defm : X86WriteResPairUnsupported<WriteFVarShuffleY>; defm : X86WriteResPairUnsupported<WriteFVarShuffleZ>; defm : X86WriteResPairUnsupported<WriteFMA>; defm : X86WriteResPairUnsupported<WriteFMAX>; defm : X86WriteResPairUnsupported<WriteFMAY>; defm : X86WriteResPairUnsupported<WriteFMAZ>; defm : X86WriteResPairUnsupported<WriteDPPD>; defm : X86WriteResPairUnsupported<WriteDPPS>; defm : X86WriteResPairUnsupported<WriteDPPSY>; defm : X86WriteResPairUnsupported<WriteDPPSZ>; defm : X86WriteResPairUnsupported<WriteFBlend>; defm : X86WriteResPairUnsupported<WriteFBlendY>; defm : X86WriteResPairUnsupported<WriteFBlendZ>; defm : X86WriteResPairUnsupported<WriteFVarBlend>; defm : X86WriteResPairUnsupported<WriteFVarBlendY>; defm : X86WriteResPairUnsupported<WriteFVarBlendZ>; defm : X86WriteResPairUnsupported<WriteFShuffle256>; defm : X86WriteResPairUnsupported<WriteFVarShuffle256>; //////////////////////////////////////////////////////////////////////////////// // Conversions. //////////////////////////////////////////////////////////////////////////////// defm : AtomWriteResPair<WriteCvtSS2I, [AtomPort01], [AtomPort01], 8, 9, [8], [9]>; defm : AtomWriteResPair<WriteCvtPS2I, [AtomPort01], [AtomPort01], 6, 7, [6], [7]>; defm : X86WriteResPairUnsupported<WriteCvtPS2IY>; defm : X86WriteResPairUnsupported<WriteCvtPS2IZ>; defm : AtomWriteResPair<WriteCvtSD2I, [AtomPort01], [AtomPort01], 8, 9, [8], [9]>; defm : AtomWriteResPair<WriteCvtPD2I, [AtomPort01], [AtomPort01], 7, 8, [7], [8]>; defm : X86WriteResPairUnsupported<WriteCvtPD2IY>; defm : X86WriteResPairUnsupported<WriteCvtPD2IZ>; defm : AtomWriteResPair<WriteCvtI2SS, [AtomPort01], [AtomPort01], 6, 7, [6], [7]>; defm : AtomWriteResPair<WriteCvtI2PS, [AtomPort01], [AtomPort01], 6, 7, [6], [7]>; defm : X86WriteResPairUnsupported<WriteCvtI2PSY>; defm : X86WriteResPairUnsupported<WriteCvtI2PSZ>; defm : AtomWriteResPair<WriteCvtI2SD, [AtomPort01], [AtomPort01], 6, 7, [6], [7]>; defm : AtomWriteResPair<WriteCvtI2PD, [AtomPort01], [AtomPort01], 7, 8, [7], [8]>; defm : X86WriteResPairUnsupported<WriteCvtI2PDY>; defm : X86WriteResPairUnsupported<WriteCvtI2PDZ>; defm : AtomWriteResPair<WriteCvtSS2SD, [AtomPort01], [AtomPort01], 6, 7, [6], [7]>; defm : AtomWriteResPair<WriteCvtPS2PD, [AtomPort01], [AtomPort01], 7, 8, [7], [8]>; defm : X86WriteResPairUnsupported<WriteCvtPS2PDY>; defm : X86WriteResPairUnsupported<WriteCvtPS2PDZ>; defm : AtomWriteResPair<WriteCvtSD2SS, [AtomPort01], [AtomPort01], 6, 7, [6], [7]>; defm : AtomWriteResPair<WriteCvtPD2PS, [AtomPort01], [AtomPort01], 7, 8, [7], [8]>; defm : X86WriteResPairUnsupported<WriteCvtPD2PSY>; defm : X86WriteResPairUnsupported<WriteCvtPD2PSZ>; defm : X86WriteResPairUnsupported<WriteCvtPH2PS>; defm : X86WriteResPairUnsupported<WriteCvtPH2PSY>; defm : X86WriteResPairUnsupported<WriteCvtPH2PSZ>; defm : X86WriteResUnsupported<WriteCvtPS2PH>; defm : X86WriteResUnsupported<WriteCvtPS2PHSt>; defm : X86WriteResUnsupported<WriteCvtPS2PHY>; defm : X86WriteResUnsupported<WriteCvtPS2PHZ>; defm : X86WriteResUnsupported<WriteCvtPS2PHYSt>; defm : X86WriteResUnsupported<WriteCvtPS2PHZSt>; //////////////////////////////////////////////////////////////////////////////// // Vector integer operations. //////////////////////////////////////////////////////////////////////////////// def : WriteRes<WriteVecLoad, [AtomPort0]>; def : WriteRes<WriteVecLoadX, [AtomPort0]>; defm : X86WriteResUnsupported<WriteVecLoadY>; def : WriteRes<WriteVecLoadNT, [AtomPort0]>; defm : X86WriteResUnsupported<WriteVecLoadNTY>; defm : X86WriteResUnsupported<WriteVecMaskedLoad>; defm : X86WriteResUnsupported<WriteVecMaskedLoadY>; def : WriteRes<WriteVecStore, [AtomPort0]>; def : WriteRes<WriteVecStoreX, [AtomPort0]>; defm : X86WriteResUnsupported<WriteVecStoreY>; def : WriteRes<WriteVecStoreNT, [AtomPort0]>; defm : X86WriteResUnsupported<WriteVecStoreNTY>; def : WriteRes<WriteVecMaskedStore, [AtomPort0]>; defm : X86WriteResUnsupported<WriteVecMaskedStoreY>; def : WriteRes<WriteVecMove, [AtomPort0]>; def : WriteRes<WriteVecMoveX, [AtomPort01]>; defm : X86WriteResUnsupported<WriteVecMoveY>; defm : X86WriteRes<WriteVecMoveToGpr, [AtomPort0], 3, [3], 1>; defm : X86WriteRes<WriteVecMoveFromGpr, [AtomPort0], 1, [1], 1>; defm : AtomWriteResPair<WriteVecALU, [AtomPort01], [AtomPort0], 1, 1>; defm : AtomWriteResPair<WriteVecALUX, [AtomPort01], [AtomPort0], 1, 1>; defm : X86WriteResPairUnsupported<WriteVecALUY>; defm : X86WriteResPairUnsupported<WriteVecALUZ>; defm : AtomWriteResPair<WriteVecLogic, [AtomPort01], [AtomPort0], 1, 1>; defm : AtomWriteResPair<WriteVecLogicX, [AtomPort01], [AtomPort0], 1, 1>; defm : X86WriteResPairUnsupported<WriteVecLogicY>; defm : X86WriteResPairUnsupported<WriteVecLogicZ>; defm : AtomWriteResPair<WriteVecTest, [AtomPort01], [AtomPort0], 1, 1>; defm : X86WriteResPairUnsupported<WriteVecTestY>; defm : X86WriteResPairUnsupported<WriteVecTestZ>; defm : AtomWriteResPair<WriteVecShift, [AtomPort01], [AtomPort01], 2, 3, [2], [3]>; defm : AtomWriteResPair<WriteVecShiftX, [AtomPort01], [AtomPort01], 2, 3, [2], [3]>; defm : X86WriteResPairUnsupported<WriteVecShiftY>; defm : X86WriteResPairUnsupported<WriteVecShiftZ>; defm : AtomWriteResPair<WriteVecShiftImm, [AtomPort01], [AtomPort01], 1, 1, [1], [1]>; defm : AtomWriteResPair<WriteVecShiftImmX, [AtomPort01], [AtomPort01], 1, 1, [1], [1]>; defm : X86WriteResPairUnsupported<WriteVecShiftImmY>; defm : X86WriteResPairUnsupported<WriteVecShiftImmZ>; defm : AtomWriteResPair<WriteVecIMul, [AtomPort0], [AtomPort0], 4, 4, [4], [4]>; defm : AtomWriteResPair<WriteVecIMulX, [AtomPort0], [AtomPort0], 5, 5, [5], [5]>; defm : X86WriteResPairUnsupported<WriteVecIMulY>; defm : X86WriteResPairUnsupported<WriteVecIMulZ>; defm : X86WriteResPairUnsupported<WritePMULLD>; defm : X86WriteResPairUnsupported<WritePMULLDY>; defm : X86WriteResPairUnsupported<WritePMULLDZ>; defm : X86WriteResPairUnsupported<WritePHMINPOS>; defm : X86WriteResPairUnsupported<WriteMPSAD>; defm : X86WriteResPairUnsupported<WriteMPSADY>; defm : X86WriteResPairUnsupported<WriteMPSADZ>; defm : AtomWriteResPair<WritePSADBW, [AtomPort01], [AtomPort01], 4, 4, [4], [4]>; defm : AtomWriteResPair<WritePSADBWX, [AtomPort0], [AtomPort0], 5, 5, [5], [5]>; defm : X86WriteResPairUnsupported<WritePSADBWY>; defm : X86WriteResPairUnsupported<WritePSADBWZ>; defm : AtomWriteResPair<WriteShuffle, [AtomPort0], [AtomPort0], 1, 1>; defm : AtomWriteResPair<WriteShuffleX, [AtomPort0], [AtomPort0], 1, 1>; defm : X86WriteResPairUnsupported<WriteShuffleY>; defm : X86WriteResPairUnsupported<WriteShuffleZ>; defm : AtomWriteResPair<WriteVarShuffle, [AtomPort0], [AtomPort0], 1, 1>; defm : AtomWriteResPair<WriteVarShuffleX, [AtomPort01], [AtomPort01], 4, 5, [4], [5]>; defm : X86WriteResPairUnsupported<WriteVarShuffleY>; defm : X86WriteResPairUnsupported<WriteVarShuffleZ>; defm : X86WriteResPairUnsupported<WriteBlend>; defm : X86WriteResPairUnsupported<WriteBlendY>; defm : X86WriteResPairUnsupported<WriteBlendZ>; defm : X86WriteResPairUnsupported<WriteVarBlend>; defm : X86WriteResPairUnsupported<WriteVarBlendY>; defm : X86WriteResPairUnsupported<WriteVarBlendZ>; defm : X86WriteResPairUnsupported<WriteShuffle256>; defm : X86WriteResPairUnsupported<WriteVarShuffle256>; defm : X86WriteResPairUnsupported<WriteVarVecShift>; defm : X86WriteResPairUnsupported<WriteVarVecShiftY>; defm : X86WriteResPairUnsupported<WriteVarVecShiftZ>; //////////////////////////////////////////////////////////////////////////////// // Vector insert/extract operations. //////////////////////////////////////////////////////////////////////////////// defm : AtomWriteResPair<WriteVecInsert, [AtomPort0], [AtomPort0], 1, 1>; def : WriteRes<WriteVecExtract, [AtomPort0]>; def : WriteRes<WriteVecExtractSt, [AtomPort0]>; //////////////////////////////////////////////////////////////////////////////// // SSE42 String instructions. //////////////////////////////////////////////////////////////////////////////// defm : X86WriteResPairUnsupported<WritePCmpIStrI>; defm : X86WriteResPairUnsupported<WritePCmpIStrM>; defm : X86WriteResPairUnsupported<WritePCmpEStrI>; defm : X86WriteResPairUnsupported<WritePCmpEStrM>; //////////////////////////////////////////////////////////////////////////////// // MOVMSK Instructions. //////////////////////////////////////////////////////////////////////////////// def : WriteRes<WriteFMOVMSK, [AtomPort0]> { let Latency = 3; let ResourceCycles = [3]; } def : WriteRes<WriteVecMOVMSK, [AtomPort0]> { let Latency = 3; let ResourceCycles = [3]; } defm : X86WriteResUnsupported<WriteVecMOVMSKY>; def : WriteRes<WriteMMXMOVMSK, [AtomPort0]> { let Latency = 3; let ResourceCycles = [3]; } //////////////////////////////////////////////////////////////////////////////// // AES instructions. //////////////////////////////////////////////////////////////////////////////// defm : X86WriteResPairUnsupported<WriteAESIMC>; defm : X86WriteResPairUnsupported<WriteAESKeyGen>; defm : X86WriteResPairUnsupported<WriteAESDecEnc>; //////////////////////////////////////////////////////////////////////////////// // Horizontal add/sub instructions. //////////////////////////////////////////////////////////////////////////////// defm : AtomWriteResPair<WriteFHAdd, [AtomPort01], [AtomPort01], 8, 9, [8], [9]>; defm : AtomWriteResPair<WriteFHAddY, [AtomPort01], [AtomPort01], 8, 9, [8], [9]>; defm : AtomWriteResPair<WritePHAdd, [AtomPort01], [AtomPort01], 3, 4, [3], [4]>; defm : AtomWriteResPair<WritePHAddX, [AtomPort01], [AtomPort01], 7, 8, [7], [8]>; defm : AtomWriteResPair<WritePHAddY, [AtomPort01], [AtomPort01], 7, 8, [7], [8]>; //////////////////////////////////////////////////////////////////////////////// // Carry-less multiplication instructions. //////////////////////////////////////////////////////////////////////////////// defm : X86WriteResPairUnsupported<WriteCLMul>; //////////////////////////////////////////////////////////////////////////////// // Load/store MXCSR. //////////////////////////////////////////////////////////////////////////////// def : WriteRes<WriteLDMXCSR, [AtomPort01]> { let Latency = 5; let ResourceCycles = [5]; } def : WriteRes<WriteSTMXCSR, [AtomPort01]> { let Latency = 15; let ResourceCycles = [15]; } //////////////////////////////////////////////////////////////////////////////// // Special Cases. //////////////////////////////////////////////////////////////////////////////// // Port0 def AtomWrite0_1 : SchedWriteRes<[AtomPort0]> { let Latency = 1; let ResourceCycles = [1]; } def : InstRW<[AtomWrite0_1], (instrs FXAM, LD_Frr, MOVSX64rr32)>; def : SchedAlias<WriteALURMW, AtomWrite0_1>; def : SchedAlias<WriteADCRMW, AtomWrite0_1>; def : InstRW<[AtomWrite0_1], (instregex "(RCL|RCR|ROL|ROR|SAR|SHL|SHR)(8|16|32|64)m", "MOV(S|Z)X(32|64)rr(8|8_NOREX|16)")>; def AtomWrite0_5 : SchedWriteRes<[AtomPort0]> { let Latency = 5; let ResourceCycles = [5]; } def : InstRW<[AtomWrite0_5], (instregex "IMUL32(rm|rr)")>; // Port1 def AtomWrite1_1 : SchedWriteRes<[AtomPort1]> { let Latency = 1; let ResourceCycles = [1]; } def : InstRW<[AtomWrite1_1], (instrs FCOMPP)>; def : InstRW<[AtomWrite1_1], (instregex "UCOM_F(P|PP)?r", "BT(C|R|S)?(16|32|64)(rr|ri8)")>; def AtomWrite1_5 : SchedWriteRes<[AtomPort1]> { let Latency = 5; let ResourceCycles = [5]; } def : InstRW<[AtomWrite1_5], (instrs MMX_CVTPI2PSirr, MMX_CVTPI2PSirm, MMX_CVTPS2PIirr, MMX_CVTTPS2PIirr)>; // Port0 and Port1 def AtomWrite0_1_1 : SchedWriteRes<[AtomPort0, AtomPort1]> { let Latency = 1; let ResourceCycles = [1, 1]; } def : InstRW<[AtomWrite0_1_1], (instrs POP32r, POP64r, POP16rmr, POP32rmr, POP64rmr, PUSH16r, PUSH32r, PUSH64r, PUSHi16, PUSHi32, PUSH16rmr, PUSH32rmr, PUSH64rmr, PUSH16i8, PUSH32i8, PUSH64i8, PUSH64i32, XCH_F)>; def : InstRW<[AtomWrite0_1_1], (instregex "RETI(L|Q|W)$", "IRET(16|32|64)?")>; def AtomWrite0_1_5 : SchedWriteRes<[AtomPort0, AtomPort1]> { let Latency = 5; let ResourceCycles = [5, 5]; } def : InstRW<[AtomWrite0_1_5], (instrs MMX_CVTPS2PIirm, MMX_CVTTPS2PIirm)>; def : InstRW<[AtomWrite0_1_5], (instregex "ILD_F(16|32|64)")>; // Port0 or Port1 def AtomWrite01_1 : SchedWriteRes<[AtomPort01]> { let Latency = 1; let ResourceCycles = [1]; } def : InstRW<[AtomWrite01_1], (instrs FDECSTP, FFREE, FFREEP, FINCSTP, WAIT, LFENCE, STOSB, STOSL, STOSQ, STOSW, MOVSSrr, MOVSSrr_REV, PSLLDQri, PSRLDQri)>; def : InstRW<[AtomWrite01_1], (instregex "MMX_PACK(SSDW|SSWB|USWB)irr", "MMX_PUNPCKH(BW|DQ|WD)irr")>; def AtomWrite01_2 : SchedWriteRes<[AtomPort01]> { let Latency = 2; let ResourceCycles = [2]; } def : InstRW<[AtomWrite01_2], (instrs LEAVE, LEAVE64, POP16r, PUSH16rmm, PUSH32rmm, PUSH64rmm, LODSB, LODSL, LODSQ, LODSW, SCASB, SCASL, SCASQ, SCASW)>; def : InstRW<[AtomWrite01_2], (instregex "BT(C|R|S)(16|32|64)mi8", "PUSH(CS|DS|ES|FS|GS|SS)(16|32|64)", "XADD(8|16|32|64)rr", "XCHG(8|16|32|64)(ar|rr)", "(ST|ISTT)_F(P)?(16|32|64)?(m|rr)", "MMX_P(ADD|SUB)Qirr", "MOV(S|Z)X16rr8", "MOV(UPS|UPD|DQU)mr", "MASKMOVDQU(64)?", "P(ADD|SUB)Qrr")>; def AtomWrite01_3 : SchedWriteRes<[AtomPort01]> { let Latency = 3; let ResourceCycles = [3]; } def : InstRW<[AtomWrite01_3], (instrs CLD, LDDQUrm, CMPSB, CMPSL, CMPSQ, CMPSW, MOVSB, MOVSL, MOVSQ, MOVSW, POP16rmm, POP32rmm, POP64rmm)>; def : InstRW<[AtomWrite01_3], (instregex "XADD(8|16|32|64)rm", "XCHG(8|16|32|64)rm", "PH(ADD|SUB)Drr", "MOV(S|Z)X16rm8", "MMX_P(ADD|SUB)Qirm", "MOV(UPS|UPD|DQU)rm", "P(ADD|SUB)Qrm")>; def AtomWrite01_4 : SchedWriteRes<[AtomPort01]> { let Latency = 4; let ResourceCycles = [4]; } def : InstRW<[AtomWrite01_4], (instrs CBW, CWD, CWDE, CDQ, CDQE, CQO, JCXZ, JECXZ, JRCXZ, LD_F80m)>; def : InstRW<[AtomWrite01_4], (instregex "PH(ADD|SUB)Drm", "(MMX_)?PEXTRWrr(_REV)?")>; def AtomWrite01_5 : SchedWriteRes<[AtomPort01]> { let Latency = 5; let ResourceCycles = [5]; } def : InstRW<[AtomWrite01_5], (instrs FLDCW16m, ST_FP80m)>; def : InstRW<[AtomWrite01_5], (instregex "MMX_PH(ADD|SUB)S?Wrr")>; def AtomWrite01_6 : SchedWriteRes<[AtomPort01]> { let Latency = 6; let ResourceCycles = [6]; } def : InstRW<[AtomWrite01_6], (instrs CMPXCHG8rm, INTO, XLAT, SHLD16rrCL, SHRD16rrCL, SHLD16rri8, SHRD16rri8, SHLD16mrCL, SHRD16mrCL, SHLD16mri8, SHRD16mri8)>; def : InstRW<[AtomWrite01_6], (instregex "IMUL16rr", "IST_F(P)?(16|32|64)?m", "MMX_PH(ADD|SUB)S?Wrm")>; def AtomWrite01_7 : SchedWriteRes<[AtomPort01]> { let Latency = 7; let ResourceCycles = [7]; } def : InstRW<[AtomWrite01_7], (instrs AAD8i8)>; def AtomWrite01_8 : SchedWriteRes<[AtomPort01]> { let Latency = 8; let ResourceCycles = [8]; } def : InstRW<[AtomWrite01_8], (instrs LOOPE, PUSHA16, PUSHA32, SHLD64rrCL, SHRD64rrCL, FNSTCW16m)>; def AtomWrite01_9 : SchedWriteRes<[AtomPort01]> { let Latency = 9; let ResourceCycles = [9]; } def : InstRW<[AtomWrite01_9], (instrs BT16mr, BT32mr, BT64mr, POPA16, POPA32, PUSHF16, PUSHF32, PUSHF64, SHLD64mrCL, SHRD64mrCL, SHLD64mri8, SHRD64mri8, SHLD64rri8, SHRD64rri8, CMPXCHG8rr)>; def : InstRW<[AtomWrite01_9], (instregex "(U)?COM_FI", "TST_F", "(U)?COMIS(D|S)rr", "CVT(T)?SS2SI64rr(_Int)?")>; def AtomWrite01_10 : SchedWriteRes<[AtomPort01]> { let Latency = 10; let ResourceCycles = [10]; } def : SchedAlias<WriteFLDC, AtomWrite01_10>; def : InstRW<[AtomWrite01_10], (instregex "(U)?COMIS(D|S)rm", "CVT(T)?SS2SI64rm(_Int)?")>; def AtomWrite01_11 : SchedWriteRes<[AtomPort01]> { let Latency = 11; let ResourceCycles = [11]; } def : InstRW<[AtomWrite01_11], (instrs BOUNDS16rm, BOUNDS32rm)>; def : InstRW<[AtomWrite01_11], (instregex "BT(C|R|S)(16|32|64)mr")>; def AtomWrite01_13 : SchedWriteRes<[AtomPort01]> { let Latency = 13; let ResourceCycles = [13]; } def : InstRW<[AtomWrite01_13], (instrs AAA, AAS)>; def AtomWrite01_14 : SchedWriteRes<[AtomPort01]> { let Latency = 14; let ResourceCycles = [14]; } def : InstRW<[AtomWrite01_14], (instrs CMPXCHG16rm, CMPXCHG32rm, CMPXCHG64rm)>; def AtomWrite01_15 : SchedWriteRes<[AtomPort01]> { let Latency = 15; let ResourceCycles = [15]; } def : InstRW<[AtomWrite01_15], (instrs CMPXCHG16rr, CMPXCHG32rr, CMPXCHG64rr)>; def AtomWrite01_17 : SchedWriteRes<[AtomPort01]> { let Latency = 17; let ResourceCycles = [17]; } def : InstRW<[AtomWrite01_17], (instrs LOOPNE, PAUSE)>; def AtomWrite01_18 : SchedWriteRes<[AtomPort01]> { let Latency = 18; let ResourceCycles = [18]; } def : InstRW<[AtomWrite01_18], (instrs CMPXCHG8B, DAA, LOOP)>; def AtomWrite01_20 : SchedWriteRes<[AtomPort01]> { let Latency = 20; let ResourceCycles = [20]; } def : InstRW<[AtomWrite01_20], (instrs DAS)>; def AtomWrite01_21 : SchedWriteRes<[AtomPort01]> { let Latency = 21; let ResourceCycles = [21]; } def : InstRW<[AtomWrite01_21], (instrs AAM8i8, STD)>; def AtomWrite01_22 : SchedWriteRes<[AtomPort01]> { let Latency = 22; let ResourceCycles = [22]; } def : InstRW<[AtomWrite01_22], (instrs CMPXCHG16B)>; def AtomWrite01_23 : SchedWriteRes<[AtomPort01]> { let Latency = 23; let ResourceCycles = [23]; } def : InstRW<[AtomWrite01_23], (instrs ARPL16mr, ARPL16rr)>; def AtomWrite01_25 : SchedWriteRes<[AtomPort01]> { let Latency = 25; let ResourceCycles = [25]; } def : InstRW<[AtomWrite01_25], (instrs FNCLEX, FXTRACT)>; def AtomWrite01_26 : SchedWriteRes<[AtomPort01]> { let Latency = 26; let ResourceCycles = [26]; } def : InstRW<[AtomWrite01_26], (instrs POPF32, POPF64)>; def AtomWrite01_29 : SchedWriteRes<[AtomPort01]> { let Latency = 29; let ResourceCycles = [29]; } def : InstRW<[AtomWrite01_29], (instregex "POP(DS|ES|FS|GS)(16|32|64)")>; def AtomWrite01_30 : SchedWriteRes<[AtomPort01]> { let Latency = 30; let ResourceCycles = [30]; } def : InstRW<[AtomWrite01_30], (instrs RDTSC, RDTSCP)>; def AtomWrite01_32 : SchedWriteRes<[AtomPort01]> { let Latency = 32; let ResourceCycles = [32]; } def : InstRW<[AtomWrite01_32], (instrs ENTER, POPF16)>; def AtomWrite01_45 : SchedWriteRes<[AtomPort01]> { let Latency = 45; let ResourceCycles = [45]; } def : InstRW<[AtomWrite01_45], (instrs MONITORrrr)>; def AtomWrite01_46 : SchedWriteRes<[AtomPort01]> { let Latency = 46; let ResourceCycles = [46]; } def : InstRW<[AtomWrite01_46], (instrs FRNDINT, MWAITrr, RDPMC)>; def AtomWrite01_48 : SchedWriteRes<[AtomPort01]> { let Latency = 48; let ResourceCycles = [48]; } def : InstRW<[AtomWrite01_48], (instrs POPSS16, POPSS32)>; def AtomWrite01_55 : SchedWriteRes<[AtomPort01]> { let Latency = 55; let ResourceCycles = [55]; } def : InstRW<[AtomWrite01_55], (instrs FPREM)>; def AtomWrite01_59 : SchedWriteRes<[AtomPort01]> { let Latency = 59; let ResourceCycles = [59]; } def : InstRW<[AtomWrite01_59], (instrs INSB, INSL, INSW)>; def AtomWrite01_63 : SchedWriteRes<[AtomPort01]> { let Latency = 63; let ResourceCycles = [63]; } def : InstRW<[AtomWrite01_63], (instrs FNINIT)>; def AtomWrite01_68 : SchedWriteRes<[AtomPort01]> { let Latency = 68; let ResourceCycles = [68]; } def : InstRW<[AtomWrite01_68], (instrs OUT8rr, OUT16rr, OUT32rr)>; def AtomWrite01_71 : SchedWriteRes<[AtomPort01]> { let Latency = 71; let ResourceCycles = [71]; } def : InstRW<[AtomWrite01_71], (instrs FPREM1, INVLPG, INVLPGA32, INVLPGA64)>; def AtomWrite01_72 : SchedWriteRes<[AtomPort01]> { let Latency = 72; let ResourceCycles = [72]; } def : InstRW<[AtomWrite01_72], (instrs OUT8ir, OUT16ir, OUT32ir)>; def AtomWrite01_74 : SchedWriteRes<[AtomPort01]> { let Latency = 74; let ResourceCycles = [74]; } def : InstRW<[AtomWrite01_74], (instrs OUTSB, OUTSL, OUTSW)>; def AtomWrite01_77 : SchedWriteRes<[AtomPort01]> { let Latency = 77; let ResourceCycles = [77]; } def : InstRW<[AtomWrite01_77], (instrs FSCALE)>; def AtomWrite01_78 : SchedWriteRes<[AtomPort01]> { let Latency = 78; let ResourceCycles = [78]; } def : InstRW<[AtomWrite01_78], (instrs RDMSR)>; def AtomWrite01_79 : SchedWriteRes<[AtomPort01]> { let Latency = 79; let ResourceCycles = [79]; } def : InstRW<[AtomWrite01_79], (instregex "RET(L|Q|W)?$", "LRETI?(L|Q|W)")>; def AtomWrite01_92 : SchedWriteRes<[AtomPort01]> { let Latency = 92; let ResourceCycles = [92]; } def : InstRW<[AtomWrite01_92], (instrs IN8ri, IN16ri, IN32ri)>; def AtomWrite01_94 : SchedWriteRes<[AtomPort01]> { let Latency = 94; let ResourceCycles = [94]; } def : InstRW<[AtomWrite01_94], (instrs IN8rr, IN16rr, IN32rr)>; def AtomWrite01_99 : SchedWriteRes<[AtomPort01]> { let Latency = 99; let ResourceCycles = [99]; } def : InstRW<[AtomWrite01_99], (instrs F2XM1)>; def AtomWrite01_121 : SchedWriteRes<[AtomPort01]> { let Latency = 121; let ResourceCycles = [121]; } def : InstRW<[AtomWrite01_121], (instrs CPUID)>; def AtomWrite01_127 : SchedWriteRes<[AtomPort01]> { let Latency = 127; let ResourceCycles = [127]; } def : InstRW<[AtomWrite01_127], (instrs INT)>; def AtomWrite01_130 : SchedWriteRes<[AtomPort01]> { let Latency = 130; let ResourceCycles = [130]; } def : InstRW<[AtomWrite01_130], (instrs INT3)>; def AtomWrite01_140 : SchedWriteRes<[AtomPort01]> { let Latency = 140; let ResourceCycles = [140]; } def : InstRW<[AtomWrite01_140], (instrs FXSAVE, FXSAVE64)>; def AtomWrite01_141 : SchedWriteRes<[AtomPort01]> { let Latency = 141; let ResourceCycles = [141]; } def : InstRW<[AtomWrite01_141], (instrs FXRSTOR, FXRSTOR64)>; def AtomWrite01_146 : SchedWriteRes<[AtomPort01]> { let Latency = 146; let ResourceCycles = [146]; } def : InstRW<[AtomWrite01_146], (instrs FYL2X)>; def AtomWrite01_147 : SchedWriteRes<[AtomPort01]> { let Latency = 147; let ResourceCycles = [147]; } def : InstRW<[AtomWrite01_147], (instrs FYL2XP1)>; def AtomWrite01_168 : SchedWriteRes<[AtomPort01]> { let Latency = 168; let ResourceCycles = [168]; } def : InstRW<[AtomWrite01_168], (instrs FPTAN)>; def AtomWrite01_174 : SchedWriteRes<[AtomPort01]> { let Latency = 174; let ResourceCycles = [174]; } def : InstRW<[AtomWrite01_174], (instrs FSINCOS)>; def : InstRW<[AtomWrite01_174], (instregex "(COS|SIN)_F")>; def AtomWrite01_183 : SchedWriteRes<[AtomPort01]> { let Latency = 183; let ResourceCycles = [183]; } def : InstRW<[AtomWrite01_183], (instrs FPATAN)>; def AtomWrite01_202 : SchedWriteRes<[AtomPort01]> { let Latency = 202; let ResourceCycles = [202]; } def : InstRW<[AtomWrite01_202], (instrs WRMSR)>; } // SchedModel