003 File Manager
Current Path:
/usr/src/contrib/llvm-project/llvm/lib/Target/PowerPC
usr
/
src
/
contrib
/
llvm-project
/
llvm
/
lib
/
Target
/
PowerPC
/
📁
..
📁
AsmParser
📁
Disassembler
📁
MCTargetDesc
📄
P9InstrResources.td
(37.36 KB)
📄
PPC.h
(4.69 KB)
📄
PPC.td
(32.37 KB)
📄
PPCAsmPrinter.cpp
(70.77 KB)
📄
PPCBoolRetToInt.cpp
(9.97 KB)
📄
PPCBranchCoalescing.cpp
(30.16 KB)
📄
PPCBranchSelector.cpp
(15.97 KB)
📄
PPCCCState.cpp
(1.08 KB)
📄
PPCCCState.h
(1.19 KB)
📄
PPCCTRLoops.cpp
(6.68 KB)
📄
PPCCallingConv.cpp
(6.19 KB)
📄
PPCCallingConv.h
(1.97 KB)
📄
PPCCallingConv.td
(16.32 KB)
📄
PPCEarlyReturn.cpp
(7.14 KB)
📄
PPCExpandISEL.cpp
(17.93 KB)
📄
PPCFastISel.cpp
(85.51 KB)
📄
PPCFrameLowering.cpp
(98.6 KB)
📄
PPCFrameLowering.h
(7.46 KB)
📄
PPCHazardRecognizers.cpp
(14.02 KB)
📄
PPCHazardRecognizers.h
(3.83 KB)
📄
PPCISelDAGToDAG.cpp
(256.88 KB)
📄
PPCISelLowering.cpp
(669.73 KB)
📄
PPCISelLowering.h
(55.9 KB)
📄
PPCInstr64Bit.td
(75.68 KB)
📄
PPCInstrAltivec.td
(77.68 KB)
📄
PPCInstrBuilder.h
(1.5 KB)
📄
PPCInstrFormats.td
(57.38 KB)
📄
PPCInstrHTM.td
(5.48 KB)
📄
PPCInstrInfo.cpp
(171.06 KB)
📄
PPCInstrInfo.h
(29.06 KB)
📄
PPCInstrInfo.td
(233.39 KB)
📄
PPCInstrPrefix.td
(41.72 KB)
📄
PPCInstrQPX.td
(57.56 KB)
📄
PPCInstrSPE.td
(49.71 KB)
📄
PPCInstrVSX.td
(223.48 KB)
📄
PPCLoopInstrFormPrep.cpp
(33.45 KB)
📄
PPCLowerMASSVEntries.cpp
(6.42 KB)
📄
PPCMCInstLower.cpp
(6.62 KB)
📄
PPCMIPeephole.cpp
(63.48 KB)
📄
PPCMachineFunctionInfo.cpp
(2.59 KB)
📄
PPCMachineFunctionInfo.h
(9.15 KB)
📄
PPCMachineScheduler.cpp
(4.03 KB)
📄
PPCMachineScheduler.h
(1.81 KB)
📄
PPCMacroFusion.cpp
(6.68 KB)
📄
PPCMacroFusion.def
(1.8 KB)
📄
PPCMacroFusion.h
(886 B)
📄
PPCPerfectShuffle.h
(397.57 KB)
📄
PPCPfmCounters.td
(705 B)
📄
PPCPreEmitPeephole.cpp
(13.36 KB)
📄
PPCQPXLoadSplat.cpp
(5.31 KB)
📄
PPCReduceCRLogicals.cpp
(28.66 KB)
📄
PPCRegisterInfo.cpp
(51.93 KB)
📄
PPCRegisterInfo.h
(6.61 KB)
📄
PPCRegisterInfo.td
(14.24 KB)
📄
PPCSchedule.td
(5.21 KB)
📄
PPCSchedule440.td
(34.57 KB)
📄
PPCScheduleA2.td
(7.85 KB)
📄
PPCScheduleE500.td
(16.59 KB)
📄
PPCScheduleE500mc.td
(20.89 KB)
📄
PPCScheduleE5500.td
(23.62 KB)
📄
PPCScheduleG3.td
(4.49 KB)
📄
PPCScheduleG4.td
(5.42 KB)
📄
PPCScheduleG4Plus.td
(6.45 KB)
📄
PPCScheduleG5.td
(7.1 KB)
📄
PPCScheduleP7.td
(22.26 KB)
📄
PPCScheduleP8.td
(23.96 KB)
📄
PPCScheduleP9.td
(12.27 KB)
📄
PPCSubtarget.cpp
(7.58 KB)
📄
PPCSubtarget.h
(13.21 KB)
📄
PPCTLSDynamicCall.cpp
(6.53 KB)
📄
PPCTOCRegDeps.cpp
(5.3 KB)
📄
PPCTargetMachine.cpp
(18.94 KB)
📄
PPCTargetMachine.h
(2.2 KB)
📄
PPCTargetObjectFile.cpp
(2.45 KB)
📄
PPCTargetObjectFile.h
(1.19 KB)
📄
PPCTargetStreamer.h
(1.02 KB)
📄
PPCTargetTransformInfo.cpp
(38.72 KB)
📄
PPCTargetTransformInfo.h
(5.6 KB)
📄
PPCVSXCopy.cpp
(5.68 KB)
📄
PPCVSXFMAMutate.cpp
(15.12 KB)
📄
PPCVSXSwapRemoval.cpp
(36.78 KB)
📄
README_P9.txt
(22.25 KB)
📁
TargetInfo
Editing: PPCScheduleP8.td
//===-- PPCScheduleP8.td - PPC P8 Scheduling Definitions ---*- tablegen -*-===// // // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. // See https://llvm.org/LICENSE.txt for license information. // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception // //===----------------------------------------------------------------------===// // // This file defines the itinerary class data for the POWER8 processor. // //===----------------------------------------------------------------------===// // Scheduling for the P8 involves tracking two types of resources: // 1. The dispatch bundle slots // 2. The functional unit resources // Dispatch units: def P8_DU1 : FuncUnit; def P8_DU2 : FuncUnit; def P8_DU3 : FuncUnit; def P8_DU4 : FuncUnit; def P8_DU5 : FuncUnit; def P8_DU6 : FuncUnit; def P8_DU7 : FuncUnit; // Only branch instructions will use DU7,DU8 def P8_DU8 : FuncUnit; // 10 insns per cycle (2-LU, 2-LSU, 2-FXU, 2-FPU, 1-CRU, 1-BRU). def P8_LU1 : FuncUnit; // Loads or fixed-point operations 1 def P8_LU2 : FuncUnit; // Loads or fixed-point operations 2 // Load/Store pipelines can handle Stores, fixed-point loads, and simple // fixed-point operations. def P8_LSU1 : FuncUnit; // Load/Store pipeline 1 def P8_LSU2 : FuncUnit; // Load/Store pipeline 2 // Fixed Point unit def P8_FXU1 : FuncUnit; // FX pipeline 1 def P8_FXU2 : FuncUnit; // FX pipeline 2 // The Floating-Point Unit (FPU) and Vector Media Extension (VMX) units // are combined on P7 and newer into a Vector Scalar Unit (VSU). // The P8 Instruction latency documents still refers to the unit as the // FPU, so keep in mind that FPU==VSU. // In contrast to the P7, the VMX units on P8 are symmetric, so no need to // split vector integer ops or 128-bit load/store/perms to the specific units. def P8_FPU1 : FuncUnit; // VS pipeline 1 def P8_FPU2 : FuncUnit; // VS pipeline 2 def P8_CRU : FuncUnit; // CR unit (CR logicals and move-from-SPRs) def P8_BRU : FuncUnit; // BR unit def P8Itineraries : ProcessorItineraries< [P8_DU1, P8_DU2, P8_DU3, P8_DU4, P8_DU5, P8_DU6, P8_DU7, P8_DU8, P8_LU1, P8_LU2, P8_LSU1, P8_LSU2, P8_FXU1, P8_FXU2, P8_FPU1, P8_FPU2, P8_CRU, P8_BRU], [], [ InstrItinData<IIC_IntSimple , [InstrStage<1, [P8_DU1, P8_DU2, P8_DU3, P8_DU4, P8_DU5, P8_DU6], 0>, InstrStage<1, [P8_FXU1, P8_FXU2, P8_LU1, P8_LU2, P8_LSU1, P8_LSU2]>], [1, 1, 1]>, InstrItinData<IIC_IntGeneral , [InstrStage<1, [P8_DU1, P8_DU2, P8_DU3, P8_DU4, P8_DU5, P8_DU6], 0>, InstrStage<1, [P8_FXU1, P8_FXU2, P8_LU1, P8_LU2, P8_LSU1, P8_LSU2]>], [1, 1, 1]>, InstrItinData<IIC_IntISEL, [InstrStage<1, [P8_DU1], 0>, InstrStage<1, [P8_FXU1, P8_FXU2], 0>, InstrStage<1, [P8_BRU]>], [1, 1, 1, 1]>, InstrItinData<IIC_IntCompare , [InstrStage<1, [P8_DU1, P8_DU2, P8_DU3, P8_DU4, P8_DU5, P8_DU6], 0>, InstrStage<1, [P8_FXU1, P8_FXU2]>], [1, 1, 1]>, InstrItinData<IIC_IntDivW , [InstrStage<1, [P8_DU1, P8_DU2, P8_DU3, P8_DU4, P8_DU5, P8_DU6], 0>, InstrStage<15, [P8_FXU1, P8_FXU2]>], [15, 1, 1]>, InstrItinData<IIC_IntDivD , [InstrStage<1, [P8_DU1, P8_DU2, P8_DU3, P8_DU4, P8_DU5, P8_DU6], 0>, InstrStage<23, [P8_FXU1, P8_FXU2]>], [23, 1, 1]>, InstrItinData<IIC_IntMulHW , [InstrStage<1, [P8_DU1, P8_DU2, P8_DU3, P8_DU4, P8_DU5, P8_DU6], 0>, InstrStage<1, [P8_FXU1, P8_FXU2]>], [4, 1, 1]>, InstrItinData<IIC_IntMulHWU , [InstrStage<1, [P8_DU1, P8_DU2, P8_DU3, P8_DU4, P8_DU5, P8_DU6], 0>, InstrStage<1, [P8_FXU1, P8_FXU2]>], [4, 1, 1]>, InstrItinData<IIC_IntMulHD , [InstrStage<1, [P8_DU1, P8_DU2, P8_DU3, P8_DU4, P8_DU5, P8_DU6], 0>, InstrStage<1, [P8_FXU1, P8_FXU2]>], [4, 1, 1]>, InstrItinData<IIC_IntMulLI , [InstrStage<1, [P8_DU1, P8_DU2, P8_DU3, P8_DU4, P8_DU5, P8_DU6], 0>, InstrStage<1, [P8_FXU1, P8_FXU2]>], [4, 1, 1]>, InstrItinData<IIC_IntRotate , [InstrStage<1, [P8_DU1, P8_DU2, P8_DU3, P8_DU4, P8_DU5, P8_DU6], 0>, InstrStage<1, [P8_FXU1, P8_FXU2]>], [1, 1, 1]>, InstrItinData<IIC_IntRotateD , [InstrStage<1, [P8_DU1, P8_DU2, P8_DU3, P8_DU4, P8_DU5, P8_DU6], 0>, InstrStage<1, [P8_FXU1, P8_FXU2]>], [1, 1, 1]>, InstrItinData<IIC_IntRotateDI , [InstrStage<1, [P8_DU1, P8_DU2, P8_DU3, P8_DU4, P8_DU5, P8_DU6], 0>, InstrStage<1, [P8_FXU1, P8_FXU2]>], [1, 1, 1]>, InstrItinData<IIC_IntShift , [InstrStage<1, [P8_DU1, P8_DU2, P8_DU3, P8_DU4, P8_DU5, P8_DU6], 0>, InstrStage<1, [P8_FXU1, P8_FXU2]>], [1, 1, 1]>, InstrItinData<IIC_IntTrapW , [InstrStage<1, [P8_DU1, P8_DU2, P8_DU3, P8_DU4, P8_DU5, P8_DU6], 0>, InstrStage<1, [P8_FXU1, P8_FXU2]>], [1, 1]>, InstrItinData<IIC_IntTrapD , [InstrStage<1, [P8_DU1, P8_DU2, P8_DU3, P8_DU4, P8_DU5, P8_DU6], 0>, InstrStage<1, [P8_FXU1, P8_FXU2]>], [1, 1]>, InstrItinData<IIC_BrB , [InstrStage<1, [P8_DU7, P8_DU8], 0>, InstrStage<1, [P8_BRU]>], [3, 1, 1]>, // FIXME - the Br* groups below are not branch related, so should probably // be renamed. // IIC_BrCR consists of the cr* instructions. (crand,crnor,creqv, etc). // and should be 'First' in dispatch. InstrItinData<IIC_BrCR , [InstrStage<1, [P8_DU1], 0>, InstrStage<1, [P8_CRU]>], [3, 1, 1]>, // IIC_BrMCR consists of the mcrf instruction. InstrItinData<IIC_BrMCR , [InstrStage<1, [P8_DU1, P8_DU2, P8_DU3, P8_DU4, P8_DU5, P8_DU6], 0>, InstrStage<1, [P8_CRU]>], [3, 1, 1]>, // IIC_BrMCRX consists of mcrxr (obsolete instruction) and mtcrf, which // should be first in the dispatch group. InstrItinData<IIC_BrMCRX , [InstrStage<1, [P8_DU1], 0>, InstrStage<1, [P8_FXU1, P8_FXU2]>], [3, 1, 1]>, InstrItinData<IIC_BrMCRX , [InstrStage<1, [P8_DU1], 0>, InstrStage<1, [P8_FXU1, P8_FXU2]>], [3, 1]>, InstrItinData<IIC_LdStLoad , [InstrStage<1, [P8_DU1, P8_DU2, P8_DU3, P8_DU4, P8_DU5, P8_DU6], 0>, InstrStage<1, [P8_LSU1, P8_LSU2, P8_LU1, P8_LU2]>], [2, 1, 1]>, InstrItinData<IIC_LdStLoadUpd , [InstrStage<1, [P8_DU1], 0>, InstrStage<1, [P8_DU2], 0>, InstrStage<1, [P8_LSU1, P8_LSU2, P8_LU1, P8_LU2 ], 0>, InstrStage<1, [P8_FXU1, P8_FXU2]>], [2, 2, 1, 1]>, // Update-Indexed form loads/stores are no longer first and last in the // dispatch group. They are simply cracked, so require DU1,DU2. InstrItinData<IIC_LdStLoadUpdX, [InstrStage<1, [P8_DU1], 0>, InstrStage<1, [P8_DU2], 0>, InstrStage<1, [P8_LSU1, P8_LSU2, P8_LU1, P8_LU2], 0>, InstrStage<1, [P8_FXU1, P8_FXU2]>], [3, 3, 1, 1]>, InstrItinData<IIC_LdStLD , [InstrStage<1, [P8_DU1, P8_DU2, P8_DU3, P8_DU4, P8_DU5, P8_DU6], 0>, InstrStage<1, [P8_LSU1, P8_LSU2, P8_LU1, P8_LU2]>], [2, 1, 1]>, InstrItinData<IIC_LdStLDU , [InstrStage<1, [P8_DU1], 0>, InstrStage<1, [P8_DU2], 0>, InstrStage<1, [P8_LSU1, P8_LSU2, P8_LU1, P8_LU2], 0>, InstrStage<1, [P8_FXU1, P8_FXU2]>], [2, 2, 1, 1]>, InstrItinData<IIC_LdStLDUX , [InstrStage<1, [P8_DU1], 0>, InstrStage<1, [P8_DU2], 0>, InstrStage<1, [P8_LSU1, P8_LSU2, P8_LU1, P8_LU2], 0>, InstrStage<1, [P8_FXU1, P8_FXU2]>], [3, 3, 1, 1]>, InstrItinData<IIC_LdStLFD , [InstrStage<1, [P8_DU1, P8_DU2, P8_DU3, P8_DU4, P8_DU5, P8_DU6], 0>, InstrStage<1, [P8_LU1, P8_LU2]>], [3, 1, 1]>, InstrItinData<IIC_LdStLVecX , [InstrStage<1, [P8_DU1, P8_DU2, P8_DU3, P8_DU4, P8_DU5, P8_DU6], 0>, InstrStage<1, [P8_LU1, P8_LU2]>], [3, 1, 1]>, InstrItinData<IIC_LdStLFDU , [InstrStage<1, [P8_DU1], 0>, InstrStage<1, [P8_DU2], 0>, InstrStage<1, [P8_LU1, P8_LU2], 0>, InstrStage<1, [P8_FXU1, P8_FXU2]>], [3, 3, 1, 1]>, InstrItinData<IIC_LdStLFDUX , [InstrStage<1, [P8_DU1], 0>, InstrStage<1, [P8_DU2], 0>, InstrStage<1, [P8_LU1, P8_LU2], 0>, InstrStage<1, [P8_FXU1, P8_FXU2]>], [3, 3, 1, 1]>, InstrItinData<IIC_LdStLHA , [InstrStage<1, [P8_DU1], 0>, InstrStage<1, [P8_DU2], 0>, InstrStage<1, [P8_LSU1, P8_LSU2, P8_LU1, P8_LU2], 0>, InstrStage<1, [P8_FXU1, P8_FXU2, P8_LU1, P8_LU2]>], [3, 1, 1]>, InstrItinData<IIC_LdStLHAU , [InstrStage<1, [P8_DU1], 0>, InstrStage<1, [P8_DU2], 0>, InstrStage<1, [P8_LSU1, P8_LSU2, P8_LU1, P8_LU2], 0>, InstrStage<1, [P8_FXU1, P8_FXU2]>, InstrStage<1, [P8_FXU1, P8_FXU2]>], [4, 4, 1, 1]>, // first+last in dispatch group. InstrItinData<IIC_LdStLHAUX , [InstrStage<1, [P8_DU1], 0>, InstrStage<1, [P8_DU2], 0>, InstrStage<1, [P8_DU3], 0>, InstrStage<1, [P8_DU4], 0>, InstrStage<1, [P8_DU5], 0>, InstrStage<1, [P8_DU6], 0>, InstrStage<1, [P8_LSU1, P8_LSU2, P8_LU1, P8_LU2], 0>, InstrStage<1, [P8_FXU1, P8_FXU2]>, InstrStage<1, [P8_FXU1, P8_FXU2]>], [4, 4, 1, 1]>, InstrItinData<IIC_LdStLWA , [InstrStage<1, [P8_DU1], 0>, InstrStage<1, [P8_DU2], 0>, InstrStage<1, [P8_LSU1, P8_LSU2, P8_LU1, P8_LU2]>, InstrStage<1, [P8_FXU1, P8_FXU2]>], [3, 1, 1]>, InstrItinData<IIC_LdStLWARX, [InstrStage<1, [P8_DU1], 0>, InstrStage<1, [P8_DU2], 0>, InstrStage<1, [P8_DU3], 0>, InstrStage<1, [P8_DU4], 0>, InstrStage<1, [P8_LSU1, P8_LSU2, P8_LU1, P8_LU2]>], [3, 1, 1]>, // first+last InstrItinData<IIC_LdStLDARX, [InstrStage<1, [P8_DU1], 0>, InstrStage<1, [P8_DU2], 0>, InstrStage<1, [P8_DU3], 0>, InstrStage<1, [P8_DU4], 0>, InstrStage<1, [P8_DU5], 0>, InstrStage<1, [P8_DU6], 0>, InstrStage<1, [P8_LSU1, P8_LSU2, P8_LU1, P8_LU2]>], [3, 1, 1]>, InstrItinData<IIC_LdStLMW , [InstrStage<1, [P8_DU1, P8_DU2, P8_DU3, P8_DU4, P8_DU5, P8_DU6], 0>, InstrStage<1, [P8_LSU1, P8_LSU2, P8_LU1, P8_LU2]>], [2, 1, 1]>, // Stores are dual-issued from the issue queue, so may only take up one // dispatch slot. The instruction will be broken into two IOPS. The agen // op is issued to the LSU, and the data op (register fetch) is issued // to either the LU (GPR store) or the VSU (FPR store). InstrItinData<IIC_LdStStore , [InstrStage<1, [P8_DU1, P8_DU2, P8_DU3, P8_DU4, P8_DU5, P8_DU6], 0>, InstrStage<1, [P8_LSU1, P8_LSU2]>, InstrStage<1, [P8_LU1, P8_LU2]>], [1, 1, 1]>, InstrItinData<IIC_LdStSTD , [InstrStage<1, [P8_DU1, P8_DU2, P8_DU3, P8_DU4, P8_DU5, P8_DU6], 0>, InstrStage<1, [P8_LU1, P8_LU2, P8_LSU1, P8_LSU2]>] [1, 1, 1]>, InstrItinData<IIC_LdStSTU , [InstrStage<1, [P8_DU1], 0>, InstrStage<1, [P8_DU2], 0>, InstrStage<1, [P8_LU1, P8_LU2, P8_LSU1, P8_LSU2], 0>, InstrStage<1, [P8_FXU1, P8_FXU2]>], [2, 1, 1, 1]>, // First+last InstrItinData<IIC_LdStSTUX , [InstrStage<1, [P8_DU1], 0>, InstrStage<1, [P8_DU2], 0>, InstrStage<1, [P8_DU3], 0>, InstrStage<1, [P8_DU4], 0>, InstrStage<1, [P8_DU5], 0>, InstrStage<1, [P8_DU6], 0>, InstrStage<1, [P8_LSU1, P8_LSU2], 0>, InstrStage<1, [P8_FXU1, P8_FXU2]>, InstrStage<1, [P8_FXU1, P8_FXU2]>], [2, 1, 1, 1]>, InstrItinData<IIC_LdStSTFD , [InstrStage<1, [P8_DU1, P8_DU2, P8_DU3, P8_DU4, P8_DU5, P8_DU6], 0>, InstrStage<1, [P8_LSU1, P8_LSU2], 0>, InstrStage<1, [P8_FPU1, P8_FPU2]>], [1, 1, 1]>, InstrItinData<IIC_LdStSTFDU , [InstrStage<1, [P8_DU1], 0>, InstrStage<1, [P8_DU2], 0>, InstrStage<1, [P8_LSU1, P8_LSU2], 0>, InstrStage<1, [P8_FXU1, P8_FXU2], 0>, InstrStage<1, [P8_FPU1, P8_FPU2]>], [2, 1, 1, 1]>, InstrItinData<IIC_LdStSTVEBX , [InstrStage<1, [P8_DU1, P8_DU2, P8_DU3, P8_DU4, P8_DU5, P8_DU6], 0>, InstrStage<1, [P8_LSU1, P8_LSU2], 0>, InstrStage<1, [P8_FPU1, P8_FPU2]>], [1, 1, 1]>, InstrItinData<IIC_LdStSTDCX , [InstrStage<1, [P8_DU1], 0>, InstrStage<1, [P8_DU2], 0>, InstrStage<1, [P8_DU3], 0>, InstrStage<1, [P8_DU4], 0>, InstrStage<1, [P8_DU5], 0>, InstrStage<1, [P8_DU6], 0>, InstrStage<1, [P8_LSU1, P8_LSU2], 0>, InstrStage<1, [P8_LU1, P8_LU2]>], [1, 1, 1]>, InstrItinData<IIC_LdStSTWCX , [InstrStage<1, [P8_DU1], 0>, InstrStage<1, [P8_DU2], 0>, InstrStage<1, [P8_DU3], 0>, InstrStage<1, [P8_DU4], 0>, InstrStage<1, [P8_DU5], 0>, InstrStage<1, [P8_DU6], 0>, InstrStage<1, [P8_LSU1, P8_LSU2], 0>, InstrStage<1, [P8_LU1, P8_LU2]>], [1, 1, 1]>, InstrItinData<IIC_SprMFCR , [InstrStage<1, [P8_DU1], 0>, InstrStage<1, [P8_CRU]>], [6, 1]>, InstrItinData<IIC_SprMFCRF , [InstrStage<1, [P8_DU1], 0>, InstrStage<1, [P8_CRU]>], [3, 1]>, InstrItinData<IIC_SprMTSPR , [InstrStage<1, [P8_DU1], 0>, InstrStage<1, [P8_FXU1, P8_FXU2]>], [4, 1]>, // mtctr InstrItinData<IIC_FPGeneral , [InstrStage<1, [P8_DU1, P8_DU2, P8_DU3, P8_DU4, P8_DU5, P8_DU6], 0>, InstrStage<1, [P8_FPU1, P8_FPU2]>], [5, 1, 1]>, InstrItinData<IIC_FPAddSub , [InstrStage<1, [P8_DU1, P8_DU2, P8_DU3, P8_DU4, P8_DU5, P8_DU6], 0>, InstrStage<1, [P8_FPU1, P8_FPU2]>], [5, 1, 1]>, InstrItinData<IIC_FPCompare , [InstrStage<1, [P8_DU1, P8_DU2, P8_DU3, P8_DU4, P8_DU5, P8_DU6], 0>, InstrStage<1, [P8_FPU1, P8_FPU2]>], [8, 1, 1]>, InstrItinData<IIC_FPDivD , [InstrStage<1, [P8_DU1, P8_DU2, P8_DU3, P8_DU4, P8_DU5, P8_DU6], 0>, InstrStage<1, [P8_FPU1, P8_FPU2]>], [33, 1, 1]>, InstrItinData<IIC_FPDivS , [InstrStage<1, [P8_DU1, P8_DU2, P8_DU3, P8_DU4, P8_DU5, P8_DU6], 0>, InstrStage<1, [P8_FPU1, P8_FPU2]>], [27, 1, 1]>, InstrItinData<IIC_FPSqrtD , [InstrStage<1, [P8_DU1, P8_DU2, P8_DU3, P8_DU4, P8_DU5, P8_DU6], 0>, InstrStage<1, [P8_FPU1, P8_FPU2]>], [44, 1, 1]>, InstrItinData<IIC_FPSqrtS , [InstrStage<1, [P8_DU1, P8_DU2, P8_DU3, P8_DU4, P8_DU5, P8_DU6], 0>, InstrStage<1, [P8_FPU1, P8_FPU2]>], [32, 1, 1]>, InstrItinData<IIC_FPFused , [InstrStage<1, [P8_DU1, P8_DU2, P8_DU3, P8_DU4, P8_DU5, P8_DU6], 0>, InstrStage<1, [P8_FPU1, P8_FPU2]>], [5, 1, 1, 1]>, InstrItinData<IIC_FPRes , [InstrStage<1, [P8_DU1, P8_DU2, P8_DU3, P8_DU4, P8_DU5, P8_DU6], 0>, InstrStage<1, [P8_FPU1, P8_FPU2]>], [5, 1, 1]>, InstrItinData<IIC_VecGeneral , [InstrStage<1, [P8_DU1], 0>, InstrStage<1, [P8_FPU1, P8_FPU2]>], [2, 1, 1]>, InstrItinData<IIC_VecVSL , [InstrStage<1, [P8_DU1], 0>, InstrStage<1, [P8_FPU1, P8_FPU2]>], [2, 1, 1]>, InstrItinData<IIC_VecVSR , [InstrStage<1, [P8_DU1], 0>, InstrStage<1, [P8_FPU1, P8_FPU2]>], [2, 1, 1]>, InstrItinData<IIC_VecFP , [InstrStage<1, [P8_DU1], 0>, InstrStage<1, [P8_FPU1, P8_FPU2]>], [6, 1, 1]>, InstrItinData<IIC_VecFPCompare, [InstrStage<1, [P8_DU1], 0>, InstrStage<1, [P8_FPU1, P8_FPU2]>], [6, 1, 1]>, InstrItinData<IIC_VecFPRound , [InstrStage<1, [P8_DU1], 0>, InstrStage<1, [P8_FPU1, P8_FPU2]>], [6, 1, 1]>, InstrItinData<IIC_VecComplex , [InstrStage<1, [P8_DU1], 0>, InstrStage<1, [P8_FPU1, P8_FPU2]>], [7, 1, 1]>, InstrItinData<IIC_VecPerm , [InstrStage<1, [P8_DU1, P8_DU2], 0>, InstrStage<1, [P8_FPU1, P8_FPU2]>], [3, 1, 1]> ]>; // ===---------------------------------------------------------------------===// // P8 machine model for scheduling and other instruction cost heuristics. // P8 has an 8 insn dispatch group (6 non-branch, 2 branch) and can issue up // to 10 insns per cycle (2-LU, 2-LSU, 2-FXU, 2-FPU, 1-CRU, 1-BRU). def P8Model : SchedMachineModel { let IssueWidth = 8; // up to 8 instructions dispatched per cycle. // up to six non-branch instructions. // up to two branches in a dispatch group. let LoadLatency = 3; // Optimistic load latency assuming bypass. // This is overriden by OperandCycles if the // Itineraries are queried instead. let MispredictPenalty = 16; // Try to make sure we have at least 10 dispatch groups in a loop. let LoopMicroOpBufferSize = 60; let CompleteModel = 0; let Itineraries = P8Itineraries; }
Upload File
Create Folder