003 File Manager
Current Path:
/usr/src/contrib/llvm-project/llvm/lib/Target/X86
usr
/
src
/
contrib
/
llvm-project
/
llvm
/
lib
/
Target
/
X86
/
📁
..
📁
AsmParser
📁
Disassembler
📄
ImmutableGraph.h
(15.15 KB)
📁
MCTargetDesc
📁
TargetInfo
📄
X86.h
(7.41 KB)
📄
X86.td
(68.44 KB)
📄
X86AsmPrinter.cpp
(27.18 KB)
📄
X86AsmPrinter.h
(5.96 KB)
📄
X86AvoidStoreForwardingBlocks.cpp
(27.94 KB)
📄
X86AvoidTrailingCall.cpp
(4.91 KB)
📄
X86CallFrameOptimization.cpp
(23.07 KB)
📄
X86CallLowering.cpp
(17.62 KB)
📄
X86CallLowering.h
(1.74 KB)
📄
X86CallingConv.cpp
(13.34 KB)
📄
X86CallingConv.h
(1.09 KB)
📄
X86CallingConv.td
(46.15 KB)
📄
X86CmovConversion.cpp
(34.07 KB)
📄
X86CondBrFolding.cpp
(18.4 KB)
📄
X86DiscriminateMemOps.cpp
(7.11 KB)
📄
X86DomainReassignment.cpp
(25.87 KB)
📄
X86EvexToVex.cpp
(8.8 KB)
📄
X86ExpandPseudo.cpp
(16.95 KB)
📄
X86FastISel.cpp
(139.28 KB)
📄
X86FixupBWInsts.cpp
(18.09 KB)
📄
X86FixupLEAs.cpp
(24.44 KB)
📄
X86FixupSetCC.cpp
(4.44 KB)
📄
X86FlagsCopyLowering.cpp
(40.36 KB)
📄
X86FloatingPoint.cpp
(62.66 KB)
📄
X86FrameLowering.cpp
(138.71 KB)
📄
X86FrameLowering.h
(11.64 KB)
📄
X86GenRegisterBankInfo.def
(3.32 KB)
📄
X86ISelDAGToDAG.cpp
(208.37 KB)
📄
X86ISelLowering.cpp
(1.94 MB)
📄
X86ISelLowering.h
(60.88 KB)
📄
X86IndirectBranchTracking.cpp
(6.17 KB)
📄
X86IndirectThunks.cpp
(9.78 KB)
📄
X86InsertPrefetch.cpp
(9.64 KB)
📄
X86InsertWait.cpp
(4.47 KB)
📄
X86Instr3DNow.td
(5.24 KB)
📄
X86InstrAMX.td
(5.6 KB)
📄
X86InstrAVX512.td
(653.76 KB)
📄
X86InstrArithmetic.td
(75.61 KB)
📄
X86InstrBuilder.h
(8.45 KB)
📄
X86InstrCMovSetCC.td
(5.76 KB)
📄
X86InstrCompiler.td
(95.78 KB)
📄
X86InstrControl.td
(20.53 KB)
📄
X86InstrExtension.td
(11.64 KB)
📄
X86InstrFMA.td
(33.23 KB)
📄
X86InstrFMA3Info.cpp
(6.21 KB)
📄
X86InstrFMA3Info.h
(3.25 KB)
📄
X86InstrFPStack.td
(39.52 KB)
📄
X86InstrFoldTables.cpp
(393.01 KB)
📄
X86InstrFoldTables.h
(3.03 KB)
📄
X86InstrFormats.td
(41.05 KB)
📄
X86InstrFragmentsSIMD.td
(61.14 KB)
📄
X86InstrInfo.cpp
(322.72 KB)
📄
X86InstrInfo.h
(29.34 KB)
📄
X86InstrInfo.td
(169.76 KB)
📄
X86InstrMMX.td
(29.55 KB)
📄
X86InstrMPX.td
(3.63 KB)
📄
X86InstrSGX.td
(1.12 KB)
📄
X86InstrSSE.td
(385.01 KB)
📄
X86InstrSVM.td
(2.16 KB)
📄
X86InstrShiftRotate.td
(49.56 KB)
📄
X86InstrSystem.td
(34.03 KB)
📄
X86InstrTSX.td
(2.1 KB)
📄
X86InstrVMX.td
(3.53 KB)
📄
X86InstrVecCompiler.td
(21.09 KB)
📄
X86InstrXOP.td
(23.81 KB)
📄
X86InstructionSelector.cpp
(61.11 KB)
📄
X86InterleavedAccess.cpp
(32.7 KB)
📄
X86IntrinsicsInfo.h
(73.96 KB)
📄
X86LegalizerInfo.cpp
(15.6 KB)
📄
X86LegalizerInfo.h
(1.65 KB)
📄
X86LoadValueInjectionLoadHardening.cpp
(32.4 KB)
📄
X86LoadValueInjectionRetHardening.cpp
(4.93 KB)
📄
X86MCInstLower.cpp
(96.53 KB)
📄
X86MachineFunctionInfo.cpp
(1.1 KB)
📄
X86MachineFunctionInfo.h
(8.87 KB)
📄
X86MacroFusion.cpp
(2.62 KB)
📄
X86MacroFusion.h
(992 B)
📄
X86OptimizeLEAs.cpp
(27.47 KB)
📄
X86PadShortFunction.cpp
(7.33 KB)
📄
X86PartialReduction.cpp
(15.46 KB)
📄
X86PfmCounters.td
(10.18 KB)
📄
X86RegisterBankInfo.cpp
(10.55 KB)
📄
X86RegisterBankInfo.h
(2.87 KB)
📄
X86RegisterBanks.td
(629 B)
📄
X86RegisterInfo.cpp
(29 KB)
📄
X86RegisterInfo.h
(5.61 KB)
📄
X86RegisterInfo.td
(26.07 KB)
📄
X86SchedBroadwell.td
(69.45 KB)
📄
X86SchedHaswell.td
(73.96 KB)
📄
X86SchedPredicates.td
(4.23 KB)
📄
X86SchedSandyBridge.td
(50 KB)
📄
X86SchedSkylakeClient.td
(74.65 KB)
📄
X86SchedSkylakeServer.td
(113.85 KB)
📄
X86Schedule.td
(36.9 KB)
📄
X86ScheduleAtom.td
(38.26 KB)
📄
X86ScheduleBdVer2.td
(56.78 KB)
📄
X86ScheduleBtVer2.td
(46.98 KB)
📄
X86ScheduleSLM.td
(22.91 KB)
📄
X86ScheduleZnver1.td
(48.97 KB)
📄
X86ScheduleZnver2.td
(48.12 KB)
📄
X86SelectionDAGInfo.cpp
(12.02 KB)
📄
X86SelectionDAGInfo.h
(1.8 KB)
📄
X86ShuffleDecodeConstantPool.cpp
(11.22 KB)
📄
X86ShuffleDecodeConstantPool.h
(2.13 KB)
📄
X86SpeculativeExecutionSideEffectSuppression.cpp
(6.97 KB)
📄
X86SpeculativeLoadHardening.cpp
(93.16 KB)
📄
X86Subtarget.cpp
(13.25 KB)
📄
X86Subtarget.h
(32.08 KB)
📄
X86TargetMachine.cpp
(18.88 KB)
📄
X86TargetMachine.h
(2.04 KB)
📄
X86TargetObjectFile.cpp
(2.61 KB)
📄
X86TargetObjectFile.h
(2.13 KB)
📄
X86TargetTransformInfo.cpp
(189.14 KB)
📄
X86TargetTransformInfo.h
(9.63 KB)
📄
X86VZeroUpper.cpp
(12.59 KB)
📄
X86WinAllocaExpander.cpp
(9.54 KB)
📄
X86WinEHState.cpp
(28.97 KB)
Editing: X86InstrFMA3Info.cpp
//===-- X86InstrFMA3Info.cpp - X86 FMA3 Instruction Information -----------===// // // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. // See https://llvm.org/LICENSE.txt for license information. // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception // //===----------------------------------------------------------------------===// // // This file contains the implementation of the classes providing information // about existing X86 FMA3 opcodes, classifying and grouping them. // //===----------------------------------------------------------------------===// #include "X86InstrFMA3Info.h" #include "X86InstrInfo.h" #include "llvm/Support/ManagedStatic.h" #include "llvm/Support/Threading.h" #include <cassert> #include <cstdint> using namespace llvm; #define FMA3GROUP(Name, Suf, Attrs) \ { { X86::Name##132##Suf, X86::Name##213##Suf, X86::Name##231##Suf }, Attrs }, #define FMA3GROUP_MASKED(Name, Suf, Attrs) \ FMA3GROUP(Name, Suf, Attrs) \ FMA3GROUP(Name, Suf##k, Attrs | X86InstrFMA3Group::KMergeMasked) \ FMA3GROUP(Name, Suf##kz, Attrs | X86InstrFMA3Group::KZeroMasked) #define FMA3GROUP_PACKED_WIDTHS(Name, Suf, Attrs) \ FMA3GROUP(Name, Suf##Ym, Attrs) \ FMA3GROUP(Name, Suf##Yr, Attrs) \ FMA3GROUP_MASKED(Name, Suf##Z128m, Attrs) \ FMA3GROUP_MASKED(Name, Suf##Z128r, Attrs) \ FMA3GROUP_MASKED(Name, Suf##Z256m, Attrs) \ FMA3GROUP_MASKED(Name, Suf##Z256r, Attrs) \ FMA3GROUP_MASKED(Name, Suf##Zm, Attrs) \ FMA3GROUP_MASKED(Name, Suf##Zr, Attrs) \ FMA3GROUP(Name, Suf##m, Attrs) \ FMA3GROUP(Name, Suf##r, Attrs) #define FMA3GROUP_PACKED(Name, Attrs) \ FMA3GROUP_PACKED_WIDTHS(Name, PD, Attrs) \ FMA3GROUP_PACKED_WIDTHS(Name, PS, Attrs) #define FMA3GROUP_SCALAR_WIDTHS(Name, Suf, Attrs) \ FMA3GROUP(Name, Suf##Zm, Attrs) \ FMA3GROUP_MASKED(Name, Suf##Zm_Int, Attrs | X86InstrFMA3Group::Intrinsic) \ FMA3GROUP(Name, Suf##Zr, Attrs) \ FMA3GROUP_MASKED(Name, Suf##Zr_Int, Attrs | X86InstrFMA3Group::Intrinsic) \ FMA3GROUP(Name, Suf##m, Attrs) \ FMA3GROUP(Name, Suf##m_Int, Attrs | X86InstrFMA3Group::Intrinsic) \ FMA3GROUP(Name, Suf##r, Attrs) \ FMA3GROUP(Name, Suf##r_Int, Attrs | X86InstrFMA3Group::Intrinsic) #define FMA3GROUP_SCALAR(Name, Attrs) \ FMA3GROUP_SCALAR_WIDTHS(Name, SD, Attrs) \ FMA3GROUP_SCALAR_WIDTHS(Name, SS, Attrs) #define FMA3GROUP_FULL(Name, Attrs) \ FMA3GROUP_PACKED(Name, Attrs) \ FMA3GROUP_SCALAR(Name, Attrs) static const X86InstrFMA3Group Groups[] = { FMA3GROUP_FULL(VFMADD, 0) FMA3GROUP_PACKED(VFMADDSUB, 0) FMA3GROUP_FULL(VFMSUB, 0) FMA3GROUP_PACKED(VFMSUBADD, 0) FMA3GROUP_FULL(VFNMADD, 0) FMA3GROUP_FULL(VFNMSUB, 0) }; #define FMA3GROUP_PACKED_AVX512_WIDTHS(Name, Type, Suf, Attrs) \ FMA3GROUP_MASKED(Name, Type##Z128##Suf, Attrs) \ FMA3GROUP_MASKED(Name, Type##Z256##Suf, Attrs) \ FMA3GROUP_MASKED(Name, Type##Z##Suf, Attrs) #define FMA3GROUP_PACKED_AVX512(Name, Suf, Attrs) \ FMA3GROUP_PACKED_AVX512_WIDTHS(Name, PD, Suf, Attrs) \ FMA3GROUP_PACKED_AVX512_WIDTHS(Name, PS, Suf, Attrs) #define FMA3GROUP_PACKED_AVX512_ROUND(Name, Suf, Attrs) \ FMA3GROUP_MASKED(Name, PDZ##Suf, Attrs) \ FMA3GROUP_MASKED(Name, PSZ##Suf, Attrs) #define FMA3GROUP_SCALAR_AVX512_ROUND(Name, Suf, Attrs) \ FMA3GROUP(Name, SDZ##Suf, Attrs) \ FMA3GROUP_MASKED(Name, SDZ##Suf##_Int, Attrs) \ FMA3GROUP(Name, SSZ##Suf, Attrs) \ FMA3GROUP_MASKED(Name, SSZ##Suf##_Int, Attrs) static const X86InstrFMA3Group BroadcastGroups[] = { FMA3GROUP_PACKED_AVX512(VFMADD, mb, 0) FMA3GROUP_PACKED_AVX512(VFMADDSUB, mb, 0) FMA3GROUP_PACKED_AVX512(VFMSUB, mb, 0) FMA3GROUP_PACKED_AVX512(VFMSUBADD, mb, 0) FMA3GROUP_PACKED_AVX512(VFNMADD, mb, 0) FMA3GROUP_PACKED_AVX512(VFNMSUB, mb, 0) }; static const X86InstrFMA3Group RoundGroups[] = { FMA3GROUP_PACKED_AVX512_ROUND(VFMADD, rb, 0) FMA3GROUP_SCALAR_AVX512_ROUND(VFMADD, rb, X86InstrFMA3Group::Intrinsic) FMA3GROUP_PACKED_AVX512_ROUND(VFMADDSUB, rb, 0) FMA3GROUP_PACKED_AVX512_ROUND(VFMSUB, rb, 0) FMA3GROUP_SCALAR_AVX512_ROUND(VFMSUB, rb, X86InstrFMA3Group::Intrinsic) FMA3GROUP_PACKED_AVX512_ROUND(VFMSUBADD, rb, 0) FMA3GROUP_PACKED_AVX512_ROUND(VFNMADD, rb, 0) FMA3GROUP_SCALAR_AVX512_ROUND(VFNMADD, rb, X86InstrFMA3Group::Intrinsic) FMA3GROUP_PACKED_AVX512_ROUND(VFNMSUB, rb, 0) FMA3GROUP_SCALAR_AVX512_ROUND(VFNMSUB, rb, X86InstrFMA3Group::Intrinsic) }; static void verifyTables() { #ifndef NDEBUG static std::atomic<bool> TableChecked(false); if (!TableChecked.load(std::memory_order_relaxed)) { assert(llvm::is_sorted(Groups) && llvm::is_sorted(RoundGroups) && llvm::is_sorted(BroadcastGroups) && "FMA3 tables not sorted!"); TableChecked.store(true, std::memory_order_relaxed); } #endif } /// Returns a reference to a group of FMA3 opcodes to where the given /// \p Opcode is included. If the given \p Opcode is not recognized as FMA3 /// and not included into any FMA3 group, then nullptr is returned. const X86InstrFMA3Group *llvm::getFMA3Group(unsigned Opcode, uint64_t TSFlags) { // FMA3 instructions have a well defined encoding pattern we can exploit. uint8_t BaseOpcode = X86II::getBaseOpcodeFor(TSFlags); bool IsFMA3 = ((TSFlags & X86II::EncodingMask) == X86II::VEX || (TSFlags & X86II::EncodingMask) == X86II::EVEX) && (TSFlags & X86II::OpMapMask) == X86II::T8 && (TSFlags & X86II::OpPrefixMask) == X86II::PD && ((BaseOpcode >= 0x96 && BaseOpcode <= 0x9F) || (BaseOpcode >= 0xA6 && BaseOpcode <= 0xAF) || (BaseOpcode >= 0xB6 && BaseOpcode <= 0xBF)); if (!IsFMA3) return nullptr; verifyTables(); ArrayRef<X86InstrFMA3Group> Table; if (TSFlags & X86II::EVEX_RC) Table = makeArrayRef(RoundGroups); else if (TSFlags & X86II::EVEX_B) Table = makeArrayRef(BroadcastGroups); else Table = makeArrayRef(Groups); // FMA 132 instructions have an opcode of 0x96-0x9F // FMA 213 instructions have an opcode of 0xA6-0xAF // FMA 231 instructions have an opcode of 0xB6-0xBF unsigned FormIndex = ((BaseOpcode - 0x90) >> 4) & 0x3; auto I = partition_point(Table, [=](const X86InstrFMA3Group &Group) { return Group.Opcodes[FormIndex] < Opcode; }); assert(I != Table.end() && I->Opcodes[FormIndex] == Opcode && "Couldn't find FMA3 opcode!"); return I; }
Upload File
Create Folder