003 File Manager
Current Path:
/usr/src/contrib/llvm-project/llvm/lib/Target/ARM
usr
/
src
/
contrib
/
llvm-project
/
llvm
/
lib
/
Target
/
ARM
/
📁
..
📄
A15SDOptimizer.cpp
(24.01 KB)
📄
ARM.h
(2.78 KB)
📄
ARM.td
(73.6 KB)
📄
ARMAsmPrinter.cpp
(80.17 KB)
📄
ARMAsmPrinter.h
(5.74 KB)
📄
ARMBaseInstrInfo.cpp
(209.03 KB)
📄
ARMBaseInstrInfo.h
(36.07 KB)
📄
ARMBaseRegisterInfo.cpp
(34.2 KB)
📄
ARMBaseRegisterInfo.h
(7.84 KB)
📄
ARMBasicBlockInfo.cpp
(5.18 KB)
📄
ARMBasicBlockInfo.h
(5.25 KB)
📄
ARMCallLowering.cpp
(19.74 KB)
📄
ARMCallLowering.h
(1.89 KB)
📄
ARMCallingConv.cpp
(11.8 KB)
📄
ARMCallingConv.h
(2.43 KB)
📄
ARMCallingConv.td
(14.63 KB)
📄
ARMConstantIslandPass.cpp
(90.84 KB)
📄
ARMConstantPoolValue.cpp
(11.53 KB)
📄
ARMConstantPoolValue.h
(10.1 KB)
📄
ARMExpandPseudoInsts.cpp
(115.56 KB)
📄
ARMFastISel.cpp
(106.14 KB)
📄
ARMFeatures.h
(2.48 KB)
📄
ARMFrameLowering.cpp
(102.32 KB)
📄
ARMFrameLowering.h
(4.02 KB)
📄
ARMHazardRecognizer.cpp
(3.41 KB)
📄
ARMHazardRecognizer.h
(1.54 KB)
📄
ARMISelDAGToDAG.cpp
(206.42 KB)
📄
ARMISelLowering.cpp
(728.6 KB)
📄
ARMISelLowering.h
(38.98 KB)
📄
ARMInstrCDE.td
(24.04 KB)
📄
ARMInstrFormats.td
(93.92 KB)
📄
ARMInstrInfo.cpp
(4.2 KB)
📄
ARMInstrInfo.h
(1.49 KB)
📄
ARMInstrInfo.td
(243.51 KB)
📄
ARMInstrMVE.td
(299.67 KB)
📄
ARMInstrNEON.td
(436.25 KB)
📄
ARMInstrThumb.td
(65.92 KB)
📄
ARMInstrThumb2.td
(211.06 KB)
📄
ARMInstrVFP.td
(110.46 KB)
📄
ARMInstructionSelector.cpp
(39.12 KB)
📄
ARMLegalizerInfo.cpp
(18.8 KB)
📄
ARMLegalizerInfo.h
(2.41 KB)
📄
ARMLoadStoreOptimizer.cpp
(94.44 KB)
📄
ARMLowOverheadLoops.cpp
(60.28 KB)
📄
ARMMCInstLower.cpp
(7.2 KB)
📄
ARMMachineFunctionInfo.cpp
(821 B)
📄
ARMMachineFunctionInfo.h
(9.68 KB)
📄
ARMMacroFusion.cpp
(2.36 KB)
📄
ARMMacroFusion.h
(966 B)
📄
ARMOptimizeBarriersPass.cpp
(3.43 KB)
📄
ARMParallelDSP.cpp
(26.82 KB)
📄
ARMPerfectShuffle.h
(382.02 KB)
📄
ARMPredicates.td
(14.16 KB)
📄
ARMRegisterBankInfo.cpp
(18.18 KB)
📄
ARMRegisterBankInfo.h
(1.41 KB)
📄
ARMRegisterBanks.td
(577 B)
📄
ARMRegisterInfo.cpp
(685 B)
📄
ARMRegisterInfo.h
(845 B)
📄
ARMRegisterInfo.td
(24.53 KB)
📄
ARMSchedule.td
(15.13 KB)
📄
ARMScheduleA57.td
(62.61 KB)
📄
ARMScheduleA57WriteRes.td
(11.43 KB)
📄
ARMScheduleA8.td
(49.59 KB)
📄
ARMScheduleA9.td
(130.35 KB)
📄
ARMScheduleM4.td
(4.77 KB)
📄
ARMScheduleR52.td
(44.27 KB)
📄
ARMScheduleSwift.td
(50.53 KB)
📄
ARMScheduleV6.td
(12.34 KB)
📄
ARMSelectionDAGInfo.cpp
(9.21 KB)
📄
ARMSelectionDAGInfo.h
(2.81 KB)
📄
ARMSubtarget.cpp
(16.73 KB)
📄
ARMSubtarget.h
(31.56 KB)
📄
ARMSystemRegister.td
(5.42 KB)
📄
ARMTargetMachine.cpp
(19.74 KB)
📄
ARMTargetMachine.h
(3.48 KB)
📄
ARMTargetObjectFile.cpp
(3.75 KB)
📄
ARMTargetObjectFile.h
(1.67 KB)
📄
ARMTargetTransformInfo.cpp
(63.49 KB)
📄
ARMTargetTransformInfo.h
(10.22 KB)
📁
AsmParser
📁
Disassembler
📁
MCTargetDesc
📄
MLxExpansionPass.cpp
(11.56 KB)
📄
MVEGatherScatterLowering.cpp
(40.3 KB)
📄
MVETailPredication.cpp
(23.2 KB)
📄
MVEVPTBlockPass.cpp
(10.77 KB)
📄
MVEVPTOptimisationsPass.cpp
(16.46 KB)
📁
TargetInfo
📄
Thumb1FrameLowering.cpp
(39.45 KB)
📄
Thumb1FrameLowering.h
(3.48 KB)
📄
Thumb1InstrInfo.cpp
(5.73 KB)
📄
Thumb1InstrInfo.h
(2.38 KB)
📄
Thumb2ITBlockPass.cpp
(9.09 KB)
📄
Thumb2InstrInfo.cpp
(26.43 KB)
📄
Thumb2InstrInfo.h
(3.75 KB)
📄
Thumb2SizeReduction.cpp
(40.25 KB)
📄
ThumbRegisterInfo.cpp
(21.75 KB)
📄
ThumbRegisterInfo.h
(2.44 KB)
📁
Utils
Editing: MVEVPTBlockPass.cpp
//===-- MVEVPTBlockPass.cpp - Insert MVE VPT blocks -----------------------===// // // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. // See https://llvm.org/LICENSE.txt for license information. // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception // //===----------------------------------------------------------------------===// #include "ARM.h" #include "ARMMachineFunctionInfo.h" #include "ARMSubtarget.h" #include "MCTargetDesc/ARMBaseInfo.h" #include "Thumb2InstrInfo.h" #include "llvm/ADT/SmallSet.h" #include "llvm/ADT/SmallVector.h" #include "llvm/ADT/Statistic.h" #include "llvm/ADT/StringRef.h" #include "llvm/CodeGen/MachineBasicBlock.h" #include "llvm/CodeGen/MachineFunction.h" #include "llvm/CodeGen/MachineFunctionPass.h" #include "llvm/CodeGen/MachineInstr.h" #include "llvm/CodeGen/MachineInstrBuilder.h" #include "llvm/CodeGen/MachineInstrBundle.h" #include "llvm/CodeGen/MachineOperand.h" #include "llvm/IR/DebugLoc.h" #include "llvm/MC/MCInstrDesc.h" #include "llvm/MC/MCRegisterInfo.h" #include "llvm/Support/Debug.h" #include <cassert> #include <new> using namespace llvm; #define DEBUG_TYPE "arm-mve-vpt" namespace { class MVEVPTBlock : public MachineFunctionPass { public: static char ID; const Thumb2InstrInfo *TII; const TargetRegisterInfo *TRI; MVEVPTBlock() : MachineFunctionPass(ID) {} bool runOnMachineFunction(MachineFunction &Fn) override; MachineFunctionProperties getRequiredProperties() const override { return MachineFunctionProperties().set( MachineFunctionProperties::Property::NoVRegs); } StringRef getPassName() const override { return "MVE VPT block insertion pass"; } private: bool InsertVPTBlocks(MachineBasicBlock &MBB); }; char MVEVPTBlock::ID = 0; } // end anonymous namespace INITIALIZE_PASS(MVEVPTBlock, DEBUG_TYPE, "ARM MVE VPT block pass", false, false) static MachineInstr *findVCMPToFoldIntoVPST(MachineBasicBlock::iterator MI, const TargetRegisterInfo *TRI, unsigned &NewOpcode) { // Search backwards to the instruction that defines VPR. This may or not // be a VCMP, we check that after this loop. If we find another instruction // that reads cpsr, we return nullptr. MachineBasicBlock::iterator CmpMI = MI; while (CmpMI != MI->getParent()->begin()) { --CmpMI; if (CmpMI->modifiesRegister(ARM::VPR, TRI)) break; if (CmpMI->readsRegister(ARM::VPR, TRI)) break; } if (CmpMI == MI) return nullptr; NewOpcode = VCMPOpcodeToVPT(CmpMI->getOpcode()); if (NewOpcode == 0) return nullptr; // Search forward from CmpMI to MI, checking if either register was def'd if (registerDefinedBetween(CmpMI->getOperand(1).getReg(), std::next(CmpMI), MI, TRI)) return nullptr; if (registerDefinedBetween(CmpMI->getOperand(2).getReg(), std::next(CmpMI), MI, TRI)) return nullptr; return &*CmpMI; } // Advances Iter past a block of predicated instructions. // Returns true if it successfully skipped the whole block of predicated // instructions. Returns false when it stopped early (due to MaxSteps), or if // Iter didn't point to a predicated instruction. static bool StepOverPredicatedInstrs(MachineBasicBlock::instr_iterator &Iter, MachineBasicBlock::instr_iterator EndIter, unsigned MaxSteps, unsigned &NumInstrsSteppedOver) { ARMVCC::VPTCodes NextPred = ARMVCC::None; Register PredReg; NumInstrsSteppedOver = 0; while (Iter != EndIter) { NextPred = getVPTInstrPredicate(*Iter, PredReg); assert(NextPred != ARMVCC::Else && "VPT block pass does not expect Else preds"); if (NextPred == ARMVCC::None || MaxSteps == 0) break; --MaxSteps; ++Iter; ++NumInstrsSteppedOver; }; return NumInstrsSteppedOver != 0 && (NextPred == ARMVCC::None || Iter == EndIter); } // Returns true if at least one instruction in the range [Iter, End) defines // or kills VPR. static bool IsVPRDefinedOrKilledByBlock(MachineBasicBlock::iterator Iter, MachineBasicBlock::iterator End) { for (; Iter != End; ++Iter) if (Iter->definesRegister(ARM::VPR) || Iter->killsRegister(ARM::VPR)) return true; return false; } // Creates a T, TT, TTT or TTTT BlockMask depending on BlockSize. static ARM::PredBlockMask GetInitialBlockMask(unsigned BlockSize) { switch (BlockSize) { case 1: return ARM::PredBlockMask::T; case 2: return ARM::PredBlockMask::TT; case 3: return ARM::PredBlockMask::TTT; case 4: return ARM::PredBlockMask::TTTT; default: llvm_unreachable("Invalid BlockSize!"); } } // Given an iterator (Iter) that points at an instruction with a "Then" // predicate, tries to create the largest block of continuous predicated // instructions possible, and returns the VPT Block Mask of that block. // // This will try to perform some minor optimization in order to maximize the // size of the block. static ARM::PredBlockMask CreateVPTBlock(MachineBasicBlock::instr_iterator &Iter, MachineBasicBlock::instr_iterator EndIter, SmallVectorImpl<MachineInstr *> &DeadInstructions) { MachineBasicBlock::instr_iterator BlockBeg = Iter; (void)BlockBeg; assert(getVPTInstrPredicate(*Iter) == ARMVCC::Then && "Expected a Predicated Instruction"); LLVM_DEBUG(dbgs() << "VPT block created for: "; Iter->dump()); unsigned BlockSize; StepOverPredicatedInstrs(Iter, EndIter, 4, BlockSize); LLVM_DEBUG(for (MachineBasicBlock::instr_iterator AddedInstIter = std::next(BlockBeg); AddedInstIter != Iter; ++AddedInstIter) { dbgs() << " adding: "; AddedInstIter->dump(); }); // Generate the initial BlockMask ARM::PredBlockMask BlockMask = GetInitialBlockMask(BlockSize); // Remove VPNOTs while there's still room in the block, so we can make the // largest block possible. ARMVCC::VPTCodes CurrentPredicate = ARMVCC::Else; while (BlockSize < 4 && Iter != EndIter && Iter->getOpcode() == ARM::MVE_VPNOT) { // Try to skip all of the predicated instructions after the VPNOT, stopping // after (4 - BlockSize). If we can't skip them all, stop. unsigned ElseInstCnt = 0; MachineBasicBlock::instr_iterator VPNOTBlockEndIter = std::next(Iter); if (!StepOverPredicatedInstrs(VPNOTBlockEndIter, EndIter, (4 - BlockSize), ElseInstCnt)) break; // Check if this VPNOT can be removed or not: It can only be removed if at // least one of the predicated instruction that follows it kills or sets // VPR. if (!IsVPRDefinedOrKilledByBlock(Iter, VPNOTBlockEndIter)) break; LLVM_DEBUG(dbgs() << " removing VPNOT: "; Iter->dump();); // Record the new size of the block BlockSize += ElseInstCnt; assert(BlockSize <= 4 && "Block is too large!"); // Record the VPNot to remove it later. DeadInstructions.push_back(&*Iter); ++Iter; // Replace the predicates of the instructions we're adding. // Note that we are using "Iter" to iterate over the block so we can update // it at the same time. for (; Iter != VPNOTBlockEndIter; ++Iter) { // Find the register in which the predicate is int OpIdx = findFirstVPTPredOperandIdx(*Iter); assert(OpIdx != -1); // Change the predicate and update the mask Iter->getOperand(OpIdx).setImm(CurrentPredicate); BlockMask = expandPredBlockMask(BlockMask, CurrentPredicate); LLVM_DEBUG(dbgs() << " adding : "; Iter->dump()); } CurrentPredicate = (CurrentPredicate == ARMVCC::Then ? ARMVCC::Else : ARMVCC::Then); } return BlockMask; } bool MVEVPTBlock::InsertVPTBlocks(MachineBasicBlock &Block) { bool Modified = false; MachineBasicBlock::instr_iterator MBIter = Block.instr_begin(); MachineBasicBlock::instr_iterator EndIter = Block.instr_end(); SmallVector<MachineInstr *, 4> DeadInstructions; while (MBIter != EndIter) { MachineInstr *MI = &*MBIter; Register PredReg; DebugLoc DL = MI->getDebugLoc(); ARMVCC::VPTCodes Pred = getVPTInstrPredicate(*MI, PredReg); // The idea of the predicate is that None, Then and Else are for use when // handling assembly language: they correspond to the three possible // suffixes "", "t" and "e" on the mnemonic. So when instructions are read // from assembly source or disassembled from object code, you expect to // see a mixture whenever there's a long VPT block. But in code // generation, we hope we'll never generate an Else as input to this pass. assert(Pred != ARMVCC::Else && "VPT block pass does not expect Else preds"); if (Pred == ARMVCC::None) { ++MBIter; continue; } ARM::PredBlockMask BlockMask = CreateVPTBlock(MBIter, EndIter, DeadInstructions); // Search back for a VCMP that can be folded to create a VPT, or else // create a VPST directly MachineInstrBuilder MIBuilder; unsigned NewOpcode; LLVM_DEBUG(dbgs() << " final block mask: " << (unsigned)BlockMask << "\n"); if (MachineInstr *VCMP = findVCMPToFoldIntoVPST(MI, TRI, NewOpcode)) { LLVM_DEBUG(dbgs() << " folding VCMP into VPST: "; VCMP->dump()); MIBuilder = BuildMI(Block, MI, DL, TII->get(NewOpcode)); MIBuilder.addImm((uint64_t)BlockMask); MIBuilder.add(VCMP->getOperand(1)); MIBuilder.add(VCMP->getOperand(2)); MIBuilder.add(VCMP->getOperand(3)); VCMP->eraseFromParent(); } else { MIBuilder = BuildMI(Block, MI, DL, TII->get(ARM::MVE_VPST)); MIBuilder.addImm((uint64_t)BlockMask); } finalizeBundle( Block, MachineBasicBlock::instr_iterator(MIBuilder.getInstr()), MBIter); Modified = true; } // Erase all dead instructions for (MachineInstr *DeadMI : DeadInstructions) { if (DeadMI->isInsideBundle()) DeadMI->eraseFromBundle(); else DeadMI->eraseFromParent(); } return Modified; } bool MVEVPTBlock::runOnMachineFunction(MachineFunction &Fn) { const ARMSubtarget &STI = static_cast<const ARMSubtarget &>(Fn.getSubtarget()); if (!STI.isThumb2() || !STI.hasMVEIntegerOps()) return false; TII = static_cast<const Thumb2InstrInfo *>(STI.getInstrInfo()); TRI = STI.getRegisterInfo(); LLVM_DEBUG(dbgs() << "********** ARM MVE VPT BLOCKS **********\n" << "********** Function: " << Fn.getName() << '\n'); bool Modified = false; for (MachineBasicBlock &MBB : Fn) Modified |= InsertVPTBlocks(MBB); LLVM_DEBUG(dbgs() << "**************************************\n"); return Modified; } /// createMVEVPTBlock - Returns an instance of the MVE VPT block /// insertion pass. FunctionPass *llvm::createMVEVPTBlockPass() { return new MVEVPTBlock(); }
Upload File
Create Folder