//===-- AMDGPUGlobalISelDivergenceLowering.cpp ----------------------------===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
//
/// \file
/// GlobalISel pass that selects divergent i1 phis as lane mask phis.
/// Lane mask merging uses the same algorithm as SDAG in SILowerI1Copies.
/// Handles all cases of temporal divergence.
/// For divergent non-phi i1 and uniform i1 uses outside of the cycle, this
/// pass currently depends on LCSSA to insert phis with a single incoming
/// value.
//
//===----------------------------------------------------------------------===//
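
// Sketch of temporal divergence (illustrative MIR-like pseudocode, not taken
// from an actual test):
//
//   bb.loop:
//     %v:_(s32) = ...           ; defined inside the loop
//     ...                       ; divergent loop exit
//   bb.exit:
//     %u:_(s32) = G_ADD %v, ... ; %v used outside the loop
//
// With a divergent exit, lanes leave the loop in different iterations, so
// each lane must observe the value %v had in the iteration in which that lane
// exited; see lowerTemporalDivergence and lowerTemporalDivergenceI1 below.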

#include "AMDGPU.h"
#include "AMDGPUGlobalISelUtils.h"
#include "SILowerI1Copies.h"
#include "llvm/CodeGen/GlobalISel/MachineIRBuilder.h"
#include "llvm/CodeGen/MachineSSAUpdater.h"
#include "llvm/CodeGen/MachineUniformityAnalysis.h"
#include "llvm/InitializePasses.h"

#define DEBUG_TYPE "amdgpu-global-isel-divergence-lowering"

using namespace llvm;

namespace {

class AMDGPUGlobalISelDivergenceLowering : public MachineFunctionPass {
public:
  static char ID;

  AMDGPUGlobalISelDivergenceLowering() : MachineFunctionPass(ID) {}

  bool runOnMachineFunction(MachineFunction &MF) override;

  StringRef getPassName() const override {
    return "AMDGPU GlobalISel divergence lowering";
  }

  void getAnalysisUsage(AnalysisUsage &AU) const override {
    AU.setPreservesCFG();
    AU.addRequired<MachineDominatorTreeWrapperPass>();
    AU.addRequired<MachinePostDominatorTreeWrapperPass>();
    AU.addRequired<MachineUniformityAnalysisPass>();
    MachineFunctionPass::getAnalysisUsage(AU);
  }
};

class DivergenceLoweringHelper : public PhiLoweringHelper {
public:
  DivergenceLoweringHelper(MachineFunction *MF, MachineDominatorTree *DT,
                           MachinePostDominatorTree *PDT,
                           MachineUniformityInfo *MUI);

private:
  MachineUniformityInfo *MUI = nullptr;
  MachineIRBuilder B;

  Register buildRegCopyToLaneMask(Register Reg);

public:
  void markAsLaneMask(Register DstReg) const override;
  void getCandidatesForLowering(
      SmallVectorImpl<MachineInstr *> &Vreg1Phis) const override;
  void collectIncomingValuesFromPhi(
      const MachineInstr *MI,
      SmallVectorImpl<Incoming> &Incomings) const override;
  void replaceDstReg(Register NewReg, Register OldReg,
                     MachineBasicBlock *MBB) override;
  void buildMergeLaneMasks(MachineBasicBlock &MBB,
                           MachineBasicBlock::iterator I, const DebugLoc &DL,
                           Register DstReg, Register PrevReg,
                           Register CurReg) override;
  void constrainAsLaneMask(Incoming &In) override;

  bool lowerTemporalDivergence();
  bool lowerTemporalDivergenceI1();
};

DivergenceLoweringHelper::DivergenceLoweringHelper(
    MachineFunction *MF, MachineDominatorTree *DT,
    MachinePostDominatorTree *PDT, MachineUniformityInfo *MUI)
    : PhiLoweringHelper(MF, DT, PDT), MUI(MUI), B(*MF) {}

// _(s1) -> SReg_32/64(s1)
void DivergenceLoweringHelper::markAsLaneMask(Register DstReg) const {
  assert(MRI->getType(DstReg) == LLT::scalar(1));

  if (MRI->getRegClassOrNull(DstReg)) {
    if (MRI->constrainRegClass(DstReg, ST->getBoolRC()))
      return;
    llvm_unreachable("Failed to constrain register class");
  }

  MRI->setRegClass(DstReg, ST->getBoolRC());
}

void DivergenceLoweringHelper::getCandidatesForLowering(
    SmallVectorImpl<MachineInstr *> &Vreg1Phis) const {
  LLT S1 = LLT::scalar(1);

  // Add divergent i1 phis to the list.
  for (MachineBasicBlock &MBB : *MF) {
    for (MachineInstr &MI : MBB.phis()) {
      Register Dst = MI.getOperand(0).getReg();
      if (MRI->getType(Dst) == S1 && MUI->isDivergent(Dst))
        Vreg1Phis.push_back(&MI);
    }
  }
}

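// A phi reaching this pass has the MIR form
//   %dst:_(s1) = G_PHI %val0(s1), %bb.0, %val1(s1), %bb.1, ...
// i.e. operand 0 is the def and incoming (value, block) operand pairs follow,
// hence the stride-2 walk below.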
void DivergenceLoweringHelper::collectIncomingValuesFromPhi(
    const MachineInstr *MI, SmallVectorImpl<Incoming> &Incomings) const {
  for (unsigned i = 1; i < MI->getNumOperands(); i += 2) {
    Incomings.emplace_back(MI->getOperand(i).getReg(),
                           MI->getOperand(i + 1).getMBB(), Register());
  }
}

void DivergenceLoweringHelper::replaceDstReg(Register NewReg, Register OldReg,
                                             MachineBasicBlock *MBB) {
  BuildMI(*MBB, MBB->getFirstNonPHI(), {}, TII->get(AMDGPU::COPY), OldReg)
      .addReg(NewReg);
}

// Copy Reg to a new lane mask register, inserting the copy after the
// instruction that defines Reg, skipping phis if needed.
Register DivergenceLoweringHelper::buildRegCopyToLaneMask(Register Reg) {
  Register LaneMask = createLaneMaskReg(MRI, LaneMaskRegAttrs);
  MachineInstr *Instr = MRI->getVRegDef(Reg);
  MachineBasicBlock *MBB = Instr->getParent();
  B.setInsertPt(*MBB, MBB->SkipPHIsAndLabels(std::next(Instr->getIterator())));
  B.buildCopy(LaneMask, Reg);
  return LaneMask;
}

// bb.previous
// %PrevReg = ...
//
// bb.current
// %CurReg = ...
//
// %DstReg - not defined
//
// -> (wave32 example, new registers have sreg_32 reg class and S1 LLT)
//
// bb.previous
// %PrevReg = ...
// %PrevRegCopy:sreg_32(s1) = COPY %PrevReg
//
// bb.current
// %CurReg = ...
// %CurRegCopy:sreg_32(s1) = COPY %CurReg
// ...
// %PrevMaskedReg:sreg_32(s1) = ANDN2 %PrevRegCopy, %ExecReg - active lanes
//                              set to 0
// %CurMaskedReg:sreg_32(s1) = AND %ExecReg, %CurRegCopy - inactive lanes set
//                             to 0
// %DstReg:sreg_32(s1) = OR %PrevMaskedReg, %CurMaskedReg
//
// DstReg: for active lanes, the bit from PrevReg is rewritten with the bit
// from CurReg.
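// Note: AndN2Op/AndOp/OrOp and ExecReg are set up by PhiLoweringHelper from
// the subtarget: S_ANDN2_B32/S_AND_B32/S_OR_B32 with $exec_lo on wave32, and
// the _B64 forms with $exec on wave64.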
void DivergenceLoweringHelper::buildMergeLaneMasks(
    MachineBasicBlock &MBB, MachineBasicBlock::iterator I, const DebugLoc &DL,
    Register DstReg, Register PrevReg, Register CurReg) {
  // DstReg = (PrevReg & !EXEC) | (CurReg & EXEC)
  // TODO: check if inputs are constants or results of a compare.

  Register PrevRegCopy = buildRegCopyToLaneMask(PrevReg);
  Register CurRegCopy = buildRegCopyToLaneMask(CurReg);
  Register PrevMaskedReg = createLaneMaskReg(MRI, LaneMaskRegAttrs);
  Register CurMaskedReg = createLaneMaskReg(MRI, LaneMaskRegAttrs);

  B.setInsertPt(MBB, I);
  B.buildInstr(AndN2Op, {PrevMaskedReg}, {PrevRegCopy, ExecReg});
  B.buildInstr(AndOp, {CurMaskedReg}, {ExecReg, CurRegCopy});
  B.buildInstr(OrOp, {DstReg}, {PrevMaskedReg, CurMaskedReg});
}

// GlobalISel has to constrain an S1 incoming value taken as-is with the lane
// mask register class. Insert a copy of Incoming.Reg to a new lane mask
// register inside Incoming.Block; Incoming.Reg becomes that new lane mask.
void DivergenceLoweringHelper::constrainAsLaneMask(Incoming &In) {
  B.setInsertPt(*In.Block, In.Block->getFirstTerminator());

  auto Copy = B.buildCopy(LLT::scalar(1), In.Reg);
  MRI->setRegClass(Copy.getReg(0), ST->getBoolRC());
  In.Reg = Copy.getReg(0);
}

void replaceUsesOfRegInInstWith(Register Reg, MachineInstr *Inst,
                                Register NewReg) {
  for (MachineOperand &Op : Inst->operands()) {
    if (Op.isReg() && Op.getReg() == Reg)
      Op.setReg(NewReg);
  }
}

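// Sketch of non-i1 temporal divergence lowering (illustrative MIR-like
// pseudocode, not taken from an actual test):
//
//   bb.loop:
//     %reg:_(s32) = ...
//     %vgpr:_(s32) = COPY %reg(s32), implicit $exec
//     ...                        ; divergent loop exit
//   bb.exit:
//     ... = G_ADD %vgpr, ...     ; was a use of %reg
//
// The copy to a VGPR with an implicit use of exec pins the value to the
// iteration in which each lane exited and keeps later passes from sinking it
// out of the loop.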
bool DivergenceLoweringHelper::lowerTemporalDivergence() {
  AMDGPU::IntrinsicLaneMaskAnalyzer ILMA(*MF);
  DenseMap<Register, Register> TDCache;

  for (auto [Reg, UseInst, _] : MUI->getTemporalDivergenceList()) {
    if (MRI->getType(Reg) == LLT::scalar(1) || MUI->isDivergent(Reg) ||
        ILMA.isS32S64LaneMask(Reg))
      continue;

    Register CachedTDCopy = TDCache.lookup(Reg);
    if (CachedTDCopy) {
      replaceUsesOfRegInInstWith(Reg, UseInst, CachedTDCopy);
      continue;
    }

    MachineInstr *Inst = MRI->getVRegDef(Reg);
    MachineBasicBlock *MBB = Inst->getParent();
    B.setInsertPt(*MBB, MBB->SkipPHIsAndLabels(std::next(Inst->getIterator())));

    Register VgprReg = MRI->createGenericVirtualRegister(MRI->getType(Reg));
    B.buildInstr(AMDGPU::COPY, {VgprReg}, {Reg})
        .addUse(ExecReg, RegState::Implicit);

    replaceUsesOfRegInInstWith(Reg, UseInst, VgprReg);
    TDCache[Reg] = VgprReg;
  }
  return false;
}

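// For i1 values the same problem is solved differently: lane masks live in
// scalar registers and are rewritten in every iteration, so instead of a
// plain copy the value is accumulated into a merged lane mask across the
// largest relevant cycle (buildMergeLaneMasks at the end of the def block,
// with phis placed by MachineSSAUpdater), and uses outside the cycle are
// rewritten to use the merged mask.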
bool DivergenceLoweringHelper::lowerTemporalDivergenceI1() {
  MachineRegisterInfo::VRegAttrs BoolS1 = {ST->getBoolRC(), LLT::scalar(1)};
  initializeLaneMaskRegisterAttributes(BoolS1);
  MachineSSAUpdater SSAUpdater(*MF);

  // In case of a use outside multiple nested cycles, or multiple uses, we
  // only need to merge the lane mask across the largest relevant cycle.
  DenseMap<Register, std::pair<const MachineCycle *, Register>> LRCCache;
  for (auto [Reg, UseInst, LRC] : MUI->getTemporalDivergenceList()) {
    if (MRI->getType(Reg) != LLT::scalar(1))
      continue;

    auto [LRCCacheIter, RegNotCached] = LRCCache.try_emplace(Reg);
    auto &CycleMergedMask = LRCCacheIter->getSecond();
    const MachineCycle *&CachedLRC = CycleMergedMask.first;
    if (RegNotCached || LRC->contains(CachedLRC)) {
      CachedLRC = LRC;
    }
  }

  for (auto &LRCCacheEntry : LRCCache) {
    Register Reg = LRCCacheEntry.first;
    auto &CycleMergedMask = LRCCacheEntry.getSecond();
    const MachineCycle *Cycle = CycleMergedMask.first;

    Register MergedMask = MRI->createVirtualRegister(BoolS1);
    SSAUpdater.Initialize(MergedMask);

    MachineBasicBlock *MBB = MRI->getVRegDef(Reg)->getParent();
    SSAUpdater.AddAvailableValue(MBB, MergedMask);

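    // No lane has exited the cycle yet on paths that enter it, so the merged
    // mask is undefined there: seed out-of-cycle predecessors of the cycle
    // entries with IMPLICIT_DEF.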
    for (auto Entry : Cycle->getEntries()) {
      for (MachineBasicBlock *Pred : Entry->predecessors()) {
        if (!Cycle->contains(Pred)) {
          B.setInsertPt(*Pred, Pred->getFirstTerminator());
          auto ImplDef = B.buildInstr(AMDGPU::IMPLICIT_DEF, {BoolS1}, {});
          SSAUpdater.AddAvailableValue(Pred, ImplDef.getReg(0));
        }
      }
    }

    buildMergeLaneMasks(*MBB, MBB->getFirstTerminator(), {}, MergedMask,
                        SSAUpdater.GetValueInMiddleOfBlock(MBB), Reg);

    CycleMergedMask.second = MergedMask;
  }

  for (auto [Reg, UseInst, Cycle] : MUI->getTemporalDivergenceList()) {
    if (MRI->getType(Reg) != LLT::scalar(1))
      continue;

    replaceUsesOfRegInInstWith(Reg, UseInst, LRCCache.lookup(Reg).second);
  }

  return false;
}

} // End anonymous namespace.

INITIALIZE_PASS_BEGIN(AMDGPUGlobalISelDivergenceLowering, DEBUG_TYPE,
                      "AMDGPU GlobalISel divergence lowering", false, false)
INITIALIZE_PASS_DEPENDENCY(MachineDominatorTreeWrapperPass)
INITIALIZE_PASS_DEPENDENCY(MachinePostDominatorTreeWrapperPass)
INITIALIZE_PASS_DEPENDENCY(MachineUniformityAnalysisPass)
INITIALIZE_PASS_END(AMDGPUGlobalISelDivergenceLowering, DEBUG_TYPE,
                    "AMDGPU GlobalISel divergence lowering", false, false)

char AMDGPUGlobalISelDivergenceLowering::ID = 0;

char &llvm::AMDGPUGlobalISelDivergenceLoweringID =
    AMDGPUGlobalISelDivergenceLowering::ID;

FunctionPass *llvm::createAMDGPUGlobalISelDivergenceLoweringPass() {
  return new AMDGPUGlobalISelDivergenceLowering();
}

bool AMDGPUGlobalISelDivergenceLowering::runOnMachineFunction(
    MachineFunction &MF) {
  MachineDominatorTree &DT =
      getAnalysis<MachineDominatorTreeWrapperPass>().getDomTree();
  MachinePostDominatorTree &PDT =
      getAnalysis<MachinePostDominatorTreeWrapperPass>().getPostDomTree();
  MachineUniformityInfo &MUI =
      getAnalysis<MachineUniformityAnalysisPass>().getUniformityInfo();

  DivergenceLoweringHelper Helper(&MF, &DT, &PDT, &MUI);

  bool Changed = false;
  // Temporal divergence lowering needs to inspect the list of instructions
  // used outside a cycle with a divergent exit, provided by the uniformity
  // analysis. Uniform instructions from that list require lowering, and no
  // instruction is deleted. It therefore has to run before lowerPhis, which
  // deletes the phis that require lowering and replaces them with new
  // instructions.

  // Non-i1 temporal divergence lowering.
  Changed |= Helper.lowerTemporalDivergence();
  // This covers both uniform and divergent i1s. Lane masks are in sgpr and
  // need to be updated in each iteration.
  Changed |= Helper.lowerTemporalDivergenceI1();
  // Temporal divergence lowering of divergent i1 phis used outside of the
  // cycle could also be handled by lowerPhis, but we do it in
  // lowerTemporalDivergenceI1 since in some cases lowerPhis does unnecessary
  // lane mask merging.
  Changed |= Helper.lowerPhis();
  return Changed;
}