43#define DEBUG_TYPE "si-insert-hard-clauses"
47 cl::desc(
"Maximum number of memory instructions to "
48 "place in the same hard clause"),
65 HARDCLAUSE_MIMG_STORE,
66 HARDCLAUSE_MIMG_ATOMIC,
67 HARDCLAUSE_MIMG_SAMPLE,
70 HARDCLAUSE_VMEM_STORE,
71 HARDCLAUSE_VMEM_ATOMIC,
74 HARDCLAUSE_FLAT_STORE,
75 HARDCLAUSE_FLAT_ATOMIC,
87 LAST_REAL_HARDCLAUSE_TYPE = HARDCLAUSE_VALU,
99class SIInsertHardClauses {
101 const GCNSubtarget *ST =
nullptr;
103 HardClauseType getHardClauseType(
const MachineInstr &
MI) {
104 if (
MI.mayLoad() || (
MI.mayStore() && ST->shouldClusterStores())) {
105 if (ST->getGeneration() == AMDGPUSubtarget::GFX10 ||
106 ST->hasGFX1250Insts()) {
109 if (ST->hasNSAClauseBug()) {
111 if (
Info &&
Info->MIMGEncoding == AMDGPU::MIMGEncGfx10NSA)
112 return HARDCLAUSE_ILLEGAL;
114 return HARDCLAUSE_VMEM;
117 return HARDCLAUSE_FLAT;
121 const AMDGPU::MIMGBaseOpcodeInfo *BaseInfo =
124 return HARDCLAUSE_BVH;
126 return HARDCLAUSE_MIMG_SAMPLE;
127 return MI.mayLoad() ?
MI.mayStore() ? HARDCLAUSE_MIMG_ATOMIC
128 : HARDCLAUSE_MIMG_LOAD
129 : HARDCLAUSE_MIMG_STORE;
133 return MI.mayLoad() ?
MI.mayStore() ? HARDCLAUSE_VMEM_ATOMIC
134 : HARDCLAUSE_VMEM_LOAD
135 : HARDCLAUSE_VMEM_STORE;
138 return MI.mayLoad() ?
MI.mayStore() ? HARDCLAUSE_FLAT_ATOMIC
139 : HARDCLAUSE_FLAT_LOAD
140 : HARDCLAUSE_FLAT_STORE;
145 return HARDCLAUSE_SMEM;
152 if (
MI.getOpcode() == AMDGPU::S_NOP)
153 return HARDCLAUSE_INTERNAL;
154 if (
MI.isMetaInstruction())
155 return HARDCLAUSE_IGNORE;
156 return HARDCLAUSE_ILLEGAL;
162 HardClauseType Type = HARDCLAUSE_ILLEGAL;
164 MachineInstr *First =
nullptr;
166 MachineInstr *Last =
nullptr;
173 unsigned TrailingInternalLength = 0;
178 bool emitClause(
const ClauseInfo &CI,
const SIInstrInfo *SII) {
179 if (CI.First == CI.Last)
181 assert(CI.Length <= ST->maxHardClauseLength() &&
182 "Hard clause is too long!");
184 auto &
MBB = *CI.First->getParent();
189 std::next(CI.Last->getIterator()));
193 bool run(MachineFunction &MF) {
195 if (!ST->hasHardClauses())
199 "amdgpu-hard-clause-length-limit", 255);
202 MaxClauseLength = std::min(MaxClauseLength, ST->maxHardClauseLength());
203 if (MaxClauseLength <= 1)
206 const SIInstrInfo *SII = ST->getInstrInfo();
207 const TargetRegisterInfo *
TRI = ST->getRegisterInfo();
210 for (
auto &
MBB : MF) {
212 for (
auto &
MI :
MBB) {
213 HardClauseType
Type = getHardClauseType(
MI);
219 if (
Type <= LAST_REAL_HARDCLAUSE_TYPE) {
224 Type = HARDCLAUSE_ILLEGAL;
228 if (CI.Length == MaxClauseLength ||
229 (CI.Length &&
Type != HARDCLAUSE_INTERNAL &&
230 Type != HARDCLAUSE_IGNORE &&
242 Changed |= emitClause(CI, SII);
248 if (
Type != HARDCLAUSE_IGNORE) {
249 if (
Type == HARDCLAUSE_INTERNAL) {
250 ++CI.TrailingInternalLength;
253 CI.Length += CI.TrailingInternalLength;
254 CI.TrailingInternalLength = 0;
256 CI.BaseOps = std::move(BaseOps);
259 }
else if (
Type <= LAST_REAL_HARDCLAUSE_TYPE) {
261 CI = ClauseInfo{
Type, &
MI, &
MI, 1, 0, std::move(BaseOps)};
267 Changed |= emitClause(CI, SII);
277 SIInsertHardClausesLegacy() : MachineFunctionPass(ID) {}
279 bool runOnMachineFunction(MachineFunction &MF)
override {
283 return SIInsertHardClauses().run(MF);
286 void getAnalysisUsage(AnalysisUsage &AU)
const override {
297 if (!SIInsertHardClauses().
run(MF))
305char SIInsertHardClausesLegacy::ID = 0;
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
Provides AMDGPU specific target descriptions.
Analysis containing CSE Info
AMD GCN specific subclass of TargetSubtarget.
Register const TargetRegisterInfo * TRI
#define INITIALIZE_PASS(passName, arg, name, cfg, analysis)
static cl::opt< unsigned > HardClauseLengthLimit("amdgpu-hard-clause-length-limit", cl::desc("Maximum number of memory instructions to " "place in the same hard clause"), cl::Hidden)
This file defines the SmallVector class.
LLVM_ABI void setPreservesCFG()
This function should be called by the pass, iff they do not:
Represents analyses that only rely on functions' control flow.
uint64_t getFnAttributeAsParsedInteger(StringRef Kind, uint64_t Default=0) const
For a string attribute Kind, parse attribute as an integer.
static LocationSize precise(uint64_t Value)
MachineFunctionPass - This class adapts the FunctionPass interface to allow convenient creation of pa...
void getAnalysisUsage(AnalysisUsage &AU) const override
getAnalysisUsage - Subclasses that override getAnalysisUsage must call this.
const TargetSubtargetInfo & getSubtarget() const
getSubtarget - Return the subtarget for which this machine code is being compiled.
Function & getFunction()
Return the LLVM function that this machine code represents.
const MachineInstrBuilder & addImm(int64_t Val) const
Add a new immediate operand.
A set of analyses that are preserved following a run of a transformation pass.
static PreservedAnalyses all()
Construct a special preserved set that preserves all passes.
PreservedAnalyses run(MachineFunction &MF, MachineFunctionAnalysisManager &MFAM)
static bool isVMEM(const MachineInstr &MI)
bool getMemOperandsWithOffsetWidth(const MachineInstr &LdSt, SmallVectorImpl< const MachineOperand * > &BaseOps, int64_t &Offset, bool &OffsetIsScalable, LocationSize &Width, const TargetRegisterInfo *TRI) const final
static bool isSMRD(const MachineInstr &MI)
bool shouldClusterMemOps(ArrayRef< const MachineOperand * > BaseOps1, int64_t Offset1, bool OffsetIsScalable1, ArrayRef< const MachineOperand * > BaseOps2, int64_t Offset2, bool OffsetIsScalable2, unsigned ClusterSize, unsigned NumBytes) const override
static bool isSegmentSpecificFLAT(const MachineInstr &MI)
static bool isMIMG(const MachineInstr &MI)
static bool isFLAT(const MachineInstr &MI)
self_iterator getIterator()
LLVM_READONLY const MIMGInfo * getMIMGInfo(unsigned Opc)
LLVM_READONLY const MIMGBaseOpcodeInfo * getMIMGBaseOpcodeInfo(unsigned BaseOpcode)
PointerTypeMap run(const Module &M)
Compute the PointerTypeMap for the module M.
This is an optimization pass for GlobalISel generic memory operations.
LLVM_ABI void finalizeBundle(MachineBasicBlock &MBB, MachineBasicBlock::instr_iterator FirstMI, MachineBasicBlock::instr_iterator LastMI)
finalizeBundle - Finalize a machine instruction bundle which includes a sequence of instructions star...
MachineInstrBuilder BuildMI(MachineFunction &MF, const MIMetadata &MIMD, const MCInstrDesc &MCID)
Builder interface. Specify how to create the initial instruction itself.
AnalysisManager< MachineFunction > MachineFunctionAnalysisManager
LLVM_ABI PreservedAnalyses getMachineFunctionPassPreservedAnalyses()
Returns the minimum set of Analyses that all machine function passes must preserve.
class LLVM_GSL_OWNER SmallVector
Forward declaration of SmallVector so that calculateSmallVectorDefaultInlinedElements can reference s...
char & SIInsertHardClausesID