LLVM 22.0.0git
ARMISelLowering.h
Go to the documentation of this file.
1//===- ARMISelLowering.h - ARM DAG Lowering Interface -----------*- C++ -*-===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8//
9// This file defines the interfaces that ARM uses to lower LLVM code into a
10// selection DAG.
11//
12//===----------------------------------------------------------------------===//
13
14#ifndef LLVM_LIB_TARGET_ARM_ARMISELLOWERING_H
15#define LLVM_LIB_TARGET_ARM_ARMISELLOWERING_H
16
19#include "llvm/ADT/StringRef.h"
27#include "llvm/IR/Attributes.h"
28#include "llvm/IR/CallingConv.h"
29#include "llvm/IR/Function.h"
30#include "llvm/IR/InlineAsm.h"
32#include <optional>
33#include <utility>
34
35namespace llvm {
36
37class ARMBaseTargetMachine;
38class ARMSubtarget;
39class DataLayout;
40class FastISel;
41class FunctionLoweringInfo;
42class GlobalValue;
43class InstrItineraryData;
44class Instruction;
45class IRBuilderBase;
46class MachineBasicBlock;
47class MachineInstr;
48class SelectionDAG;
49class TargetLibraryInfo;
50class TargetMachine;
51class TargetRegisterInfo;
52class VectorType;
53
54 namespace ARMISD {
55
56 // ARM Specific DAG Nodes
57 enum NodeType : unsigned {
58 // Start the numbering where the builtin ops and target ops leave off.
60
61 Wrapper, // Wrapper - A wrapper node for TargetConstantPool,
62 // TargetExternalSymbol, and TargetGlobalAddress.
63 WrapperPIC, // WrapperPIC - A wrapper node for TargetGlobalAddress in
64 // PIC mode.
65 WrapperJT, // WrapperJT - A wrapper node for TargetJumpTable
66
67 // Add pseudo op to model memcpy for struct byval.
69
70 CALL, // Function call.
71 CALL_PRED, // Function call that's predicable.
72 CALL_NOLINK, // Function call with branch not branch-and-link.
73 tSECALL, // CMSE non-secure function call.
74 t2CALL_BTI, // Thumb function call followed by BTI instruction.
75 BRCOND, // Conditional branch.
76 BR_JT, // Jumptable branch.
77 BR2_JT, // Jumptable branch (2 level - jumptable entry is a jump).
78 RET_GLUE, // Return with a flag operand.
79 SERET_GLUE, // CMSE Entry function return with a flag operand.
80 INTRET_GLUE, // Interrupt return with an LR-offset and a flag operand.
81
82 PIC_ADD, // Add with a PC operand and a PIC label.
83
84 ASRL, // MVE long arithmetic shift right.
85 LSRL, // MVE long shift right.
86 LSLL, // MVE long shift left.
87
88 CMP, // ARM compare instructions.
89 CMN, // ARM CMN instructions.
90 CMPZ, // ARM compare that sets only Z flag.
91 CMPFP, // ARM VFP compare instruction, sets FPSCR.
92 CMPFPE, // ARM VFP signalling compare instruction, sets FPSCR.
93 CMPFPw0, // ARM VFP compare against zero instruction, sets FPSCR.
94 CMPFPEw0, // ARM VFP signalling compare against zero instruction, sets
95 // FPSCR.
96 FMSTAT, // ARM fmstat instruction.
97
98 CMOV, // ARM conditional move instructions.
99
100 SSAT, // Signed saturation
101 USAT, // Unsigned saturation
102
104
105 LSLS, // Flag-setting shift left.
106 LSRS1, // Flag-setting logical shift right by one bit.
107 ASRS1, // Flag-setting arithmetic shift right by one bit.
108 RRX, // Shift right one bit with carry in.
109
110 ADDC, // Add with carry
111 ADDE, // Add using carry
112 SUBC, // Sub with carry
113 SUBE, // Sub using carry
114
115 VMOVRRD, // double to two gprs.
116 VMOVDRR, // Two gprs to double.
117 VMOVSR, // move gpr to single, used for f32 literal constructed in a gpr
118
119 EH_SJLJ_SETJMP, // SjLj exception handling setjmp.
120 EH_SJLJ_LONGJMP, // SjLj exception handling longjmp.
121 EH_SJLJ_SETUP_DISPATCH, // SjLj exception handling setup_dispatch.
122
123 TC_RETURN, // Tail call return pseudo.
124
126
127 DYN_ALLOC, // Dynamic allocation on the stack.
128
129 MEMBARRIER_MCR, // Memory barrier (MCR)
130
131 PRELOAD, // Preload
132
133 WIN__CHKSTK, // Windows' __chkstk call to do stack probing.
134 WIN__DBZCHK, // Windows' divide by zero check
135
136 WLS, // Low-overhead loops, While Loop Start branch. See t2WhileLoopStart
137 WLSSETUP, // Setup for the iteration count of a WLS. See t2WhileLoopSetup.
138 LOOP_DEC, // Really a part of LE, performs the sub
139 LE, // Low-overhead loops, Loop End
140
141 PREDICATE_CAST, // Predicate cast for MVE i1 types
142 VECTOR_REG_CAST, // Reinterpret the current contents of a vector register
143
144 MVESEXT, // Legalization aids for extending a vector into two/four vectors.
145 MVEZEXT, // or truncating two/four vectors into one. Eventually becomes
146 MVETRUNC, // stack store/load sequence, if not optimized to anything else.
147
148 VCMP, // Vector compare.
149 VCMPZ, // Vector compare to zero.
150 VTST, // Vector test bits.
151
152 // Vector shift by vector
153 VSHLs, // ...left/right by signed
154 VSHLu, // ...left/right by unsigned
155
156 // Vector shift by immediate:
157 VSHLIMM, // ...left
158 VSHRsIMM, // ...right (signed)
159 VSHRuIMM, // ...right (unsigned)
160
161 // Vector rounding shift by immediate:
162 VRSHRsIMM, // ...right (signed)
163 VRSHRuIMM, // ...right (unsigned)
164 VRSHRNIMM, // ...right narrow
165
166 // Vector saturating shift by immediate:
167 VQSHLsIMM, // ...left (signed)
168 VQSHLuIMM, // ...left (unsigned)
169 VQSHLsuIMM, // ...left (signed to unsigned)
170 VQSHRNsIMM, // ...right narrow (signed)
171 VQSHRNuIMM, // ...right narrow (unsigned)
172 VQSHRNsuIMM, // ...right narrow (signed to unsigned)
173
174 // Vector saturating rounding shift by immediate:
175 VQRSHRNsIMM, // ...right narrow (signed)
176 VQRSHRNuIMM, // ...right narrow (unsigned)
177 VQRSHRNsuIMM, // ...right narrow (signed to unsigned)
178
179 // Vector shift and insert:
180 VSLIIMM, // ...left
181 VSRIIMM, // ...right
182
183 // Vector get lane (VMOV scalar to ARM core register)
184 // (These are used for 8- and 16-bit element types only.)
185 VGETLANEu, // zero-extend vector extract element
186 VGETLANEs, // sign-extend vector extract element
187
188 // Vector move immediate and move negated immediate:
191
192 // Vector move f32 immediate:
194
195 // Move H <-> R, clearing top 16 bits
198
199 // Vector duplicate:
202
203 // Vector shuffles:
204 VEXT, // extract
205 VREV64, // reverse elements within 64-bit doublewords
206 VREV32, // reverse elements within 32-bit words
207 VREV16, // reverse elements within 16-bit halfwords
208 VZIP, // zip (interleave)
209 VUZP, // unzip (deinterleave)
210 VTRN, // transpose
211 VTBL1, // 1-register shuffle with mask
212 VTBL2, // 2-register shuffle with mask
213 VMOVN, // MVE vmovn
214
215 // MVE Saturating truncates
216 VQMOVNs, // Vector (V) Saturating (Q) Move and Narrow (N), signed (s)
217 VQMOVNu, // Vector (V) Saturating (Q) Move and Narrow (N), unsigned (u)
218
219 // MVE float <> half converts
220 VCVTN, // MVE vcvt f32 -> f16, truncating into either the bottom or top
221 // lanes
222 VCVTL, // MVE vcvt f16 -> f32, extending from either the bottom or top lanes
223
224 // MVE VIDUP instruction, taking a start value and increment.
226
227 // Vector multiply long:
228 VMULLs, // ...signed
229 VMULLu, // ...unsigned
230
231 VQDMULH, // MVE vqdmulh instruction
232
233 // MVE reductions
234 VADDVs, // sign- or zero-extend the elements of a vector to i32,
235 VADDVu, // add them all together, and return an i32 of their sum
236 VADDVps, // Same as VADDV[su] but with a v4i1 predicate mask
238 VADDLVs, // sign- or zero-extend elements to i64 and sum, returning
239 VADDLVu, // the low and high 32-bit halves of the sum
240 VADDLVAs, // Same as VADDLV[su] but also add an input accumulator
241 VADDLVAu, // provided as low and high halves
242 VADDLVps, // Same as VADDLV[su] but with a v4i1 predicate mask
244 VADDLVAps, // Same as VADDLVp[su] but with a v4i1 predicate mask
246 VMLAVs, // sign- or zero-extend the elements of two vectors to i32, multiply
247 VMLAVu, // them and add the results together, returning an i32 of the sum
248 VMLAVps, // Same as VMLAV[su] with a v4i1 predicate mask
250 VMLALVs, // Same as VMLAV but with i64, returning the low and
251 VMLALVu, // high 32-bit halves of the sum
252 VMLALVps, // Same as VMLALV[su] with a v4i1 predicate mask
254 VMLALVAs, // Same as VMLALV but also add an input accumulator
255 VMLALVAu, // provided as low and high halves
256 VMLALVAps, // Same as VMLALVA[su] with a v4i1 predicate mask
258 VMINVu, // Find minimum unsigned value of a vector and register
259 VMINVs, // Find minimum signed value of a vector and register
260 VMAXVu, // Find maximum unsigned value of a vector and register
261 VMAXVs, // Find maximum signed value of a vector and register
262
263 SMULWB, // Signed multiply word by half word, bottom
264 SMULWT, // Signed multiply word by half word, top
265 UMLAL, // 64bit Unsigned Accumulate Multiply
266 SMLAL, // 64bit Signed Accumulate Multiply
267 UMAAL, // 64-bit Unsigned Accumulate Accumulate Multiply
268 SMLALBB, // 64-bit signed accumulate multiply bottom, bottom 16
269 SMLALBT, // 64-bit signed accumulate multiply bottom, top 16
270 SMLALTB, // 64-bit signed accumulate multiply top, bottom 16
271 SMLALTT, // 64-bit signed accumulate multiply top, top 16
272 SMLALD, // Signed multiply accumulate long dual
273 SMLALDX, // Signed multiply accumulate long dual exchange
274 SMLSLD, // Signed multiply subtract long dual
275 SMLSLDX, // Signed multiply subtract long dual exchange
276 SMMLAR, // Signed multiply long, round and add
277 SMMLSR, // Signed multiply long, subtract and round
278
279 // Single Lane QADD8 and QADD16. Only the bottom lane. That's what the b
280 // stands for.
289
290 // Operands of the standard BUILD_VECTOR node are not legalized, which
291 // is fine if BUILD_VECTORs are always lowered to shuffles or other
292 // operations, but for ARM some BUILD_VECTORs are legal as-is and their
293 // operands need to be legalized. Define an ARM-specific version of
294 // BUILD_VECTOR for this purpose.
296
297 // Bit-field insert
299
300 // Vector OR with immediate
302 // Vector AND with NOT of immediate
304
305 // Pseudo vector bitwise select
307
308 // Pseudo-instruction representing a memory copy using ldm/stm
309 // instructions.
311
312 // Pseudo-instruction representing a memory copy using a tail predicated
313 // loop
315 // Pseudo-instruction representing a memset using a tail predicated
316 // loop
318
319 // V8.1MMainline condition select
320 CSINV, // Conditional select invert.
321 CSNEG, // Conditional select negate.
322 CSINC, // Conditional select increment.
323
324 // Vector load N-element structure to all lanes:
330
331 // NEON loads with post-increment base updates:
346
347 // NEON stores with post-increment base updates:
358
359 // Load/Store of dual registers
363 };
364
365 } // end namespace ARMISD
366
367 namespace ARM {
368 /// Possible values of current rounding mode, which is specified in bits
369 /// 23:22 of FPSCR.
370 enum Rounding {
371 RN = 0, // Round to Nearest
372 RP = 1, // Round towards Plus infinity
373 RM = 2, // Round towards Minus infinity
374 RZ = 3, // Round towards Zero
375 rmMask = 3 // Bit mask selecting rounding mode
376 };
377
378 // Bit position of rounding mode bits in FPSCR.
379 const unsigned RoundingBitsPos = 22;
380
381 // Bits of floating-point status. These are NZCV flags, QC bit and cumulative
382 // FP exception bits.
383 const unsigned FPStatusBits = 0xf800009f;
384
385 // Some bits in the FPSCR are not yet defined. They must be preserved when
386 // modifying the contents.
387 const unsigned FPReservedBits = 0x00006060;
388 } // namespace ARM
389
390 /// Define some predicates that are used for node matching.
391 namespace ARM {
392
393 bool isBitFieldInvertedMask(unsigned v);
394
395 } // end namespace ARM
396
397 //===--------------------------------------------------------------------===//
398 // ARMTargetLowering - ARM Implementation of the TargetLowering interface
399
401 // Copying needed for an outgoing byval argument.
402 enum ByValCopyKind {
403 // Argument is already in the correct location, no copy needed.
404 NoCopy,
405 // Argument value is currently in the local stack frame, needs copying to
406 // outgoing arguemnt area.
407 CopyOnce,
408 // Argument value is currently in the outgoing argument area, but not at
409 // the correct offset, so needs copying via a temporary in local stack
410 // space.
411 CopyViaTemp,
412 };
413
414 public:
415 explicit ARMTargetLowering(const TargetMachine &TM,
416 const ARMSubtarget &STI);
417
418 const ARMBaseTargetMachine &getTM() const;
419
420 unsigned getJumpTableEncoding() const override;
421 bool useSoftFloat() const override;
422
423 SDValue LowerOperation(SDValue Op, SelectionDAG &DAG) const override;
424
425 /// ReplaceNodeResults - Replace the results of node with an illegal result
426 /// type with new values built out of custom code.
428 SelectionDAG &DAG) const override;
429
430 const char *getTargetNodeName(unsigned Opcode) const override;
431
432 bool isSelectSupported(SelectSupportKind Kind) const override {
433 // ARM does not support scalar condition selects on vectors.
434 return (Kind != ScalarCondVectorVal);
435 }
436
437 bool isReadOnly(const GlobalValue *GV) const;
438
439 /// getSetCCResultType - Return the value type to use for ISD::SETCC.
441 EVT VT) const override;
442
445 MachineBasicBlock *MBB) const override;
446
448 SDNode *Node) const override;
449
453 SDValue PerformIntrinsicCombine(SDNode *N, DAGCombinerInfo &DCI) const;
454 SDValue PerformMVEExtCombine(SDNode *N, DAGCombinerInfo &DCI) const;
455 SDValue PerformMVETruncCombine(SDNode *N, DAGCombinerInfo &DCI) const;
456 SDValue PerformDAGCombine(SDNode *N, DAGCombinerInfo &DCI) const override;
457
459 const APInt &OriginalDemandedBits,
460 const APInt &OriginalDemandedElts,
461 KnownBits &Known,
462 TargetLoweringOpt &TLO,
463 unsigned Depth) const override;
464
465 bool isDesirableToTransformToIntegerOp(unsigned Opc, EVT VT) const override;
466
467 /// allowsMisalignedMemoryAccesses - Returns true if the target allows
468 /// unaligned memory accesses of the specified type. Returns whether it
469 /// is "fast" by reference in the second argument.
470 bool allowsMisalignedMemoryAccesses(EVT VT, unsigned AddrSpace,
471 Align Alignment,
473 unsigned *Fast) const override;
474
475 EVT getOptimalMemOpType(LLVMContext &Context, const MemOp &Op,
476 const AttributeList &FuncAttributes) const override;
477
478 bool isTruncateFree(Type *SrcTy, Type *DstTy) const override;
479 bool isTruncateFree(EVT SrcVT, EVT DstVT) const override;
480 bool isZExtFree(SDValue Val, EVT VT2) const override;
481 Type* shouldConvertSplatType(ShuffleVectorInst* SVI) const override;
482
483 bool isFNegFree(EVT VT) const override;
484
485 bool isVectorLoadExtDesirable(SDValue ExtVal) const override;
486
487 bool allowTruncateForTailCall(Type *Ty1, Type *Ty2) const override;
488
489
490 /// isLegalAddressingMode - Return true if the addressing mode represented
491 /// by AM is legal for this target, for a load/store of the specified type.
492 bool isLegalAddressingMode(const DataLayout &DL, const AddrMode &AM,
493 Type *Ty, unsigned AS,
494 Instruction *I = nullptr) const override;
495
496 bool isLegalT2ScaledAddressingMode(const AddrMode &AM, EVT VT) const;
497
498 /// Returns true if the addressing mode representing by AM is legal
499 /// for the Thumb1 target, for a load/store of the specified type.
500 bool isLegalT1ScaledAddressingMode(const AddrMode &AM, EVT VT) const;
501
502 /// isLegalICmpImmediate - Return true if the specified immediate is legal
503 /// icmp immediate, that is the target has icmp instructions which can
504 /// compare a register against the immediate without having to materialize
505 /// the immediate into a register.
506 bool isLegalICmpImmediate(int64_t Imm) const override;
507
508 /// isLegalAddImmediate - Return true if the specified immediate is legal
509 /// add immediate, that is the target has add instructions which can
510 /// add a register and the immediate without having to materialize
511 /// the immediate into a register.
512 bool isLegalAddImmediate(int64_t Imm) const override;
513
514 /// getPreIndexedAddressParts - returns true by value, base pointer and
515 /// offset pointer and addressing mode by reference if the node's address
516 /// can be legally represented as pre-indexed load / store address.
519 SelectionDAG &DAG) const override;
520
521 /// getPostIndexedAddressParts - returns true by value, base pointer and
522 /// offset pointer and addressing mode by reference if this node can be
523 /// combined with a load / store to form a post-indexed load / store.
526 SelectionDAG &DAG) const override;
527
529 const APInt &DemandedElts,
530 const SelectionDAG &DAG,
531 unsigned Depth) const override;
532
534 const APInt &DemandedElts,
535 TargetLoweringOpt &TLO) const override;
536
537 bool ExpandInlineAsm(CallInst *CI) const override;
538
539 ConstraintType getConstraintType(StringRef Constraint) const override;
540
541 /// Examine constraint string and operand type and determine a weight value.
542 /// The operand object must already have been set up with the operand type.
544 AsmOperandInfo &info, const char *constraint) const override;
545
546 std::pair<unsigned, const TargetRegisterClass *>
548 StringRef Constraint, MVT VT) const override;
549
550 const char *LowerXConstraint(EVT ConstraintVT) const override;
551
552 /// LowerAsmOperandForConstraint - Lower the specified operand into the Ops
553 /// vector. If it is invalid, don't add anything to Ops. If hasMemory is
554 /// true it means one of the asm constraint of the inline asm instruction
555 /// being processed is 'm'.
557 std::vector<SDValue> &Ops,
558 SelectionDAG &DAG) const override;
559
561 getInlineAsmMemConstraint(StringRef ConstraintCode) const override {
562 if (ConstraintCode == "Q")
564 if (ConstraintCode.size() == 2) {
565 if (ConstraintCode[0] == 'U') {
566 switch(ConstraintCode[1]) {
567 default:
568 break;
569 case 'm':
571 case 'n':
573 case 'q':
575 case 's':
577 case 't':
579 case 'v':
581 case 'y':
583 }
584 }
585 }
586 return TargetLowering::getInlineAsmMemConstraint(ConstraintCode);
587 }
588
589 const ARMSubtarget* getSubtarget() const {
590 return Subtarget;
591 }
592
593 /// getRegClassFor - Return the register class that should be used for the
594 /// specified value type.
595 const TargetRegisterClass *
596 getRegClassFor(MVT VT, bool isDivergent = false) const override;
597
598 bool shouldAlignPointerArgs(CallInst *CI, unsigned &MinSize,
599 Align &PrefAlign) const override;
600
601 /// createFastISel - This method returns a target specific FastISel object,
602 /// or null if the target does not support "fast" ISel.
604 const TargetLibraryInfo *libInfo) const override;
605
607
608 bool preferZeroCompareBranch() const override { return true; }
609
610 bool shouldExpandCmpUsingSelects(EVT VT) const override;
611
612 bool isMaskAndCmp0FoldingBeneficial(const Instruction &AndI) const override;
613
614 bool hasAndNotCompare(SDValue V) const override {
615 // We can use bics for any scalar.
616 return V.getValueType().isScalarInteger();
617 }
618
619 bool
620 isShuffleMaskLegal(ArrayRef<int> M, EVT VT) const override;
621 bool isOffsetFoldingLegal(const GlobalAddressSDNode *GA) const override;
622
623 /// isFPImmLegal - Returns true if the target can instruction select the
624 /// specified FP immediate natively. If false, the legalizer will
625 /// materialize the FP immediate as a load from a constant pool.
626 bool isFPImmLegal(const APFloat &Imm, EVT VT,
627 bool ForCodeSize = false) const override;
628
629 bool getTgtMemIntrinsic(IntrinsicInfo &Info,
630 const CallInst &I,
631 MachineFunction &MF,
632 unsigned Intrinsic) const override;
633
634 /// Returns true if it is beneficial to convert a load of a constant
635 /// to just the constant itself.
637 Type *Ty) const override;
638
639 /// Return true if EXTRACT_SUBVECTOR is cheap for this result type
640 /// with this index.
641 bool isExtractSubvectorCheap(EVT ResVT, EVT SrcVT,
642 unsigned Index) const override;
643
644 bool shouldFormOverflowOp(unsigned Opcode, EVT VT,
645 bool MathUsed) const override {
646 // Using overflow ops for overflow checks only should beneficial on ARM.
647 return TargetLowering::shouldFormOverflowOp(Opcode, VT, true);
648 }
649
650 bool shouldReassociateReduction(unsigned Opc, EVT VT) const override {
651 return Opc != ISD::VECREDUCE_ADD;
652 }
653
654 /// Returns true if an argument of type Ty needs to be passed in a
655 /// contiguous block of registers in calling convention CallConv.
657 Type *Ty, CallingConv::ID CallConv, bool isVarArg,
658 const DataLayout &DL) const override;
659
660 /// If a physical register, this returns the register that receives the
661 /// exception address on entry to an EH pad.
663 getExceptionPointerRegister(const Constant *PersonalityFn) const override;
664
665 /// If a physical register, this returns the register that receives the
666 /// exception typeid on entry to a landing pad.
668 getExceptionSelectorRegister(const Constant *PersonalityFn) const override;
669
671 Value *emitLoadLinked(IRBuilderBase &Builder, Type *ValueTy, Value *Addr,
672 AtomicOrdering Ord) const override;
674 AtomicOrdering Ord) const override;
675
676 void
677 emitAtomicCmpXchgNoStoreLLBalance(IRBuilderBase &Builder) const override;
678
680 AtomicOrdering Ord) const override;
682 AtomicOrdering Ord) const override;
683
684 unsigned getMaxSupportedInterleaveFactor() const override;
685
686 bool lowerInterleavedLoad(Instruction *Load, Value *Mask,
688 ArrayRef<unsigned> Indices, unsigned Factor,
689 const APInt &GapMask) const override;
690 bool lowerInterleavedStore(Instruction *Store, Value *Mask,
691 ShuffleVectorInst *SVI, unsigned Factor,
692 const APInt &GapMask) const override;
693
694 bool shouldInsertFencesForAtomic(const Instruction *I) const override;
696 shouldExpandAtomicLoadInIR(LoadInst *LI) const override;
698 shouldExpandAtomicStoreInIR(StoreInst *SI) const override;
700 shouldExpandAtomicRMWInIR(AtomicRMWInst *AI) const override;
703
704 bool useLoadStackGuardNode(const Module &M) const override;
705
706 void insertSSPDeclarations(Module &M) const override;
707 Function *getSSPStackGuardCheck(const Module &M) const override;
708
709 bool canCombineStoreAndExtract(Type *VectorTy, Value *Idx,
710 unsigned &Cost) const override;
711
712 bool canMergeStoresTo(unsigned AddressSpace, EVT MemVT,
713 const MachineFunction &MF) const override {
714 // Do not merge to larger than i32.
715 return (MemVT.getSizeInBits() <= 32);
716 }
717
718 bool isCheapToSpeculateCttz(Type *Ty) const override;
719 bool isCheapToSpeculateCtlz(Type *Ty) const override;
720
721 bool convertSetCCLogicToBitwiseLogic(EVT VT) const override {
722 return VT.isScalarInteger();
723 }
724
725 bool supportSwiftError() const override {
726 return true;
727 }
728
729 bool supportSplitCSR(MachineFunction *MF) const override {
731 MF->getFunction().hasFnAttribute(Attribute::NoUnwind);
732 }
733
734 bool hasStandaloneRem(EVT VT) const override {
735 return HasStandaloneRem;
736 }
737
740 unsigned ExpansionFactor) const override;
741
742 CCAssignFn *CCAssignFnForCall(CallingConv::ID CC, bool isVarArg) const;
743 CCAssignFn *CCAssignFnForReturn(CallingConv::ID CC, bool isVarArg) const;
744
745 /// Returns true if \p VecTy is a legal interleaved access type. This
746 /// function checks the vector element type and the overall width of the
747 /// vector.
748 bool isLegalInterleavedAccessType(unsigned Factor, FixedVectorType *VecTy,
749 Align Alignment,
750 const DataLayout &DL) const;
751
753 SDValue ConstNode) const override;
754
755 bool alignLoopsWithOptSize() const override;
756
757 /// Returns the number of interleaved accesses that will be generated when
758 /// lowering accesses of the given type.
760 const DataLayout &DL) const;
761
762 void finalizeLowering(MachineFunction &MF) const override;
763
764 /// Return the correct alignment for the current calling convention.
766 const DataLayout &DL) const override;
767
769 CombineLevel Level) const override;
770
771 bool isDesirableToCommuteXorWithShift(const SDNode *N) const override;
772
774 CombineLevel Level) const override;
775
776 bool shouldFoldSelectWithIdentityConstant(unsigned BinOpcode, EVT VT,
777 unsigned SelectOpcode, SDValue X,
778 SDValue Y) const override;
779
780 bool preferIncOfAddToSubOfNot(EVT VT) const override;
781
782 bool shouldConvertFpToSat(unsigned Op, EVT FPVT, EVT VT) const override;
783
784 bool isComplexDeinterleavingSupported() const override;
786 ComplexDeinterleavingOperation Operation, Type *Ty) const override;
787
790 ComplexDeinterleavingRotation Rotation, Value *InputA, Value *InputB,
791 Value *Accumulator = nullptr) const override;
792
793 bool softPromoteHalfType() const override { return true; }
794
795 bool useFPRegsForHalfType() const override { return true; }
796
797 protected:
798 std::pair<const TargetRegisterClass *, uint8_t>
800 MVT VT) const override;
801
802 private:
803 /// Subtarget - Keep a pointer to the ARMSubtarget around so that we can
804 /// make the right decision when generating code for different targets.
805 const ARMSubtarget *Subtarget;
806
808
809 const InstrItineraryData *Itins;
810
811 // TODO: remove this, and have shouldInsertFencesForAtomic do the proper
812 // check.
813 bool InsertFencesForAtomic;
814
815 bool HasStandaloneRem = true;
816
817 void addTypeForNEON(MVT VT, MVT PromotedLdStVT);
818 void addDRTypeForNEON(MVT VT);
819 void addQRTypeForNEON(MVT VT);
820 std::pair<SDValue, SDValue> getARMXALUOOp(SDValue Op, SelectionDAG &DAG, SDValue &ARMcc) const;
821
822 using RegsToPassVector = SmallVector<std::pair<unsigned, SDValue>, 8>;
823
824 void PassF64ArgInRegs(const SDLoc &dl, SelectionDAG &DAG, SDValue Chain,
825 SDValue &Arg, RegsToPassVector &RegsToPass,
826 CCValAssign &VA, CCValAssign &NextVA,
827 SDValue &StackPtr,
828 SmallVectorImpl<SDValue> &MemOpChains,
829 bool IsTailCall,
830 int SPDiff) const;
831 SDValue GetF64FormalArgument(CCValAssign &VA, CCValAssign &NextVA,
832 SDValue &Root, SelectionDAG &DAG,
833 const SDLoc &dl) const;
834
835 CallingConv::ID getEffectiveCallingConv(CallingConv::ID CC,
836 bool isVarArg) const;
837 CCAssignFn *CCAssignFnForNode(CallingConv::ID CC, bool Return,
838 bool isVarArg) const;
839 std::pair<SDValue, MachinePointerInfo>
840 computeAddrForCallArg(const SDLoc &dl, SelectionDAG &DAG,
841 const CCValAssign &VA, SDValue StackPtr,
842 bool IsTailCall, int SPDiff) const;
843 ByValCopyKind ByValNeedsCopyForTailCall(SelectionDAG &DAG, SDValue Src,
844 SDValue Dst,
845 ISD::ArgFlagsTy Flags) const;
846 SDValue LowerEH_SJLJ_SETJMP(SDValue Op, SelectionDAG &DAG) const;
847 SDValue LowerEH_SJLJ_LONGJMP(SDValue Op, SelectionDAG &DAG) const;
848 SDValue LowerEH_SJLJ_SETUP_DISPATCH(SDValue Op, SelectionDAG &DAG) const;
849 SDValue LowerINTRINSIC_VOID(SDValue Op, SelectionDAG &DAG,
850 const ARMSubtarget *Subtarget) const;
851 SDValue LowerINTRINSIC_WO_CHAIN(SDValue Op, SelectionDAG &DAG,
852 const ARMSubtarget *Subtarget) const;
853 SDValue LowerBlockAddress(SDValue Op, SelectionDAG &DAG) const;
854 SDValue LowerConstantPool(SDValue Op, SelectionDAG &DAG) const;
855 SDValue LowerGlobalAddress(SDValue Op, SelectionDAG &DAG) const;
856 SDValue LowerGlobalAddressDarwin(SDValue Op, SelectionDAG &DAG) const;
857 SDValue LowerGlobalAddressELF(SDValue Op, SelectionDAG &DAG) const;
858 SDValue LowerGlobalAddressWindows(SDValue Op, SelectionDAG &DAG) const;
859 SDValue LowerGlobalTLSAddress(SDValue Op, SelectionDAG &DAG) const;
860 SDValue LowerToTLSGeneralDynamicModel(GlobalAddressSDNode *GA,
861 SelectionDAG &DAG) const;
862 SDValue LowerToTLSExecModels(GlobalAddressSDNode *GA,
863 SelectionDAG &DAG,
864 TLSModel::Model model) const;
865 SDValue LowerGlobalTLSAddressDarwin(SDValue Op, SelectionDAG &DAG) const;
866 SDValue LowerGlobalTLSAddressWindows(SDValue Op, SelectionDAG &DAG) const;
867 SDValue LowerBR_JT(SDValue Op, SelectionDAG &DAG) const;
868 SDValue LowerSignedALUO(SDValue Op, SelectionDAG &DAG) const;
869 SDValue LowerUnsignedALUO(SDValue Op, SelectionDAG &DAG) const;
870 SDValue LowerSELECT(SDValue Op, SelectionDAG &DAG) const;
871 SDValue LowerSELECT_CC(SDValue Op, SelectionDAG &DAG) const;
872 SDValue LowerBRCOND(SDValue Op, SelectionDAG &DAG) const;
873 SDValue LowerBR_CC(SDValue Op, SelectionDAG &DAG) const;
874 SDValue LowerFCOPYSIGN(SDValue Op, SelectionDAG &DAG) const;
875 SDValue LowerRETURNADDR(SDValue Op, SelectionDAG &DAG) const;
876 SDValue LowerFRAMEADDR(SDValue Op, SelectionDAG &DAG) const;
877 SDValue LowerShiftRightParts(SDValue Op, SelectionDAG &DAG) const;
878 SDValue LowerShiftLeftParts(SDValue Op, SelectionDAG &DAG) const;
879 SDValue LowerGET_ROUNDING(SDValue Op, SelectionDAG &DAG) const;
880 SDValue LowerSET_ROUNDING(SDValue Op, SelectionDAG &DAG) const;
881 SDValue LowerSET_FPMODE(SDValue Op, SelectionDAG &DAG) const;
882 SDValue LowerRESET_FPMODE(SDValue Op, SelectionDAG &DAG) const;
883 SDValue LowerConstantFP(SDValue Op, SelectionDAG &DAG,
884 const ARMSubtarget *ST) const;
885 SDValue LowerBUILD_VECTOR(SDValue Op, SelectionDAG &DAG,
886 const ARMSubtarget *ST) const;
887 SDValue LowerINSERT_VECTOR_ELT(SDValue Op, SelectionDAG &DAG) const;
888 SDValue LowerFSINCOS(SDValue Op, SelectionDAG &DAG) const;
889 SDValue LowerDivRem(SDValue Op, SelectionDAG &DAG) const;
890 SDValue LowerDIV_Windows(SDValue Op, SelectionDAG &DAG, bool Signed) const;
891 void ExpandDIV_Windows(SDValue Op, SelectionDAG &DAG, bool Signed,
893 SDValue ExpandBITCAST(SDNode *N, SelectionDAG &DAG,
894 const ARMSubtarget *Subtarget) const;
895 SDValue LowerWindowsDIVLibCall(SDValue Op, SelectionDAG &DAG, bool Signed,
896 SDValue &Chain) const;
897 SDValue LowerREM(SDNode *N, SelectionDAG &DAG) const;
898 SDValue LowerDYNAMIC_STACKALLOC(SDValue Op, SelectionDAG &DAG) const;
899 SDValue LowerFP_ROUND(SDValue Op, SelectionDAG &DAG) const;
900 SDValue LowerFP_EXTEND(SDValue Op, SelectionDAG &DAG) const;
901 SDValue LowerFP_TO_INT(SDValue Op, SelectionDAG &DAG) const;
902 SDValue LowerINT_TO_FP(SDValue Op, SelectionDAG &DAG) const;
903 SDValue LowerFSETCC(SDValue Op, SelectionDAG &DAG) const;
904 SDValue LowerSPONENTRY(SDValue Op, SelectionDAG &DAG) const;
905 void LowerLOAD(SDNode *N, SmallVectorImpl<SDValue> &Results,
906 SelectionDAG &DAG) const;
907 SDValue LowerFP_TO_BF16(SDValue Op, SelectionDAG &DAG) const;
908 SDValue LowerCMP(SDValue Op, SelectionDAG &DAG) const;
909
910 Register getRegisterByName(const char* RegName, LLT VT,
911 const MachineFunction &MF) const override;
912
913 SDValue BuildSDIVPow2(SDNode *N, const APInt &Divisor, SelectionDAG &DAG,
914 SmallVectorImpl<SDNode *> &Created) const override;
915
916 bool isFMAFasterThanFMulAndFAdd(const MachineFunction &MF,
917 EVT VT) const override;
918
919 SDValue MoveToHPR(const SDLoc &dl, SelectionDAG &DAG, MVT LocVT, MVT ValVT,
920 SDValue Val) const;
921 SDValue MoveFromHPR(const SDLoc &dl, SelectionDAG &DAG, MVT LocVT,
922 MVT ValVT, SDValue Val) const;
923
924 SDValue ReconstructShuffle(SDValue Op, SelectionDAG &DAG) const;
925
926 SDValue LowerCallResult(SDValue Chain, SDValue InGlue,
927 CallingConv::ID CallConv, bool isVarArg,
929 const SDLoc &dl, SelectionDAG &DAG,
930 SmallVectorImpl<SDValue> &InVals, bool isThisReturn,
931 SDValue ThisVal, bool isCmseNSCall) const;
932
933 void initializeSplitCSR(MachineBasicBlock *Entry) const override;
934 void insertCopiesSplitCSR(
935 MachineBasicBlock *Entry,
936 const SmallVectorImpl<MachineBasicBlock *> &Exits) const override;
937
938 bool splitValueIntoRegisterParts(
939 SelectionDAG & DAG, const SDLoc &DL, SDValue Val, SDValue *Parts,
940 unsigned NumParts, MVT PartVT, std::optional<CallingConv::ID> CC)
941 const override;
942
943 SDValue joinRegisterPartsIntoValue(
944 SelectionDAG & DAG, const SDLoc &DL, const SDValue *Parts,
945 unsigned NumParts, MVT PartVT, EVT ValueVT,
946 std::optional<CallingConv::ID> CC) const override;
947
948 SDValue
949 LowerFormalArguments(SDValue Chain, CallingConv::ID CallConv, bool isVarArg,
951 const SDLoc &dl, SelectionDAG &DAG,
952 SmallVectorImpl<SDValue> &InVals) const override;
953
954 int StoreByValRegs(CCState &CCInfo, SelectionDAG &DAG, const SDLoc &dl,
955 SDValue &Chain, const Value *OrigArg,
956 unsigned InRegsParamRecordIdx, int ArgOffset,
957 unsigned ArgSize) const;
958
959 void VarArgStyleRegisters(CCState &CCInfo, SelectionDAG &DAG,
960 const SDLoc &dl, SDValue &Chain,
961 unsigned ArgOffset, unsigned TotalArgRegsSaveSize,
962 bool ForceMutable = false) const;
963
965 SmallVectorImpl<SDValue> &InVals) const override;
966
967 /// HandleByVal - Target-specific cleanup for ByVal support.
968 void HandleByVal(CCState *, unsigned &, Align) const override;
969
970 /// IsEligibleForTailCallOptimization - Check whether the call is eligible
971 /// for tail call optimization. Targets which want to do tail call
972 /// optimization should implement this function.
973 bool IsEligibleForTailCallOptimization(
975 SmallVectorImpl<CCValAssign> &ArgLocs, const bool isIndirect) const;
976
977 bool CanLowerReturn(CallingConv::ID CallConv,
978 MachineFunction &MF, bool isVarArg,
980 LLVMContext &Context, const Type *RetTy) const override;
981
982 SDValue LowerReturn(SDValue Chain, CallingConv::ID CallConv, bool isVarArg,
984 const SmallVectorImpl<SDValue> &OutVals,
985 const SDLoc &dl, SelectionDAG &DAG) const override;
986
987 bool isUsedByReturnOnly(SDNode *N, SDValue &Chain) const override;
988
989 bool mayBeEmittedAsTailCall(const CallInst *CI) const override;
990
991 bool shouldConsiderGEPOffsetSplit() const override { return true; }
992
993 bool isUnsupportedFloatingType(EVT VT) const;
994
995 SDValue getCMOV(const SDLoc &dl, EVT VT, SDValue FalseVal, SDValue TrueVal,
996 SDValue ARMcc, SDValue Flags, SelectionDAG &DAG) const;
997 SDValue getARMCmp(SDValue LHS, SDValue RHS, ISD::CondCode CC,
998 SDValue &ARMcc, SelectionDAG &DAG, const SDLoc &dl) const;
999 SDValue getVFPCmp(SDValue LHS, SDValue RHS, SelectionDAG &DAG,
1000 const SDLoc &dl, bool Signaling = false) const;
1001
1002 SDValue OptimizeVFPBrcond(SDValue Op, SelectionDAG &DAG) const;
1003
1004 void SetupEntryBlockForSjLj(MachineInstr &MI, MachineBasicBlock *MBB,
1005 MachineBasicBlock *DispatchBB, int FI) const;
1006
1007 void EmitSjLjDispatchBlock(MachineInstr &MI, MachineBasicBlock *MBB) const;
1008
1009 MachineBasicBlock *EmitStructByval(MachineInstr &MI,
1010 MachineBasicBlock *MBB) const;
1011
1012 MachineBasicBlock *EmitLowered__chkstk(MachineInstr &MI,
1013 MachineBasicBlock *MBB) const;
1014 MachineBasicBlock *EmitLowered__dbzchk(MachineInstr &MI,
1015 MachineBasicBlock *MBB) const;
1016 void addMVEVectorTypes(bool HasMVEFP);
1017 void addAllExtLoads(const MVT From, const MVT To, LegalizeAction Action);
1018 void setAllExpand(MVT VT);
1019 };
1020
1027
1028 namespace ARM {
1029
1030 FastISel *createFastISel(FunctionLoweringInfo &funcInfo,
1031 const TargetLibraryInfo *libInfo);
1032
1033 } // end namespace ARM
1034
1035} // end namespace llvm
1036
1037#endif // LLVM_LIB_TARGET_ARM_ARMISELLOWERING_H
MachineBasicBlock & MBB
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
Function Alias Analysis Results
This file contains the simple types necessary to represent the attributes associated with functions a...
BlockVerifier::State From
static GCRegistry::Add< OcamlGC > B("ocaml", "ocaml 3.10-compatible GC")
Analysis containing CSE Info
Definition: CSEInfo.cpp:27
return RetTy
Returns the sub type a function will return at a given Idx Should correspond to the result type of an ExtractValue instruction executed with just that one unsigned Idx
uint64_t Addr
uint32_t Index
static GCMetadataPrinterRegistry::Add< ErlangGCPrinter > X("erlang", "erlang-compatible garbage collector")
IRTranslator LLVM IR MI
#define RegName(no)
lazy value info
#define I(x, y, z)
Definition: MD5.cpp:58
Register const TargetRegisterInfo * TRI
static GCMetadataPrinterRegistry::Add< OcamlGCMetadataPrinter > Y("ocaml", "ocaml 3.10-compatible collector")
PowerPC Reduce CR logical Operation
This file defines the SmallVector class.
This file describes how to lower LLVM code to machine code.
Value * RHS
Value * LHS
Class for arbitrary precision integers.
Definition: APInt.h:78
bool shouldFoldSelectWithIdentityConstant(unsigned BinOpcode, EVT VT, unsigned SelectOpcode, SDValue X, SDValue Y) const override
Return true if pulling a binary operation into a select with an identity constant is profitable.
bool isReadOnly(const GlobalValue *GV) const
unsigned getMaxSupportedInterleaveFactor() const override
Get the maximum supported factor for interleaved memory accesses.
TargetLoweringBase::AtomicExpansionKind shouldExpandAtomicLoadInIR(LoadInst *LI) const override
Returns how the given (atomic) load should be expanded by the IR-level AtomicExpand pass.
unsigned getNumInterleavedAccesses(VectorType *VecTy, const DataLayout &DL) const
Returns the number of interleaved accesses that will be generated when lowering accesses of the given...
bool shouldInsertFencesForAtomic(const Instruction *I) const override
Whether AtomicExpandPass should automatically insert fences and reduce ordering for this atomic.
Align getABIAlignmentForCallingConv(Type *ArgTy, const DataLayout &DL) const override
Return the correct alignment for the current calling convention.
bool isDesirableToCommuteWithShift(const SDNode *N, CombineLevel Level) const override
Return true if it is profitable to move this shift by a constant amount through its operand,...
Register getExceptionPointerRegister(const Constant *PersonalityFn) const override
If a physical register, this returns the register that receives the exception address on entry to an ...
ConstraintWeight getSingleConstraintMatchWeight(AsmOperandInfo &info, const char *constraint) const override
Examine constraint string and operand type and determine a weight value.
bool shouldExpandCmpUsingSelects(EVT VT) const override
Should we expand [US]CMP nodes using two selects and two compares, or by doing arithmetic on boolean ...
bool isLegalAddressingMode(const DataLayout &DL, const AddrMode &AM, Type *Ty, unsigned AS, Instruction *I=nullptr) const override
isLegalAddressingMode - Return true if the addressing mode represented by AM is legal for this target...
const ARMSubtarget * getSubtarget() const
bool isLegalT2ScaledAddressingMode(const AddrMode &AM, EVT VT) const
bool isLegalT1ScaledAddressingMode(const AddrMode &AM, EVT VT) const
Returns true if the addressing mode representing by AM is legal for the Thumb1 target,...
bool getPreIndexedAddressParts(SDNode *N, SDValue &Base, SDValue &Offset, ISD::MemIndexedMode &AM, SelectionDAG &DAG) const override
getPreIndexedAddressParts - returns true by value, base pointer and offset pointer and addressing mod...
InlineAsm::ConstraintCode getInlineAsmMemConstraint(StringRef ConstraintCode) const override
bool shouldAlignPointerArgs(CallInst *CI, unsigned &MinSize, Align &PrefAlign) const override
Return true if the pointer arguments to CI should be aligned by aligning the object whose address is ...
void ReplaceNodeResults(SDNode *N, SmallVectorImpl< SDValue > &Results, SelectionDAG &DAG) const override
ReplaceNodeResults - Replace the results of node with an illegal result type with new values built ou...
void emitAtomicCmpXchgNoStoreLLBalance(IRBuilderBase &Builder) const override
bool isMulAddWithConstProfitable(SDValue AddNode, SDValue ConstNode) const override
Return true if it may be profitable to transform (mul (add x, c1), c2) -> (add (mul x,...
bool isLegalAddImmediate(int64_t Imm) const override
isLegalAddImmediate - Return true if the specified immediate is legal add immediate,...
EVT getOptimalMemOpType(LLVMContext &Context, const MemOp &Op, const AttributeList &FuncAttributes) const override
Returns the target specific optimal type for load and store operations as a result of memset,...
Instruction * emitTrailingFence(IRBuilderBase &Builder, Instruction *Inst, AtomicOrdering Ord) const override
bool supportSwiftError() const override
Return true if the target supports swifterror attribute.
bool isFNegFree(EVT VT) const override
Return true if an fneg operation is free to the point where it is never worthwhile to replace it with...
void finalizeLowering(MachineFunction &MF) const override
Execute target specific actions to finalize target lowering.
SDValue PerformMVETruncCombine(SDNode *N, DAGCombinerInfo &DCI) const
bool isFPImmLegal(const APFloat &Imm, EVT VT, bool ForCodeSize=false) const override
isFPImmLegal - Returns true if the target can instruction select the specified FP immediate natively.
ConstraintType getConstraintType(StringRef Constraint) const override
getConstraintType - Given a constraint letter, return the type of constraint it is for this target.
bool preferIncOfAddToSubOfNot(EVT VT) const override
These two forms are equivalent: sub y, (xor x, -1) add (add x, 1), y The variant with two add's is IR...
Function * getSSPStackGuardCheck(const Module &M) const override
If the target has a standard stack protection check function that performs validation and error handl...
bool useFPRegsForHalfType() const override
void computeKnownBitsForTargetNode(const SDValue Op, KnownBits &Known, const APInt &DemandedElts, const SelectionDAG &DAG, unsigned Depth) const override
Determine which of the bits specified in Mask are known to be either zero or one and return them in t...
TargetLoweringBase::AtomicExpansionKind shouldExpandAtomicStoreInIR(StoreInst *SI) const override
Returns how the given (atomic) store should be expanded by the IR-level AtomicExpand pass into.
void insertSSPDeclarations(Module &M) const override
Inserts necessary declarations for SSP (stack protection) purpose.
SDValue PerformIntrinsicCombine(SDNode *N, DAGCombinerInfo &DCI) const
PerformIntrinsicCombine - ARM-specific DAG combining for intrinsics.
bool isDesirableToCommuteXorWithShift(const SDNode *N) const override
Return true if it is profitable to combine an XOR of a logical shift to create a logical shift of NOT...
bool ExpandInlineAsm(CallInst *CI) const override
This hook allows the target to expand an inline asm call to be explicit llvm code if it wants to.
SDValue PerformCMOVCombine(SDNode *N, SelectionDAG &DAG) const
PerformCMOVCombine - Target-specific DAG combining for ARMISD::CMOV.
Value * createComplexDeinterleavingIR(IRBuilderBase &B, ComplexDeinterleavingOperation OperationType, ComplexDeinterleavingRotation Rotation, Value *InputA, Value *InputB, Value *Accumulator=nullptr) const override
Create the IR node for the given complex deinterleaving operation.
bool isComplexDeinterleavingSupported() const override
Does this target support complex deinterleaving.
bool supportSplitCSR(MachineFunction *MF) const override
Return true if the target supports that a subset of CSRs for the given machine function is handled ex...
SDValue PerformMVEExtCombine(SDNode *N, DAGCombinerInfo &DCI) const
bool shouldFoldConstantShiftPairToMask(const SDNode *N, CombineLevel Level) const override
Return true if it is profitable to fold a pair of shifts into a mask.
bool SimplifyDemandedBitsForTargetNode(SDValue Op, const APInt &OriginalDemandedBits, const APInt &OriginalDemandedElts, KnownBits &Known, TargetLoweringOpt &TLO, unsigned Depth) const override
Attempt to simplify any target nodes based on the demanded bits/elts, returning true on success.
EVT getSetCCResultType(const DataLayout &DL, LLVMContext &Context, EVT VT) const override
getSetCCResultType - Return the value type to use for ISD::SETCC.
MachineBasicBlock * EmitInstrWithCustomInserter(MachineInstr &MI, MachineBasicBlock *MBB) const override
This method should be implemented by targets that mark instructions with the 'usesCustomInserter' fla...
Value * emitStoreConditional(IRBuilderBase &Builder, Value *Val, Value *Addr, AtomicOrdering Ord) const override
Perform a store-conditional operation to Addr.
SDValue LowerOperation(SDValue Op, SelectionDAG &DAG) const override
This callback is invoked for operations that are unsupported by the target, which are registered to u...
CCAssignFn * CCAssignFnForReturn(CallingConv::ID CC, bool isVarArg) const
FastISel * createFastISel(FunctionLoweringInfo &funcInfo, const TargetLibraryInfo *libInfo) const override
createFastISel - This method returns a target specific FastISel object, or null if the target does no...
void AdjustInstrPostInstrSelection(MachineInstr &MI, SDNode *Node) const override
This method should be implemented by targets that mark instructions with the 'hasPostISelHook' flag.
TargetLoweringBase::AtomicExpansionKind shouldExpandAtomicRMWInIR(AtomicRMWInst *AI) const override
Returns how the IR-level AtomicExpand pass should expand the given AtomicRMW, if at all.
bool isExtractSubvectorCheap(EVT ResVT, EVT SrcVT, unsigned Index) const override
Return true if EXTRACT_SUBVECTOR is cheap for this result type with this index.
bool getTgtMemIntrinsic(IntrinsicInfo &Info, const CallInst &I, MachineFunction &MF, unsigned Intrinsic) const override
getTgtMemIntrinsic - Represent NEON load and store intrinsics as MemIntrinsicNodes.
bool isTruncateFree(Type *SrcTy, Type *DstTy) const override
Return true if it's free to truncate a value of type FromTy to type ToTy.
bool isShuffleMaskLegal(ArrayRef< int > M, EVT VT) const override
isShuffleMaskLegal - Targets can use this to indicate that they only support some VECTOR_SHUFFLE oper...
bool shouldConvertConstantLoadToIntImm(const APInt &Imm, Type *Ty) const override
Returns true if it is beneficial to convert a load of a constant to just the constant itself.
bool shouldFormOverflowOp(unsigned Opcode, EVT VT, bool MathUsed) const override
Try to convert math with an overflow comparison into the corresponding DAG node operation.
bool lowerInterleavedStore(Instruction *Store, Value *Mask, ShuffleVectorInst *SVI, unsigned Factor, const APInt &GapMask) const override
Lower an interleaved store into a vstN intrinsic.
bool isSelectSupported(SelectSupportKind Kind) const override
const TargetRegisterClass * getRegClassFor(MVT VT, bool isDivergent=false) const override
getRegClassFor - Return the register class that should be used for the specified value type.
bool useLoadStackGuardNode(const Module &M) const override
If this function returns true, SelectionDAGBuilder emits a LOAD_STACK_GUARD node when it is lowering ...
bool lowerInterleavedLoad(Instruction *Load, Value *Mask, ArrayRef< ShuffleVectorInst * > Shuffles, ArrayRef< unsigned > Indices, unsigned Factor, const APInt &GapMask) const override
Lower an interleaved load into a vldN intrinsic.
std::pair< const TargetRegisterClass *, uint8_t > findRepresentativeClass(const TargetRegisterInfo *TRI, MVT VT) const override
Return the largest legal super-reg register class of the register class for the specified type and it...
bool isZExtFree(SDValue Val, EVT VT2) const override
Return true if zero-extending the specific node Val to type VT2 is free (either because it's implicit...
bool isCheapToSpeculateCttz(Type *Ty) const override
Return true if it is cheap to speculate a call to intrinsic cttz.
bool shouldReassociateReduction(unsigned Opc, EVT VT) const override
SDValue PerformDAGCombine(SDNode *N, DAGCombinerInfo &DCI) const override
This method will be invoked for all target nodes and for any target-independent nodes that the target...
bool convertSetCCLogicToBitwiseLogic(EVT VT) const override
Use bitwise logic to make pairs of compares more efficient.
bool isCheapToSpeculateCtlz(Type *Ty) const override
Return true if it is cheap to speculate a call to intrinsic ctlz.
bool targetShrinkDemandedConstant(SDValue Op, const APInt &DemandedBits, const APInt &DemandedElts, TargetLoweringOpt &TLO) const override
bool isComplexDeinterleavingOperationSupported(ComplexDeinterleavingOperation Operation, Type *Ty) const override
Does this target support complex deinterleaving with the given operation and type.
SDValue PerformBRCONDCombine(SDNode *N, SelectionDAG &DAG) const
PerformBRCONDCombine - Target-specific DAG combining for ARMISD::BRCOND.
const char * getTargetNodeName(unsigned Opcode) const override
This method returns the name of a target specific DAG node.
Register getExceptionSelectorRegister(const Constant *PersonalityFn) const override
If a physical register, this returns the register that receives the exception typeid on entry to a la...
Type * shouldConvertSplatType(ShuffleVectorInst *SVI) const override
Given a shuffle vector SVI representing a vector splat, return a new scalar type of size equal to SVI...
Value * emitLoadLinked(IRBuilderBase &Builder, Type *ValueTy, Value *Addr, AtomicOrdering Ord) const override
Perform a load-linked operation on Addr, returning a "Value *" with the corresponding pointee type.
Instruction * makeDMB(IRBuilderBase &Builder, ARM_MB::MemBOpt Domain) const
bool isLegalICmpImmediate(int64_t Imm) const override
isLegalICmpImmediate - Return true if the specified immediate is legal icmp immediate,...
const char * LowerXConstraint(EVT ConstraintVT) const override
Try to replace an X constraint, which matches anything, with another that has more specific requireme...
unsigned getJumpTableEncoding() const override
Return the entry encoding for a jump table in the current function.
bool isDesirableToTransformToIntegerOp(unsigned Opc, EVT VT) const override
Return true if it is profitable for dag combiner to transform a floating point op of specified opcode...
TargetLoweringBase::AtomicExpansionKind shouldExpandAtomicCmpXchgInIR(AtomicCmpXchgInst *AI) const override
Returns how the given atomic cmpxchg should be expanded by the IR-level AtomicExpand pass.
CCAssignFn * CCAssignFnForCall(CallingConv::ID CC, bool isVarArg) const
bool allowsMisalignedMemoryAccesses(EVT VT, unsigned AddrSpace, Align Alignment, MachineMemOperand::Flags Flags, unsigned *Fast) const override
allowsMisalignedMemoryAccesses - Returns true if the target allows unaligned memory accesses of the s...
bool isLegalInterleavedAccessType(unsigned Factor, FixedVectorType *VecTy, Align Alignment, const DataLayout &DL) const
Returns true if VecTy is a legal interleaved access type.
bool isVectorLoadExtDesirable(SDValue ExtVal) const override
Return true if folding a vector load into ExtVal (a sign, zero, or any extend node) is profitable.
bool canCombineStoreAndExtract(Type *VectorTy, Value *Idx, unsigned &Cost) const override
Return true if the target can combine store(extractelement VectorTy, Idx).
bool preferZeroCompareBranch() const override
Return true if the heuristic to prefer icmp eq zero should be used in code gen prepare.
bool canMergeStoresTo(unsigned AddressSpace, EVT MemVT, const MachineFunction &MF) const override
Returns if it's reasonable to merge stores to MemVT size.
bool useSoftFloat() const override
bool alignLoopsWithOptSize() const override
Should loops be aligned even when the function is marked OptSize (but not MinSize).
SDValue PerformCMOVToBFICombine(SDNode *N, SelectionDAG &DAG) const
bool allowTruncateForTailCall(Type *Ty1, Type *Ty2) const override
Return true if a truncation from FromTy to ToTy is permitted when deciding whether a call is in tail ...
void LowerAsmOperandForConstraint(SDValue Op, StringRef Constraint, std::vector< SDValue > &Ops, SelectionDAG &DAG) const override
LowerAsmOperandForConstraint - Lower the specified operand into the Ops vector.
bool hasAndNotCompare(SDValue V) const override
Return true if the target should transform: (X & Y) == Y —> (~X & Y) == 0 (X & Y) !...
std::pair< unsigned, const TargetRegisterClass * > getRegForInlineAsmConstraint(const TargetRegisterInfo *TRI, StringRef Constraint, MVT VT) const override
Given a physical register constraint (e.g.
bool shouldConvertFpToSat(unsigned Op, EVT FPVT, EVT VT) const override
Should we generate fp_to_si_sat and fp_to_ui_sat from type FPVT to type VT from min(max(fptoi)) satur...
bool functionArgumentNeedsConsecutiveRegisters(Type *Ty, CallingConv::ID CallConv, bool isVarArg, const DataLayout &DL) const override
Returns true if an argument of type Ty needs to be passed in a contiguous block of registers in calli...
bool isOffsetFoldingLegal(const GlobalAddressSDNode *GA) const override
Return true if folding a constant offset with the given GlobalAddress is legal.
const ARMBaseTargetMachine & getTM() const
bool isMaskAndCmp0FoldingBeneficial(const Instruction &AndI) const override
Return if the target supports combining a chain like:
bool softPromoteHalfType() const override
bool hasStandaloneRem(EVT VT) const override
Return true if the target can handle a standalone remainder operation.
ShiftLegalizationStrategy preferredShiftLegalizationStrategy(SelectionDAG &DAG, SDNode *N, unsigned ExpansionFactor) const override
bool getPostIndexedAddressParts(SDNode *N, SDNode *Op, SDValue &Base, SDValue &Offset, ISD::MemIndexedMode &AM, SelectionDAG &DAG) const override
getPostIndexedAddressParts - returns true by value, base pointer and offset pointer and addressing mo...
Instruction * emitLeadingFence(IRBuilderBase &Builder, Instruction *Inst, AtomicOrdering Ord) const override
Inserts in the IR a target-specific intrinsic specifying a fence.
ArrayRef - Represent a constant reference to an array (0 or more elements consecutively in memory),...
Definition: ArrayRef.h:41
An instruction that atomically checks whether a specified value is in a memory location,...
Definition: Instructions.h:506
an instruction that atomically reads a memory location, combines it with another value,...
Definition: Instructions.h:709
CCState - This class holds information needed while lowering arguments and return values.
CCValAssign - Represent assignment of one arg/retval to a location.
This class represents a function call, abstracting a target machine's calling convention.
This is an important base class in LLVM.
Definition: Constant.h:43
This class represents an Operation in the Expression.
A parsed version of the target data layout string in and methods for querying it.
Definition: DataLayout.h:63
This is a fast-path instruction selection class that generates poor code and doesn't support illegal ...
Definition: FastISel.h:66
Class to represent fixed width SIMD vectors.
Definition: DerivedTypes.h:592
FunctionLoweringInfo - This contains information that is global to a function that is used when lower...
CallingConv::ID getCallingConv() const
getCallingConv()/setCallingConv(CC) - These method get and set the calling convention of this functio...
Definition: Function.h:270
bool hasFnAttribute(Attribute::AttrKind Kind) const
Return true if the function has the attribute.
Definition: Function.cpp:727
Common base class shared among various IRBuilders.
Definition: IRBuilder.h:114
Itinerary data supplied by a subtarget to be used by a target.
This is an important class for using LLVM in a threaded context.
Definition: LLVMContext.h:68
An instruction for reading from memory.
Definition: Instructions.h:180
Machine Value Type.
Function & getFunction()
Return the LLVM function that this machine code represents.
Representation of each machine instruction.
Definition: MachineInstr.h:72
Flags
Flags values. These may be or'd together.
A Module instance is used to store all the information related to an LLVM module.
Definition: Module.h:67
Wrapper class representing virtual and physical registers.
Definition: Register.h:19
Wrapper class for IR location info (IR ordering and DebugLoc) to be passed into SDNode creation funct...
Represents one node in the SelectionDAG.
Unlike LLVM values, Selection DAG nodes may return multiple values as the result of a computation.
This is used to represent a portion of an LLVM function in a low-level Data Dependence DAG representa...
Definition: SelectionDAG.h:229
This instruction constructs a fixed permutation of two input vectors.
This class consists of common code factored out of the SmallVector class to reduce code duplication b...
Definition: SmallVector.h:574
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
Definition: SmallVector.h:1197
An instruction for storing to memory.
Definition: Instructions.h:296
StringRef - Represent a constant reference to a string, i.e.
Definition: StringRef.h:55
constexpr size_t size() const
size - Get the string size.
Definition: StringRef.h:154
Provides information about what library functions are available for the current target.
LegalizeAction
This enum indicates whether operations are valid for a target, and if not, what action should be used...
virtual bool shouldFormOverflowOp(unsigned Opcode, EVT VT, bool MathUsed) const
Try to convert math with an overflow comparison into the corresponding DAG node operation.
ShiftLegalizationStrategy
Return the preferred strategy to legalize tihs SHIFT instruction, with ExpansionFactor being the recu...
SelectSupportKind
Enum that describes what type of support for selects the target has.
Sched::Preference getSchedulingPreference() const
Return target scheduling preference.
AtomicExpansionKind
Enum that specifies what an atomic load/AtomicRMWInst is expanded to, if at all.
This class defines information used to lower LLVM code to legal SelectionDAG operators that the targe...
virtual InlineAsm::ConstraintCode getInlineAsmMemConstraint(StringRef ConstraintCode) const
Primary interface to the complete machine description for the target machine.
Definition: TargetMachine.h:83
TargetRegisterInfo base class - We assume that the target defines a static array of TargetRegisterDes...
The instances of the Type class are immutable: once they are created, they are never changed.
Definition: Type.h:45
LLVM Value Representation.
Definition: Value.h:75
Base class of all SIMD vector types.
Definition: DerivedTypes.h:430
bool isBitFieldInvertedMask(unsigned v)
const unsigned FPStatusBits
const unsigned FPReservedBits
Rounding
Possible values of current rounding mode, which is specified in bits 23:22 of FPSCR.
const unsigned RoundingBitsPos
FastISel * createFastISel(FunctionLoweringInfo &funcInfo, const TargetLibraryInfo *libInfo)
@ CXX_FAST_TLS
Used for access functions.
Definition: CallingConv.h:72
@ Fast
Attempts to make calls as fast as possible (e.g.
Definition: CallingConv.h:41
@ BUILTIN_OP_END
BUILTIN_OP_END - This must be the last enum value in this list.
Definition: ISDOpcodes.h:1568
@ VECREDUCE_ADD
Integer reductions may have a result type larger than the vector element type.
Definition: ISDOpcodes.h:1485
MemIndexedMode
MemIndexedMode enum - This enum defines the load / store indexed addressing modes.
Definition: ISDOpcodes.h:1634
CondCode
ISD::CondCode enum - These are ordered carefully to make the bitfields below work out,...
Definition: ISDOpcodes.h:1685
This is an optimization pass for GlobalISel generic memory operations.
Definition: AddressRanges.h:18
@ Offset
Definition: DWP.cpp:477
bool CCAssignFn(unsigned ValNo, MVT ValVT, MVT LocVT, CCValAssign::LocInfo LocInfo, ISD::ArgFlagsTy ArgFlags, Type *OrigTy, CCState &State)
CCAssignFn - This function assigns a location for Val, updating State to reflect the change.
AtomicOrdering
Atomic ordering for LLVM's memory model.
CombineLevel
Definition: DAGCombine.h:15
DWARFExpression::Operation Op
#define N
This struct is a compact representation of a valid (non-zero power of two) alignment.
Definition: Alignment.h:39
Extended Value Type.
Definition: ValueTypes.h:35
TypeSize getSizeInBits() const
Return the size of the specified value type in bits.
Definition: ValueTypes.h:368
bool isScalarInteger() const
Return true if this is an integer, but not a vector.
Definition: ValueTypes.h:157
This structure contains all information that is necessary for lowering calls.