#define DEBUG_TYPE "x86-instr-info"

#define GET_INSTRINFO_CTOR_DTOR
#include "X86GenInstrInfo.inc"
static cl::opt<bool> NoFusing(
    "disable-spill-fusing",
    cl::desc("Disable fusing of spill code into instructions"), cl::Hidden);

static cl::opt<bool> PrintFailedFusing(
    "print-failed-fuse-candidates",
    cl::desc("Print instructions that the allocator wants to"
             " fuse, but the X86 backend currently can't"),
    cl::Hidden);

static cl::opt<bool> ReMatPICStubLoad(
    "remat-pic-stub-load",
    cl::desc("Re-materialize load from stub in PIC mode"), cl::Hidden);

static cl::opt<unsigned> PartialRegUpdateClearance(
    "partial-reg-update-clearance",
    cl::desc("Clearance between two register writes "
             "for inserting XOR to avoid partial "
             "register update"),
    cl::Hidden);

static cl::opt<unsigned> UndefRegClearance(
    "undef-reg-clearance",
    cl::desc("How many idle instructions we would like before "
             "certain undef register reads"),
    cl::Hidden);
void X86InstrInfo::anchor() {}

X86InstrInfo::X86InstrInfo(X86Subtarget &STI)
    : X86GenInstrInfo((STI.isTarget64BitLP64() ? X86::ADJCALLSTACKDOWN64
                                               : X86::ADJCALLSTACKDOWN32),
                      (STI.isTarget64BitLP64() ? X86::ADJCALLSTACKUP64
                                               : X86::ADJCALLSTACKUP32)),
      Subtarget(STI), RI(STI.getTargetTriple()) {}
  if (!RC || !Subtarget.hasEGPR())

bool X86InstrInfo::isCoalescableExtInstr(const MachineInstr &MI,
                                         Register &SrcReg, Register &DstReg,
                                         unsigned &SubIdx) const {
  switch (MI.getOpcode()) {
  case X86::MOVSX16rr8:
  case X86::MOVZX16rr8:
  case X86::MOVSX32rr8:
  case X86::MOVZX32rr8:
  case X86::MOVSX64rr8:
    if (!Subtarget.is64Bit())
      return false;
    [[fallthrough]];
  case X86::MOVSX32rr16:
  case X86::MOVZX32rr16:
  case X86::MOVSX64rr16:
  case X86::MOVSX64rr32: {
    if (MI.getOperand(0).getSubReg() || MI.getOperand(1).getSubReg())
      return false;
    SrcReg = MI.getOperand(1).getReg();
    DstReg = MI.getOperand(0).getReg();
    switch (MI.getOpcode()) {
    case X86::MOVSX16rr8:
    case X86::MOVZX16rr8:
    case X86::MOVSX32rr8:
    case X86::MOVZX32rr8:
    case X86::MOVSX64rr8:
      SubIdx = X86::sub_8bit;
      break;
    case X86::MOVSX32rr16:
    case X86::MOVZX32rr16:
    case X86::MOVSX64rr16:
      SubIdx = X86::sub_16bit;
      break;
    case X86::MOVSX64rr32:
      SubIdx = X86::sub_32bit;
      break;
  if (MI.mayLoad() || MI.mayStore())
  if (MI.isCopyLike() || MI.isInsertSubreg())
  unsigned Opcode = MI.getOpcode();
  if (isBSF(Opcode) || isBSR(Opcode) || isLZCNT(Opcode) || isPOPCNT(Opcode) ||
  if (isBLCFILL(Opcode) || isBLCI(Opcode) || isBLCIC(Opcode) ||
      isBLCMSK(Opcode) || isBLCS(Opcode) || isBLSFILL(Opcode) ||
      isBLSI(Opcode) || isBLSIC(Opcode) || isBLSMSK(Opcode) || isBLSR(Opcode) ||
  if (isBEXTR(Opcode) || isBZHI(Opcode))
  if (isROL(Opcode) || isROR(Opcode) || isSAR(Opcode) || isSHL(Opcode) ||
      isSHR(Opcode) || isSHLD(Opcode) || isSHRD(Opcode))
  if (isADC(Opcode) || isADD(Opcode) || isAND(Opcode) || isOR(Opcode) ||
      isSBB(Opcode) || isSUB(Opcode) || isXOR(Opcode))
  if (isDEC(Opcode) || isINC(Opcode) || isNEG(Opcode))
  if (isMOVSX(Opcode) || isMOVZX(Opcode) || isMOVSXD(Opcode) || isMOV(Opcode))
  if (isRORX(Opcode) || isSARX(Opcode) || isSHLX(Opcode) || isSHRX(Opcode))
  switch (MI.getOpcode()) {
243 case X86::IMUL64rmi32:
258 case X86::POPCNT16rm:
259 case X86::POPCNT32rm:
260 case X86::POPCNT64rm:
268 case X86::BLCFILL32rm:
269 case X86::BLCFILL64rm:
274 case X86::BLCMSK32rm:
275 case X86::BLCMSK64rm:
278 case X86::BLSFILL32rm:
279 case X86::BLSFILL64rm:
284 case X86::BLSMSK32rm:
285 case X86::BLSMSK64rm:
295 case X86::BEXTRI32mi:
296 case X86::BEXTRI64mi:
349 case X86::CVTTSD2SI64rm:
350 case X86::VCVTTSD2SI64rm:
351 case X86::VCVTTSD2SI64Zrm:
352 case X86::CVTTSD2SIrm:
353 case X86::VCVTTSD2SIrm:
354 case X86::VCVTTSD2SIZrm:
355 case X86::CVTTSS2SI64rm:
356 case X86::VCVTTSS2SI64rm:
357 case X86::VCVTTSS2SI64Zrm:
358 case X86::CVTTSS2SIrm:
359 case X86::VCVTTSS2SIrm:
360 case X86::VCVTTSS2SIZrm:
361 case X86::CVTSI2SDrm:
362 case X86::VCVTSI2SDrm:
363 case X86::VCVTSI2SDZrm:
364 case X86::CVTSI2SSrm:
365 case X86::VCVTSI2SSrm:
366 case X86::VCVTSI2SSZrm:
367 case X86::CVTSI642SDrm:
368 case X86::VCVTSI642SDrm:
369 case X86::VCVTSI642SDZrm:
370 case X86::CVTSI642SSrm:
371 case X86::VCVTSI642SSrm:
372 case X86::VCVTSI642SSZrm:
373 case X86::CVTSS2SDrm:
374 case X86::VCVTSS2SDrm:
375 case X86::VCVTSS2SDZrm:
376 case X86::CVTSD2SSrm:
377 case X86::VCVTSD2SSrm:
378 case X86::VCVTSD2SSZrm:
380 case X86::VCVTTSD2USI64Zrm:
381 case X86::VCVTTSD2USIZrm:
382 case X86::VCVTTSS2USI64Zrm:
383 case X86::VCVTTSS2USIZrm:
384 case X86::VCVTUSI2SDZrm:
385 case X86::VCVTUSI642SDZrm:
386 case X86::VCVTUSI2SSZrm:
387 case X86::VCVTUSI642SSZrm:
391 case X86::MOV8rm_NOREX:
395 case X86::MOVSX16rm8:
396 case X86::MOVSX32rm16:
397 case X86::MOVSX32rm8:
398 case X86::MOVSX32rm8_NOREX:
399 case X86::MOVSX64rm16:
400 case X86::MOVSX64rm32:
401 case X86::MOVSX64rm8:
402 case X86::MOVZX16rm8:
403 case X86::MOVZX32rm16:
404 case X86::MOVZX32rm8:
405 case X86::MOVZX32rm8_NOREX:
406 case X86::MOVZX64rm16:
407 case X86::MOVZX64rm8:
  if (isFrameInstr(MI)) {
    if (!isFrameSetup(MI))

  for (auto E = MBB->end(); I != E; ++I) {
    if (I->getOpcode() == getCallFrameDestroyOpcode() || I->isCall())
    if (I->getOpcode() != getCallFrameDestroyOpcode())
      return -(I->getOperand(1).getImm());

  switch (MI.getOpcode()) {

                                           int &FrameIndex) const {
484 case X86::KMOVBkm_EVEX:
489 case X86::KMOVWkm_EVEX:
491 case X86::VMOVSHZrm_alt:
496 case X86::MOVSSrm_alt:
498 case X86::VMOVSSrm_alt:
500 case X86::VMOVSSZrm_alt:
502 case X86::KMOVDkm_EVEX:
508 case X86::MOVSDrm_alt:
510 case X86::VMOVSDrm_alt:
512 case X86::VMOVSDZrm_alt:
513 case X86::MMX_MOVD64rm:
514 case X86::MMX_MOVQ64rm:
516 case X86::KMOVQkm_EVEX:
531 case X86::VMOVAPSZ128rm:
532 case X86::VMOVUPSZ128rm:
533 case X86::VMOVAPSZ128rm_NOVLX:
534 case X86::VMOVUPSZ128rm_NOVLX:
535 case X86::VMOVAPDZ128rm:
536 case X86::VMOVUPDZ128rm:
537 case X86::VMOVDQU8Z128rm:
538 case X86::VMOVDQU16Z128rm:
539 case X86::VMOVDQA32Z128rm:
540 case X86::VMOVDQU32Z128rm:
541 case X86::VMOVDQA64Z128rm:
542 case X86::VMOVDQU64Z128rm:
545 case X86::VMOVAPSYrm:
546 case X86::VMOVUPSYrm:
547 case X86::VMOVAPDYrm:
548 case X86::VMOVUPDYrm:
549 case X86::VMOVDQAYrm:
550 case X86::VMOVDQUYrm:
551 case X86::VMOVAPSZ256rm:
552 case X86::VMOVUPSZ256rm:
553 case X86::VMOVAPSZ256rm_NOVLX:
554 case X86::VMOVUPSZ256rm_NOVLX:
555 case X86::VMOVAPDZ256rm:
556 case X86::VMOVUPDZ256rm:
557 case X86::VMOVDQU8Z256rm:
558 case X86::VMOVDQU16Z256rm:
559 case X86::VMOVDQA32Z256rm:
560 case X86::VMOVDQU32Z256rm:
561 case X86::VMOVDQA64Z256rm:
562 case X86::VMOVDQU64Z256rm:
565 case X86::VMOVAPSZrm:
566 case X86::VMOVUPSZrm:
567 case X86::VMOVAPDZrm:
568 case X86::VMOVUPDZrm:
569 case X86::VMOVDQU8Zrm:
570 case X86::VMOVDQU16Zrm:
571 case X86::VMOVDQA32Zrm:
572 case X86::VMOVDQU32Zrm:
573 case X86::VMOVDQA64Zrm:
574 case X86::VMOVDQU64Zrm:
586 case X86::KMOVBmk_EVEX:
591 case X86::KMOVWmk_EVEX:
600 case X86::KMOVDmk_EVEX:
608 case X86::MMX_MOVD64mr:
609 case X86::MMX_MOVQ64mr:
610 case X86::MMX_MOVNTQmr:
612 case X86::KMOVQmk_EVEX:
627 case X86::VMOVUPSZ128mr:
628 case X86::VMOVAPSZ128mr:
629 case X86::VMOVUPSZ128mr_NOVLX:
630 case X86::VMOVAPSZ128mr_NOVLX:
631 case X86::VMOVUPDZ128mr:
632 case X86::VMOVAPDZ128mr:
633 case X86::VMOVDQA32Z128mr:
634 case X86::VMOVDQU32Z128mr:
635 case X86::VMOVDQA64Z128mr:
636 case X86::VMOVDQU64Z128mr:
637 case X86::VMOVDQU8Z128mr:
638 case X86::VMOVDQU16Z128mr:
641 case X86::VMOVUPSYmr:
642 case X86::VMOVAPSYmr:
643 case X86::VMOVUPDYmr:
644 case X86::VMOVAPDYmr:
645 case X86::VMOVDQUYmr:
646 case X86::VMOVDQAYmr:
647 case X86::VMOVUPSZ256mr:
648 case X86::VMOVAPSZ256mr:
649 case X86::VMOVUPSZ256mr_NOVLX:
650 case X86::VMOVAPSZ256mr_NOVLX:
651 case X86::VMOVUPDZ256mr:
652 case X86::VMOVAPDZ256mr:
653 case X86::VMOVDQU8Z256mr:
654 case X86::VMOVDQU16Z256mr:
655 case X86::VMOVDQA32Z256mr:
656 case X86::VMOVDQU32Z256mr:
657 case X86::VMOVDQA64Z256mr:
658 case X86::VMOVDQU64Z256mr:
661 case X86::VMOVUPSZmr:
662 case X86::VMOVAPSZmr:
663 case X86::VMOVUPDZmr:
664 case X86::VMOVAPDZmr:
665 case X86::VMOVDQU8Zmr:
666 case X86::VMOVDQU16Zmr:
667 case X86::VMOVDQA32Zmr:
668 case X86::VMOVDQU32Zmr:
669 case X86::VMOVDQA64Zmr:
670 case X86::VMOVDQU64Zmr:
                                           int &FrameIndex) const {
  if (MI.getOperand(0).getSubReg() == 0 && isFrameOperand(MI, 1, FrameIndex))
    return MI.getOperand(0).getReg();

                                           int &FrameIndex) const {
    return MI.getOperand(0).getReg();

                                          int &FrameIndex) const {
      isFrameOperand(MI, 0, FrameIndex))

                                          int &FrameIndex) const {
  if (!BaseReg.isVirtual())
  bool isPICBase = false;
    if (DefMI.getOpcode() != X86::MOVPC32r)
    assert(!isPICBase && "More than one PIC base?");

  switch (MI.getOpcode()) {
767 case X86::IMPLICIT_DEF:
770 case X86::LOAD_STACK_GUARD:
777 case X86::AVX1_SETALLONES:
778 case X86::AVX2_SETALLONES:
779 case X86::AVX512_128_SET0:
780 case X86::AVX512_256_SET0:
781 case X86::AVX512_512_SET0:
782 case X86::AVX512_512_SETALLONES:
783 case X86::AVX512_FsFLD0SD:
784 case X86::AVX512_FsFLD0SH:
785 case X86::AVX512_FsFLD0SS:
786 case X86::AVX512_FsFLD0F128:
791 case X86::FsFLD0F128:
799 case X86::MOV32ImmSExti8:
804 case X86::MOV64ImmSExti8:
806 case X86::V_SETALLONES:
812 case X86::PTILEZEROV:
816 case X86::MOV8rm_NOREX:
821 case X86::MOVSSrm_alt:
823 case X86::MOVSDrm_alt:
831 case X86::VMOVSSrm_alt:
833 case X86::VMOVSDrm_alt:
840 case X86::VMOVAPSYrm:
841 case X86::VMOVUPSYrm:
842 case X86::VMOVAPDYrm:
843 case X86::VMOVUPDYrm:
844 case X86::VMOVDQAYrm:
845 case X86::VMOVDQUYrm:
846 case X86::MMX_MOVD64rm:
847 case X86::MMX_MOVQ64rm:
848 case X86::VBROADCASTSSrm:
849 case X86::VBROADCASTSSYrm:
850 case X86::VBROADCASTSDYrm:
852 case X86::VPBROADCASTBZ128rm:
853 case X86::VPBROADCASTBZ256rm:
854 case X86::VPBROADCASTBZrm:
855 case X86::VBROADCASTF32X2Z256rm:
856 case X86::VBROADCASTF32X2Zrm:
857 case X86::VBROADCASTI32X2Z128rm:
858 case X86::VBROADCASTI32X2Z256rm:
859 case X86::VBROADCASTI32X2Zrm:
860 case X86::VPBROADCASTWZ128rm:
861 case X86::VPBROADCASTWZ256rm:
862 case X86::VPBROADCASTWZrm:
863 case X86::VPBROADCASTDZ128rm:
864 case X86::VPBROADCASTDZ256rm:
865 case X86::VPBROADCASTDZrm:
866 case X86::VBROADCASTSSZ128rm:
867 case X86::VBROADCASTSSZ256rm:
868 case X86::VBROADCASTSSZrm:
869 case X86::VPBROADCASTQZ128rm:
870 case X86::VPBROADCASTQZ256rm:
871 case X86::VPBROADCASTQZrm:
872 case X86::VBROADCASTSDZ256rm:
873 case X86::VBROADCASTSDZrm:
875 case X86::VMOVSSZrm_alt:
877 case X86::VMOVSDZrm_alt:
879 case X86::VMOVSHZrm_alt:
880 case X86::VMOVAPDZ128rm:
881 case X86::VMOVAPDZ256rm:
882 case X86::VMOVAPDZrm:
883 case X86::VMOVAPSZ128rm:
884 case X86::VMOVAPSZ256rm:
885 case X86::VMOVAPSZ128rm_NOVLX:
886 case X86::VMOVAPSZ256rm_NOVLX:
887 case X86::VMOVAPSZrm:
888 case X86::VMOVDQA32Z128rm:
889 case X86::VMOVDQA32Z256rm:
890 case X86::VMOVDQA32Zrm:
891 case X86::VMOVDQA64Z128rm:
892 case X86::VMOVDQA64Z256rm:
893 case X86::VMOVDQA64Zrm:
894 case X86::VMOVDQU16Z128rm:
895 case X86::VMOVDQU16Z256rm:
896 case X86::VMOVDQU16Zrm:
897 case X86::VMOVDQU32Z128rm:
898 case X86::VMOVDQU32Z256rm:
899 case X86::VMOVDQU32Zrm:
900 case X86::VMOVDQU64Z128rm:
901 case X86::VMOVDQU64Z256rm:
902 case X86::VMOVDQU64Zrm:
903 case X86::VMOVDQU8Z128rm:
904 case X86::VMOVDQU8Z256rm:
905 case X86::VMOVDQU8Zrm:
906 case X86::VMOVUPDZ128rm:
907 case X86::VMOVUPDZ256rm:
908 case X86::VMOVUPDZrm:
909 case X86::VMOVUPSZ128rm:
910 case X86::VMOVUPSZ256rm:
911 case X86::VMOVUPSZ128rm_NOVLX:
912 case X86::VMOVUPSZ256rm_NOVLX:
  case X86::VMOVUPSZrm: {
        MI.isDereferenceableInvariantLoad()) {
      if (BaseReg == 0 || BaseReg == X86::RIP)

  if (ClobbersEFLAGS &&
      MBB.computeRegisterLiveness(&TRI, X86::EFLAGS, I) !=

    if (MO.isReg() && MO.isDef() && MO.getReg() == X86::EFLAGS &&

                                       unsigned ShiftAmtOperandIdx) {
  unsigned ShiftCountMask = (MI.getDesc().TSFlags & X86II::REX_W) ? 63 : 31;
  unsigned Imm = MI.getOperand(ShiftAmtOperandIdx).getImm();
  return Imm & ShiftCountMask;

  return ShAmt < 4 && ShAmt > 0;
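// --- Illustrative sketch (not part of the original file) ---
// The ShiftCountMask above models how x86 hardware truncates shift counts:
// 64-bit (REX.W) shifts keep only the low 6 bits of the count, other GPR
// shifts keep the low 5 bits. A minimal standalone helper (hypothetical name):
static unsigned truncateShiftCountExample(unsigned Imm, bool IsRexW) {
  unsigned ShiftCountMask = IsRexW ? 63 : 31; // 6 bits vs. 5 bits of count
  return Imm & ShiftCountMask;                // e.g. (65, false) -> 1
}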
                                  bool &NoSignFlag, bool &ClearsOverflowFlag) {
  if (!(CmpValDefInstr.getOpcode() == X86::SUBREG_TO_REG &&
        CmpInstr.getOpcode() == X86::TEST64rr) &&
      !(CmpValDefInstr.getOpcode() == X86::COPY &&
         "CmpInstr is an analyzable TEST16rr/TEST64rr, and "
         "`X86InstrInfo::analyzeCompare` requires two reg operands are the"
         "Caller guarantees that TEST64rr is a user of SUBREG_TO_REG or TEST16rr "
         "is a user of COPY sub16bit.");
  if (CmpInstr.getOpcode() == X86::TEST16rr) {
    if (!((VregDefInstr->getOpcode() == X86::AND32ri ||
           VregDefInstr->getOpcode() == X86::AND64ri32) &&
  if (CmpInstr.getOpcode() == X86::TEST64rr) {
  assert(VregDefInstr && "Must have a definition (SSA)");
  if (X86::isAND(VregDefInstr->getOpcode()) &&
    if (Instr.modifiesRegister(X86::EFLAGS, TRI))
  *AndInstr = VregDefInstr;
  ClearsOverflowFlag = true;
                                      unsigned &NewSrcSubReg, bool &isKill,
      RC = Opc != X86::LEA32r ? &X86::GR64RegClass : &X86::GR32RegClass;
      RC = Opc != X86::LEA32r ? &X86::GR64_NOSPRegClass
                              : &X86::GR32_NOSPRegClass;
  unsigned SubReg = Src.getSubReg();
  isKill = MI.killsRegister(SrcReg, nullptr);
  NewSrcSubReg = X86::NoSubRegister;
  if (Opc != X86::LEA64_32r) {
    assert(!Src.isUndef() && "Undef op doesn't need optimization");
    assert(!Src.isUndef() && "Undef op doesn't need optimization");
    NewSrcSubReg = X86::NoSubRegister;
MachineInstr *X86InstrInfo::convertToThreeAddressWithLEA(
    unsigned MIOpc,
    bool Is8BitOp) const {
          RegInfo.getTargetRegisterInfo()->getRegSizeInBits(
              *RegInfo.getRegClass(MI.getOperand(0).getReg())) == 16) &&
         "Unexpected type for LEA transform");
  if (!Subtarget.is64Bit())
  unsigned Opcode = X86::LEA64_32r;
  Register InRegLEA = RegInfo.createVirtualRegister(&X86::GR64_NOSPRegClass);
  Register OutRegLEA = RegInfo.createVirtualRegister(&X86::GR32RegClass);
  unsigned SrcSubReg = MI.getOperand(1).getSubReg();
  unsigned Src2SubReg;
  bool IsDead = MI.getOperand(0).isDead();
  bool IsKill = MI.getOperand(1).isKill();
  unsigned SubReg = Is8BitOp ? X86::sub_8bit : X86::sub_16bit;
  assert(!MI.getOperand(1).isUndef() && "Undef op doesn't need optimization");

#define CASE_NF(OP) \

    unsigned ShAmt = MI.getOperand(2).getImm();
  case X86::ADD8ri_DB:
  case X86::ADD16ri_DB:
  case X86::ADD8rr_DB:
  case X86::ADD16rr_DB: {
    Src2 = MI.getOperand(2).getReg();
    Src2SubReg = MI.getOperand(2).getSubReg();
    bool IsKill2 = MI.getOperand(2).isKill();
    assert(!MI.getOperand(2).isUndef() && "Undef op doesn't need optimization");
      addRegReg(MIB, InRegLEA, true, X86::NoSubRegister, InRegLEA, false,
                X86::NoSubRegister);
    if (Subtarget.is64Bit())
      ImpDef2 = BuildMI(MBB, &*MIB, MI.getDebugLoc(), get(X86::IMPLICIT_DEF),
      InsMI2 = BuildMI(MBB, &*MIB, MI.getDebugLoc(), get(TargetOpcode::COPY))
      addRegReg(MIB, InRegLEA, true, X86::NoSubRegister, InRegLEA2, true,
                X86::NoSubRegister);
    if (LV && IsKill2 && InsMI2)
  MachineInstr *NewMI = MIB;
  MachineInstr *ExtMI =
    LiveRange::Segment *DestSeg =

  if (MI.getNumOperands() > 2)
    if (MI.getOperand(2).isReg() && MI.getOperand(2).isUndef())
  unsigned SrcSubReg, SrcSubReg2;
  bool Is64Bit = Subtarget.is64Bit();
  bool Is8BitOp = false;
  unsigned NumRegOperands = 2;
  unsigned MIOpc = MI.getOpcode();
    assert(MI.getNumOperands() >= 3 && "Unknown shift instruction!");
                                  Src.getReg(), &X86::GR64_NOSPRegClass))
    NewMI = BuildMI(MF, MI.getDebugLoc(), get(X86::LEA64r))
    assert(MI.getNumOperands() >= 3 && "Unknown shift instruction!");
    unsigned Opc = Is64Bit ? X86::LEA64_32r : X86::LEA32r;
                        isKill, ImplicitOp, LV, LIS))
    if (ImplicitOp.getReg() != 0)
      MIB.add(ImplicitOp);
    if (LV && SrcReg != Src.getReg())
    assert(MI.getNumOperands() >= 3 && "Unknown shift instruction!");
    return convertToThreeAddressWithLEA(MIOpc, MI, LV, LIS, Is8BitOp);
    assert(MI.getNumOperands() >= 2 && "Unknown inc instruction!");
    unsigned Opc = (MIOpc == X86::INC64r || MIOpc == X86::INC64r_NF)
                       : (Is64Bit ? X86::LEA64_32r : X86::LEA32r);
                        isKill, ImplicitOp, LV, LIS))
    if (ImplicitOp.getReg() != 0)
      MIB.add(ImplicitOp);
    if (LV && SrcReg != Src.getReg())
    assert(MI.getNumOperands() >= 2 && "Unknown dec instruction!");
    unsigned Opc = (MIOpc == X86::DEC64r || MIOpc == X86::DEC64r_NF)
                       : (Is64Bit ? X86::LEA64_32r : X86::LEA32r);
                        isKill, ImplicitOp, LV, LIS))
    if (ImplicitOp.getReg() != 0)
      MIB.add(ImplicitOp);
    if (LV && SrcReg != Src.getReg())
    return convertToThreeAddressWithLEA(MIOpc, MI, LV, LIS, Is8BitOp);
  case X86::ADD64rr_DB:
  case X86::ADD32rr_DB: {
    assert(MI.getNumOperands() >= 3 && "Unknown add instruction!");
    if (MIOpc == X86::ADD64rr || MIOpc == X86::ADD64rr_NF ||
        MIOpc == X86::ADD64rr_DB)
      Opc = Is64Bit ? X86::LEA64_32r : X86::LEA32r;
                          isKill2, ImplicitOp2, LV, LIS))
    if (Src.getReg() == Src2.getReg()) {
      SrcSubReg = SrcSubReg2;
                          isKill, ImplicitOp, LV, LIS))
    if (ImplicitOp.getReg() != 0)
      MIB.add(ImplicitOp);
    if (ImplicitOp2.getReg() != 0)
      MIB.add(ImplicitOp2);
    addRegReg(MIB, SrcReg, isKill, SrcSubReg, SrcReg2, isKill2, SrcSubReg2);
    if (SrcReg2 != Src2.getReg())
    if (SrcReg != SrcReg2 && SrcReg != Src.getReg())
  case X86::ADD8rr_DB:
  case X86::ADD16rr_DB:
    return convertToThreeAddressWithLEA(MIOpc, MI, LV, LIS, Is8BitOp);
  case X86::ADD64ri32_DB:
    assert(MI.getNumOperands() >= 3 && "Unknown add instruction!");
        BuildMI(MF, MI.getDebugLoc(), get(X86::LEA64r)).add(Dest).add(Src),
  case X86::ADD32ri_DB: {
    assert(MI.getNumOperands() >= 3 && "Unknown add instruction!");
    unsigned Opc = Is64Bit ? X86::LEA64_32r : X86::LEA32r;
                          isKill, ImplicitOp, LV, LIS))
    if (ImplicitOp.getReg() != 0)
      MIB.add(ImplicitOp);
    if (LV && SrcReg != Src.getReg())
  case X86::ADD8ri_DB:
  case X86::ADD16ri_DB:
    return convertToThreeAddressWithLEA(MIOpc, MI, LV, LIS, Is8BitOp);
    if (!MI.getOperand(2).isImm())
    int64_t Imm = MI.getOperand(2).getImm();
    assert(MI.getNumOperands() >= 3 && "Unknown add instruction!");
    unsigned Opc = Is64Bit ? X86::LEA64_32r : X86::LEA32r;
                          isKill, ImplicitOp, LV, LIS))
    if (ImplicitOp.getReg() != 0)
      MIB.add(ImplicitOp);
    if (LV && SrcReg != Src.getReg())
    if (!MI.getOperand(2).isImm())
    int64_t Imm = MI.getOperand(2).getImm();
    assert(MI.getNumOperands() >= 3 && "Unknown sub instruction!");
1710 case X86::VMOVDQU8Z128rmk:
1711 case X86::VMOVDQU8Z256rmk:
1712 case X86::VMOVDQU8Zrmk:
1713 case X86::VMOVDQU16Z128rmk:
1714 case X86::VMOVDQU16Z256rmk:
1715 case X86::VMOVDQU16Zrmk:
1716 case X86::VMOVDQU32Z128rmk:
1717 case X86::VMOVDQA32Z128rmk:
1718 case X86::VMOVDQU32Z256rmk:
1719 case X86::VMOVDQA32Z256rmk:
1720 case X86::VMOVDQU32Zrmk:
1721 case X86::VMOVDQA32Zrmk:
1722 case X86::VMOVDQU64Z128rmk:
1723 case X86::VMOVDQA64Z128rmk:
1724 case X86::VMOVDQU64Z256rmk:
1725 case X86::VMOVDQA64Z256rmk:
1726 case X86::VMOVDQU64Zrmk:
1727 case X86::VMOVDQA64Zrmk:
1728 case X86::VMOVUPDZ128rmk:
1729 case X86::VMOVAPDZ128rmk:
1730 case X86::VMOVUPDZ256rmk:
1731 case X86::VMOVAPDZ256rmk:
1732 case X86::VMOVUPDZrmk:
1733 case X86::VMOVAPDZrmk:
1734 case X86::VMOVUPSZ128rmk:
1735 case X86::VMOVAPSZ128rmk:
1736 case X86::VMOVUPSZ256rmk:
1737 case X86::VMOVAPSZ256rmk:
1738 case X86::VMOVUPSZrmk:
1739 case X86::VMOVAPSZrmk:
1740 case X86::VBROADCASTSDZ256rmk:
1741 case X86::VBROADCASTSDZrmk:
1742 case X86::VBROADCASTSSZ128rmk:
1743 case X86::VBROADCASTSSZ256rmk:
1744 case X86::VBROADCASTSSZrmk:
1745 case X86::VPBROADCASTDZ128rmk:
1746 case X86::VPBROADCASTDZ256rmk:
1747 case X86::VPBROADCASTDZrmk:
1748 case X86::VPBROADCASTQZ128rmk:
1749 case X86::VPBROADCASTQZ256rmk:
1750 case X86::VPBROADCASTQZrmk: {
1755 case X86::VMOVDQU8Z128rmk:
1756 Opc = X86::VPBLENDMBZ128rmk;
1758 case X86::VMOVDQU8Z256rmk:
1759 Opc = X86::VPBLENDMBZ256rmk;
1761 case X86::VMOVDQU8Zrmk:
1762 Opc = X86::VPBLENDMBZrmk;
1764 case X86::VMOVDQU16Z128rmk:
1765 Opc = X86::VPBLENDMWZ128rmk;
1767 case X86::VMOVDQU16Z256rmk:
1768 Opc = X86::VPBLENDMWZ256rmk;
1770 case X86::VMOVDQU16Zrmk:
1771 Opc = X86::VPBLENDMWZrmk;
1773 case X86::VMOVDQU32Z128rmk:
1774 Opc = X86::VPBLENDMDZ128rmk;
1776 case X86::VMOVDQU32Z256rmk:
1777 Opc = X86::VPBLENDMDZ256rmk;
1779 case X86::VMOVDQU32Zrmk:
1780 Opc = X86::VPBLENDMDZrmk;
1782 case X86::VMOVDQU64Z128rmk:
1783 Opc = X86::VPBLENDMQZ128rmk;
1785 case X86::VMOVDQU64Z256rmk:
1786 Opc = X86::VPBLENDMQZ256rmk;
1788 case X86::VMOVDQU64Zrmk:
1789 Opc = X86::VPBLENDMQZrmk;
1791 case X86::VMOVUPDZ128rmk:
1792 Opc = X86::VBLENDMPDZ128rmk;
1794 case X86::VMOVUPDZ256rmk:
1795 Opc = X86::VBLENDMPDZ256rmk;
1797 case X86::VMOVUPDZrmk:
1798 Opc = X86::VBLENDMPDZrmk;
1800 case X86::VMOVUPSZ128rmk:
1801 Opc = X86::VBLENDMPSZ128rmk;
1803 case X86::VMOVUPSZ256rmk:
1804 Opc = X86::VBLENDMPSZ256rmk;
1806 case X86::VMOVUPSZrmk:
1807 Opc = X86::VBLENDMPSZrmk;
1809 case X86::VMOVDQA32Z128rmk:
1810 Opc = X86::VPBLENDMDZ128rmk;
1812 case X86::VMOVDQA32Z256rmk:
1813 Opc = X86::VPBLENDMDZ256rmk;
1815 case X86::VMOVDQA32Zrmk:
1816 Opc = X86::VPBLENDMDZrmk;
1818 case X86::VMOVDQA64Z128rmk:
1819 Opc = X86::VPBLENDMQZ128rmk;
1821 case X86::VMOVDQA64Z256rmk:
1822 Opc = X86::VPBLENDMQZ256rmk;
1824 case X86::VMOVDQA64Zrmk:
1825 Opc = X86::VPBLENDMQZrmk;
1827 case X86::VMOVAPDZ128rmk:
1828 Opc = X86::VBLENDMPDZ128rmk;
1830 case X86::VMOVAPDZ256rmk:
1831 Opc = X86::VBLENDMPDZ256rmk;
1833 case X86::VMOVAPDZrmk:
1834 Opc = X86::VBLENDMPDZrmk;
1836 case X86::VMOVAPSZ128rmk:
1837 Opc = X86::VBLENDMPSZ128rmk;
1839 case X86::VMOVAPSZ256rmk:
1840 Opc = X86::VBLENDMPSZ256rmk;
1842 case X86::VMOVAPSZrmk:
1843 Opc = X86::VBLENDMPSZrmk;
1845 case X86::VBROADCASTSDZ256rmk:
1846 Opc = X86::VBLENDMPDZ256rmbk;
1848 case X86::VBROADCASTSDZrmk:
1849 Opc = X86::VBLENDMPDZrmbk;
1851 case X86::VBROADCASTSSZ128rmk:
1852 Opc = X86::VBLENDMPSZ128rmbk;
1854 case X86::VBROADCASTSSZ256rmk:
1855 Opc = X86::VBLENDMPSZ256rmbk;
1857 case X86::VBROADCASTSSZrmk:
1858 Opc = X86::VBLENDMPSZrmbk;
1860 case X86::VPBROADCASTDZ128rmk:
1861 Opc = X86::VPBLENDMDZ128rmbk;
1863 case X86::VPBROADCASTDZ256rmk:
1864 Opc = X86::VPBLENDMDZ256rmbk;
1866 case X86::VPBROADCASTDZrmk:
1867 Opc = X86::VPBLENDMDZrmbk;
1869 case X86::VPBROADCASTQZ128rmk:
1870 Opc = X86::VPBLENDMQZ128rmbk;
1872 case X86::VPBROADCASTQZ256rmk:
1873 Opc = X86::VPBLENDMQZ256rmbk;
1875 case X86::VPBROADCASTQZrmk:
1876 Opc = X86::VPBLENDMQZrmbk;
              .add(MI.getOperand(2))
              .add(MI.getOperand(3))
              .add(MI.getOperand(4))
              .add(MI.getOperand(5))
              .add(MI.getOperand(6))
              .add(MI.getOperand(7));
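// --- Illustrative sketch (not part of the original file) ---
// A masked load-move with a pass-through register and a masked blend compute
// the same per-element result; the blend form takes the pass-through as a
// separate source operand, which is what the rmk -> BLENDM rewrite above
// relies on. Scalar model of a single element (hypothetical helper):
static int maskedSelectExample(bool MaskBit, int NewValue, int PassThru) {
  return MaskBit ? NewValue : PassThru;
}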
1893 case X86::VMOVDQU8Z128rrk:
1894 case X86::VMOVDQU8Z256rrk:
1895 case X86::VMOVDQU8Zrrk:
1896 case X86::VMOVDQU16Z128rrk:
1897 case X86::VMOVDQU16Z256rrk:
1898 case X86::VMOVDQU16Zrrk:
1899 case X86::VMOVDQU32Z128rrk:
1900 case X86::VMOVDQA32Z128rrk:
1901 case X86::VMOVDQU32Z256rrk:
1902 case X86::VMOVDQA32Z256rrk:
1903 case X86::VMOVDQU32Zrrk:
1904 case X86::VMOVDQA32Zrrk:
1905 case X86::VMOVDQU64Z128rrk:
1906 case X86::VMOVDQA64Z128rrk:
1907 case X86::VMOVDQU64Z256rrk:
1908 case X86::VMOVDQA64Z256rrk:
1909 case X86::VMOVDQU64Zrrk:
1910 case X86::VMOVDQA64Zrrk:
1911 case X86::VMOVUPDZ128rrk:
1912 case X86::VMOVAPDZ128rrk:
1913 case X86::VMOVUPDZ256rrk:
1914 case X86::VMOVAPDZ256rrk:
1915 case X86::VMOVUPDZrrk:
1916 case X86::VMOVAPDZrrk:
1917 case X86::VMOVUPSZ128rrk:
1918 case X86::VMOVAPSZ128rrk:
1919 case X86::VMOVUPSZ256rrk:
1920 case X86::VMOVAPSZ256rrk:
1921 case X86::VMOVUPSZrrk:
1922 case X86::VMOVAPSZrrk: {
1927 case X86::VMOVDQU8Z128rrk:
1928 Opc = X86::VPBLENDMBZ128rrk;
1930 case X86::VMOVDQU8Z256rrk:
1931 Opc = X86::VPBLENDMBZ256rrk;
1933 case X86::VMOVDQU8Zrrk:
1934 Opc = X86::VPBLENDMBZrrk;
1936 case X86::VMOVDQU16Z128rrk:
1937 Opc = X86::VPBLENDMWZ128rrk;
1939 case X86::VMOVDQU16Z256rrk:
1940 Opc = X86::VPBLENDMWZ256rrk;
1942 case X86::VMOVDQU16Zrrk:
1943 Opc = X86::VPBLENDMWZrrk;
1945 case X86::VMOVDQU32Z128rrk:
1946 Opc = X86::VPBLENDMDZ128rrk;
1948 case X86::VMOVDQU32Z256rrk:
1949 Opc = X86::VPBLENDMDZ256rrk;
1951 case X86::VMOVDQU32Zrrk:
1952 Opc = X86::VPBLENDMDZrrk;
1954 case X86::VMOVDQU64Z128rrk:
1955 Opc = X86::VPBLENDMQZ128rrk;
1957 case X86::VMOVDQU64Z256rrk:
1958 Opc = X86::VPBLENDMQZ256rrk;
1960 case X86::VMOVDQU64Zrrk:
1961 Opc = X86::VPBLENDMQZrrk;
1963 case X86::VMOVUPDZ128rrk:
1964 Opc = X86::VBLENDMPDZ128rrk;
1966 case X86::VMOVUPDZ256rrk:
1967 Opc = X86::VBLENDMPDZ256rrk;
1969 case X86::VMOVUPDZrrk:
1970 Opc = X86::VBLENDMPDZrrk;
1972 case X86::VMOVUPSZ128rrk:
1973 Opc = X86::VBLENDMPSZ128rrk;
1975 case X86::VMOVUPSZ256rrk:
1976 Opc = X86::VBLENDMPSZ256rrk;
1978 case X86::VMOVUPSZrrk:
1979 Opc = X86::VBLENDMPSZrrk;
1981 case X86::VMOVDQA32Z128rrk:
1982 Opc = X86::VPBLENDMDZ128rrk;
1984 case X86::VMOVDQA32Z256rrk:
1985 Opc = X86::VPBLENDMDZ256rrk;
1987 case X86::VMOVDQA32Zrrk:
1988 Opc = X86::VPBLENDMDZrrk;
1990 case X86::VMOVDQA64Z128rrk:
1991 Opc = X86::VPBLENDMQZ128rrk;
1993 case X86::VMOVDQA64Z256rrk:
1994 Opc = X86::VPBLENDMQZ256rrk;
1996 case X86::VMOVDQA64Zrrk:
1997 Opc = X86::VPBLENDMQZrrk;
1999 case X86::VMOVAPDZ128rrk:
2000 Opc = X86::VBLENDMPDZ128rrk;
2002 case X86::VMOVAPDZ256rrk:
2003 Opc = X86::VBLENDMPDZ256rrk;
2005 case X86::VMOVAPDZrrk:
2006 Opc = X86::VBLENDMPDZrrk;
2008 case X86::VMOVAPSZ128rrk:
2009 Opc = X86::VBLENDMPSZ128rrk;
2011 case X86::VMOVAPSZ256rrk:
2012 Opc = X86::VBLENDMPSZ256rrk;
2014 case X86::VMOVAPSZrrk:
2015 Opc = X86::VBLENDMPSZrrk;
              .add(MI.getOperand(2))
              .add(MI.getOperand(3));

  for (unsigned I = 0; I < NumRegOperands; ++I) {
    if (Op.isReg() && (Op.isDead() || Op.isKill()))

  MBB.insert(MI.getIterator(), NewMI);
                                 unsigned SrcOpIdx2) {
  if (SrcOpIdx1 > SrcOpIdx2)
  unsigned Op1 = 1, Op2 = 2, Op3 = 3;
  if (SrcOpIdx1 == Op1 && SrcOpIdx2 == Op2)
  if (SrcOpIdx1 == Op1 && SrcOpIdx2 == Op3)
  if (SrcOpIdx1 == Op2 && SrcOpIdx2 == Op3)

  unsigned Opc = MI.getOpcode();
         "Intrinsic instructions can't commute operand 1");
  assert(Case < 3 && "Unexpected case number!");

  const unsigned Form132Index = 0;
  const unsigned Form213Index = 1;
  const unsigned Form231Index = 2;
  static const unsigned FormMapping[][3] = {
      {Form231Index, Form213Index, Form132Index},
      {Form132Index, Form231Index, Form213Index},
      {Form213Index, Form132Index, Form231Index}};

  unsigned FMAForms[3];
  for (unsigned FormIndex = 0; FormIndex < 3; FormIndex++)
    if (Opc == FMAForms[FormIndex])
      return FMAForms[FormMapping[Case][FormIndex]];
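// --- Illustrative sketch (not part of the original file) ---
// In the 132/213/231 FMA forms the three digits name which source operands
// feed the multiply and which feeds the add, so commuting two source operands
// simply selects a different form of the same opcode. The table below mirrors
// FormMapping above; Case 0/1/2 are assumed to stand for swapping operand
// pairs (1,2) / (1,3) / (2,3), in the order the checks above appear.
enum FMAFormExample { Form132 = 0, Form213 = 1, Form231 = 2 };
static FMAFormExample commuteFMAFormExample(FMAFormExample Form,
                                            unsigned Case) {
  static const FMAFormExample Map[3][3] = {
      {Form231, Form213, Form132},  // swap source operands 1 and 2
      {Form132, Form231, Form213},  // swap source operands 1 and 3
      {Form213, Form132, Form231}}; // swap source operands 2 and 3
  return Map[Case][Form];
}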
                              unsigned SrcOpIdx2) {
  assert(Case < 3 && "Unexpected case value!");

  static const uint8_t SwapMasks[3][4] = {
      {0x04, 0x10, 0x08, 0x20},
      {0x02, 0x10, 0x08, 0x40},
      {0x02, 0x04, 0x20, 0x40},

  uint8_t Imm = MI.getOperand(MI.getNumOperands() - 1).getImm();
  uint8_t NewImm = Imm & ~(SwapMasks[Case][0] | SwapMasks[Case][1] |
                           SwapMasks[Case][2] | SwapMasks[Case][3]);
  if (Imm & SwapMasks[Case][0])
    NewImm |= SwapMasks[Case][1];
  if (Imm & SwapMasks[Case][1])
    NewImm |= SwapMasks[Case][0];
  if (Imm & SwapMasks[Case][2])
    NewImm |= SwapMasks[Case][3];
  if (Imm & SwapMasks[Case][3])
    NewImm |= SwapMasks[Case][2];
  MI.getOperand(MI.getNumOperands() - 1).setImm(NewImm);
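// --- Illustrative sketch (not part of the original file) ---
// A VPTERNLOG immediate is a 3-input truth table: bit i of the imm8 is the
// result for inputs (A,B,C) where A = bit2(i), B = bit1(i), C = bit0(i).
// Commuting two source operands permutes the truth-table rows; the SwapMasks
// pairs above list exactly the bit pairs that exchange. A brute-force
// reference with hypothetical names:
static unsigned char swapTernlogOperandsExample(unsigned char Imm, int X,
                                                int Y) {
  unsigned char New = 0;
  for (int i = 0; i < 8; ++i) {
    int Bits[3] = {(i >> 2) & 1, (i >> 1) & 1, i & 1}; // row i as (A, B, C)
    int T = Bits[X];                                   // commute operands X, Y
    Bits[X] = Bits[Y];
    Bits[Y] = T;
    int j = (Bits[0] << 2) | (Bits[1] << 1) | Bits[2]; // row index after swap
    New |= ((Imm >> j) & 1) << i;                      // new bit i = old bit j
  }
  return New;
}
// e.g. swapping the operands selected by bit2 and bit1 exchanges imm bits
// 2<->4 and 3<->5, matching the first SwapMasks row {0x04, 0x10, 0x08, 0x20}.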
2172#define VPERM_CASES(Suffix) \
2173 case X86::VPERMI2##Suffix##Z128rr: \
2174 case X86::VPERMT2##Suffix##Z128rr: \
2175 case X86::VPERMI2##Suffix##Z256rr: \
2176 case X86::VPERMT2##Suffix##Z256rr: \
2177 case X86::VPERMI2##Suffix##Zrr: \
2178 case X86::VPERMT2##Suffix##Zrr: \
2179 case X86::VPERMI2##Suffix##Z128rm: \
2180 case X86::VPERMT2##Suffix##Z128rm: \
2181 case X86::VPERMI2##Suffix##Z256rm: \
2182 case X86::VPERMT2##Suffix##Z256rm: \
2183 case X86::VPERMI2##Suffix##Zrm: \
2184 case X86::VPERMT2##Suffix##Zrm: \
2185 case X86::VPERMI2##Suffix##Z128rrkz: \
2186 case X86::VPERMT2##Suffix##Z128rrkz: \
2187 case X86::VPERMI2##Suffix##Z256rrkz: \
2188 case X86::VPERMT2##Suffix##Z256rrkz: \
2189 case X86::VPERMI2##Suffix##Zrrkz: \
2190 case X86::VPERMT2##Suffix##Zrrkz: \
2191 case X86::VPERMI2##Suffix##Z128rmkz: \
2192 case X86::VPERMT2##Suffix##Z128rmkz: \
2193 case X86::VPERMI2##Suffix##Z256rmkz: \
2194 case X86::VPERMT2##Suffix##Z256rmkz: \
2195 case X86::VPERMI2##Suffix##Zrmkz: \
2196 case X86::VPERMT2##Suffix##Zrmkz:
2198#define VPERM_CASES_BROADCAST(Suffix) \
2199 VPERM_CASES(Suffix) \
2200 case X86::VPERMI2##Suffix##Z128rmb: \
2201 case X86::VPERMT2##Suffix##Z128rmb: \
2202 case X86::VPERMI2##Suffix##Z256rmb: \
2203 case X86::VPERMT2##Suffix##Z256rmb: \
2204 case X86::VPERMI2##Suffix##Zrmb: \
2205 case X86::VPERMT2##Suffix##Zrmb: \
2206 case X86::VPERMI2##Suffix##Z128rmbkz: \
2207 case X86::VPERMT2##Suffix##Z128rmbkz: \
2208 case X86::VPERMI2##Suffix##Z256rmbkz: \
2209 case X86::VPERMT2##Suffix##Z256rmbkz: \
2210 case X86::VPERMI2##Suffix##Zrmbkz: \
2211 case X86::VPERMT2##Suffix##Zrmbkz:
2224#undef VPERM_CASES_BROADCAST
2231#define VPERM_CASES(Orig, New) \
2232 case X86::Orig##Z128rr: \
2233 return X86::New##Z128rr; \
2234 case X86::Orig##Z128rrkz: \
2235 return X86::New##Z128rrkz; \
2236 case X86::Orig##Z128rm: \
2237 return X86::New##Z128rm; \
2238 case X86::Orig##Z128rmkz: \
2239 return X86::New##Z128rmkz; \
2240 case X86::Orig##Z256rr: \
2241 return X86::New##Z256rr; \
2242 case X86::Orig##Z256rrkz: \
2243 return X86::New##Z256rrkz; \
2244 case X86::Orig##Z256rm: \
2245 return X86::New##Z256rm; \
2246 case X86::Orig##Z256rmkz: \
2247 return X86::New##Z256rmkz; \
2248 case X86::Orig##Zrr: \
2249 return X86::New##Zrr; \
2250 case X86::Orig##Zrrkz: \
2251 return X86::New##Zrrkz; \
2252 case X86::Orig##Zrm: \
2253 return X86::New##Zrm; \
2254 case X86::Orig##Zrmkz: \
2255 return X86::New##Zrmkz;
2257#define VPERM_CASES_BROADCAST(Orig, New) \
2258 VPERM_CASES(Orig, New) \
2259 case X86::Orig##Z128rmb: \
2260 return X86::New##Z128rmb; \
2261 case X86::Orig##Z128rmbkz: \
2262 return X86::New##Z128rmbkz; \
2263 case X86::Orig##Z256rmb: \
2264 return X86::New##Z256rmb; \
2265 case X86::Orig##Z256rmbkz: \
2266 return X86::New##Z256rmbkz; \
2267 case X86::Orig##Zrmb: \
2268 return X86::New##Zrmb; \
2269 case X86::Orig##Zrmbkz: \
2270 return X86::New##Zrmbkz;
2288#undef VPERM_CASES_BROADCAST
                                                   unsigned OpIdx2) const {
    return std::exchange(NewMI, false)
               ? MI.getParent()->getParent()->CloneMachineInstr(&MI)

  unsigned Opc = MI.getOpcode();

#define CASE_ND(OP) \

#define FROM_TO_SIZE(A, B, S) \
        Opc = X86::B##_ND; \
        Opc = X86::A##_ND; \

    WorkingMI = CloneIfNew(MI);
    WorkingMI = CloneIfNew(MI);
                  get(X86::PFSUBRrr == Opc ? X86::PFSUBrr : X86::PFSUBRrr));
2355 case X86::BLENDPDrri:
2356 case X86::BLENDPSrri:
2357 case X86::PBLENDWrri:
2358 case X86::VBLENDPDrri:
2359 case X86::VBLENDPSrri:
2360 case X86::VBLENDPDYrri:
2361 case X86::VBLENDPSYrri:
2362 case X86::VPBLENDDrri:
2363 case X86::VPBLENDWrri:
2364 case X86::VPBLENDDYrri:
2365 case X86::VPBLENDWYrri: {
    case X86::BLENDPDrri:
      Mask = (int8_t)0x03;
      break;
    case X86::BLENDPSrri:
      Mask = (int8_t)0x0F;
      break;
    case X86::PBLENDWrri:
      Mask = (int8_t)0xFF;
      break;
    case X86::VBLENDPDrri:
      Mask = (int8_t)0x03;
      break;
    case X86::VBLENDPSrri:
      Mask = (int8_t)0x0F;
      break;
    case X86::VBLENDPDYrri:
      Mask = (int8_t)0x0F;
      break;
    case X86::VBLENDPSYrri:
      Mask = (int8_t)0xFF;
      break;
    case X86::VPBLENDDrri:
      Mask = (int8_t)0x0F;
      break;
    case X86::VPBLENDWrri:
      Mask = (int8_t)0xFF;
      break;
    case X86::VPBLENDDYrri:
      Mask = (int8_t)0xFF;
      break;
    case X86::VPBLENDWYrri:
      Mask = (int8_t)0xFF;
      break;
    int8_t Imm = MI.getOperand(3).getImm() & Mask;
    WorkingMI = CloneIfNew(MI);
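// --- Illustrative sketch (not part of the original file) ---
// A BLEND immediate selects, per element, which of the two sources is taken,
// so commuting the sources amounts to complementing the immediate within the
// element count, which is what the per-opcode Mask above bounds.
// Hypothetical helper:
static int8_t commuteBlendImmExample(int8_t Imm, int8_t ElementMask) {
  // e.g. BLENDPDrri has two elements (ElementMask = 0x03): 0b01 -> 0b10.
  return (Imm ^ ElementMask) & ElementMask;
}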
  case X86::INSERTPSrri:
  case X86::VINSERTPSrri:
  case X86::VINSERTPSZrri: {
    unsigned Imm = MI.getOperand(MI.getNumOperands() - 1).getImm();
    unsigned ZMask = Imm & 15;
    unsigned DstIdx = (Imm >> 4) & 3;
    unsigned SrcIdx = (Imm >> 6) & 3;
    if (DstIdx == SrcIdx && (ZMask & (1 << DstIdx)) == 0 &&
      assert(AltIdx < 4 && "Illegal insertion index");
      unsigned AltImm = (AltIdx << 6) | (AltIdx << 4) | ZMask;
      WorkingMI = CloneIfNew(MI);
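// --- Illustrative sketch (not part of the original file) ---
// The INSERTPS imm8 packs three fields: bits [7:6] pick the source lane,
// bits [5:4] pick the destination lane, and bits [3:0] zero individual
// destination lanes, which is how Imm is unpacked above. Hypothetical helper:
struct InsertPSImmExample {
  unsigned SrcIdx, DstIdx, ZMask;
};
static InsertPSImmExample decodeInsertPSImmExample(unsigned Imm) {
  return {(Imm >> 6) & 3, (Imm >> 4) & 3, Imm & 15};
}
// e.g. Imm = 0x48 -> SrcIdx = 1, DstIdx = 0, ZMask = 0x8 (zero lane 3).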
  case X86::VMOVSSrr: {
    if (Subtarget.hasSSE41()) {
        Opc = X86::BLENDPDrri;
        Opc = X86::BLENDPSrri;
        Opc = X86::VBLENDPDrri;
        Opc = X86::VBLENDPSrri;
      WorkingMI = CloneIfNew(MI);
    assert(Opc == X86::MOVSDrr && "Only MOVSD can commute to SHUFPD");
    WorkingMI = CloneIfNew(MI);

  case X86::SHUFPDrri: {
    assert(MI.getOperand(3).getImm() == 0x02 && "Unexpected immediate!");
    WorkingMI = CloneIfNew(MI);
  case X86::PCLMULQDQrri:
  case X86::VPCLMULQDQrri:
  case X86::VPCLMULQDQYrri:
  case X86::VPCLMULQDQZrri:
  case X86::VPCLMULQDQZ128rri:
  case X86::VPCLMULQDQZ256rri: {
    unsigned Imm = MI.getOperand(3).getImm();
    unsigned Src1Hi = Imm & 0x01;
    unsigned Src2Hi = Imm & 0x10;
    WorkingMI = CloneIfNew(MI);
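// --- Illustrative sketch (not part of the original file) ---
// For PCLMULQDQ, imm8 bit 0 selects the low/high quadword of the first source
// and bit 4 selects it for the second source, so commuting the sources just
// exchanges those two bits. Hypothetical helper:
static unsigned commutePclmulImmExample(unsigned Imm) {
  unsigned Src1Hi = Imm & 0x01;
  unsigned Src2Hi = Imm & 0x10;
  // Move each half-selector to the other operand's bit position.
  return (Imm & ~0x11u) | (Src1Hi << 4) | (Src2Hi >> 4);
}
// e.g. 0x01 (high half of src1, low half of src2) becomes 0x10.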
2496 case X86::VPCMPBZ128rri:
2497 case X86::VPCMPUBZ128rri:
2498 case X86::VPCMPBZ256rri:
2499 case X86::VPCMPUBZ256rri:
2500 case X86::VPCMPBZrri:
2501 case X86::VPCMPUBZrri:
2502 case X86::VPCMPDZ128rri:
2503 case X86::VPCMPUDZ128rri:
2504 case X86::VPCMPDZ256rri:
2505 case X86::VPCMPUDZ256rri:
2506 case X86::VPCMPDZrri:
2507 case X86::VPCMPUDZrri:
2508 case X86::VPCMPQZ128rri:
2509 case X86::VPCMPUQZ128rri:
2510 case X86::VPCMPQZ256rri:
2511 case X86::VPCMPUQZ256rri:
2512 case X86::VPCMPQZrri:
2513 case X86::VPCMPUQZrri:
2514 case X86::VPCMPWZ128rri:
2515 case X86::VPCMPUWZ128rri:
2516 case X86::VPCMPWZ256rri:
2517 case X86::VPCMPUWZ256rri:
2518 case X86::VPCMPWZrri:
2519 case X86::VPCMPUWZrri:
2520 case X86::VPCMPBZ128rrik:
2521 case X86::VPCMPUBZ128rrik:
2522 case X86::VPCMPBZ256rrik:
2523 case X86::VPCMPUBZ256rrik:
2524 case X86::VPCMPBZrrik:
2525 case X86::VPCMPUBZrrik:
2526 case X86::VPCMPDZ128rrik:
2527 case X86::VPCMPUDZ128rrik:
2528 case X86::VPCMPDZ256rrik:
2529 case X86::VPCMPUDZ256rrik:
2530 case X86::VPCMPDZrrik:
2531 case X86::VPCMPUDZrrik:
2532 case X86::VPCMPQZ128rrik:
2533 case X86::VPCMPUQZ128rrik:
2534 case X86::VPCMPQZ256rrik:
2535 case X86::VPCMPUQZ256rrik:
2536 case X86::VPCMPQZrrik:
2537 case X86::VPCMPUQZrrik:
2538 case X86::VPCMPWZ128rrik:
2539 case X86::VPCMPUWZ128rrik:
2540 case X86::VPCMPWZ256rrik:
2541 case X86::VPCMPUWZ256rrik:
2542 case X86::VPCMPWZrrik:
2543 case X86::VPCMPUWZrrik:
    WorkingMI = CloneIfNew(MI);
                MI.getOperand(MI.getNumOperands() - 1).getImm() & 0x7));

  case X86::VPCOMUBri:
  case X86::VPCOMUDri:
  case X86::VPCOMUQri:
  case X86::VPCOMUWri:
    WorkingMI = CloneIfNew(MI);

  case X86::VCMPSDZrri:
  case X86::VCMPSSZrri:
  case X86::VCMPPDZrri:
  case X86::VCMPPSZrri:
  case X86::VCMPSHZrri:
  case X86::VCMPPHZrri:
  case X86::VCMPPHZ128rri:
  case X86::VCMPPHZ256rri:
  case X86::VCMPPDZ128rri:
  case X86::VCMPPSZ128rri:
  case X86::VCMPPDZ256rri:
  case X86::VCMPPSZ256rri:
  case X86::VCMPPDZrrik:
  case X86::VCMPPSZrrik:
  case X86::VCMPPDZ128rrik:
  case X86::VCMPPSZ128rrik:
  case X86::VCMPPDZ256rrik:
  case X86::VCMPPSZ256rrik:
    WorkingMI = CloneIfNew(MI);
                MI.getOperand(MI.getNumExplicitOperands() - 1).getImm() & 0x1f));
  case X86::VPERM2F128rri:
  case X86::VPERM2I128rri:
    WorkingMI = CloneIfNew(MI);

  case X86::MOVHLPSrr:
  case X86::UNPCKHPDrr:
  case X86::VMOVHLPSrr:
  case X86::VUNPCKHPDrr:
  case X86::VMOVHLPSZrr:
  case X86::VUNPCKHPDZ128rr:
    assert(Subtarget.hasSSE2() && "Commuting MOVHLP/UNPCKHPD requires SSE2!");
    switch (Opc) {
    case X86::MOVHLPSrr:
      Opc = X86::UNPCKHPDrr;
      break;
    case X86::UNPCKHPDrr:
      Opc = X86::MOVHLPSrr;
      break;
    case X86::VMOVHLPSrr:
      Opc = X86::VUNPCKHPDrr;
      break;
    case X86::VUNPCKHPDrr:
      Opc = X86::VMOVHLPSrr;
      break;
    case X86::VMOVHLPSZrr:
      Opc = X86::VUNPCKHPDZ128rr;
      break;
    case X86::VUNPCKHPDZ128rr:
      Opc = X86::VMOVHLPSZrr;
      break;
    }
    WorkingMI = CloneIfNew(MI);

    WorkingMI = CloneIfNew(MI);
    unsigned OpNo = MI.getDesc().getNumOperands() - 1;
2636 case X86::VPTERNLOGDZrri:
2637 case X86::VPTERNLOGDZrmi:
2638 case X86::VPTERNLOGDZ128rri:
2639 case X86::VPTERNLOGDZ128rmi:
2640 case X86::VPTERNLOGDZ256rri:
2641 case X86::VPTERNLOGDZ256rmi:
2642 case X86::VPTERNLOGQZrri:
2643 case X86::VPTERNLOGQZrmi:
2644 case X86::VPTERNLOGQZ128rri:
2645 case X86::VPTERNLOGQZ128rmi:
2646 case X86::VPTERNLOGQZ256rri:
2647 case X86::VPTERNLOGQZ256rmi:
2648 case X86::VPTERNLOGDZrrik:
2649 case X86::VPTERNLOGDZ128rrik:
2650 case X86::VPTERNLOGDZ256rrik:
2651 case X86::VPTERNLOGQZrrik:
2652 case X86::VPTERNLOGQZ128rrik:
2653 case X86::VPTERNLOGQZ256rrik:
2654 case X86::VPTERNLOGDZrrikz:
2655 case X86::VPTERNLOGDZrmikz:
2656 case X86::VPTERNLOGDZ128rrikz:
2657 case X86::VPTERNLOGDZ128rmikz:
2658 case X86::VPTERNLOGDZ256rrikz:
2659 case X86::VPTERNLOGDZ256rmikz:
2660 case X86::VPTERNLOGQZrrikz:
2661 case X86::VPTERNLOGQZrmikz:
2662 case X86::VPTERNLOGQZ128rrikz:
2663 case X86::VPTERNLOGQZ128rmikz:
2664 case X86::VPTERNLOGQZ256rrikz:
2665 case X86::VPTERNLOGQZ256rmikz:
2666 case X86::VPTERNLOGDZ128rmbi:
2667 case X86::VPTERNLOGDZ256rmbi:
2668 case X86::VPTERNLOGDZrmbi:
2669 case X86::VPTERNLOGQZ128rmbi:
2670 case X86::VPTERNLOGQZ256rmbi:
2671 case X86::VPTERNLOGQZrmbi:
2672 case X86::VPTERNLOGDZ128rmbikz:
2673 case X86::VPTERNLOGDZ256rmbikz:
2674 case X86::VPTERNLOGDZrmbikz:
2675 case X86::VPTERNLOGQZ128rmbikz:
2676 case X86::VPTERNLOGQZ256rmbikz:
2677 case X86::VPTERNLOGQZrmbikz: {
    WorkingMI = CloneIfNew(MI);
    WorkingMI = CloneIfNew(MI);
    WorkingMI = CloneIfNew(MI);

bool X86InstrInfo::findThreeSrcCommutedOpIndices(const MachineInstr &MI,
                                                 unsigned &SrcOpIdx1,
                                                 unsigned &SrcOpIdx2,
                                                 bool IsIntrinsic) const {
  unsigned FirstCommutableVecOp = 1;
  unsigned LastCommutableVecOp = 3;
  unsigned KMaskOp = -1U;
    FirstCommutableVecOp = 3;
      LastCommutableVecOp++;
  } else if (IsIntrinsic) {
    FirstCommutableVecOp = 2;

  if (isMem(MI, LastCommutableVecOp))
    LastCommutableVecOp--;

  if (SrcOpIdx1 != CommuteAnyOperandIndex &&
      (SrcOpIdx1 < FirstCommutableVecOp || SrcOpIdx1 > LastCommutableVecOp ||
       SrcOpIdx1 == KMaskOp))
  if (SrcOpIdx2 != CommuteAnyOperandIndex &&
      (SrcOpIdx2 < FirstCommutableVecOp || SrcOpIdx2 > LastCommutableVecOp ||
       SrcOpIdx2 == KMaskOp))

  if (SrcOpIdx1 == CommuteAnyOperandIndex ||
      SrcOpIdx2 == CommuteAnyOperandIndex) {
    unsigned CommutableOpIdx2 = SrcOpIdx2;
    if (SrcOpIdx1 == SrcOpIdx2)
      CommutableOpIdx2 = LastCommutableVecOp;
    else if (SrcOpIdx2 == CommuteAnyOperandIndex)
      CommutableOpIdx2 = SrcOpIdx1;

    Register Op2Reg = MI.getOperand(CommutableOpIdx2).getReg();
    unsigned CommutableOpIdx1;
    for (CommutableOpIdx1 = LastCommutableVecOp;
         CommutableOpIdx1 >= FirstCommutableVecOp; CommutableOpIdx1--) {
      if (CommutableOpIdx1 == KMaskOp)
      if (Op2Reg != MI.getOperand(CommutableOpIdx1).getReg())
    if (CommutableOpIdx1 < FirstCommutableVecOp)
    if (!fixCommutedOpIndices(SrcOpIdx1, SrcOpIdx2, CommutableOpIdx1,

                                         unsigned &SrcOpIdx1,
                                         unsigned &SrcOpIdx2) const {
  if (!Desc.isCommutable())
  switch (MI.getOpcode()) {
2814 case X86::VCMPSDrri:
2815 case X86::VCMPSSrri:
2816 case X86::VCMPPDrri:
2817 case X86::VCMPPSrri:
2818 case X86::VCMPPDYrri:
2819 case X86::VCMPPSYrri:
2820 case X86::VCMPSDZrri:
2821 case X86::VCMPSSZrri:
2822 case X86::VCMPPDZrri:
2823 case X86::VCMPPSZrri:
2824 case X86::VCMPSHZrri:
2825 case X86::VCMPPHZrri:
2826 case X86::VCMPPHZ128rri:
2827 case X86::VCMPPHZ256rri:
2828 case X86::VCMPPDZ128rri:
2829 case X86::VCMPPSZ128rri:
2830 case X86::VCMPPDZ256rri:
2831 case X86::VCMPPSZ256rri:
2832 case X86::VCMPPDZrrik:
2833 case X86::VCMPPSZrrik:
2834 case X86::VCMPPDZ128rrik:
2835 case X86::VCMPPSZ128rrik:
2836 case X86::VCMPPDZ256rrik:
  case X86::VCMPPSZ256rrik: {
    unsigned Imm = MI.getOperand(3 + OpOffset).getImm() & 0x7;
    return fixCommutedOpIndices(SrcOpIdx1, SrcOpIdx2, 1 + OpOffset,

    if (Subtarget.hasSSE41())
  case X86::SHUFPDrri:
    if (MI.getOperand(3).getImm() == 0x02)
  case X86::MOVHLPSrr:
  case X86::UNPCKHPDrr:
  case X86::VMOVHLPSrr:
  case X86::VUNPCKHPDrr:
  case X86::VMOVHLPSZrr:
  case X86::VUNPCKHPDZ128rr:
    if (Subtarget.hasSSE2())
2883 case X86::VPTERNLOGDZrri:
2884 case X86::VPTERNLOGDZrmi:
2885 case X86::VPTERNLOGDZ128rri:
2886 case X86::VPTERNLOGDZ128rmi:
2887 case X86::VPTERNLOGDZ256rri:
2888 case X86::VPTERNLOGDZ256rmi:
2889 case X86::VPTERNLOGQZrri:
2890 case X86::VPTERNLOGQZrmi:
2891 case X86::VPTERNLOGQZ128rri:
2892 case X86::VPTERNLOGQZ128rmi:
2893 case X86::VPTERNLOGQZ256rri:
2894 case X86::VPTERNLOGQZ256rmi:
2895 case X86::VPTERNLOGDZrrik:
2896 case X86::VPTERNLOGDZ128rrik:
2897 case X86::VPTERNLOGDZ256rrik:
2898 case X86::VPTERNLOGQZrrik:
2899 case X86::VPTERNLOGQZ128rrik:
2900 case X86::VPTERNLOGQZ256rrik:
2901 case X86::VPTERNLOGDZrrikz:
2902 case X86::VPTERNLOGDZrmikz:
2903 case X86::VPTERNLOGDZ128rrikz:
2904 case X86::VPTERNLOGDZ128rmikz:
2905 case X86::VPTERNLOGDZ256rrikz:
2906 case X86::VPTERNLOGDZ256rmikz:
2907 case X86::VPTERNLOGQZrrikz:
2908 case X86::VPTERNLOGQZrmikz:
2909 case X86::VPTERNLOGQZ128rrikz:
2910 case X86::VPTERNLOGQZ128rmikz:
2911 case X86::VPTERNLOGQZ256rrikz:
2912 case X86::VPTERNLOGQZ256rmikz:
2913 case X86::VPTERNLOGDZ128rmbi:
2914 case X86::VPTERNLOGDZ256rmbi:
2915 case X86::VPTERNLOGDZrmbi:
2916 case X86::VPTERNLOGQZ128rmbi:
2917 case X86::VPTERNLOGQZ256rmbi:
2918 case X86::VPTERNLOGQZrmbi:
2919 case X86::VPTERNLOGDZ128rmbikz:
2920 case X86::VPTERNLOGDZ256rmbikz:
2921 case X86::VPTERNLOGDZrmbikz:
2922 case X86::VPTERNLOGQZ128rmbikz:
2923 case X86::VPTERNLOGQZ256rmbikz:
2924 case X86::VPTERNLOGQZrmbikz:
2925 return findThreeSrcCommutedOpIndices(
MI, SrcOpIdx1, SrcOpIdx2);
2926 case X86::VPDPWSSDYrr:
2927 case X86::VPDPWSSDrr:
2928 case X86::VPDPWSSDSYrr:
2929 case X86::VPDPWSSDSrr:
2930 case X86::VPDPWUUDrr:
2931 case X86::VPDPWUUDYrr:
2932 case X86::VPDPWUUDSrr:
2933 case X86::VPDPWUUDSYrr:
2934 case X86::VPDPBSSDSrr:
2935 case X86::VPDPBSSDSYrr:
2936 case X86::VPDPBSSDrr:
2937 case X86::VPDPBSSDYrr:
2938 case X86::VPDPBUUDSrr:
2939 case X86::VPDPBUUDSYrr:
2940 case X86::VPDPBUUDrr:
2941 case X86::VPDPBUUDYrr:
2942 case X86::VPDPBSSDSZ128r:
2943 case X86::VPDPBSSDSZ128rk:
2944 case X86::VPDPBSSDSZ128rkz:
2945 case X86::VPDPBSSDSZ256r:
2946 case X86::VPDPBSSDSZ256rk:
2947 case X86::VPDPBSSDSZ256rkz:
2948 case X86::VPDPBSSDSZr:
2949 case X86::VPDPBSSDSZrk:
2950 case X86::VPDPBSSDSZrkz:
2951 case X86::VPDPBSSDZ128r:
2952 case X86::VPDPBSSDZ128rk:
2953 case X86::VPDPBSSDZ128rkz:
2954 case X86::VPDPBSSDZ256r:
2955 case X86::VPDPBSSDZ256rk:
2956 case X86::VPDPBSSDZ256rkz:
2957 case X86::VPDPBSSDZr:
2958 case X86::VPDPBSSDZrk:
2959 case X86::VPDPBSSDZrkz:
2960 case X86::VPDPBUUDSZ128r:
2961 case X86::VPDPBUUDSZ128rk:
2962 case X86::VPDPBUUDSZ128rkz:
2963 case X86::VPDPBUUDSZ256r:
2964 case X86::VPDPBUUDSZ256rk:
2965 case X86::VPDPBUUDSZ256rkz:
2966 case X86::VPDPBUUDSZr:
2967 case X86::VPDPBUUDSZrk:
2968 case X86::VPDPBUUDSZrkz:
2969 case X86::VPDPBUUDZ128r:
2970 case X86::VPDPBUUDZ128rk:
2971 case X86::VPDPBUUDZ128rkz:
2972 case X86::VPDPBUUDZ256r:
2973 case X86::VPDPBUUDZ256rk:
2974 case X86::VPDPBUUDZ256rkz:
2975 case X86::VPDPBUUDZr:
2976 case X86::VPDPBUUDZrk:
2977 case X86::VPDPBUUDZrkz:
2978 case X86::VPDPWSSDZ128r:
2979 case X86::VPDPWSSDZ128rk:
2980 case X86::VPDPWSSDZ128rkz:
2981 case X86::VPDPWSSDZ256r:
2982 case X86::VPDPWSSDZ256rk:
2983 case X86::VPDPWSSDZ256rkz:
2984 case X86::VPDPWSSDZr:
2985 case X86::VPDPWSSDZrk:
2986 case X86::VPDPWSSDZrkz:
2987 case X86::VPDPWSSDSZ128r:
2988 case X86::VPDPWSSDSZ128rk:
2989 case X86::VPDPWSSDSZ128rkz:
2990 case X86::VPDPWSSDSZ256r:
2991 case X86::VPDPWSSDSZ256rk:
2992 case X86::VPDPWSSDSZ256rkz:
2993 case X86::VPDPWSSDSZr:
2994 case X86::VPDPWSSDSZrk:
2995 case X86::VPDPWSSDSZrkz:
2996 case X86::VPDPWUUDZ128r:
2997 case X86::VPDPWUUDZ128rk:
2998 case X86::VPDPWUUDZ128rkz:
2999 case X86::VPDPWUUDZ256r:
3000 case X86::VPDPWUUDZ256rk:
3001 case X86::VPDPWUUDZ256rkz:
3002 case X86::VPDPWUUDZr:
3003 case X86::VPDPWUUDZrk:
3004 case X86::VPDPWUUDZrkz:
3005 case X86::VPDPWUUDSZ128r:
3006 case X86::VPDPWUUDSZ128rk:
3007 case X86::VPDPWUUDSZ128rkz:
3008 case X86::VPDPWUUDSZ256r:
3009 case X86::VPDPWUUDSZ256rk:
3010 case X86::VPDPWUUDSZ256rkz:
3011 case X86::VPDPWUUDSZr:
3012 case X86::VPDPWUUDSZrk:
3013 case X86::VPDPWUUDSZrkz:
3014 case X86::VPMADD52HUQrr:
3015 case X86::VPMADD52HUQYrr:
3016 case X86::VPMADD52HUQZ128r:
3017 case X86::VPMADD52HUQZ128rk:
3018 case X86::VPMADD52HUQZ128rkz:
3019 case X86::VPMADD52HUQZ256r:
3020 case X86::VPMADD52HUQZ256rk:
3021 case X86::VPMADD52HUQZ256rkz:
3022 case X86::VPMADD52HUQZr:
3023 case X86::VPMADD52HUQZrk:
3024 case X86::VPMADD52HUQZrkz:
3025 case X86::VPMADD52LUQrr:
3026 case X86::VPMADD52LUQYrr:
3027 case X86::VPMADD52LUQZ128r:
3028 case X86::VPMADD52LUQZ128rk:
3029 case X86::VPMADD52LUQZ128rkz:
3030 case X86::VPMADD52LUQZ256r:
3031 case X86::VPMADD52LUQZ256rk:
3032 case X86::VPMADD52LUQZ256rkz:
3033 case X86::VPMADD52LUQZr:
3034 case X86::VPMADD52LUQZrk:
3035 case X86::VPMADD52LUQZrkz:
3036 case X86::VFMADDCPHZr:
3037 case X86::VFMADDCPHZrk:
3038 case X86::VFMADDCPHZrkz:
3039 case X86::VFMADDCPHZ128r:
3040 case X86::VFMADDCPHZ128rk:
3041 case X86::VFMADDCPHZ128rkz:
3042 case X86::VFMADDCPHZ256r:
3043 case X86::VFMADDCPHZ256rk:
3044 case X86::VFMADDCPHZ256rkz:
3045 case X86::VFMADDCSHZr:
3046 case X86::VFMADDCSHZrk:
3047 case X86::VFMADDCSHZrkz: {
    unsigned CommutableOpIdx1 = 2;
    unsigned CommutableOpIdx2 = 3;
    if (!fixCommutedOpIndices(SrcOpIdx1, SrcOpIdx2, CommutableOpIdx1,
    if (!MI.getOperand(SrcOpIdx1).isReg() || !MI.getOperand(SrcOpIdx2).isReg())
      return findThreeSrcCommutedOpIndices(MI, SrcOpIdx1, SrcOpIdx2,

      unsigned CommutableOpIdx1 = Desc.getNumDefs() + 1;
      unsigned CommutableOpIdx2 = Desc.getNumDefs() + 2;
      if ((MI.getDesc().getOperandConstraint(Desc.getNumDefs(),
      if (!fixCommutedOpIndices(SrcOpIdx1, SrcOpIdx2, CommutableOpIdx1,
      if (!MI.getOperand(SrcOpIdx1).isReg() ||
          !MI.getOperand(SrcOpIdx2).isReg())
  unsigned Opcode = MI->getOpcode();
  if (Opcode != X86::LEA32r && Opcode != X86::LEA64r &&
      Opcode != X86::LEA64_32r)

  unsigned Opcode = MI.getOpcode();
  if (Opcode != X86::ADD32rr && Opcode != X86::ADD64rr)

  unsigned Opcode = MCID.getOpcode();
  if (!(X86::isJCC(Opcode) || X86::isSETCC(Opcode) || X86::isSETZUCC(Opcode) ||
        X86::isCMOVCC(Opcode) || X86::isCFCMOVCC(Opcode) ||
        X86::isCCMPCC(Opcode) || X86::isCTESTCC(Opcode)))
  unsigned NumUses = MCID.getNumOperands() - MCID.getNumDefs();
    CondNo += MCID.getNumDefs();

  return X86::isSETCC(MI.getOpcode()) || X86::isSETZUCC(MI.getOpcode())

  return X86::isCCMPCC(MI.getOpcode()) || X86::isCTESTCC(MI.getOpcode())

  enum { CF = 1, ZF = 2, SF = 4, OF = 8, PF = CF };
#define GET_X86_NF_TRANSFORM_TABLE
#define GET_X86_ND2NONND_TABLE
#include "X86GenInstrMapping.inc"

  return (I == Table.end() || I->OldOpc != Opc) ? 0U : I->NewOpc;

#if defined(EXPENSIVE_CHECKS) && !defined(NDEBUG)
  static std::atomic<bool> NFTableChecked(false);
  if (!NFTableChecked.load(std::memory_order_relaxed)) {
           "X86NFTransformTable is not sorted!");
    NFTableChecked.store(true, std::memory_order_relaxed);

#if defined(EXPENSIVE_CHECKS) && !defined(NDEBUG)
  static std::atomic<bool> NDTableChecked(false);
  if (!NDTableChecked.load(std::memory_order_relaxed)) {
           "X86ND2NonNDTable is not sorted!");
    NDTableChecked.store(true, std::memory_order_relaxed);
std::pair<X86::CondCode, bool>
  bool NeedSwap = false;
  switch (Predicate) {
  return std::make_pair(CC, NeedSwap);

#define GET_ND_IF_ENABLED(OPC) (HasNDD ? OPC##_ND : OPC)

  switch (Imm & 0x3) {
  if (Info.RegClass == X86::VR128RegClassID ||
      Info.RegClass == X86::VR128XRegClassID)
  if (Info.RegClass == X86::VR256RegClassID ||
      Info.RegClass == X86::VR256XRegClassID)
  if (Info.RegClass == X86::VR512RegClassID)

  return (Reg == X86::FPCW || Reg == X86::FPSW ||
          (Reg >= X86::ST0 && Reg <= X86::ST7));
  if (MI.isCall() || MI.isInlineAsm())

#ifdef EXPENSIVE_CHECKS
         "Got false negative from X86II::getMemoryOperandNo()!");
#ifdef EXPENSIVE_CHECKS
         "Expected no operands to have OPERAND_MEMORY type!");
    if (IsMemOp(Desc.operands()[I])) {
#ifdef EXPENSIVE_CHECKS
             "Expected all five operands in the memory reference to have "
             "OPERAND_MEMORY type!");
         "Unexpected number of operands!");
  if (!Index.isReg() || Index.getReg() != X86::NoRegister)
      MI.getParent()->getParent()->getConstantPool()->getConstants();

  switch (MI.getOpcode()) {
  case X86::TCRETURNdi:
  case X86::TCRETURNri:
  case X86::TCRETURNmi:
  case X86::TCRETURNdi64:
  case X86::TCRETURNri64:
  case X86::TCRETURNri64_ImpCall:
  case X86::TCRETURNmi64:

  if (Symbol == "__x86_indirect_thunk_r11")

  if (TailCall.getOpcode() != X86::TCRETURNdi &&
      TailCall.getOpcode() != X86::TCRETURNdi64) {
  if (Subtarget.isTargetWin64() && MF->hasWinCFI()) {
      TailCall.getOperand(1).getImm() != 0) {

  while (I != MBB.begin()) {
    if (I->isDebugInstr())
      assert(0 && "Can't find the branch to replace!");
    if (CC != BranchCond[0].getImm())
    unsigned Opc = TailCall.getOpcode() == X86::TCRETURNdi
                       ? X86::TCRETURNdicc
                       : X86::TCRETURNdi64cc;
    LiveRegs.addLiveOuts(MBB);
    LiveRegs.stepForward(*MIB, Clobbers);
    for (const auto &C : Clobbers) {
    I->eraseFromParent();

    if (Succ->isEHPad() || (Succ == TBB && FallthroughBB))
    if (FallthroughBB && FallthroughBB != TBB)
    FallthroughBB = Succ;
  return FallthroughBB;
bool X86InstrInfo::analyzeBranchImpl(
    if (I->isDebugInstr())
    if (!isUnpredicatedTerminator(*I))
    if (I->getOpcode() == X86::JMP_1) {
      TBB = I->getOperand(0).getMBB();
        UnCondBrIter = MBB.end();
      TBB = I->getOperand(0).getMBB();
    if (I->findRegisterUseOperand(X86::EFLAGS, nullptr)->isUndef())
      TBB = I->getOperand(0).getMBB();
    if (OldBranchCode == BranchCode && TBB == NewTBB)
    if (TBB == NewTBB &&
    Cond[0].setImm(BranchCode);

                                 bool AllowModify) const {
  return analyzeBranchImpl(MBB, TBB, FBB, Cond, CondBranches, AllowModify);
  assert(MemRefBegin >= 0 && "instr should have memory operand");

  if (!Reg.isVirtual())

  unsigned Opcode = MI->getOpcode();
  if (Opcode != X86::LEA64r && Opcode != X86::LEA32r)

  unsigned Opcode = MI.getOpcode();
  if (Opcode == X86::JMP64m || Opcode == X86::JMP32m) {
  if (Opcode == X86::JMP64r || Opcode == X86::JMP32r) {
    if (!Reg.isVirtual())
    if (Add->getOpcode() != X86::ADD64rr && Add->getOpcode() != X86::ADD32rr)

                                       MachineBranchPredicate &MBP,
                                       bool AllowModify) const {
  using namespace std::placeholders;

  if (analyzeBranchImpl(MBB, MBP.TrueDest, MBP.FalseDest, Cond, CondBranches,
  if (Cond.size() != 1)
  assert(MBP.TrueDest && "expected!");
    MBP.FalseDest = MBB.getNextNode();

  bool SingleUseCondition = true;
    if (MI.modifiesRegister(X86::EFLAGS, TRI)) {
    if (MI.readsRegister(X86::EFLAGS, TRI))
      SingleUseCondition = false;

  if (SingleUseCondition) {
    for (auto *Succ : MBB.successors())
      if (Succ->isLiveIn(X86::EFLAGS))
        SingleUseCondition = false;

  MBP.ConditionDef = ConditionDef;
  MBP.SingleUseCondition = SingleUseCondition;

  const unsigned TestOpcode =
      Subtarget.is64Bit() ? X86::TEST64rr : X86::TEST32rr;
  if (ConditionDef->getOpcode() == TestOpcode &&
                   ? MachineBranchPredicate::PRED_NE
                   : MachineBranchPredicate::PRED_EQ;
                                    int *BytesRemoved) const {
  assert(!BytesRemoved && "code size not handled");

  while (I != MBB.begin()) {
    if (I->isDebugInstr())
    if (I->getOpcode() != X86::JMP_1 &&
    I->eraseFromParent();

  assert(TBB && "insertBranch must not be told to insert a fallthrough");
         "X86 branch conditions have one component!");
  assert(!BytesAdded && "code size not handled");
    assert(!FBB && "Unconditional branch with multiple successors!");
  bool FallThru = FBB == nullptr;
  if (FBB == nullptr) {
    assert(FBB && "MBB cannot be the last block in function when the false "
                  "body is a fall-through.");

                                   Register FalseReg, int &CondCycles,
                                   int &TrueCycles, int &FalseCycles) const {
  if (!Subtarget.canUseCMOV())
  if (Cond.size() != 1)
      RI.getCommonSubClass(MRI.getRegClass(TrueReg), MRI.getRegClass(FalseReg));
  if (X86::GR16RegClass.hasSubClassEq(RC) ||
      X86::GR32RegClass.hasSubClassEq(RC) ||
      X86::GR64RegClass.hasSubClassEq(RC)) {
  assert(Cond.size() == 1 && "Invalid Cond array");
                       false, Subtarget.hasNDD());
  return X86::GR8_ABCD_HRegClass.contains(Reg);

  bool HasAVX = Subtarget.hasAVX();
  bool HasEGPR = Subtarget.hasEGPR();

  if (X86::VK16RegClass.contains(SrcReg)) {
    if (X86::GR64RegClass.contains(DestReg)) {
      assert(Subtarget.hasBWI());
      return HasEGPR ? X86::KMOVQrk_EVEX : X86::KMOVQrk;
    if (X86::GR32RegClass.contains(DestReg))
      return Subtarget.hasBWI() ? (HasEGPR ? X86::KMOVDrk_EVEX : X86::KMOVDrk)
                                : (HasEGPR ? X86::KMOVWrk_EVEX : X86::KMOVWrk);

  if (X86::VK16RegClass.contains(DestReg)) {
    if (X86::GR64RegClass.contains(SrcReg)) {
      assert(Subtarget.hasBWI());
      return HasEGPR ? X86::KMOVQkr_EVEX : X86::KMOVQkr;
    if (X86::GR32RegClass.contains(SrcReg))
      return Subtarget.hasBWI() ? (HasEGPR ? X86::KMOVDkr_EVEX : X86::KMOVDkr)
                                : (HasEGPR ? X86::KMOVWkr_EVEX : X86::KMOVWkr);

  if (X86::GR64RegClass.contains(DestReg)) {
    if (X86::VR128XRegClass.contains(SrcReg))
      return HasAVX512 ? X86::VMOVPQIto64Zrr
             : HasAVX  ? X86::VMOVPQIto64rr
                       : X86::MOVPQIto64rr;
    if (X86::VR64RegClass.contains(SrcReg))
      return X86::MMX_MOVD64from64rr;
  } else if (X86::GR64RegClass.contains(SrcReg)) {
    if (X86::VR128XRegClass.contains(DestReg))
      return HasAVX512 ? X86::VMOV64toPQIZrr
             : HasAVX  ? X86::VMOV64toPQIrr
                       : X86::MOV64toPQIrr;
    if (X86::VR64RegClass.contains(DestReg))
      return X86::MMX_MOVD64to64rr;

  if (X86::GR32RegClass.contains(DestReg) &&
      X86::VR128XRegClass.contains(SrcReg))
    return HasAVX512 ? X86::VMOVPDI2DIZrr
           : HasAVX  ? X86::VMOVPDI2DIrr

  if (X86::VR128XRegClass.contains(DestReg) &&
      X86::GR32RegClass.contains(SrcReg))
    return HasAVX512 ? X86::VMOVDI2PDIZrr
           : HasAVX  ? X86::VMOVDI2PDIrr
                               bool RenamableDest, bool RenamableSrc) const {
  bool HasAVX = Subtarget.hasAVX();
  bool HasVLX = Subtarget.hasVLX();
  bool HasEGPR = Subtarget.hasEGPR();

  if (X86::GR64RegClass.contains(DestReg, SrcReg))
  else if (X86::GR32RegClass.contains(DestReg, SrcReg))
  else if (X86::GR16RegClass.contains(DestReg, SrcReg))
  else if (X86::GR8RegClass.contains(DestReg, SrcReg)) {
    if ((isHReg(DestReg) || isHReg(SrcReg)) && Subtarget.is64Bit()) {
      Opc = X86::MOV8rr_NOREX;
             "8-bit H register can not be copied outside GR8_NOREX");
  } else if (X86::VR64RegClass.contains(DestReg, SrcReg))
    Opc = X86::MMX_MOVQ64rr;
  else if (X86::VR128XRegClass.contains(DestReg, SrcReg)) {
      Opc = X86::VMOVAPSZ128rr;
    else if (X86::VR128RegClass.contains(DestReg, SrcReg))
      Opc = HasAVX ? X86::VMOVAPSrr : X86::MOVAPSrr;
      Opc = X86::VMOVAPSZrr;
          TRI->getMatchingSuperReg(DestReg, X86::sub_xmm, &X86::VR512RegClass);
          TRI->getMatchingSuperReg(SrcReg, X86::sub_xmm, &X86::VR512RegClass);
  } else if (X86::VR256XRegClass.contains(DestReg, SrcReg)) {
      Opc = X86::VMOVAPSZ256rr;
    else if (X86::VR256RegClass.contains(DestReg, SrcReg))
      Opc = X86::VMOVAPSYrr;
      Opc = X86::VMOVAPSZrr;
          TRI->getMatchingSuperReg(DestReg, X86::sub_ymm, &X86::VR512RegClass);
          TRI->getMatchingSuperReg(SrcReg, X86::sub_ymm, &X86::VR512RegClass);
  } else if (X86::VR512RegClass.contains(DestReg, SrcReg))
    Opc = X86::VMOVAPSZrr;
  else if (X86::VK16RegClass.contains(DestReg, SrcReg))
    Opc = Subtarget.hasBWI() ? (HasEGPR ? X86::KMOVQkk_EVEX : X86::KMOVQkk)
                             : (HasEGPR ? X86::KMOVWkk_EVEX : X86::KMOVWkk);

  if (SrcReg == X86::EFLAGS || DestReg == X86::EFLAGS) {

  LLVM_DEBUG(dbgs() << "Cannot copy " << RI.getName(SrcReg) << " to "
                    << RI.getName(DestReg) << '\n');
std::optional<DestSourcePair>
  if (MI.isMoveReg()) {
    if (MI.getOperand(0).isUndef() && MI.getOperand(0).getSubReg())
      return std::nullopt;
  return std::nullopt;

    return Load ? X86::VMOVSHZrm_alt : X86::VMOVSHZmr;
    return X86::MOVSHPrm;
  return X86::MOVSHPmr;
4409 bool IsStackAligned,
4411 bool HasAVX = STI.
hasAVX();
4413 bool HasVLX = STI.hasVLX();
4414 bool HasEGPR = STI.hasEGPR();
4416 assert(RC !=
nullptr &&
"Invalid target register class");
4421     assert(X86::GR8RegClass.hasSubClassEq(RC) && "Unknown 1-byte regclass");
4425     if (isHReg(Reg) || X86::GR8_ABCD_HRegClass.hasSubClassEq(RC))
4426 return Load ? X86::MOV8rm_NOREX : X86::MOV8mr_NOREX;
4427 return Load ? X86::MOV8rm : X86::MOV8mr;
4429 if (X86::VK16RegClass.hasSubClassEq(RC))
4430 return Load ? (HasEGPR ? X86::KMOVWkm_EVEX : X86::KMOVWkm)
4431 : (HasEGPR ? X86::KMOVWmk_EVEX : X86::KMOVWmk);
4432     assert(X86::GR16RegClass.hasSubClassEq(RC) && "Unknown 2-byte regclass");
4433 return Load ? X86::MOV16rm : X86::MOV16mr;
4435 if (X86::GR32RegClass.hasSubClassEq(RC))
4436 return Load ? X86::MOV32rm : X86::MOV32mr;
4437 if (X86::FR32XRegClass.hasSubClassEq(RC))
4438       return Load ? (HasAVX512 ? X86::VMOVSSZrm_alt
4439                      : HasAVX  ? X86::VMOVSSrm_alt
                                   : X86::MOVSSrm_alt)
4441                   : (HasAVX512 ? X86::VMOVSSZmr
4442                      : HasAVX  ? X86::VMOVSSmr
                                   : X86::MOVSSmr);
4444 if (X86::RFP32RegClass.hasSubClassEq(RC))
4445 return Load ? X86::LD_Fp32m : X86::ST_Fp32m;
4446 if (X86::VK32RegClass.hasSubClassEq(RC)) {
4447       assert(STI.hasBWI() && "KMOVD requires BWI");
4448 return Load ? (HasEGPR ? X86::KMOVDkm_EVEX : X86::KMOVDkm)
4449 : (HasEGPR ? X86::KMOVDmk_EVEX : X86::KMOVDmk);
4453 if (X86::VK1PAIRRegClass.hasSubClassEq(RC) ||
4454 X86::VK2PAIRRegClass.hasSubClassEq(RC) ||
4455 X86::VK4PAIRRegClass.hasSubClassEq(RC) ||
4456 X86::VK8PAIRRegClass.hasSubClassEq(RC) ||
4457 X86::VK16PAIRRegClass.hasSubClassEq(RC))
4458 return Load ? X86::MASKPAIR16LOAD : X86::MASKPAIR16STORE;
4459     if (X86::FR16RegClass.hasSubClassEq(RC) ||
4460         X86::FR16XRegClass.hasSubClassEq(RC))
           return getLoadStoreOpcodeForFP16(Load, STI);
4464 if (X86::GR64RegClass.hasSubClassEq(RC))
4465 return Load ? X86::MOV64rm : X86::MOV64mr;
4466 if (X86::FR64XRegClass.hasSubClassEq(RC))
4467       return Load ? (HasAVX512 ? X86::VMOVSDZrm_alt
4468                      : HasAVX  ? X86::VMOVSDrm_alt
                                   : X86::MOVSDrm_alt)
4470                   : (HasAVX512 ? X86::VMOVSDZmr
4471                      : HasAVX  ? X86::VMOVSDmr
                                   : X86::MOVSDmr);
4473 if (X86::VR64RegClass.hasSubClassEq(RC))
4474 return Load ? X86::MMX_MOVQ64rm : X86::MMX_MOVQ64mr;
4475 if (X86::RFP64RegClass.hasSubClassEq(RC))
4476 return Load ? X86::LD_Fp64m : X86::ST_Fp64m;
4477 if (X86::VK64RegClass.hasSubClassEq(RC)) {
4478       assert(STI.hasBWI() && "KMOVQ requires BWI");
4479 return Load ? (HasEGPR ? X86::KMOVQkm_EVEX : X86::KMOVQkm)
4480 : (HasEGPR ? X86::KMOVQmk_EVEX : X86::KMOVQmk);
4484     assert(X86::RFP80RegClass.hasSubClassEq(RC) && "Unknown 10-byte regclass");
4485 return Load ? X86::LD_Fp80m : X86::ST_FpP80m;
4487     if (X86::VR128XRegClass.hasSubClassEq(RC)) {
         // If the stack is realigned we can use aligned moves.
         if (IsStackAligned)
4490       return Load ? (HasVLX      ? X86::VMOVAPSZ128rm
4491                      : HasAVX512 ? X86::VMOVAPSZ128rm_NOVLX
4492                      : HasAVX    ? X86::VMOVAPSrm
                                      : X86::MOVAPSrm)
4494                   : (HasVLX      ? X86::VMOVAPSZ128mr
4495                      : HasAVX512 ? X86::VMOVAPSZ128mr_NOVLX
4496                      : HasAVX    ? X86::VMOVAPSmr
                                      : X86::MOVAPSmr);
         else
4499       return Load ? (HasVLX      ? X86::VMOVUPSZ128rm
4500                      : HasAVX512 ? X86::VMOVUPSZ128rm_NOVLX
4501                      : HasAVX    ? X86::VMOVUPSrm
                                      : X86::MOVUPSrm)
4503                   : (HasVLX      ? X86::VMOVUPSZ128mr
4504                      : HasAVX512 ? X86::VMOVUPSZ128mr_NOVLX
4505                      : HasAVX    ? X86::VMOVUPSmr
                                      : X86::MOVUPSmr);
4511     assert(X86::VR256XRegClass.hasSubClassEq(RC) && "Unknown 32-byte regclass");
         // If the stack is realigned we can use aligned moves.
         if (IsStackAligned)
4514       return Load ? (HasVLX      ? X86::VMOVAPSZ256rm
4515                      : HasAVX512 ? X86::VMOVAPSZ256rm_NOVLX
                                      : X86::VMOVAPSYrm)
4517                   : (HasVLX      ? X86::VMOVAPSZ256mr
4518                      : HasAVX512 ? X86::VMOVAPSZ256mr_NOVLX
                                      : X86::VMOVAPSYmr);
         else
4521       return Load ? (HasVLX      ? X86::VMOVUPSZ256rm
4522                      : HasAVX512 ? X86::VMOVUPSZ256rm_NOVLX
                                      : X86::VMOVUPSYrm)
4524                   : (HasVLX      ? X86::VMOVUPSZ256mr
4525                      : HasAVX512 ? X86::VMOVUPSZ256mr_NOVLX
                                      : X86::VMOVUPSYmr);
4528     assert(X86::VR512RegClass.hasSubClassEq(RC) && "Unknown 64-byte regclass");
4531 return Load ? X86::VMOVAPSZrm : X86::VMOVAPSZmr;
4533 return Load ? X86::VMOVUPSZrm : X86::VMOVUPSZmr;
4535     assert(X86::TILERegClass.hasSubClassEq(RC) && "Unknown 1024-byte regclass");
4536     assert(STI.hasAMXTILE() && "Using 8*1024-bit register requires AMX-TILE");
4537 #define GET_EGPR_IF_ENABLED(OPC) (STI.hasEGPR() ? OPC##_EVEX : OPC)
         return Load ? GET_EGPR_IF_ENABLED(X86::TILELOADD)
                     : GET_EGPR_IF_ENABLED(X86::TILESTORED);
4540 #undef GET_EGPR_IF_ENABLED
4542 assert(X86::TILEPAIRRegClass.hasSubClassEq(RC) &&
4543 "Unknown 2048-byte regclass");
4544     assert(STI.hasAMXTILE() && "Using 2048-bit register requires AMX-TILE");
4545 return Load ? X86::PTILEPAIRLOAD : X86::PTILEPAIRSTORE;
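// getAddrModeFromMemoryOp: recover an ExtAddrMode (base, scale, index,
// displacement) from a memory-accessing instruction, bailing out when the base
// is not a register or the displacement is not an immediate.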
4549 std::optional<ExtAddrMode>
4554 if (MemRefBegin < 0)
4555 return std::nullopt;
4560 if (!BaseOp.isReg())
4561 return std::nullopt;
4565   if (!DispMO.isImm())
4566 return std::nullopt;
4592     ErrInfo = "Scale factor in address must be 1, 2, 4 or 8";
4597     ErrInfo = "Displacement in address must fit into 32-bit signed "
                  "register";
4607                                            int64_t &ImmVal) const {
4613   if (MI.isSubregToReg()) {
4617     if (!MI.getOperand(1).isImm())
4619     unsigned FillBits = MI.getOperand(1).getImm();
4620     unsigned SubIdx = MI.getOperand(3).getImm();
4621     MovReg = MI.getOperand(2).getReg();
4622     if (SubIdx != X86::sub_32bit || FillBits != 0)
4625   MovMI = MRI.getUniqueVRegDef(MovReg);
4630   if (MovMI->getOpcode() == X86::MOV32r0 &&
4636   if (MovMI->getOpcode() != X86::MOV32ri &&
4650   if (!MI->modifiesRegister(NullValueReg, TRI))
4652   switch (MI->getOpcode()) {
4659     assert(MI->getOperand(0).isDef() && MI->getOperand(1).isUse() &&
4660            "expected for shift opcode!");
4661 return MI->getOperand(0).getReg() == NullValueReg &&
4662 MI->getOperand(1).getReg() == NullValueReg;
4667 return TRI->isSubRegisterEq(NullValueReg, MO.getReg());
4681 if (MemRefBegin < 0)
4688   if (!BaseOp->isReg())
4701   if (!DispMO.isImm())
4706   if (!BaseOp->isReg())
4709   OffsetIsScalable = false;
4713   Width = !MemOp.memoperands_empty() ? MemOp.memoperands().front()->getSize()
4721 bool IsStackAligned,
4736 case X86::TILELOADD:
4737 case X86::TILESTORED:
4738 case X86::TILELOADD_EVEX:
4739 case X86::TILESTORED_EVEX:
4740 case X86::PTILEPAIRLOAD:
4741 case X86::PTILEPAIRSTORE:
4749                                             bool isKill) const {
4753 case X86::TILESTORED:
4754 case X86::TILESTORED_EVEX:
4755 case X86::PTILEPAIRSTORE: {
4758 Register VirtReg = RegInfo.createVirtualRegister(&X86::GR64_NOSPRegClass);
4768 case X86::TILELOADD:
4769 case X86::TILELOADD_EVEX:
4770 case X86::PTILEPAIRLOAD: {
4773 Register VirtReg = RegInfo.createVirtualRegister(&X86::GR64_NOSPRegClass);
4793 "Stack slot too small for store");
4795   unsigned Alignment = std::max<uint32_t>(TRI->getSpillSize(*RC), 16);
4797       (Subtarget.getFrameLowering()->getStackAlign() >= Alignment) ||
4816          "Load size exceeds stack slot");
4817   unsigned Alignment = std::max<uint32_t>(TRI->getSpillSize(*RC), 16);
4819       (Subtarget.getFrameLowering()->getStackAlign() >= Alignment) ||
4831 Register &SrcReg2, int64_t &CmpMask,
4832                                  int64_t &CmpValue) const {
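  // Decompose CMP/SUB/TEST instructions into the compared registers and an
  // immediate mask/value so the compare can later be matched against an
  // earlier EFLAGS-defining instruction.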
4833   switch (MI.getOpcode()) {
4836   case X86::CMP64ri32:
4840     SrcReg = MI.getOperand(0).getReg();
4842     if (MI.getOperand(1).isImm()) {
4844       CmpValue = MI.getOperand(1).getImm();
4846       CmpMask = CmpValue = 0;
4854     SrcReg = MI.getOperand(1).getReg();
4863     SrcReg = MI.getOperand(1).getReg();
4864     SrcReg2 = MI.getOperand(2).getReg();
4872     SrcReg = MI.getOperand(1).getReg();
4874     if (MI.getOperand(2).isImm()) {
4876       CmpValue = MI.getOperand(2).getImm();
4878       CmpMask = CmpValue = 0;
4885     SrcReg = MI.getOperand(0).getReg();
4886     SrcReg2 = MI.getOperand(1).getReg();
4894     SrcReg = MI.getOperand(0).getReg();
4895     if (MI.getOperand(1).getReg() != SrcReg)
4902   case X86::TEST64ri32:
4906     SrcReg = MI.getOperand(0).getReg();
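// isRedundantFlagInstr: check whether an earlier flag-setting instruction
// computes the same comparison (possibly with swapped operands or an
// off-by-one immediate), so the later compare can be removed.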
4916 bool X86InstrInfo::isRedundantFlagInstr(const MachineInstr &FlagI,
4918                                         int64_t ImmMask, int64_t ImmValue,
4920                                         int64_t *ImmDelta) const {
4935 OIMask != ImmMask || OIValue != ImmValue)
4937 if (SrcReg == OISrcReg && SrcReg2 == OISrcReg2) {
4941 if (SrcReg == OISrcReg2 && SrcReg2 == OISrcReg) {
4947 case X86::CMP64ri32:
4951 case X86::TEST64ri32:
4962 case X86::TEST8rr: {
4969 SrcReg == OISrcReg && ImmMask == OIMask) {
4970 if (OIValue == ImmValue) {
4973     } else if (static_cast<uint64_t>(ImmValue) ==
4974                static_cast<uint64_t>(OIValue) - 1) {
4977     } else if (static_cast<uint64_t>(ImmValue) ==
4978                static_cast<uint64_t>(OIValue) + 1) {
4996 bool &ClearsOverflowFlag) {
4998   ClearsOverflowFlag = false;
5004   if (MI.getOpcode() == X86::ADD64rm || MI.getOpcode() == X86::ADD32rm) {
5005     unsigned Flags = MI.getOperand(5).getTargetFlags();
5011   switch (MI.getOpcode()) {
5107 case X86::LZCNT16rr:
5108 case X86::LZCNT16rm:
5109 case X86::LZCNT32rr:
5110 case X86::LZCNT32rm:
5111 case X86::LZCNT64rr:
5112 case X86::LZCNT64rm:
5113 case X86::POPCNT16rr:
5114 case X86::POPCNT16rm:
5115 case X86::POPCNT32rr:
5116 case X86::POPCNT32rm:
5117 case X86::POPCNT64rr:
5118 case X86::POPCNT64rm:
5119 case X86::TZCNT16rr:
5120 case X86::TZCNT16rm:
5121 case X86::TZCNT32rr:
5122 case X86::TZCNT32rm:
5123 case X86::TZCNT64rr:
5124 case X86::TZCNT64rm:
5170 case X86::BLSMSK32rr:
5171 case X86::BLSMSK32rm:
5172 case X86::BLSMSK64rr:
5173 case X86::BLSMSK64rm:
5178 case X86::BLCFILL32rr:
5179 case X86::BLCFILL32rm:
5180 case X86::BLCFILL64rr:
5181 case X86::BLCFILL64rm:
5186 case X86::BLCIC32rr:
5187 case X86::BLCIC32rm:
5188 case X86::BLCIC64rr:
5189 case X86::BLCIC64rm:
5190 case X86::BLCMSK32rr:
5191 case X86::BLCMSK32rm:
5192 case X86::BLCMSK64rr:
5193 case X86::BLCMSK64rm:
5198 case X86::BLSFILL32rr:
5199 case X86::BLSFILL32rm:
5200 case X86::BLSFILL64rr:
5201 case X86::BLSFILL64rm:
5202 case X86::BLSIC32rr:
5203 case X86::BLSIC32rm:
5204 case X86::BLSIC64rr:
5205 case X86::BLSIC64rm:
5210 case X86::T1MSKC32rr:
5211 case X86::T1MSKC32rm:
5212 case X86::T1MSKC64rr:
5213 case X86::T1MSKC64rm:
5214 case X86::TZMSK32rr:
5215 case X86::TZMSK32rm:
5216 case X86::TZMSK64rr:
5217 case X86::TZMSK64rm:
5221     ClearsOverflowFlag = true;
5223 case X86::BEXTR32rr:
5224 case X86::BEXTR64rr:
5225 case X86::BEXTR32rm:
5226 case X86::BEXTR64rm:
5227 case X86::BEXTRI32ri:
5228 case X86::BEXTRI32mi:
5229 case X86::BEXTRI64ri:
5230 case X86::BEXTRI64mi:
5241   switch (MI.getOpcode()) {
5249 case X86::LZCNT16rr:
5250 case X86::LZCNT32rr:
5251 case X86::LZCNT64rr:
5253 case X86::POPCNT16rr:
5254 case X86::POPCNT32rr:
5255 case X86::POPCNT64rr:
5257 case X86::TZCNT16rr:
5258 case X86::TZCNT32rr:
5259 case X86::TZCNT64rr:
5273 case X86::BLSMSK32rr:
5274 case X86::BLSMSK64rr:
5306 unsigned NewOpcode = 0;
5307#define FROM_TO(A, B) \
5308 CASE_ND(A) NewOpcode = X86::B; \
5332 if (NewOpcode == X86::CMP64rm || NewOpcode == X86::CMP32rm ||
5333 NewOpcode == X86::CMP16rm || NewOpcode == X86::CMP8rm)
5341 bool IsCmpZero = (CmpMask != 0 && CmpValue == 0);
5347   assert(SrcRegDef && "Must have a definition (SSA)");
5353   bool NoSignFlag = false;
5354   bool ClearsOverflowFlag = false;
5355   bool ShouldUpdateCC = false;
5356   bool IsSwapped = false;
5357 bool HasNF = Subtarget.hasNF();
5360 int64_t ImmDelta = 0;
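  // Scan backwards from the compare for an instruction that already sets
  // EFLAGS appropriately (the defining SUB/ADD/..., or an equivalent compare),
  // recording whether the operands were swapped or differ by a constant delta.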
5373 if (&Inst == SrcRegDef) {
5396 Subtarget, NoSignFlag, ClearsOverflowFlag)) {
5405     if (Inst.modifiesRegister(X86::EFLAGS, TRI)) {
5416         Inst.getOperand(OpNo).getReg() == SrcReg) {
5417       ShouldUpdateCC = true;
5428     if (isRedundantFlagInstr(CmpInstr, SrcReg, SrcReg2, CmpMask, CmpValue,
5429                              Inst, &IsSwapped, &ImmDelta)) {
5437     if (!Movr0Inst && Inst.getOpcode() == X86::MOV32r0 &&
5438         Inst.registerDefIsDead(X86::EFLAGS, TRI)) {
5452     if (HasNF && Inst.registerDefIsDead(X86::EFLAGS, TRI) && !IsWithReloc) {
5457       InstsToUpdate.push_back(std::make_pair(&Inst, NewOp));
5471     if (MBB->pred_size() != 1)
5473     MBB = *MBB->pred_begin();
5474     From = MBB->rbegin();
5481   bool FlagsMayLiveOut = true;
5486     bool ModifyEFLAGS = Instr.modifiesRegister(X86::EFLAGS, TRI);
5487     bool UseEFLAGS = Instr.readsRegister(X86::EFLAGS, TRI);
5489     if (!UseEFLAGS && ModifyEFLAGS) {
5491       FlagsMayLiveOut = false;
5494 if (!UseEFLAGS && !ModifyEFLAGS)
5525 if (!ClearsOverflowFlag)
5544 ReplacementCC = NewCC;
5550   } else if (IsSwapped) {
5557     ShouldUpdateCC = true;
5558   } else if (ImmDelta != 0) {
5559     unsigned BitWidth = TRI->getRegSizeInBits(*MRI->getRegClass(SrcReg));
5569       if (ImmDelta != 1 || CmpValue == 0)
5579       if (ImmDelta != 1 || CmpValue == 0)
5606     ShouldUpdateCC = true;
5609     if (ShouldUpdateCC && ReplacementCC != OldCC) {
5613       OpsToUpdate.push_back(std::make_pair(&Instr, ReplacementCC));
5615     if (ModifyEFLAGS || Instr.killsRegister(X86::EFLAGS, TRI)) {
5617       FlagsMayLiveOut = false;
5624   if ((MI != nullptr || ShouldUpdateCC) && FlagsMayLiveOut) {
5631   assert((MI == nullptr || Sub == nullptr) && "Should not have Sub and MI set");
5638     if (&CmpMBB != SubBB)
5642     InsertE = Sub->getParent()->rend();
5643     for (; InsertI != InsertE; ++InsertI) {
5645       if (!Instr->readsRegister(X86::EFLAGS, TRI) &&
5646           Instr->modifiesRegister(X86::EFLAGS, TRI)) {
5653     if (InsertI == InsertE)
5658   for (auto &Inst : InstsToUpdate) {
5659     Inst.first->setDesc(get(Inst.second));
5660     Inst.first->removeOperand(
5661         Inst.first->findRegisterDefOperandIdx(X86::EFLAGS, nullptr));
5666       Sub->findRegisterDefOperand(X86::EFLAGS, nullptr);
5667   assert(FlagDef && "Unable to locate a def EFLAGS operand");
5673   for (auto &Op : OpsToUpdate) {
5674     Op.first->getOperand(Op.first->getDesc().getNumOperands() - 1)
5679        MBB = *MBB->pred_begin()) {
5680     assert(MBB->pred_size() == 1 && "Expected exactly one predecessor");
5681     if (!MBB->isLiveIn(X86::EFLAGS))
5682       MBB->addLiveIn(X86::EFLAGS);
5710#define FROM_TO(FROM, TO) \
5713 case X86::FROM##_ND: \
5714 return X86::TO##_ND;
5744#define FROM_TO(FROM, TO) \
5748 FROM_TO(CTEST64rr, CTEST64ri32)
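// foldImmediateImpl: fold a materialized immediate (e.g. MOV32ri/MOV64ri) into
// its single non-debug use, rewriting the user to an immediate form, or into a
// plain immediate move when the user is a COPY.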
5767                                       bool MakeChange) const {
5773   const TargetRegisterClass *RC = nullptr;
5775     RC = MRI->getRegClass(Reg);
5777       (Reg.isVirtual() && X86::GR64RegClass.hasSubClassEq(RC))) {
5782   if (UseMI.findRegisterUseOperand(Reg, nullptr)->getSubReg())
5787       !MRI->hasOneNonDBGUse(Reg))
5792   if (Opc == TargetOpcode::COPY) {
5794     const TargetRegisterClass *RC = nullptr;
5796       RC = MRI->getRegClass(ToReg);
5797     bool GR32Reg = (ToReg.isVirtual() && X86::GR32RegClass.hasSubClassEq(RC)) ||
5799     bool GR64Reg = (ToReg.isVirtual() && X86::GR64RegClass.hasSubClassEq(RC)) ||
5801     bool GR8Reg = (ToReg.isVirtual() && X86::GR8RegClass.hasSubClassEq(RC)) ||
5812         NewOpc = X86::MOV32ri64;
5814         NewOpc = X86::MOV64ri;
5815     } else if (GR32Reg) {
5816       NewOpc = X86::MOV32ri;
5820       if (UseMI.getParent()->computeRegisterLiveness(
5829         UseMI.removeOperand(
5830             UseMI.findRegisterUseOperandIdx(Reg, nullptr));
5838       NewOpc = X86::MOV8ri;
5848   if ((NewOpc == X86::SUB64ri32 || NewOpc == X86::SUB32ri ||
5849        NewOpc == X86::SBB64ri32 || NewOpc == X86::SBB32ri ||
5850        NewOpc == X86::SUB64ri32_ND || NewOpc == X86::SUB32ri_ND ||
5851        NewOpc == X86::SBB64ri32_ND || NewOpc == X86::SBB32ri_ND) &&
5852       UseMI.findRegisterUseOperandIdx(Reg, nullptr) != 2)
5855   if (((NewOpc == X86::CMP64ri32 || NewOpc == X86::CMP32ri) ||
5856        (NewOpc == X86::CCMP64ri32 || NewOpc == X86::CCMP32ri)) &&
5857       UseMI.findRegisterUseOperandIdx(Reg, nullptr) != 1)
5860   using namespace X86;
5861   if (isSHL(Opc) || isSHR(Opc) || isSAR(Opc) || isROL(Opc) || isROR(Opc) ||
5862       isRCL(Opc) || isRCR(Opc)) {
5863     unsigned RegIdx = UseMI.findRegisterUseOperandIdx(Reg, nullptr);
5873     UseMI.removeOperand(RegIdx);
5887       UseMI.registerDefIsDead(X86::EFLAGS, nullptr)) {
5891     UseMI.setDesc(get(TargetOpcode::COPY));
5892     UseMI.removeOperand(
5893         UseMI.findRegisterUseOperandIdx(Reg, nullptr));
5894     UseMI.removeOperand(
5895         UseMI.findRegisterDefOperandIdx(X86::EFLAGS, nullptr));
5896     UseMI.untieRegOperand(0);
5900   unsigned Op1 = 1, Op2 = CommuteAnyOperandIndex;
5901   unsigned ImmOpNum = 2;
5902   if (!UseMI.getOperand(0).isDef()) {
5906   if (Opc == TargetOpcode::COPY)
5910     commuteInstruction(UseMI);
5914   UseMI.getOperand(ImmOpNum).ChangeToImmediate(ImmVal);
5932   return foldImmediateImpl(UseMI, &DefMI, Reg, ImmVal, MRI, true);
5944   assert(Desc.getNumOperands() == 3 && "Expected two-addr instruction.");
5964   assert(Desc.getNumOperands() == 3 && "Expected two-addr instruction.");
5982   MIB->setDesc(TII.get(MinusOne ? X86::DEC32r : X86::INC32r));
5994   assert(Imm != 0 && "Using push/pop for 0 is not efficient.");
5997   int StackAdjustment;
5999   if (Subtarget.is64Bit()) {
6001            MIB->getOpcode() == X86::MOV32ImmSExti8);
6015     StackAdjustment = 8;
6021     StackAdjustment = 4;
6033   bool EmitCFI = !TFL->hasFP(MF) && NeedsDwarfCFI;
6080       MIB->getOpcode() == X86::XOR64_FP ? X86::XOR64rr : X86::XOR32rr;
6092                             const MCInstrDesc &BroadcastDesc, unsigned SubIdx) {
6095   if (TRI->getEncodingValue(DestReg) < 16) {
6102   DestReg = TRI->getMatchingSuperReg(DestReg, SubIdx, &X86::VR512RegClass);
6114                            const MCInstrDesc &ExtractDesc, unsigned SubIdx) {
6117   if (TRI->getEncodingValue(SrcReg) < 16) {
6124   SrcReg = TRI->getMatchingSuperReg(SrcReg, SubIdx, &X86::VR512RegClass);
6147   if (MI.getOpcode() == X86::MOVSHPrm) {
6148     NewOpc = HasAVX ? X86::VMOVSSrm : X86::MOVSSrm;
6150     if (Reg > X86::XMM15)
6151       NewOpc = X86::VMOVSSZrm;
6153     NewOpc = HasAVX ? X86::VMOVSSmr : X86::MOVSSmr;
6155     if (Reg > X86::XMM15)
6156       NewOpc = X86::VMOVSSZmr;
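// expandPostRAPseudo: lower X86 pseudo instructions (zero/all-ones idioms,
// MOV32ri64, RDFLAGS/WRFLAGS, the NOVLX spill forms, ...) into real machine
// instructions after register allocation.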
6164 bool HasAVX = Subtarget.hasAVX();
6166   switch (MI.getOpcode()) {
6173 case X86::MOV32ImmSExti8:
6174 case X86::MOV64ImmSExti8:
6176 case X86::SETB_C32r:
6178 case X86::SETB_C64r:
6186 case X86::FsFLD0F128:
6188 case X86::AVX_SET0: {
6189     assert(HasAVX && "AVX not supported");
6192     Register XReg = TRI->getSubReg(SrcReg, X86::sub_xmm);
6198 case X86::AVX512_128_SET0:
6199 case X86::AVX512_FsFLD0SH:
6200 case X86::AVX512_FsFLD0SS:
6201 case X86::AVX512_FsFLD0SD:
6202 case X86::AVX512_FsFLD0F128: {
6203 bool HasVLX = Subtarget.hasVLX();
6206     if (HasVLX || TRI->getEncodingValue(SrcReg) < 16)
6208 get(HasVLX ? X86::VPXORDZ128rr : X86::VXORPSrr));
6211 TRI->getMatchingSuperReg(SrcReg, X86::sub_xmm, &X86::VR512RegClass);
6215 case X86::AVX512_256_SET0:
6216 case X86::AVX512_512_SET0: {
6217 bool HasVLX = Subtarget.hasVLX();
6220     if (HasVLX || TRI->getEncodingValue(SrcReg) < 16) {
6221       Register XReg = TRI->getSubReg(SrcReg, X86::sub_xmm);
6227       if (MI.getOpcode() == X86::AVX512_256_SET0) {
6230 TRI->getMatchingSuperReg(SrcReg, X86::sub_ymm, &X86::VR512RegClass);
6238 case X86::V_SETALLONES:
6240 get(HasAVX ? X86::VPCMPEQDrr : X86::PCMPEQDrr));
6241 case X86::AVX2_SETALLONES:
6243 case X86::AVX1_SETALLONES: {
6250 case X86::AVX512_512_SETALLONES: {
6261 case X86::AVX512_512_SEXT_MASK_32:
6262 case X86::AVX512_512_SEXT_MASK_64: {
6266     unsigned Opc = (MI.getOpcode() == X86::AVX512_512_SEXT_MASK_64)
6267                        ? X86::VPTERNLOGQZrrikz
6268                        : X86::VPTERNLOGDZrrikz;
6269     MI.removeOperand(1);
6274         .addReg(MaskReg, MaskState)
6280 case X86::VMOVAPSZ128rm_NOVLX:
6282 get(X86::VBROADCASTF32X4Zrm), X86::sub_xmm);
6283 case X86::VMOVUPSZ128rm_NOVLX:
6285 get(X86::VBROADCASTF32X4Zrm), X86::sub_xmm);
6286 case X86::VMOVAPSZ256rm_NOVLX:
6288 get(X86::VBROADCASTF64X4Zrm), X86::sub_ymm);
6289 case X86::VMOVUPSZ256rm_NOVLX:
6291 get(X86::VBROADCASTF64X4Zrm), X86::sub_ymm);
6292 case X86::VMOVAPSZ128mr_NOVLX:
6294 get(X86::VEXTRACTF32X4Zmri), X86::sub_xmm);
6295 case X86::VMOVUPSZ128mr_NOVLX:
6297 get(X86::VEXTRACTF32X4Zmri), X86::sub_xmm);
6298 case X86::VMOVAPSZ256mr_NOVLX:
6300 get(X86::VEXTRACTF64X4Zmri), X86::sub_ymm);
6301 case X86::VMOVUPSZ256mr_NOVLX:
6303 get(X86::VEXTRACTF64X4Zmri), X86::sub_ymm);
6304 case X86::MOV32ri64: {
6306 Register Reg32 = RI.getSubReg(Reg, X86::sub_32bit);
6307     MI.setDesc(get(X86::MOV32ri));
6313 case X86::RDFLAGS32:
6314 case X86::RDFLAGS64: {
6315     unsigned Is64Bit = MI.getOpcode() == X86::RDFLAGS64;
6319                  get(Is64Bit ? X86::PUSHF64 : X86::PUSHF32))
6327            "Unexpected register in operand! Should be EFLAGS.");
6330            "Unexpected register in operand! Should be DF.");
6333     MIB->setDesc(get(Is64Bit ? X86::POP64r : X86::POP32r));
6337   case X86::WRFLAGS32:
6338   case X86::WRFLAGS64: {
6339     unsigned Is64Bit = MI.getOpcode() == X86::WRFLAGS64;
6343             get(Is64Bit ? X86::PUSH64r : X86::PUSH32r))
6344         .addReg(MI.getOperand(0).getReg());
6346 get(Is64Bit ? X86::POPF64 : X86::POPF32));
6347 MI.eraseFromParent();
6370 case TargetOpcode::LOAD_STACK_GUARD:
6376 case X86::SHLDROT32ri:
6378 case X86::SHLDROT64ri:
6380 case X86::SHRDROT32ri:
6382 case X86::SHRDROT64ri:
6384 case X86::ADD8rr_DB:
6387 case X86::ADD16rr_DB:
6390 case X86::ADD32rr_DB:
6393 case X86::ADD64rr_DB:
6396 case X86::ADD8ri_DB:
6399 case X86::ADD16ri_DB:
6402 case X86::ADD32ri_DB:
6405 case X86::ADD64ri32_DB:
6429                                   bool ForLoadFold = false) {
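  // The opcodes below only update part of their destination register, so they
  // carry a false dependency on the previous value unless it is broken.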
6431 case X86::CVTSI2SSrr:
6432 case X86::CVTSI2SSrm:
6433 case X86::CVTSI642SSrr:
6434 case X86::CVTSI642SSrm:
6435 case X86::CVTSI2SDrr:
6436 case X86::CVTSI2SDrm:
6437 case X86::CVTSI642SDrr:
6438 case X86::CVTSI642SDrm:
6441 return !ForLoadFold;
6442 case X86::CVTSD2SSrr:
6443 case X86::CVTSD2SSrm:
6444 case X86::CVTSS2SDrr:
6445 case X86::CVTSS2SDrm:
6452 case X86::RCPSSr_Int:
6453 case X86::RCPSSm_Int:
6454 case X86::ROUNDSDri:
6455 case X86::ROUNDSDmi:
6456 case X86::ROUNDSSri:
6457 case X86::ROUNDSSmi:
6460 case X86::RSQRTSSr_Int:
6461 case X86::RSQRTSSm_Int:
6464 case X86::SQRTSSr_Int:
6465 case X86::SQRTSSm_Int:
6468 case X86::SQRTSDr_Int:
6469 case X86::SQRTSDm_Int:
6471 case X86::VFCMULCPHZ128rm:
6472 case X86::VFCMULCPHZ128rmb:
6473 case X86::VFCMULCPHZ128rmbkz:
6474 case X86::VFCMULCPHZ128rmkz:
6475 case X86::VFCMULCPHZ128rr:
6476 case X86::VFCMULCPHZ128rrkz:
6477 case X86::VFCMULCPHZ256rm:
6478 case X86::VFCMULCPHZ256rmb:
6479 case X86::VFCMULCPHZ256rmbkz:
6480 case X86::VFCMULCPHZ256rmkz:
6481 case X86::VFCMULCPHZ256rr:
6482 case X86::VFCMULCPHZ256rrkz:
6483 case X86::VFCMULCPHZrm:
6484 case X86::VFCMULCPHZrmb:
6485 case X86::VFCMULCPHZrmbkz:
6486 case X86::VFCMULCPHZrmkz:
6487 case X86::VFCMULCPHZrr:
6488 case X86::VFCMULCPHZrrb:
6489 case X86::VFCMULCPHZrrbkz:
6490 case X86::VFCMULCPHZrrkz:
6491 case X86::VFMULCPHZ128rm:
6492 case X86::VFMULCPHZ128rmb:
6493 case X86::VFMULCPHZ128rmbkz:
6494 case X86::VFMULCPHZ128rmkz:
6495 case X86::VFMULCPHZ128rr:
6496 case X86::VFMULCPHZ128rrkz:
6497 case X86::VFMULCPHZ256rm:
6498 case X86::VFMULCPHZ256rmb:
6499 case X86::VFMULCPHZ256rmbkz:
6500 case X86::VFMULCPHZ256rmkz:
6501 case X86::VFMULCPHZ256rr:
6502 case X86::VFMULCPHZ256rrkz:
6503 case X86::VFMULCPHZrm:
6504 case X86::VFMULCPHZrmb:
6505 case X86::VFMULCPHZrmbkz:
6506 case X86::VFMULCPHZrmkz:
6507 case X86::VFMULCPHZrr:
6508 case X86::VFMULCPHZrrb:
6509 case X86::VFMULCPHZrrbkz:
6510 case X86::VFMULCPHZrrkz:
6511 case X86::VFCMULCSHZrm:
6512 case X86::VFCMULCSHZrmkz:
6513 case X86::VFCMULCSHZrr:
6514 case X86::VFCMULCSHZrrb:
6515 case X86::VFCMULCSHZrrbkz:
6516 case X86::VFCMULCSHZrrkz:
6517 case X86::VFMULCSHZrm:
6518 case X86::VFMULCSHZrmkz:
6519 case X86::VFMULCSHZrr:
6520 case X86::VFMULCSHZrrb:
6521 case X86::VFMULCSHZrrbkz:
6522 case X86::VFMULCSHZrrkz:
6523 return Subtarget.hasMULCFalseDeps();
6524 case X86::VPERMDYrm:
6525 case X86::VPERMDYrr:
6526 case X86::VPERMQYmi:
6527 case X86::VPERMQYri:
6528 case X86::VPERMPSYrm:
6529 case X86::VPERMPSYrr:
6530 case X86::VPERMPDYmi:
6531 case X86::VPERMPDYri:
6532 case X86::VPERMDZ256rm:
6533 case X86::VPERMDZ256rmb:
6534 case X86::VPERMDZ256rmbkz:
6535 case X86::VPERMDZ256rmkz:
6536 case X86::VPERMDZ256rr:
6537 case X86::VPERMDZ256rrkz:
6538 case X86::VPERMDZrm:
6539 case X86::VPERMDZrmb:
6540 case X86::VPERMDZrmbkz:
6541 case X86::VPERMDZrmkz:
6542 case X86::VPERMDZrr:
6543 case X86::VPERMDZrrkz:
6544 case X86::VPERMQZ256mbi:
6545 case X86::VPERMQZ256mbikz:
6546 case X86::VPERMQZ256mi:
6547 case X86::VPERMQZ256mikz:
6548 case X86::VPERMQZ256ri:
6549 case X86::VPERMQZ256rikz:
6550 case X86::VPERMQZ256rm:
6551 case X86::VPERMQZ256rmb:
6552 case X86::VPERMQZ256rmbkz:
6553 case X86::VPERMQZ256rmkz:
6554 case X86::VPERMQZ256rr:
6555 case X86::VPERMQZ256rrkz:
6556 case X86::VPERMQZmbi:
6557 case X86::VPERMQZmbikz:
6558 case X86::VPERMQZmi:
6559 case X86::VPERMQZmikz:
6560 case X86::VPERMQZri:
6561 case X86::VPERMQZrikz:
6562 case X86::VPERMQZrm:
6563 case X86::VPERMQZrmb:
6564 case X86::VPERMQZrmbkz:
6565 case X86::VPERMQZrmkz:
6566 case X86::VPERMQZrr:
6567 case X86::VPERMQZrrkz:
6568 case X86::VPERMPSZ256rm:
6569 case X86::VPERMPSZ256rmb:
6570 case X86::VPERMPSZ256rmbkz:
6571 case X86::VPERMPSZ256rmkz:
6572 case X86::VPERMPSZ256rr:
6573 case X86::VPERMPSZ256rrkz:
6574 case X86::VPERMPSZrm:
6575 case X86::VPERMPSZrmb:
6576 case X86::VPERMPSZrmbkz:
6577 case X86::VPERMPSZrmkz:
6578 case X86::VPERMPSZrr:
6579 case X86::VPERMPSZrrkz:
6580 case X86::VPERMPDZ256mbi:
6581 case X86::VPERMPDZ256mbikz:
6582 case X86::VPERMPDZ256mi:
6583 case X86::VPERMPDZ256mikz:
6584 case X86::VPERMPDZ256ri:
6585 case X86::VPERMPDZ256rikz:
6586 case X86::VPERMPDZ256rm:
6587 case X86::VPERMPDZ256rmb:
6588 case X86::VPERMPDZ256rmbkz:
6589 case X86::VPERMPDZ256rmkz:
6590 case X86::VPERMPDZ256rr:
6591 case X86::VPERMPDZ256rrkz:
6592 case X86::VPERMPDZmbi:
6593 case X86::VPERMPDZmbikz:
6594 case X86::VPERMPDZmi:
6595 case X86::VPERMPDZmikz:
6596 case X86::VPERMPDZri:
6597 case X86::VPERMPDZrikz:
6598 case X86::VPERMPDZrm:
6599 case X86::VPERMPDZrmb:
6600 case X86::VPERMPDZrmbkz:
6601 case X86::VPERMPDZrmkz:
6602 case X86::VPERMPDZrr:
6603 case X86::VPERMPDZrrkz:
6604 return Subtarget.hasPERMFalseDeps();
6605 case X86::VRANGEPDZ128rmbi:
6606 case X86::VRANGEPDZ128rmbikz:
6607 case X86::VRANGEPDZ128rmi:
6608 case X86::VRANGEPDZ128rmikz:
6609 case X86::VRANGEPDZ128rri:
6610 case X86::VRANGEPDZ128rrikz:
6611 case X86::VRANGEPDZ256rmbi:
6612 case X86::VRANGEPDZ256rmbikz:
6613 case X86::VRANGEPDZ256rmi:
6614 case X86::VRANGEPDZ256rmikz:
6615 case X86::VRANGEPDZ256rri:
6616 case X86::VRANGEPDZ256rrikz:
6617 case X86::VRANGEPDZrmbi:
6618 case X86::VRANGEPDZrmbikz:
6619 case X86::VRANGEPDZrmi:
6620 case X86::VRANGEPDZrmikz:
6621 case X86::VRANGEPDZrri:
6622 case X86::VRANGEPDZrrib:
6623 case X86::VRANGEPDZrribkz:
6624 case X86::VRANGEPDZrrikz:
6625 case X86::VRANGEPSZ128rmbi:
6626 case X86::VRANGEPSZ128rmbikz:
6627 case X86::VRANGEPSZ128rmi:
6628 case X86::VRANGEPSZ128rmikz:
6629 case X86::VRANGEPSZ128rri:
6630 case X86::VRANGEPSZ128rrikz:
6631 case X86::VRANGEPSZ256rmbi:
6632 case X86::VRANGEPSZ256rmbikz:
6633 case X86::VRANGEPSZ256rmi:
6634 case X86::VRANGEPSZ256rmikz:
6635 case X86::VRANGEPSZ256rri:
6636 case X86::VRANGEPSZ256rrikz:
6637 case X86::VRANGEPSZrmbi:
6638 case X86::VRANGEPSZrmbikz:
6639 case X86::VRANGEPSZrmi:
6640 case X86::VRANGEPSZrmikz:
6641 case X86::VRANGEPSZrri:
6642 case X86::VRANGEPSZrrib:
6643 case X86::VRANGEPSZrribkz:
6644 case X86::VRANGEPSZrrikz:
6645 case X86::VRANGESDZrmi:
6646 case X86::VRANGESDZrmikz:
6647 case X86::VRANGESDZrri:
6648 case X86::VRANGESDZrrib:
6649 case X86::VRANGESDZrribkz:
6650 case X86::VRANGESDZrrikz:
6651 case X86::VRANGESSZrmi:
6652 case X86::VRANGESSZrmikz:
6653 case X86::VRANGESSZrri:
6654 case X86::VRANGESSZrrib:
6655 case X86::VRANGESSZrribkz:
6656 case X86::VRANGESSZrrikz:
6657 return Subtarget.hasRANGEFalseDeps();
6658 case X86::VGETMANTSSZrmi:
6659 case X86::VGETMANTSSZrmikz:
6660 case X86::VGETMANTSSZrri:
6661 case X86::VGETMANTSSZrrib:
6662 case X86::VGETMANTSSZrribkz:
6663 case X86::VGETMANTSSZrrikz:
6664 case X86::VGETMANTSDZrmi:
6665 case X86::VGETMANTSDZrmikz:
6666 case X86::VGETMANTSDZrri:
6667 case X86::VGETMANTSDZrrib:
6668 case X86::VGETMANTSDZrribkz:
6669 case X86::VGETMANTSDZrrikz:
6670 case X86::VGETMANTSHZrmi:
6671 case X86::VGETMANTSHZrmikz:
6672 case X86::VGETMANTSHZrri:
6673 case X86::VGETMANTSHZrrib:
6674 case X86::VGETMANTSHZrribkz:
6675 case X86::VGETMANTSHZrrikz:
6676 case X86::VGETMANTPSZ128rmbi:
6677 case X86::VGETMANTPSZ128rmbikz:
6678 case X86::VGETMANTPSZ128rmi:
6679 case X86::VGETMANTPSZ128rmikz:
6680 case X86::VGETMANTPSZ256rmbi:
6681 case X86::VGETMANTPSZ256rmbikz:
6682 case X86::VGETMANTPSZ256rmi:
6683 case X86::VGETMANTPSZ256rmikz:
6684 case X86::VGETMANTPSZrmbi:
6685 case X86::VGETMANTPSZrmbikz:
6686 case X86::VGETMANTPSZrmi:
6687 case X86::VGETMANTPSZrmikz:
6688 case X86::VGETMANTPDZ128rmbi:
6689 case X86::VGETMANTPDZ128rmbikz:
6690 case X86::VGETMANTPDZ128rmi:
6691 case X86::VGETMANTPDZ128rmikz:
6692 case X86::VGETMANTPDZ256rmbi:
6693 case X86::VGETMANTPDZ256rmbikz:
6694 case X86::VGETMANTPDZ256rmi:
6695 case X86::VGETMANTPDZ256rmikz:
6696 case X86::VGETMANTPDZrmbi:
6697 case X86::VGETMANTPDZrmbikz:
6698 case X86::VGETMANTPDZrmi:
6699 case X86::VGETMANTPDZrmikz:
6700 return Subtarget.hasGETMANTFalseDeps();
6701 case X86::VPMULLQZ128rm:
6702 case X86::VPMULLQZ128rmb:
6703 case X86::VPMULLQZ128rmbkz:
6704 case X86::VPMULLQZ128rmkz:
6705 case X86::VPMULLQZ128rr:
6706 case X86::VPMULLQZ128rrkz:
6707 case X86::VPMULLQZ256rm:
6708 case X86::VPMULLQZ256rmb:
6709 case X86::VPMULLQZ256rmbkz:
6710 case X86::VPMULLQZ256rmkz:
6711 case X86::VPMULLQZ256rr:
6712 case X86::VPMULLQZ256rrkz:
6713 case X86::VPMULLQZrm:
6714 case X86::VPMULLQZrmb:
6715 case X86::VPMULLQZrmbkz:
6716 case X86::VPMULLQZrmkz:
6717 case X86::VPMULLQZrr:
6718 case X86::VPMULLQZrrkz:
6719 return Subtarget.hasMULLQFalseDeps();
6721 case X86::POPCNT32rm:
6722 case X86::POPCNT32rr:
6723 case X86::POPCNT64rm:
6724 case X86::POPCNT64rr:
6725 return Subtarget.hasPOPCNTFalseDeps();
6726 case X86::LZCNT32rm:
6727 case X86::LZCNT32rr:
6728 case X86::LZCNT64rm:
6729 case X86::LZCNT64rr:
6730 case X86::TZCNT32rm:
6731 case X86::TZCNT32rr:
6732 case X86::TZCNT64rm:
6733 case X86::TZCNT64rr:
6734 return Subtarget.hasLZCNTFalseDeps();
6751   bool HasNDDPartialWrite = false;
6754 if (!Reg.isVirtual())
6755 HasNDDPartialWrite =
6756 X86::GR8RegClass.contains(Reg) || X86::GR16RegClass.contains(Reg);
6769     bool ReadsReg = false;
6770     if (Reg.isVirtual())
6771       ReadsReg = (MO.readsReg() || MI.readsVirtualRegister(Reg));
6773       ReadsReg = MI.readsRegister(Reg, TRI);
6774 if (ReadsReg != HasNDDPartialWrite)
6788                               bool ForLoadFold = false) {
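  // The opcodes below have an input operand (identified by OpNum) that still
  // creates a false dependency when it is undef, so it is worth breaking.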
6791 case X86::MMX_PUNPCKHBWrr:
6792 case X86::MMX_PUNPCKHWDrr:
6793 case X86::MMX_PUNPCKHDQrr:
6794 case X86::MMX_PUNPCKLBWrr:
6795 case X86::MMX_PUNPCKLWDrr:
6796 case X86::MMX_PUNPCKLDQrr:
6797 case X86::MOVHLPSrr:
6798 case X86::PACKSSWBrr:
6799 case X86::PACKUSWBrr:
6800 case X86::PACKSSDWrr:
6801 case X86::PACKUSDWrr:
6802 case X86::PUNPCKHBWrr:
6803 case X86::PUNPCKLBWrr:
6804 case X86::PUNPCKHWDrr:
6805 case X86::PUNPCKLWDrr:
6806 case X86::PUNPCKHDQrr:
6807 case X86::PUNPCKLDQrr:
6808 case X86::PUNPCKHQDQrr:
6809 case X86::PUNPCKLQDQrr:
6810 case X86::SHUFPDrri:
6811 case X86::SHUFPSrri:
6817 return OpNum == 2 && !ForLoadFold;
6819 case X86::VMOVLHPSrr:
6820 case X86::VMOVLHPSZrr:
6821 case X86::VPACKSSWBrr:
6822 case X86::VPACKUSWBrr:
6823 case X86::VPACKSSDWrr:
6824 case X86::VPACKUSDWrr:
6825 case X86::VPACKSSWBZ128rr:
6826 case X86::VPACKUSWBZ128rr:
6827 case X86::VPACKSSDWZ128rr:
6828 case X86::VPACKUSDWZ128rr:
6829 case X86::VPERM2F128rri:
6830 case X86::VPERM2I128rri:
6831 case X86::VSHUFF32X4Z256rri:
6832 case X86::VSHUFF32X4Zrri:
6833 case X86::VSHUFF64X2Z256rri:
6834 case X86::VSHUFF64X2Zrri:
6835 case X86::VSHUFI32X4Z256rri:
6836 case X86::VSHUFI32X4Zrri:
6837 case X86::VSHUFI64X2Z256rri:
6838 case X86::VSHUFI64X2Zrri:
6839 case X86::VPUNPCKHBWrr:
6840 case X86::VPUNPCKLBWrr:
6841 case X86::VPUNPCKHBWYrr:
6842 case X86::VPUNPCKLBWYrr:
6843 case X86::VPUNPCKHBWZ128rr:
6844 case X86::VPUNPCKLBWZ128rr:
6845 case X86::VPUNPCKHBWZ256rr:
6846 case X86::VPUNPCKLBWZ256rr:
6847 case X86::VPUNPCKHBWZrr:
6848 case X86::VPUNPCKLBWZrr:
6849 case X86::VPUNPCKHWDrr:
6850 case X86::VPUNPCKLWDrr:
6851 case X86::VPUNPCKHWDYrr:
6852 case X86::VPUNPCKLWDYrr:
6853 case X86::VPUNPCKHWDZ128rr:
6854 case X86::VPUNPCKLWDZ128rr:
6855 case X86::VPUNPCKHWDZ256rr:
6856 case X86::VPUNPCKLWDZ256rr:
6857 case X86::VPUNPCKHWDZrr:
6858 case X86::VPUNPCKLWDZrr:
6859 case X86::VPUNPCKHDQrr:
6860 case X86::VPUNPCKLDQrr:
6861 case X86::VPUNPCKHDQYrr:
6862 case X86::VPUNPCKLDQYrr:
6863 case X86::VPUNPCKHDQZ128rr:
6864 case X86::VPUNPCKLDQZ128rr:
6865 case X86::VPUNPCKHDQZ256rr:
6866 case X86::VPUNPCKLDQZ256rr:
6867 case X86::VPUNPCKHDQZrr:
6868 case X86::VPUNPCKLDQZrr:
6869 case X86::VPUNPCKHQDQrr:
6870 case X86::VPUNPCKLQDQrr:
6871 case X86::VPUNPCKHQDQYrr:
6872 case X86::VPUNPCKLQDQYrr:
6873 case X86::VPUNPCKHQDQZ128rr:
6874 case X86::VPUNPCKLQDQZ128rr:
6875 case X86::VPUNPCKHQDQZ256rr:
6876 case X86::VPUNPCKLQDQZ256rr:
6877 case X86::VPUNPCKHQDQZrr:
6878 case X86::VPUNPCKLQDQZrr:
6882 return (OpNum == 1 || OpNum == 2) && !ForLoadFold;
6884 case X86::VCVTSI2SSrr:
6885 case X86::VCVTSI2SSrm:
6886 case X86::VCVTSI2SSrr_Int:
6887 case X86::VCVTSI2SSrm_Int:
6888 case X86::VCVTSI642SSrr:
6889 case X86::VCVTSI642SSrm:
6890 case X86::VCVTSI642SSrr_Int:
6891 case X86::VCVTSI642SSrm_Int:
6892 case X86::VCVTSI2SDrr:
6893 case X86::VCVTSI2SDrm:
6894 case X86::VCVTSI2SDrr_Int:
6895 case X86::VCVTSI2SDrm_Int:
6896 case X86::VCVTSI642SDrr:
6897 case X86::VCVTSI642SDrm:
6898 case X86::VCVTSI642SDrr_Int:
6899 case X86::VCVTSI642SDrm_Int:
6901 case X86::VCVTSI2SSZrr:
6902 case X86::VCVTSI2SSZrm:
6903 case X86::VCVTSI2SSZrr_Int:
6904 case X86::VCVTSI2SSZrrb_Int:
6905 case X86::VCVTSI2SSZrm_Int:
6906 case X86::VCVTSI642SSZrr:
6907 case X86::VCVTSI642SSZrm:
6908 case X86::VCVTSI642SSZrr_Int:
6909 case X86::VCVTSI642SSZrrb_Int:
6910 case X86::VCVTSI642SSZrm_Int:
6911 case X86::VCVTSI2SDZrr:
6912 case X86::VCVTSI2SDZrm:
6913 case X86::VCVTSI2SDZrr_Int:
6914 case X86::VCVTSI2SDZrm_Int:
6915 case X86::VCVTSI642SDZrr:
6916 case X86::VCVTSI642SDZrm:
6917 case X86::VCVTSI642SDZrr_Int:
6918 case X86::VCVTSI642SDZrrb_Int:
6919 case X86::VCVTSI642SDZrm_Int:
6920 case X86::VCVTUSI2SSZrr:
6921 case X86::VCVTUSI2SSZrm:
6922 case X86::VCVTUSI2SSZrr_Int:
6923 case X86::VCVTUSI2SSZrrb_Int:
6924 case X86::VCVTUSI2SSZrm_Int:
6925 case X86::VCVTUSI642SSZrr:
6926 case X86::VCVTUSI642SSZrm:
6927 case X86::VCVTUSI642SSZrr_Int:
6928 case X86::VCVTUSI642SSZrrb_Int:
6929 case X86::VCVTUSI642SSZrm_Int:
6930 case X86::VCVTUSI2SDZrr:
6931 case X86::VCVTUSI2SDZrm:
6932 case X86::VCVTUSI2SDZrr_Int:
6933 case X86::VCVTUSI2SDZrm_Int:
6934 case X86::VCVTUSI642SDZrr:
6935 case X86::VCVTUSI642SDZrm:
6936 case X86::VCVTUSI642SDZrr_Int:
6937 case X86::VCVTUSI642SDZrrb_Int:
6938 case X86::VCVTUSI642SDZrm_Int:
6939 case X86::VCVTSI2SHZrr:
6940 case X86::VCVTSI2SHZrm:
6941 case X86::VCVTSI2SHZrr_Int:
6942 case X86::VCVTSI2SHZrrb_Int:
6943 case X86::VCVTSI2SHZrm_Int:
6944 case X86::VCVTSI642SHZrr:
6945 case X86::VCVTSI642SHZrm:
6946 case X86::VCVTSI642SHZrr_Int:
6947 case X86::VCVTSI642SHZrrb_Int:
6948 case X86::VCVTSI642SHZrm_Int:
6949 case X86::VCVTUSI2SHZrr:
6950 case X86::VCVTUSI2SHZrm:
6951 case X86::VCVTUSI2SHZrr_Int:
6952 case X86::VCVTUSI2SHZrrb_Int:
6953 case X86::VCVTUSI2SHZrm_Int:
6954 case X86::VCVTUSI642SHZrr:
6955 case X86::VCVTUSI642SHZrm:
6956 case X86::VCVTUSI642SHZrr_Int:
6957 case X86::VCVTUSI642SHZrrb_Int:
6958 case X86::VCVTUSI642SHZrm_Int:
6961 return OpNum == 1 && !ForLoadFold;
6962 case X86::VCVTSD2SSrr:
6963 case X86::VCVTSD2SSrm:
6964 case X86::VCVTSD2SSrr_Int:
6965 case X86::VCVTSD2SSrm_Int:
6966 case X86::VCVTSS2SDrr:
6967 case X86::VCVTSS2SDrm:
6968 case X86::VCVTSS2SDrr_Int:
6969 case X86::VCVTSS2SDrm_Int:
6971 case X86::VRCPSSr_Int:
6973 case X86::VRCPSSm_Int:
6974 case X86::VROUNDSDri:
6975 case X86::VROUNDSDmi:
6976 case X86::VROUNDSDri_Int:
6977 case X86::VROUNDSDmi_Int:
6978 case X86::VROUNDSSri:
6979 case X86::VROUNDSSmi:
6980 case X86::VROUNDSSri_Int:
6981 case X86::VROUNDSSmi_Int:
6982 case X86::VRSQRTSSr:
6983 case X86::VRSQRTSSr_Int:
6984 case X86::VRSQRTSSm:
6985 case X86::VRSQRTSSm_Int:
6987 case X86::VSQRTSSr_Int:
6989 case X86::VSQRTSSm_Int:
6991 case X86::VSQRTSDr_Int:
6993 case X86::VSQRTSDm_Int:
6995 case X86::VCVTSD2SSZrr:
6996 case X86::VCVTSD2SSZrr_Int:
6997 case X86::VCVTSD2SSZrrb_Int:
6998 case X86::VCVTSD2SSZrm:
6999 case X86::VCVTSD2SSZrm_Int:
7000 case X86::VCVTSS2SDZrr:
7001 case X86::VCVTSS2SDZrr_Int:
7002 case X86::VCVTSS2SDZrrb_Int:
7003 case X86::VCVTSS2SDZrm:
7004 case X86::VCVTSS2SDZrm_Int:
7005 case X86::VGETEXPSDZr:
7006 case X86::VGETEXPSDZrb:
7007 case X86::VGETEXPSDZm:
7008 case X86::VGETEXPSSZr:
7009 case X86::VGETEXPSSZrb:
7010 case X86::VGETEXPSSZm:
7011 case X86::VGETMANTSDZrri:
7012 case X86::VGETMANTSDZrrib:
7013 case X86::VGETMANTSDZrmi:
7014 case X86::VGETMANTSSZrri:
7015 case X86::VGETMANTSSZrrib:
7016 case X86::VGETMANTSSZrmi:
7017 case X86::VRNDSCALESDZrri:
7018 case X86::VRNDSCALESDZrri_Int:
7019 case X86::VRNDSCALESDZrrib_Int:
7020 case X86::VRNDSCALESDZrmi:
7021 case X86::VRNDSCALESDZrmi_Int:
7022 case X86::VRNDSCALESSZrri:
7023 case X86::VRNDSCALESSZrri_Int:
7024 case X86::VRNDSCALESSZrrib_Int:
7025 case X86::VRNDSCALESSZrmi:
7026 case X86::VRNDSCALESSZrmi_Int:
7027 case X86::VRCP14SDZrr:
7028 case X86::VRCP14SDZrm:
7029 case X86::VRCP14SSZrr:
7030 case X86::VRCP14SSZrm:
7031 case X86::VRCPSHZrr:
7032 case X86::VRCPSHZrm:
7033 case X86::VRSQRTSHZrr:
7034 case X86::VRSQRTSHZrm:
7035 case X86::VREDUCESHZrmi:
7036 case X86::VREDUCESHZrri:
7037 case X86::VREDUCESHZrrib:
7038 case X86::VGETEXPSHZr:
7039 case X86::VGETEXPSHZrb:
7040 case X86::VGETEXPSHZm:
7041 case X86::VGETMANTSHZrri:
7042 case X86::VGETMANTSHZrrib:
7043 case X86::VGETMANTSHZrmi:
7044 case X86::VRNDSCALESHZrri:
7045 case X86::VRNDSCALESHZrri_Int:
7046 case X86::VRNDSCALESHZrrib_Int:
7047 case X86::VRNDSCALESHZrmi:
7048 case X86::VRNDSCALESHZrmi_Int:
7049 case X86::VSQRTSHZr:
7050 case X86::VSQRTSHZr_Int:
7051 case X86::VSQRTSHZrb_Int:
7052 case X86::VSQRTSHZm:
7053 case X86::VSQRTSHZm_Int:
7054 case X86::VRCP28SDZr:
7055 case X86::VRCP28SDZrb:
7056 case X86::VRCP28SDZm:
7057 case X86::VRCP28SSZr:
7058 case X86::VRCP28SSZrb:
7059 case X86::VRCP28SSZm:
7060 case X86::VREDUCESSZrmi:
7061 case X86::VREDUCESSZrri:
7062 case X86::VREDUCESSZrrib:
7063 case X86::VRSQRT14SDZrr:
7064 case X86::VRSQRT14SDZrm:
7065 case X86::VRSQRT14SSZrr:
7066 case X86::VRSQRT14SSZrm:
7067 case X86::VRSQRT28SDZr:
7068 case X86::VRSQRT28SDZrb:
7069 case X86::VRSQRT28SDZm:
7070 case X86::VRSQRT28SSZr:
7071 case X86::VRSQRT28SSZrb:
7072 case X86::VRSQRT28SSZm:
7073 case X86::VSQRTSSZr:
7074 case X86::VSQRTSSZr_Int:
7075 case X86::VSQRTSSZrb_Int:
7076 case X86::VSQRTSSZm:
7077 case X86::VSQRTSSZm_Int:
7078 case X86::VSQRTSDZr:
7079 case X86::VSQRTSDZr_Int:
7080 case X86::VSQRTSDZrb_Int:
7081 case X86::VSQRTSDZm:
7082 case X86::VSQRTSDZm_Int:
7083 case X86::VCVTSD2SHZrr:
7084 case X86::VCVTSD2SHZrr_Int:
7085 case X86::VCVTSD2SHZrrb_Int:
7086 case X86::VCVTSD2SHZrm:
7087 case X86::VCVTSD2SHZrm_Int:
7088 case X86::VCVTSS2SHZrr:
7089 case X86::VCVTSS2SHZrr_Int:
7090 case X86::VCVTSS2SHZrrb_Int:
7091 case X86::VCVTSS2SHZrm:
7092 case X86::VCVTSS2SHZrm_Int:
7093 case X86::VCVTSH2SDZrr:
7094 case X86::VCVTSH2SDZrr_Int:
7095 case X86::VCVTSH2SDZrrb_Int:
7096 case X86::VCVTSH2SDZrm:
7097 case X86::VCVTSH2SDZrm_Int:
7098 case X86::VCVTSH2SSZrr:
7099 case X86::VCVTSH2SSZrr_Int:
7100 case X86::VCVTSH2SSZrrb_Int:
7101 case X86::VCVTSH2SSZrm:
7102 case X86::VCVTSH2SSZrm_Int:
7104 case X86::VMOVSSZrrk:
7105 case X86::VMOVSDZrrk:
7106 return OpNum == 3 && !ForLoadFold;
7107 case X86::VMOVSSZrrkz:
7108 case X86::VMOVSDZrrkz:
7109 return OpNum == 2 && !ForLoadFold;
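// breakPartialRegDependency: insert a dependency-breaking idiom (XORPS /
// VPXORD of the register with itself, or a 32-bit self-move for GPRs) before
// the instruction so the partial or undef register read does not stall on the
// register's old value.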
7141   Register Reg = MI.getOperand(OpNum).getReg();
7143   if (MI.killsRegister(Reg, TRI))
7146   if (X86::VR128RegClass.contains(Reg)) {
7149     unsigned Opc = Subtarget.hasAVX() ? X86::VXORPSrr : X86::XORPSrr;
7153     MI.addRegisterKilled(Reg, TRI, true);
7154   } else if (X86::VR256RegClass.contains(Reg)) {
7157     Register XReg = TRI->getSubReg(Reg, X86::sub_xmm);
7162     MI.addRegisterKilled(Reg, TRI, true);
7163   } else if (X86::VR128XRegClass.contains(Reg)) {
7165     if (!Subtarget.hasVLX())
7168     BuildMI(*MI.getParent(), MI, MI.getDebugLoc(), get(X86::VPXORDZ128rr), Reg)
7171     MI.addRegisterKilled(Reg, TRI, true);
7172   } else if (X86::VR256XRegClass.contains(Reg) ||
7173              X86::VR512RegClass.contains(Reg)) {
7175     if (!Subtarget.hasVLX())
7179     Register XReg = TRI->getSubReg(Reg, X86::sub_xmm);
7180     BuildMI(*MI.getParent(), MI, MI.getDebugLoc(), get(X86::VPXORDZ128rr), XReg)
7184     MI.addRegisterKilled(Reg, TRI, true);
7185   } else if (X86::GR64RegClass.contains(Reg)) {
7188     Register XReg = TRI->getSubReg(Reg, X86::sub_32bit);
7193     MI.addRegisterKilled(Reg, TRI, true);
7194   } else if (X86::GR32RegClass.contains(Reg)) {
7198     MI.addRegisterKilled(Reg, TRI, true);
7199   } else if ((X86::GR16RegClass.contains(Reg) ||
7208     if (!MI.definesRegister(SuperReg, nullptr))
7214 int PtrOffset = 0) {
7215   unsigned NumAddrOps = MOs.size();
7217   if (NumAddrOps < 4) {
7219     for (unsigned i = 0; i != NumAddrOps; ++i)
7225     assert(MOs.size() == 5 && "Unexpected memory operand list length");
7226     for (unsigned i = 0; i != NumAddrOps; ++i) {
7228       if (i == 3 && PtrOffset != 0) {
7249   if (!Reg.isVirtual())
7252   auto *NewRC = MRI.constrainRegClass(
7256     dbgs() << "WARNING: Unable to update register constraint for operand "
7257            << Idx << " of instruction:\n";
7271       MF.CreateMachineInstr(TII.get(Opcode), MI.getDebugLoc(), true);
7276   unsigned NumOps = MI.getDesc().getNumOperands() - 2;
7277   for (unsigned i = 0; i != NumOps; ++i) {
7287   MBB->insert(InsertPt, NewMI);
7296                               int PtrOffset = 0) {
7299       MF.CreateMachineInstr(TII.get(Opcode), MI.getDebugLoc(), true);
7302   for (unsigned i = 0, e = MI.getNumOperands(); i != e; ++i) {
7305       assert(MO.isReg() && "Expected to fold into reg operand!");
7319   MBB->insert(InsertPt, NewMI);
7329                 MI.getDebugLoc(), TII.get(Opcode));
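// foldMemoryOperandCustom: handle folds that also change the opcode or
// immediate, e.g. INSERTPSrri reading from memory becomes INSERTPSrmi with a
// rewritten lane immediate, and MOVHLPS/UNPCKLPD become MOVLPS/MOVHPD loads.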
7338   switch (MI.getOpcode()) {
7339   case X86::INSERTPSrri:
7340   case X86::VINSERTPSrri:
7341   case X86::VINSERTPSZrri:
7345     unsigned Imm = MI.getOperand(MI.getNumOperands() - 1).getImm();
7346     unsigned ZMask = Imm & 15;
7347     unsigned DstIdx = (Imm >> 4) & 3;
7348     unsigned SrcIdx = (Imm >> 6) & 3;
7351     const TargetRegisterClass *RC = getRegClass(MI.getDesc(), OpNum, &RI, MF);
7352     unsigned RCSize = TRI.getRegSizeInBits(*RC) / 8;
7353     if ((Size == 0 || Size >= 16) && RCSize >= 16 &&
7354         (MI.getOpcode() != X86::INSERTPSrri || Alignment >= Align(4))) {
7355       int PtrOffset = SrcIdx * 4;
7356       unsigned NewImm = (DstIdx << 4) | ZMask;
7357       unsigned NewOpCode =
7358           (MI.getOpcode() == X86::VINSERTPSZrri)  ? X86::VINSERTPSZrmi
7359           : (MI.getOpcode() == X86::VINSERTPSrri) ? X86::VINSERTPSrmi
                                                      : X86::INSERTPSrmi;
7361       MachineInstr *NewMI =
7362           fuseInst(MF, NewOpCode, OpNum, MOs, InsertPt, MI, *this, PtrOffset);
7368   case X86::MOVHLPSrr:
7369   case X86::VMOVHLPSrr:
7370   case X86::VMOVHLPSZrr:
7376     const TargetRegisterClass *RC = getRegClass(MI.getDesc(), OpNum, &RI, MF);
7377     unsigned RCSize = TRI.getRegSizeInBits(*RC) / 8;
7378     if ((Size == 0 || Size >= 16) && RCSize >= 16 && Alignment >= Align(8)) {
7379       unsigned NewOpCode =
7380           (MI.getOpcode() == X86::VMOVHLPSZrr)  ? X86::VMOVLPSZ128rm
7381           : (MI.getOpcode() == X86::VMOVHLPSrr) ? X86::VMOVLPSrm
                                                    : X86::MOVLPSrm;
7383       MachineInstr *NewMI =
7384           fuseInst(MF, NewOpCode, OpNum, MOs, InsertPt, MI, *this, 8);
7389   case X86::UNPCKLPDrr:
7395     const TargetRegisterClass *RC = getRegClass(MI.getDesc(), OpNum, &RI, MF);
7396     unsigned RCSize = TRI.getRegSizeInBits(*RC) / 8;
7397     if ((Size == 0 || Size >= 16) && RCSize >= 16 && Alignment < Align(16)) {
7398       MachineInstr *NewMI =
7399           fuseInst(MF, X86::MOVHPDrm, OpNum, MOs, InsertPt, MI, *this);
7406   makeM0Inst(*this, (Size == 4) ? X86::MOV32mi : X86::MOV64mi32, MOs,
7418       !MI.getOperand(1).isReg())
7426   if (MI.getOperand(1).isUndef())
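// commuteOperandsForFold: try to commute the instruction so that the operand
// we want to fold a load into can be folded; returns the operand index to use
// after the (possible) commute.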
7435                                                unsigned Idx1) const {
7436   unsigned Idx2 = CommuteAnyOperandIndex;
7440   bool HasDef = MI.getDesc().getNumDefs();
7442   Register Reg1 = MI.getOperand(Idx1).getReg();
7443   Register Reg2 = MI.getOperand(Idx2).getReg();
7444   bool Tied1 = 0 == MI.getDesc().getOperandConstraint(Idx1, MCOI::TIED_TO);
7445   bool Tied2 = 0 == MI.getDesc().getOperandConstraint(Idx2, MCOI::TIED_TO);
7449   if ((HasDef && Reg0 == Reg1 && Tied1) || (HasDef && Reg0 == Reg2 && Tied2))
7452   return commuteInstruction(MI, false, Idx1, Idx2) ? Idx2 : Idx1;
7457     dbgs() << "We failed to fuse operand " << Idx << " in " << MI;
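// foldMemoryOperandImpl: the main entry point for turning a register operand
// into a memory operand using the generated folding tables, with special
// handling for two-address instructions, MOV32r0, and narrowing MOV64rm to
// MOV32rm when only 32 bits are actually loaded.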
7463     unsigned Size, Align Alignment, bool AllowCommute) const {
7464   bool isSlowTwoMemOps = Subtarget.slowTwoMemOps();
7465   unsigned Opc = MI.getOpcode();
7471       (Opc == X86::CALL32r || Opc == X86::CALL64r ||
7472        Opc == X86::CALL64r_ImpCall || Opc == X86::PUSH16r ||
7473        Opc == X86::PUSH32r || Opc == X86::PUSH64r))
7482   unsigned NumOps = MI.getDesc().getNumOperands();
7483   bool IsTwoAddr = NumOps > 1 && OpNum < 2 && MI.getOperand(0).isReg() &&
7484                    MI.getOperand(1).isReg() &&
7485                    MI.getOperand(0).getReg() == MI.getOperand(1).getReg();
7489   if (Opc == X86::ADD32ri &&
7498       Opc != X86::ADD64rr)
7503   if (MI.isCall() && MI.getCFIType())
7507   if (auto *CustomMI = foldMemoryOperandCustom(MF, MI, OpNum, MOs, InsertPt,
7523   unsigned Opcode = I->DstOp;
7527   bool NarrowToMOV32rm = false;
7531     unsigned RCSize = TRI.getRegSizeInBits(*RC) / 8;
7539       if (Opcode != X86::MOV64rm || RCSize != 8 || Size != 4)
7541       if (MI.getOperand(0).getSubReg() || MI.getOperand(1).getSubReg())
7543       Opcode = X86::MOV32rm;
7544       NarrowToMOV32rm = true;
7554                 : fuseInst(MF, Opcode, OpNum, MOs, InsertPt, MI, *this);
7556   if (NarrowToMOV32rm) {
7572     unsigned CommuteOpIdx2 = commuteOperandsForFold(MI, OpNum);
7573     if (CommuteOpIdx2 == OpNum) {
7583     commuteInstruction(MI, false, OpNum, CommuteOpIdx2);
7605   for (auto Op : Ops) {
7610     if (MI.getOpcode() == X86::MOV32r0 && SubReg == X86::sub_32bit)
7621   if (!RI.hasStackRealignment(MF))
7623         std::min(Alignment, Subtarget.getFrameLowering()->getStackAlign());
7628                                  Size, Alignment, true);
7630   if (Ops.size() == 2 && Ops[0] == 0 && Ops[1] == 1) {
7631     unsigned NewOpc = 0;
7632     unsigned RCSize = 0;
7633     unsigned Opc = MI.getOpcode();
7640       NewOpc = X86::CMP8ri;
7644       NewOpc = X86::CMP16ri;
7648       NewOpc = X86::CMP32ri;
7652       NewOpc = X86::CMP64ri32;
7661     MI.setDesc(get(NewOpc));
7662     MI.getOperand(1).ChangeToImmediate(0);
7663   } else if (Ops.size() != 1)
7691   unsigned RegSize = TRI.getRegSizeInBits(*RC);
7693   if ((Opc == X86::MOVSSrm || Opc == X86::VMOVSSrm || Opc == X86::VMOVSSZrm ||
7694        Opc == X86::MOVSSrm_alt || Opc == X86::VMOVSSrm_alt ||
7695        Opc == X86::VMOVSSZrm_alt) &&
7701 case X86::CVTSS2SDrr_Int:
7702 case X86::VCVTSS2SDrr_Int:
7703 case X86::VCVTSS2SDZrr_Int:
7704 case X86::VCVTSS2SDZrrk_Int:
7705 case X86::VCVTSS2SDZrrkz_Int:
7706 case X86::CVTSS2SIrr_Int:
7707 case X86::CVTSS2SI64rr_Int:
7708 case X86::VCVTSS2SIrr_Int:
7709 case X86::VCVTSS2SI64rr_Int:
7710 case X86::VCVTSS2SIZrr_Int:
7711 case X86::VCVTSS2SI64Zrr_Int:
7712 case X86::CVTTSS2SIrr_Int:
7713 case X86::CVTTSS2SI64rr_Int:
7714 case X86::VCVTTSS2SIrr_Int:
7715 case X86::VCVTTSS2SI64rr_Int:
7716 case X86::VCVTTSS2SIZrr_Int:
7717 case X86::VCVTTSS2SI64Zrr_Int:
7718 case X86::VCVTSS2USIZrr_Int:
7719 case X86::VCVTSS2USI64Zrr_Int:
7720 case X86::VCVTTSS2USIZrr_Int:
7721 case X86::VCVTTSS2USI64Zrr_Int:
7722 case X86::RCPSSr_Int:
7723 case X86::VRCPSSr_Int:
7724 case X86::RSQRTSSr_Int:
7725 case X86::VRSQRTSSr_Int:
7726 case X86::ROUNDSSri_Int:
7727 case X86::VROUNDSSri_Int:
7728 case X86::COMISSrr_Int:
7729 case X86::VCOMISSrr_Int:
7730 case X86::VCOMISSZrr_Int:
7731 case X86::UCOMISSrr_Int:
7732 case X86::VUCOMISSrr_Int:
7733 case X86::VUCOMISSZrr_Int:
7734 case X86::ADDSSrr_Int:
7735 case X86::VADDSSrr_Int:
7736 case X86::VADDSSZrr_Int:
7737 case X86::CMPSSrri_Int:
7738 case X86::VCMPSSrri_Int:
7739 case X86::VCMPSSZrri_Int:
7740 case X86::DIVSSrr_Int:
7741 case X86::VDIVSSrr_Int:
7742 case X86::VDIVSSZrr_Int:
7743 case X86::MAXSSrr_Int:
7744 case X86::VMAXSSrr_Int:
7745 case X86::VMAXSSZrr_Int:
7746 case X86::MINSSrr_Int:
7747 case X86::VMINSSrr_Int:
7748 case X86::VMINSSZrr_Int:
7749 case X86::MULSSrr_Int:
7750 case X86::VMULSSrr_Int:
7751 case X86::VMULSSZrr_Int:
7752 case X86::SQRTSSr_Int:
7753 case X86::VSQRTSSr_Int:
7754 case X86::VSQRTSSZr_Int:
7755 case X86::SUBSSrr_Int:
7756 case X86::VSUBSSrr_Int:
7757 case X86::VSUBSSZrr_Int:
7758 case X86::VADDSSZrrk_Int:
7759 case X86::VADDSSZrrkz_Int:
7760 case X86::VCMPSSZrrik_Int:
7761 case X86::VDIVSSZrrk_Int:
7762 case X86::VDIVSSZrrkz_Int:
7763 case X86::VMAXSSZrrk_Int:
7764 case X86::VMAXSSZrrkz_Int:
7765 case X86::VMINSSZrrk_Int:
7766 case X86::VMINSSZrrkz_Int:
7767 case X86::VMULSSZrrk_Int:
7768 case X86::VMULSSZrrkz_Int:
7769 case X86::VSQRTSSZrk_Int:
7770 case X86::VSQRTSSZrkz_Int:
7771 case X86::VSUBSSZrrk_Int:
7772 case X86::VSUBSSZrrkz_Int:
7773 case X86::VFMADDSS4rr_Int:
7774 case X86::VFNMADDSS4rr_Int:
7775 case X86::VFMSUBSS4rr_Int:
7776 case X86::VFNMSUBSS4rr_Int:
7777 case X86::VFMADD132SSr_Int:
7778 case X86::VFNMADD132SSr_Int:
7779 case X86::VFMADD213SSr_Int:
7780 case X86::VFNMADD213SSr_Int:
7781 case X86::VFMADD231SSr_Int:
7782 case X86::VFNMADD231SSr_Int:
7783 case X86::VFMSUB132SSr_Int:
7784 case X86::VFNMSUB132SSr_Int:
7785 case X86::VFMSUB213SSr_Int:
7786 case X86::VFNMSUB213SSr_Int:
7787 case X86::VFMSUB231SSr_Int:
7788 case X86::VFNMSUB231SSr_Int:
7789 case X86::VFMADD132SSZr_Int:
7790 case X86::VFNMADD132SSZr_Int:
7791 case X86::VFMADD213SSZr_Int:
7792 case X86::VFNMADD213SSZr_Int:
7793 case X86::VFMADD231SSZr_Int:
7794 case X86::VFNMADD231SSZr_Int:
7795 case X86::VFMSUB132SSZr_Int:
7796 case X86::VFNMSUB132SSZr_Int:
7797 case X86::VFMSUB213SSZr_Int:
7798 case X86::VFNMSUB213SSZr_Int:
7799 case X86::VFMSUB231SSZr_Int:
7800 case X86::VFNMSUB231SSZr_Int:
7801 case X86::VFMADD132SSZrk_Int:
7802 case X86::VFNMADD132SSZrk_Int:
7803 case X86::VFMADD213SSZrk_Int:
7804 case X86::VFNMADD213SSZrk_Int:
7805 case X86::VFMADD231SSZrk_Int:
7806 case X86::VFNMADD231SSZrk_Int:
7807 case X86::VFMSUB132SSZrk_Int:
7808 case X86::VFNMSUB132SSZrk_Int:
7809 case X86::VFMSUB213SSZrk_Int:
7810 case X86::VFNMSUB213SSZrk_Int:
7811 case X86::VFMSUB231SSZrk_Int:
7812 case X86::VFNMSUB231SSZrk_Int:
7813 case X86::VFMADD132SSZrkz_Int:
7814 case X86::VFNMADD132SSZrkz_Int:
7815 case X86::VFMADD213SSZrkz_Int:
7816 case X86::VFNMADD213SSZrkz_Int:
7817 case X86::VFMADD231SSZrkz_Int:
7818 case X86::VFNMADD231SSZrkz_Int:
7819 case X86::VFMSUB132SSZrkz_Int:
7820 case X86::VFNMSUB132SSZrkz_Int:
7821 case X86::VFMSUB213SSZrkz_Int:
7822 case X86::VFNMSUB213SSZrkz_Int:
7823 case X86::VFMSUB231SSZrkz_Int:
7824 case X86::VFNMSUB231SSZrkz_Int:
7825 case X86::VFIXUPIMMSSZrri:
7826 case X86::VFIXUPIMMSSZrrik:
7827 case X86::VFIXUPIMMSSZrrikz:
7828 case X86::VFPCLASSSSZri:
7829 case X86::VFPCLASSSSZrik:
7830 case X86::VGETEXPSSZr:
7831 case X86::VGETEXPSSZrk:
7832 case X86::VGETEXPSSZrkz:
7833 case X86::VGETMANTSSZrri:
7834 case X86::VGETMANTSSZrrik:
7835 case X86::VGETMANTSSZrrikz:
7836 case X86::VRANGESSZrri:
7837 case X86::VRANGESSZrrik:
7838 case X86::VRANGESSZrrikz:
7839 case X86::VRCP14SSZrr:
7840 case X86::VRCP14SSZrrk:
7841 case X86::VRCP14SSZrrkz:
7842 case X86::VRCP28SSZr:
7843 case X86::VRCP28SSZrk:
7844 case X86::VRCP28SSZrkz:
7845 case X86::VREDUCESSZrri:
7846 case X86::VREDUCESSZrrik:
7847 case X86::VREDUCESSZrrikz:
7848 case X86::VRNDSCALESSZrri_Int:
7849 case X86::VRNDSCALESSZrrik_Int:
7850 case X86::VRNDSCALESSZrrikz_Int:
7851 case X86::VRSQRT14SSZrr:
7852 case X86::VRSQRT14SSZrrk:
7853 case X86::VRSQRT14SSZrrkz:
7854 case X86::VRSQRT28SSZr:
7855 case X86::VRSQRT28SSZrk:
7856 case X86::VRSQRT28SSZrkz:
7857 case X86::VSCALEFSSZrr:
7858 case X86::VSCALEFSSZrrk:
7859 case X86::VSCALEFSSZrrkz:
7866   if ((Opc == X86::MOVSDrm || Opc == X86::VMOVSDrm || Opc == X86::VMOVSDZrm ||
7867        Opc == X86::MOVSDrm_alt || Opc == X86::VMOVSDrm_alt ||
7868        Opc == X86::VMOVSDZrm_alt) &&
7874 case X86::CVTSD2SSrr_Int:
7875 case X86::VCVTSD2SSrr_Int:
7876 case X86::VCVTSD2SSZrr_Int:
7877 case X86::VCVTSD2SSZrrk_Int:
7878 case X86::VCVTSD2SSZrrkz_Int:
7879 case X86::CVTSD2SIrr_Int:
7880 case X86::CVTSD2SI64rr_Int:
7881 case X86::VCVTSD2SIrr_Int:
7882 case X86::VCVTSD2SI64rr_Int:
7883 case X86::VCVTSD2SIZrr_Int:
7884 case X86::VCVTSD2SI64Zrr_Int:
7885 case X86::CVTTSD2SIrr_Int:
7886 case X86::CVTTSD2SI64rr_Int:
7887 case X86::VCVTTSD2SIrr_Int:
7888 case X86::VCVTTSD2SI64rr_Int:
7889 case X86::VCVTTSD2SIZrr_Int:
7890 case X86::VCVTTSD2SI64Zrr_Int:
7891 case X86::VCVTSD2USIZrr_Int:
7892 case X86::VCVTSD2USI64Zrr_Int:
7893 case X86::VCVTTSD2USIZrr_Int:
7894 case X86::VCVTTSD2USI64Zrr_Int:
7895 case X86::ROUNDSDri_Int:
7896 case X86::VROUNDSDri_Int:
7897 case X86::COMISDrr_Int:
7898 case X86::VCOMISDrr_Int:
7899 case X86::VCOMISDZrr_Int:
7900 case X86::UCOMISDrr_Int:
7901 case X86::VUCOMISDrr_Int:
7902 case X86::VUCOMISDZrr_Int:
7903 case X86::ADDSDrr_Int:
7904 case X86::VADDSDrr_Int:
7905 case X86::VADDSDZrr_Int:
7906 case X86::CMPSDrri_Int:
7907 case X86::VCMPSDrri_Int:
7908 case X86::VCMPSDZrri_Int:
7909 case X86::DIVSDrr_Int:
7910 case X86::VDIVSDrr_Int:
7911 case X86::VDIVSDZrr_Int:
7912 case X86::MAXSDrr_Int:
7913 case X86::VMAXSDrr_Int:
7914 case X86::VMAXSDZrr_Int:
7915 case X86::MINSDrr_Int:
7916 case X86::VMINSDrr_Int:
7917 case X86::VMINSDZrr_Int:
7918 case X86::MULSDrr_Int:
7919 case X86::VMULSDrr_Int:
7920 case X86::VMULSDZrr_Int:
7921 case X86::SQRTSDr_Int:
7922 case X86::VSQRTSDr_Int:
7923 case X86::VSQRTSDZr_Int:
7924 case X86::SUBSDrr_Int:
7925 case X86::VSUBSDrr_Int:
7926 case X86::VSUBSDZrr_Int:
7927 case X86::VADDSDZrrk_Int:
7928 case X86::VADDSDZrrkz_Int:
7929 case X86::VCMPSDZrrik_Int:
7930 case X86::VDIVSDZrrk_Int:
7931 case X86::VDIVSDZrrkz_Int:
7932 case X86::VMAXSDZrrk_Int:
7933 case X86::VMAXSDZrrkz_Int:
7934 case X86::VMINSDZrrk_Int:
7935 case X86::VMINSDZrrkz_Int:
7936 case X86::VMULSDZrrk_Int:
7937 case X86::VMULSDZrrkz_Int:
7938 case X86::VSQRTSDZrk_Int:
7939 case X86::VSQRTSDZrkz_Int:
7940 case X86::VSUBSDZrrk_Int:
7941 case X86::VSUBSDZrrkz_Int:
7942 case X86::VFMADDSD4rr_Int:
7943 case X86::VFNMADDSD4rr_Int:
7944 case X86::VFMSUBSD4rr_Int:
7945 case X86::VFNMSUBSD4rr_Int:
7946 case X86::VFMADD132SDr_Int:
7947 case X86::VFNMADD132SDr_Int:
7948 case X86::VFMADD213SDr_Int:
7949 case X86::VFNMADD213SDr_Int:
7950 case X86::VFMADD231SDr_Int:
7951 case X86::VFNMADD231SDr_Int:
7952 case X86::VFMSUB132SDr_Int:
7953 case X86::VFNMSUB132SDr_Int:
7954 case X86::VFMSUB213SDr_Int:
7955 case X86::VFNMSUB213SDr_Int:
7956 case X86::VFMSUB231SDr_Int:
7957 case X86::VFNMSUB231SDr_Int:
7958 case X86::VFMADD132SDZr_Int:
7959 case X86::VFNMADD132SDZr_Int:
7960 case X86::VFMADD213SDZr_Int:
7961 case X86::VFNMADD213SDZr_Int:
7962 case X86::VFMADD231SDZr_Int:
7963 case X86::VFNMADD231SDZr_Int:
7964 case X86::VFMSUB132SDZr_Int:
7965 case X86::VFNMSUB132SDZr_Int:
7966 case X86::VFMSUB213SDZr_Int:
7967 case X86::VFNMSUB213SDZr_Int:
7968 case X86::VFMSUB231SDZr_Int:
7969 case X86::VFNMSUB231SDZr_Int:
7970 case X86::VFMADD132SDZrk_Int:
7971 case X86::VFNMADD132SDZrk_Int:
7972 case X86::VFMADD213SDZrk_Int:
7973 case X86::VFNMADD213SDZrk_Int:
7974 case X86::VFMADD231SDZrk_Int:
7975 case X86::VFNMADD231SDZrk_Int:
7976 case X86::VFMSUB132SDZrk_Int:
7977 case X86::VFNMSUB132SDZrk_Int:
7978 case X86::VFMSUB213SDZrk_Int:
7979 case X86::VFNMSUB213SDZrk_Int:
7980 case X86::VFMSUB231SDZrk_Int:
7981 case X86::VFNMSUB231SDZrk_Int:
7982 case X86::VFMADD132SDZrkz_Int:
7983 case X86::VFNMADD132SDZrkz_Int:
7984 case X86::VFMADD213SDZrkz_Int:
7985 case X86::VFNMADD213SDZrkz_Int:
7986 case X86::VFMADD231SDZrkz_Int:
7987 case X86::VFNMADD231SDZrkz_Int:
7988 case X86::VFMSUB132SDZrkz_Int:
7989 case X86::VFNMSUB132SDZrkz_Int:
7990 case X86::VFMSUB213SDZrkz_Int:
7991 case X86::VFNMSUB213SDZrkz_Int:
7992 case X86::VFMSUB231SDZrkz_Int:
7993 case X86::VFNMSUB231SDZrkz_Int:
7994 case X86::VFIXUPIMMSDZrri:
7995 case X86::VFIXUPIMMSDZrrik:
7996 case X86::VFIXUPIMMSDZrrikz:
7997 case X86::VFPCLASSSDZri:
7998 case X86::VFPCLASSSDZrik:
7999 case X86::VGETEXPSDZr:
8000 case X86::VGETEXPSDZrk:
8001 case X86::VGETEXPSDZrkz:
8002 case X86::VGETMANTSDZrri:
8003 case X86::VGETMANTSDZrrik:
8004 case X86::VGETMANTSDZrrikz:
8005 case X86::VRANGESDZrri:
8006 case X86::VRANGESDZrrik:
8007 case X86::VRANGESDZrrikz:
8008 case X86::VRCP14SDZrr:
8009 case X86::VRCP14SDZrrk:
8010 case X86::VRCP14SDZrrkz:
8011 case X86::VRCP28SDZr:
8012 case X86::VRCP28SDZrk:
8013 case X86::VRCP28SDZrkz:
8014 case X86::VREDUCESDZrri:
8015 case X86::VREDUCESDZrrik:
8016 case X86::VREDUCESDZrrikz:
8017 case X86::VRNDSCALESDZrri_Int:
8018 case X86::VRNDSCALESDZrrik_Int:
8019 case X86::VRNDSCALESDZrrikz_Int:
8020 case X86::VRSQRT14SDZrr:
8021 case X86::VRSQRT14SDZrrk:
8022 case X86::VRSQRT14SDZrrkz:
8023 case X86::VRSQRT28SDZr:
8024 case X86::VRSQRT28SDZrk:
8025 case X86::VRSQRT28SDZrkz:
8026 case X86::VSCALEFSDZrr:
8027 case X86::VSCALEFSDZrrk:
8028 case X86::VSCALEFSDZrrkz:
8035   if ((Opc == X86::VMOVSHZrm || Opc == X86::VMOVSHZrm_alt) && RegSize > 16) {
8040 case X86::VADDSHZrr_Int:
8041 case X86::VCMPSHZrri_Int:
8042 case X86::VDIVSHZrr_Int:
8043 case X86::VMAXSHZrr_Int:
8044 case X86::VMINSHZrr_Int:
8045 case X86::VMULSHZrr_Int:
8046 case X86::VSUBSHZrr_Int:
8047 case X86::VADDSHZrrk_Int:
8048 case X86::VADDSHZrrkz_Int:
8049 case X86::VCMPSHZrrik_Int:
8050 case X86::VDIVSHZrrk_Int:
8051 case X86::VDIVSHZrrkz_Int:
8052 case X86::VMAXSHZrrk_Int:
8053 case X86::VMAXSHZrrkz_Int:
8054 case X86::VMINSHZrrk_Int:
8055 case X86::VMINSHZrrkz_Int:
8056 case X86::VMULSHZrrk_Int:
8057 case X86::VMULSHZrrkz_Int:
8058 case X86::VSUBSHZrrk_Int:
8059 case X86::VSUBSHZrrkz_Int:
8060 case X86::VFMADD132SHZr_Int:
8061 case X86::VFNMADD132SHZr_Int:
8062 case X86::VFMADD213SHZr_Int:
8063 case X86::VFNMADD213SHZr_Int:
8064 case X86::VFMADD231SHZr_Int:
8065 case X86::VFNMADD231SHZr_Int:
8066 case X86::VFMSUB132SHZr_Int:
8067 case X86::VFNMSUB132SHZr_Int:
8068 case X86::VFMSUB213SHZr_Int:
8069 case X86::VFNMSUB213SHZr_Int:
8070 case X86::VFMSUB231SHZr_Int:
8071 case X86::VFNMSUB231SHZr_Int:
8072 case X86::VFMADD132SHZrk_Int:
8073 case X86::VFNMADD132SHZrk_Int:
8074 case X86::VFMADD213SHZrk_Int:
8075 case X86::VFNMADD213SHZrk_Int:
8076 case X86::VFMADD231SHZrk_Int:
8077 case X86::VFNMADD231SHZrk_Int:
8078 case X86::VFMSUB132SHZrk_Int:
8079 case X86::VFNMSUB132SHZrk_Int:
8080 case X86::VFMSUB213SHZrk_Int:
8081 case X86::VFNMSUB213SHZrk_Int:
8082 case X86::VFMSUB231SHZrk_Int:
8083 case X86::VFNMSUB231SHZrk_Int:
8084 case X86::VFMADD132SHZrkz_Int:
8085 case X86::VFNMADD132SHZrkz_Int:
8086 case X86::VFMADD213SHZrkz_Int:
8087 case X86::VFNMADD213SHZrkz_Int:
8088 case X86::VFMADD231SHZrkz_Int:
8089 case X86::VFNMADD231SHZrkz_Int:
8090 case X86::VFMSUB132SHZrkz_Int:
8091 case X86::VFNMSUB132SHZrkz_Int:
8092 case X86::VFMSUB213SHZrkz_Int:
8093 case X86::VFNMSUB213SHZrkz_Int:
8094 case X86::VFMSUB231SHZrkz_Int:
8095 case X86::VFNMSUB231SHZrkz_Int:
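// Likewise for the FP16 *_Int opcodes above: they presumably consume more of
// the source vector than a scalar VMOVSH load would define, so such loads are
// not folded into them either.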
8112 for (auto Op : Ops) {
8113   if (MI.getOperand(Op).getSubReg())
8151 case X86::AVX512_512_SET0:
8152 case X86::AVX512_512_SETALLONES:
8153   Alignment = Align(64);
8155 case X86::AVX2_SETALLONES:
8156 case X86::AVX1_SETALLONES:
8158 case X86::AVX512_256_SET0:
8159   Alignment = Align(32);
8162 case X86::V_SETALLONES:
8163 case X86::AVX512_128_SET0:
8164 case X86::FsFLD0F128:
8165 case X86::AVX512_FsFLD0F128:
8166   Alignment = Align(16);
8170 case X86::AVX512_FsFLD0SD:
8171   Alignment = Align(8);
8174 case X86::AVX512_FsFLD0SS:
8175   Alignment = Align(4);
8178 case X86::AVX512_FsFLD0SH:
8179   Alignment = Align(2);
8184 if (Ops.size() == 2 && Ops[0] == 0 && Ops[1] == 1) {
8185   unsigned NewOpc = 0;
8186   switch (MI.getOpcode()) {
8190     NewOpc = X86::CMP8ri;
8193     NewOpc = X86::CMP16ri;
8196     NewOpc = X86::CMP32ri;
8199     NewOpc = X86::CMP64ri32;
8203   MI.setDesc(get(NewOpc));
8204   MI.getOperand(1).ChangeToImmediate(0);
8205 } else if (Ops.size() != 1)
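// The all-zeros / all-ones pseudos listed below are presumably folded by
// materializing the constant in the constant pool and rewriting the
// instruction to load from it; in PIC mode this relies on the PIC base
// register handled further down.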
8217 case X86::V_SETALLONES:
8218 case X86::AVX2_SETALLONES:
8219 case X86::AVX1_SETALLONES:
8221 case X86::AVX512_128_SET0:
8222 case X86::AVX512_256_SET0:
8223 case X86::AVX512_512_SET0:
8224 case X86::AVX512_512_SETALLONES:
8226 case X86::AVX512_FsFLD0SH:
8228 case X86::AVX512_FsFLD0SD:
8230 case X86::AVX512_FsFLD0SS:
8231 case X86::FsFLD0F128:
8232 case X86::AVX512_FsFLD0F128: {
8241 unsigned PICBase = 0;
8244 if (Subtarget.is64Bit()) {
8257 bool IsAllOnes = false;
8260 case X86::AVX512_FsFLD0SS:
8264 case X86::AVX512_FsFLD0SD:
8267 case X86::FsFLD0F128:
8268 case X86::AVX512_FsFLD0F128:
8272 case X86::AVX512_FsFLD0SH:
8275 case X86::AVX512_512_SETALLONES:
8278 case X86::AVX512_512_SET0:
8282 case X86::AVX1_SETALLONES:
8283 case X86::AVX2_SETALLONES:
8286 case X86::AVX512_256_SET0:
8296 case X86::V_SETALLONES:
8300 case X86::AVX512_128_SET0:
8318 case X86::VPBROADCASTBZ128rm:
8319 case X86::VPBROADCASTBZ256rm:
8320 case X86::VPBROADCASTBZrm:
8321 case X86::VBROADCASTF32X2Z256rm:
8322 case X86::VBROADCASTF32X2Zrm:
8323 case X86::VBROADCASTI32X2Z128rm:
8324 case X86::VBROADCASTI32X2Z256rm:
8325 case X86::VBROADCASTI32X2Zrm:
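// FOLD_BROADCAST (defined just below) appears to copy the address operands of
// the broadcast load and re-attempt the fold as an embedded-broadcast memory
// operand of the given element width.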
8329#define FOLD_BROADCAST(SIZE) \
8330 MOs.append(LoadMI.operands_begin() + NumOps - X86::AddrNumOperands, \
8331 LoadMI.operands_begin() + NumOps); \
8332 return foldMemoryBroadcast(MF, MI, Ops[0], MOs, InsertPt, SIZE, \
8334 case X86::VPBROADCASTWZ128rm:
8335 case X86::VPBROADCASTWZ256rm:
8336 case X86::VPBROADCASTWZrm:
8338 case X86::VPBROADCASTDZ128rm:
8339 case X86::VPBROADCASTDZ256rm:
8340 case X86::VPBROADCASTDZrm:
8341 case X86::VBROADCASTSSZ128rm:
8342 case X86::VBROADCASTSSZ256rm:
8343 case X86::VBROADCASTSSZrm:
8345 case X86::VPBROADCASTQZ128rm:
8346 case X86::VPBROADCASTQZ256rm:
8347 case X86::VPBROADCASTQZrm:
8348 case X86::VBROADCASTSDZ256rm:
8349 case X86::VBROADCASTSDZrm:
8362 0, Alignment, true);
8369 unsigned BitsSize, bool AllowCommute) const {
8373 ? fuseInst(MF, I->DstOp, OpNum, MOs, InsertPt, MI, *this)
8379 unsigned CommuteOpIdx2 = commuteOperandsForFold(MI, OpNum);
8380 if (CommuteOpIdx2 == OpNum) {
8385 foldMemoryBroadcast(MF, MI, CommuteOpIdx2, MOs, InsertPt, BitsSize,
8390 commuteInstruction(MI, false, OpNum, CommuteOpIdx2);
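// If folding into the requested operand fails and commuting is allowed, the
// code above appears to commute the two source operands, retry the fold, and
// commute the instruction back when that also fails.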
8405 if (!MMO->isStore()) {
8423 if (!MMO->isStore())
8426 if (!MMO->isLoad()) {
8444 assert((SpillSize == 64 || STI.hasVLX()) &&
8445 "Can't broadcast less than 64 bytes without AVX512VL!");
8447#define CASE_BCAST_TYPE_OPC(TYPE, OP16, OP32, OP64) \
8449 switch (SpillSize) { \
8451 llvm_unreachable("Unknown spill size"); \
8485 unsigned Opc = I->DstOp;
8489 if (UnfoldLoad && !FoldedLoad)
8491 UnfoldLoad &= FoldedLoad;
8492 if (UnfoldStore && !FoldedStore)
8494 UnfoldStore &= FoldedStore;
8501 if (!MI.hasOneMemOperand() && RC == &X86::VR128RegClass &&
8502     Subtarget.isUnalignedMem16Slow())
8511 for (unsigned i = 0, e = MI.getNumOperands(); i != e; ++i) {
8515 else if (Op.isReg() && Op.isImplicit())
8531 unsigned Alignment = std::max<uint32_t>(TRI.getSpillSize(*RC), 16);
8532 bool isAligned = !MMOs.empty() && MMOs.front()->getAlign() >= Alignment;
8576 case X86::CMP64ri32:
8587 case X86::CMP64ri32:
8588 NewOpc = X86::TEST64rr;
8591 NewOpc = X86::TEST32rr;
8594 NewOpc = X86::TEST16rr;
8597 NewOpc = X86::TEST8rr;
8611 unsigned Alignment = std::max<uint32_t>(TRI.getSpillSize(*DstRC), 16);
8612 bool isAligned = !MMOs.empty() && MMOs.front()->getAlign() >= Alignment;
8628 if (!N->isMachineOpcode())
8634 unsigned Opc = I->DstOp;
8642 unsigned NumDefs = MCID.NumDefs;
8643 std::vector<SDValue> AddrOps;
8644 std::vector<SDValue> BeforeOps;
8645 std::vector<SDValue> AfterOps;
8647 unsigned NumOps = N->getNumOperands();
8648 for (unsigned i = 0; i != NumOps - 1; ++i) {
8651 AddrOps.push_back(Op);
8652 else if (i < Index - NumDefs)
8653 BeforeOps.push_back(Op);
8654 else if (i > Index - NumDefs)
8655 AfterOps.push_back(Op);
8658 AddrOps.push_back(Chain);
8663 EVT VT = *TRI.legalclasstypes_begin(*RC);
8665 if (MMOs.empty() && RC == &X86::VR128RegClass &&
8666 Subtarget.isUnalignedMem16Slow())
8676 unsigned Alignment = std::max<uint32_t>(TRI.getSpillSize(*RC), 16);
8677 bool isAligned = !MMOs.empty() && MMOs.front()->getAlign() >= Alignment;
8689 std::vector<EVT> VTs;
8691 if (MCID.getNumDefs() > 0) {
8693 VTs.push_back(*TRI.legalclasstypes_begin(*DstRC));
8695 for (unsigned i = 0, e = N->getNumValues(); i != e; ++i) {
8696 EVT VT = N->getValueType(i);
8697 if (VT != MVT::Other && i >= (unsigned)MCID.getNumDefs())
8701 BeforeOps.push_back(SDValue(Load, 0));
8707 case X86::CMP64ri32:
8715 case X86::CMP64ri32:
8716 Opc = X86::TEST64rr;
8719 Opc = X86::TEST32rr;
8722 Opc = X86::TEST16rr;
8728 BeforeOps[1] = BeforeOps[0];
8737 AddrOps.push_back(SDValue(NewNode, 0));
8738 AddrOps.push_back(Chain);
8740 if (MMOs.empty() && RC == &X86::VR128RegClass &&
8741 Subtarget.isUnalignedMem16Slow())
8746 unsigned Alignment = std::max<uint32_t>(TRI.getSpillSize(*RC), 16);
8747 bool isAligned = !MMOs.empty() && MMOs.front()->getAlign() >= Alignment;
8750 dl, MVT::Other, AddrOps);
8763 unsigned *LoadRegIndex) const {
8769 if (UnfoldLoad && !FoldedLoad)
8771 if (UnfoldStore && !FoldedStore)
8780 int64_t &Offset2) const {
8784 auto IsLoadOpcode = [&](unsigned Opcode) {
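// The opcode list below appears to enumerate the plain (unmasked) scalar,
// vector, and mask-register loads that the same-base-pointer check is willing
// to reason about.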
8796 case X86::MOVSSrm_alt:
8798 case X86::MOVSDrm_alt:
8799 case X86::MMX_MOVD64rm:
8800 case X86::MMX_MOVQ64rm:
8809 case X86::VMOVSSrm_alt:
8811 case X86::VMOVSDrm_alt:
8812 case X86::VMOVAPSrm:
8813 case X86::VMOVUPSrm:
8814 case X86::VMOVAPDrm:
8815 case X86::VMOVUPDrm:
8816 case X86::VMOVDQArm:
8817 case X86::VMOVDQUrm:
8818 case X86::VMOVAPSYrm:
8819 case X86::VMOVUPSYrm:
8820 case X86::VMOVAPDYrm:
8821 case X86::VMOVUPDYrm:
8822 case X86::VMOVDQAYrm:
8823 case X86::VMOVDQUYrm:
8825 case X86::VMOVSSZrm:
8826 case X86::VMOVSSZrm_alt:
8827 case X86::VMOVSDZrm:
8828 case X86::VMOVSDZrm_alt:
8829 case X86::VMOVAPSZ128rm:
8830 case X86::VMOVUPSZ128rm:
8831 case X86::VMOVAPSZ128rm_NOVLX:
8832 case X86::VMOVUPSZ128rm_NOVLX:
8833 case X86::VMOVAPDZ128rm:
8834 case X86::VMOVUPDZ128rm:
8835 case X86::VMOVDQU8Z128rm:
8836 case X86::VMOVDQU16Z128rm:
8837 case X86::VMOVDQA32Z128rm:
8838 case X86::VMOVDQU32Z128rm:
8839 case X86::VMOVDQA64Z128rm:
8840 case X86::VMOVDQU64Z128rm:
8841 case X86::VMOVAPSZ256rm:
8842 case X86::VMOVUPSZ256rm:
8843 case X86::VMOVAPSZ256rm_NOVLX:
8844 case X86::VMOVUPSZ256rm_NOVLX:
8845 case X86::VMOVAPDZ256rm:
8846 case X86::VMOVUPDZ256rm:
8847 case X86::VMOVDQU8Z256rm:
8848 case X86::VMOVDQU16Z256rm:
8849 case X86::VMOVDQA32Z256rm:
8850 case X86::VMOVDQU32Z256rm:
8851 case X86::VMOVDQA64Z256rm:
8852 case X86::VMOVDQU64Z256rm:
8853 case X86::VMOVAPSZrm:
8854 case X86::VMOVUPSZrm:
8855 case X86::VMOVAPDZrm:
8856 case X86::VMOVUPDZrm:
8857 case X86::VMOVDQU8Zrm:
8858 case X86::VMOVDQU16Zrm:
8859 case X86::VMOVDQA32Zrm:
8860 case X86::VMOVDQU32Zrm:
8861 case X86::VMOVDQA64Zrm:
8862 case X86::VMOVDQU64Zrm:
8864 case X86::KMOVBkm_EVEX:
8866 case X86::KMOVWkm_EVEX:
8868 case X86::KMOVDkm_EVEX:
8870 case X86::KMOVQkm_EVEX:
8880 auto HasSameOp = [&](int I) {
8896 if (!Disp1 || !Disp2)
8899 Offset1 = Disp1->getSExtValue();
8900 Offset2 = Disp2->getSExtValue();
8905 int64_t Offset1, int64_t Offset2,
8906 unsigned NumLoads) const {
8907 assert(Offset2 > Offset1);
8908 if ((Offset2 - Offset1) / 8 > 64)
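// Rough heuristic: if the two offsets are more than 512 bytes apart
// ((Offset2 - Offset1) / 8 > 64), the loads are presumably not worth
// clustering in the scheduler.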
8922 case X86::MMX_MOVD64rm:
8923 case X86::MMX_MOVQ64rm:
8932 if (Subtarget.is64Bit()) {
8935 } else if (NumLoads) {
8958 unsigned Opcode = MI.getOpcode();
8959 if (Opcode == X86::ENDBR64 || Opcode == X86::ENDBR32 ||
8960 Opcode == X86::PLDTILECFGV)
8973 assert(Cond.size() == 1 && "Invalid X86 branch condition!");
8983 return !(RC == &X86::CCRRegClass || RC == &X86::DFCCRRegClass ||
8984 RC == &X86::RFP32RegClass || RC == &X86::RFP64RegClass ||
8985 RC == &X86::RFP80RegClass);
8998 return GlobalBaseReg;
9003 GlobalBaseReg = RegInfo.createVirtualRegister(
9004 Subtarget.is64Bit() ? &X86::GR64_NOSPRegClass : &X86::GR32_NOSPRegClass);
9006 return GlobalBaseReg;
9014 for (const uint16_t(&Row)[3] : Table)
9015 if (Row[domain - 1] == opcode)
9023 for (const uint16_t(&Row)[4] : Table)
9024 if (Row[domain - 1] == opcode || (domain == 3 && Row[3] == opcode))
9031 unsigned NewWidth, unsigned *pNewMask = nullptr) {
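// AdjustBlendMask appears to rescale a blend immediate between element widths:
// when narrowing the mask, each group of Scale old bits must be all ones or
// all zeros; when widening, each old bit is expanded into Scale identical bits.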
9032 assert(((OldWidth % NewWidth) == 0 || (NewWidth % OldWidth) == 0) &&
9033 "Illegal blend mask scale");
9034 unsigned NewMask = 0;
9036 if ((OldWidth % NewWidth) == 0) {
9037 unsigned Scale = OldWidth / NewWidth;
9038 unsigned SubMask = (1u << Scale) - 1;
9039 for (unsigned i = 0; i != NewWidth; ++i) {
9040 unsigned Sub = (OldMask >> (i * Scale)) & SubMask;
9042 NewMask |= (1u << i);
9043 else if (Sub != 0x0)
9047 unsigned Scale = NewWidth / OldWidth;
9048 unsigned SubMask = (1u << Scale) - 1;
9049 for (unsigned i = 0; i != OldWidth; ++i) {
9050 if (OldMask & (1 << i)) {
9051 NewMask |= (SubMask << (i * Scale));
9057 *pNewMask = NewMask;
9062 unsigned Opcode = MI.getOpcode();
9063 unsigned NumOperands = MI.getDesc().getNumOperands();
9065 auto GetBlendDomains = [&](unsigned ImmWidth, bool Is256) {
9067 if (MI.getOperand(NumOperands - 1).isImm()) {
9068 unsigned Imm = MI.getOperand(NumOperands - 1).getImm();
9070 validDomains |= 0x2;
9072 validDomains |= 0x4;
9073 if (!Is256 || Subtarget.hasAVX2())
9074 validDomains |= 0x8;
9076 return validDomains;
9080 case X86::BLENDPDrmi:
9081 case X86::BLENDPDrri:
9082 case X86::VBLENDPDrmi:
9083 case X86::VBLENDPDrri:
9084 return GetBlendDomains(2, false);
9085 case X86::VBLENDPDYrmi:
9086 case X86::VBLENDPDYrri:
9087 return GetBlendDomains(4, true);
9088 case X86::BLENDPSrmi:
9089 case X86::BLENDPSrri:
9090 case X86::VBLENDPSrmi:
9091 case X86::VBLENDPSrri:
9092 case X86::VPBLENDDrmi:
9093 case X86::VPBLENDDrri:
9094 return GetBlendDomains(4, false);
9095 case X86::VBLENDPSYrmi:
9096 case X86::VBLENDPSYrri:
9097 case X86::VPBLENDDYrmi:
9098 case X86::VPBLENDDYrri:
9099 return GetBlendDomains(8, true);
9100 case X86::PBLENDWrmi:
9101 case X86::PBLENDWrri:
9102 case X86::VPBLENDWrmi:
9103 case X86::VPBLENDWrri:
9105 case X86::VPBLENDWYrmi:
9106 case X86::VPBLENDWYrri:
9107 return GetBlendDomains(8, false);
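// For the EVEX integer logic ops below, an alternative execution domain is
// presumably only reported when DQI is available and every operand lives in
// XMM/YMM0-15, since the VEX floating-point forms cannot encode the extended
// registers (see the encoding-value checks further down).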
9108 case X86::VPANDDZ128rr:
9109 case X86::VPANDDZ128rm:
9110 case X86::VPANDDZ256rr:
9111 case X86::VPANDDZ256rm:
9112 case X86::VPANDQZ128rr:
9113 case X86::VPANDQZ128rm:
9114 case X86::VPANDQZ256rr:
9115 case X86::VPANDQZ256rm:
9116 case X86::VPANDNDZ128rr:
9117 case X86::VPANDNDZ128rm:
9118 case X86::VPANDNDZ256rr:
9119 case X86::VPANDNDZ256rm:
9120 case X86::VPANDNQZ128rr:
9121 case X86::VPANDNQZ128rm:
9122 case X86::VPANDNQZ256rr:
9123 case X86::VPANDNQZ256rm:
9124 case X86::VPORDZ128rr:
9125 case X86::VPORDZ128rm:
9126 case X86::VPORDZ256rr:
9127 case X86::VPORDZ256rm:
9128 case X86::VPORQZ128rr:
9129 case X86::VPORQZ128rm:
9130 case X86::VPORQZ256rr:
9131 case X86::VPORQZ256rm:
9132 case X86::VPXORDZ128rr:
9133 case X86::VPXORDZ128rm:
9134 case X86::VPXORDZ256rr:
9135 case X86::VPXORDZ256rm:
9136 case X86::VPXORQZ128rr:
9137 case X86::VPXORQZ128rm:
9138 case X86::VPXORQZ256rr:
9139 case X86::VPXORQZ256rm:
9142 if (Subtarget.hasDQI())
9145 if (RI.getEncodingValue(MI.getOperand(0).getReg()) >= 16)
9147 if (RI.getEncodingValue(MI.getOperand(1).getReg()) >= 16)
9150 if (NumOperands == 3 &&
9151     RI.getEncodingValue(MI.getOperand(2).getReg()) >= 16)
9156 case X86::MOVHLPSrr:
9163 if (MI.getOperand(1).getReg() == MI.getOperand(2).getReg() &&
9164     MI.getOperand(0).getSubReg() == 0 &&
9165     MI.getOperand(1).getSubReg() == 0 && MI.getOperand(2).getSubReg() == 0)
9168 case X86::SHUFPDrri:
9174#include "X86ReplaceableInstrs.def"
9180 assert(dom && "Not an SSE instruction");
9182 unsigned Opcode = MI.getOpcode();
9183 unsigned NumOperands = MI.getDesc().getNumOperands();
9185 auto SetBlendDomain = [&](unsigned ImmWidth, bool Is256) {
9186 if (MI.getOperand(NumOperands - 1).isImm()) {
9187 unsigned Imm = MI.getOperand(NumOperands - 1).getImm() & 255;
9188 Imm = (ImmWidth == 16 ? ((Imm << 8) | Imm) : Imm);
9189 unsigned NewImm = Imm;
9191 const uint16_t *table = lookup(Opcode, dom, ReplaceableBlendInstrs);
9193 table = lookup(Opcode, dom, ReplaceableBlendAVX2Instrs);
9197 } else if (Domain == 2) {
9199 } else if (Domain == 3) {
9200 if (Subtarget.hasAVX2()) {
9202 if ((ImmWidth / (Is256 ? 2 : 1)) != 8) {
9203 table = lookup(Opcode, dom, ReplaceableBlendAVX2Instrs);
9207 assert(!Is256 && "128-bit vector expected");
9212 assert(table && table[Domain - 1] && "Unknown domain op");
9214 MI.getOperand(NumOperands - 1).setImm(NewImm & 255);
9220 case X86::BLENDPDrmi:
9221 case X86::BLENDPDrri:
9222 case X86::VBLENDPDrmi:
9223 case X86::VBLENDPDrri:
9224 return SetBlendDomain(2, false);
9225 case X86::VBLENDPDYrmi:
9226 case X86::VBLENDPDYrri:
9227 return SetBlendDomain(4, true);
9228 case X86::BLENDPSrmi:
9229 case X86::BLENDPSrri:
9230 case X86::VBLENDPSrmi:
9231 case X86::VBLENDPSrri:
9232 case X86::VPBLENDDrmi:
9233 case X86::VPBLENDDrri:
9234 return SetBlendDomain(4, false);
9235 case X86::VBLENDPSYrmi:
9236 case X86::VBLENDPSYrri:
9237 case X86::VPBLENDDYrmi:
9238 case X86::VPBLENDDYrri:
9239 return SetBlendDomain(8, true);
9240 case X86::PBLENDWrmi:
9241 case X86::PBLENDWrri:
9242 case X86::VPBLENDWrmi:
9243 case X86::VPBLENDWrri:
9244 return SetBlendDomain(8, false);
9245 case X86::VPBLENDWYrmi:
9246 case X86::VPBLENDWYrri:
9247 return SetBlendDomain(16, true);
9248 case X86::VPANDDZ128rr:
9249 case X86::VPANDDZ128rm:
9250 case X86::VPANDDZ256rr:
9251 case X86::VPANDDZ256rm:
9252 case X86::VPANDQZ128rr:
9253 case X86::VPANDQZ128rm:
9254 case X86::VPANDQZ256rr:
9255 case X86::VPANDQZ256rm:
9256 case X86::VPANDNDZ128rr:
9257 case X86::VPANDNDZ128rm:
9258 case X86::VPANDNDZ256rr:
9259 case X86::VPANDNDZ256rm:
9260 case X86::VPANDNQZ128rr:
9261 case X86::VPANDNQZ128rm:
9262 case X86::VPANDNQZ256rr:
9263 case X86::VPANDNQZ256rm:
9264 case X86::VPORDZ128rr:
9265 case X86::VPORDZ128rm:
9266 case X86::VPORDZ256rr:
9267 case X86::VPORDZ256rm:
9268 case X86::VPORQZ128rr:
9269 case X86::VPORQZ128rm:
9270 case X86::VPORQZ256rr:
9271 case X86::VPORQZ256rm:
9272 case X86::VPXORDZ128rr:
9273 case X86::VPXORDZ128rm:
9274 case X86::VPXORDZ256rr:
9275 case X86::VPXORDZ256rm:
9276 case X86::VPXORQZ128rr:
9277 case X86::VPXORQZ128rm:
9278 case X86::VPXORQZ256rr:
9279 case X86::VPXORQZ256rm: {
9281 if (Subtarget.hasDQI())
9285     lookupAVX512(MI.getOpcode(), dom, ReplaceableCustomAVX512LogicInstrs);
9286 assert(table && "Instruction not found in table?");
9289 if (Domain == 3 && (dom == 1 || table[3] == MI.getOpcode()))
9294 case X86::UNPCKHPDrr:
9295 case X86::MOVHLPSrr:
9298 MI.getOperand(1).getReg() == MI.getOperand(2).getReg() &&
9299 MI.getOperand(0).getSubReg() == 0 &&
9300 MI.getOperand(1).getSubReg() == 0 &&
9301 MI.getOperand(2).getSubReg() == 0) {
9302 commuteInstruction(MI, false);
9306 if (Opcode == X86::MOVHLPSrr)
9309 case X86::SHUFPDrri: {
9311 unsigned Imm = MI.getOperand(3).getImm();
9312 unsigned NewImm = 0x44;
9317 MI.getOperand(3).setImm(NewImm);
9318 MI.setDesc(get(X86::SHUFPSrri));
9326std::pair<uint16_t, uint16_t>
9329 unsigned opcode = MI.getOpcode();
9335 return std::make_pair(domain, validDomains);
9337 if (lookup(opcode, domain, ReplaceableInstrs)) {
9339 } else if (lookup(opcode, domain, ReplaceableInstrsAVX2)) {
9340 validDomains = Subtarget.hasAVX2() ? 0xe : 0x6;
9341 } else if (lookup(opcode, domain, ReplaceableInstrsFP)) {
9343 } else if (lookup(opcode, domain, ReplaceableInstrsAVX2InsertExtract)) {
9346 if (!Subtarget.hasAVX2())
9347 return std::make_pair(0, 0);
9349 } else if (lookupAVX512(opcode, domain, ReplaceableInstrsAVX512)) {
9351 } else if (Subtarget.hasDQI() &&
9352            lookupAVX512(opcode, domain, ReplaceableInstrsAVX512DQ)) {
9354 } else if (Subtarget.hasDQI()) {
9356         lookupAVX512(opcode, domain, ReplaceableInstrsAVX512DQMasked)) {
9357 if (domain == 1 || (domain == 3 && table[3] == opcode))
9364 return std::make_pair(domain, validDomains);
9370 assert(dom && "Not an SSE instruction");
9379 "256-bit vector operations only available in AVX2");
9380 table = lookup(MI.getOpcode(), dom, ReplaceableInstrsAVX2);
9383 table = lookup(MI.getOpcode(), dom, ReplaceableInstrsFP);
9385 "Can only select PackedSingle or PackedDouble");
9388 assert(Subtarget.hasAVX2() &&
9389 "256-bit insert/extract only available in AVX2");
9390 table = lookup(MI.getOpcode(), dom, ReplaceableInstrsAVX2InsertExtract);
9393 assert(Subtarget.hasAVX512() && "Requires AVX-512");
9394 table = lookupAVX512(MI.getOpcode(), dom, ReplaceableInstrsAVX512);
9396 if (table && Domain == 3 && table[3] == MI.getOpcode())
9400 assert((Subtarget.hasDQI() || Domain >= 3) && "Requires AVX-512DQ");
9401 table = lookupAVX512(MI.getOpcode(), dom, ReplaceableInstrsAVX512DQ);
9404 if (table && Domain == 3 && (dom == 1 || table[3] == MI.getOpcode()))
9408 assert((Subtarget.hasDQI() || Domain >= 3) && "Requires AVX-512DQ");
9409 table = lookupAVX512(MI.getOpcode(), dom, ReplaceableInstrsAVX512DQMasked);
9410 if (table && Domain == 3 && (dom == 1 || table[3] == MI.getOpcode()))
9413 assert(table && "Cannot change domain");
9439 case X86::DIVSDrm_Int:
9441 case X86::DIVSDrr_Int:
9443 case X86::DIVSSrm_Int:
9445 case X86::DIVSSrr_Int:
9451 case X86::SQRTSDm_Int:
9453 case X86::SQRTSDr_Int:
9455 case X86::SQRTSSm_Int:
9457 case X86::SQRTSSr_Int:
9461 case X86::VDIVPDYrm:
9462 case X86::VDIVPDYrr:
9465 case X86::VDIVPSYrm:
9466 case X86::VDIVPSYrr:
9468 case X86::VDIVSDrm_Int:
9470 case X86::VDIVSDrr_Int:
9472 case X86::VDIVSSrm_Int:
9474 case X86::VDIVSSrr_Int:
9477 case X86::VSQRTPDYm:
9478 case X86::VSQRTPDYr:
9481 case X86::VSQRTPSYm:
9482 case X86::VSQRTPSYr:
9484 case X86::VSQRTSDm_Int:
9486 case X86::VSQRTSDr_Int:
9488 case X86::VSQRTSSm_Int:
9490 case X86::VSQRTSSr_Int:
9492 case X86::VDIVPDZ128rm:
9493 case X86::VDIVPDZ128rmb:
9494 case X86::VDIVPDZ128rmbk:
9495 case X86::VDIVPDZ128rmbkz:
9496 case X86::VDIVPDZ128rmk:
9497 case X86::VDIVPDZ128rmkz:
9498 case X86::VDIVPDZ128rr:
9499 case X86::VDIVPDZ128rrk:
9500 case X86::VDIVPDZ128rrkz:
9501 case X86::VDIVPDZ256rm:
9502 case X86::VDIVPDZ256rmb:
9503 case X86::VDIVPDZ256rmbk:
9504 case X86::VDIVPDZ256rmbkz:
9505 case X86::VDIVPDZ256rmk:
9506 case X86::VDIVPDZ256rmkz:
9507 case X86::VDIVPDZ256rr:
9508 case X86::VDIVPDZ256rrk:
9509 case X86::VDIVPDZ256rrkz:
9510 case X86::VDIVPDZrrb:
9511 case X86::VDIVPDZrrbk:
9512 case X86::VDIVPDZrrbkz:
9513 case X86::VDIVPDZrm:
9514 case X86::VDIVPDZrmb:
9515 case X86::VDIVPDZrmbk:
9516 case X86::VDIVPDZrmbkz:
9517 case X86::VDIVPDZrmk:
9518 case X86::VDIVPDZrmkz:
9519 case X86::VDIVPDZrr:
9520 case X86::VDIVPDZrrk:
9521 case X86::VDIVPDZrrkz:
9522 case X86::VDIVPSZ128rm:
9523 case X86::VDIVPSZ128rmb:
9524 case X86::VDIVPSZ128rmbk:
9525 case X86::VDIVPSZ128rmbkz:
9526 case X86::VDIVPSZ128rmk:
9527 case X86::VDIVPSZ128rmkz:
9528 case X86::VDIVPSZ128rr:
9529 case X86::VDIVPSZ128rrk:
9530 case X86::VDIVPSZ128rrkz:
9531 case X86::VDIVPSZ256rm:
9532 case X86::VDIVPSZ256rmb:
9533 case X86::VDIVPSZ256rmbk:
9534 case X86::VDIVPSZ256rmbkz:
9535 case X86::VDIVPSZ256rmk:
9536 case X86::VDIVPSZ256rmkz:
9537 case X86::VDIVPSZ256rr:
9538 case X86::VDIVPSZ256rrk:
9539 case X86::VDIVPSZ256rrkz:
9540 case X86::VDIVPSZrrb:
9541 case X86::VDIVPSZrrbk:
9542 case X86::VDIVPSZrrbkz:
9543 case X86::VDIVPSZrm:
9544 case X86::VDIVPSZrmb:
9545 case X86::VDIVPSZrmbk:
9546 case X86::VDIVPSZrmbkz:
9547 case X86::VDIVPSZrmk:
9548 case X86::VDIVPSZrmkz:
9549 case X86::VDIVPSZrr:
9550 case X86::VDIVPSZrrk:
9551 case X86::VDIVPSZrrkz:
9552 case X86::VDIVSDZrm:
9553 case X86::VDIVSDZrr:
9554 case X86::VDIVSDZrm_Int:
9555 case X86::VDIVSDZrmk_Int:
9556 case X86::VDIVSDZrmkz_Int:
9557 case X86::VDIVSDZrr_Int:
9558 case X86::VDIVSDZrrk_Int:
9559 case X86::VDIVSDZrrkz_Int:
9560 case X86::VDIVSDZrrb_Int:
9561 case X86::VDIVSDZrrbk_Int:
9562 case X86::VDIVSDZrrbkz_Int:
9563 case X86::VDIVSSZrm:
9564 case X86::VDIVSSZrr:
9565 case X86::VDIVSSZrm_Int:
9566 case X86::VDIVSSZrmk_Int:
9567 case X86::VDIVSSZrmkz_Int:
9568 case X86::VDIVSSZrr_Int:
9569 case X86::VDIVSSZrrk_Int:
9570 case X86::VDIVSSZrrkz_Int:
9571 case X86::VDIVSSZrrb_Int:
9572 case X86::VDIVSSZrrbk_Int:
9573 case X86::VDIVSSZrrbkz_Int:
9574 case X86::VSQRTPDZ128m:
9575 case X86::VSQRTPDZ128mb:
9576 case X86::VSQRTPDZ128mbk:
9577 case X86::VSQRTPDZ128mbkz:
9578 case X86::VSQRTPDZ128mk:
9579 case X86::VSQRTPDZ128mkz:
9580 case X86::VSQRTPDZ128r:
9581 case X86::VSQRTPDZ128rk:
9582 case X86::VSQRTPDZ128rkz:
9583 case X86::VSQRTPDZ256m:
9584 case X86::VSQRTPDZ256mb:
9585 case X86::VSQRTPDZ256mbk:
9586 case X86::VSQRTPDZ256mbkz:
9587 case X86::VSQRTPDZ256mk:
9588 case X86::VSQRTPDZ256mkz:
9589 case X86::VSQRTPDZ256r:
9590 case X86::VSQRTPDZ256rk:
9591 case X86::VSQRTPDZ256rkz:
9592 case X86::VSQRTPDZm:
9593 case X86::VSQRTPDZmb:
9594 case X86::VSQRTPDZmbk:
9595 case X86::VSQRTPDZmbkz:
9596 case X86::VSQRTPDZmk:
9597 case X86::VSQRTPDZmkz:
9598 case X86::VSQRTPDZr:
9599 case X86::VSQRTPDZrb:
9600 case X86::VSQRTPDZrbk:
9601 case X86::VSQRTPDZrbkz:
9602 case X86::VSQRTPDZrk:
9603 case X86::VSQRTPDZrkz:
9604 case X86::VSQRTPSZ128m:
9605 case X86::VSQRTPSZ128mb:
9606 case X86::VSQRTPSZ128mbk:
9607 case X86::VSQRTPSZ128mbkz:
9608 case X86::VSQRTPSZ128mk:
9609 case X86::VSQRTPSZ128mkz:
9610 case X86::VSQRTPSZ128r:
9611 case X86::VSQRTPSZ128rk:
9612 case X86::VSQRTPSZ128rkz:
9613 case X86::VSQRTPSZ256m:
9614 case X86::VSQRTPSZ256mb:
9615 case X86::VSQRTPSZ256mbk:
9616 case X86::VSQRTPSZ256mbkz:
9617 case X86::VSQRTPSZ256mk:
9618 case X86::VSQRTPSZ256mkz:
9619 case X86::VSQRTPSZ256r:
9620 case X86::VSQRTPSZ256rk:
9621 case X86::VSQRTPSZ256rkz:
9622 case X86::VSQRTPSZm:
9623 case X86::VSQRTPSZmb:
9624 case X86::VSQRTPSZmbk:
9625 case X86::VSQRTPSZmbkz:
9626 case X86::VSQRTPSZmk:
9627 case X86::VSQRTPSZmkz:
9628 case X86::VSQRTPSZr:
9629 case X86::VSQRTPSZrb:
9630 case X86::VSQRTPSZrbk:
9631 case X86::VSQRTPSZrbkz:
9632 case X86::VSQRTPSZrk:
9633 case X86::VSQRTPSZrkz:
9634 case X86::VSQRTSDZm:
9635 case X86::VSQRTSDZm_Int:
9636 case X86::VSQRTSDZmk_Int:
9637 case X86::VSQRTSDZmkz_Int:
9638 case X86::VSQRTSDZr:
9639 case X86::VSQRTSDZr_Int:
9640 case X86::VSQRTSDZrk_Int:
9641 case X86::VSQRTSDZrkz_Int:
9642 case X86::VSQRTSDZrb_Int:
9643 case X86::VSQRTSDZrbk_Int:
9644 case X86::VSQRTSDZrbkz_Int:
9645 case X86::VSQRTSSZm:
9646 case X86::VSQRTSSZm_Int:
9647 case X86::VSQRTSSZmk_Int:
9648 case X86::VSQRTSSZmkz_Int:
9649 case X86::VSQRTSSZr:
9650 case X86::VSQRTSSZr_Int:
9651 case X86::VSQRTSSZrk_Int:
9652 case X86::VSQRTSSZrkz_Int:
9653 case X86::VSQRTSSZrb_Int:
9654 case X86::VSQRTSSZrbk_Int:
9655 case X86::VSQRTSSZrbkz_Int:
9657 case X86::VGATHERDPDYrm:
9658 case X86::VGATHERDPDZ128rm:
9659 case X86::VGATHERDPDZ256rm:
9660 case X86::VGATHERDPDZrm:
9661 case X86::VGATHERDPDrm:
9662 case X86::VGATHERDPSYrm:
9663 case X86::VGATHERDPSZ128rm:
9664 case X86::VGATHERDPSZ256rm:
9665 case X86::VGATHERDPSZrm:
9666 case X86::VGATHERDPSrm:
9667 case X86::VGATHERPF0DPDm:
9668 case X86::VGATHERPF0DPSm:
9669 case X86::VGATHERPF0QPDm:
9670 case X86::VGATHERPF0QPSm:
9671 case X86::VGATHERPF1DPDm:
9672 case X86::VGATHERPF1DPSm:
9673 case X86::VGATHERPF1QPDm:
9674 case X86::VGATHERPF1QPSm:
9675 case X86::VGATHERQPDYrm:
9676 case X86::VGATHERQPDZ128rm:
9677 case X86::VGATHERQPDZ256rm:
9678 case X86::VGATHERQPDZrm:
9679 case X86::VGATHERQPDrm:
9680 case X86::VGATHERQPSYrm:
9681 case X86::VGATHERQPSZ128rm:
9682 case X86::VGATHERQPSZ256rm:
9683 case X86::VGATHERQPSZrm:
9684 case X86::VGATHERQPSrm:
9685 case X86::VPGATHERDDYrm:
9686 case X86::VPGATHERDDZ128rm:
9687 case X86::VPGATHERDDZ256rm:
9688 case X86::VPGATHERDDZrm:
9689 case X86::VPGATHERDDrm:
9690 case X86::VPGATHERDQYrm:
9691 case X86::VPGATHERDQZ128rm:
9692 case X86::VPGATHERDQZ256rm:
9693 case X86::VPGATHERDQZrm:
9694 case X86::VPGATHERDQrm:
9695 case X86::VPGATHERQDYrm:
9696 case X86::VPGATHERQDZ128rm:
9697 case X86::VPGATHERQDZ256rm:
9698 case X86::VPGATHERQDZrm:
9699 case X86::VPGATHERQDrm:
9700 case X86::VPGATHERQQYrm:
9701 case X86::VPGATHERQQZ128rm:
9702 case X86::VPGATHERQQZ256rm:
9703 case X86::VPGATHERQQZrm:
9704 case X86::VPGATHERQQrm:
9705 case X86::VSCATTERDPDZ128mr:
9706 case X86::VSCATTERDPDZ256mr:
9707 case X86::VSCATTERDPDZmr:
9708 case X86::VSCATTERDPSZ128mr:
9709 case X86::VSCATTERDPSZ256mr:
9710 case X86::VSCATTERDPSZmr:
9711 case X86::VSCATTERPF0DPDm:
9712 case X86::VSCATTERPF0DPSm:
9713 case X86::VSCATTERPF0QPDm:
9714 case X86::VSCATTERPF0QPSm:
9715 case X86::VSCATTERPF1DPDm:
9716 case X86::VSCATTERPF1DPSm:
9717 case X86::VSCATTERPF1QPDm:
9718 case X86::VSCATTERPF1QPSm:
9719 case X86::VSCATTERQPDZ128mr:
9720 case X86::VSCATTERQPDZ256mr:
9721 case X86::VSCATTERQPDZmr:
9722 case X86::VSCATTERQPSZ128mr:
9723 case X86::VSCATTERQPSZ256mr:
9724 case X86::VSCATTERQPSZmr:
9725 case X86::VPSCATTERDDZ128mr:
9726 case X86::VPSCATTERDDZ256mr:
9727 case X86::VPSCATTERDDZmr:
9728 case X86::VPSCATTERDQZ128mr:
9729 case X86::VPSCATTERDQZ256mr:
9730 case X86::VPSCATTERDQZmr:
9731 case X86::VPSCATTERQDZ128mr:
9732 case X86::VPSCATTERQDZ256mr:
9733 case X86::VPSCATTERQDZmr:
9734 case X86::VPSCATTERQQZ128mr:
9735 case X86::VPSCATTERQQZ256mr:
9736 case X86::VPSCATTERQQZmr:
9746 unsigned UseIdx) const {
9753 Inst.getNumDefs() <= 2 && "Reassociation needs binary operators");
9763 assert((Inst.getNumDefs() == 1 || FlagDef) && "Implicit def isn't flags?");
9764 if (FlagDef && !FlagDef->isDead())
9775 bool Invert) const {
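// The opcode lists below appear to feed isAssociativeAndCommutative: the
// integer and logic ops are always reassociable, FP min/max only in their
// 'C' (commutative, NaN-agnostic) forms, and FP add/mul presumably only when
// the instruction carries the relevant fast-math flags.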
9827 case X86::VPANDDZ128rr:
9828 case X86::VPANDDZ256rr:
9829 case X86::VPANDDZrr:
9830 case X86::VPANDQZ128rr:
9831 case X86::VPANDQZ256rr:
9832 case X86::VPANDQZrr:
9835 case X86::VPORDZ128rr:
9836 case X86::VPORDZ256rr:
9838 case X86::VPORQZ128rr:
9839 case X86::VPORQZ256rr:
9843 case X86::VPXORDZ128rr:
9844 case X86::VPXORDZ256rr:
9845 case X86::VPXORDZrr:
9846 case X86::VPXORQZ128rr:
9847 case X86::VPXORQZ256rr:
9848 case X86::VPXORQZrr:
9851 case X86::VANDPDYrr:
9852 case X86::VANDPSYrr:
9853 case X86::VANDPDZ128rr:
9854 case X86::VANDPSZ128rr:
9855 case X86::VANDPDZ256rr:
9856 case X86::VANDPSZ256rr:
9857 case X86::VANDPDZrr:
9858 case X86::VANDPSZrr:
9863 case X86::VORPDZ128rr:
9864 case X86::VORPSZ128rr:
9865 case X86::VORPDZ256rr:
9866 case X86::VORPSZ256rr:
9871 case X86::VXORPDYrr:
9872 case X86::VXORPSYrr:
9873 case X86::VXORPDZ128rr:
9874 case X86::VXORPSZ128rr:
9875 case X86::VXORPDZ256rr:
9876 case X86::VXORPSZ256rr:
9877 case X86::VXORPDZrr:
9878 case X86::VXORPSZrr:
9899 case X86::VPADDBYrr:
9900 case X86::VPADDWYrr:
9901 case X86::VPADDDYrr:
9902 case X86::VPADDQYrr:
9903 case X86::VPADDBZ128rr:
9904 case X86::VPADDWZ128rr:
9905 case X86::VPADDDZ128rr:
9906 case X86::VPADDQZ128rr:
9907 case X86::VPADDBZ256rr:
9908 case X86::VPADDWZ256rr:
9909 case X86::VPADDDZ256rr:
9910 case X86::VPADDQZ256rr:
9911 case X86::VPADDBZrr:
9912 case X86::VPADDWZrr:
9913 case X86::VPADDDZrr:
9914 case X86::VPADDQZrr:
9915 case X86::VPMULLWrr:
9916 case X86::VPMULLWYrr:
9917 case X86::VPMULLWZ128rr:
9918 case X86::VPMULLWZ256rr:
9919 case X86::VPMULLWZrr:
9920 case X86::VPMULLDrr:
9921 case X86::VPMULLDYrr:
9922 case X86::VPMULLDZ128rr:
9923 case X86::VPMULLDZ256rr:
9924 case X86::VPMULLDZrr:
9925 case X86::VPMULLQZ128rr:
9926 case X86::VPMULLQZ256rr:
9927 case X86::VPMULLQZrr:
9928 case X86::VPMAXSBrr:
9929 case X86::VPMAXSBYrr:
9930 case X86::VPMAXSBZ128rr:
9931 case X86::VPMAXSBZ256rr:
9932 case X86::VPMAXSBZrr:
9933 case X86::VPMAXSDrr:
9934 case X86::VPMAXSDYrr:
9935 case X86::VPMAXSDZ128rr:
9936 case X86::VPMAXSDZ256rr:
9937 case X86::VPMAXSDZrr:
9938 case X86::VPMAXSQZ128rr:
9939 case X86::VPMAXSQZ256rr:
9940 case X86::VPMAXSQZrr:
9941 case X86::VPMAXSWrr:
9942 case X86::VPMAXSWYrr:
9943 case X86::VPMAXSWZ128rr:
9944 case X86::VPMAXSWZ256rr:
9945 case X86::VPMAXSWZrr:
9946 case X86::VPMAXUBrr:
9947 case X86::VPMAXUBYrr:
9948 case X86::VPMAXUBZ128rr:
9949 case X86::VPMAXUBZ256rr:
9950 case X86::VPMAXUBZrr:
9951 case X86::VPMAXUDrr:
9952 case X86::VPMAXUDYrr:
9953 case X86::VPMAXUDZ128rr:
9954 case X86::VPMAXUDZ256rr:
9955 case X86::VPMAXUDZrr:
9956 case X86::VPMAXUQZ128rr:
9957 case X86::VPMAXUQZ256rr:
9958 case X86::VPMAXUQZrr:
9959 case X86::VPMAXUWrr:
9960 case X86::VPMAXUWYrr:
9961 case X86::VPMAXUWZ128rr:
9962 case X86::VPMAXUWZ256rr:
9963 case X86::VPMAXUWZrr:
9964 case X86::VPMINSBrr:
9965 case X86::VPMINSBYrr:
9966 case X86::VPMINSBZ128rr:
9967 case X86::VPMINSBZ256rr:
9968 case X86::VPMINSBZrr:
9969 case X86::VPMINSDrr:
9970 case X86::VPMINSDYrr:
9971 case X86::VPMINSDZ128rr:
9972 case X86::VPMINSDZ256rr:
9973 case X86::VPMINSDZrr:
9974 case X86::VPMINSQZ128rr:
9975 case X86::VPMINSQZ256rr:
9976 case X86::VPMINSQZrr:
9977 case X86::VPMINSWrr:
9978 case X86::VPMINSWYrr:
9979 case X86::VPMINSWZ128rr:
9980 case X86::VPMINSWZ256rr:
9981 case X86::VPMINSWZrr:
9982 case X86::VPMINUBrr:
9983 case X86::VPMINUBYrr:
9984 case X86::VPMINUBZ128rr:
9985 case X86::VPMINUBZ256rr:
9986 case X86::VPMINUBZrr:
9987 case X86::VPMINUDrr:
9988 case X86::VPMINUDYrr:
9989 case X86::VPMINUDZ128rr:
9990 case X86::VPMINUDZ256rr:
9991 case X86::VPMINUDZrr:
9992 case X86::VPMINUQZ128rr:
9993 case X86::VPMINUQZ256rr:
9994 case X86::VPMINUQZrr:
9995 case X86::VPMINUWrr:
9996 case X86::VPMINUWYrr:
9997 case X86::VPMINUWZ128rr:
9998 case X86::VPMINUWZ256rr:
9999 case X86::VPMINUWZrr:
10003 case X86::MAXCPDrr:
10004 case X86::MAXCPSrr:
10005 case X86::MAXCSDrr:
10006 case X86::MAXCSSrr:
10007 case X86::MINCPDrr:
10008 case X86::MINCPSrr:
10009 case X86::MINCSDrr:
10010 case X86::MINCSSrr:
10011 case X86::VMAXCPDrr:
10012 case X86::VMAXCPSrr:
10013 case X86::VMAXCPDYrr:
10014 case X86::VMAXCPSYrr:
10015 case X86::VMAXCPDZ128rr:
10016 case X86::VMAXCPSZ128rr:
10017 case X86::VMAXCPDZ256rr:
10018 case X86::VMAXCPSZ256rr:
10019 case X86::VMAXCPDZrr:
10020 case X86::VMAXCPSZrr:
10021 case X86::VMAXCSDrr:
10022 case X86::VMAXCSSrr:
10023 case X86::VMAXCSDZrr:
10024 case X86::VMAXCSSZrr:
10025 case X86::VMINCPDrr:
10026 case X86::VMINCPSrr:
10027 case X86::VMINCPDYrr:
10028 case X86::VMINCPSYrr:
10029 case X86::VMINCPDZ128rr:
10030 case X86::VMINCPSZ128rr:
10031 case X86::VMINCPDZ256rr:
10032 case X86::VMINCPSZ256rr:
10033 case X86::VMINCPDZrr:
10034 case X86::VMINCPSZrr:
10035 case X86::VMINCSDrr:
10036 case X86::VMINCSSrr:
10037 case X86::VMINCSDZrr:
10038 case X86::VMINCSSZrr:
10039 case X86::VMAXCPHZ128rr:
10040 case X86::VMAXCPHZ256rr:
10041 case X86::VMAXCPHZrr:
10042 case X86::VMAXCSHZrr:
10043 case X86::VMINCPHZ128rr:
10044 case X86::VMINCPHZ256rr:
10045 case X86::VMINCPHZrr:
10046 case X86::VMINCSHZrr:
10056 case X86::VADDPDrr:
10057 case X86::VADDPSrr:
10058 case X86::VADDPDYrr:
10059 case X86::VADDPSYrr:
10060 case X86::VADDPDZ128rr:
10061 case X86::VADDPSZ128rr:
10062 case X86::VADDPDZ256rr:
10063 case X86::VADDPSZ256rr:
10064 case X86::VADDPDZrr:
10065 case X86::VADDPSZrr:
10066 case X86::VADDSDrr:
10067 case X86::VADDSSrr:
10068 case X86::VADDSDZrr:
10069 case X86::VADDSSZrr:
10070 case X86::VMULPDrr:
10071 case X86::VMULPSrr:
10072 case X86::VMULPDYrr:
10073 case X86::VMULPSYrr:
10074 case X86::VMULPDZ128rr:
10075 case X86::VMULPSZ128rr:
10076 case X86::VMULPDZ256rr:
10077 case X86::VMULPSZ256rr:
10078 case X86::VMULPDZrr:
10079 case X86::VMULPSZrr:
10080 case X86::VMULSDrr:
10081 case X86::VMULSSrr:
10082 case X86::VMULSDZrr:
10083 case X86::VMULSSZrr:
10084 case X86::VADDPHZ128rr:
10085 case X86::VADDPHZ256rr:
10086 case X86::VADDPHZrr:
10087 case X86::VADDSHZrr:
10088 case X86::VMULPHZ128rr:
10089 case X86::VMULPHZ256rr:
10090 case X86::VMULPHZrr:
10091 case X86::VMULSHZrr:
10102static std::optional<ParamLoadedValue>
10105 Register DestReg = MI.getOperand(0).getReg();
10106 Register SrcReg = MI.getOperand(1).getReg();
10111 if (DestReg == DescribedReg)
10116 if (unsigned SubRegIdx = TRI->getSubRegIndex(DestReg, DescribedReg)) {
10117 Register SrcSubReg = TRI->getSubReg(SrcReg, SubRegIdx);
10127 if (MI.getOpcode() == X86::MOV8rr || MI.getOpcode() == X86::MOV16rr ||
10128     !TRI->isSuperRegister(DestReg, DescribedReg))
10129 return std::nullopt;
10131 assert(MI.getOpcode() == X86::MOV32rr && "Unexpected super-register case");
10135std::optional<ParamLoadedValue>
10142 switch (MI.getOpcode()) {
10145 case X86::LEA64_32r: {
10147 if (!TRI->isSuperRegisterEq(MI.getOperand(0).getReg(), Reg))
10148 return std::nullopt;
10152 if (!MI.getOperand(4).isImm() || !MI.getOperand(2).isImm())
10153 return std::nullopt;
10162 if ((Op1.isReg() && Op1.getReg() == MI.getOperand(0).getReg()) ||
10163     Op2.getReg() == MI.getOperand(0).getReg())
10164 return std::nullopt;
10165 else if ((Op1.isReg() && Op1.getReg() != X86::NoRegister &&
10166           TRI->regsOverlap(Op1.getReg(), MI.getOperand(0).getReg())) ||
10167          (Op2.getReg() != X86::NoRegister &&
10168           TRI->regsOverlap(Op2.getReg(), MI.getOperand(0).getReg())))
10169 return std::nullopt;
10171 int64_t Coef = MI.getOperand(2).getImm();
10172 int64_t Offset = MI.getOperand(4).getImm();
10175 if ((Op1.isReg() && Op1.getReg() != X86::NoRegister)) {
10177 } else if (Op1.isFI())
10180 if (Op && Op->isReg() && Op->getReg() == Op2.getReg() && Coef > 0) {
10181 Ops.push_back(dwarf::DW_OP_constu);
10182 Ops.push_back(Coef + 1);
10183 Ops.push_back(dwarf::DW_OP_mul);
10185 if (Op && Op2.getReg() != X86::NoRegister) {
10186 int dwarfReg = TRI->getDwarfRegNum(Op2.getReg(), false);
10188 return std::nullopt;
10189 else if (dwarfReg < 32) {
10190 Ops.push_back(dwarf::DW_OP_breg0 + dwarfReg);
10193 Ops.push_back(dwarf::DW_OP_bregx);
10194 Ops.push_back(dwarfReg);
10204 Ops.push_back(dwarf::DW_OP_constu);
10205 Ops.push_back(Coef);
10206 Ops.push_back(dwarf::DW_OP_mul);
10209 if (((Op1.isReg() && Op1.getReg() != X86::NoRegister) || Op1.isFI()) &&
10210     Op2.getReg() != X86::NoRegister) {
10211 Ops.push_back(dwarf::DW_OP_plus);
10223 return std::nullopt;
10226 case X86::MOV64ri32:
10229 if (!TRI->isSuperRegisterEq(MI.getOperand(0).getReg(), Reg))
10230 return std::nullopt;
10237 case X86::XOR32rr: {
10240 if (!TRI->isSuperRegisterEq(MI.getOperand(0).getReg(), Reg))
10241 return std::nullopt;
10242 if (MI.getOperand(1).getReg() == MI.getOperand(2).getReg())
10244 return std::nullopt;
10246 case X86::MOVSX64rr32: {
10253 if (!TRI->isSubRegisterEq(MI.getOperand(0).getReg(), Reg))
10254 return std::nullopt;
10263 if (Reg == MI.getOperand(0).getReg())
10266 assert(X86MCRegisterClasses[X86::GR32RegClassID].contains(Reg) &&
10267        "Unhandled sub-register case for MOVSX64rr32");
10272 assert(!MI.isMoveImmediate() && "Unexpected MoveImm instruction");
10289 assert(!OldFlagDef1 == !OldFlagDef2 &&
10290 "Unexpected instruction type for reassociation");
10292 if (!OldFlagDef1 || !OldFlagDef2)
10296 "Must have dead EFLAGS operand in reassociable instruction");
10303 assert(NewFlagDef1 && NewFlagDef2 &&
10304 "Unexpected operand in reassociable instruction");
10314std::pair<unsigned, unsigned>
10316 return std::make_pair(TF, 0u);
10321 using namespace X86II;
10322 static const std::pair<unsigned, const char *> TargetFlags[] = {
10323 {MO_GOT_ABSOLUTE_ADDRESS, "x86-got-absolute-address"},
10324 {MO_PIC_BASE_OFFSET, "x86-pic-base-offset"},
10325 {MO_GOT, "x86-got"},
10326 {MO_GOTOFF, "x86-gotoff"},
10327 {MO_GOTPCREL, "x86-gotpcrel"},
10328 {MO_GOTPCREL_NORELAX, "x86-gotpcrel-norelax"},
10329 {MO_PLT, "x86-plt"},
10330 {MO_TLSGD, "x86-tlsgd"},
10331 {MO_TLSLD, "x86-tlsld"},
10332 {MO_TLSLDM, "x86-tlsldm"},
10333 {MO_GOTTPOFF, "x86-gottpoff"},
10334 {MO_INDNTPOFF, "x86-indntpoff"},
10335 {MO_TPOFF, "x86-tpoff"},
10336 {MO_DTPOFF, "x86-dtpoff"},
10337 {MO_NTPOFF, "x86-ntpoff"},
10338 {MO_GOTNTPOFF, "x86-gotntpoff"},
10339 {MO_DLLIMPORT, "x86-dllimport"},
10340 {MO_DARWIN_NONLAZY, "x86-darwin-nonlazy"},
10341 {MO_DARWIN_NONLAZY_PIC_BASE, "x86-darwin-nonlazy-pic-base"},
10342 {MO_TLVP, "x86-tlvp"},
10343 {MO_TLVP_PIC_BASE, "x86-tlvp-pic-base"},
10344 {MO_SECREL, "x86-secrel"},
10345 {MO_COFFSTUB, "x86-coffstub"}};
10362 if (!TM->isPositionIndependent())
10369 if (GlobalBaseReg == 0)
10381 PC = RegInfo.createVirtualRegister(&X86::GR32RegClass);
10383 PC = GlobalBaseReg;
10385 if (STI.is64Bit()) {
10438 StringRef getPassName() const override {
10439 return "X86 PIC Global Base Reg Initialization";
10442 void getAnalysisUsage(AnalysisUsage &AU) const override {
10457 bool runOnMachineFunction(MachineFunction &MF) override {
10461 X86MachineFunctionInfo *MFI = MF.getInfo<X86MachineFunctionInfo>();
10467 MachineDominatorTree *DT =
10468     &getAnalysis<MachineDominatorTreeWrapperPass>().getDomTree();
10478 MachineBasicBlock *BB = Node->getBlock();
10484 switch (I->getOpcode()) {
10485 case X86::TLS_base_addr32:
10486 case X86::TLS_base_addr64:
10487 if (TLSBaseAddrReg)
10488 I = ReplaceTLSBaseAddrCall(*I, TLSBaseAddrReg);
10490 I = SetRegister(*I, &TLSBaseAddrReg);
10499 for (auto &I : *Node) {
10500 Changed |= VisitNode(I, TLSBaseAddrReg);
10508 MachineInstr *ReplaceTLSBaseAddrCall(MachineInstr &I,
10510 MachineFunction *MF = I.getParent()->getParent();
10511 const X86Subtarget &STI = MF->getSubtarget<X86Subtarget>();
10512 const bool is64Bit = STI.is64Bit();
10516 MachineInstr *Copy =
10518     TII->get(TargetOpcode::COPY), is64Bit ? X86::RAX : X86::EAX)
10519     .addReg(TLSBaseAddrReg);
10522 I.eraseFromParent();
10529 MachineInstr *SetRegister(MachineInstr &I, Register *TLSBaseAddrReg) {
10530 MachineFunction *MF = I.getParent()->getParent();
10531 const X86Subtarget &STI = MF->getSubtarget<X86Subtarget>();
10532 const bool is64Bit = STI.is64Bit();
10536 MachineRegisterInfo &RegInfo = MF->getRegInfo();
10538     is64Bit ? &X86::GR64RegClass : &X86::GR32RegClass);
10541 MachineInstr *Next = I.getNextNode();
10543     TII->get(TargetOpcode::COPY), *TLSBaseAddrReg)
10549 StringRef getPassName() const override {
10550 return "Local Dynamic TLS Access Clean-up";
10553 void getAnalysisUsage(AnalysisUsage &AU) const override {
10555 AU.addRequired<MachineDominatorTreeWrapperPass>();
10561char LDTLSCleanup::ID = 0;
10563 return new LDTLSCleanup();
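// The outliner hooks below appear to cost a candidate by summing instruction
// sizes, give up when it contains only a subset of the function's CFI
// instructions, and outline terminator-ending sequences as tail calls while
// everything else gets a call/return frame.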
10596std::optional<std::unique_ptr<outliner::OutlinedFunction>>
10599 std::vector<outliner::Candidate> &RepeatedSequenceLocs,
10600 unsigned MinRepeats) const {
10601 unsigned SequenceSize = 0;
10602 for (auto &MI : RepeatedSequenceLocs[0]) {
10606 if (MI.isDebugInstr() || MI.isKill())
10613 unsigned CFICount = 0;
10614 for (auto &I : RepeatedSequenceLocs[0]) {
10615 if (I.isCFIInstruction())
10625 std::vector<MCCFIInstruction> CFIInstructions =
10626 C.getMF()->getFrameInstructions();
10628 if (CFICount > 0 && CFICount != CFIInstructions.size())
10629 return std::nullopt;
10633 if (RepeatedSequenceLocs[0].back().isTerminator()) {
10637 return std::make_unique<outliner::OutlinedFunction>(
10638 RepeatedSequenceLocs, SequenceSize,
10645 return std::nullopt;
10650 return std::make_unique<outliner::OutlinedFunction>(
10660 if (Subtarget.getFrameLowering()->has128ByteRedZone(MF)) {
10669 if (!OutlineFromLinkOnceODRs && F.hasLinkOnceODRLinkage())
10679 unsigned Flags) const {
10683 if (MI.isTerminator())
10697 if (MI.modifiesRegister(X86::RSP, &RI) || MI.readsRegister(X86::RSP, &RI) ||
10698     MI.getDesc().hasImplicitUseOfPhysReg(X86::RSP) ||
10699     MI.getDesc().hasImplicitDefOfPhysReg(X86::RSP))
10703 if (MI.readsRegister(X86::RIP, &RI) ||
10704     MI.getDesc().hasImplicitUseOfPhysReg(X86::RIP) ||
10705     MI.getDesc().hasImplicitDefOfPhysReg(X86::RIP))
10709 if (MI.isCFIInstruction())
10725 MBB.insert(MBB.end(), retq);
10735     .addGlobalAddress(M.getNamedValue(MF.getName())));
10739     .addGlobalAddress(M.getNamedValue(MF.getName())));
10748 bool AllowSideEffects) const {
10753 if (ST.hasMMX() && X86::VR64RegClass.contains(Reg))
10757 if (TRI.isGeneralPurposeRegister(MF, Reg)) {
10762 if (!AllowSideEffects)
10769 } else if (X86::VR128RegClass.contains(Reg)) {
10778 } else if (X86::VR256RegClass.contains(Reg)) {
10787 } else if (X86::VR512RegClass.contains(Reg)) {
10789 if (!ST.hasAVX512())
10796 } else if (X86::VK1RegClass.contains(Reg) || X86::VK2RegClass.contains(Reg) ||
10798            X86::VK16RegClass.contains(Reg)) {
10803 unsigned Op = ST.hasBWI() ? X86::KXORQkk : X86::KXORWkk;
10812 bool DoRegPressureReduce) const {
10815 case X86::VPDPWSSDrr:
10816 case X86::VPDPWSSDrm:
10817 case X86::VPDPWSSDYrr:
10818 case X86::VPDPWSSDYrm: {
10819 if (!Subtarget.hasFastDPWSSD()) {
10825 case X86::VPDPWSSDZ128r:
10826 case X86::VPDPWSSDZ128m:
10827 case X86::VPDPWSSDZ256r:
10828 case X86::VPDPWSSDZ256m:
10829 case X86::VPDPWSSDZr:
10830 case X86::VPDPWSSDZm: {
10831 if (Subtarget.hasBWI() && !Subtarget.hasFastDPWSSD()) {
10839 Patterns, DoRegPressureReduce);
10851 unsigned AddOpc = 0;
10852 unsigned MaddOpc = 0;
10855 assert(false && "It should not reach here");
10861 case X86::VPDPWSSDrr:
10862 MaddOpc = X86::VPMADDWDrr;
10863 AddOpc = X86::VPADDDrr;
10865 case X86::VPDPWSSDrm:
10866 MaddOpc = X86::VPMADDWDrm;
10867 AddOpc = X86::VPADDDrr;
10869 case X86::VPDPWSSDZ128r:
10870 MaddOpc = X86::VPMADDWDZ128rr;
10871 AddOpc = X86::VPADDDZ128rr;
10873 case X86::VPDPWSSDZ128m:
10874 MaddOpc = X86::VPMADDWDZ128rm;
10875 AddOpc = X86::VPADDDZ128rr;
10881 case X86::VPDPWSSDYrr:
10882 MaddOpc = X86::VPMADDWDYrr;
10883 AddOpc = X86::VPADDDYrr;
10885 case X86::VPDPWSSDYrm:
10886 MaddOpc = X86::VPMADDWDYrm;
10887 AddOpc = X86::VPADDDYrr;
10889 case X86::VPDPWSSDZ256r:
10890 MaddOpc = X86::VPMADDWDZ256rr;
10891 AddOpc = X86::VPADDDZ256rr;
10893 case X86::VPDPWSSDZ256m:
10894 MaddOpc = X86::VPMADDWDZ256rm;
10895 AddOpc = X86::VPADDDZ256rr;
10901 case X86::VPDPWSSDZr:
10902 MaddOpc = X86::VPMADDWDZrr;
10903 AddOpc = X86::VPADDDZrr;
10905 case X86::VPDPWSSDZm:
10906 MaddOpc = X86::VPMADDWDZrm;
10907 AddOpc = X86::VPADDDZrr;
10919 InstrIdxForVirtReg.insert(std::make_pair(NewReg, 0));
10941 DelInstrs, InstrIdxForVirtReg);
10945 InstrIdxForVirtReg);
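// On targets without fast VPDPWSSD, the dot-product-accumulate is presumably
// rewritten as a VPMADDWD feeding a VPADDD, with the temporary register
// recorded in InstrIdxForVirtReg for the machine combiner.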
10955 M.Base.FrameIndex = FI;
10956 M.getFullAddress(Ops);
10959#define GET_INSTRINFO_HELPERS
10960#include "X86GenInstrInfo.inc"
unsigned const MachineRegisterInfo * MRI
MachineInstrBuilder & UseMI
MachineInstrBuilder MachineInstrBuilder & DefMI
MachineOutlinerClass
Constants defining how certain sequences should be outlined.
@ MachineOutlinerTailCall
Emit a save, restore, call, and return.
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
MachineBasicBlock MachineBasicBlock::iterator MBBI
static GCRegistry::Add< StatepointGC > D("statepoint-example", "an example strategy for statepoint")
static GCRegistry::Add< CoreCLRGC > E("coreclr", "CoreCLR-compatible GC")
static GCRegistry::Add< OcamlGC > B("ocaml", "ocaml 3.10-compatible GC")
DXIL Forward Handle Accesses
const HexagonInstrInfo * TII
Module.h This file contains the declarations for the Module class.
static bool lookup(const GsymReader &GR, DataExtractor &Data, uint64_t &Offset, uint64_t BaseAddr, uint64_t Addr, SourceLocations &SrcLocs, llvm::Error &Err)
A Lookup helper functions.
const size_t AbstractManglingParser< Derived, Alloc >::NumOps
const AbstractManglingParser< Derived, Alloc >::OperatorInfo AbstractManglingParser< Derived, Alloc >::Ops[]
This file implements the LivePhysRegs utility for tracking liveness of physical registers.
static bool Expand2AddrUndef(MachineInstrBuilder &MIB, const MCInstrDesc &Desc)
Expand a single-def pseudo instruction to a two-addr instruction with two undef reads of the register...
This file declares the MachineConstantPool class which is an abstract constant pool to keep track of ...
Register const TargetRegisterInfo * TRI
Promote Memory to Register
const SmallVectorImpl< MachineOperand > MachineBasicBlock * TBB
const SmallVectorImpl< MachineOperand > & Cond
static bool contains(SmallPtrSetImpl< ConstantExpr * > &Cache, ConstantExpr *Expr, Constant *C)
Provides some synthesis utilities to produce sequences of values.
static SPCC::CondCodes GetOppositeBranchCondition(SPCC::CondCodes CC)
#define FROM_TO(FROM, TO)
cl::opt< bool > X86EnableAPXForRelocation
static bool is64Bit(const char *name)
#define GET_EGPR_IF_ENABLED(OPC)
static bool isLEA(unsigned Opcode)
static void addOperands(MachineInstrBuilder &MIB, ArrayRef< MachineOperand > MOs, int PtrOffset=0)
static std::optional< ParamLoadedValue > describeMOVrrLoadedValue(const MachineInstr &MI, Register DescribedReg, const TargetRegisterInfo *TRI)
If DescribedReg overlaps with the MOVrr instruction's destination register then, if possible,...
static cl::opt< unsigned > PartialRegUpdateClearance("partial-reg-update-clearance", cl::desc("Clearance between two register writes " "for inserting XOR to avoid partial " "register update"), cl::init(64), cl::Hidden)
static bool shouldPreventUndefRegUpdateMemFold(MachineFunction &MF, MachineInstr &MI)
static unsigned CopyToFromAsymmetricReg(Register DestReg, Register SrcReg, const X86Subtarget &Subtarget)
static bool isConvertibleLEA(MachineInstr *MI)
static bool ExpandMOVImmSExti8(MachineInstrBuilder &MIB, const TargetInstrInfo &TII, const X86Subtarget &Subtarget)
static bool isAMXOpcode(unsigned Opc)
static int getJumpTableIndexFromReg(const MachineRegisterInfo &MRI, Register Reg)
static void updateOperandRegConstraints(MachineFunction &MF, MachineInstr &NewMI, const TargetInstrInfo &TII)
static int getJumpTableIndexFromAddr(const MachineInstr &MI)
static bool AdjustBlendMask(unsigned OldMask, unsigned OldWidth, unsigned NewWidth, unsigned *pNewMask=nullptr)
static bool expandMOV32r1(MachineInstrBuilder &MIB, const TargetInstrInfo &TII, bool MinusOne)
static unsigned getNewOpcFromTable(ArrayRef< X86TableEntry > Table, unsigned Opc)
static unsigned getStoreRegOpcode(Register SrcReg, const TargetRegisterClass *RC, bool IsStackAligned, const X86Subtarget &STI)
#define FOLD_BROADCAST(SIZE)
static cl::opt< unsigned > UndefRegClearance("undef-reg-clearance", cl::desc("How many idle instructions we would like before " "certain undef register reads"), cl::init(128), cl::Hidden)
#define CASE_BCAST_TYPE_OPC(TYPE, OP16, OP32, OP64)
static bool isTruncatedShiftCountForLEA(unsigned ShAmt)
Check whether the given shift count is appropriate can be represented by a LEA instruction.
static cl::opt< bool > ReMatPICStubLoad("remat-pic-stub-load", cl::desc("Re-materialize load from stub in PIC mode"), cl::init(false), cl::Hidden)
static SmallVector< MachineMemOperand *, 2 > extractLoadMMOs(ArrayRef< MachineMemOperand * > MMOs, MachineFunction &MF)
static MachineInstr * fuseTwoAddrInst(MachineFunction &MF, unsigned Opcode, ArrayRef< MachineOperand > MOs, MachineBasicBlock::iterator InsertPt, MachineInstr &MI, const TargetInstrInfo &TII)
static void printFailMsgforFold(const MachineInstr &MI, unsigned Idx)
static bool canConvert2Copy(unsigned Opc)
static cl::opt< bool > NoFusing("disable-spill-fusing", cl::desc("Disable fusing of spill code into instructions"), cl::Hidden)
static bool expandNOVLXStore(MachineInstrBuilder &MIB, const TargetRegisterInfo *TRI, const MCInstrDesc &StoreDesc, const MCInstrDesc &ExtractDesc, unsigned SubIdx)
static bool isX87Reg(Register Reg)
Return true if the Reg is X87 register.
static bool Expand2AddrKreg(MachineInstrBuilder &MIB, const MCInstrDesc &Desc, Register Reg)
Expand a single-def pseudo instruction to a two-addr instruction with two k0 reads.
static bool isFrameLoadOpcode(int Opcode, TypeSize &MemBytes)
#define VPERM_CASES_BROADCAST(Suffix)
static std::pair< X86::CondCode, unsigned > isUseDefConvertible(const MachineInstr &MI)
Check whether the use can be converted to remove a comparison against zero.
static bool findRedundantFlagInstr(MachineInstr &CmpInstr, MachineInstr &CmpValDefInstr, const MachineRegisterInfo *MRI, MachineInstr **AndInstr, const TargetRegisterInfo *TRI, const X86Subtarget &ST, bool &NoSignFlag, bool &ClearsOverflowFlag)
static bool expandSHXDROT(MachineInstrBuilder &MIB, const MCInstrDesc &Desc)
static unsigned getLoadRegOpcode(Register DestReg, const TargetRegisterClass *RC, bool IsStackAligned, const X86Subtarget &STI)
static void expandLoadStackGuard(MachineInstrBuilder &MIB, const TargetInstrInfo &TII)
static bool hasUndefRegUpdate(unsigned Opcode, unsigned OpNum, bool ForLoadFold=false)
static MachineInstr * makeM0Inst(const TargetInstrInfo &TII, unsigned Opcode, ArrayRef< MachineOperand > MOs, MachineBasicBlock::iterator InsertPt, MachineInstr &MI)
#define GET_ND_IF_ENABLED(OPC)
static bool expandMOVSHP(MachineInstrBuilder &MIB, MachineInstr &MI, const TargetInstrInfo &TII, bool HasAVX)
static bool hasPartialRegUpdate(unsigned Opcode, const X86Subtarget &Subtarget, bool ForLoadFold=false)
Return true for all instructions that only update the first 32 or 64-bits of the destination register...
static const uint16_t * lookupAVX512(unsigned opcode, unsigned domain, ArrayRef< uint16_t[4]> Table)
static unsigned getLoadStoreRegOpcode(Register Reg, const TargetRegisterClass *RC, bool IsStackAligned, const X86Subtarget &STI, bool Load)
#define VPERM_CASES(Suffix)
#define FROM_TO_SIZE(A, B, S)
static void commuteVPTERNLOG(MachineInstr &MI, unsigned SrcOpIdx1, unsigned SrcOpIdx2)
static bool isDefConvertible(const MachineInstr &MI, bool &NoSignFlag, bool &ClearsOverflowFlag)
Check whether the definition can be converted to remove a comparison against zero.
static MachineInstr * fuseInst(MachineFunction &MF, unsigned Opcode, unsigned OpNo, ArrayRef< MachineOperand > MOs, MachineBasicBlock::iterator InsertPt, MachineInstr &MI, const TargetInstrInfo &TII, int PtrOffset=0)
static X86::CondCode getSwappedCondition(X86::CondCode CC)
Assuming the flags are set by MI(a,b), return the condition code if we modify the instructions such t...
static unsigned getCommutedVPERMV3Opcode(unsigned Opcode)
static bool expandXorFP(MachineInstrBuilder &MIB, const TargetInstrInfo &TII)
static MachineBasicBlock * getFallThroughMBB(MachineBasicBlock *MBB, MachineBasicBlock *TBB)
static bool isNonFoldablePartialRegisterLoad(const MachineInstr &LoadMI, const MachineInstr &UserMI, const MachineFunction &MF)
Check if LoadMI is a partial register load that we can't fold into MI because the latter uses content...
static unsigned getLoadStoreOpcodeForFP16(bool Load, const X86Subtarget &STI)
static bool isHReg(Register Reg)
Test if the given register is a physical h register.
static cl::opt< bool > PrintFailedFusing("print-failed-fuse-candidates", cl::desc("Print instructions that the allocator wants to" " fuse, but the X86 backend currently can't"), cl::Hidden)
static bool expandNOVLXLoad(MachineInstrBuilder &MIB, const TargetRegisterInfo *TRI, const MCInstrDesc &LoadDesc, const MCInstrDesc &BroadcastDesc, unsigned SubIdx)
static void genAlternativeDpCodeSequence(MachineInstr &Root, const TargetInstrInfo &TII, SmallVectorImpl< MachineInstr * > &InsInstrs, SmallVectorImpl< MachineInstr * > &DelInstrs, DenseMap< Register, unsigned > &InstrIdxForVirtReg)
static unsigned getThreeSrcCommuteCase(uint64_t TSFlags, unsigned SrcOpIdx1, unsigned SrcOpIdx2)
This determines which of three possible cases of a three source commute the source indexes correspond...
static bool isFrameStoreOpcode(int Opcode, TypeSize &MemBytes)
static unsigned getTruncatedShiftCount(const MachineInstr &MI, unsigned ShiftAmtOperandIdx)
Check whether the shift count for a machine operand is non-zero.
static SmallVector< MachineMemOperand *, 2 > extractStoreMMOs(ArrayRef< MachineMemOperand * > MMOs, MachineFunction &MF)
static unsigned getBroadcastOpcode(const X86FoldTableEntry *I, const TargetRegisterClass *RC, const X86Subtarget &STI)
static unsigned convertALUrr2ALUri(unsigned Opc)
Convert an ALUrr opcode to corresponding ALUri opcode.
static bool regIsPICBase(Register BaseReg, const MachineRegisterInfo &MRI)
Return true if register is PIC base; i.e.g defined by X86::MOVPC32r.
static bool isCommutableVPERMV3Instruction(unsigned Opcode)
static APInt getMaxValue(unsigned numBits)
Gets maximum unsigned value of APInt for specific bit width.
static APInt getSignedMaxValue(unsigned numBits)
Gets maximum signed value of APInt for a specific bit width.
static APInt getSignedMinValue(unsigned numBits)
Gets minimum signed value of APInt for a specific bit width.
AnalysisUsage & addRequired()
LLVM_ABI void setPreservesCFG()
This function should be called by the pass, iff they do not:
ArrayRef - Represent a constant reference to an array (0 or more elements consecutively in memory),...
size_t size() const
size - Get the array size.
Predicate
This enumeration lists the possible predicates for CmpInst subclasses.
@ FCMP_OEQ
0 0 0 1 True if ordered and equal
@ ICMP_SLT
signed less than
@ ICMP_SLE
signed less or equal
@ FCMP_OLT
0 1 0 0 True if ordered and less than
@ FCMP_ULE
1 1 0 1 True if unordered, less than, or equal
@ FCMP_OGT
0 0 1 0 True if ordered and greater than
@ FCMP_OGE
0 0 1 1 True if ordered and greater than or equal
@ ICMP_UGE
unsigned greater or equal
@ ICMP_UGT
unsigned greater than
@ ICMP_SGT
signed greater than
@ FCMP_ULT
1 1 0 0 True if unordered or less than
@ FCMP_ONE
0 1 1 0 True if ordered and operands are unequal
@ FCMP_UEQ
1 0 0 1 True if unordered or equal
@ ICMP_ULT
unsigned less than
@ FCMP_UGT
1 0 1 0 True if unordered or greater than
@ FCMP_OLE
0 1 0 1 True if ordered and less than or equal
@ FCMP_ORD
0 1 1 1 True if ordered (no nans)
@ ICMP_SGE
signed greater or equal
@ FCMP_UNE
1 1 1 0 True if unordered or not equal
@ ICMP_ULE
unsigned less or equal
@ FCMP_UGE
1 0 1 1 True if unordered, greater than, or equal
@ FCMP_UNO
1 0 0 0 True if unordered: isnan(X) | isnan(Y)
This is an important base class in LLVM.
static LLVM_ABI Constant * getAllOnesValue(Type *Ty)
static LLVM_ABI Constant * getNullValue(Type *Ty)
Constructor to create a '0' constant of arbitrary type.
static LLVM_ABI void appendOffset(SmallVectorImpl< uint64_t > &Ops, int64_t Offset)
Append Ops with operations to apply the Offset.
static LLVM_ABI DIExpression * appendExt(const DIExpression *Expr, unsigned FromSize, unsigned ToSize, bool Signed)
Append a zero- or sign-extension to Expr.
std::pair< iterator, bool > insert(const std::pair< KeyT, ValueT > &KV)
DomTreeNodeBase< NodeT > * getRootNode()
getRootNode - This returns the entry node for the CFG of the function.
static LLVM_ABI FixedVectorType * get(Type *ElementType, unsigned NumElts)
FunctionPass class - This class is used to implement most global optimizations.
bool hasOptSize() const
Optimize this function for size (-Os) or minimum size (-Oz).
bool hasMinSize() const
Optimize this function for minimum size (-Oz).
LLVMContext & getContext() const
getContext - Return a reference to the LLVMContext associated with this function.
LiveInterval - This class represents the liveness of a register, or stack slot.
SlotIndex InsertMachineInstrInMaps(MachineInstr &MI)
SlotIndex getInstructionIndex(const MachineInstr &Instr) const
Returns the base index of the given instruction.
LiveInterval & getInterval(Register Reg)
SlotIndex ReplaceMachineInstrInMaps(MachineInstr &MI, MachineInstr &NewMI)
A set of physical registers with utility functions to track liveness when walking backward/forward th...
const Segment * getSegmentContaining(SlotIndex Idx) const
Return the segment that contains the specified index, or null if there is none.
LLVM_ABI void replaceKillInstruction(Register Reg, MachineInstr &OldMI, MachineInstr &NewMI)
replaceKillInstruction - Update register kill info by replacing a kill instruction with a new one.
LLVM_ABI VarInfo & getVarInfo(Register Reg)
getVarInfo - Return the VarInfo structure for the specified VIRTUAL register.
static LocationSize precise(uint64_t Value)
bool usesWindowsCFI() const
static MCCFIInstruction createAdjustCfaOffset(MCSymbol *L, int64_t Adjustment, SMLoc Loc={})
.cfi_adjust_cfa_offset Same as .cfi_def_cfa_offset, but Offset is a relative value that is added/subt...
Instances of this class represent a single low-level machine instruction.
void setOpcode(unsigned Op)
Describe properties that are true of each instruction in the target description file.
unsigned getNumOperands() const
Return the number of declared MachineOperands for this MachineInstruction.
This holds information about one operand of a machine instruction, indicating the register class for ...
Wrapper class representing physical registers. Should be passed by value.
static MDTuple * get(LLVMContext &Context, ArrayRef< Metadata * > MDs)
MachineInstrBundleIterator< const MachineInstr > const_iterator
void push_back(MachineInstr *MI)
MachineInstr * remove(MachineInstr *I)
Remove the unbundled instruction from the instruction list without deleting it.
LLVM_ABI DebugLoc findDebugLoc(instr_iterator MBBI)
Find the next valid DebugLoc starting at MBBI, skipping any debug instructions.
MachineInstrBundleIterator< MachineInstr, true > reverse_iterator
LLVM_ABI bool isLayoutSuccessor(const MachineBasicBlock *MBB) const
Return true if the specified MBB will be emitted immediately after this block, such that if this bloc...
LLVM_ABI void eraseFromParent()
This method unlinks 'this' from the containing function and deletes it.
LLVM_ABI instr_iterator erase(instr_iterator I)
Remove an instruction from the instruction list and delete it.
iterator_range< succ_iterator > successors()
MachineInstrBundleIterator< MachineInstr > iterator
@ LQR_Dead
Register is known to be fully dead.
This class is a data container for one entry in a MachineConstantPool.
union llvm::MachineConstantPoolEntry::(anonymous union) Val
The constant itself.
bool isMachineConstantPoolEntry() const
isMachineConstantPoolEntry - Return true if the MachineConstantPoolEntry is indeed a target specific ...
const Constant * ConstVal
The MachineConstantPool class keeps track of constants referenced by a function which must be spilled...
unsigned getConstantPoolIndex(const Constant *C, Align Alignment)
getConstantPoolIndex - Create a new entry in the constant pool or return an existing one.
The MachineFrameInfo class represents an abstract stack frame until prolog/epilog code is inserted.
Align getObjectAlign(int ObjectIdx) const
Return the alignment of the specified stack object.
int64_t getObjectSize(int ObjectIdx) const
Return the size of the specified object.
bool isFixedObjectIndex(int ObjectIdx) const
Returns true if the specified index corresponds to a fixed stack object.
MachineFunctionPass - This class adapts the FunctionPass interface to allow convenient creation of pa...
void getAnalysisUsage(AnalysisUsage &AU) const override
getAnalysisUsage - Subclasses that override getAnalysisUsage must call this.
MCSymbol * getPICBaseSymbol() const
getPICBaseSymbol - Return a function-local symbol to represent the PIC base.
const TargetSubtargetInfo & getSubtarget() const
getSubtarget - Return the subtarget for which this machine code is being compiled.
StringRef getName() const
getName - Return the name of the corresponding LLVM function.
MachineMemOperand * getMachineMemOperand(MachinePointerInfo PtrInfo, MachineMemOperand::Flags f, LLT MemTy, Align base_alignment, const AAMDNodes &AAInfo=AAMDNodes(), const MDNode *Ranges=nullptr, SyncScope::ID SSID=SyncScope::System, AtomicOrdering Ordering=AtomicOrdering::NotAtomic, AtomicOrdering FailureOrdering=AtomicOrdering::NotAtomic)
getMachineMemOperand - Allocate a new MachineMemOperand.
bool needsFrameMoves() const
True if this function needs frame moves for debug or exceptions.
MachineFrameInfo & getFrameInfo()
getFrameInfo - Return the frame info object for the current function.
MachineRegisterInfo & getRegInfo()
getRegInfo - Return information about the registers currently in use.
Function & getFunction()
Return the LLVM function that this machine code represents.
Ty * getInfo()
getInfo - Keep track of various per-function pieces of information for backends that would like to do...
MachineConstantPool * getConstantPool()
getConstantPool - Return the constant pool object for the current function.
const MachineBasicBlock & front() const
const TargetMachine & getTarget() const
getTarget - Return the target machine this machine code is compiled with
Register getReg(unsigned Idx) const
Get the register for the operand index.
const MachineInstrBuilder & setMemRefs(ArrayRef< MachineMemOperand * > MMOs) const
const MachineInstrBuilder & addExternalSymbol(const char *FnName, unsigned TargetFlags=0) const
const MachineInstrBuilder & setMIFlag(MachineInstr::MIFlag Flag) const
const MachineInstrBuilder & addImm(int64_t Val) const
Add a new immediate operand.
const MachineInstrBuilder & add(const MachineOperand &MO) const
const MachineInstrBuilder & addSym(MCSymbol *Sym, unsigned char TargetFlags=0) const
const MachineInstrBuilder & addGlobalAddress(const GlobalValue *GV, int64_t Offset=0, unsigned TargetFlags=0) const
const MachineInstrBuilder & addDisp(const MachineOperand &Disp, int64_t off, unsigned char TargetFlags=0) const
const MachineInstrBuilder & addReg(Register RegNo, unsigned flags=0, unsigned SubReg=0) const
Add a new virtual register operand.
const MachineInstrBuilder & addMBB(MachineBasicBlock *MBB, unsigned TargetFlags=0) const
const MachineInstrBuilder & copyImplicitOps(const MachineInstr &OtherMI) const
Copy all the implicit operands from OtherMI onto this one.
const MachineInstrBuilder & addMemOperand(MachineMemOperand *MMO) const
MachineInstr * getInstr() const
If conversion operators fail, use this method to get the MachineInstr explicitly.
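A hedged sketch of how these builder helpers are usually chained inside a backend pass; MBB, MI, DL and TII are assumed to come from the surrounding code, and the opcode and register are placeholders rather than a prescription:
// Materialize a 32-bit immediate into EAX just before MI (illustrative only).
MachineInstrBuilder MIB =
    BuildMI(MBB, MI, DL, TII->get(X86::MOV32ri), X86::EAX).addImm(42);
MIB.setMIFlag(MachineInstr::FrameSetup); // flags can be attached after the fact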
Representation of each machine instruction.
mop_iterator operands_begin()
unsigned getOpcode() const
Returns the opcode of this MachineInstr.
bool isImplicitDef() const
const MachineBasicBlock * getParent() const
void dropDebugNumber()
Drop any variable location debugging information associated with this instruction.
LLVM_ABI void setPreInstrSymbol(MachineFunction &MF, MCSymbol *Symbol)
Set a symbol that will be emitted just prior to the instruction itself.
LLVM_ABI void addImplicitDefUseOperands(MachineFunction &MF)
Add all implicit def and use operands to this instruction.
bool getFlag(MIFlag Flag) const
Return whether an MI flag is set.
unsigned getNumOperands() const
Returns the total number of operands.
LLVM_ABI void addOperand(MachineFunction &MF, const MachineOperand &Op)
Add the specified operand to the instruction.
LLVM_ABI unsigned getNumExplicitOperands() const
Returns the number of non-implicit operands.
bool modifiesRegister(Register Reg, const TargetRegisterInfo *TRI) const
Return true if the MachineInstr modifies (fully define or partially define) the specified register.
const MCInstrDesc & getDesc() const
Returns the target instruction descriptor of this MachineInstr.
void untieRegOperand(unsigned OpIdx)
Break any tie involving OpIdx.
LLVM_ABI void setDesc(const MCInstrDesc &TID)
Replace the instruction descriptor (thus opcode) of the current instruction with a new one.
LLVM_ABI unsigned getNumExplicitDefs() const
Returns the number of non-implicit definitions.
LLVM_ABI void eraseFromBundle()
Unlink 'this' from its basic block and delete it.
bool hasOneMemOperand() const
Return true if this instruction has exactly one MachineMemOperand.
LLVM_ABI void substituteRegister(Register FromReg, Register ToReg, unsigned SubIdx, const TargetRegisterInfo &RegInfo)
Replace all occurrences of FromReg with ToReg:SubIdx, properly composing subreg indices where necessa...
mmo_iterator memoperands_begin() const
Access to memory operands of the instruction.
LLVM_ABI bool isIdenticalTo(const MachineInstr &Other, MICheckType Check=CheckDefs) const
Return true if this instruction is identical to Other.
LLVM_ABI const MachineFunction * getMF() const
Return the function that contains the basic block that this instruction belongs to.
void setFlag(MIFlag Flag)
Set a MI flag.
const DebugLoc & getDebugLoc() const
Returns the debug location id of this MachineInstr.
LLVM_ABI void eraseFromParent()
Unlink 'this' from the containing basic block and delete it.
LLVM_ABI void removeOperand(unsigned OpNo)
Erase an operand from an instruction, leaving it with one fewer operand than it started with.
LLVM_ABI void dump() const
const MachineOperand & getOperand(unsigned i) const
unsigned getNumDefs() const
Returns the total number of definitions.
void setDebugLoc(DebugLoc DL)
Replace the current source information with new source information.
MachineOperand * findRegisterDefOperand(Register Reg, const TargetRegisterInfo *TRI, bool isDead=false, bool Overlap=false)
Wrapper for findRegisterDefOperandIdx, it returns a pointer to the MachineOperand rather than an inde...
A description of a memory reference used in the backend.
@ MODereferenceable
The memory access is dereferenceable (i.e., doesn't trap).
@ MOLoad
The memory access reads data.
@ MOInvariant
The memory access always returns the same value (or traps).
@ MOStore
The memory access writes data.
This class contains meta information specific to a module.
MachineOperand class - Representation of each machine instruction operand.
void setSubReg(unsigned subReg)
unsigned getSubReg() const
void setImplicit(bool Val=true)
void setImm(int64_t immVal)
bool readsReg() const
readsReg - Returns true if this operand reads the previous value of its register.
bool isReg() const
isReg - Tests if this is a MO_Register operand.
MachineBasicBlock * getMBB() const
bool isCPI() const
isCPI - Tests if this is a MO_ConstantPoolIndex operand.
void setIsDead(bool Val=true)
LLVM_ABI void setReg(Register Reg)
Change the register this operand corresponds to.
bool isImm() const
isImm - Tests if this is a MO_Immediate operand.
void setIsKill(bool Val=true)
bool isJTI() const
isJTI - Tests if this is a MO_JumpTableIndex operand.
LLVM_ABI void ChangeToRegister(Register Reg, bool isDef, bool isImp=false, bool isKill=false, bool isDead=false, bool isUndef=false, bool isDebug=false)
ChangeToRegister - Replace this operand with a new register operand of the specified value.
static MachineOperand CreateImm(int64_t Val)
void setIsUndef(bool Val=true)
Register getReg() const
getReg - Returns the register number.
bool isFI() const
isFI - Tests if this is a MO_FrameIndex operand.
LLVM_ABI bool isIdenticalTo(const MachineOperand &Other) const
Returns true if this operand is identical to the specified operand except for liveness related flags ...
static MachineOperand CreateCPI(unsigned Idx, int Offset, unsigned TargetFlags=0)
static MachineOperand CreateReg(Register Reg, bool isDef, bool isImp=false, bool isKill=false, bool isDead=false, bool isUndef=false, bool isEarlyClobber=false, unsigned SubReg=0, bool isDebug=false, bool isInternalRead=false, bool isRenamable=false)
int64_t getOffset() const
Return the offset from the symbol in this operand.
static MachineOperand CreateFI(int Idx)
MachineRegisterInfo - Keep track of information for virtual and physical registers,...
const TargetRegisterClass * getRegClass(Register Reg) const
Return the register class of the specified virtual register.
LLVM_ABI Register createVirtualRegister(const TargetRegisterClass *RegClass, StringRef Name="")
createVirtualRegister - Create and return a new virtual register in the function with the specified r...
LLVM_ABI const TargetRegisterClass * constrainRegClass(Register Reg, const TargetRegisterClass *RC, unsigned MinNumRegs=0)
constrainRegClass - Constrain the register class of the specified virtual register to be a common sub...
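A minimal sketch of the two calls above, assuming MRI and SrcReg are provided by the surrounding pass:
// Create a fresh GR32 virtual register and try to narrow an existing one to a
// subclass required by some operand constraint (illustrative only).
Register Tmp = MRI.createVirtualRegister(&X86::GR32RegClass);
if (!MRI.constrainRegClass(SrcReg, &X86::GR32_NOREXRegClass)) {
  // No common subclass exists, so the operand cannot simply be reused.
}
(void)Tmp;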
A Module instance is used to store all the information related to an LLVM module.
Wrapper class representing virtual and physical registers.
constexpr bool isValid() const
constexpr bool isVirtual() const
Return true if the specified register number is in the virtual register namespace.
constexpr bool isPhysical() const
Return true if the specified register number is in the physical register namespace.
Wrapper class for IR location info (IR ordering and DebugLoc) to be passed into SDNode creation funct...
Represents one node in the SelectionDAG.
bool isMachineOpcode() const
Test if this node has a post-isel opcode, directly corresponding to a MachineInstr opcode.
unsigned getMachineOpcode() const
This may only be called if isMachineOpcode returns true.
const SDValue & getOperand(unsigned Num) const
EVT getValueType(unsigned ResNo) const
Return the type of a specified result.
Unlike LLVM values, Selection DAG nodes may return multiple values as the result of a computation.
This is used to represent a portion of an LLVM function in a low-level Data Dependence DAG representa...
LLVM_ABI MachineSDNode * getMachineNode(unsigned Opcode, const SDLoc &dl, EVT VT)
These are used for target selectors to create a new node with specified return type(s),...
LLVM_ABI void setNodeMemRefs(MachineSDNode *N, ArrayRef< MachineMemOperand * > NewMemRefs)
Mutate the specified machine node's memory references to the provided list.
MachineFunction & getMachineFunction() const
SlotIndex - An opaque wrapper around machine indexes.
SlotIndex getBaseIndex() const
Returns the base index associated with this index.
SlotIndex getRegSlot(bool EC=false) const
Returns the register use/def slot in the current instruction for a normal or early-clobber def.
This class consists of common code factored out of the SmallVector class to reduce code duplication b...
void append(ItTy in_start, ItTy in_end)
Add the specified range to the end of the SmallVector.
void push_back(const T &Elt)
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
StringRef - Represent a constant reference to a string, i.e.
Information about stack frame layout on the target.
bool hasFP(const MachineFunction &MF) const
hasFP - Return true if the specified function should have a dedicated frame pointer register.
Align getStackAlign() const
getStackAlignment - This method returns the number of bytes to which the stack pointer must be aligne...
TargetInstrInfo - Interface to description of machine instruction set.
virtual bool findCommutedOpIndices(const MachineInstr &MI, unsigned &SrcOpIdx1, unsigned &SrcOpIdx2) const
Returns true iff the routine could find two commutable operands in the given machine instruction.
virtual bool hasReassociableOperands(const MachineInstr &Inst, const MachineBasicBlock *MBB) const
Return true when \P Inst has reassociable operands in the same \P MBB.
virtual void genAlternativeCodeSequence(MachineInstr &Root, unsigned Pattern, SmallVectorImpl< MachineInstr * > &InsInstrs, SmallVectorImpl< MachineInstr * > &DelInstrs, DenseMap< Register, unsigned > &InstIdxForVirtReg) const
When getMachineCombinerPatterns() finds patterns, this function generates the instructions that could...
virtual std::optional< ParamLoadedValue > describeLoadedValue(const MachineInstr &MI, Register Reg) const
Produce the expression describing the MI loading a value into the physical register Reg.
virtual bool getMachineCombinerPatterns(MachineInstr &Root, SmallVectorImpl< unsigned > &Patterns, bool DoRegPressureReduce) const
Return true when there is potentially a faster code sequence for an instruction chain ending in Root.
virtual bool isReallyTriviallyReMaterializable(const MachineInstr &MI) const
For instructions with opcodes for which the M_REMATERIALIZABLE flag is set, this hook lets the target...
virtual bool isSchedulingBoundary(const MachineInstr &MI, const MachineBasicBlock *MBB, const MachineFunction &MF) const
Test if the given instruction should be considered a scheduling boundary.
virtual MachineInstr * commuteInstructionImpl(MachineInstr &MI, bool NewMI, unsigned OpIdx1, unsigned OpIdx2) const
This method commutes the operands of the given machine instruction MI.
virtual const TargetRegisterClass * getRegClass(const MCInstrDesc &MCID, unsigned OpNum, const TargetRegisterInfo *TRI, const MachineFunction &MF) const
Given a machine instruction descriptor, returns the register class constraint for OpNum,...
bool isPositionIndependent() const
CodeModel::Model getCodeModel() const
Returns the code model.
const MCAsmInfo * getMCAsmInfo() const
Return target specific asm information.
TargetRegisterInfo base class - We assume that the target defines a static array of TargetRegisterDes...
Provide an instruction scheduling machine model to CodeGen passes.
virtual const TargetFrameLowering * getFrameLowering() const
virtual const TargetRegisterInfo * getRegisterInfo() const =0
Return the target's register information.
Target - Wrapper for Target specific information.
static constexpr TypeSize getFixed(ScalarTy ExactSize)
static constexpr TypeSize getZero()
The instances of the Type class are immutable: once they are created, they are never changed.
static LLVM_ABI IntegerType * getInt32Ty(LLVMContext &C)
static LLVM_ABI Type * getFP128Ty(LLVMContext &C)
static LLVM_ABI Type * getDoubleTy(LLVMContext &C)
static LLVM_ABI Type * getFloatTy(LLVMContext &C)
static LLVM_ABI Type * getHalfTy(LLVMContext &C)
SlotIndex def
The index of the defining instruction.
LLVM Value Representation.
void BuildCFI(MachineBasicBlock &MBB, MachineBasicBlock::iterator MBBI, const DebugLoc &DL, const MCCFIInstruction &CFIInst, MachineInstr::MIFlag Flag=MachineInstr::NoFlags) const
Wraps up getting a CFI index and building a MachineInstr for it.
void loadRegFromStackSlot(MachineBasicBlock &MBB, MachineBasicBlock::iterator MI, Register DestReg, int FrameIndex, const TargetRegisterClass *RC, const TargetRegisterInfo *TRI, Register VReg, MachineInstr::MIFlag Flags=MachineInstr::NoFlags) const override
void getFrameIndexOperands(SmallVectorImpl< MachineOperand > &Ops, int FI) const override
bool optimizeCompareInstr(MachineInstr &CmpInstr, Register SrcReg, Register SrcReg2, int64_t CmpMask, int64_t CmpValue, const MachineRegisterInfo *MRI) const override
Check if there exists an earlier instruction that operates on the same source operands and sets eflag...
bool getMachineCombinerPatterns(MachineInstr &Root, SmallVectorImpl< unsigned > &Patterns, bool DoRegPressureReduce) const override
void copyPhysReg(MachineBasicBlock &MBB, MachineBasicBlock::iterator MI, const DebugLoc &DL, Register DestReg, Register SrcReg, bool KillSrc, bool RenamableDest=false, bool RenamableSrc=false) const override
bool isSchedulingBoundary(const MachineInstr &MI, const MachineBasicBlock *MBB, const MachineFunction &MF) const override
Overrides the isSchedulingBoundary from Codegen/TargetInstrInfo.cpp to make it capable of identifying...
MachineBasicBlock::iterator insertOutlinedCall(Module &M, MachineBasicBlock &MBB, MachineBasicBlock::iterator &It, MachineFunction &MF, outliner::Candidate &C) const override
const TargetRegisterClass * getRegClass(const MCInstrDesc &MCID, unsigned OpNum, const TargetRegisterInfo *TRI, const MachineFunction &MF) const override
Given a machine instruction descriptor, returns the register class constraint for OpNum,...
void replaceBranchWithTailCall(MachineBasicBlock &MBB, SmallVectorImpl< MachineOperand > &Cond, const MachineInstr &TailCall) const override
void reMaterialize(MachineBasicBlock &MBB, MachineBasicBlock::iterator MI, Register DestReg, unsigned SubIdx, const MachineInstr &Orig, const TargetRegisterInfo &TRI) const override
bool analyzeBranch(MachineBasicBlock &MBB, MachineBasicBlock *&TBB, MachineBasicBlock *&FBB, SmallVectorImpl< MachineOperand > &Cond, bool AllowModify) const override
bool canInsertSelect(const MachineBasicBlock &, ArrayRef< MachineOperand > Cond, Register, Register, Register, int &, int &, int &) const override
void insertSelect(MachineBasicBlock &MBB, MachineBasicBlock::iterator MI, const DebugLoc &DL, Register DstReg, ArrayRef< MachineOperand > Cond, Register TrueReg, Register FalseReg) const override
unsigned getOpcodeAfterMemoryUnfold(unsigned Opc, bool UnfoldLoad, bool UnfoldStore, unsigned *LoadRegIndex=nullptr) const override
bool findCommutedOpIndices(const MachineInstr &MI, unsigned &SrcOpIdx1, unsigned &SrcOpIdx2) const override
Returns true iff the routine could find two commutable operands in the given machine instruction.
bool areLoadsFromSameBasePtr(SDNode *Load1, SDNode *Load2, int64_t &Offset1, int64_t &Offset2) const override
X86InstrInfo(const X86Subtarget &STI)
static bool isDataInvariantLoad(MachineInstr &MI)
Returns true if the instruction has no behavior (specified or otherwise) that is based on the value l...
MachineInstr * commuteInstructionImpl(MachineInstr &MI, bool NewMI, unsigned CommuteOpIdx1, unsigned CommuteOpIdx2) const override
bool isFunctionSafeToOutlineFrom(MachineFunction &MF, bool OutlineFromLinkOnceODRs) const override
const X86RegisterInfo & getRegisterInfo() const
getRegisterInfo - TargetInstrInfo is a superset of MRegister info.
bool isReallyTriviallyReMaterializable(const MachineInstr &MI) const override
bool hasCommutePreference(MachineInstr &MI, bool &Commute) const override
Returns true if we have preference on the operands order in MI, the commute decision is returned in C...
bool hasLiveCondCodeDef(MachineInstr &MI) const
True if MI has a condition code def, e.g.
std::optional< ParamLoadedValue > describeLoadedValue(const MachineInstr &MI, Register Reg) const override
bool canMakeTailCallConditional(SmallVectorImpl< MachineOperand > &Cond, const MachineInstr &TailCall) const override
bool getMemOperandsWithOffsetWidth(const MachineInstr &LdSt, SmallVectorImpl< const MachineOperand * > &BaseOps, int64_t &Offset, bool &OffsetIsScalable, LocationSize &Width, const TargetRegisterInfo *TRI) const override
bool unfoldMemoryOperand(MachineFunction &MF, MachineInstr &MI, Register Reg, bool UnfoldLoad, bool UnfoldStore, SmallVectorImpl< MachineInstr * > &NewMIs) const override
std::optional< DestSourcePair > isCopyInstrImpl(const MachineInstr &MI) const override
MachineInstr * convertToThreeAddress(MachineInstr &MI, LiveVariables *LV, LiveIntervals *LIS) const override
convertToThreeAddress - This method must be implemented by targets that set the M_CONVERTIBLE_TO_3_AD...
std::pair< unsigned, unsigned > decomposeMachineOperandsTargetFlags(unsigned TF) const override
bool expandPostRAPseudo(MachineInstr &MI) const override
bool isAssociativeAndCommutative(const MachineInstr &Inst, bool Invert) const override
MCInst getNop() const override
Return the noop instruction to use for a noop.
outliner::InstrType getOutliningTypeImpl(const MachineModuleInfo &MMI, MachineBasicBlock::iterator &MIT, unsigned Flags) const override
bool shouldScheduleLoadsNear(SDNode *Load1, SDNode *Load2, int64_t Offset1, int64_t Offset2, unsigned NumLoads) const override
This is used by the pre-regalloc scheduler to determine (in conjunction with areLoadsFromSameBasePt...
MachineInstr * foldMemoryOperandImpl(MachineFunction &MF, MachineInstr &MI, ArrayRef< unsigned > Ops, MachineBasicBlock::iterator InsertPt, int FrameIndex, LiveIntervals *LIS=nullptr, VirtRegMap *VRM=nullptr) const override
Fold a load or store of the specified stack slot into the specified machine instruction for the speci...
bool analyzeCompare(const MachineInstr &MI, Register &SrcReg, Register &SrcReg2, int64_t &CmpMask, int64_t &CmpValue) const override
bool getConstValDefinedInReg(const MachineInstr &MI, const Register Reg, int64_t &ImmVal) const override
std::optional< ExtAddrMode > getAddrModeFromMemoryOp(const MachineInstr &MemI, const TargetRegisterInfo *TRI) const override
Register isStoreToStackSlotPostFE(const MachineInstr &MI, int &FrameIndex) const override
isStoreToStackSlotPostFE - Check for post-frame ptr elimination stack locations as well.
bool isUnconditionalTailCall(const MachineInstr &MI) const override
bool reverseBranchCondition(SmallVectorImpl< MachineOperand > &Cond) const override
std::optional< std::unique_ptr< outliner::OutlinedFunction > > getOutliningCandidateInfo(const MachineModuleInfo &MMI, std::vector< outliner::Candidate > &RepeatedSequenceLocs, unsigned MinRepeats) const override
bool classifyLEAReg(MachineInstr &MI, const MachineOperand &Src, unsigned LEAOpcode, bool AllowSP, Register &NewSrc, unsigned &NewSrcSubReg, bool &isKill, MachineOperand &ImplicitOp, LiveVariables *LV, LiveIntervals *LIS) const
Given an operand within a MachineInstr, insert preceding code to put it into the right format for a p...
Register isLoadFromStackSlotPostFE(const MachineInstr &MI, int &FrameIndex) const override
isLoadFromStackSlotPostFE - Check for post-frame ptr elimination stack locations as well.
void setExecutionDomain(MachineInstr &MI, unsigned Domain) const override
void storeRegToStackSlot(MachineBasicBlock &MBB, MachineBasicBlock::iterator MI, Register SrcReg, bool isKill, int FrameIndex, const TargetRegisterClass *RC, const TargetRegisterInfo *TRI, Register VReg, MachineInstr::MIFlag Flags=MachineInstr::NoFlags) const override
unsigned insertBranch(MachineBasicBlock &MBB, MachineBasicBlock *TBB, MachineBasicBlock *FBB, ArrayRef< MachineOperand > Cond, const DebugLoc &DL, int *BytesAdded=nullptr) const override
ArrayRef< std::pair< unsigned, const char * > > getSerializableDirectMachineOperandTargetFlags() const override
Register isStoreToStackSlot(const MachineInstr &MI, int &FrameIndex) const override
bool setExecutionDomainCustom(MachineInstr &MI, unsigned Domain) const
int getSPAdjust(const MachineInstr &MI) const override
getSPAdjust - This returns the stack pointer adjustment made by this instruction.
bool verifyInstruction(const MachineInstr &MI, StringRef &ErrInfo) const override
Register getGlobalBaseReg(MachineFunction *MF) const
getGlobalBaseReg - Return a virtual register initialized with the global base register value.
int getJumpTableIndex(const MachineInstr &MI) const override
void insertNoop(MachineBasicBlock &MBB, MachineBasicBlock::iterator MI) const override
void setSpecialOperandAttr(MachineInstr &OldMI1, MachineInstr &OldMI2, MachineInstr &NewMI1, MachineInstr &NewMI2) const override
This is an architecture-specific helper function of reassociateOps.
std::pair< uint16_t, uint16_t > getExecutionDomain(const MachineInstr &MI) const override
bool isCoalescableExtInstr(const MachineInstr &MI, Register &SrcReg, Register &DstReg, unsigned &SubIdx) const override
isCoalescableExtInstr - Return true if the instruction is a "coalescable" extension instruction.
void loadStoreTileReg(MachineBasicBlock &MBB, MachineBasicBlock::iterator MI, unsigned Opc, Register Reg, int FrameIdx, bool isKill=false) const
void genAlternativeCodeSequence(MachineInstr &Root, unsigned Pattern, SmallVectorImpl< MachineInstr * > &InsInstrs, SmallVectorImpl< MachineInstr * > &DelInstrs, DenseMap< Register, unsigned > &InstrIdxForVirtReg) const override
When getMachineCombinerPatterns() finds potential patterns, this function generates the instructions ...
bool hasReassociableOperands(const MachineInstr &Inst, const MachineBasicBlock *MBB) const override
bool analyzeBranchPredicate(MachineBasicBlock &MBB, TargetInstrInfo::MachineBranchPredicate &MBP, bool AllowModify=false) const override
static bool isDataInvariant(MachineInstr &MI)
Returns true if the instruction has no behavior (specified or otherwise) that is based on the value o...
unsigned getUndefRegClearance(const MachineInstr &MI, unsigned OpNum, const TargetRegisterInfo *TRI) const override
Inform the BreakFalseDeps pass how many idle instructions we would like before certain undef register...
void breakPartialRegDependency(MachineInstr &MI, unsigned OpNum, const TargetRegisterInfo *TRI) const override
void buildClearRegister(Register Reg, MachineBasicBlock &MBB, MachineBasicBlock::iterator Iter, DebugLoc &DL, bool AllowSideEffects=true) const override
Register isLoadFromStackSlot(const MachineInstr &MI, int &FrameIndex) const override
int64_t getFrameAdjustment(const MachineInstr &I) const
Returns the stack pointer adjustment that happens inside the frame setup..destroy sequence (e....
bool hasHighOperandLatency(const TargetSchedModel &SchedModel, const MachineRegisterInfo *MRI, const MachineInstr &DefMI, unsigned DefIdx, const MachineInstr &UseMI, unsigned UseIdx) const override
bool isSafeToMoveRegClassDefs(const TargetRegisterClass *RC) const override
uint16_t getExecutionDomainCustom(const MachineInstr &MI) const
bool isHighLatencyDef(int opc) const override
void buildOutlinedFrame(MachineBasicBlock &MBB, MachineFunction &MF, const outliner::OutlinedFunction &OF) const override
bool foldImmediate(MachineInstr &UseMI, MachineInstr &DefMI, Register Reg, MachineRegisterInfo *MRI) const override
foldImmediate - 'Reg' is known to be defined by a move immediate instruction, try to fold the immedia...
unsigned removeBranch(MachineBasicBlock &MBB, int *BytesRemoved=nullptr) const override
unsigned getFMA3OpcodeToCommuteOperands(const MachineInstr &MI, unsigned SrcOpIdx1, unsigned SrcOpIdx2, const X86InstrFMA3Group &FMA3Group) const
Returns an adjusted FMA opcode that must be used in an FMA instruction that performs the same computatio...
bool preservesZeroValueInReg(const MachineInstr *MI, const Register NullValueReg, const TargetRegisterInfo *TRI) const override
unsigned getPartialRegUpdateClearance(const MachineInstr &MI, unsigned OpNum, const TargetRegisterInfo *TRI) const override
Inform the BreakFalseDeps pass how many idle instructions we would like before a partial register upd...
X86MachineFunctionInfo - This class is derived from MachineFunction and contains private X86 target-s...
Register getGlobalBaseReg() const
int getTCReturnAddrDelta() const
void setGlobalBaseReg(Register Reg)
unsigned getNumLocalDynamicTLSAccesses() const
bool getUsesRedZone() const
const TargetRegisterClass * constrainRegClassToNonRex2(const TargetRegisterClass *RC) const
bool isPICStyleGOT() const
const X86InstrInfo * getInstrInfo() const override
const X86RegisterInfo * getRegisterInfo() const override
const X86FrameLowering * getFrameLowering() const override
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
constexpr char Align[]
Key for Kernel::Arg::Metadata::mAlign.
unsigned ID
LLVM IR allows arbitrary numbers to be used as calling convention identifiers.
@ C
The default llvm calling convention, compatible with C.
CondCode
ISD::CondCode enum - These are ordered carefully to make the bitfields below work out,...
@ Implicit
Not emitted register (e.g. carry, or temporary result).
@ Define
Register definition.
@ Kill
The last use of a register.
@ Undef
Value of the register doesn't matter.
@ X86
Windows x64, Windows Itanium (IA-64)
X86II - This namespace holds all of the target specific flags that instruction info tracks.
bool isKMergeMasked(uint64_t TSFlags)
bool hasNewDataDest(uint64_t TSFlags)
@ MO_GOT_ABSOLUTE_ADDRESS
MO_GOT_ABSOLUTE_ADDRESS - On a symbol operand, this represents a relocation of: SYMBOL_LABEL + [.
@ MO_INDNTPOFF
MO_INDNTPOFF - On a symbol operand this indicates that the immediate is the absolute address of the G...
@ MO_GOTNTPOFF
MO_GOTNTPOFF - On a symbol operand this indicates that the immediate is the offset of the GOT entry w...
@ MO_GOTTPOFF
MO_GOTTPOFF - On a symbol operand this indicates that the immediate is the offset of the GOT entry wi...
@ MO_PIC_BASE_OFFSET
MO_PIC_BASE_OFFSET - On a symbol operand this indicates that the immediate should get the value of th...
@ MO_GOTPCREL
MO_GOTPCREL - On a symbol operand this indicates that the immediate is offset to the GOT entry for th...
@ EVEX
EVEX - Specifies that this instruction uses the EVEX form, which provides syntax support up to 32 512-bit r...
@ SSEDomainShift
Execution domain for SSE instructions.
bool canUseApxExtendedReg(const MCInstrDesc &Desc)
bool isPseudo(uint64_t TSFlags)
bool isKMasked(uint64_t TSFlags)
int getMemoryOperandNo(uint64_t TSFlags)
unsigned getOperandBias(const MCInstrDesc &Desc)
Compute whether all of the def operands are repeated in the uses and therefore should be skipped.
Define some predicates that are used for node matching.
CondCode getCondFromBranch(const MachineInstr &MI)
CondCode getCondFromCFCMov(const MachineInstr &MI)
CondCode getCondFromMI(const MachineInstr &MI)
Return the condition code of the instruction.
int getFirstAddrOperandIdx(const MachineInstr &MI)
Return the index of the instruction's first address operand, if it has a memory reference,...
unsigned getSwappedVCMPImm(unsigned Imm)
Get the VCMP immediate if the opcodes are swapped.
CondCode GetOppositeBranchCondition(CondCode CC)
GetOppositeBranchCondition - Return the inverse of the specified cond, e.g.
unsigned getSwappedVPCOMImm(unsigned Imm)
Get the VPCOM immediate if the opcodes are swapped.
bool isX87Instruction(MachineInstr &MI)
Check if the instruction is an X87 instruction.
unsigned getNonNDVariant(unsigned Opc)
unsigned getVPCMPImmForCond(ISD::CondCode CC)
Get the VPCMP immediate for the given condition.
std::pair< CondCode, bool > getX86ConditionCode(CmpInst::Predicate Predicate)
Return a pair of condition code for the given predicate and whether the instruction operands should b...
CondCode getCondFromSETCC(const MachineInstr &MI)
unsigned getSwappedVPCMPImm(unsigned Imm)
Get the VPCMP immediate if the opcodes are swapped.
CondCode getCondFromCCMP(const MachineInstr &MI)
int getCCMPCondFlagsFromCondCode(CondCode CC)
int getCondSrcNoFromDesc(const MCInstrDesc &MCID)
Return the source operand # for condition code by MCID.
const Constant * getConstantFromPool(const MachineInstr &MI, unsigned OpNo)
Find any constant pool entry associated with a specific instruction operand.
unsigned getCMovOpcode(unsigned RegBytes, bool HasMemoryOperand=false, bool HasNDD=false)
Return a cmov opcode for the given register size in bytes, and operand type.
unsigned getNFVariant(unsigned Opc)
unsigned getVectorRegisterWidth(const MCOperandInfo &Info)
Get the width of the vector register operand.
CondCode getCondFromCMov(const MachineInstr &MI)
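A short sketch of how these X86 condition-code helpers compose; the predicate is an arbitrary example and the variables are local to the sketch:
// Map an IR predicate to an X86 condition code, invert it, and pick a CMOV
// opcode for a 32-bit register operand (no memory operand, no NDD).
auto [CC, NeedSwap] = X86::getX86ConditionCode(CmpInst::ICMP_SLT);
X86::CondCode Inverse = X86::GetOppositeBranchCondition(CC);
unsigned CMovOpc = X86::getCMovOpcode(/*RegBytes=*/4);
(void)NeedSwap; (void)Inverse; (void)CMovOpc;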
initializer< Ty > init(const Ty &Val)
InstrType
Represents how an instruction should be mapped by the outliner.
NodeAddr< NodeBase * > Node
This is an optimization pass for GlobalISel generic memory operations.
auto drop_begin(T &&RangeOrContainer, size_t N=1)
Return a range covering RangeOrContainer with the first N elements excluded.
bool all_of(R &&range, UnaryPredicate P)
Provide wrappers to std::all_of which take ranges instead of having to pass begin/end explicitly.
int popcount(T Value) noexcept
Count the number of set bits in a value.
static bool isAddMemInstrWithRelocation(const MachineInstr &MI)
MachineInstrBuilder BuildMI(MachineFunction &MF, const MIMetadata &MIMD, const MCInstrDesc &MCID)
Builder interface. Specify how to create the initial instruction itself.
constexpr bool isInt(int64_t x)
Checks if an integer fits into the given bit width.
LLVM_ABI bool isNullConstant(SDValue V)
Returns true if V is a constant integer zero.
static bool isMem(const MachineInstr &MI, unsigned Op)
decltype(auto) dyn_cast(const From &Val)
dyn_cast<X> - Return the argument parameter cast to the specified type.
bool isAligned(Align Lhs, uint64_t SizeInBytes)
Checks that SizeInBytes is a multiple of the alignment.
MCRegister getX86SubSuperRegister(MCRegister Reg, unsigned Size, bool High=false)
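A small usage sketch for getX86SubSuperRegister; Size is in bits, and the expected results are noted in comments:
MCRegister Wide = getX86SubSuperRegister(X86::AX, 32);                   // X86::EAX
MCRegister HighByte = getX86SubSuperRegister(X86::AX, 8, /*High=*/true); // X86::AH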
iterator_range< T > make_range(T x, T y)
Convenience function for iterating over sub-ranges.
FunctionPass * createX86GlobalBaseRegPass()
This pass initializes a global base register for PIC on x86-32.
void append_range(Container &C, Range &&R)
Wrapper function to append range R to container C.
static const MachineInstrBuilder & addRegReg(const MachineInstrBuilder &MIB, Register Reg1, bool isKill1, unsigned SubReg1, Register Reg2, bool isKill2, unsigned SubReg2)
addRegReg - This function is used to add a memory reference of the form: [Reg + Reg].
unsigned getDeadRegState(bool B)
static const MachineInstrBuilder & addFrameReference(const MachineInstrBuilder &MIB, int FI, int Offset=0, bool mem=true)
addFrameReference - This function is used to add a reference to the base of an abstract object on the...
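A hedged sketch of the usual pairing of addFrameReference with BuildMI when loading from a stack slot; MBB, MI, DL, TII, DestReg and FrameIndex are assumed from the surrounding pass, and the opcode is a placeholder:
// Appends the five x86 memory operands addressing [FrameIndex + 0].
addFrameReference(BuildMI(MBB, MI, DL, TII->get(X86::MOV32rm), DestReg),
                  FrameIndex);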
FunctionPass * createCleanupLocalDynamicTLSPass()
This pass combines multiple accesses to local-dynamic TLS variables so that the TLS base address for ...
const X86FoldTableEntry * lookupBroadcastFoldTable(unsigned RegOp, unsigned OpNum)
int countr_zero(T Val)
Count the number of 0s from the least significant bit to the most significant, stopping at the first 1.
const X86InstrFMA3Group * getFMA3Group(unsigned Opcode, uint64_t TSFlags)
Returns a reference to a group of FMA3 opcodes to where the given Opcode is included.
auto reverse(ContainerTy &&C)
MachineInstr * getImm(const MachineOperand &MO, const MachineRegisterInfo *MRI)
decltype(auto) get(const PointerIntPair< PointerTy, IntBits, IntType, PtrTraits, Info > &Pair)
LLVM_ABI raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
bool none_of(R &&Range, UnaryPredicate P)
Provide wrappers to std::none_of which take ranges instead of having to pass begin/end explicitly.
LLVM_ABI void report_fatal_error(Error Err, bool gen_crash_diag=true)
const X86FoldTableEntry * lookupTwoAddrFoldTable(unsigned RegOp)
bool is_sorted(R &&Range, Compare C)
Wrapper function around std::is_sorted to check if elements in a range R are sorted with respect to a...
constexpr bool isUInt(uint64_t x)
Checks if an unsigned integer fits into the given bit width.
DomTreeNodeBase< MachineBasicBlock > MachineDomTreeNode
static bool isMemInstrWithGOTPCREL(const MachineInstr &MI)
static const MachineInstrBuilder & addOffset(const MachineInstrBuilder &MIB, int Offset)
unsigned getUndefRegState(bool B)
unsigned getRegState(const MachineOperand &RegOp)
Get all register state flags from machine operand RegOp.
unsigned getDefRegState(bool B)
auto lower_bound(R &&Range, T &&Value)
Provide wrappers to std::lower_bound which take ranges instead of having to pass begin/end explicitly...
@ Sub
Subtraction of integers.
unsigned getKillRegState(bool B)
uint64_t alignTo(uint64_t Size, Align A)
Returns a multiple of A needed to store Size bytes.
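A one-line worked example of alignTo, shown only to pin down the rounding direction:
uint64_t Padded = alignTo(10, Align(8)); // Padded == 16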
DWARFExpression::Operation Op
ArrayRef(const T &OneElt) -> ArrayRef< T >
const X86FoldTableEntry * lookupUnfoldTable(unsigned MemOp)
constexpr unsigned BitWidth
decltype(auto) cast(const From &Val)
cast<X> - Return the argument parameter cast to the specified type.
bool matchBroadcastSize(const X86FoldTableEntry &Entry, unsigned BroadcastBits)
std::pair< MachineOperand, DIExpression * > ParamLoadedValue
auto seq(T Begin, T End)
Iterate over an integral type from Begin up to - but not including - End.
const X86FoldTableEntry * lookupFoldTable(unsigned RegOp, unsigned OpNum)
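A sketch of a fold-table query, assuming RegOp and OpNum come from the caller; only the null check is shown, since the entry's field layout is not restated here:
if (const X86FoldTableEntry *Entry = lookupFoldTable(RegOp, OpNum)) {
  // An entry exists: the register form has a corresponding memory form.
  (void)Entry;
}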
static const MachineInstrBuilder & addRegOffset(const MachineInstrBuilder &MIB, Register Reg, bool isKill, int Offset)
addRegOffset - This function is used to add a memory reference of the form [Reg + Offset],...
void swap(llvm::BitVector &LHS, llvm::BitVector &RHS)
Implement std::swap in terms of BitVector swap.
This struct is a compact representation of a valid (non-zero power of two) alignment.
MVT getSimpleVT() const
Return the SimpleValueType held in the specified simple EVT.
Used to describe addressing mode similar to ExtAddrMode in CodeGenPrepare.
This represents a simple continuous liveness interval for a value.
std::vector< MachineInstr * > Kills
Kills - List of MachineInstructions which are the last use of this virtual register (kill it) in the...
static LLVM_ABI MachinePointerInfo getGOT(MachineFunction &MF)
Return a MachinePointerInfo record that refers to a GOT entry.
X86AddressMode - This struct holds a generalized full x86 address mode.
enum llvm::X86AddressMode::(anonymous enum) BaseType
This class is used to group {132, 213, 231} forms of FMA opcodes together.
unsigned get213Opcode() const
Returns the 213 form of FMA opcode.
unsigned get231Opcode() const
Returns the 231 form of FMA opcode.
bool isIntrinsic() const
Returns true iff the group of FMA opcodes holds intrinsic opcodes.
unsigned get132Opcode() const
Returns the 132 form of FMA opcode.
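A hedged sketch of selecting among the three FMA forms; Opc and TSFlags are assumed to describe the instruction being rewritten:
if (const X86InstrFMA3Group *Group = getFMA3Group(Opc, TSFlags)) {
  unsigned NewOpc = Group->get231Opcode(); // e.g. after commuting operands
  (void)NewOpc;
}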
An individual sequence of instructions to be replaced with a call to an outlined function.
The information necessary to create an outlined function for some class of candidate.