507 : ST(&_ST), MRI(&_MRI) {
509 addRulesForGOpcs({G_ADD, G_SUB},
Standard)
519 addRulesForGOpcs({G_UADDO, G_USUBO},
Standard)
523 addRulesForGOpcs({G_UADDE, G_USUBE, G_SADDE, G_SSUBE},
Standard)
527 addRulesForGOpcs({G_UADDSAT, G_SADDSAT, G_USUBSAT, G_SSUBSAT},
Standard)
535 bool HasVecMulU64 = ST->hasVectorMulU64();
547 bool hasMulHi = ST->hasScalarMulHiInsts();
548 addRulesForGOpcs({G_UMULH, G_SMULH},
Standard)
553 addRulesForGOpcs({G_AMDGPU_MAD_U64_U32},
Standard)
557 bool HasScalarSMulU64 = ST->hasScalarSMulU64();
558 addRulesForGOpcs({G_AMDGPU_S_MUL_U64_U32, G_AMDGPU_S_MUL_I64_I32},
Standard)
562 addRulesForGOpcs({G_XOR, G_OR, G_AND},
StandardB)
582 addRulesForGOpcs({G_LSHR},
Standard)
592 addRulesForGOpcs({G_ASHR},
Standard)
602 addRulesForGOpcs({G_FSHR},
Standard)
608 addRulesForGOpcs({G_UBFX, G_SBFX},
Standard)
614 addRulesForGOpcs({G_SMIN, G_SMAX},
Standard)
622 addRulesForGOpcs({G_UMIN, G_UMAX},
Standard)
633 addRulesForGOpcs({G_CONSTANT})
636 addRulesForGOpcs({G_FREEZE})
643 addRulesForGOpcs({G_UNMERGE_VALUES})
652 addRulesForGOpcs({G_AMDGPU_INTRIN_IMAGE_LOAD, G_AMDGPU_INTRIN_IMAGE_LOAD_D16,
653 G_AMDGPU_INTRIN_IMAGE_LOAD_NORET,
654 G_AMDGPU_INTRIN_IMAGE_STORE,
655 G_AMDGPU_INTRIN_IMAGE_STORE_D16})
670 bool HasScalarCompareEq64 = ST->hasScalarCompareEq64();
672 addRulesForGOpcs({G_ICMP})
691 addRulesForGOpcs({G_BRCOND})
695 addRulesForGOpcs({G_BR}).
Any({{
_}, {{}, {
None}}});
705 addRulesForGOpcs({G_ANYEXT})
717 bool Has16bitCmp = ST->has16BitInsts();
721 addRulesForGOpcs({G_TRUNC})
738 addRulesForGOpcs({G_ZEXT})
753 addRulesForGOpcs({G_SEXT})
768 addRulesForGOpcs({G_SEXT_INREG})
774 addRulesForGOpcs({G_ASSERT_ZEXT, G_ASSERT_SEXT},
Standard)
780 addRulesForGOpcs({G_ASSERT_ALIGN},
Standard)
792 addRulesForGOpcs({G_ATOMICRMW_ADD, G_ATOMICRMW_SUB, G_ATOMICRMW_XCHG,
793 G_ATOMICRMW_AND, G_ATOMICRMW_OR, G_ATOMICRMW_XOR,
794 G_ATOMICRMW_MIN, G_ATOMICRMW_MAX, G_ATOMICRMW_UMIN,
795 G_ATOMICRMW_UMAX, G_ATOMICRMW_UINC_WRAP,
796 G_ATOMICRMW_UDEC_WRAP})
804 bool HasAtomicFlatPkAdd16Insts = ST->hasAtomicFlatPkAdd16Insts();
805 bool HasAtomicBufferGlobalPkAddF16Insts =
806 ST->hasAtomicBufferGlobalPkAddF16NoRtnInsts() ||
807 ST->hasAtomicBufferGlobalPkAddF16Insts();
808 bool HasAtomicDsPkAdd16Insts = ST->hasAtomicDsPkAdd16Insts();
809 addRulesForGOpcs({G_ATOMICRMW_FADD})
817 HasAtomicFlatPkAdd16Insts)
819 HasAtomicBufferGlobalPkAddF16Insts)
821 HasAtomicDsPkAdd16Insts);
823 addRulesForGOpcs({G_ATOMIC_CMPXCHG})
829 addRulesForGOpcs({G_AMDGPU_ATOMIC_CMPXCHG})
835 addRulesForGOpcs({G_AMDGPU_BUFFER_ATOMIC_CMPSWAP},
Standard)
841 addRulesForGOpcs({G_AMDGPU_BUFFER_ATOMIC_SWAP, G_AMDGPU_BUFFER_ATOMIC_UMAX,
842 G_AMDGPU_BUFFER_ATOMIC_UMIN, G_AMDGPU_BUFFER_ATOMIC_SMAX,
843 G_AMDGPU_BUFFER_ATOMIC_SMIN},
848 bool hasSMRDx3 = ST->hasScalarDwordx3Loads();
849 bool hasSMRDSmall = ST->hasScalarSubwordLoads();
850 bool usesTrue16 = ST->useRealTrue16Insts();
853 return (*
MI.memoperands_begin())->getAlign() >=
Align(16);
857 return (*
MI.memoperands_begin())->getAlign() >=
Align(4);
861 return (*
MI.memoperands_begin())->isAtomic();
877 return (*
MI.memoperands_begin())->isVolatile();
881 return (*
MI.memoperands_begin())->isInvariant();
896 return MemSize == 16 || MemSize == 8;
904 auto isUL = !isAtomicMMO && isUniMMO && (isConst || !isVolatileMMO) &&
905 (isConst || isInvMMO || isNoClobberMMO);
909 addRulesForGOpcs({G_LOAD})
1016 addRulesForGOpcs({G_ZEXTLOAD, G_SEXTLOAD})
1036 addRulesForGOpcs({G_STORE})
1072 addRulesForGOpcs({G_AMDGPU_BUFFER_LOAD, G_AMDGPU_BUFFER_LOAD_FORMAT,
1073 G_AMDGPU_TBUFFER_LOAD_FORMAT},
1084 addRulesForGOpcs({G_AMDGPU_BUFFER_LOAD_USHORT, G_AMDGPU_BUFFER_LOAD_UBYTE,
1085 G_AMDGPU_BUFFER_LOAD_SSHORT, G_AMDGPU_BUFFER_LOAD_SBYTE},
1091 {G_AMDGPU_BUFFER_LOAD_UBYTE_TFE, G_AMDGPU_BUFFER_LOAD_USHORT_TFE},
1096 addRulesForGOpcs({G_AMDGPU_BUFFER_LOAD_TFE, G_AMDGPU_BUFFER_LOAD_FORMAT_TFE},
1109 {G_AMDGPU_BUFFER_LOAD_FORMAT_D16, G_AMDGPU_TBUFFER_LOAD_FORMAT_D16},
1118 addRulesForGOpcs({G_AMDGPU_BUFFER_STORE, G_AMDGPU_BUFFER_STORE_BYTE,
1119 G_AMDGPU_BUFFER_STORE_SHORT, G_AMDGPU_BUFFER_STORE_FORMAT,
1120 G_AMDGPU_BUFFER_STORE_FORMAT_D16,
1121 G_AMDGPU_TBUFFER_STORE_FORMAT,
1122 G_AMDGPU_TBUFFER_STORE_FORMAT_D16})
1134 addRulesForGOpcs({G_AMDGPU_BUFFER_ATOMIC_FADD})
1143 addRulesForGOpcs({G_PTR_ADD})
1149 addRulesForGOpcs({G_INTTOPTR})
1157 addRulesForGOpcs({G_PTRTOINT})
1167 addRulesForGOpcs({G_PTRMASK})
1175 addRulesForGOpcs({G_BITREVERSE},
Standard)
1181 addRulesForGOpcs({G_FENCE}).
Any({{{}}, {{}, {}}});
1183 addRulesForGOpcs({G_READSTEADYCOUNTER, G_READCYCLECOUNTER},
Standard)
1188 addRulesForGOpcs({G_GLOBAL_VALUE})
1195 addRulesForGOpcs({G_AMDGPU_WAVE_ADDRESS}).
Any({{
UniP5}, {{
SgprP5}, {}}});
1197 addRulesForGOpcs({G_SI_CALL})
1203 bool hasSALUFloat = ST->hasSALUFloatInsts();
1205 addRulesForGOpcs({G_FADD, G_FMUL, G_STRICT_FADD, G_STRICT_FMUL},
Standard)
1219 addRulesForGOpcs({G_FSUB, G_STRICT_FSUB},
Standard)
1227 addRulesForGOpcs({G_FMAD},
Standard)
1233 addRulesForGOpcs({G_FLDEXP, G_STRICT_FLDEXP},
Standard)
1241 addRulesForGOpcs({G_FMA, G_STRICT_FMA},
Standard)
1259 addRulesForGOpcs({G_AMDGPU_FMED3},
Standard)
1268 addRulesForGOpcs({G_AMDGPU_SMED3},
Standard)
1276 addRulesForGOpcs({G_FNEG, G_FABS},
Standard)
1291 addRulesForGOpcs({G_FCANONICALIZE},
Standard)
1303 bool hasPST = ST->hasPseudoScalarTrans();
1304 addRulesForGOpcs({G_FSQRT},
Standard)
1309 addRulesForGOpcs({G_FPTOUI, G_FPTOSI})
1321 addRulesForGOpcs({G_UITOFP, G_SITOFP})
1333 addRulesForGOpcs({G_FPEXT})
1340 addRulesForGOpcs({G_AMDGPU_CVT_PK_I16_I32},
Standard)
1344 addRulesForGOpcs({G_AMDGPU_FMIN_LEGACY, G_AMDGPU_FMAX_LEGACY},
Standard)
1348 addRulesForGOpcs({G_FMINIMUM, G_FMAXIMUM},
Standard)
1358 addRulesForGOpcs({G_FMINNUM_IEEE, G_FMAXNUM_IEEE, G_FMINNUM, G_FMAXNUM},
1371 addRulesForGOpcs({G_FPTRUNC})
1380 addRulesForGOpcs({G_IS_FPCLASS})
1388 addRulesForGOpcs({G_FCMP},
Standard)
1402 addRulesForGOpcs({G_INTRINSIC_TRUNC, G_INTRINSIC_ROUNDEVEN, G_FFLOOR, G_FCEIL,
1419 addRulesForIOpcs({amdgcn_end_cf})
1423 addRulesForIOpcs({amdgcn_if_break},
Standard)
1427 addRulesForIOpcs({amdgcn_mbcnt_lo, amdgcn_mbcnt_hi},
Standard)
1430 addRulesForIOpcs({amdgcn_readfirstlane})
1436 addRulesForIOpcs({amdgcn_s_sleep}).
Any({{
_,
_}, {{}, {
IntrId,
Imm}}});
1438 addRulesForIOpcs({amdgcn_bitop3},
Standard)
1444 addRulesForIOpcs({amdgcn_mul_u24, amdgcn_mul_i24},
Standard)
1450 addRulesForIOpcs({amdgcn_mulhi_u24, amdgcn_mulhi_i24, amdgcn_fmul_legacy},
1455 addRulesForIOpcs({amdgcn_fma_legacy},
Standard)
1459 addRulesForIOpcs({amdgcn_frexp_mant, amdgcn_fract},
Standard)
1467 addRulesForIOpcs({amdgcn_prng_b32})
1471 addRulesForIOpcs({amdgcn_sffbh},
Standard)
1475 addRulesForIOpcs({amdgcn_ubfe, amdgcn_sbfe},
Standard)
1481 addRulesForIOpcs({amdgcn_global_load_tr_b64})
1485 addRulesForIOpcs({amdgcn_global_load_tr_b128})
1489 addRulesForIOpcs({amdgcn_global_atomic_ordered_add_b64})
1492 addRulesForIOpcs({amdgcn_raw_buffer_load_lds})
1495 addRulesForIOpcs({amdgcn_struct_buffer_load_lds})
1499 addRulesForIOpcs({amdgcn_raw_ptr_buffer_load_lds})
1502 addRulesForIOpcs({amdgcn_struct_ptr_buffer_load_lds})
1505 addRulesForIOpcs({amdgcn_wwm, amdgcn_strict_wwm},
StandardB)