1//===-- SOPInstructions.td - SOP Instruction Definitions ------------------===// 2// 3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 4// See https://llvm.org/LICENSE.txt for license information. 5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 6// 7//===----------------------------------------------------------------------===// 8 9def GPRIdxMode : CustomOperand<i32>; 10 11class SOP_Pseudo<string opName, dag outs, dag ins, string asmOps, 12 list<dag> pattern=[]> : 13 InstSI<outs, ins, "", pattern>, 14 SIMCInstr<opName, SIEncodingFamily.NONE> { 15 16 let isPseudo = 1; 17 let isCodeGenOnly = 1; 18 let Size = 4; 19 20 string Mnemonic = opName; 21 string AsmOperands = asmOps; 22 23 bits<1> has_sdst = 0; 24} 25 26//===----------------------------------------------------------------------===// 27// SOP1 Instructions 28//===----------------------------------------------------------------------===// 29 30class SOP1_Pseudo <string opName, dag outs, dag ins, 31 string asmOps, list<dag> pattern=[]> : 32 SOP_Pseudo<opName, outs, ins, " " # asmOps, pattern> { 33 34 let mayLoad = 0; 35 let mayStore = 0; 36 let hasSideEffects = 0; 37 let SALU = 1; 38 let SOP1 = 1; 39 let SchedRW = [WriteSALU]; 40 let UseNamedOperandTable = 1; 41 42 bits<1> has_src0 = 1; 43 let has_sdst = 1; 44} 45 46class SOP1_Real<bits<8> op, SOP1_Pseudo ps, string real_name = ps.Mnemonic> : 47 InstSI <ps.OutOperandList, ps.InOperandList, 48 real_name # ps.AsmOperands>, 49 Enc32 { 50 51 let SALU = 1; 52 let SOP1 = 1; 53 let isPseudo = 0; 54 let isCodeGenOnly = 0; 55 let Size = 4; 56 57 // copy relevant pseudo op flags 58 let SubtargetPredicate = ps.SubtargetPredicate; 59 let AsmMatchConverter = ps.AsmMatchConverter; 60 let SchedRW = ps.SchedRW; 61 let mayLoad = ps.mayLoad; 62 let mayStore = ps.mayStore; 63 let isTerminator = ps.isTerminator; 64 let isReturn = ps.isReturn; 65 let isCall = ps.isCall; 66 let isBranch = ps.isBranch; 67 let isBarrier = ps.isBarrier; 68 let Uses = ps.Uses; 69 let Defs = ps.Defs; 70 let isConvergent = ps.isConvergent; 71 72 // encoding 73 bits<7> sdst; 74 bits<8> src0; 75 76 let Inst{7-0} = !if(ps.has_src0, src0, ?); 77 let Inst{15-8} = op; 78 let Inst{22-16} = !if(ps.has_sdst, sdst, ?); 79 let Inst{31-23} = 0x17d; //encoding; 80} 81 82class SOP1_32 <string opName, list<dag> pattern=[], bit tied_in = 0> : SOP1_Pseudo < 83 opName, (outs SReg_32:$sdst), 84 !if(tied_in, (ins SSrc_b32:$src0, SReg_32:$sdst_in), 85 (ins SSrc_b32:$src0)), 86 "$sdst, $src0", pattern> { 87 let Constraints = !if(tied_in, "$sdst = $sdst_in", ""); 88} 89 90// Only register input allowed. 91class SOP1_32R <string opName, list<dag> pattern=[]> : SOP1_Pseudo < 92 opName, (outs SReg_32:$sdst), (ins SReg_32:$src0), 93 "$sdst, $src0", pattern>; 94 95// 32-bit input, no output. 96class SOP1_0_32 <string opName, list<dag> pattern = []> : SOP1_Pseudo < 97 opName, (outs), (ins SSrc_b32:$src0), 98 "$src0", pattern> { 99 let has_sdst = 0; 100} 101 102// Special case for movreld where sdst is treated as a use operand. 103class SOP1_32_movreld <string opName, list<dag> pattern=[]> : SOP1_Pseudo < 104 opName, (outs), (ins SReg_32:$sdst, SSrc_b32:$src0), 105 "$sdst, $src0", pattern>; 106 107// Special case for movreld where sdst is treated as a use operand. 108class SOP1_64_movreld <string opName, list<dag> pattern=[]> : SOP1_Pseudo < 109 opName, (outs), (ins SReg_64:$sdst, SSrc_b64:$src0), 110 "$sdst, $src0", pattern 111>; 112 113class SOP1_0_32R <string opName, list<dag> pattern = []> : SOP1_Pseudo < 114 opName, (outs), (ins SReg_32:$src0), 115 "$src0", pattern> { 116 let has_sdst = 0; 117} 118 119class SOP1_64 <string opName, list<dag> pattern=[]> : SOP1_Pseudo < 120 opName, (outs SReg_64:$sdst), (ins SSrc_b64:$src0), 121 "$sdst, $src0", pattern 122>; 123 124// Only register input allowed. 125class SOP1_64R <string opName, list<dag> pattern=[]> : SOP1_Pseudo < 126 opName, (outs SReg_64:$sdst), (ins SReg_64:$src0), 127 "$sdst, $src0", pattern 128>; 129 130// 64-bit input, 32-bit output. 131class SOP1_32_64 <string opName, list<dag> pattern=[]> : SOP1_Pseudo < 132 opName, (outs SReg_32:$sdst), (ins SSrc_b64:$src0), 133 "$sdst, $src0", pattern 134>; 135 136// 32-bit input, 64-bit output. 137class SOP1_64_32 <string opName, list<dag> pattern=[], bit tied_in = 0> : SOP1_Pseudo < 138 opName, (outs SReg_64:$sdst), 139 !if(tied_in, (ins SSrc_b32:$src0, SReg_64:$sdst_in), 140 (ins SSrc_b32:$src0)), 141 "$sdst, $src0", pattern> { 142 let Constraints = !if(tied_in, "$sdst = $sdst_in", ""); 143} 144 145// no input, 64-bit output. 146class SOP1_64_0 <string opName, list<dag> pattern=[]> : SOP1_Pseudo < 147 opName, (outs SReg_64:$sdst), (ins), "$sdst", pattern> { 148 let has_src0 = 0; 149} 150 151// 64-bit input, no output 152class SOP1_1 <string opName, list<dag> pattern=[]> : SOP1_Pseudo < 153 opName, (outs), (ins SReg_64:$src0), "$src0", pattern> { 154 let has_sdst = 0; 155} 156 157 158class UniformUnaryFrag<SDPatternOperator Op> : PatFrag < 159 (ops node:$src0), 160 (Op $src0), 161 [{ return !N->isDivergent(); }]> { 162 // This check is unnecessary as it's captured by the result register 163 // bank constraint. 164 // 165 // FIXME: Should add a way for the emitter to recognize this is a 166 // trivially true predicate to eliminate the check. 167 let GISelPredicateCode = [{return true;}]; 168} 169 170class UniformBinFrag<SDPatternOperator Op> : PatFrag < 171 (ops node:$src0, node:$src1), 172 (Op $src0, $src1), 173 [{ return !N->isDivergent(); }]> { 174 // This check is unnecessary as it's captured by the result register 175 // bank constraint. 176 // 177 // FIXME: Should add a way for the emitter to recognize this is a 178 // trivially true predicate to eliminate the check. 179 let GISelPredicateCode = [{return true;}]; 180} 181 182class UniformTernaryFrag<SDPatternOperator Op> : PatFrag < 183 (ops node:$src0, node:$src1, node:$src2), 184 (Op $src0, $src1, $src2), 185 [{ return !N->isDivergent(); }]> { 186 // This check is unnecessary as it's captured by the result register 187 // bank constraint. 188 // 189 // FIXME: Should add a way for the emitter to recognize this is a 190 // trivially true predicate to eliminate the check. 191 let GISelPredicateCode = [{return true;}]; 192} 193 194class DivergentBinFrag<SDPatternOperator Op> : PatFrag < 195 (ops node:$src0, node:$src1), 196 (Op $src0, $src1), 197 [{ return N->isDivergent(); }]> { 198 // This check is unnecessary as it's captured by the result register 199 // bank constraint. 200 // 201 // FIXME: Should add a way for the emitter to recognize this is a 202 // trivially true predicate to eliminate the check. 203 let GISelPredicateCode = [{return true;}]; 204} 205 206 207let isMoveImm = 1 in { 208 let isReMaterializable = 1, isAsCheapAsAMove = 1 in { 209 def S_MOV_B32 : SOP1_32 <"s_mov_b32">; 210 def S_MOV_B64 : SOP1_64 <"s_mov_b64">; 211 } // End isReMaterializable = 1 212 213 let Uses = [SCC] in { 214 def S_CMOV_B32 : SOP1_32 <"s_cmov_b32">; 215 def S_CMOV_B64 : SOP1_64 <"s_cmov_b64">; 216 } // End Uses = [SCC] 217} // End isMoveImm = 1 218 219// Variant of S_MOV_B32 used for reading from volatile registers like 220// SRC_POPS_EXITING_WAVE_ID. 221let hasSideEffects = 1 in 222def S_MOV_B32_sideeffects : SOP1_32 <"s_mov_b32">; 223 224let Defs = [SCC] in { 225 def S_NOT_B32 : SOP1_32 <"s_not_b32", 226 [(set i32:$sdst, (UniformUnaryFrag<not> i32:$src0))] 227 >; 228 229 def S_NOT_B64 : SOP1_64 <"s_not_b64", 230 [(set i64:$sdst, (UniformUnaryFrag<not> i64:$src0))] 231 >; 232 def S_WQM_B32 : SOP1_32 <"s_wqm_b32", 233 [(set i32:$sdst, (int_amdgcn_s_wqm i32:$src0))]>; 234 def S_WQM_B64 : SOP1_64 <"s_wqm_b64", 235 [(set i64:$sdst, (int_amdgcn_s_wqm i64:$src0))]>; 236} // End Defs = [SCC] 237 238 239let WaveSizePredicate = isWave32 in { 240def : GCNPat < 241 (int_amdgcn_wqm_vote i1:$src0), 242 (S_WQM_B32 SSrc_b32:$src0) 243>; 244} 245 246let WaveSizePredicate = isWave64 in { 247def : GCNPat < 248 (int_amdgcn_wqm_vote i1:$src0), 249 (S_WQM_B64 SSrc_b64:$src0) 250>; 251} 252 253let isReMaterializable = 1, isAsCheapAsAMove = 1 in { 254def S_BREV_B32 : SOP1_32 <"s_brev_b32", 255 [(set i32:$sdst, (UniformUnaryFrag<bitreverse> i32:$src0))] 256>; 257def S_BREV_B64 : SOP1_64 <"s_brev_b64", 258 [(set i64:$sdst, (UniformUnaryFrag<bitreverse> i64:$src0))] 259>; 260} // End isReMaterializable = 1, isAsCheapAsAMove = 1 261 262let Defs = [SCC] in { 263def S_BCNT0_I32_B32 : SOP1_32 <"s_bcnt0_i32_b32">; 264def S_BCNT0_I32_B64 : SOP1_32_64 <"s_bcnt0_i32_b64">; 265def S_BCNT1_I32_B32 : SOP1_32 <"s_bcnt1_i32_b32", 266 [(set i32:$sdst, (UniformUnaryFrag<ctpop> i32:$src0))] 267>; 268def S_BCNT1_I32_B64 : SOP1_32_64 <"s_bcnt1_i32_b64", 269 [(set i32:$sdst, (UniformUnaryFrag<ctpop> i64:$src0))] 270>; 271} // End Defs = [SCC] 272 273let isReMaterializable = 1 in { 274def S_FF0_I32_B32 : SOP1_32 <"s_ff0_i32_b32">; 275def S_FF0_I32_B64 : SOP1_32_64 <"s_ff0_i32_b64">; 276def S_FF1_I32_B64 : SOP1_32_64 <"s_ff1_i32_b64", 277 [(set i32:$sdst, (UniformUnaryFrag<AMDGPUffbl_b32> i64:$src0))] 278>; 279 280def S_FF1_I32_B32 : SOP1_32 <"s_ff1_i32_b32", 281 [(set i32:$sdst, (UniformUnaryFrag<AMDGPUffbl_b32> i32:$src0))] 282>; 283 284def S_FLBIT_I32_B32 : SOP1_32 <"s_flbit_i32_b32", 285 [(set i32:$sdst, (UniformUnaryFrag<AMDGPUffbh_u32> i32:$src0))] 286>; 287 288def S_FLBIT_I32_B64 : SOP1_32_64 <"s_flbit_i32_b64", 289 [(set i32:$sdst, (UniformUnaryFrag<AMDGPUffbh_u32> i64:$src0))] 290>; 291def S_FLBIT_I32 : SOP1_32 <"s_flbit_i32", 292 [(set i32:$sdst, (UniformUnaryFrag<AMDGPUffbh_i32> i32:$src0))] 293>; 294def S_FLBIT_I32_I64 : SOP1_32_64 <"s_flbit_i32_i64">; 295def S_SEXT_I32_I8 : SOP1_32 <"s_sext_i32_i8", 296 [(set i32:$sdst, (UniformSextInreg<i8> i32:$src0))] 297>; 298def S_SEXT_I32_I16 : SOP1_32 <"s_sext_i32_i16", 299 [(set i32:$sdst, (UniformSextInreg<i16> i32:$src0))] 300>; 301} // End isReMaterializable = 1 302 303def S_BITSET0_B32 : SOP1_32 <"s_bitset0_b32", [], 1>; 304def S_BITSET0_B64 : SOP1_64_32 <"s_bitset0_b64", [], 1>; 305def S_BITSET1_B32 : SOP1_32 <"s_bitset1_b32", [], 1>; 306def S_BITSET1_B64 : SOP1_64_32 <"s_bitset1_b64", [], 1>; 307 308def S_GETPC_B64 : SOP1_64_0 <"s_getpc_b64">; 309// PSEUDO includes a workaround for a hardware anomaly where some ASICs 310// zero-extend the result from 48 bits instead of sign-extending. 311let isReMaterializable = 1 in 312def S_GETPC_B64_pseudo : SOP1_64_0 <"s_getpc_b64", 313 [(set i64:$sdst, (int_amdgcn_s_getpc))] 314>; 315 316let isTerminator = 1, isBarrier = 1, SchedRW = [WriteBranch] in { 317 318let isBranch = 1, isIndirectBranch = 1 in { 319def S_SETPC_B64 : SOP1_1 <"s_setpc_b64">; 320} // End isBranch = 1, isIndirectBranch = 1 321 322let isReturn = 1 in { 323// Define variant marked as return rather than branch. 324def S_SETPC_B64_return : SOP1_1<"">; 325} 326} // End isTerminator = 1, isBarrier = 1 327 328let isCall = 1 in { 329def S_SWAPPC_B64 : SOP1_64 <"s_swappc_b64" 330>; 331} 332 333def S_RFE_B64 : SOP1_1 <"s_rfe_b64">; 334 335let hasSideEffects = 1, Uses = [EXEC], Defs = [EXEC, SCC] in { 336 337def S_AND_SAVEEXEC_B64 : SOP1_64 <"s_and_saveexec_b64">; 338def S_OR_SAVEEXEC_B64 : SOP1_64 <"s_or_saveexec_b64">; 339def S_XOR_SAVEEXEC_B64 : SOP1_64 <"s_xor_saveexec_b64">; 340def S_ANDN2_SAVEEXEC_B64 : SOP1_64 <"s_andn2_saveexec_b64">; 341def S_ORN2_SAVEEXEC_B64 : SOP1_64 <"s_orn2_saveexec_b64">; 342def S_NAND_SAVEEXEC_B64 : SOP1_64 <"s_nand_saveexec_b64">; 343def S_NOR_SAVEEXEC_B64 : SOP1_64 <"s_nor_saveexec_b64">; 344def S_XNOR_SAVEEXEC_B64 : SOP1_64 <"s_xnor_saveexec_b64">; 345 346} // End hasSideEffects = 1, Uses = [EXEC], Defs = [EXEC, SCC] 347 348def S_QUADMASK_B32 : SOP1_32 <"s_quadmask_b32", 349 [(set i32:$sdst, (int_amdgcn_s_quadmask i32:$src0))]>; 350def S_QUADMASK_B64 : SOP1_64 <"s_quadmask_b64", 351 [(set i64:$sdst, (int_amdgcn_s_quadmask i64:$src0))]>; 352 353let Uses = [M0] in { 354def S_MOVRELS_B32 : SOP1_32R <"s_movrels_b32">; 355def S_MOVRELS_B64 : SOP1_64R <"s_movrels_b64">; 356def S_MOVRELD_B32 : SOP1_32_movreld <"s_movreld_b32">; 357def S_MOVRELD_B64 : SOP1_64_movreld <"s_movreld_b64">; 358} // End Uses = [M0] 359 360let SubtargetPredicate = isGFX6GFX7GFX8GFX9 in { 361def S_CBRANCH_JOIN : SOP1_0_32R <"s_cbranch_join">; 362} // End SubtargetPredicate = isGFX6GFX7GFX8GFX9 363 364let Defs = [SCC] in { 365def S_ABS_I32 : SOP1_32 <"s_abs_i32", 366 [(set i32:$sdst, (UniformUnaryFrag<abs> i32:$src0))] 367 >; 368} // End Defs = [SCC] 369 370let SubtargetPredicate = HasVGPRIndexMode in { 371def S_SET_GPR_IDX_IDX : SOP1_0_32<"s_set_gpr_idx_idx"> { 372 let Uses = [M0, MODE]; 373 let Defs = [M0, MODE]; 374} 375} 376 377let SubtargetPredicate = isGFX9Plus in { 378 let hasSideEffects = 1, Defs = [EXEC, SCC], Uses = [EXEC] in { 379 def S_ANDN1_SAVEEXEC_B64 : SOP1_64<"s_andn1_saveexec_b64">; 380 def S_ORN1_SAVEEXEC_B64 : SOP1_64<"s_orn1_saveexec_b64">; 381 def S_ANDN1_WREXEC_B64 : SOP1_64<"s_andn1_wrexec_b64">; 382 def S_ANDN2_WREXEC_B64 : SOP1_64<"s_andn2_wrexec_b64">; 383 } // End hasSideEffects = 1, Defs = [EXEC, SCC], Uses = [EXEC] 384 385 let isReMaterializable = 1 in 386 def S_BITREPLICATE_B64_B32 : SOP1_64_32<"s_bitreplicate_b64_b32", 387 [(set i64:$sdst, (int_amdgcn_s_bitreplicate i32:$src0))]>; 388} // End SubtargetPredicate = isGFX9Plus 389 390let SubtargetPredicate = isGFX10Plus in { 391 let hasSideEffects = 1, Defs = [EXEC, SCC], Uses = [EXEC] in { 392 def S_AND_SAVEEXEC_B32 : SOP1_32<"s_and_saveexec_b32">; 393 def S_OR_SAVEEXEC_B32 : SOP1_32<"s_or_saveexec_b32">; 394 def S_XOR_SAVEEXEC_B32 : SOP1_32<"s_xor_saveexec_b32">; 395 def S_ANDN2_SAVEEXEC_B32 : SOP1_32<"s_andn2_saveexec_b32">; 396 def S_ORN2_SAVEEXEC_B32 : SOP1_32<"s_orn2_saveexec_b32">; 397 def S_NAND_SAVEEXEC_B32 : SOP1_32<"s_nand_saveexec_b32">; 398 def S_NOR_SAVEEXEC_B32 : SOP1_32<"s_nor_saveexec_b32">; 399 def S_XNOR_SAVEEXEC_B32 : SOP1_32<"s_xnor_saveexec_b32">; 400 def S_ANDN1_SAVEEXEC_B32 : SOP1_32<"s_andn1_saveexec_b32">; 401 def S_ORN1_SAVEEXEC_B32 : SOP1_32<"s_orn1_saveexec_b32">; 402 def S_ANDN1_WREXEC_B32 : SOP1_32<"s_andn1_wrexec_b32">; 403 def S_ANDN2_WREXEC_B32 : SOP1_32<"s_andn2_wrexec_b32">; 404 } // End hasSideEffects = 1, Defs = [EXEC, SCC], Uses = [EXEC] 405 406 let Uses = [M0] in { 407 def S_MOVRELSD_2_B32 : SOP1_32<"s_movrelsd_2_b32">; 408 } // End Uses = [M0] 409} // End SubtargetPredicate = isGFX10Plus 410 411let SubtargetPredicate = isGFX11Plus in { 412 let hasSideEffects = 1 in { 413 // For s_sendmsg_rtn_* the src0 field encodes the message type directly; it 414 // is not an SGPR number. 415 def S_SENDMSG_RTN_B32 : SOP1_Pseudo< 416 "s_sendmsg_rtn_b32", (outs SReg_32:$sdst), (ins SendMsg:$src0), 417 "$sdst, $src0", [(set i32:$sdst, (int_amdgcn_s_sendmsg_rtn timm:$src0))] 418 >; 419 def S_SENDMSG_RTN_B64 : SOP1_Pseudo< 420 "s_sendmsg_rtn_b64", (outs SReg_64:$sdst), (ins SendMsg:$src0), 421 "$sdst, $src0", [(set i64:$sdst, (int_amdgcn_s_sendmsg_rtn timm:$src0))] 422 >; 423 } 424} // End SubtargetPredicate = isGFX11Plus 425 426class SOP1_F32_Inst<string opName, SDPatternOperator Op, ValueType vt0=f32, 427 ValueType vt1=vt0> : 428 SOP1_32<opName, [(set vt0:$sdst, (UniformUnaryFrag<Op> vt1:$src0))]>; 429 430let SubtargetPredicate = HasSALUFloatInsts, Uses = [MODE], 431 SchedRW = [WriteSFPU], isReMaterializable = 1 in { 432 def S_CVT_F32_I32 : SOP1_F32_Inst<"s_cvt_f32_i32", sint_to_fp, f32, i32>; 433 def S_CVT_F32_U32 : SOP1_F32_Inst<"s_cvt_f32_u32", uint_to_fp, f32, i32>; 434 435 let mayRaiseFPException = 1 in { 436 def S_CVT_I32_F32 : SOP1_F32_Inst<"s_cvt_i32_f32", fp_to_sint, i32, f32>; 437 def S_CVT_U32_F32 : SOP1_F32_Inst<"s_cvt_u32_f32", fp_to_uint, i32, f32>; 438 def S_CVT_F32_F16 : SOP1_F32_Inst<"s_cvt_f32_f16", fpextend, f32, f16>; 439 def S_CVT_HI_F32_F16 : SOP1_32<"s_cvt_hi_f32_f16">; 440 441 def S_CEIL_F32 : SOP1_F32_Inst<"s_ceil_f32", fceil>; 442 def S_FLOOR_F32 : SOP1_F32_Inst<"s_floor_f32", ffloor>; 443 def S_TRUNC_F32 : SOP1_F32_Inst<"s_trunc_f32", ftrunc>; 444 def S_RNDNE_F32 : SOP1_F32_Inst<"s_rndne_f32", froundeven>; 445 446 let FPDPRounding = 1 in 447 def S_CVT_F16_F32 : SOP1_F32_Inst<"s_cvt_f16_f32", fpround, f16, f32>; 448 449 def S_CEIL_F16 : SOP1_F32_Inst<"s_ceil_f16", fceil, f16>; 450 def S_FLOOR_F16 : SOP1_F32_Inst<"s_floor_f16", ffloor, f16>; 451 def S_TRUNC_F16 : SOP1_F32_Inst<"s_trunc_f16", ftrunc, f16>; 452 def S_RNDNE_F16 : SOP1_F32_Inst<"s_rndne_f16", froundeven, f16>; 453 } // End mayRaiseFPException = 1 454} // End SubtargetPredicate = HasSALUFloatInsts, Uses = [MODE] 455 // SchedRW = [WriteSFPU], isReMaterializable = 1 456 457let hasSideEffects = 1 in { 458let has_sdst = 0 in { 459let Uses = [M0] in { 460def S_BARRIER_SIGNAL_M0 : SOP1_Pseudo <"s_barrier_signal m0", (outs), (ins), 461 "", []>{ 462 let SchedRW = [WriteBarrier]; 463 let isConvergent = 1; 464} 465 466def S_BARRIER_SIGNAL_ISFIRST_M0 : SOP1_Pseudo <"s_barrier_signal_isfirst m0", (outs), (ins), 467 "", []>{ 468 let Defs = [SCC]; 469 let SchedRW = [WriteBarrier]; 470 let isConvergent = 1; 471} 472 473def S_BARRIER_INIT_M0 : SOP1_Pseudo <"s_barrier_init m0", (outs), (ins), 474 "", []>{ 475 let SchedRW = [WriteBarrier]; 476 let isConvergent = 1; 477} 478 479def S_BARRIER_INIT_IMM : SOP1_Pseudo <"s_barrier_init", (outs), 480 (ins SplitBarrier:$src0), "$src0", []>{ 481 let SchedRW = [WriteBarrier]; 482 let isConvergent = 1; 483} 484 485def S_BARRIER_JOIN_M0 : SOP1_Pseudo <"s_barrier_join m0", (outs), (ins), 486 "", []>{ 487 let SchedRW = [WriteBarrier]; 488 let isConvergent = 1; 489} 490 491} // End Uses = [M0] 492 493def S_BARRIER_SIGNAL_IMM : SOP1_Pseudo <"s_barrier_signal", (outs), 494 (ins SplitBarrier:$src0), "$src0", [(int_amdgcn_s_barrier_signal timm:$src0)]>{ 495 let SchedRW = [WriteBarrier]; 496 let isConvergent = 1; 497} 498 499def S_BARRIER_SIGNAL_ISFIRST_IMM : SOP1_Pseudo <"s_barrier_signal_isfirst", (outs), 500 (ins SplitBarrier:$src0), "$src0", [(set SCC, (int_amdgcn_s_barrier_signal_isfirst timm:$src0))]>{ 501 let Defs = [SCC]; 502 let SchedRW = [WriteBarrier]; 503 let isConvergent = 1; 504} 505 506def S_BARRIER_JOIN_IMM : SOP1_Pseudo <"s_barrier_join", (outs), 507 (ins SplitBarrier:$src0), "$src0", []>{ 508 let SchedRW = [WriteBarrier]; 509 let isConvergent = 1; 510} 511 512} // End has_sdst = 0 513 514def S_GET_BARRIER_STATE_IMM : SOP1_Pseudo <"s_get_barrier_state", (outs SSrc_b32:$sdst), 515 (ins SplitBarrier:$src0), "$sdst, $src0", []>{ 516 let SchedRW = [WriteBarrier]; 517 let isConvergent = 1; 518} 519 520def S_GET_BARRIER_STATE_M0 : SOP1_Pseudo <"s_get_barrier_state $sdst, m0", (outs SSrc_b32:$sdst), 521 (ins), "", []>{ 522 let Uses = [M0]; 523 let SchedRW = [WriteBarrier]; 524 let isConvergent = 1; 525} 526} // End hasSideEffects = 1 527 528//===----------------------------------------------------------------------===// 529// SOP2 Instructions 530//===----------------------------------------------------------------------===// 531 532class SOP2_Pseudo<string opName, dag outs, dag ins, 533 string asmOps, list<dag> pattern=[]> : 534 SOP_Pseudo<opName, outs, ins, " " # asmOps, pattern> { 535 536 let mayLoad = 0; 537 let mayStore = 0; 538 let hasSideEffects = 0; 539 let SALU = 1; 540 let SOP2 = 1; 541 let SchedRW = [WriteSALU]; 542 let UseNamedOperandTable = 1; 543 544 let has_sdst = 1; 545 546 // Pseudo instructions have no encodings, but adding this field here allows 547 // us to do: 548 // let sdst = xxx in { 549 // for multiclasses that include both real and pseudo instructions. 550 // field bits<7> sdst = 0; 551} 552 553class SOP2_Real<SOP_Pseudo ps, string name = ps.Mnemonic> : 554 InstSI <ps.OutOperandList, ps.InOperandList, 555 name # ps.AsmOperands> { 556 let SALU = 1; 557 let SOP2 = 1; 558 let isPseudo = 0; 559 let isCodeGenOnly = 0; 560 561 // copy relevant pseudo op flags 562 let SubtargetPredicate = ps.SubtargetPredicate; 563 let AsmMatchConverter = ps.AsmMatchConverter; 564 let UseNamedOperandTable = ps.UseNamedOperandTable; 565 let TSFlags = ps.TSFlags; 566 let SchedRW = ps.SchedRW; 567 let mayLoad = ps.mayLoad; 568 let mayStore = ps.mayStore; 569 let Constraints = ps.Constraints; 570 let DisableEncoding = ps.DisableEncoding; 571 let Uses = ps.Uses; 572 let Defs = ps.Defs; 573 let isConvergent = ps.isConvergent; 574 575 // encoding 576 bits<7> sdst; 577 bits<8> src0; 578 bits<8> src1; 579 bits<32> imm; 580} 581 582class SOP2_Real32<bits<7> op, SOP_Pseudo ps, string name = ps.Mnemonic> : 583 SOP2_Real<ps, name>, Enc32 { 584 let Inst{7-0} = src0; 585 let Inst{15-8} = src1; 586 let Inst{22-16} = !if(ps.has_sdst, sdst, ?); 587 let Inst{29-23} = op; 588 let Inst{31-30} = 0x2; // encoding 589} 590 591class SOP2_Real64<bits<7> op, SOP_Pseudo ps, string name = ps.Mnemonic> : 592 SOP2_Real<ps, name>, Enc64 { 593 let Inst{7-0} = src0; 594 let Inst{15-8} = src1; 595 let Inst{22-16} = !if(ps.has_sdst, sdst, ?); 596 let Inst{29-23} = op; 597 let Inst{31-30} = 0x2; // encoding 598 let Inst{63-32} = imm; 599} 600 601class SOP2_F16 <string opName, list<dag> pattern=[]> : SOP2_Pseudo < 602 opName, (outs SReg_32:$sdst), (ins SSrc_f16:$src0, SSrc_f16:$src1), 603 "$sdst, $src0, $src1", pattern 604>; 605 606class SOP2_32 <string opName, list<dag> pattern=[]> : SOP2_Pseudo < 607 opName, (outs SReg_32:$sdst), (ins SSrc_b32:$src0, SSrc_b32:$src1), 608 "$sdst, $src0, $src1", pattern 609>; 610 611class SOP2_F32 <string opName, list<dag> pattern=[]> : SOP2_Pseudo < 612 opName, (outs SReg_32:$sdst), (ins SSrc_f32:$src0, SSrc_f32:$src1), 613 "$sdst, $src0, $src1", pattern 614>; 615 616class SOP2_64 <string opName, list<dag> pattern=[]> : SOP2_Pseudo < 617 opName, (outs SReg_64:$sdst), (ins SSrc_b64:$src0, SSrc_b64:$src1), 618 "$sdst, $src0, $src1", pattern 619>; 620 621class SOP2_64_32 <string opName, list<dag> pattern=[]> : SOP2_Pseudo < 622 opName, (outs SReg_64:$sdst), (ins SSrc_b64:$src0, SSrc_b32:$src1), 623 "$sdst, $src0, $src1", pattern 624>; 625 626class SOP2_64_32_32 <string opName, list<dag> pattern=[]> : SOP2_Pseudo < 627 opName, (outs SReg_64:$sdst), (ins SSrc_b32:$src0, SSrc_b32:$src1), 628 "$sdst, $src0, $src1", pattern 629>; 630 631 632let Defs = [SCC] in { // Carry out goes to SCC 633let isCommutable = 1, isAdd = 1 in { 634def S_ADD_U32 : SOP2_32 <"s_add_u32">; 635def S_ADD_I32 : SOP2_32 <"s_add_i32", 636 [(set i32:$sdst, (UniformBinFrag<add> SSrc_b32:$src0, SSrc_b32:$src1))] 637>; 638} // End isCommutable = 1, isAdd = 1 639 640def S_SUB_U32 : SOP2_32 <"s_sub_u32">; 641def S_SUB_I32 : SOP2_32 <"s_sub_i32", 642 [(set i32:$sdst, (UniformBinFrag<sub> SSrc_b32:$src0, SSrc_b32:$src1))] 643>; 644 645let Uses = [SCC] in { // Carry in comes from SCC 646let isCommutable = 1 in { 647def S_ADDC_U32 : SOP2_32 <"s_addc_u32", 648 [(set i32:$sdst, (UniformBinFrag<adde> (i32 SSrc_b32:$src0), (i32 SSrc_b32:$src1)))]>; 649} // End isCommutable = 1 650 651def S_SUBB_U32 : SOP2_32 <"s_subb_u32", 652 [(set i32:$sdst, (UniformBinFrag<sube> (i32 SSrc_b32:$src0), (i32 SSrc_b32:$src1)))]>; 653} // End Uses = [SCC] 654 655let isCommutable = 1 in { 656def S_MIN_I32 : SOP2_32 <"s_min_i32", 657 [(set i32:$sdst, (UniformBinFrag<smin> i32:$src0, i32:$src1))] 658>; 659def S_MIN_U32 : SOP2_32 <"s_min_u32", 660 [(set i32:$sdst, (UniformBinFrag<umin> i32:$src0, i32:$src1))] 661>; 662def S_MAX_I32 : SOP2_32 <"s_max_i32", 663 [(set i32:$sdst, (UniformBinFrag<smax> i32:$src0, i32:$src1))] 664>; 665def S_MAX_U32 : SOP2_32 <"s_max_u32", 666 [(set i32:$sdst, (UniformBinFrag<umax> i32:$src0, i32:$src1))] 667>; 668} // End isCommutable = 1 669} // End Defs = [SCC] 670 671let SubtargetPredicate = isGFX12Plus in { 672 def S_ADD_U64 : SOP2_64<"s_add_u64">{ 673 let isCommutable = 1; 674 } 675 676 def S_SUB_U64 : SOP2_64<"s_sub_u64">; 677 678 def S_MUL_U64 : SOP2_64 <"s_mul_u64", 679 [(set i64:$sdst, (UniformBinFrag<mul> i64:$src0, i64:$src1))]> { 680 let isCommutable = 1; 681 } 682 683 // The higher 32-bits of the inputs contain the sign extension bits. 684 def S_MUL_I64_I32_PSEUDO : SPseudoInstSI < 685 (outs SReg_64:$sdst), (ins SSrc_b64:$src0, SSrc_b64:$src1) 686 >; 687 688 // The higher 32-bits of the inputs are zero. 689 def S_MUL_U64_U32_PSEUDO : SPseudoInstSI < 690 (outs SReg_64:$sdst), (ins SSrc_b64:$src0, SSrc_b64:$src1) 691 >; 692 693} // End SubtargetPredicate = isGFX12Plus 694 695let Uses = [SCC] in { 696 def S_CSELECT_B32 : SOP2_32 <"s_cselect_b32">; 697 def S_CSELECT_B64 : SOP2_64 <"s_cselect_b64">; 698} // End Uses = [SCC] 699 700let Defs = [SCC] in { 701let isCommutable = 1 in { 702def S_AND_B32 : SOP2_32 <"s_and_b32", 703 [(set i32:$sdst, (UniformBinFrag<and> i32:$src0, i32:$src1))] 704>; 705 706def S_AND_B64 : SOP2_64 <"s_and_b64", 707 [(set i64:$sdst, (UniformBinFrag<and> i64:$src0, i64:$src1))] 708>; 709 710def S_OR_B32 : SOP2_32 <"s_or_b32", 711 [(set i32:$sdst, (UniformBinFrag<or> i32:$src0, i32:$src1))] 712>; 713 714def S_OR_B64 : SOP2_64 <"s_or_b64", 715 [(set i64:$sdst, (UniformBinFrag<or> i64:$src0, i64:$src1))] 716>; 717 718def S_XOR_B32 : SOP2_32 <"s_xor_b32", 719 [(set i32:$sdst, (UniformBinFrag<xor> i32:$src0, i32:$src1))] 720>; 721 722def S_XOR_B64 : SOP2_64 <"s_xor_b64", 723 [(set i64:$sdst, (UniformBinFrag<xor> i64:$src0, i64:$src1))] 724>; 725 726def S_XNOR_B32 : SOP2_32 <"s_xnor_b32", 727 [(set i32:$sdst, (UniformUnaryFrag<not> (xor_oneuse i32:$src0, i32:$src1)))] 728>; 729 730def S_XNOR_B64 : SOP2_64 <"s_xnor_b64", 731 [(set i64:$sdst, (UniformUnaryFrag<not> (xor_oneuse i64:$src0, i64:$src1)))] 732>; 733 734def S_NAND_B32 : SOP2_32 <"s_nand_b32", 735 [(set i32:$sdst, (UniformUnaryFrag<not> (and_oneuse i32:$src0, i32:$src1)))] 736>; 737 738def S_NAND_B64 : SOP2_64 <"s_nand_b64", 739 [(set i64:$sdst, (UniformUnaryFrag<not> (and_oneuse i64:$src0, i64:$src1)))] 740>; 741 742def S_NOR_B32 : SOP2_32 <"s_nor_b32", 743 [(set i32:$sdst, (UniformUnaryFrag<not> (or_oneuse i32:$src0, i32:$src1)))] 744>; 745 746def S_NOR_B64 : SOP2_64 <"s_nor_b64", 747 [(set i64:$sdst, (UniformUnaryFrag<not> (or_oneuse i64:$src0, i64:$src1)))] 748>; 749} // End isCommutable = 1 750 751// There are also separate patterns for types other than i32 752def S_ANDN2_B32 : SOP2_32 <"s_andn2_b32", 753 [(set i32:$sdst, (UniformBinFrag<and> i32:$src0, (not i32:$src1)))] 754>; 755 756def S_ANDN2_B64 : SOP2_64 <"s_andn2_b64", 757 [(set i64:$sdst, (UniformBinFrag<and> i64:$src0, (not i64:$src1)))] 758>; 759 760def S_ORN2_B32 : SOP2_32 <"s_orn2_b32", 761 [(set i32:$sdst, (UniformBinFrag<or> i32:$src0, (not i32:$src1)))] 762>; 763 764def S_ORN2_B64 : SOP2_64 <"s_orn2_b64", 765 [(set i64:$sdst, (UniformBinFrag<or> i64:$src0, (not i64:$src1)))] 766>; 767} // End Defs = [SCC] 768 769// Use added complexity so these patterns are preferred to the VALU patterns. 770let AddedComplexity = 1 in { 771 772let Defs = [SCC] in { 773// TODO: b64 versions require VOP3 change since v_lshlrev_b64 is VOP3 774def S_LSHL_B32 : SOP2_32 <"s_lshl_b32", 775 [(set SReg_32:$sdst, (UniformBinFrag<cshl_32> (i32 SSrc_b32:$src0), (i32 SSrc_b32:$src1)))] 776>; 777def S_LSHL_B64 : SOP2_64_32 <"s_lshl_b64", 778 [(set SReg_64:$sdst, (UniformBinFrag<cshl_64> (i64 SSrc_b64:$src0), (i32 SSrc_b32:$src1)))] 779>; 780def S_LSHR_B32 : SOP2_32 <"s_lshr_b32", 781 [(set SReg_32:$sdst, (UniformBinFrag<csrl_32> (i32 SSrc_b32:$src0), (i32 SSrc_b32:$src1)))] 782>; 783def S_LSHR_B64 : SOP2_64_32 <"s_lshr_b64", 784 [(set SReg_64:$sdst, (UniformBinFrag<csrl_64> (i64 SSrc_b64:$src0), (i32 SSrc_b32:$src1)))] 785>; 786def S_ASHR_I32 : SOP2_32 <"s_ashr_i32", 787 [(set SReg_32:$sdst, (UniformBinFrag<csra_32> (i32 SSrc_b32:$src0), (i32 SSrc_b32:$src1)))] 788>; 789def S_ASHR_I64 : SOP2_64_32 <"s_ashr_i64", 790 [(set SReg_64:$sdst, (UniformBinFrag<csra_64> (i64 SSrc_b64:$src0), (i32 SSrc_b32:$src1)))] 791>; 792} // End Defs = [SCC] 793 794let isReMaterializable = 1 in { 795def S_BFM_B32 : SOP2_32 <"s_bfm_b32", 796 [(set i32:$sdst, (UniformBinFrag<AMDGPUbfm> i32:$src0, i32:$src1))]>; 797def S_BFM_B64 : SOP2_64_32_32 <"s_bfm_b64">; 798 799def S_MUL_I32 : SOP2_32 <"s_mul_i32", 800 [(set i32:$sdst, (UniformBinFrag<mul> i32:$src0, i32:$src1))]> { 801 let isCommutable = 1; 802} 803} // End isReMaterializable = 1 804} // End AddedComplexity = 1 805 806let Defs = [SCC] in { 807def S_BFE_U32 : SOP2_32 <"s_bfe_u32">; 808def S_BFE_I32 : SOP2_32 <"s_bfe_i32">; 809def S_BFE_U64 : SOP2_64_32 <"s_bfe_u64">; 810def S_BFE_I64 : SOP2_64_32 <"s_bfe_i64">; 811} // End Defs = [SCC] 812 813def S_CBRANCH_G_FORK : SOP2_Pseudo < 814 "s_cbranch_g_fork", (outs), 815 (ins SCSrc_b64:$src0, SCSrc_b64:$src1), 816 "$src0, $src1" 817> { 818 let has_sdst = 0; 819 let SubtargetPredicate = isGFX6GFX7GFX8GFX9; 820} 821 822let Defs = [SCC] in { 823def S_ABSDIFF_I32 : SOP2_32 <"s_absdiff_i32">; 824} // End Defs = [SCC] 825 826let SubtargetPredicate = isGFX8GFX9 in { 827 def S_RFE_RESTORE_B64 : SOP2_Pseudo < 828 "s_rfe_restore_b64", (outs), 829 (ins SSrc_b64:$src0, SSrc_b32:$src1), 830 "$src0, $src1" 831 > { 832 let hasSideEffects = 1; 833 let has_sdst = 0; 834 } 835} 836 837let SubtargetPredicate = isGFX9Plus in { 838 let isReMaterializable = 1 in { 839 def S_PACK_LL_B32_B16 : SOP2_32<"s_pack_ll_b32_b16">; 840 def S_PACK_LH_B32_B16 : SOP2_32<"s_pack_lh_b32_b16">; 841 def S_PACK_HH_B32_B16 : SOP2_32<"s_pack_hh_b32_b16">; 842 } // End isReMaterializable = 1 843 844 let Defs = [SCC] in { 845 def S_LSHL1_ADD_U32 : SOP2_32<"s_lshl1_add_u32", 846 [(set i32:$sdst, (shl1_add SSrc_b32:$src0, SSrc_b32:$src1))] 847 >; 848 def S_LSHL2_ADD_U32 : SOP2_32<"s_lshl2_add_u32", 849 [(set i32:$sdst, (shl2_add SSrc_b32:$src0, SSrc_b32:$src1))] 850 >; 851 def S_LSHL3_ADD_U32 : SOP2_32<"s_lshl3_add_u32", 852 [(set i32:$sdst, (shl3_add SSrc_b32:$src0, SSrc_b32:$src1))] 853 >; 854 def S_LSHL4_ADD_U32 : SOP2_32<"s_lshl4_add_u32", 855 [(set i32:$sdst, (shl4_add SSrc_b32:$src0, SSrc_b32:$src1))] 856 >; 857 } // End Defs = [SCC] 858 859 let isCommutable = 1, isReMaterializable = 1 in { 860 def S_MUL_HI_U32 : SOP2_32<"s_mul_hi_u32", 861 [(set i32:$sdst, (UniformBinFrag<mulhu> SSrc_b32:$src0, SSrc_b32:$src1))]>; 862 def S_MUL_HI_I32 : SOP2_32<"s_mul_hi_i32", 863 [(set i32:$sdst, (UniformBinFrag<mulhs> SSrc_b32:$src0, SSrc_b32:$src1))]>; 864 } // End isCommutable = 1, isReMaterializable = 1 865} // End SubtargetPredicate = isGFX9Plus 866 867let SubtargetPredicate = isGFX11Plus in { 868 def S_PACK_HL_B32_B16 : SOP2_32<"s_pack_hl_b32_b16">; 869} // End SubtargetPredicate = isGFX11Plus 870 871class SOP2_F32_Inst<string opName, SDPatternOperator Op, ValueType dstVt=f32> : 872 SOP2_F32<opName, 873 [(set dstVt:$sdst, (UniformBinFrag<Op> SSrc_f32:$src0, SSrc_f32:$src1))]>; 874 875class SOP2_F16_Inst<string opName, SDPatternOperator Op> : 876 SOP2_F16<opName, 877 [(set f16:$sdst, (UniformBinFrag<Op> SSrc_f16:$src0, SSrc_f16:$src1))]>; 878 879let SubtargetPredicate = HasSALUFloatInsts, mayRaiseFPException = 1, 880 Uses = [MODE], SchedRW = [WriteSFPU] in { 881 let isReMaterializable = 1 in { 882 let isCommutable = 1 in { 883 def S_ADD_F32 : SOP2_F32_Inst<"s_add_f32", any_fadd>; 884 def S_MIN_F32 : SOP2_F32_Inst<"s_min_f32", fminnum_like>; 885 def S_MAX_F32 : SOP2_F32_Inst<"s_max_f32", fmaxnum_like>; 886 def S_MUL_F32 : SOP2_F32_Inst<"s_mul_f32", any_fmul>; 887 888 let FixedSize = 1 in 889 def S_FMAAK_F32 : SOP2_Pseudo< 890 "s_fmaak_f32", (outs SReg_32:$sdst), 891 (ins SSrc_f32_Deferred:$src0, SSrc_f32_Deferred:$src1, KImmFP32:$imm), 892 "$sdst, $src0, $src1, $imm" 893 >; 894 895 let FPDPRounding = 1 in { 896 def S_ADD_F16 : SOP2_F16_Inst<"s_add_f16", any_fadd>; 897 def S_MUL_F16 : SOP2_F16_Inst<"s_mul_f16", any_fmul>; 898 } // End FPDPRounding 899 900 def S_MIN_F16 : SOP2_F16_Inst<"s_min_f16", fminnum_like>; 901 def S_MAX_F16 : SOP2_F16_Inst<"s_max_f16", fmaxnum_like>; 902 } // End isCommutable = 1 903 904 let FPDPRounding = 1 in 905 def S_SUB_F16 : SOP2_F16_Inst<"s_sub_f16", any_fsub>; 906 907 def S_SUB_F32 : SOP2_F32_Inst<"s_sub_f32", any_fsub>; 908 def S_CVT_PK_RTZ_F16_F32 : SOP2_F32_Inst<"s_cvt_pk_rtz_f16_f32", 909 AMDGPUpkrtz_f16_f32, v2f16>; 910 911 let FixedSize = 1 in 912 def S_FMAMK_F32 : SOP2_Pseudo< 913 "s_fmamk_f32", (outs SReg_32:$sdst), 914 (ins SSrc_f32_Deferred:$src0, KImmFP32:$imm, SSrc_f32_Deferred:$src1), 915 "$sdst, $src0, $imm, $src1" 916 >; 917 } // End isReMaterializable = 1 918 919 let Constraints = "$sdst = $src2", DisableEncoding="$src2", 920 isCommutable = 1, AddedComplexity = 20 in { 921 def S_FMAC_F32 : SOP2_Pseudo< 922 "s_fmac_f32", (outs SReg_32:$sdst), 923 (ins SSrc_f32:$src0, SSrc_f32:$src1, SReg_32:$src2), 924 "$sdst, $src0, $src1", 925 [(set f32:$sdst, (UniformTernaryFrag<any_fma> SSrc_f32:$src0, SSrc_f32:$src1, SReg_32:$src2))] 926 >; 927 928 def S_FMAC_F16 : SOP2_Pseudo< 929 "s_fmac_f16", (outs SReg_32:$sdst), 930 (ins SSrc_f16:$src0, SSrc_f16:$src1, SReg_32:$src2), 931 "$sdst, $src0, $src1", 932 [(set f16:$sdst, (UniformTernaryFrag<any_fma> SSrc_f16:$src0, SSrc_f16:$src1, SReg_32:$src2))] 933 >; 934 } // End Constraints = "$sdst = $src2", DisableEncoding="$src2", 935 // isCommutable = 1, AddedComplexity = 20 936} // End SubtargetPredicate = HasSALUFloatInsts, mayRaiseFPException = 1, 937 // Uses = [MODE], SchedRW = [WriteSFPU] 938 939// On GFX12 MIN/MAX instructions do not read MODE register. 940let SubtargetPredicate = isGFX12Plus, mayRaiseFPException = 1, isCommutable = 1, 941 isReMaterializable = 1, SchedRW = [WriteSFPU], AddedComplexity = 17 in { 942 def S_MINIMUM_F32 : SOP2_F32_Inst<"s_minimum_f32", fminimum>; 943 def S_MAXIMUM_F32 : SOP2_F32_Inst<"s_maximum_f32", fmaximum>; 944 def S_MINIMUM_F16 : SOP2_F16_Inst<"s_minimum_f16", fminimum>; 945 def S_MAXIMUM_F16 : SOP2_F16_Inst<"s_maximum_f16", fmaximum>; 946} 947 948//===----------------------------------------------------------------------===// 949// SOPK Instructions 950//===----------------------------------------------------------------------===// 951 952class SOPK_Pseudo <string opName, dag outs, dag ins, 953 string asmOps, list<dag> pattern=[]> : 954 SOP_Pseudo<opName, outs, ins, " " # asmOps, pattern> { 955 let mayLoad = 0; 956 let mayStore = 0; 957 let hasSideEffects = 0; 958 let SALU = 1; 959 let SOPK = 1; 960 let FixedSize = 1; 961 let SchedRW = [WriteSALU]; 962 let UseNamedOperandTable = 1; 963 964 let has_sdst = 1; 965} 966 967class SOPK_Real<SOPK_Pseudo ps, string name = ps.Mnemonic> : 968 InstSI <ps.OutOperandList, ps.InOperandList, 969 name # ps.AsmOperands> { 970 let SALU = 1; 971 let SOPK = 1; 972 let isPseudo = 0; 973 let isCodeGenOnly = 0; 974 let UseNamedOperandTable = 1; 975 976 // copy relevant pseudo op flags 977 let SubtargetPredicate = ps.SubtargetPredicate; 978 let AsmMatchConverter = ps.AsmMatchConverter; 979 let DisableEncoding = ps.DisableEncoding; 980 let Constraints = ps.Constraints; 981 let SchedRW = ps.SchedRW; 982 let mayLoad = ps.mayLoad; 983 let mayStore = ps.mayStore; 984 let isBranch = ps.isBranch; 985 let isCall = ps.isCall; 986 let isTerminator = ps.isTerminator; 987 let isReturn = ps.isReturn; 988 let isBarrier = ps.isBarrier; 989 let Uses = ps.Uses; 990 let Defs = ps.Defs; 991 let isConvergent = ps.isConvergent; 992 993 // encoding 994 bits<7> sdst; 995 bits<16> simm16; 996 bits<32> imm; 997} 998 999class SOPK_Real32<bits<5> op, SOPK_Pseudo ps, string name = ps.Mnemonic> : 1000 SOPK_Real <ps, name>, 1001 Enc32 { 1002 let Inst{15-0} = simm16; 1003 let Inst{22-16} = !if(ps.has_sdst, sdst, ?); 1004 let Inst{27-23} = op; 1005 let Inst{31-28} = 0xb; //encoding 1006} 1007 1008class SOPK_Real64<bits<5> op, SOPK_Pseudo ps> : 1009 SOPK_Real<ps>, 1010 Enc64 { 1011 let Inst{15-0} = simm16; 1012 let Inst{22-16} = !if(ps.has_sdst, sdst, ?); 1013 let Inst{27-23} = op; 1014 let Inst{31-28} = 0xb; //encoding 1015 let Inst{63-32} = imm; 1016} 1017 1018class SOPKInstTable <bit is_sopk, string cmpOp = ""> { 1019 bit IsSOPK = is_sopk; 1020 string BaseCmpOp = cmpOp; 1021} 1022 1023class SOPK_32 <string opName, list<dag> pattern=[]> : SOPK_Pseudo < 1024 opName, 1025 (outs SReg_32:$sdst), 1026 (ins s16imm:$simm16), 1027 "$sdst, $simm16", 1028 pattern>; 1029 1030class SOPK_32_BR <string opName, list<dag> pattern=[]> : SOPK_Pseudo < 1031 opName, 1032 (outs), 1033 (ins SOPPBrTarget:$simm16, SReg_32:$sdst), 1034 "$sdst, $simm16", 1035 pattern> { 1036 let Defs = [EXEC]; 1037 let Uses = [EXEC]; 1038 let isBranch = 1; 1039 let isTerminator = 1; 1040 let SchedRW = [WriteBranch]; 1041} 1042 1043class SOPK_SCC <string opName, string base_op, bit isSignExt> : SOPK_Pseudo < 1044 opName, 1045 (outs), 1046 !if(isSignExt, 1047 (ins SReg_32:$sdst, s16imm:$simm16), 1048 (ins SReg_32:$sdst, u16imm:$simm16)), 1049 "$sdst, $simm16">, 1050 SOPKInstTable<1, base_op>{ 1051 let Defs = [SCC]; 1052} 1053 1054class SOPK_32TIE <string opName, list<dag> pattern=[]> : SOPK_Pseudo < 1055 opName, 1056 (outs SReg_32:$sdst), 1057 (ins SReg_32:$src0, s16imm:$simm16), 1058 "$sdst, $simm16", 1059 pattern 1060>; 1061 1062let isReMaterializable = 1, isMoveImm = 1 in { 1063def S_MOVK_I32 : SOPK_32 <"s_movk_i32">; 1064} // End isReMaterializable = 1 1065let Uses = [SCC] in { 1066def S_CMOVK_I32 : SOPK_32 <"s_cmovk_i32">; 1067} 1068 1069let isCompare = 1 in { 1070 1071// This instruction is disabled for now until we can figure out how to teach 1072// the instruction selector to correctly use the S_CMP* vs V_CMP* 1073// instructions. 1074// 1075// When this instruction is enabled the code generator sometimes produces this 1076// invalid sequence: 1077// 1078// SCC = S_CMPK_EQ_I32 SGPR0, imm 1079// VCC = COPY SCC 1080// VGPR0 = V_CNDMASK VCC, VGPR0, VGPR1 1081// 1082// def S_CMPK_EQ_I32 : SOPK_SCC <"s_cmpk_eq_i32", 1083// [(set i1:$dst, (setcc i32:$src0, imm:$src1, SETEQ))] 1084// >; 1085 1086def S_CMPK_EQ_I32 : SOPK_SCC <"s_cmpk_eq_i32", "s_cmp_eq_i32", 1>; 1087def S_CMPK_LG_I32 : SOPK_SCC <"s_cmpk_lg_i32", "s_cmp_lg_i32", 1>; 1088def S_CMPK_GT_I32 : SOPK_SCC <"s_cmpk_gt_i32", "s_cmp_gt_i32", 1>; 1089def S_CMPK_GE_I32 : SOPK_SCC <"s_cmpk_ge_i32", "s_cmp_ge_i32", 1>; 1090def S_CMPK_LT_I32 : SOPK_SCC <"s_cmpk_lt_i32", "s_cmp_lt_i32", 1>; 1091def S_CMPK_LE_I32 : SOPK_SCC <"s_cmpk_le_i32", "s_cmp_le_i32", 1>; 1092 1093def S_CMPK_EQ_U32 : SOPK_SCC <"s_cmpk_eq_u32", "s_cmp_eq_u32", 0>; 1094def S_CMPK_LG_U32 : SOPK_SCC <"s_cmpk_lg_u32", "s_cmp_lg_u32", 0>; 1095def S_CMPK_GT_U32 : SOPK_SCC <"s_cmpk_gt_u32", "s_cmp_gt_u32", 0>; 1096def S_CMPK_GE_U32 : SOPK_SCC <"s_cmpk_ge_u32", "s_cmp_ge_u32", 0>; 1097def S_CMPK_LT_U32 : SOPK_SCC <"s_cmpk_lt_u32", "s_cmp_lt_u32", 0>; 1098def S_CMPK_LE_U32 : SOPK_SCC <"s_cmpk_le_u32", "s_cmp_le_u32", 0>; 1099} // End isCompare = 1 1100 1101let isCommutable = 1, DisableEncoding = "$src0", 1102 Constraints = "$sdst = $src0" in { 1103 let Defs = [SCC] in 1104 def S_ADDK_I32 : SOPK_32TIE <"s_addk_i32">; 1105 def S_MULK_I32 : SOPK_32TIE <"s_mulk_i32">; 1106} 1107 1108let SubtargetPredicate = isGFX6GFX7GFX8GFX9 in 1109def S_CBRANCH_I_FORK : SOPK_Pseudo < 1110 "s_cbranch_i_fork", 1111 (outs), (ins SReg_64:$sdst, SOPPBrTarget:$simm16), 1112 "$sdst, $simm16" 1113>; 1114 1115// This is hasSideEffects to allow its use in readcyclecounter selection. 1116// FIXME: Need to truncate immediate to 16-bits. 1117// FIXME: Should have separate pseudos for known may read MODE and 1118// only read MODE. 1119def S_GETREG_B32 : SOPK_Pseudo < 1120 "s_getreg_b32", 1121 (outs SReg_32:$sdst), (ins hwreg:$simm16), 1122 "$sdst, $simm16", 1123 [(set i32:$sdst, (int_amdgcn_s_getreg (i32 timm:$simm16)))]> { 1124 let hasSideEffects = 1; 1125 let Uses = [MODE]; 1126} 1127 1128let Defs = [MODE], Uses = [MODE] in { 1129 1130// FIXME: Need to truncate immediate to 16-bits. 1131class S_SETREG_B32_Pseudo <list<dag> pattern=[]> : SOPK_Pseudo < 1132 "s_setreg_b32", 1133 (outs), (ins SReg_32:$sdst, hwreg:$simm16), 1134 "$simm16, $sdst", 1135 pattern>; 1136 1137def S_SETREG_B32 : S_SETREG_B32_Pseudo < 1138 [(int_amdgcn_s_setreg (i32 SIMM16bit:$simm16), i32:$sdst)]> { 1139 // Use custom inserter to optimize some cases to 1140 // S_DENORM_MODE/S_ROUND_MODE/S_SETREG_B32_mode. 1141 let usesCustomInserter = 1; 1142 let hasSideEffects = 1; 1143} 1144 1145// Variant of SETREG that is guaranteed to only touch FP bits in the MODE 1146// register, so doesn't have unmodeled side effects. 1147def S_SETREG_B32_mode : S_SETREG_B32_Pseudo { 1148 let hasSideEffects = 0; 1149} 1150 1151// FIXME: Not on SI? 1152//def S_GETREG_REGRD_B32 : SOPK_32 <sopk<0x14, 0x13>, "s_getreg_regrd_b32">; 1153 1154class S_SETREG_IMM32_B32_Pseudo : SOPK_Pseudo < 1155 "s_setreg_imm32_b32", 1156 (outs), (ins i32imm:$imm, hwreg:$simm16), 1157 "$simm16, $imm"> { 1158 let Size = 8; // Unlike every other SOPK instruction. 1159 let has_sdst = 0; 1160} 1161 1162def S_SETREG_IMM32_B32 : S_SETREG_IMM32_B32_Pseudo { 1163 let hasSideEffects = 1; 1164} 1165 1166// Variant of SETREG_IMM32 that is guaranteed to only touch FP bits in the MODE 1167// register, so doesn't have unmodeled side effects. 1168def S_SETREG_IMM32_B32_mode : S_SETREG_IMM32_B32_Pseudo { 1169 let hasSideEffects = 0; 1170} 1171 1172} // End Defs = [MODE], Uses = [MODE] 1173 1174class SOPK_WAITCNT<string opName, list<dag> pat=[]> : 1175 SOPK_Pseudo< 1176 opName, 1177 (outs), 1178 (ins SReg_32:$sdst, s16imm:$simm16), 1179 "$sdst, $simm16", 1180 pat> { 1181 let hasSideEffects = 1; 1182 let mayLoad = 1; 1183 let mayStore = 1; 1184 let has_sdst = 1; // First source takes place of sdst in encoding 1185} 1186 1187let SubtargetPredicate = isGFX9Plus in { 1188 def S_CALL_B64 : SOPK_Pseudo< 1189 "s_call_b64", 1190 (outs SReg_64:$sdst), 1191 (ins SOPPBrTarget:$simm16), 1192 "$sdst, $simm16"> { 1193 let isCall = 1; 1194 } 1195} // End SubtargetPredicate = isGFX9Plus 1196 1197def VersionImm : S16ImmOperand { 1198 let DecoderMethod = "decodeVersionImm"; 1199} 1200 1201let SubtargetPredicate = isGFX10Plus in { 1202 def S_VERSION : SOPK_Pseudo< 1203 "s_version", 1204 (outs), 1205 (ins VersionImm:$simm16), 1206 "$simm16"> { 1207 let has_sdst = 0; 1208 } 1209} // End SubtargetPredicate = isGFX10Plus 1210 1211let SubtargetPredicate = isGFX10GFX11 in { 1212 def S_SUBVECTOR_LOOP_BEGIN : SOPK_32_BR<"s_subvector_loop_begin">; 1213 def S_SUBVECTOR_LOOP_END : SOPK_32_BR<"s_subvector_loop_end">; 1214 1215 def S_WAITCNT_VSCNT : SOPK_WAITCNT<"s_waitcnt_vscnt">; 1216 def S_WAITCNT_VMCNT : SOPK_WAITCNT<"s_waitcnt_vmcnt">; 1217 def S_WAITCNT_EXPCNT : SOPK_WAITCNT<"s_waitcnt_expcnt">; 1218 def S_WAITCNT_LGKMCNT : SOPK_WAITCNT<"s_waitcnt_lgkmcnt">; 1219} // End SubtargetPredicate = isGFX10GFX11 1220 1221//===----------------------------------------------------------------------===// 1222// SOPC Instructions 1223//===----------------------------------------------------------------------===// 1224 1225class SOPC_Pseudo<string opName, dag outs, dag ins, 1226 string asmOps, list<dag> pattern=[]> : 1227 SOP_Pseudo<opName, outs, ins, " " # asmOps, pattern> { 1228 let mayLoad = 0; 1229 let mayStore = 0; 1230 let hasSideEffects = 0; 1231 let SALU = 1; 1232 let SOPC = 1; 1233 let Defs = [SCC]; 1234 let SchedRW = [WriteSALU]; 1235 let UseNamedOperandTable = 1; 1236} 1237 1238class SOPC_Real<bits<7> op, SOPC_Pseudo ps> : 1239 InstSI <ps.OutOperandList, ps.InOperandList, 1240 ps.Mnemonic # ps.AsmOperands>, 1241 Enc32 { 1242 let SALU = 1; 1243 let SOPC = 1; 1244 let isPseudo = 0; 1245 let isCodeGenOnly = 0; 1246 1247 // copy relevant pseudo op flags 1248 let SubtargetPredicate = ps.SubtargetPredicate; 1249 let OtherPredicates = ps.OtherPredicates; 1250 let AsmMatchConverter = ps.AsmMatchConverter; 1251 let UseNamedOperandTable = ps.UseNamedOperandTable; 1252 let TSFlags = ps.TSFlags; 1253 let SchedRW = ps.SchedRW; 1254 let mayLoad = ps.mayLoad; 1255 let mayStore = ps.mayStore; 1256 let Uses = ps.Uses; 1257 let Defs = ps.Defs; 1258 let isConvergent = ps.isConvergent; 1259 1260 // encoding 1261 bits<8> src0; 1262 bits<8> src1; 1263 1264 let Inst{7-0} = src0; 1265 let Inst{15-8} = src1; 1266 let Inst{22-16} = op; 1267 let Inst{31-23} = 0x17e; 1268} 1269 1270class SOPC_Base <RegisterOperand rc0, RegisterOperand rc1, 1271 string opName, list<dag> pattern = []> : SOPC_Pseudo < 1272 opName, (outs), (ins rc0:$src0, rc1:$src1), 1273 "$src0, $src1", pattern > { 1274} 1275 1276class SOPC_Helper <RegisterOperand rc, ValueType vt, 1277 string opName, SDPatternOperator cond> : SOPC_Base < 1278 rc, rc, opName, 1279 [(set SCC, (UniformTernaryFrag<setcc> vt:$src0, vt:$src1, cond))] > { 1280} 1281 1282class SOPC_CMP_32<string opName, 1283 SDPatternOperator cond = COND_NULL, string revOp = opName> 1284 : SOPC_Helper<SSrc_b32, i32, opName, cond>, 1285 Commutable_REV<revOp, !eq(revOp, opName)>, 1286 SOPKInstTable<0, opName> { 1287 let isCompare = 1; 1288 let isCommutable = 1; 1289} 1290 1291class SOPC_CMP_F32<string opName, 1292 SDPatternOperator cond = COND_NULL, string revOp = opName> 1293 : SOPC_Helper<SSrc_b32, f32, opName, cond>, 1294 Commutable_REV<revOp, !eq(revOp, opName)>, 1295 SOPKInstTable<0, opName> { 1296 let isCompare = 1; 1297 let isCommutable = 1; 1298 let mayRaiseFPException = 1; 1299 let Uses = [MODE]; 1300 let SchedRW = [WriteSFPU]; 1301} 1302 1303class SOPC_CMP_F16<string opName, 1304 SDPatternOperator cond = COND_NULL, string revOp = opName> 1305 : SOPC_Helper<SSrc_b16, f16, opName, cond>, 1306 Commutable_REV<revOp, !eq(revOp, opName)>, 1307 SOPKInstTable<0, opName> { 1308 let isCompare = 1; 1309 let isCommutable = 1; 1310 let mayRaiseFPException = 1; 1311 let Uses = [MODE]; 1312 let SchedRW = [WriteSFPU]; 1313} 1314 1315class SOPC_CMP_64<string opName, 1316 SDPatternOperator cond = COND_NULL, string revOp = opName> 1317 : SOPC_Helper<SSrc_b64, i64, opName, cond>, 1318 Commutable_REV<revOp, !eq(revOp, opName)> { 1319 let isCompare = 1; 1320 let isCommutable = 1; 1321} 1322 1323class SOPC_32<string opName, list<dag> pattern = []> 1324 : SOPC_Base<SSrc_b32, SSrc_b32, opName, pattern>; 1325 1326class SOPC_64_32<string opName, list<dag> pattern = []> 1327 : SOPC_Base<SSrc_b64, SSrc_b32, opName, pattern>; 1328 1329def S_CMP_EQ_I32 : SOPC_CMP_32 <"s_cmp_eq_i32">; 1330def S_CMP_LG_I32 : SOPC_CMP_32 <"s_cmp_lg_i32">; 1331def S_CMP_GT_I32 : SOPC_CMP_32 <"s_cmp_gt_i32", COND_SGT>; 1332def S_CMP_GE_I32 : SOPC_CMP_32 <"s_cmp_ge_i32", COND_SGE>; 1333def S_CMP_LT_I32 : SOPC_CMP_32 <"s_cmp_lt_i32", COND_SLT, "s_cmp_gt_i32">; 1334def S_CMP_LE_I32 : SOPC_CMP_32 <"s_cmp_le_i32", COND_SLE, "s_cmp_ge_i32">; 1335def S_CMP_EQ_U32 : SOPC_CMP_32 <"s_cmp_eq_u32", COND_EQ>; 1336def S_CMP_LG_U32 : SOPC_CMP_32 <"s_cmp_lg_u32", COND_NE>; 1337def S_CMP_GT_U32 : SOPC_CMP_32 <"s_cmp_gt_u32", COND_UGT>; 1338def S_CMP_GE_U32 : SOPC_CMP_32 <"s_cmp_ge_u32", COND_UGE>; 1339def S_CMP_LT_U32 : SOPC_CMP_32 <"s_cmp_lt_u32", COND_ULT, "s_cmp_gt_u32">; 1340def S_CMP_LE_U32 : SOPC_CMP_32 <"s_cmp_le_u32", COND_ULE, "s_cmp_ge_u32">; 1341 1342def S_BITCMP0_B32 : SOPC_32 <"s_bitcmp0_b32">; 1343def S_BITCMP1_B32 : SOPC_32 <"s_bitcmp1_b32">; 1344def S_BITCMP0_B64 : SOPC_64_32 <"s_bitcmp0_b64">; 1345def S_BITCMP1_B64 : SOPC_64_32 <"s_bitcmp1_b64">; 1346let SubtargetPredicate = isGFX6GFX7GFX8GFX9 in 1347def S_SETVSKIP : SOPC_32 <"s_setvskip">; 1348 1349let SubtargetPredicate = isGFX8Plus in { 1350def S_CMP_EQ_U64 : SOPC_CMP_64 <"s_cmp_eq_u64", COND_EQ>; 1351def S_CMP_LG_U64 : SOPC_CMP_64 <"s_cmp_lg_u64", COND_NE>; 1352} // End SubtargetPredicate = isGFX8Plus 1353 1354let SubtargetPredicate = HasVGPRIndexMode in { 1355// Setting the GPR index mode is really writing the fields in the mode 1356// register. We don't want to add mode register uses to every 1357// instruction, and it's too complicated to deal with anyway. This is 1358// modeled just as a side effect. 1359def S_SET_GPR_IDX_ON : SOPC_Pseudo < 1360 "s_set_gpr_idx_on" , 1361 (outs), 1362 (ins SSrc_b32:$src0, GPRIdxMode:$src1), 1363 "$src0, $src1"> { 1364 let Defs = [M0, MODE]; // No scc def 1365 let Uses = [M0, MODE]; // Other bits of mode, m0 unmodified. 1366 let hasSideEffects = 1; // Sets mode.gpr_idx_en 1367 let FixedSize = 1; 1368} 1369} 1370 1371let SubtargetPredicate = HasSALUFloatInsts in { 1372 1373def S_CMP_LT_F32 : SOPC_CMP_F32<"s_cmp_lt_f32", COND_OLT, "s_cmp_gt_f32">; 1374def S_CMP_EQ_F32 : SOPC_CMP_F32<"s_cmp_eq_f32", COND_OEQ>; 1375def S_CMP_LE_F32 : SOPC_CMP_F32<"s_cmp_le_f32", COND_OLE, "s_cmp_ge_f32">; 1376def S_CMP_GT_F32 : SOPC_CMP_F32<"s_cmp_gt_f32", COND_OGT>; 1377def S_CMP_LG_F32 : SOPC_CMP_F32<"s_cmp_lg_f32", COND_ONE>; 1378def S_CMP_GE_F32 : SOPC_CMP_F32<"s_cmp_ge_f32", COND_OGE>; 1379def S_CMP_O_F32 : SOPC_CMP_F32<"s_cmp_o_f32", COND_O>; 1380def S_CMP_U_F32 : SOPC_CMP_F32<"s_cmp_u_f32", COND_UO>; 1381def S_CMP_NGE_F32 : SOPC_CMP_F32<"s_cmp_nge_f32", COND_ULT, "s_cmp_nle_f32">; 1382def S_CMP_NLG_F32 : SOPC_CMP_F32<"s_cmp_nlg_f32", COND_UEQ>; 1383def S_CMP_NGT_F32 : SOPC_CMP_F32<"s_cmp_ngt_f32", COND_ULE, "s_cmp_nlt_f32">; 1384def S_CMP_NLE_F32 : SOPC_CMP_F32<"s_cmp_nle_f32", COND_UGT>; 1385def S_CMP_NEQ_F32 : SOPC_CMP_F32<"s_cmp_neq_f32", COND_UNE>; 1386def S_CMP_NLT_F32 : SOPC_CMP_F32<"s_cmp_nlt_f32", COND_UGE>; 1387 1388def S_CMP_LT_F16 : SOPC_CMP_F16<"s_cmp_lt_f16", COND_OLT, "s_cmp_gt_f16">; 1389def S_CMP_EQ_F16 : SOPC_CMP_F16<"s_cmp_eq_f16", COND_OEQ>; 1390def S_CMP_LE_F16 : SOPC_CMP_F16<"s_cmp_le_f16", COND_OLE, "s_cmp_ge_f16">; 1391def S_CMP_GT_F16 : SOPC_CMP_F16<"s_cmp_gt_f16", COND_OGT>; 1392def S_CMP_LG_F16 : SOPC_CMP_F16<"s_cmp_lg_f16", COND_ONE>; 1393def S_CMP_GE_F16 : SOPC_CMP_F16<"s_cmp_ge_f16", COND_OGE>; 1394def S_CMP_O_F16 : SOPC_CMP_F16<"s_cmp_o_f16", COND_O>; 1395def S_CMP_U_F16 : SOPC_CMP_F16<"s_cmp_u_f16", COND_UO>; 1396def S_CMP_NGE_F16 : SOPC_CMP_F16<"s_cmp_nge_f16", COND_ULT, "s_cmp_nle_f16">; 1397def S_CMP_NLG_F16 : SOPC_CMP_F16<"s_cmp_nlg_f16", COND_UEQ>; 1398def S_CMP_NGT_F16 : SOPC_CMP_F16<"s_cmp_ngt_f16", COND_ULE, "s_cmp_nlt_f16">; 1399def S_CMP_NLE_F16 : SOPC_CMP_F16<"s_cmp_nle_f16", COND_UGT>; 1400def S_CMP_NEQ_F16 : SOPC_CMP_F16<"s_cmp_neq_f16", COND_UNE>; 1401def S_CMP_NLT_F16 : SOPC_CMP_F16<"s_cmp_nlt_f16", COND_UGE>; 1402 1403} // End SubtargetPredicate = HasSALUFloatInsts 1404 1405//===----------------------------------------------------------------------===// 1406// SOPP Instructions 1407//===----------------------------------------------------------------------===// 1408 1409class SOPP_Pseudo<string opName, dag ins, 1410 string asmOps = "", list<dag> pattern=[], 1411 string sep = !if(!empty(asmOps), "", " "), 1412 string keyName = opName> : 1413 SOP_Pseudo<opName, (outs), ins, sep # asmOps, pattern> { 1414 let mayLoad = 0; 1415 let mayStore = 0; 1416 let hasSideEffects = 0; 1417 let SALU = 1; 1418 let SOPP = 1; 1419 let FixedSize = 1; 1420 let SchedRW = [WriteSALU]; 1421 let UseNamedOperandTable = 1; 1422 bits <16> simm16; 1423 bits <1> fixed_imm = 0; 1424 string KeyName = keyName; 1425} 1426 1427class SOPPRelaxTable <bit isRelaxed, string keyName, string gfxip> { 1428 bit IsRelaxed = isRelaxed; 1429 string KeyName = keyName # gfxip; 1430} 1431 1432class SOPP_Real<SOPP_Pseudo ps, string name = ps.Mnemonic> : 1433 InstSI <ps.OutOperandList, ps.InOperandList, 1434 name # ps.AsmOperands> { 1435 let SALU = 1; 1436 let SOPP = 1; 1437 let isPseudo = 0; 1438 let isCodeGenOnly = 0; 1439 1440 // copy relevant pseudo op flags 1441 let SubtargetPredicate = ps.SubtargetPredicate; 1442 let OtherPredicates = ps.OtherPredicates; 1443 let AsmMatchConverter = ps.AsmMatchConverter; 1444 let UseNamedOperandTable = ps.UseNamedOperandTable; 1445 let TSFlags = ps.TSFlags; 1446 let SchedRW = ps.SchedRW; 1447 let mayLoad = ps.mayLoad; 1448 let mayStore = ps.mayStore; 1449 let isTerminator = ps.isTerminator; 1450 let isReturn = ps.isReturn; 1451 let isCall = ps.isCall; 1452 let isBranch = ps.isBranch; 1453 let isBarrier = ps.isBarrier; 1454 let Uses = ps.Uses; 1455 let Defs = ps.Defs; 1456 let isConvergent = ps.isConvergent; 1457 bits <16> simm16; 1458} 1459 1460class SOPP_Real_32 <bits<7> op, SOPP_Pseudo ps, string name = ps.Mnemonic> : SOPP_Real<ps, name>, 1461Enc32 { 1462 let Inst{15-0} = !if(ps.fixed_imm, ps.simm16, simm16); 1463 let Inst{22-16} = op; 1464 let Inst{31-23} = 0x17f; 1465} 1466 1467class SOPP_Real_64 <bits<7> op, SOPP_Pseudo ps, string name = ps.Mnemonic> : SOPP_Real<ps, name>, 1468Enc64 { 1469 // encoding 1470 let Inst{15-0} = !if(ps.fixed_imm, ps.simm16, simm16); 1471 let Inst{22-16} = op; 1472 let Inst{31-23} = 0x17f; 1473 //effectively a nop 1474 let Inst{47-32} = 0x0; 1475 let Inst{54-48} = 0x0; 1476 let Inst{63-55} = 0x17f; 1477} 1478 1479multiclass SOPP_With_Relaxation <string opName, dag ins, 1480 string asmOps, list<dag> pattern=[]> { 1481 def "" : SOPP_Pseudo <opName, ins, asmOps, pattern>; 1482 def _pad_s_nop : SOPP_Pseudo <opName # "_pad_s_nop", ins, asmOps, pattern, " ", opName>; 1483} 1484 1485def S_NOP : SOPP_Pseudo<"s_nop" , (ins i16imm:$simm16), "$simm16", 1486 [(int_amdgcn_s_nop timm:$simm16)]> { 1487 let hasSideEffects = 1; 1488} 1489 1490let isTerminator = 1 in { 1491def S_ENDPGM : SOPP_Pseudo<"s_endpgm", (ins Endpgm:$simm16), "$simm16", [], ""> { 1492 let isBarrier = 1; 1493 let isReturn = 1; 1494 let hasSideEffects = 1; 1495} 1496 1497def S_ENDPGM_SAVED : SOPP_Pseudo<"s_endpgm_saved", (ins)> { 1498 let SubtargetPredicate = isGFX8Plus; 1499 let simm16 = 0; 1500 let fixed_imm = 1; 1501 let isBarrier = 1; 1502 let isReturn = 1; 1503} 1504 1505let SubtargetPredicate = isGFX9GFX10GFX11 in { 1506 let isBarrier = 1, isReturn = 1, simm16 = 0, fixed_imm = 1 in { 1507 def S_ENDPGM_ORDERED_PS_DONE : 1508 SOPP_Pseudo<"s_endpgm_ordered_ps_done", (ins)>; 1509 } // End isBarrier = 1, isReturn = 1, simm16 = 0, fixed_imm = 1 1510} // End SubtargetPredicate = isGFX9GFX10GFX11 1511 1512let SubtargetPredicate = isGFX10Plus in { 1513 let isBarrier = 1, isReturn = 1, simm16 = 0, fixed_imm = 1 in { 1514 def S_CODE_END : 1515 SOPP_Pseudo<"s_code_end", (ins)>; 1516 } // End isBarrier = 1, isReturn = 1, simm16 = 0, fixed_imm = 1 1517} // End SubtargetPredicate = isGFX10Plus 1518 1519let isBranch = 1, SchedRW = [WriteBranch] in { 1520let isBarrier = 1 in { 1521defm S_BRANCH : SOPP_With_Relaxation< 1522 "s_branch" , (ins SOPPBrTarget:$simm16), "$simm16", 1523 [(br bb:$simm16)]>; 1524} 1525 1526let Uses = [SCC] in { 1527defm S_CBRANCH_SCC0 : SOPP_With_Relaxation< 1528 "s_cbranch_scc0" , (ins SOPPBrTarget:$simm16), 1529 "$simm16" 1530>; 1531defm S_CBRANCH_SCC1 : SOPP_With_Relaxation < 1532 "s_cbranch_scc1" , (ins SOPPBrTarget:$simm16), 1533 "$simm16" 1534>; 1535} // End Uses = [SCC] 1536 1537let Uses = [VCC] in { 1538defm S_CBRANCH_VCCZ : SOPP_With_Relaxation < 1539 "s_cbranch_vccz" , (ins SOPPBrTarget:$simm16), 1540 "$simm16" 1541>; 1542defm S_CBRANCH_VCCNZ : SOPP_With_Relaxation < 1543 "s_cbranch_vccnz" , (ins SOPPBrTarget:$simm16), 1544 "$simm16" 1545>; 1546} // End Uses = [VCC] 1547 1548let Uses = [EXEC] in { 1549defm S_CBRANCH_EXECZ : SOPP_With_Relaxation < 1550 "s_cbranch_execz" , (ins SOPPBrTarget:$simm16), 1551 "$simm16" 1552>; 1553defm S_CBRANCH_EXECNZ : SOPP_With_Relaxation < 1554 "s_cbranch_execnz" , (ins SOPPBrTarget:$simm16), 1555 "$simm16" 1556>; 1557} // End Uses = [EXEC] 1558 1559defm S_CBRANCH_CDBGSYS : SOPP_With_Relaxation < 1560 "s_cbranch_cdbgsys" , (ins SOPPBrTarget:$simm16), 1561 "$simm16" 1562>; 1563 1564defm S_CBRANCH_CDBGSYS_AND_USER : SOPP_With_Relaxation < 1565 "s_cbranch_cdbgsys_and_user" , (ins SOPPBrTarget:$simm16), 1566 "$simm16" 1567>; 1568 1569defm S_CBRANCH_CDBGSYS_OR_USER : SOPP_With_Relaxation < 1570 "s_cbranch_cdbgsys_or_user" , (ins SOPPBrTarget:$simm16), 1571 "$simm16" 1572>; 1573 1574defm S_CBRANCH_CDBGUSER : SOPP_With_Relaxation < 1575 "s_cbranch_cdbguser" , (ins SOPPBrTarget:$simm16), 1576 "$simm16" 1577>; 1578 1579} // End isBranch = 1 1580} // End isTerminator = 1 1581 1582let hasSideEffects = 1 in { 1583def S_BARRIER : SOPP_Pseudo <"s_barrier", (ins), "", 1584 [(int_amdgcn_s_barrier)]> { 1585 let SchedRW = [WriteBarrier]; 1586 let simm16 = 0; 1587 let fixed_imm = 1; 1588 let isConvergent = 1; 1589} 1590 1591def S_BARRIER_WAIT : SOPP_Pseudo <"s_barrier_wait", (ins i16imm:$simm16), "$simm16", 1592 [(int_amdgcn_s_barrier_wait timm:$simm16)]> { 1593 let SchedRW = [WriteBarrier]; 1594 let isConvergent = 1; 1595} 1596 1597def S_BARRIER_LEAVE : SOPP_Pseudo <"s_barrier_leave", (ins)> { 1598 let SchedRW = [WriteBarrier]; 1599 let simm16 = 0; 1600 let fixed_imm = 1; 1601 let isConvergent = 1; 1602 let Defs = [SCC]; 1603} 1604 1605def S_BARRIER_LEAVE_IMM : SOPP_Pseudo <"s_barrier_leave", 1606 (ins i16imm:$simm16), "$simm16", [(int_amdgcn_s_barrier_leave timm:$simm16)]>; 1607 1608def S_WAKEUP : SOPP_Pseudo <"s_wakeup", (ins) > { 1609 let SubtargetPredicate = isGFX8Plus; 1610 let simm16 = 0; 1611 let fixed_imm = 1; 1612 let mayLoad = 1; 1613 let mayStore = 1; 1614} 1615 1616def S_WAITCNT : SOPP_Pseudo <"s_waitcnt" , (ins SWaitCnt:$simm16), "$simm16", 1617 [(int_amdgcn_s_waitcnt timm:$simm16)]>; 1618 1619// "_soft" waitcnts are waitcnts that are either relaxed into their non-soft 1620// counterpart, or completely removed. 1621// 1622// These are inserted by SIMemoryLegalizer to resolve memory dependencies 1623// and later optimized by SIInsertWaitcnts 1624// For example, a S_WAITCNT_soft 0 can be completely removed in a function 1625// that doesn't access memory. 1626def S_WAITCNT_soft : SOPP_Pseudo <"s_soft_waitcnt" , (ins SWaitCnt:$simm16), "$simm16">; 1627def S_WAITCNT_VSCNT_soft : SOPK_WAITCNT<"s_soft_waitcnt_vscnt">; 1628let SubtargetPredicate = isGFX12Plus in { 1629 def S_WAIT_LOADCNT_soft : SOPP_Pseudo <"s_soft_wait_loadcnt", (ins s16imm:$simm16), "$simm16">; 1630 def S_WAIT_STORECNT_soft : SOPP_Pseudo <"s_soft_wait_storecnt", (ins s16imm:$simm16), "$simm16">; 1631let OtherPredicates = [HasImageInsts] in { 1632 def S_WAIT_SAMPLECNT_soft : SOPP_Pseudo <"s_soft_wait_samplecnt", (ins s16imm:$simm16), "$simm16">; 1633 def S_WAIT_BVHCNT_soft : SOPP_Pseudo <"s_soft_wait_bvhcnt", (ins s16imm:$simm16), "$simm16">; 1634} // End OtherPredicates = [HasImageInsts]. 1635 def S_WAIT_DSCNT_soft : SOPP_Pseudo <"s_soft_wait_dscnt", (ins s16imm:$simm16), "$simm16">; 1636 def S_WAIT_KMCNT_soft : SOPP_Pseudo <"s_soft_wait_kmcnt", (ins s16imm:$simm16), "$simm16">; 1637} 1638 1639def S_SETHALT : SOPP_Pseudo <"s_sethalt" , (ins i32imm:$simm16), "$simm16", 1640 [(int_amdgcn_s_sethalt timm:$simm16)]>; 1641def S_SETKILL : SOPP_Pseudo <"s_setkill" , (ins i16imm:$simm16), "$simm16">; 1642 1643// On SI the documentation says sleep for approximately 64 * low 2 1644// bits, consistent with the reported maximum of 448. On VI the 1645// maximum reported is 960 cycles, so 960 / 64 = 15 max, so is the 1646// maximum really 15 on VI? 1647def S_SLEEP : SOPP_Pseudo <"s_sleep", (ins i32imm:$simm16), 1648 "$simm16", [(int_amdgcn_s_sleep timm:$simm16)]> { 1649} 1650 1651def S_SLEEP_VAR : SOP1_0_32 <"s_sleep_var", [(int_amdgcn_s_sleep_var SSrc_b32:$src0)]> { 1652 let hasSideEffects = 1; 1653} 1654 1655def S_SETPRIO : SOPP_Pseudo <"s_setprio", (ins i16imm:$simm16), "$simm16", 1656 [(int_amdgcn_s_setprio timm:$simm16)]> { 1657} 1658 1659let Uses = [EXEC, M0] in { 1660def S_SENDMSG : SOPP_Pseudo <"s_sendmsg" , (ins SendMsg:$simm16), "$simm16", 1661 [(int_amdgcn_s_sendmsg (i32 timm:$simm16), M0)]> { 1662} 1663 1664def S_SENDMSGHALT : SOPP_Pseudo <"s_sendmsghalt" , (ins SendMsg:$simm16), "$simm16", 1665 [(int_amdgcn_s_sendmsghalt (i32 timm:$simm16), M0)]> { 1666} 1667 1668} // End Uses = [EXEC, M0] 1669 1670def S_TRAP : SOPP_Pseudo <"s_trap" , (ins i16imm:$simm16), "$simm16"> { 1671 let isTrap = 1; 1672} 1673 1674def S_ICACHE_INV : SOPP_Pseudo <"s_icache_inv", (ins)> { 1675 let simm16 = 0; 1676 let fixed_imm = 1; 1677} 1678def S_INCPERFLEVEL : SOPP_Pseudo <"s_incperflevel", (ins i32imm:$simm16), "$simm16", 1679 [(int_amdgcn_s_incperflevel timm:$simm16)]> { 1680} 1681def S_DECPERFLEVEL : SOPP_Pseudo <"s_decperflevel", (ins i32imm:$simm16), "$simm16", 1682 [(int_amdgcn_s_decperflevel timm:$simm16)]> { 1683} 1684 1685let Uses = [M0] in 1686def S_TTRACEDATA : SOPP_Pseudo <"s_ttracedata", (ins), "", 1687 [(int_amdgcn_s_ttracedata M0)]> { 1688 let simm16 = 0; 1689 let fixed_imm = 1; 1690} 1691 1692let SubtargetPredicate = HasVGPRIndexMode in { 1693def S_SET_GPR_IDX_OFF : SOPP_Pseudo<"s_set_gpr_idx_off", (ins) > { 1694 let simm16 = 0; 1695 let fixed_imm = 1; 1696 let Defs = [MODE]; 1697 let Uses = [MODE]; 1698} 1699} 1700} // End hasSideEffects 1701 1702let SubtargetPredicate = HasVGPRIndexMode in { 1703def S_SET_GPR_IDX_MODE : SOPP_Pseudo<"s_set_gpr_idx_mode", (ins GPRIdxMode:$simm16), 1704 "$simm16"> { 1705 let Defs = [M0, MODE]; 1706 let Uses = [MODE]; 1707} 1708} 1709 1710let SubtargetPredicate = isGFX10Plus in { 1711 def S_INST_PREFETCH : 1712 SOPP_Pseudo<"s_inst_prefetch", (ins s16imm:$simm16), "$simm16">; 1713 def S_CLAUSE : 1714 SOPP_Pseudo<"s_clause", (ins s16imm:$simm16), "$simm16">; 1715 def S_WAIT_IDLE : 1716 SOPP_Pseudo <"s_wait_idle", (ins)> { 1717 let simm16 = 0; 1718 let fixed_imm = 1; 1719 } 1720 def S_WAITCNT_DEPCTR : 1721 SOPP_Pseudo <"s_waitcnt_depctr" , (ins DepCtr:$simm16), "$simm16">; 1722 1723 let hasSideEffects = 0, Uses = [MODE], Defs = [MODE] in { 1724 def S_ROUND_MODE : 1725 SOPP_Pseudo<"s_round_mode", (ins s16imm:$simm16), "$simm16">; 1726 def S_DENORM_MODE : 1727 SOPP_Pseudo<"s_denorm_mode", (ins i32imm:$simm16), "$simm16", 1728 [(SIdenorm_mode (i32 timm:$simm16))]>; 1729 } 1730 1731 let hasSideEffects = 1 in 1732 def S_TTRACEDATA_IMM : 1733 SOPP_Pseudo<"s_ttracedata_imm", (ins s16imm:$simm16), "$simm16", 1734 [(int_amdgcn_s_ttracedata_imm timm:$simm16)]>; 1735} // End SubtargetPredicate = isGFX10Plus 1736 1737let SubtargetPredicate = isGFX11Plus in { 1738let OtherPredicates = [HasExportInsts] in 1739 def S_WAIT_EVENT : SOPP_Pseudo<"s_wait_event", (ins s16imm:$simm16), 1740 "$simm16"> { 1741 let hasSideEffects = 1; 1742 } 1743 def S_DELAY_ALU : SOPP_Pseudo<"s_delay_alu", (ins SDelayALU:$simm16), 1744 "$simm16">; 1745} // End SubtargetPredicate = isGFX11Plus 1746 1747let SubtargetPredicate = isGFX12Plus, hasSideEffects = 1 in { 1748 def S_WAIT_LOADCNT : 1749 SOPP_Pseudo<"s_wait_loadcnt", (ins s16imm:$simm16), "$simm16", 1750 [(int_amdgcn_s_wait_loadcnt timm:$simm16)]>; 1751 def S_WAIT_LOADCNT_DSCNT : 1752 SOPP_Pseudo<"s_wait_loadcnt_dscnt", (ins s16imm:$simm16), "$simm16">; 1753 def S_WAIT_STORECNT : 1754 SOPP_Pseudo<"s_wait_storecnt", (ins s16imm:$simm16), "$simm16", 1755 [(int_amdgcn_s_wait_storecnt timm:$simm16)]>; 1756 def S_WAIT_STORECNT_DSCNT : 1757 SOPP_Pseudo<"s_wait_storecnt_dscnt", (ins s16imm:$simm16), "$simm16">; 1758let OtherPredicates = [HasImageInsts] in { 1759 def S_WAIT_SAMPLECNT : 1760 SOPP_Pseudo<"s_wait_samplecnt", (ins s16imm:$simm16), "$simm16", 1761 [(int_amdgcn_s_wait_samplecnt timm:$simm16)]>; 1762 def S_WAIT_BVHCNT : 1763 SOPP_Pseudo<"s_wait_bvhcnt", (ins s16imm:$simm16), "$simm16", 1764 [(int_amdgcn_s_wait_bvhcnt timm:$simm16)]>; 1765} // End OtherPredicates = [HasImageInsts]. 1766let OtherPredicates = [HasExportInsts] in 1767 def S_WAIT_EXPCNT : 1768 SOPP_Pseudo<"s_wait_expcnt", (ins s16imm:$simm16), "$simm16", 1769 [(int_amdgcn_s_wait_expcnt timm:$simm16)]>; 1770 def S_WAIT_DSCNT : 1771 SOPP_Pseudo<"s_wait_dscnt", (ins s16imm:$simm16), "$simm16", 1772 [(int_amdgcn_s_wait_dscnt timm:$simm16)]>; 1773 def S_WAIT_KMCNT : 1774 SOPP_Pseudo<"s_wait_kmcnt", (ins s16imm:$simm16), "$simm16", 1775 [(int_amdgcn_s_wait_kmcnt timm:$simm16)]>; 1776} // End SubtargetPredicate = isGFX12Plus, hasSideEffects = 1 1777 1778//===----------------------------------------------------------------------===// 1779// SOP1 Patterns 1780//===----------------------------------------------------------------------===// 1781 1782def : GCNPat < 1783 (AMDGPUendpgm), 1784 (S_ENDPGM (i16 0)) 1785>; 1786 1787def : GCNPat < 1788 (int_amdgcn_endpgm), 1789 (S_ENDPGM (i16 0)) 1790>; 1791 1792def : GCNPat < 1793 (i64 (UniformUnaryFrag<ctpop> i64:$src)), 1794 (i64 (REG_SEQUENCE SReg_64, 1795 (i32 (COPY_TO_REGCLASS (S_BCNT1_I32_B64 $src), SReg_32)), sub0, 1796 (S_MOV_B32 (i32 0)), sub1)) 1797>; 1798 1799def : GCNPat < 1800 (i32 (UniformBinFrag<smax> i32:$x, (i32 (ineg i32:$x)))), 1801 (S_ABS_I32 SReg_32:$x) 1802>; 1803 1804def : GCNPat < 1805 (i16 imm:$imm), 1806 (S_MOV_B32 imm:$imm) 1807>; 1808 1809// Same as a 32-bit inreg 1810def : GCNPat< 1811 (i32 (UniformUnaryFrag<sext> i16:$src)), 1812 (S_SEXT_I32_I16 $src) 1813>; 1814 1815let SubtargetPredicate = isNotGFX12Plus in 1816 def : GCNPat <(int_amdgcn_s_wait_event_export_ready), (S_WAIT_EVENT (i16 0))>; 1817let SubtargetPredicate = isGFX12Plus in 1818 def : GCNPat <(int_amdgcn_s_wait_event_export_ready), (S_WAIT_EVENT (i16 2))>; 1819 1820// The first 10 bits of the mode register are the core FP mode on all 1821// subtargets. 1822// 1823// The high bits include additional fields, intermixed with some 1824// non-floating point environment information. We extract the full 1825// register and clear non-relevant bits. 1826// 1827// EXCP_EN covers floating point exceptions, but also some other 1828// non-FP exceptions. 1829// 1830// Bits 12-18 cover the relevant exception mask on all subtargets. 1831// 1832// FIXME: Bit 18 is int_div0, should this be in the FP environment? I 1833// think the only source is v_rcp_iflag_i32. 1834// 1835// On GFX9+: 1836// Bit 23 is the additional FP16_OVFL mode. 1837// 1838// Bits 19, 20, and 21 cover non-FP exceptions and differ between 1839// gfx9/10/11, so we ignore them here. 1840 1841// TODO: Would it be cheaper to emit multiple s_getreg_b32 calls for 1842// the ranges and combine the results? 1843 1844defvar fp_round_mask = !add(!shl(1, 4), -1); 1845defvar fp_denorm_mask = !shl(!add(!shl(1, 4), -1), 4); 1846defvar dx10_clamp_mask = !shl(1, 8); 1847defvar ieee_mode_mask = !shl(1, 9); 1848 1849// Covers fp_round, fp_denorm, dx10_clamp, and IEEE bit. 1850defvar fpmode_mask = 1851 !or(fp_round_mask, fp_denorm_mask, dx10_clamp_mask, ieee_mode_mask); 1852 1853defvar fp_excp_en_mask = !shl(!add(!shl(1, 7), -1), 12); 1854defvar fp16_ovfl = !shl(1, 23); 1855defvar fpmode_mask_gfx6plus = !or(fpmode_mask, fp_excp_en_mask); 1856defvar fpmode_mask_gfx9plus = !or(fpmode_mask_gfx6plus, fp16_ovfl); 1857 1858class GetFPModePat<int fpmode_mask> : GCNPat< 1859 (i32 get_fpmode), 1860 (S_AND_B32 (i32 fpmode_mask), 1861 (S_GETREG_B32 getHwRegImm< 1862 HWREG.MODE, 0, 1863 !add(!logtwo(fpmode_mask), 1)>.ret)) 1864>; 1865 1866// TODO: Might be worth moving to custom lowering so the and is 1867// exposed to demanded bits optimizations. Most users probably only 1868// care about the rounding or denorm mode bits. We also can reduce the 1869// demanded read from the getreg immediate. 1870let SubtargetPredicate = isGFX9Plus in { 1871// Last bit = FP16_OVFL 1872def : GetFPModePat<fpmode_mask_gfx9plus>; 1873} 1874 1875// Last bit = EXCP_EN.int_div0 1876let SubtargetPredicate = isNotGFX9Plus in { 1877def : GetFPModePat<fpmode_mask_gfx6plus>; 1878} 1879 1880let SubtargetPredicate = isGFX9GFX10 in 1881def : GCNPat< 1882 (int_amdgcn_pops_exiting_wave_id), 1883 (S_MOV_B32_sideeffects (i32 SRC_POPS_EXITING_WAVE_ID)) 1884>; 1885 1886//===----------------------------------------------------------------------===// 1887// SOP2 Patterns 1888//===----------------------------------------------------------------------===// 1889 1890def UniformSelect : PatFrag< 1891 (ops node:$src0, node:$src1), 1892 (select SCC, $src0, $src1), 1893 [{ return !N->isDivergent(); }] 1894>; 1895 1896let AddedComplexity = 20 in { 1897 def : GCNPat< 1898 (i32 (UniformSelect i32:$src0, i32:$src1)), 1899 (S_CSELECT_B32 SSrc_b32:$src0, SSrc_b32:$src1) 1900 >; 1901 1902 // TODO: The predicate should not be necessary, but enabling this pattern for 1903 // all subtargets generates worse code in some cases. 1904 let OtherPredicates = [HasPseudoScalarTrans] in 1905 def : GCNPat< 1906 (f32 (UniformSelect f32:$src0, f32:$src1)), 1907 (S_CSELECT_B32 SSrc_b32:$src0, SSrc_b32:$src1) 1908 >; 1909} 1910 1911// V_ADD_I32_e32/S_ADD_U32 produces carry in VCC/SCC. For the vector 1912// case, the sgpr-copies pass will fix this to use the vector version. 1913def : GCNPat < 1914 (i32 (addc i32:$src0, i32:$src1)), 1915 (S_ADD_U32 $src0, $src1) 1916>; 1917 1918// FIXME: We need to use COPY_TO_REGCLASS to work-around the fact that 1919// REG_SEQUENCE patterns don't support instructions with multiple 1920// outputs. 1921def : GCNPat< 1922 (i64 (UniformUnaryFrag<zext> i16:$src)), 1923 (REG_SEQUENCE SReg_64, 1924 (i32 (COPY_TO_REGCLASS (S_AND_B32 $src, (S_MOV_B32 (i32 0xffff))), SGPR_32)), sub0, 1925 (S_MOV_B32 (i32 0)), sub1) 1926>; 1927 1928def : GCNPat < 1929 (i64 (UniformUnaryFrag<sext> i16:$src)), 1930 (REG_SEQUENCE SReg_64, (i32 (S_SEXT_I32_I16 $src)), sub0, 1931 (i32 (COPY_TO_REGCLASS (S_ASHR_I32 (i32 (S_SEXT_I32_I16 $src)), (S_MOV_B32 (i32 31))), SGPR_32)), sub1) 1932>; 1933 1934def : GCNPat< 1935 (i32 (UniformUnaryFrag<zext> i16:$src)), 1936 (S_AND_B32 (S_MOV_B32 (i32 0xffff)), $src) 1937>; 1938 1939class ScalarNot2Pat<Instruction inst, SDPatternOperator op, ValueType vt, 1940 SDPatternOperator notnode = !if(vt.isVector, vnot, not)> : GCNPat< 1941 (UniformBinFrag<op> vt:$src0, (notnode vt:$src1)), 1942 (inst getSOPSrcForVT<vt>.ret:$src0, getSOPSrcForVT<vt>.ret:$src1) 1943>; 1944 1945// Match these for some more types 1946// TODO: i1 1947def : ScalarNot2Pat<S_ANDN2_B32, and, i16>; 1948def : ScalarNot2Pat<S_ANDN2_B32, and, v2i16>; 1949def : ScalarNot2Pat<S_ANDN2_B64, and, v4i16>; 1950def : ScalarNot2Pat<S_ANDN2_B64, and, v2i32>; 1951 1952def : ScalarNot2Pat<S_ORN2_B32, or, i16>; 1953def : ScalarNot2Pat<S_ORN2_B32, or, v2i16>; 1954def : ScalarNot2Pat<S_ORN2_B64, or, v4i16>; 1955def : ScalarNot2Pat<S_ORN2_B64, or, v2i32>; 1956 1957//===----------------------------------------------------------------------===// 1958// Target-specific instruction encodings. 1959//===----------------------------------------------------------------------===// 1960 1961class Select<GFXGen Gen, string opName> : SIMCInstr<opName, Gen.Subtarget> { 1962 Predicate AssemblerPredicate = Gen.AssemblerPredicate; 1963 string DecoderNamespace = Gen.DecoderNamespace; 1964} 1965 1966class Select_vi<string opName> : SIMCInstr<opName, SIEncodingFamily.VI> { 1967 Predicate AssemblerPredicate = isGFX8GFX9; 1968 string DecoderNamespace = "GFX8"; 1969} 1970 1971class Select_gfx6_gfx7<string opName> : SIMCInstr<opName, SIEncodingFamily.SI> { 1972 Predicate AssemblerPredicate = isGFX6GFX7; 1973 string DecoderNamespace = "GFX6GFX7"; 1974} 1975 1976//===----------------------------------------------------------------------===// 1977// SOP1 - GFX11, GFX12 1978//===----------------------------------------------------------------------===// 1979 1980multiclass SOP1_Real_gfx11<bits<8> op, string name = !tolower(NAME)> { 1981 defvar ps = !cast<SOP1_Pseudo>(NAME); 1982 def _gfx11 : SOP1_Real<op, ps, name>, 1983 Select<GFX11Gen, ps.PseudoInstr>; 1984 if !ne(ps.Mnemonic, name) then 1985 def : AMDGPUMnemonicAlias<ps.Mnemonic, name> { 1986 let AssemblerPredicate = isGFX11Only; 1987 } 1988} 1989 1990multiclass SOP1_Real_gfx12<bits<8> op, string name = !tolower(NAME)> { 1991 defvar ps = !cast<SOP1_Pseudo>(NAME); 1992 def _gfx12 : SOP1_Real<op, ps, name>, 1993 Select<GFX12Gen, ps.PseudoInstr>; 1994 if !ne(ps.Mnemonic, name) then 1995 def : AMDGPUMnemonicAlias<ps.Mnemonic, name> { 1996 let AssemblerPredicate = isGFX12Plus; 1997 } 1998} 1999 2000multiclass SOP1_M0_Real_gfx12<bits<8> op> { 2001 def _gfx12 : SOP1_Real<op, !cast<SOP1_Pseudo>(NAME)>, 2002 Select<GFX12Gen, !cast<SOP1_Pseudo>(NAME).PseudoInstr> { 2003 let Inst{7-0} = M0_gfx11plus.HWEncoding{7-0}; // Set Src0 encoding to M0 2004 } 2005} 2006 2007multiclass SOP1_IMM_Real_gfx12<bits<8> op> { 2008 defvar ps = !cast<SOP1_Pseudo>(NAME); 2009 def _gfx12 : SOP1_Real<op, ps>, 2010 Select<GFX12Gen, ps.PseudoInstr>; 2011} 2012 2013multiclass SOP1_Real_gfx11_gfx12<bits<8> op, string name = !tolower(NAME)> : 2014 SOP1_Real_gfx11<op, name>, SOP1_Real_gfx12<op, name>; 2015 2016defm S_MOV_B32 : SOP1_Real_gfx11_gfx12<0x000>; 2017defm S_MOV_B64 : SOP1_Real_gfx11_gfx12<0x001>; 2018defm S_CMOV_B32 : SOP1_Real_gfx11_gfx12<0x002>; 2019defm S_CMOV_B64 : SOP1_Real_gfx11_gfx12<0x003>; 2020defm S_BREV_B32 : SOP1_Real_gfx11_gfx12<0x004>; 2021defm S_BREV_B64 : SOP1_Real_gfx11_gfx12<0x005>; 2022defm S_FF1_I32_B32 : SOP1_Real_gfx11_gfx12<0x008, "s_ctz_i32_b32">; 2023defm S_FF1_I32_B64 : SOP1_Real_gfx11_gfx12<0x009, "s_ctz_i32_b64">; 2024defm S_FLBIT_I32_B32 : SOP1_Real_gfx11_gfx12<0x00a, "s_clz_i32_u32">; 2025defm S_FLBIT_I32_B64 : SOP1_Real_gfx11_gfx12<0x00b, "s_clz_i32_u64">; 2026defm S_FLBIT_I32 : SOP1_Real_gfx11_gfx12<0x00c, "s_cls_i32">; 2027defm S_FLBIT_I32_I64 : SOP1_Real_gfx11_gfx12<0x00d, "s_cls_i32_i64">; 2028defm S_SEXT_I32_I8 : SOP1_Real_gfx11_gfx12<0x00e>; 2029defm S_SEXT_I32_I16 : SOP1_Real_gfx11_gfx12<0x00f>; 2030defm S_BITSET0_B32 : SOP1_Real_gfx11_gfx12<0x010>; 2031defm S_BITSET0_B64 : SOP1_Real_gfx11_gfx12<0x011>; 2032defm S_BITSET1_B32 : SOP1_Real_gfx11_gfx12<0x012>; 2033defm S_BITSET1_B64 : SOP1_Real_gfx11_gfx12<0x013>; 2034defm S_BITREPLICATE_B64_B32 : SOP1_Real_gfx11_gfx12<0x014>; 2035defm S_ABS_I32 : SOP1_Real_gfx11_gfx12<0x015>; 2036defm S_BCNT0_I32_B32 : SOP1_Real_gfx11_gfx12<0x016>; 2037defm S_BCNT0_I32_B64 : SOP1_Real_gfx11_gfx12<0x017>; 2038defm S_BCNT1_I32_B32 : SOP1_Real_gfx11_gfx12<0x018>; 2039defm S_BCNT1_I32_B64 : SOP1_Real_gfx11_gfx12<0x019>; 2040defm S_QUADMASK_B32 : SOP1_Real_gfx11_gfx12<0x01a>; 2041defm S_QUADMASK_B64 : SOP1_Real_gfx11_gfx12<0x01b>; 2042defm S_WQM_B32 : SOP1_Real_gfx11_gfx12<0x01c>; 2043defm S_WQM_B64 : SOP1_Real_gfx11_gfx12<0x01d>; 2044defm S_NOT_B32 : SOP1_Real_gfx11_gfx12<0x01e>; 2045defm S_NOT_B64 : SOP1_Real_gfx11_gfx12<0x01f>; 2046defm S_AND_SAVEEXEC_B32 : SOP1_Real_gfx11_gfx12<0x020>; 2047defm S_AND_SAVEEXEC_B64 : SOP1_Real_gfx11_gfx12<0x021>; 2048defm S_OR_SAVEEXEC_B32 : SOP1_Real_gfx11_gfx12<0x022>; 2049defm S_OR_SAVEEXEC_B64 : SOP1_Real_gfx11_gfx12<0x023>; 2050defm S_XOR_SAVEEXEC_B32 : SOP1_Real_gfx11_gfx12<0x024>; 2051defm S_XOR_SAVEEXEC_B64 : SOP1_Real_gfx11_gfx12<0x025>; 2052defm S_NAND_SAVEEXEC_B32 : SOP1_Real_gfx11_gfx12<0x026>; 2053defm S_NAND_SAVEEXEC_B64 : SOP1_Real_gfx11_gfx12<0x027>; 2054defm S_NOR_SAVEEXEC_B32 : SOP1_Real_gfx11_gfx12<0x028>; 2055defm S_NOR_SAVEEXEC_B64 : SOP1_Real_gfx11_gfx12<0x029>; 2056defm S_XNOR_SAVEEXEC_B32 : SOP1_Real_gfx11_gfx12<0x02a>; 2057defm S_ANDN1_SAVEEXEC_B32 : SOP1_Real_gfx11_gfx12<0x02c, "s_and_not0_saveexec_b32">; 2058defm S_ANDN1_SAVEEXEC_B64 : SOP1_Real_gfx11_gfx12<0x02d, "s_and_not0_saveexec_b64">; 2059defm S_ORN1_SAVEEXEC_B32 : SOP1_Real_gfx11_gfx12<0x02e, "s_or_not0_saveexec_b32">; 2060defm S_ORN1_SAVEEXEC_B64 : SOP1_Real_gfx11_gfx12<0x02f, "s_or_not0_saveexec_b64">; 2061defm S_ANDN2_SAVEEXEC_B32 : SOP1_Real_gfx11_gfx12<0x030, "s_and_not1_saveexec_b32">; 2062defm S_ANDN2_SAVEEXEC_B64 : SOP1_Real_gfx11_gfx12<0x031, "s_and_not1_saveexec_b64">; 2063defm S_ORN2_SAVEEXEC_B32 : SOP1_Real_gfx11_gfx12<0x032, "s_or_not1_saveexec_b32">; 2064defm S_ORN2_SAVEEXEC_B64 : SOP1_Real_gfx11_gfx12<0x033, "s_or_not1_saveexec_b64">; 2065defm S_ANDN1_WREXEC_B32 : SOP1_Real_gfx11_gfx12<0x034, "s_and_not0_wrexec_b32">; 2066defm S_ANDN1_WREXEC_B64 : SOP1_Real_gfx11_gfx12<0x035, "s_and_not0_wrexec_b64">; 2067defm S_ANDN2_WREXEC_B32 : SOP1_Real_gfx11_gfx12<0x036, "s_and_not1_wrexec_b32">; 2068defm S_ANDN2_WREXEC_B64 : SOP1_Real_gfx11_gfx12<0x037, "s_and_not1_wrexec_b64">; 2069defm S_MOVRELS_B32 : SOP1_Real_gfx11_gfx12<0x040>; 2070defm S_MOVRELS_B64 : SOP1_Real_gfx11_gfx12<0x041>; 2071defm S_MOVRELD_B32 : SOP1_Real_gfx11_gfx12<0x042>; 2072defm S_MOVRELD_B64 : SOP1_Real_gfx11_gfx12<0x043>; 2073defm S_MOVRELSD_2_B32 : SOP1_Real_gfx11_gfx12<0x044>; 2074defm S_GETPC_B64 : SOP1_Real_gfx11_gfx12<0x047>; 2075defm S_SETPC_B64 : SOP1_Real_gfx11_gfx12<0x048>; 2076defm S_SWAPPC_B64 : SOP1_Real_gfx11_gfx12<0x049>; 2077defm S_RFE_B64 : SOP1_Real_gfx11_gfx12<0x04a>; 2078defm S_SENDMSG_RTN_B32 : SOP1_Real_gfx11_gfx12<0x04c>; 2079defm S_SENDMSG_RTN_B64 : SOP1_Real_gfx11_gfx12<0x04d>; 2080defm S_BARRIER_SIGNAL_M0 : SOP1_M0_Real_gfx12<0x04e>; 2081defm S_BARRIER_SIGNAL_ISFIRST_M0 : SOP1_M0_Real_gfx12<0x04f>; 2082defm S_GET_BARRIER_STATE_M0 : SOP1_M0_Real_gfx12<0x050>; 2083defm S_BARRIER_INIT_M0 : SOP1_M0_Real_gfx12<0x051>; 2084defm S_BARRIER_JOIN_M0 : SOP1_M0_Real_gfx12<0x052>; 2085defm S_BARRIER_SIGNAL_IMM : SOP1_IMM_Real_gfx12<0x04e>; 2086defm S_BARRIER_SIGNAL_ISFIRST_IMM : SOP1_IMM_Real_gfx12<0x04f>; 2087defm S_GET_BARRIER_STATE_IMM : SOP1_IMM_Real_gfx12<0x050>; 2088defm S_BARRIER_INIT_IMM : SOP1_IMM_Real_gfx12<0x051>; 2089defm S_BARRIER_JOIN_IMM : SOP1_IMM_Real_gfx12<0x052>; 2090defm S_SLEEP_VAR : SOP1_IMM_Real_gfx12<0x058>; 2091 2092//===----------------------------------------------------------------------===// 2093// SOP1 - GFX1150, GFX12 2094//===----------------------------------------------------------------------===// 2095 2096defm S_CEIL_F32 : SOP1_Real_gfx11_gfx12<0x060>; 2097defm S_FLOOR_F32 : SOP1_Real_gfx11_gfx12<0x061>; 2098defm S_TRUNC_F32 : SOP1_Real_gfx11_gfx12<0x062>; 2099defm S_RNDNE_F32 : SOP1_Real_gfx11_gfx12<0x063>; 2100defm S_CVT_F32_I32 : SOP1_Real_gfx11_gfx12<0x064>; 2101defm S_CVT_F32_U32 : SOP1_Real_gfx11_gfx12<0x065>; 2102defm S_CVT_I32_F32 : SOP1_Real_gfx11_gfx12<0x066>; 2103defm S_CVT_U32_F32 : SOP1_Real_gfx11_gfx12<0x067>; 2104defm S_CVT_F16_F32 : SOP1_Real_gfx11_gfx12<0x068>; 2105defm S_CVT_F32_F16 : SOP1_Real_gfx11_gfx12<0x069>; 2106defm S_CVT_HI_F32_F16 : SOP1_Real_gfx11_gfx12<0x06a>; 2107defm S_CEIL_F16 : SOP1_Real_gfx11_gfx12<0x06b>; 2108defm S_FLOOR_F16 : SOP1_Real_gfx11_gfx12<0x06c>; 2109defm S_TRUNC_F16 : SOP1_Real_gfx11_gfx12<0x06d>; 2110defm S_RNDNE_F16 : SOP1_Real_gfx11_gfx12<0x06e>; 2111 2112//===----------------------------------------------------------------------===// 2113// SOP1 - GFX10. 2114//===----------------------------------------------------------------------===// 2115 2116multiclass SOP1_Real_gfx10<bits<8> op> { 2117 defvar ps = !cast<SOP1_Pseudo>(NAME); 2118 def _gfx10 : SOP1_Real<op, ps>, 2119 Select<GFX10Gen, ps.PseudoInstr>; 2120} 2121 2122multiclass SOP1_Real_gfx10_gfx11_gfx12<bits<8> op> : 2123 SOP1_Real_gfx10<op>, SOP1_Real_gfx11_gfx12<op>; 2124 2125defm S_ANDN1_SAVEEXEC_B64 : SOP1_Real_gfx10<0x037>; 2126defm S_ORN1_SAVEEXEC_B64 : SOP1_Real_gfx10<0x038>; 2127defm S_ANDN1_WREXEC_B64 : SOP1_Real_gfx10<0x039>; 2128defm S_ANDN2_WREXEC_B64 : SOP1_Real_gfx10<0x03a>; 2129defm S_BITREPLICATE_B64_B32 : SOP1_Real_gfx10<0x03b>; 2130defm S_AND_SAVEEXEC_B32 : SOP1_Real_gfx10<0x03c>; 2131defm S_OR_SAVEEXEC_B32 : SOP1_Real_gfx10<0x03d>; 2132defm S_XOR_SAVEEXEC_B32 : SOP1_Real_gfx10<0x03e>; 2133defm S_ANDN2_SAVEEXEC_B32 : SOP1_Real_gfx10<0x03f>; 2134defm S_ORN2_SAVEEXEC_B32 : SOP1_Real_gfx10<0x040>; 2135defm S_NAND_SAVEEXEC_B32 : SOP1_Real_gfx10<0x041>; 2136defm S_NOR_SAVEEXEC_B32 : SOP1_Real_gfx10<0x042>; 2137defm S_XNOR_SAVEEXEC_B32 : SOP1_Real_gfx10<0x043>; 2138defm S_ANDN1_SAVEEXEC_B32 : SOP1_Real_gfx10<0x044>; 2139defm S_ORN1_SAVEEXEC_B32 : SOP1_Real_gfx10<0x045>; 2140defm S_ANDN1_WREXEC_B32 : SOP1_Real_gfx10<0x046>; 2141defm S_ANDN2_WREXEC_B32 : SOP1_Real_gfx10<0x047>; 2142defm S_MOVRELSD_2_B32 : SOP1_Real_gfx10<0x049>; 2143 2144//===----------------------------------------------------------------------===// 2145// SOP1 - GFX6, GFX7, GFX10, GFX11. 2146//===----------------------------------------------------------------------===// 2147 2148 2149multiclass SOP1_Real_gfx6_gfx7<bits<8> op> { 2150 defvar ps = !cast<SOP1_Pseudo>(NAME); 2151 def _gfx6_gfx7 : SOP1_Real<op, ps>, 2152 Select_gfx6_gfx7<ps.PseudoInstr>; 2153} 2154 2155multiclass SOP1_Real_gfx6_gfx7_gfx10<bits<8> op> : 2156 SOP1_Real_gfx6_gfx7<op>, SOP1_Real_gfx10<op>; 2157 2158multiclass SOP1_Real_gfx6_gfx7_gfx10_gfx11_gfx12<bits<8> op> : 2159 SOP1_Real_gfx6_gfx7<op>, SOP1_Real_gfx10_gfx11_gfx12<op>; 2160 2161defm S_CBRANCH_JOIN : SOP1_Real_gfx6_gfx7<0x032>; 2162 2163defm S_MOV_B32 : SOP1_Real_gfx6_gfx7_gfx10<0x003>; 2164defm S_MOV_B64 : SOP1_Real_gfx6_gfx7_gfx10<0x004>; 2165defm S_CMOV_B32 : SOP1_Real_gfx6_gfx7_gfx10<0x005>; 2166defm S_CMOV_B64 : SOP1_Real_gfx6_gfx7_gfx10<0x006>; 2167defm S_NOT_B32 : SOP1_Real_gfx6_gfx7_gfx10<0x007>; 2168defm S_NOT_B64 : SOP1_Real_gfx6_gfx7_gfx10<0x008>; 2169defm S_WQM_B32 : SOP1_Real_gfx6_gfx7_gfx10<0x009>; 2170defm S_WQM_B64 : SOP1_Real_gfx6_gfx7_gfx10<0x00a>; 2171defm S_BREV_B32 : SOP1_Real_gfx6_gfx7_gfx10<0x00b>; 2172defm S_BREV_B64 : SOP1_Real_gfx6_gfx7_gfx10<0x00c>; 2173defm S_BCNT0_I32_B32 : SOP1_Real_gfx6_gfx7_gfx10<0x00d>; 2174defm S_BCNT0_I32_B64 : SOP1_Real_gfx6_gfx7_gfx10<0x00e>; 2175defm S_BCNT1_I32_B32 : SOP1_Real_gfx6_gfx7_gfx10<0x00f>; 2176defm S_BCNT1_I32_B64 : SOP1_Real_gfx6_gfx7_gfx10<0x010>; 2177defm S_FF0_I32_B32 : SOP1_Real_gfx6_gfx7_gfx10<0x011>; 2178defm S_FF0_I32_B64 : SOP1_Real_gfx6_gfx7_gfx10<0x012>; 2179defm S_FF1_I32_B32 : SOP1_Real_gfx6_gfx7_gfx10<0x013>; 2180defm S_FF1_I32_B64 : SOP1_Real_gfx6_gfx7_gfx10<0x014>; 2181defm S_FLBIT_I32_B32 : SOP1_Real_gfx6_gfx7_gfx10<0x015>; 2182defm S_FLBIT_I32_B64 : SOP1_Real_gfx6_gfx7_gfx10<0x016>; 2183defm S_FLBIT_I32 : SOP1_Real_gfx6_gfx7_gfx10<0x017>; 2184defm S_FLBIT_I32_I64 : SOP1_Real_gfx6_gfx7_gfx10<0x018>; 2185defm S_SEXT_I32_I8 : SOP1_Real_gfx6_gfx7_gfx10<0x019>; 2186defm S_SEXT_I32_I16 : SOP1_Real_gfx6_gfx7_gfx10<0x01a>; 2187defm S_BITSET0_B32 : SOP1_Real_gfx6_gfx7_gfx10<0x01b>; 2188defm S_BITSET0_B64 : SOP1_Real_gfx6_gfx7_gfx10<0x01c>; 2189defm S_BITSET1_B32 : SOP1_Real_gfx6_gfx7_gfx10<0x01d>; 2190defm S_BITSET1_B64 : SOP1_Real_gfx6_gfx7_gfx10<0x01e>; 2191defm S_GETPC_B64 : SOP1_Real_gfx6_gfx7_gfx10<0x01f>; 2192defm S_SETPC_B64 : SOP1_Real_gfx6_gfx7_gfx10<0x020>; 2193defm S_SWAPPC_B64 : SOP1_Real_gfx6_gfx7_gfx10<0x021>; 2194defm S_RFE_B64 : SOP1_Real_gfx6_gfx7_gfx10<0x022>; 2195defm S_AND_SAVEEXEC_B64 : SOP1_Real_gfx6_gfx7_gfx10<0x024>; 2196defm S_OR_SAVEEXEC_B64 : SOP1_Real_gfx6_gfx7_gfx10<0x025>; 2197defm S_XOR_SAVEEXEC_B64 : SOP1_Real_gfx6_gfx7_gfx10<0x026>; 2198defm S_ANDN2_SAVEEXEC_B64 : SOP1_Real_gfx6_gfx7_gfx10<0x027>; 2199defm S_ORN2_SAVEEXEC_B64 : SOP1_Real_gfx6_gfx7_gfx10<0x028>; 2200defm S_NAND_SAVEEXEC_B64 : SOP1_Real_gfx6_gfx7_gfx10<0x029>; 2201defm S_NOR_SAVEEXEC_B64 : SOP1_Real_gfx6_gfx7_gfx10<0x02a>; 2202defm S_XNOR_SAVEEXEC_B64 : SOP1_Real_gfx6_gfx7_gfx10_gfx11_gfx12<0x02b>; 2203defm S_QUADMASK_B32 : SOP1_Real_gfx6_gfx7_gfx10<0x02c>; 2204defm S_QUADMASK_B64 : SOP1_Real_gfx6_gfx7_gfx10<0x02d>; 2205defm S_MOVRELS_B32 : SOP1_Real_gfx6_gfx7_gfx10<0x02e>; 2206defm S_MOVRELS_B64 : SOP1_Real_gfx6_gfx7_gfx10<0x02f>; 2207defm S_MOVRELD_B32 : SOP1_Real_gfx6_gfx7_gfx10<0x030>; 2208defm S_MOVRELD_B64 : SOP1_Real_gfx6_gfx7_gfx10<0x031>; 2209defm S_ABS_I32 : SOP1_Real_gfx6_gfx7_gfx10<0x034>; 2210 2211//===----------------------------------------------------------------------===// 2212// SOP2 - GFX12 2213//===----------------------------------------------------------------------===// 2214 2215multiclass SOP2_Real_gfx12<bits<7> op, string name = !tolower(NAME)> { 2216 defvar ps = !cast<SOP2_Pseudo>(NAME); 2217 def _gfx12 : SOP2_Real32<op, ps, name>, 2218 Select<GFX12Gen, ps.PseudoInstr>; 2219 if !ne(ps.Mnemonic, name) then 2220 def : AMDGPUMnemonicAlias<ps.Mnemonic, name> { 2221 let AssemblerPredicate = isGFX12Plus; 2222 } 2223} 2224 2225defm S_MINIMUM_F32 : SOP2_Real_gfx12<0x04f>; 2226defm S_MAXIMUM_F32 : SOP2_Real_gfx12<0x050>; 2227defm S_MINIMUM_F16 : SOP2_Real_gfx12<0x051>; 2228defm S_MAXIMUM_F16 : SOP2_Real_gfx12<0x052>; 2229 2230//===----------------------------------------------------------------------===// 2231// SOP2 - GFX11, GFX12. 2232//===----------------------------------------------------------------------===// 2233 2234multiclass SOP2_Real_gfx11<bits<7> op, string name = !tolower(NAME)> { 2235 defvar ps = !cast<SOP2_Pseudo>(NAME); 2236 def _gfx11 : SOP2_Real32<op, ps, name>, 2237 Select<GFX11Gen, ps.PseudoInstr>; 2238 if !ne(ps.Mnemonic, name) then 2239 def : AMDGPUMnemonicAlias<ps.Mnemonic, name> { 2240 let AssemblerPredicate = isGFX11Only; 2241 } 2242} 2243 2244multiclass SOP2_Real_gfx11_gfx12<bits<7> op, string name = !tolower(NAME)> : 2245 SOP2_Real_gfx11<op, name>, SOP2_Real_gfx12<op, name>; 2246 2247defm S_ABSDIFF_I32 : SOP2_Real_gfx11_gfx12<0x006>; 2248defm S_LSHL_B32 : SOP2_Real_gfx11_gfx12<0x008>; 2249defm S_LSHL_B64 : SOP2_Real_gfx11_gfx12<0x009>; 2250defm S_LSHR_B32 : SOP2_Real_gfx11_gfx12<0x00a>; 2251defm S_LSHR_B64 : SOP2_Real_gfx11_gfx12<0x00b>; 2252defm S_ASHR_I32 : SOP2_Real_gfx11_gfx12<0x00c>; 2253defm S_ASHR_I64 : SOP2_Real_gfx11_gfx12<0x00d>; 2254defm S_LSHL1_ADD_U32 : SOP2_Real_gfx11_gfx12<0x00e>; 2255defm S_LSHL2_ADD_U32 : SOP2_Real_gfx11_gfx12<0x00f>; 2256defm S_LSHL3_ADD_U32 : SOP2_Real_gfx11_gfx12<0x010>; 2257defm S_LSHL4_ADD_U32 : SOP2_Real_gfx11_gfx12<0x011>; 2258defm S_MIN_I32 : SOP2_Real_gfx11_gfx12<0x012>; 2259defm S_MIN_U32 : SOP2_Real_gfx11_gfx12<0x013>; 2260defm S_MAX_I32 : SOP2_Real_gfx11_gfx12<0x014>; 2261defm S_MAX_U32 : SOP2_Real_gfx11_gfx12<0x015>; 2262defm S_AND_B32 : SOP2_Real_gfx11_gfx12<0x016>; 2263defm S_AND_B64 : SOP2_Real_gfx11_gfx12<0x017>; 2264defm S_OR_B32 : SOP2_Real_gfx11_gfx12<0x018>; 2265defm S_OR_B64 : SOP2_Real_gfx11_gfx12<0x019>; 2266defm S_XOR_B32 : SOP2_Real_gfx11_gfx12<0x01a>; 2267defm S_XOR_B64 : SOP2_Real_gfx11_gfx12<0x01b>; 2268defm S_NAND_B32 : SOP2_Real_gfx11_gfx12<0x01c>; 2269defm S_NAND_B64 : SOP2_Real_gfx11_gfx12<0x01d>; 2270defm S_NOR_B32 : SOP2_Real_gfx11_gfx12<0x01e>; 2271defm S_NOR_B64 : SOP2_Real_gfx11_gfx12<0x01f>; 2272defm S_XNOR_B32 : SOP2_Real_gfx11_gfx12<0x020>; 2273defm S_XNOR_B64 : SOP2_Real_gfx11_gfx12<0x021>; 2274defm S_ANDN2_B32 : SOP2_Real_gfx11_gfx12<0x022, "s_and_not1_b32">; 2275defm S_ANDN2_B64 : SOP2_Real_gfx11_gfx12<0x023, "s_and_not1_b64">; 2276defm S_ORN2_B32 : SOP2_Real_gfx11_gfx12<0x024, "s_or_not1_b32">; 2277defm S_ORN2_B64 : SOP2_Real_gfx11_gfx12<0x025, "s_or_not1_b64">; 2278defm S_BFE_U32 : SOP2_Real_gfx11_gfx12<0x026>; 2279defm S_BFE_I32 : SOP2_Real_gfx11_gfx12<0x027>; 2280defm S_BFE_U64 : SOP2_Real_gfx11_gfx12<0x028>; 2281defm S_BFE_I64 : SOP2_Real_gfx11_gfx12<0x029>; 2282defm S_BFM_B32 : SOP2_Real_gfx11_gfx12<0x02a>; 2283defm S_BFM_B64 : SOP2_Real_gfx11_gfx12<0x02b>; 2284defm S_MUL_I32 : SOP2_Real_gfx11_gfx12<0x02c>; 2285defm S_MUL_HI_U32 : SOP2_Real_gfx11_gfx12<0x02d>; 2286defm S_MUL_HI_I32 : SOP2_Real_gfx11_gfx12<0x02e>; 2287defm S_CSELECT_B32 : SOP2_Real_gfx11_gfx12<0x030>; 2288defm S_CSELECT_B64 : SOP2_Real_gfx11_gfx12<0x031>; 2289defm S_PACK_HL_B32_B16 : SOP2_Real_gfx11_gfx12<0x035>; 2290defm S_ADD_U64 : SOP2_Real_gfx12<0x053, "s_add_nc_u64">; 2291defm S_SUB_U64 : SOP2_Real_gfx12<0x054, "s_sub_nc_u64">; 2292defm S_MUL_U64 : SOP2_Real_gfx12<0x055>; 2293 2294//===----------------------------------------------------------------------===// 2295// SOP2 - GFX1150, GFX12 2296//===----------------------------------------------------------------------===// 2297 2298multiclass SOP2_Real_FMAK_gfx12<bits<7> op> { 2299 def _gfx12 : SOP2_Real64<op, !cast<SOP2_Pseudo>(NAME)>, 2300 Select<GFX12Gen, !cast<SOP2_Pseudo>(NAME).PseudoInstr>; 2301} 2302 2303multiclass SOP2_Real_FMAK_gfx11<bits<7> op> { 2304 def _gfx11 : SOP2_Real64<op, !cast<SOP2_Pseudo>(NAME)>, 2305 Select<GFX11Gen, !cast<SOP2_Pseudo>(NAME).PseudoInstr>; 2306} 2307 2308multiclass SOP2_Real_FMAK_gfx11_gfx12<bits<7> op> : 2309 SOP2_Real_FMAK_gfx11<op>, SOP2_Real_FMAK_gfx12<op>; 2310 2311defm S_ADD_F32 : SOP2_Real_gfx11_gfx12<0x040>; 2312defm S_SUB_F32 : SOP2_Real_gfx11_gfx12<0x041>; 2313defm S_MUL_F32 : SOP2_Real_gfx11_gfx12<0x044>; 2314defm S_FMAAK_F32 : SOP2_Real_FMAK_gfx11_gfx12<0x045>; 2315defm S_FMAMK_F32 : SOP2_Real_FMAK_gfx11_gfx12<0x046>; 2316defm S_FMAC_F32 : SOP2_Real_gfx11_gfx12<0x047>; 2317defm S_CVT_PK_RTZ_F16_F32 : SOP2_Real_gfx11_gfx12<0x048>; 2318defm S_ADD_F16 : SOP2_Real_gfx11_gfx12<0x049>; 2319defm S_SUB_F16 : SOP2_Real_gfx11_gfx12<0x04a>; 2320defm S_MUL_F16 : SOP2_Real_gfx11_gfx12<0x04d>; 2321defm S_FMAC_F16 : SOP2_Real_gfx11_gfx12<0x04e>; 2322 2323//===----------------------------------------------------------------------===// 2324// SOP2 - GFX1150 2325//===----------------------------------------------------------------------===// 2326 2327multiclass SOP2_Real_gfx11_Renamed_gfx12<bits<7> op, string gfx12_name> : 2328 SOP2_Real_gfx11<op>, SOP2_Real_gfx12<op, gfx12_name>; 2329 2330defm S_MIN_F32 : SOP2_Real_gfx11_Renamed_gfx12<0x042, "s_min_num_f32">; 2331defm S_MAX_F32 : SOP2_Real_gfx11_Renamed_gfx12<0x043, "s_max_num_f32">; 2332defm S_MIN_F16 : SOP2_Real_gfx11_Renamed_gfx12<0x04b, "s_min_num_f16">; 2333defm S_MAX_F16 : SOP2_Real_gfx11_Renamed_gfx12<0x04c, "s_max_num_f16">; 2334 2335//===----------------------------------------------------------------------===// 2336// SOP2 - GFX10. 2337//===----------------------------------------------------------------------===// 2338 2339multiclass SOP2_Real_gfx10<bits<7> op> { 2340 defvar ps = !cast<SOP2_Pseudo>(NAME); 2341 def _gfx10 : SOP2_Real32<op, ps>, 2342 Select<GFX10Gen, ps.PseudoInstr>; 2343} 2344 2345multiclass SOP2_Real_gfx10_gfx11_gfx12<bits<7> op> : 2346 SOP2_Real_gfx10<op>, SOP2_Real_gfx11_gfx12<op>; 2347 2348defm S_LSHL1_ADD_U32 : SOP2_Real_gfx10<0x02e>; 2349defm S_LSHL2_ADD_U32 : SOP2_Real_gfx10<0x02f>; 2350defm S_LSHL3_ADD_U32 : SOP2_Real_gfx10<0x030>; 2351defm S_LSHL4_ADD_U32 : SOP2_Real_gfx10<0x031>; 2352defm S_PACK_LL_B32_B16 : SOP2_Real_gfx10_gfx11_gfx12<0x032>; 2353defm S_PACK_LH_B32_B16 : SOP2_Real_gfx10_gfx11_gfx12<0x033>; 2354defm S_PACK_HH_B32_B16 : SOP2_Real_gfx10_gfx11_gfx12<0x034>; 2355defm S_MUL_HI_U32 : SOP2_Real_gfx10<0x035>; 2356defm S_MUL_HI_I32 : SOP2_Real_gfx10<0x036>; 2357 2358//===----------------------------------------------------------------------===// 2359// SOP2 - GFX6, GFX7. 2360//===----------------------------------------------------------------------===// 2361 2362multiclass SOP2_Real_gfx6_gfx7<bits<7> op> { 2363 defvar ps = !cast<SOP2_Pseudo>(NAME); 2364 def _gfx6_gfx7 : SOP2_Real32<op, ps>, 2365 Select_gfx6_gfx7<ps.PseudoInstr>; 2366} 2367 2368multiclass SOP2_Real_gfx6_gfx7_gfx10<bits<7> op> : 2369 SOP2_Real_gfx6_gfx7<op>, SOP2_Real_gfx10<op>; 2370 2371multiclass SOP2_Real_gfx6_gfx7_gfx10_gfx11_Renamed_gfx12<bits<7> op, string gfx12_name> : 2372 SOP2_Real_gfx6_gfx7<op>, SOP2_Real_gfx10<op>, SOP2_Real_gfx11<op>, 2373 SOP2_Real_gfx12<op, gfx12_name>; 2374 2375defm S_CBRANCH_G_FORK : SOP2_Real_gfx6_gfx7<0x02b>; 2376 2377defm S_ADD_U32 : SOP2_Real_gfx6_gfx7_gfx10_gfx11_Renamed_gfx12<0x000, "s_add_co_u32">; 2378defm S_SUB_U32 : SOP2_Real_gfx6_gfx7_gfx10_gfx11_Renamed_gfx12<0x001, "s_sub_co_u32">; 2379defm S_ADD_I32 : SOP2_Real_gfx6_gfx7_gfx10_gfx11_Renamed_gfx12<0x002, "s_add_co_i32">; 2380defm S_SUB_I32 : SOP2_Real_gfx6_gfx7_gfx10_gfx11_Renamed_gfx12<0x003, "s_sub_co_i32">; 2381defm S_ADDC_U32 : SOP2_Real_gfx6_gfx7_gfx10_gfx11_Renamed_gfx12<0x004, "s_add_co_ci_u32">; 2382defm S_SUBB_U32 : SOP2_Real_gfx6_gfx7_gfx10_gfx11_Renamed_gfx12<0x005, "s_sub_co_ci_u32">; 2383defm S_MIN_I32 : SOP2_Real_gfx6_gfx7_gfx10<0x006>; 2384defm S_MIN_U32 : SOP2_Real_gfx6_gfx7_gfx10<0x007>; 2385defm S_MAX_I32 : SOP2_Real_gfx6_gfx7_gfx10<0x008>; 2386defm S_MAX_U32 : SOP2_Real_gfx6_gfx7_gfx10<0x009>; 2387defm S_CSELECT_B32 : SOP2_Real_gfx6_gfx7_gfx10<0x00a>; 2388defm S_CSELECT_B64 : SOP2_Real_gfx6_gfx7_gfx10<0x00b>; 2389defm S_AND_B32 : SOP2_Real_gfx6_gfx7_gfx10<0x00e>; 2390defm S_AND_B64 : SOP2_Real_gfx6_gfx7_gfx10<0x00f>; 2391defm S_OR_B32 : SOP2_Real_gfx6_gfx7_gfx10<0x010>; 2392defm S_OR_B64 : SOP2_Real_gfx6_gfx7_gfx10<0x011>; 2393defm S_XOR_B32 : SOP2_Real_gfx6_gfx7_gfx10<0x012>; 2394defm S_XOR_B64 : SOP2_Real_gfx6_gfx7_gfx10<0x013>; 2395defm S_ANDN2_B32 : SOP2_Real_gfx6_gfx7_gfx10<0x014>; 2396defm S_ANDN2_B64 : SOP2_Real_gfx6_gfx7_gfx10<0x015>; 2397defm S_ORN2_B32 : SOP2_Real_gfx6_gfx7_gfx10<0x016>; 2398defm S_ORN2_B64 : SOP2_Real_gfx6_gfx7_gfx10<0x017>; 2399defm S_NAND_B32 : SOP2_Real_gfx6_gfx7_gfx10<0x018>; 2400defm S_NAND_B64 : SOP2_Real_gfx6_gfx7_gfx10<0x019>; 2401defm S_NOR_B32 : SOP2_Real_gfx6_gfx7_gfx10<0x01a>; 2402defm S_NOR_B64 : SOP2_Real_gfx6_gfx7_gfx10<0x01b>; 2403defm S_XNOR_B32 : SOP2_Real_gfx6_gfx7_gfx10<0x01c>; 2404defm S_XNOR_B64 : SOP2_Real_gfx6_gfx7_gfx10<0x01d>; 2405defm S_LSHL_B32 : SOP2_Real_gfx6_gfx7_gfx10<0x01e>; 2406defm S_LSHL_B64 : SOP2_Real_gfx6_gfx7_gfx10<0x01f>; 2407defm S_LSHR_B32 : SOP2_Real_gfx6_gfx7_gfx10<0x020>; 2408defm S_LSHR_B64 : SOP2_Real_gfx6_gfx7_gfx10<0x021>; 2409defm S_ASHR_I32 : SOP2_Real_gfx6_gfx7_gfx10<0x022>; 2410defm S_ASHR_I64 : SOP2_Real_gfx6_gfx7_gfx10<0x023>; 2411defm S_BFM_B32 : SOP2_Real_gfx6_gfx7_gfx10<0x024>; 2412defm S_BFM_B64 : SOP2_Real_gfx6_gfx7_gfx10<0x025>; 2413defm S_MUL_I32 : SOP2_Real_gfx6_gfx7_gfx10<0x026>; 2414defm S_BFE_U32 : SOP2_Real_gfx6_gfx7_gfx10<0x027>; 2415defm S_BFE_I32 : SOP2_Real_gfx6_gfx7_gfx10<0x028>; 2416defm S_BFE_U64 : SOP2_Real_gfx6_gfx7_gfx10<0x029>; 2417defm S_BFE_I64 : SOP2_Real_gfx6_gfx7_gfx10<0x02a>; 2418defm S_ABSDIFF_I32 : SOP2_Real_gfx6_gfx7_gfx10<0x02c>; 2419 2420//===----------------------------------------------------------------------===// 2421// SOPK - GFX11, GFX12. 2422//===----------------------------------------------------------------------===// 2423 2424multiclass SOPK_Real32_gfx12<bits<5> op, string name = !tolower(NAME)> { 2425 defvar ps = !cast<SOPK_Pseudo>(NAME); 2426 def _gfx12 : SOPK_Real32<op, ps, name>, 2427 Select<GFX12Gen, ps.PseudoInstr>; 2428 if !ne(ps.Mnemonic, name) then 2429 def : AMDGPUMnemonicAlias<ps.Mnemonic, name> { 2430 let AssemblerPredicate = isGFX12Plus; 2431 } 2432} 2433 2434multiclass SOPK_Real32_gfx11<bits<5> op> { 2435 def _gfx11 : SOPK_Real32<op, !cast<SOPK_Pseudo>(NAME)>, 2436 Select<GFX11Gen, !cast<SOPK_Pseudo>(NAME).PseudoInstr>; 2437} 2438 2439multiclass SOPK_Real64_gfx12<bits<5> op> { 2440 def _gfx12 : SOPK_Real64<op, !cast<SOPK_Pseudo>(NAME)>, 2441 Select<GFX12Gen, !cast<SOPK_Pseudo>(NAME).PseudoInstr>; 2442} 2443 2444multiclass SOPK_Real64_gfx11<bits<5> op> { 2445 def _gfx11 : SOPK_Real64<op, !cast<SOPK_Pseudo>(NAME)>, 2446 Select<GFX11Gen, !cast<SOPK_Pseudo>(NAME).PseudoInstr>; 2447} 2448 2449multiclass SOPK_Real32_gfx11_gfx12<bits<5> op> : 2450 SOPK_Real32_gfx11<op>, SOPK_Real32_gfx12<op>; 2451 2452multiclass SOPK_Real64_gfx11_gfx12<bits<5> op> : 2453 SOPK_Real64_gfx11<op>, SOPK_Real64_gfx12<op>; 2454 2455defm S_GETREG_B32 : SOPK_Real32_gfx11_gfx12<0x011>; 2456defm S_SETREG_B32 : SOPK_Real32_gfx11_gfx12<0x012>; 2457defm S_SETREG_IMM32_B32 : SOPK_Real64_gfx11_gfx12<0x013>; 2458defm S_CALL_B64 : SOPK_Real32_gfx11_gfx12<0x014>; 2459defm S_SUBVECTOR_LOOP_BEGIN : SOPK_Real32_gfx11<0x016>; 2460defm S_SUBVECTOR_LOOP_END : SOPK_Real32_gfx11<0x017>; 2461defm S_WAITCNT_VSCNT : SOPK_Real32_gfx11<0x018>; 2462defm S_WAITCNT_VMCNT : SOPK_Real32_gfx11<0x019>; 2463defm S_WAITCNT_EXPCNT : SOPK_Real32_gfx11<0x01a>; 2464defm S_WAITCNT_LGKMCNT : SOPK_Real32_gfx11<0x01b>; 2465 2466//===----------------------------------------------------------------------===// 2467// SOPK - GFX10. 2468//===----------------------------------------------------------------------===// 2469 2470multiclass SOPK_Real32_gfx10<bits<5> op> { 2471 defvar ps = !cast<SOPK_Pseudo>(NAME); 2472 def _gfx10 : SOPK_Real32<op, ps>, 2473 Select<GFX10Gen, ps.PseudoInstr>; 2474} 2475 2476multiclass SOPK_Real64_gfx10<bits<5> op> { 2477 defvar ps = !cast<SOPK_Pseudo>(NAME); 2478 def _gfx10 : SOPK_Real64<op, ps>, 2479 Select<GFX10Gen, ps.PseudoInstr>; 2480} 2481 2482multiclass SOPK_Real32_gfx10_gfx11<bits<5> op> : 2483 SOPK_Real32_gfx10<op>, SOPK_Real32_gfx11<op>; 2484 2485multiclass SOPK_Real32_gfx10_gfx11_gfx12<bits<5> op> : 2486 SOPK_Real32_gfx10<op>, SOPK_Real32_gfx11_gfx12<op>; 2487 2488defm S_VERSION : SOPK_Real32_gfx10_gfx11_gfx12<0x001>; 2489defm S_CALL_B64 : SOPK_Real32_gfx10<0x016>; 2490defm S_WAITCNT_VSCNT : SOPK_Real32_gfx10<0x017>; 2491defm S_WAITCNT_VMCNT : SOPK_Real32_gfx10<0x018>; 2492defm S_WAITCNT_EXPCNT : SOPK_Real32_gfx10<0x019>; 2493defm S_WAITCNT_LGKMCNT : SOPK_Real32_gfx10<0x01a>; 2494defm S_SUBVECTOR_LOOP_BEGIN : SOPK_Real32_gfx10<0x01b>; 2495defm S_SUBVECTOR_LOOP_END : SOPK_Real32_gfx10<0x01c>; 2496 2497//===----------------------------------------------------------------------===// 2498// SOPK - GFX6, GFX7. 2499//===----------------------------------------------------------------------===// 2500 2501multiclass SOPK_Real32_gfx6_gfx7<bits<5> op> { 2502 defvar ps = !cast<SOPK_Pseudo>(NAME); 2503 def _gfx6_gfx7 : SOPK_Real32<op, ps>, 2504 Select_gfx6_gfx7<ps.PseudoInstr>; 2505} 2506 2507multiclass SOPK_Real64_gfx6_gfx7<bits<5> op> { 2508 defvar ps = !cast<SOPK_Pseudo>(NAME); 2509 def _gfx6_gfx7 : SOPK_Real64<op, ps>, 2510 Select_gfx6_gfx7<ps.PseudoInstr>; 2511} 2512 2513multiclass SOPK_Real32_gfx6_gfx7_gfx10<bits<5> op> : 2514 SOPK_Real32_gfx6_gfx7<op>, SOPK_Real32_gfx10<op>; 2515 2516multiclass SOPK_Real64_gfx6_gfx7_gfx10<bits<5> op> : 2517 SOPK_Real64_gfx6_gfx7<op>, SOPK_Real64_gfx10<op>; 2518 2519multiclass SOPK_Real32_gfx6_gfx7_gfx10_gfx11<bits<5> op> : 2520 SOPK_Real32_gfx6_gfx7<op>, SOPK_Real32_gfx10_gfx11<op>; 2521 2522multiclass SOPK_Real32_gfx6_gfx7_gfx10_gfx11_gfx12<bits<5> op> : 2523 SOPK_Real32_gfx6_gfx7<op>, SOPK_Real32_gfx10_gfx11_gfx12<op>; 2524 2525multiclass SOPK_Real32_gfx6_gfx7_gfx10_gfx11_Renamed_gfx12<bits<5> op, string gfx12_name> : 2526 SOPK_Real32_gfx6_gfx7<op>, SOPK_Real32_gfx10<op>, SOPK_Real32_gfx11<op>, 2527 SOPK_Real32_gfx12<op, gfx12_name>; 2528 2529defm S_CBRANCH_I_FORK : SOPK_Real32_gfx6_gfx7<0x011>; 2530 2531defm S_MOVK_I32 : SOPK_Real32_gfx6_gfx7_gfx10_gfx11_gfx12<0x000>; 2532defm S_CMOVK_I32 : SOPK_Real32_gfx6_gfx7_gfx10_gfx11_gfx12<0x002>; 2533defm S_CMPK_EQ_I32 : SOPK_Real32_gfx6_gfx7_gfx10_gfx11<0x003>; 2534defm S_CMPK_LG_I32 : SOPK_Real32_gfx6_gfx7_gfx10_gfx11<0x004>; 2535defm S_CMPK_GT_I32 : SOPK_Real32_gfx6_gfx7_gfx10_gfx11<0x005>; 2536defm S_CMPK_GE_I32 : SOPK_Real32_gfx6_gfx7_gfx10_gfx11<0x006>; 2537defm S_CMPK_LT_I32 : SOPK_Real32_gfx6_gfx7_gfx10_gfx11<0x007>; 2538defm S_CMPK_LE_I32 : SOPK_Real32_gfx6_gfx7_gfx10_gfx11<0x008>; 2539defm S_CMPK_EQ_U32 : SOPK_Real32_gfx6_gfx7_gfx10_gfx11<0x009>; 2540defm S_CMPK_LG_U32 : SOPK_Real32_gfx6_gfx7_gfx10_gfx11<0x00a>; 2541defm S_CMPK_GT_U32 : SOPK_Real32_gfx6_gfx7_gfx10_gfx11<0x00b>; 2542defm S_CMPK_GE_U32 : SOPK_Real32_gfx6_gfx7_gfx10_gfx11<0x00c>; 2543defm S_CMPK_LT_U32 : SOPK_Real32_gfx6_gfx7_gfx10_gfx11<0x00d>; 2544defm S_CMPK_LE_U32 : SOPK_Real32_gfx6_gfx7_gfx10_gfx11<0x00e>; 2545defm S_ADDK_I32 : SOPK_Real32_gfx6_gfx7_gfx10_gfx11_Renamed_gfx12<0x00f, "s_addk_co_i32">; 2546defm S_MULK_I32 : SOPK_Real32_gfx6_gfx7_gfx10_gfx11_gfx12<0x010>; 2547defm S_GETREG_B32 : SOPK_Real32_gfx6_gfx7_gfx10<0x012>; 2548defm S_SETREG_B32 : SOPK_Real32_gfx6_gfx7_gfx10<0x013>; 2549defm S_SETREG_IMM32_B32 : SOPK_Real64_gfx6_gfx7_gfx10<0x015>; 2550 2551//===----------------------------------------------------------------------===// 2552// SOPP - GFX12 only. 2553//===----------------------------------------------------------------------===// 2554 2555multiclass SOPP_Real_32_gfx12<bits<7> op, string name = !tolower(NAME)> { 2556 defvar ps = !cast<SOPP_Pseudo>(NAME); 2557 def _gfx12 : SOPP_Real_32<op, ps, name>, 2558 Select<GFX12Gen, ps.PseudoInstr>; 2559 if !ne(ps.Mnemonic, name) then 2560 def : AMDGPUMnemonicAlias<ps.Mnemonic, name> { 2561 let AssemblerPredicate = isGFX12Plus; 2562 } 2563} 2564 2565defm S_BARRIER_WAIT : SOPP_Real_32_gfx12<0x014>; 2566defm S_BARRIER_LEAVE : SOPP_Real_32_gfx12<0x015>; 2567defm S_WAIT_LOADCNT : SOPP_Real_32_gfx12<0x040>; 2568defm S_WAIT_STORECNT : SOPP_Real_32_gfx12<0x041>; 2569defm S_WAIT_SAMPLECNT : SOPP_Real_32_gfx12<0x042>; 2570defm S_WAIT_BVHCNT : SOPP_Real_32_gfx12<0x043>; 2571defm S_WAIT_EXPCNT : SOPP_Real_32_gfx12<0x044>; 2572defm S_WAIT_DSCNT : SOPP_Real_32_gfx12<0x046>; 2573defm S_WAIT_KMCNT : SOPP_Real_32_gfx12<0x047>; 2574defm S_WAIT_LOADCNT_DSCNT : SOPP_Real_32_gfx12<0x048>; 2575defm S_WAIT_STORECNT_DSCNT : SOPP_Real_32_gfx12<0x049>; 2576 2577//===----------------------------------------------------------------------===// 2578// SOPP - GFX11, GFX12. 2579//===----------------------------------------------------------------------===// 2580 2581 2582multiclass SOPP_Real_32_gfx11<bits<7> op, string name = !tolower(NAME)> { 2583 defvar ps = !cast<SOPP_Pseudo>(NAME); 2584 def _gfx11 : SOPP_Real_32<op, ps, name>, 2585 Select<GFX11Gen, ps.PseudoInstr>, 2586 SOPPRelaxTable<0, ps.KeyName, "_gfx11">; 2587 if !ne(ps.Mnemonic, name) then 2588 def : AMDGPUMnemonicAlias<ps.Mnemonic, name> { 2589 let AssemblerPredicate = isGFX11Only; 2590 } 2591} 2592 2593multiclass SOPP_Real_64_gfx12<bits<7> op> { 2594 def _gfx12 : SOPP_Real_64<op, !cast<SOPP_Pseudo>(NAME), !cast<SOPP_Pseudo>(NAME).Mnemonic>, 2595 Select<GFX12Gen, !cast<SOPP_Pseudo>(NAME).PseudoInstr>, 2596 SOPPRelaxTable<1, !cast<SOPP_Pseudo>(NAME).KeyName, "_gfx12">; 2597} 2598 2599multiclass SOPP_Real_64_gfx11<bits<7> op> { 2600 def _gfx11 : SOPP_Real_64<op, !cast<SOPP_Pseudo>(NAME), !cast<SOPP_Pseudo>(NAME).Mnemonic>, 2601 Select<GFX11Gen, !cast<SOPP_Pseudo>(NAME).PseudoInstr>, 2602 SOPPRelaxTable<1, !cast<SOPP_Pseudo>(NAME).KeyName, "_gfx11">; 2603} 2604 2605multiclass SOPP_Real_32_gfx11_gfx12<bits<7> op> : 2606 SOPP_Real_32_gfx11<op>, SOPP_Real_32_gfx12<op>; 2607 2608multiclass SOPP_Real_32_gfx11_Renamed_gfx12<bits<7> op, string gfx12_name> : 2609 SOPP_Real_32_gfx11<op>, SOPP_Real_32_gfx12<op, gfx12_name>; 2610 2611multiclass SOPP_Real_With_Relaxation_gfx12<bits<7> op> { 2612 defm "" : SOPP_Real_32_gfx12<op>; 2613 let isCodeGenOnly = 1 in 2614 defm _pad_s_nop : SOPP_Real_64_gfx12<op>; 2615} 2616 2617multiclass SOPP_Real_With_Relaxation_gfx11<bits<7> op> { 2618 defm "" : SOPP_Real_32_gfx11<op>; 2619 let isCodeGenOnly = 1 in 2620 defm _pad_s_nop : SOPP_Real_64_gfx11<op>; 2621} 2622 2623multiclass SOPP_Real_With_Relaxation_gfx11_gfx12<bits<7>op> : 2624 SOPP_Real_With_Relaxation_gfx11<op>, SOPP_Real_With_Relaxation_gfx12<op>; 2625 2626defm S_SETKILL : SOPP_Real_32_gfx11_gfx12<0x001>; 2627defm S_SETHALT : SOPP_Real_32_gfx11_gfx12<0x002>; 2628defm S_SLEEP : SOPP_Real_32_gfx11_gfx12<0x003>; 2629defm S_INST_PREFETCH : SOPP_Real_32_gfx11<0x004, "s_set_inst_prefetch_distance">; 2630defm S_CLAUSE : SOPP_Real_32_gfx11_gfx12<0x005>; 2631defm S_DELAY_ALU : SOPP_Real_32_gfx11_gfx12<0x007>; 2632defm S_WAITCNT_DEPCTR : SOPP_Real_32_gfx11_Renamed_gfx12<0x008, "s_wait_alu">; 2633defm S_WAITCNT : SOPP_Real_32_gfx11_gfx12<0x009>; 2634defm S_WAIT_IDLE : SOPP_Real_32_gfx11_gfx12<0x00a>; 2635defm S_WAIT_EVENT : SOPP_Real_32_gfx11_gfx12<0x00b>; 2636defm S_TRAP : SOPP_Real_32_gfx11_gfx12<0x010>; 2637defm S_ROUND_MODE : SOPP_Real_32_gfx11_gfx12<0x011>; 2638defm S_DENORM_MODE : SOPP_Real_32_gfx11_gfx12<0x012>; 2639defm S_BRANCH : SOPP_Real_With_Relaxation_gfx11_gfx12<0x020>; 2640defm S_CBRANCH_SCC0 : SOPP_Real_With_Relaxation_gfx11_gfx12<0x021>; 2641defm S_CBRANCH_SCC1 : SOPP_Real_With_Relaxation_gfx11_gfx12<0x022>; 2642defm S_CBRANCH_VCCZ : SOPP_Real_With_Relaxation_gfx11_gfx12<0x023>; 2643defm S_CBRANCH_VCCNZ : SOPP_Real_With_Relaxation_gfx11_gfx12<0x024>; 2644defm S_CBRANCH_EXECZ : SOPP_Real_With_Relaxation_gfx11_gfx12<0x025>; 2645defm S_CBRANCH_EXECNZ : SOPP_Real_With_Relaxation_gfx11_gfx12<0x026>; 2646defm S_CBRANCH_CDBGSYS : SOPP_Real_With_Relaxation_gfx11<0x027>; 2647defm S_CBRANCH_CDBGUSER : SOPP_Real_With_Relaxation_gfx11<0x028>; 2648defm S_CBRANCH_CDBGSYS_OR_USER : SOPP_Real_With_Relaxation_gfx11<0x029>; 2649defm S_CBRANCH_CDBGSYS_AND_USER : SOPP_Real_With_Relaxation_gfx11<0x02a>; 2650defm S_ENDPGM : SOPP_Real_32_gfx11_gfx12<0x030>; 2651defm S_ENDPGM_SAVED : SOPP_Real_32_gfx11_gfx12<0x031>; 2652defm S_ENDPGM_ORDERED_PS_DONE : SOPP_Real_32_gfx11<0x032>; 2653defm S_WAKEUP : SOPP_Real_32_gfx11_gfx12<0x034>; 2654defm S_SETPRIO : SOPP_Real_32_gfx11_gfx12<0x035>; 2655defm S_SENDMSG : SOPP_Real_32_gfx11_gfx12<0x036>; 2656defm S_SENDMSGHALT : SOPP_Real_32_gfx11_gfx12<0x037>; 2657defm S_INCPERFLEVEL : SOPP_Real_32_gfx11_gfx12<0x038>; 2658defm S_DECPERFLEVEL : SOPP_Real_32_gfx11_gfx12<0x039>; 2659defm S_TTRACEDATA : SOPP_Real_32_gfx11_gfx12<0x03a>; 2660defm S_TTRACEDATA_IMM : SOPP_Real_32_gfx11_gfx12<0x03b>; 2661defm S_ICACHE_INV : SOPP_Real_32_gfx11_gfx12<0x03c>; 2662 2663defm S_BARRIER : SOPP_Real_32_gfx11<0x03d>; 2664 2665//===----------------------------------------------------------------------===// 2666// SOPP - GFX6, GFX7, GFX8, GFX9, GFX10 2667//===----------------------------------------------------------------------===// 2668 2669multiclass SOPP_Real_32_gfx6_gfx7<bits<7> op> { 2670 defvar ps = !cast<SOPP_Pseudo>(NAME); 2671 def _gfx6_gfx7 : SOPP_Real_32<op, ps, !cast<SOPP_Pseudo>(NAME).Mnemonic>, 2672 Select_gfx6_gfx7<ps.PseudoInstr>, 2673 SOPPRelaxTable<0, ps.KeyName, "_gfx6_gfx7">; 2674} 2675 2676multiclass SOPP_Real_32_gfx8_gfx9<bits<7> op> { 2677 defvar ps = !cast<SOPP_Pseudo>(NAME); 2678 def _vi : SOPP_Real_32<op, ps>, 2679 Select_vi<ps.PseudoInstr>, 2680 SOPPRelaxTable<0, ps.KeyName, "_vi">; 2681} 2682 2683multiclass SOPP_Real_32_gfx10<bits<7> op> { 2684 defvar ps = !cast<SOPP_Pseudo>(NAME); 2685 def _gfx10 : SOPP_Real_32<op, ps>, 2686 Select<GFX10Gen, ps.PseudoInstr>, 2687 SOPPRelaxTable<0, ps.KeyName, "_gfx10">; 2688} 2689 2690multiclass SOPP_Real_32_gfx8_gfx9_gfx10<bits<7> op> : 2691 SOPP_Real_32_gfx8_gfx9<op>, SOPP_Real_32_gfx10<op>; 2692 2693multiclass SOPP_Real_32_gfx6_gfx7_gfx8_gfx9<bits<7> op> : 2694 SOPP_Real_32_gfx6_gfx7<op>, SOPP_Real_32_gfx8_gfx9<op>; 2695 2696multiclass SOPP_Real_32_gfx6_gfx7_gfx8_gfx9_gfx10<bits<7> op> : 2697 SOPP_Real_32_gfx6_gfx7_gfx8_gfx9<op>, SOPP_Real_32_gfx10<op>; 2698 2699multiclass SOPP_Real_32_gfx6_gfx7_gfx8_gfx9_gfx10_gfx11_gfx12<bits<7> op> : 2700 SOPP_Real_32_gfx6_gfx7_gfx8_gfx9_gfx10<op>, SOPP_Real_32_gfx11_gfx12<op>; 2701 2702multiclass SOPP_Real_32_gfx10_gfx11_gfx12<bits<7> op> : 2703 SOPP_Real_32_gfx10<op>, SOPP_Real_32_gfx11_gfx12<op>; 2704 2705//64 bit encodings, for Relaxation 2706multiclass SOPP_Real_64_gfx6_gfx7<bits<7> op> { 2707 defvar ps = !cast<SOPP_Pseudo>(NAME); 2708 def _gfx6_gfx7 : SOPP_Real_64<op, ps>, 2709 Select_gfx6_gfx7<ps.PseudoInstr>, 2710 SOPPRelaxTable<1, ps.KeyName, "_gfx6_gfx7">; 2711} 2712 2713multiclass SOPP_Real_64_gfx8_gfx9<bits<7> op> { 2714 defvar ps = !cast<SOPP_Pseudo>(NAME); 2715 def _vi : SOPP_Real_64<op, ps>, 2716 Select_vi<ps.PseudoInstr>, 2717 SOPPRelaxTable<1, ps.KeyName, "_vi">; 2718} 2719 2720multiclass SOPP_Real_64_gfx10<bits<7> op> { 2721 defvar ps = !cast<SOPP_Pseudo>(NAME); 2722 def _gfx10 : SOPP_Real_64<op, ps>, 2723 Select<GFX10Gen, ps.PseudoInstr>, 2724 SOPPRelaxTable<1, ps.KeyName, "_gfx10">; 2725} 2726 2727multiclass SOPP_Real_64_gfx6_gfx7_gfx8_gfx9<bits<7> op> : 2728 SOPP_Real_64_gfx6_gfx7<op>, SOPP_Real_64_gfx8_gfx9<op>; 2729 2730multiclass SOPP_Real_64_gfx6_gfx7_gfx8_gfx9_gfx10<bits<7> op> : 2731 SOPP_Real_64_gfx6_gfx7_gfx8_gfx9<op>, SOPP_Real_64_gfx10<op>; 2732 2733//relaxation for insts with no operands not implemented 2734multiclass SOPP_Real_With_Relaxation_gfx6_gfx7_gfx8_gfx9_gfx10<bits<7> op> { 2735 defm "" : SOPP_Real_32_gfx6_gfx7_gfx8_gfx9_gfx10<op>; 2736 let isCodeGenOnly = 1 in 2737 defm _pad_s_nop : SOPP_Real_64_gfx6_gfx7_gfx8_gfx9_gfx10<op>; 2738} 2739 2740defm S_NOP : SOPP_Real_32_gfx6_gfx7_gfx8_gfx9_gfx10_gfx11_gfx12<0x000>; 2741defm S_ENDPGM : SOPP_Real_32_gfx6_gfx7_gfx8_gfx9_gfx10<0x001>; 2742defm S_WAKEUP : SOPP_Real_32_gfx8_gfx9_gfx10<0x003>; 2743defm S_BARRIER : SOPP_Real_32_gfx6_gfx7_gfx8_gfx9_gfx10<0x00a>; 2744defm S_WAITCNT : SOPP_Real_32_gfx6_gfx7_gfx8_gfx9_gfx10<0x00c>; 2745defm S_SETHALT : SOPP_Real_32_gfx6_gfx7_gfx8_gfx9_gfx10<0x00d>; 2746defm S_SETKILL : SOPP_Real_32_gfx6_gfx7_gfx8_gfx9_gfx10<0x00b>; 2747defm S_SLEEP : SOPP_Real_32_gfx6_gfx7_gfx8_gfx9_gfx10<0x00e>; 2748defm S_SETPRIO : SOPP_Real_32_gfx6_gfx7_gfx8_gfx9_gfx10<0x00f>; 2749defm S_SENDMSG : SOPP_Real_32_gfx6_gfx7_gfx8_gfx9_gfx10<0x010>; 2750defm S_SENDMSGHALT : SOPP_Real_32_gfx6_gfx7_gfx8_gfx9_gfx10<0x011>; 2751defm S_TRAP : SOPP_Real_32_gfx6_gfx7_gfx8_gfx9_gfx10<0x012>; 2752defm S_ICACHE_INV : SOPP_Real_32_gfx6_gfx7_gfx8_gfx9_gfx10<0x013>; 2753defm S_INCPERFLEVEL : SOPP_Real_32_gfx6_gfx7_gfx8_gfx9_gfx10<0x014>; 2754defm S_DECPERFLEVEL : SOPP_Real_32_gfx6_gfx7_gfx8_gfx9_gfx10<0x015>; 2755defm S_TTRACEDATA : SOPP_Real_32_gfx6_gfx7_gfx8_gfx9_gfx10<0x016>; 2756defm S_ENDPGM_SAVED : SOPP_Real_32_gfx6_gfx7_gfx8_gfx9_gfx10<0x01B>; 2757defm S_SET_GPR_IDX_OFF : SOPP_Real_32_gfx8_gfx9<0x01c>; 2758defm S_SET_GPR_IDX_MODE : SOPP_Real_32_gfx8_gfx9<0x01d>; 2759defm S_ENDPGM_ORDERED_PS_DONE : SOPP_Real_32_gfx8_gfx9_gfx10<0x01e>; 2760defm S_CODE_END : SOPP_Real_32_gfx10_gfx11_gfx12<0x01f>; 2761defm S_INST_PREFETCH : SOPP_Real_32_gfx10<0x020>; 2762defm S_CLAUSE : SOPP_Real_32_gfx10<0x021>; 2763defm S_WAIT_IDLE : SOPP_Real_32_gfx10<0x022>; 2764defm S_WAITCNT_DEPCTR : SOPP_Real_32_gfx10<0x023>; 2765defm S_ROUND_MODE : SOPP_Real_32_gfx10<0x024>; 2766defm S_DENORM_MODE : SOPP_Real_32_gfx10<0x025>; 2767defm S_TTRACEDATA_IMM : SOPP_Real_32_gfx10<0x028>; 2768 2769let isBranch = 1 in { 2770defm S_BRANCH : SOPP_Real_With_Relaxation_gfx6_gfx7_gfx8_gfx9_gfx10<0x002>; 2771defm S_CBRANCH_SCC0 : SOPP_Real_With_Relaxation_gfx6_gfx7_gfx8_gfx9_gfx10<0x004>; 2772defm S_CBRANCH_SCC1 : SOPP_Real_With_Relaxation_gfx6_gfx7_gfx8_gfx9_gfx10<0x005>; 2773defm S_CBRANCH_VCCZ : SOPP_Real_With_Relaxation_gfx6_gfx7_gfx8_gfx9_gfx10<0x006>; 2774defm S_CBRANCH_VCCNZ : SOPP_Real_With_Relaxation_gfx6_gfx7_gfx8_gfx9_gfx10<0x007>; 2775defm S_CBRANCH_EXECZ : SOPP_Real_With_Relaxation_gfx6_gfx7_gfx8_gfx9_gfx10<0x008>; 2776defm S_CBRANCH_EXECNZ : SOPP_Real_With_Relaxation_gfx6_gfx7_gfx8_gfx9_gfx10<0x009>; 2777defm S_CBRANCH_CDBGSYS : SOPP_Real_With_Relaxation_gfx6_gfx7_gfx8_gfx9_gfx10<0x017>; 2778defm S_CBRANCH_CDBGUSER : SOPP_Real_With_Relaxation_gfx6_gfx7_gfx8_gfx9_gfx10<0x018>; 2779defm S_CBRANCH_CDBGSYS_OR_USER : SOPP_Real_With_Relaxation_gfx6_gfx7_gfx8_gfx9_gfx10<0x019>; 2780defm S_CBRANCH_CDBGSYS_AND_USER : SOPP_Real_With_Relaxation_gfx6_gfx7_gfx8_gfx9_gfx10<0x01A>; 2781} 2782 2783//===----------------------------------------------------------------------===// 2784// SOPC - GFX11, GFX12. 2785//===----------------------------------------------------------------------===// 2786 2787multiclass SOPC_Real_gfx12<bits<7> op> { 2788 def _gfx12 : SOPC_Real<op, !cast<SOPC_Pseudo>(NAME)>, 2789 Select<GFX12Gen, !cast<SOPC_Pseudo>(NAME).PseudoInstr>; 2790} 2791 2792multiclass SOPC_Real_gfx11<bits<7> op> { 2793 def _gfx11 : SOPC_Real<op, !cast<SOPC_Pseudo>(NAME)>, 2794 Select<GFX11Gen, !cast<SOPC_Pseudo>(NAME).PseudoInstr>; 2795} 2796 2797multiclass SOPC_Real_gfx11_gfx12<bits<7> op> : 2798 SOPC_Real_gfx11<op>, SOPC_Real_gfx12<op>; 2799 2800defm S_CMP_EQ_U64 : SOPC_Real_gfx11_gfx12<0x10>; 2801defm S_CMP_LG_U64 : SOPC_Real_gfx11_gfx12<0x11>; 2802 2803//===----------------------------------------------------------------------===// 2804// SOPC - GFX1150, GFX12 2805//===----------------------------------------------------------------------===// 2806 2807defm S_CMP_LT_F32 : SOPC_Real_gfx11_gfx12<0x41>; 2808defm S_CMP_EQ_F32 : SOPC_Real_gfx11_gfx12<0x42>; 2809defm S_CMP_LE_F32 : SOPC_Real_gfx11_gfx12<0x43>; 2810defm S_CMP_GT_F32 : SOPC_Real_gfx11_gfx12<0x44>; 2811defm S_CMP_LG_F32 : SOPC_Real_gfx11_gfx12<0x45>; 2812defm S_CMP_GE_F32 : SOPC_Real_gfx11_gfx12<0x46>; 2813defm S_CMP_O_F32 : SOPC_Real_gfx11_gfx12<0x47>; 2814defm S_CMP_U_F32 : SOPC_Real_gfx11_gfx12<0x48>; 2815defm S_CMP_NGE_F32 : SOPC_Real_gfx11_gfx12<0x49>; 2816defm S_CMP_NLG_F32 : SOPC_Real_gfx11_gfx12<0x4a>; 2817defm S_CMP_NGT_F32 : SOPC_Real_gfx11_gfx12<0x4b>; 2818defm S_CMP_NLE_F32 : SOPC_Real_gfx11_gfx12<0x4c>; 2819defm S_CMP_NEQ_F32 : SOPC_Real_gfx11_gfx12<0x4d>; 2820defm S_CMP_NLT_F32 : SOPC_Real_gfx11_gfx12<0x4e>; 2821 2822defm S_CMP_LT_F16 : SOPC_Real_gfx11_gfx12<0x51>; 2823defm S_CMP_EQ_F16 : SOPC_Real_gfx11_gfx12<0x52>; 2824defm S_CMP_LE_F16 : SOPC_Real_gfx11_gfx12<0x53>; 2825defm S_CMP_GT_F16 : SOPC_Real_gfx11_gfx12<0x54>; 2826defm S_CMP_LG_F16 : SOPC_Real_gfx11_gfx12<0x55>; 2827defm S_CMP_GE_F16 : SOPC_Real_gfx11_gfx12<0x56>; 2828defm S_CMP_O_F16 : SOPC_Real_gfx11_gfx12<0x57>; 2829defm S_CMP_U_F16 : SOPC_Real_gfx11_gfx12<0x58>; 2830defm S_CMP_NGE_F16 : SOPC_Real_gfx11_gfx12<0x59>; 2831defm S_CMP_NLG_F16 : SOPC_Real_gfx11_gfx12<0x5a>; 2832defm S_CMP_NGT_F16 : SOPC_Real_gfx11_gfx12<0x5b>; 2833defm S_CMP_NLE_F16 : SOPC_Real_gfx11_gfx12<0x5c>; 2834defm S_CMP_NEQ_F16 : SOPC_Real_gfx11_gfx12<0x5d>; 2835defm S_CMP_NLT_F16 : SOPC_Real_gfx11_gfx12<0x5e>; 2836 2837//===----------------------------------------------------------------------===// 2838// SOPC - GFX6, GFX7, GFX8, GFX9, GFX10 2839//===----------------------------------------------------------------------===// 2840 2841multiclass SOPC_Real_gfx6_gfx7<bits<7> op> { 2842 defvar ps = !cast<SOPC_Pseudo>(NAME); 2843 def _gfx6_gfx7 : SOPC_Real<op, ps>, 2844 Select_gfx6_gfx7<ps.PseudoInstr>; 2845} 2846 2847multiclass SOPC_Real_gfx8_gfx9<bits<7> op> { 2848 defvar ps = !cast<SOPC_Pseudo>(NAME); 2849 def _vi : SOPC_Real<op, ps>, 2850 Select_vi<ps.PseudoInstr>; 2851} 2852 2853multiclass SOPC_Real_gfx10<bits<7> op> { 2854 defvar ps = !cast<SOPC_Pseudo>(NAME); 2855 def _gfx10 : SOPC_Real<op, ps>, 2856 Select<GFX10Gen, ps.PseudoInstr>; 2857} 2858 2859multiclass SOPC_Real_gfx8_gfx9_gfx10<bits<7> op> : 2860 SOPC_Real_gfx8_gfx9<op>, SOPC_Real_gfx10<op>; 2861 2862multiclass SOPC_Real_gfx6_gfx7_gfx8_gfx9<bits<7> op> : 2863 SOPC_Real_gfx6_gfx7<op>, SOPC_Real_gfx8_gfx9<op>; 2864 2865multiclass SOPC_Real_gfx6_gfx7_gfx8_gfx9_gfx10_gfx11_gfx12<bits<7> op> : 2866 SOPC_Real_gfx6_gfx7_gfx8_gfx9<op>, SOPC_Real_gfx10<op>, SOPC_Real_gfx11<op>, 2867 SOPC_Real_gfx12<op>; 2868 2869defm S_CMP_EQ_I32 : SOPC_Real_gfx6_gfx7_gfx8_gfx9_gfx10_gfx11_gfx12<0x00>; 2870defm S_CMP_LG_I32 : SOPC_Real_gfx6_gfx7_gfx8_gfx9_gfx10_gfx11_gfx12<0x01>; 2871defm S_CMP_GT_I32 : SOPC_Real_gfx6_gfx7_gfx8_gfx9_gfx10_gfx11_gfx12<0x02>; 2872defm S_CMP_GE_I32 : SOPC_Real_gfx6_gfx7_gfx8_gfx9_gfx10_gfx11_gfx12<0x03>; 2873defm S_CMP_LT_I32 : SOPC_Real_gfx6_gfx7_gfx8_gfx9_gfx10_gfx11_gfx12<0x04>; 2874defm S_CMP_LE_I32 : SOPC_Real_gfx6_gfx7_gfx8_gfx9_gfx10_gfx11_gfx12<0x05>; 2875defm S_CMP_EQ_U32 : SOPC_Real_gfx6_gfx7_gfx8_gfx9_gfx10_gfx11_gfx12<0x06>; 2876defm S_CMP_LG_U32 : SOPC_Real_gfx6_gfx7_gfx8_gfx9_gfx10_gfx11_gfx12<0x07>; 2877defm S_CMP_GT_U32 : SOPC_Real_gfx6_gfx7_gfx8_gfx9_gfx10_gfx11_gfx12<0x08>; 2878defm S_CMP_GE_U32 : SOPC_Real_gfx6_gfx7_gfx8_gfx9_gfx10_gfx11_gfx12<0x09>; 2879defm S_CMP_LT_U32 : SOPC_Real_gfx6_gfx7_gfx8_gfx9_gfx10_gfx11_gfx12<0x0a>; 2880defm S_CMP_LE_U32 : SOPC_Real_gfx6_gfx7_gfx8_gfx9_gfx10_gfx11_gfx12<0x0b>; 2881defm S_BITCMP0_B32 : SOPC_Real_gfx6_gfx7_gfx8_gfx9_gfx10_gfx11_gfx12<0x0c>; 2882defm S_BITCMP1_B32 : SOPC_Real_gfx6_gfx7_gfx8_gfx9_gfx10_gfx11_gfx12<0x0d>; 2883defm S_BITCMP0_B64 : SOPC_Real_gfx6_gfx7_gfx8_gfx9_gfx10_gfx11_gfx12<0x0e>; 2884defm S_BITCMP1_B64 : SOPC_Real_gfx6_gfx7_gfx8_gfx9_gfx10_gfx11_gfx12<0x0f>; 2885defm S_SETVSKIP : SOPC_Real_gfx6_gfx7_gfx8_gfx9<0x10>; 2886defm S_SET_GPR_IDX_ON : SOPC_Real_gfx8_gfx9<0x11>; 2887defm S_CMP_EQ_U64 : SOPC_Real_gfx8_gfx9_gfx10<0x12>; 2888defm S_CMP_LG_U64 : SOPC_Real_gfx8_gfx9_gfx10<0x13>; 2889 2890//===----------------------------------------------------------------------===// 2891// GFX8 (VI), GFX9. 2892//===----------------------------------------------------------------------===// 2893 2894class SOP1_Real_vi<bits<8> op, SOP1_Pseudo ps> : 2895 SOP1_Real<op, ps>, 2896 Select_vi<ps.PseudoInstr>; 2897 2898class SOP2_Real_vi<bits<7> op, SOP2_Pseudo ps> : 2899 SOP2_Real32<op, ps>, 2900 Select_vi<ps.PseudoInstr>; 2901 2902class SOPK_Real_vi<bits<5> op, SOPK_Pseudo ps> : 2903 SOPK_Real32<op, ps>, 2904 Select_vi<ps.PseudoInstr>; 2905 2906def S_MOV_B32_vi : SOP1_Real_vi <0x00, S_MOV_B32>; 2907def S_MOV_B64_vi : SOP1_Real_vi <0x01, S_MOV_B64>; 2908def S_CMOV_B32_vi : SOP1_Real_vi <0x02, S_CMOV_B32>; 2909def S_CMOV_B64_vi : SOP1_Real_vi <0x03, S_CMOV_B64>; 2910def S_NOT_B32_vi : SOP1_Real_vi <0x04, S_NOT_B32>; 2911def S_NOT_B64_vi : SOP1_Real_vi <0x05, S_NOT_B64>; 2912def S_WQM_B32_vi : SOP1_Real_vi <0x06, S_WQM_B32>; 2913def S_WQM_B64_vi : SOP1_Real_vi <0x07, S_WQM_B64>; 2914def S_BREV_B32_vi : SOP1_Real_vi <0x08, S_BREV_B32>; 2915def S_BREV_B64_vi : SOP1_Real_vi <0x09, S_BREV_B64>; 2916def S_BCNT0_I32_B32_vi : SOP1_Real_vi <0x0a, S_BCNT0_I32_B32>; 2917def S_BCNT0_I32_B64_vi : SOP1_Real_vi <0x0b, S_BCNT0_I32_B64>; 2918def S_BCNT1_I32_B32_vi : SOP1_Real_vi <0x0c, S_BCNT1_I32_B32>; 2919def S_BCNT1_I32_B64_vi : SOP1_Real_vi <0x0d, S_BCNT1_I32_B64>; 2920def S_FF0_I32_B32_vi : SOP1_Real_vi <0x0e, S_FF0_I32_B32>; 2921def S_FF0_I32_B64_vi : SOP1_Real_vi <0x0f, S_FF0_I32_B64>; 2922def S_FF1_I32_B32_vi : SOP1_Real_vi <0x10, S_FF1_I32_B32>; 2923def S_FF1_I32_B64_vi : SOP1_Real_vi <0x11, S_FF1_I32_B64>; 2924def S_FLBIT_I32_B32_vi : SOP1_Real_vi <0x12, S_FLBIT_I32_B32>; 2925def S_FLBIT_I32_B64_vi : SOP1_Real_vi <0x13, S_FLBIT_I32_B64>; 2926def S_FLBIT_I32_vi : SOP1_Real_vi <0x14, S_FLBIT_I32>; 2927def S_FLBIT_I32_I64_vi : SOP1_Real_vi <0x15, S_FLBIT_I32_I64>; 2928def S_SEXT_I32_I8_vi : SOP1_Real_vi <0x16, S_SEXT_I32_I8>; 2929def S_SEXT_I32_I16_vi : SOP1_Real_vi <0x17, S_SEXT_I32_I16>; 2930def S_BITSET0_B32_vi : SOP1_Real_vi <0x18, S_BITSET0_B32>; 2931def S_BITSET0_B64_vi : SOP1_Real_vi <0x19, S_BITSET0_B64>; 2932def S_BITSET1_B32_vi : SOP1_Real_vi <0x1a, S_BITSET1_B32>; 2933def S_BITSET1_B64_vi : SOP1_Real_vi <0x1b, S_BITSET1_B64>; 2934def S_GETPC_B64_vi : SOP1_Real_vi <0x1c, S_GETPC_B64>; 2935def S_SETPC_B64_vi : SOP1_Real_vi <0x1d, S_SETPC_B64>; 2936def S_SWAPPC_B64_vi : SOP1_Real_vi <0x1e, S_SWAPPC_B64>; 2937def S_RFE_B64_vi : SOP1_Real_vi <0x1f, S_RFE_B64>; 2938def S_AND_SAVEEXEC_B64_vi : SOP1_Real_vi <0x20, S_AND_SAVEEXEC_B64>; 2939def S_OR_SAVEEXEC_B64_vi : SOP1_Real_vi <0x21, S_OR_SAVEEXEC_B64>; 2940def S_XOR_SAVEEXEC_B64_vi : SOP1_Real_vi <0x22, S_XOR_SAVEEXEC_B64>; 2941def S_ANDN2_SAVEEXEC_B64_vi: SOP1_Real_vi <0x23, S_ANDN2_SAVEEXEC_B64>; 2942def S_ORN2_SAVEEXEC_B64_vi : SOP1_Real_vi <0x24, S_ORN2_SAVEEXEC_B64>; 2943def S_NAND_SAVEEXEC_B64_vi : SOP1_Real_vi <0x25, S_NAND_SAVEEXEC_B64>; 2944def S_NOR_SAVEEXEC_B64_vi : SOP1_Real_vi <0x26, S_NOR_SAVEEXEC_B64>; 2945def S_XNOR_SAVEEXEC_B64_vi : SOP1_Real_vi <0x27, S_XNOR_SAVEEXEC_B64>; 2946def S_QUADMASK_B32_vi : SOP1_Real_vi <0x28, S_QUADMASK_B32>; 2947def S_QUADMASK_B64_vi : SOP1_Real_vi <0x29, S_QUADMASK_B64>; 2948def S_MOVRELS_B32_vi : SOP1_Real_vi <0x2a, S_MOVRELS_B32>; 2949def S_MOVRELS_B64_vi : SOP1_Real_vi <0x2b, S_MOVRELS_B64>; 2950def S_MOVRELD_B32_vi : SOP1_Real_vi <0x2c, S_MOVRELD_B32>; 2951def S_MOVRELD_B64_vi : SOP1_Real_vi <0x2d, S_MOVRELD_B64>; 2952def S_CBRANCH_JOIN_vi : SOP1_Real_vi <0x2e, S_CBRANCH_JOIN>; 2953def S_ABS_I32_vi : SOP1_Real_vi <0x30, S_ABS_I32>; 2954def S_SET_GPR_IDX_IDX_vi : SOP1_Real_vi <0x32, S_SET_GPR_IDX_IDX>; 2955 2956def S_ADD_U32_vi : SOP2_Real_vi <0x00, S_ADD_U32>; 2957def S_ADD_I32_vi : SOP2_Real_vi <0x02, S_ADD_I32>; 2958def S_SUB_U32_vi : SOP2_Real_vi <0x01, S_SUB_U32>; 2959def S_SUB_I32_vi : SOP2_Real_vi <0x03, S_SUB_I32>; 2960def S_ADDC_U32_vi : SOP2_Real_vi <0x04, S_ADDC_U32>; 2961def S_SUBB_U32_vi : SOP2_Real_vi <0x05, S_SUBB_U32>; 2962def S_MIN_I32_vi : SOP2_Real_vi <0x06, S_MIN_I32>; 2963def S_MIN_U32_vi : SOP2_Real_vi <0x07, S_MIN_U32>; 2964def S_MAX_I32_vi : SOP2_Real_vi <0x08, S_MAX_I32>; 2965def S_MAX_U32_vi : SOP2_Real_vi <0x09, S_MAX_U32>; 2966def S_CSELECT_B32_vi : SOP2_Real_vi <0x0a, S_CSELECT_B32>; 2967def S_CSELECT_B64_vi : SOP2_Real_vi <0x0b, S_CSELECT_B64>; 2968def S_AND_B32_vi : SOP2_Real_vi <0x0c, S_AND_B32>; 2969def S_AND_B64_vi : SOP2_Real_vi <0x0d, S_AND_B64>; 2970def S_OR_B32_vi : SOP2_Real_vi <0x0e, S_OR_B32>; 2971def S_OR_B64_vi : SOP2_Real_vi <0x0f, S_OR_B64>; 2972def S_XOR_B32_vi : SOP2_Real_vi <0x10, S_XOR_B32>; 2973def S_XOR_B64_vi : SOP2_Real_vi <0x11, S_XOR_B64>; 2974def S_ANDN2_B32_vi : SOP2_Real_vi <0x12, S_ANDN2_B32>; 2975def S_ANDN2_B64_vi : SOP2_Real_vi <0x13, S_ANDN2_B64>; 2976def S_ORN2_B32_vi : SOP2_Real_vi <0x14, S_ORN2_B32>; 2977def S_ORN2_B64_vi : SOP2_Real_vi <0x15, S_ORN2_B64>; 2978def S_NAND_B32_vi : SOP2_Real_vi <0x16, S_NAND_B32>; 2979def S_NAND_B64_vi : SOP2_Real_vi <0x17, S_NAND_B64>; 2980def S_NOR_B32_vi : SOP2_Real_vi <0x18, S_NOR_B32>; 2981def S_NOR_B64_vi : SOP2_Real_vi <0x19, S_NOR_B64>; 2982def S_XNOR_B32_vi : SOP2_Real_vi <0x1a, S_XNOR_B32>; 2983def S_XNOR_B64_vi : SOP2_Real_vi <0x1b, S_XNOR_B64>; 2984def S_LSHL_B32_vi : SOP2_Real_vi <0x1c, S_LSHL_B32>; 2985def S_LSHL_B64_vi : SOP2_Real_vi <0x1d, S_LSHL_B64>; 2986def S_LSHR_B32_vi : SOP2_Real_vi <0x1e, S_LSHR_B32>; 2987def S_LSHR_B64_vi : SOP2_Real_vi <0x1f, S_LSHR_B64>; 2988def S_ASHR_I32_vi : SOP2_Real_vi <0x20, S_ASHR_I32>; 2989def S_ASHR_I64_vi : SOP2_Real_vi <0x21, S_ASHR_I64>; 2990def S_BFM_B32_vi : SOP2_Real_vi <0x22, S_BFM_B32>; 2991def S_BFM_B64_vi : SOP2_Real_vi <0x23, S_BFM_B64>; 2992def S_MUL_I32_vi : SOP2_Real_vi <0x24, S_MUL_I32>; 2993def S_BFE_U32_vi : SOP2_Real_vi <0x25, S_BFE_U32>; 2994def S_BFE_I32_vi : SOP2_Real_vi <0x26, S_BFE_I32>; 2995def S_BFE_U64_vi : SOP2_Real_vi <0x27, S_BFE_U64>; 2996def S_BFE_I64_vi : SOP2_Real_vi <0x28, S_BFE_I64>; 2997def S_CBRANCH_G_FORK_vi : SOP2_Real_vi <0x29, S_CBRANCH_G_FORK>; 2998def S_ABSDIFF_I32_vi : SOP2_Real_vi <0x2a, S_ABSDIFF_I32>; 2999def S_PACK_LL_B32_B16_vi : SOP2_Real_vi <0x32, S_PACK_LL_B32_B16>; 3000def S_PACK_LH_B32_B16_vi : SOP2_Real_vi <0x33, S_PACK_LH_B32_B16>; 3001def S_PACK_HH_B32_B16_vi : SOP2_Real_vi <0x34, S_PACK_HH_B32_B16>; 3002def S_RFE_RESTORE_B64_vi : SOP2_Real_vi <0x2b, S_RFE_RESTORE_B64>; 3003 3004def S_MOVK_I32_vi : SOPK_Real_vi <0x00, S_MOVK_I32>; 3005def S_CMOVK_I32_vi : SOPK_Real_vi <0x01, S_CMOVK_I32>; 3006def S_CMPK_EQ_I32_vi : SOPK_Real_vi <0x02, S_CMPK_EQ_I32>; 3007def S_CMPK_LG_I32_vi : SOPK_Real_vi <0x03, S_CMPK_LG_I32>; 3008def S_CMPK_GT_I32_vi : SOPK_Real_vi <0x04, S_CMPK_GT_I32>; 3009def S_CMPK_GE_I32_vi : SOPK_Real_vi <0x05, S_CMPK_GE_I32>; 3010def S_CMPK_LT_I32_vi : SOPK_Real_vi <0x06, S_CMPK_LT_I32>; 3011def S_CMPK_LE_I32_vi : SOPK_Real_vi <0x07, S_CMPK_LE_I32>; 3012def S_CMPK_EQ_U32_vi : SOPK_Real_vi <0x08, S_CMPK_EQ_U32>; 3013def S_CMPK_LG_U32_vi : SOPK_Real_vi <0x09, S_CMPK_LG_U32>; 3014def S_CMPK_GT_U32_vi : SOPK_Real_vi <0x0A, S_CMPK_GT_U32>; 3015def S_CMPK_GE_U32_vi : SOPK_Real_vi <0x0B, S_CMPK_GE_U32>; 3016def S_CMPK_LT_U32_vi : SOPK_Real_vi <0x0C, S_CMPK_LT_U32>; 3017def S_CMPK_LE_U32_vi : SOPK_Real_vi <0x0D, S_CMPK_LE_U32>; 3018def S_ADDK_I32_vi : SOPK_Real_vi <0x0E, S_ADDK_I32>; 3019def S_MULK_I32_vi : SOPK_Real_vi <0x0F, S_MULK_I32>; 3020def S_CBRANCH_I_FORK_vi : SOPK_Real_vi <0x10, S_CBRANCH_I_FORK>; 3021def S_GETREG_B32_vi : SOPK_Real_vi <0x11, S_GETREG_B32>; 3022def S_SETREG_B32_vi : SOPK_Real_vi <0x12, S_SETREG_B32>; 3023//def S_GETREG_REGRD_B32_vi : SOPK_Real_vi <0x13, S_GETREG_REGRD_B32>; // see pseudo for comments 3024def S_SETREG_IMM32_B32_vi : SOPK_Real64<0x14, S_SETREG_IMM32_B32>, 3025 Select_vi<S_SETREG_IMM32_B32.PseudoInstr>; 3026 3027def S_CALL_B64_vi : SOPK_Real_vi <0x15, S_CALL_B64>; 3028 3029//===----------------------------------------------------------------------===// 3030// SOP1 - GFX9. 3031//===----------------------------------------------------------------------===// 3032 3033def S_ANDN1_SAVEEXEC_B64_vi : SOP1_Real_vi<0x33, S_ANDN1_SAVEEXEC_B64>; 3034def S_ORN1_SAVEEXEC_B64_vi : SOP1_Real_vi<0x34, S_ORN1_SAVEEXEC_B64>; 3035def S_ANDN1_WREXEC_B64_vi : SOP1_Real_vi<0x35, S_ANDN1_WREXEC_B64>; 3036def S_ANDN2_WREXEC_B64_vi : SOP1_Real_vi<0x36, S_ANDN2_WREXEC_B64>; 3037def S_BITREPLICATE_B64_B32_vi : SOP1_Real_vi<0x37, S_BITREPLICATE_B64_B32>; 3038 3039//===----------------------------------------------------------------------===// 3040// SOP2 - GFX9. 3041//===----------------------------------------------------------------------===// 3042 3043def S_LSHL1_ADD_U32_vi : SOP2_Real_vi<0x2e, S_LSHL1_ADD_U32>; 3044def S_LSHL2_ADD_U32_vi : SOP2_Real_vi<0x2f, S_LSHL2_ADD_U32>; 3045def S_LSHL3_ADD_U32_vi : SOP2_Real_vi<0x30, S_LSHL3_ADD_U32>; 3046def S_LSHL4_ADD_U32_vi : SOP2_Real_vi<0x31, S_LSHL4_ADD_U32>; 3047def S_MUL_HI_U32_vi : SOP2_Real_vi<0x2c, S_MUL_HI_U32>; 3048def S_MUL_HI_I32_vi : SOP2_Real_vi<0x2d, S_MUL_HI_I32>; 3049