xref: /llvm-project/llvm/lib/Target/AMDGPU/SOPInstructions.td (revision 3def49cb64ec1298290724081bd37dbdeb2ea5f8)
1//===-- SOPInstructions.td - SOP Instruction Definitions ------------------===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8
9def GPRIdxMode : CustomOperand<i32>;
10
11class SOP_Pseudo<string opName, dag outs, dag ins, string asmOps,
12                  list<dag> pattern=[]> :
13    InstSI<outs, ins, "", pattern>,
14    SIMCInstr<opName, SIEncodingFamily.NONE> {
15
16  let isPseudo = 1;
17  let isCodeGenOnly = 1;
18  let Size = 4;
19
20  string Mnemonic = opName;
21  string AsmOperands = asmOps;
22
23  bits<1> has_sdst = 0;
24}
25
26//===----------------------------------------------------------------------===//
27// SOP1 Instructions
28//===----------------------------------------------------------------------===//
29
30class SOP1_Pseudo <string opName, dag outs, dag ins,
31                   string asmOps, list<dag> pattern=[]> :
32  SOP_Pseudo<opName, outs, ins, " " # asmOps, pattern> {
33
34  let mayLoad = 0;
35  let mayStore = 0;
36  let hasSideEffects = 0;
37  let SALU = 1;
38  let SOP1 = 1;
39  let SchedRW = [WriteSALU];
40  let UseNamedOperandTable = 1;
41
42  bits<1> has_src0 = 1;
43  let has_sdst = 1;
44}
45
46class SOP1_Real<bits<8> op, SOP1_Pseudo ps, string real_name = ps.Mnemonic> :
47  InstSI <ps.OutOperandList, ps.InOperandList,
48          real_name # ps.AsmOperands>,
49  Enc32 {
50
51  let SALU = 1;
52  let SOP1 = 1;
53  let isPseudo = 0;
54  let isCodeGenOnly = 0;
55  let Size = 4;
56
57  // copy relevant pseudo op flags
58  let SubtargetPredicate = ps.SubtargetPredicate;
59  let AsmMatchConverter  = ps.AsmMatchConverter;
60  let SchedRW            = ps.SchedRW;
61  let mayLoad            = ps.mayLoad;
62  let mayStore           = ps.mayStore;
63  let isTerminator       = ps.isTerminator;
64  let isReturn           = ps.isReturn;
65  let isCall             = ps.isCall;
66  let isBranch           = ps.isBranch;
67  let isBarrier          = ps.isBarrier;
68  let Uses               = ps.Uses;
69  let Defs               = ps.Defs;
70  let isConvergent       = ps.isConvergent;
71
72  // encoding
73  bits<7> sdst;
74  bits<8> src0;
75
76  let Inst{7-0} = !if(ps.has_src0, src0, ?);
77  let Inst{15-8} = op;
78  let Inst{22-16} = !if(ps.has_sdst, sdst, ?);
79  let Inst{31-23} = 0x17d; //encoding;
80}
81
82class SOP1_32 <string opName, list<dag> pattern=[], bit tied_in = 0> : SOP1_Pseudo <
83  opName, (outs SReg_32:$sdst),
84  !if(tied_in, (ins SSrc_b32:$src0, SReg_32:$sdst_in),
85               (ins SSrc_b32:$src0)),
86  "$sdst, $src0", pattern> {
87  let Constraints = !if(tied_in, "$sdst = $sdst_in", "");
88}
89
90// Only register input allowed.
91class SOP1_32R <string opName, list<dag> pattern=[]> : SOP1_Pseudo <
92  opName, (outs SReg_32:$sdst), (ins SReg_32:$src0),
93  "$sdst, $src0", pattern>;
94
95// 32-bit input, no output.
96class SOP1_0_32 <string opName, list<dag> pattern = []> : SOP1_Pseudo <
97  opName, (outs), (ins SSrc_b32:$src0),
98  "$src0", pattern> {
99  let has_sdst = 0;
100}
101
102// Special case for movreld where sdst is treated as a use operand.
103class SOP1_32_movreld <string opName, list<dag> pattern=[]> : SOP1_Pseudo <
104  opName, (outs), (ins SReg_32:$sdst, SSrc_b32:$src0),
105  "$sdst, $src0", pattern>;
106
107// Special case for movreld where sdst is treated as a use operand.
108class SOP1_64_movreld <string opName, list<dag> pattern=[]> : SOP1_Pseudo <
109  opName, (outs), (ins SReg_64:$sdst, SSrc_b64:$src0),
110  "$sdst, $src0", pattern
111>;
112
113class SOP1_0_32R <string opName, list<dag> pattern = []> : SOP1_Pseudo <
114  opName, (outs), (ins SReg_32:$src0),
115  "$src0", pattern> {
116  let has_sdst = 0;
117}
118
119class SOP1_64 <string opName, list<dag> pattern=[]> : SOP1_Pseudo <
120  opName, (outs SReg_64:$sdst), (ins SSrc_b64:$src0),
121  "$sdst, $src0", pattern
122>;
123
124// Only register input allowed.
125class SOP1_64R <string opName, list<dag> pattern=[]> : SOP1_Pseudo <
126  opName, (outs SReg_64:$sdst), (ins SReg_64:$src0),
127  "$sdst, $src0", pattern
128>;
129
130// 64-bit input, 32-bit output.
131class SOP1_32_64 <string opName, list<dag> pattern=[]> : SOP1_Pseudo <
132  opName, (outs SReg_32:$sdst), (ins SSrc_b64:$src0),
133  "$sdst, $src0", pattern
134>;
135
136// 32-bit input, 64-bit output.
137class SOP1_64_32 <string opName, list<dag> pattern=[], bit tied_in = 0> : SOP1_Pseudo <
138  opName, (outs SReg_64:$sdst),
139  !if(tied_in, (ins SSrc_b32:$src0, SReg_64:$sdst_in),
140               (ins SSrc_b32:$src0)),
141  "$sdst, $src0", pattern> {
142  let Constraints = !if(tied_in, "$sdst = $sdst_in", "");
143}
144
145// no input, 64-bit output.
146class SOP1_64_0 <string opName, list<dag> pattern=[]> : SOP1_Pseudo <
147  opName, (outs SReg_64:$sdst), (ins), "$sdst", pattern> {
148  let has_src0 = 0;
149}
150
151// 64-bit input, no output
152class SOP1_1 <string opName, list<dag> pattern=[]> : SOP1_Pseudo <
153  opName, (outs), (ins SReg_64:$src0), "$src0", pattern> {
154  let has_sdst = 0;
155}
156
157
158class UniformUnaryFrag<SDPatternOperator Op> : PatFrag <
159  (ops node:$src0),
160  (Op $src0),
161  [{ return !N->isDivergent(); }]> {
162  // This check is unnecessary as it's captured by the result register
163  // bank constraint.
164  //
165  // FIXME: Should add a way for the emitter to recognize this is a
166  // trivially true predicate to eliminate the check.
167  let GISelPredicateCode = [{return true;}];
168}
169
170class UniformBinFrag<SDPatternOperator Op> : PatFrag <
171  (ops node:$src0, node:$src1),
172  (Op $src0, $src1),
173  [{ return !N->isDivergent(); }]> {
174  // This check is unnecessary as it's captured by the result register
175  // bank constraint.
176  //
177  // FIXME: Should add a way for the emitter to recognize this is a
178  // trivially true predicate to eliminate the check.
179  let GISelPredicateCode = [{return true;}];
180}
181
182class UniformTernaryFrag<SDPatternOperator Op> : PatFrag <
183  (ops node:$src0, node:$src1, node:$src2),
184  (Op $src0, $src1, $src2),
185  [{ return !N->isDivergent(); }]> {
186  // This check is unnecessary as it's captured by the result register
187  // bank constraint.
188  //
189  // FIXME: Should add a way for the emitter to recognize this is a
190  // trivially true predicate to eliminate the check.
191  let GISelPredicateCode = [{return true;}];
192}
193
194class DivergentBinFrag<SDPatternOperator Op> : PatFrag <
195  (ops node:$src0, node:$src1),
196  (Op $src0, $src1),
197  [{ return N->isDivergent(); }]> {
198  // This check is unnecessary as it's captured by the result register
199  // bank constraint.
200  //
201  // FIXME: Should add a way for the emitter to recognize this is a
202  // trivially true predicate to eliminate the check.
203  let GISelPredicateCode = [{return true;}];
204}
205
206
207let isMoveImm = 1 in {
208  let isReMaterializable = 1, isAsCheapAsAMove = 1 in {
209    def S_MOV_B32 : SOP1_32 <"s_mov_b32">;
210    def S_MOV_B64 : SOP1_64 <"s_mov_b64">;
211  } // End isReMaterializable = 1
212
213  let Uses = [SCC] in {
214    def S_CMOV_B32 : SOP1_32 <"s_cmov_b32">;
215    def S_CMOV_B64 : SOP1_64 <"s_cmov_b64">;
216  } // End Uses = [SCC]
217} // End isMoveImm = 1
218
219// Variant of S_MOV_B32 used for reading from volatile registers like
220// SRC_POPS_EXITING_WAVE_ID.
221let hasSideEffects = 1 in
222def S_MOV_B32_sideeffects : SOP1_32 <"s_mov_b32">;
223
224let Defs = [SCC] in {
225  def S_NOT_B32 : SOP1_32 <"s_not_b32",
226    [(set i32:$sdst, (UniformUnaryFrag<not> i32:$src0))]
227  >;
228
229  def S_NOT_B64 : SOP1_64 <"s_not_b64",
230    [(set i64:$sdst, (UniformUnaryFrag<not> i64:$src0))]
231  >;
232  def S_WQM_B32 : SOP1_32 <"s_wqm_b32",
233    [(set i32:$sdst, (int_amdgcn_s_wqm i32:$src0))]>;
234  def S_WQM_B64 : SOP1_64 <"s_wqm_b64",
235    [(set i64:$sdst, (int_amdgcn_s_wqm i64:$src0))]>;
236} // End Defs = [SCC]
237
238
239let WaveSizePredicate = isWave32 in {
240def : GCNPat <
241  (int_amdgcn_wqm_vote i1:$src0),
242  (S_WQM_B32 SSrc_b32:$src0)
243>;
244}
245
246let WaveSizePredicate = isWave64 in {
247def : GCNPat <
248  (int_amdgcn_wqm_vote i1:$src0),
249  (S_WQM_B64 SSrc_b64:$src0)
250>;
251}
252
253let isReMaterializable = 1, isAsCheapAsAMove = 1 in {
254def S_BREV_B32 : SOP1_32 <"s_brev_b32",
255  [(set i32:$sdst, (UniformUnaryFrag<bitreverse> i32:$src0))]
256>;
257def S_BREV_B64 : SOP1_64 <"s_brev_b64",
258  [(set i64:$sdst, (UniformUnaryFrag<bitreverse> i64:$src0))]
259>;
260} // End isReMaterializable = 1, isAsCheapAsAMove = 1
261
262let Defs = [SCC] in {
263def S_BCNT0_I32_B32 : SOP1_32 <"s_bcnt0_i32_b32">;
264def S_BCNT0_I32_B64 : SOP1_32_64 <"s_bcnt0_i32_b64">;
265def S_BCNT1_I32_B32 : SOP1_32 <"s_bcnt1_i32_b32",
266  [(set i32:$sdst, (UniformUnaryFrag<ctpop> i32:$src0))]
267>;
268def S_BCNT1_I32_B64 : SOP1_32_64 <"s_bcnt1_i32_b64",
269  [(set i32:$sdst, (UniformUnaryFrag<ctpop> i64:$src0))]
270>;
271} // End Defs = [SCC]
272
273let isReMaterializable = 1 in {
274def S_FF0_I32_B32 : SOP1_32 <"s_ff0_i32_b32">;
275def S_FF0_I32_B64 : SOP1_32_64 <"s_ff0_i32_b64">;
276def S_FF1_I32_B64 : SOP1_32_64 <"s_ff1_i32_b64",
277  [(set i32:$sdst, (UniformUnaryFrag<AMDGPUffbl_b32> i64:$src0))]
278>;
279
280def S_FF1_I32_B32 : SOP1_32 <"s_ff1_i32_b32",
281  [(set i32:$sdst, (UniformUnaryFrag<AMDGPUffbl_b32> i32:$src0))]
282>;
283
284def S_FLBIT_I32_B32 : SOP1_32 <"s_flbit_i32_b32",
285  [(set i32:$sdst, (UniformUnaryFrag<AMDGPUffbh_u32> i32:$src0))]
286>;
287
288def S_FLBIT_I32_B64 : SOP1_32_64 <"s_flbit_i32_b64",
289  [(set i32:$sdst, (UniformUnaryFrag<AMDGPUffbh_u32> i64:$src0))]
290>;
291def S_FLBIT_I32 : SOP1_32 <"s_flbit_i32",
292  [(set i32:$sdst, (UniformUnaryFrag<AMDGPUffbh_i32> i32:$src0))]
293>;
294def S_FLBIT_I32_I64 : SOP1_32_64 <"s_flbit_i32_i64">;
295def S_SEXT_I32_I8 : SOP1_32 <"s_sext_i32_i8",
296  [(set i32:$sdst, (UniformSextInreg<i8> i32:$src0))]
297>;
298def S_SEXT_I32_I16 : SOP1_32 <"s_sext_i32_i16",
299  [(set i32:$sdst, (UniformSextInreg<i16> i32:$src0))]
300>;
301} // End isReMaterializable = 1
302
303def S_BITSET0_B32 : SOP1_32    <"s_bitset0_b32", [], 1>;
304def S_BITSET0_B64 : SOP1_64_32 <"s_bitset0_b64", [], 1>;
305def S_BITSET1_B32 : SOP1_32    <"s_bitset1_b32", [], 1>;
306def S_BITSET1_B64 : SOP1_64_32 <"s_bitset1_b64", [], 1>;
307
308def S_GETPC_B64 : SOP1_64_0  <"s_getpc_b64">;
309// PSEUDO includes a workaround for a hardware anomaly where some ASICs
310// zero-extend the result from 48 bits instead of sign-extending.
311let isReMaterializable = 1 in
312def S_GETPC_B64_pseudo : SOP1_64_0  <"s_getpc_b64",
313  [(set i64:$sdst, (int_amdgcn_s_getpc))]
314>;
315
316let isTerminator = 1, isBarrier = 1, SchedRW = [WriteBranch] in {
317
318let isBranch = 1, isIndirectBranch = 1 in {
319def S_SETPC_B64 : SOP1_1  <"s_setpc_b64">;
320} // End isBranch = 1, isIndirectBranch = 1
321
322let isReturn = 1 in {
323// Define variant marked as return rather than branch.
324def S_SETPC_B64_return : SOP1_1<"">;
325}
326} // End isTerminator = 1, isBarrier = 1
327
328let isCall = 1 in {
329def S_SWAPPC_B64 : SOP1_64 <"s_swappc_b64"
330>;
331}
332
333def S_RFE_B64 : SOP1_1  <"s_rfe_b64">;
334
335let hasSideEffects = 1, Uses = [EXEC], Defs = [EXEC, SCC] in {
336
337def S_AND_SAVEEXEC_B64 : SOP1_64 <"s_and_saveexec_b64">;
338def S_OR_SAVEEXEC_B64 : SOP1_64 <"s_or_saveexec_b64">;
339def S_XOR_SAVEEXEC_B64 : SOP1_64 <"s_xor_saveexec_b64">;
340def S_ANDN2_SAVEEXEC_B64 : SOP1_64 <"s_andn2_saveexec_b64">;
341def S_ORN2_SAVEEXEC_B64 : SOP1_64 <"s_orn2_saveexec_b64">;
342def S_NAND_SAVEEXEC_B64 : SOP1_64 <"s_nand_saveexec_b64">;
343def S_NOR_SAVEEXEC_B64 : SOP1_64 <"s_nor_saveexec_b64">;
344def S_XNOR_SAVEEXEC_B64 : SOP1_64 <"s_xnor_saveexec_b64">;
345
346} // End hasSideEffects = 1, Uses = [EXEC], Defs = [EXEC, SCC]
347
348def S_QUADMASK_B32 : SOP1_32 <"s_quadmask_b32",
349  [(set i32:$sdst, (int_amdgcn_s_quadmask i32:$src0))]>;
350def S_QUADMASK_B64 : SOP1_64 <"s_quadmask_b64",
351  [(set i64:$sdst, (int_amdgcn_s_quadmask i64:$src0))]>;
352
353let Uses = [M0] in {
354def S_MOVRELS_B32 : SOP1_32R <"s_movrels_b32">;
355def S_MOVRELS_B64 : SOP1_64R <"s_movrels_b64">;
356def S_MOVRELD_B32 : SOP1_32_movreld <"s_movreld_b32">;
357def S_MOVRELD_B64 : SOP1_64_movreld <"s_movreld_b64">;
358} // End Uses = [M0]
359
360let SubtargetPredicate = isGFX6GFX7GFX8GFX9 in {
361def S_CBRANCH_JOIN : SOP1_0_32R <"s_cbranch_join">;
362} // End SubtargetPredicate = isGFX6GFX7GFX8GFX9
363
364let Defs = [SCC] in {
365def S_ABS_I32 : SOP1_32 <"s_abs_i32",
366    [(set i32:$sdst, (UniformUnaryFrag<abs> i32:$src0))]
367  >;
368} // End Defs = [SCC]
369
370let SubtargetPredicate = HasVGPRIndexMode in {
371def S_SET_GPR_IDX_IDX : SOP1_0_32<"s_set_gpr_idx_idx"> {
372  let Uses = [M0, MODE];
373  let Defs = [M0, MODE];
374}
375}
376
377let SubtargetPredicate = isGFX9Plus in {
378  let hasSideEffects = 1, Defs = [EXEC, SCC], Uses = [EXEC] in {
379    def S_ANDN1_SAVEEXEC_B64 : SOP1_64<"s_andn1_saveexec_b64">;
380    def S_ORN1_SAVEEXEC_B64  : SOP1_64<"s_orn1_saveexec_b64">;
381    def S_ANDN1_WREXEC_B64   : SOP1_64<"s_andn1_wrexec_b64">;
382    def S_ANDN2_WREXEC_B64   : SOP1_64<"s_andn2_wrexec_b64">;
383  } // End hasSideEffects = 1, Defs = [EXEC, SCC], Uses = [EXEC]
384
385  let isReMaterializable = 1 in
386  def S_BITREPLICATE_B64_B32 : SOP1_64_32<"s_bitreplicate_b64_b32",
387  [(set i64:$sdst, (int_amdgcn_s_bitreplicate i32:$src0))]>;
388} // End SubtargetPredicate = isGFX9Plus
389
390let SubtargetPredicate = isGFX10Plus in {
391  let hasSideEffects = 1, Defs = [EXEC, SCC], Uses = [EXEC] in {
392    def S_AND_SAVEEXEC_B32   : SOP1_32<"s_and_saveexec_b32">;
393    def S_OR_SAVEEXEC_B32    : SOP1_32<"s_or_saveexec_b32">;
394    def S_XOR_SAVEEXEC_B32   : SOP1_32<"s_xor_saveexec_b32">;
395    def S_ANDN2_SAVEEXEC_B32 : SOP1_32<"s_andn2_saveexec_b32">;
396    def S_ORN2_SAVEEXEC_B32  : SOP1_32<"s_orn2_saveexec_b32">;
397    def S_NAND_SAVEEXEC_B32  : SOP1_32<"s_nand_saveexec_b32">;
398    def S_NOR_SAVEEXEC_B32   : SOP1_32<"s_nor_saveexec_b32">;
399    def S_XNOR_SAVEEXEC_B32  : SOP1_32<"s_xnor_saveexec_b32">;
400    def S_ANDN1_SAVEEXEC_B32 : SOP1_32<"s_andn1_saveexec_b32">;
401    def S_ORN1_SAVEEXEC_B32  : SOP1_32<"s_orn1_saveexec_b32">;
402    def S_ANDN1_WREXEC_B32   : SOP1_32<"s_andn1_wrexec_b32">;
403    def S_ANDN2_WREXEC_B32   : SOP1_32<"s_andn2_wrexec_b32">;
404  } // End hasSideEffects = 1, Defs = [EXEC, SCC], Uses = [EXEC]
405
406  let Uses = [M0] in {
407    def S_MOVRELSD_2_B32 : SOP1_32<"s_movrelsd_2_b32">;
408  } // End Uses = [M0]
409} // End SubtargetPredicate = isGFX10Plus
410
411let SubtargetPredicate = isGFX11Plus in {
412  let hasSideEffects = 1 in {
413    // For s_sendmsg_rtn_* the src0 field encodes the message type directly; it
414    // is not an SGPR number.
415    def S_SENDMSG_RTN_B32 : SOP1_Pseudo<
416      "s_sendmsg_rtn_b32", (outs SReg_32:$sdst), (ins SendMsg:$src0),
417      "$sdst, $src0", [(set i32:$sdst, (int_amdgcn_s_sendmsg_rtn timm:$src0))]
418    >;
419    def S_SENDMSG_RTN_B64 : SOP1_Pseudo<
420      "s_sendmsg_rtn_b64", (outs SReg_64:$sdst), (ins SendMsg:$src0),
421      "$sdst, $src0", [(set i64:$sdst, (int_amdgcn_s_sendmsg_rtn timm:$src0))]
422    >;
423  }
424} // End SubtargetPredicate = isGFX11Plus
425
426class SOP1_F32_Inst<string opName, SDPatternOperator Op, ValueType vt0=f32,
427                    ValueType vt1=vt0> :
428  SOP1_32<opName, [(set vt0:$sdst, (UniformUnaryFrag<Op> vt1:$src0))]>;
429
430let SubtargetPredicate = HasSALUFloatInsts, Uses = [MODE],
431    SchedRW = [WriteSFPU], isReMaterializable = 1 in {
432  def S_CVT_F32_I32 : SOP1_F32_Inst<"s_cvt_f32_i32", sint_to_fp, f32, i32>;
433  def S_CVT_F32_U32 : SOP1_F32_Inst<"s_cvt_f32_u32", uint_to_fp, f32, i32>;
434
435  let mayRaiseFPException = 1 in {
436    def S_CVT_I32_F32    : SOP1_F32_Inst<"s_cvt_i32_f32", fp_to_sint, i32, f32>;
437    def S_CVT_U32_F32    : SOP1_F32_Inst<"s_cvt_u32_f32", fp_to_uint, i32, f32>;
438    def S_CVT_F32_F16    : SOP1_F32_Inst<"s_cvt_f32_f16", fpextend, f32, f16>;
439    def S_CVT_HI_F32_F16 : SOP1_32<"s_cvt_hi_f32_f16">;
440
441    def S_CEIL_F32  : SOP1_F32_Inst<"s_ceil_f32", fceil>;
442    def S_FLOOR_F32 : SOP1_F32_Inst<"s_floor_f32", ffloor>;
443    def S_TRUNC_F32 : SOP1_F32_Inst<"s_trunc_f32", ftrunc>;
444    def S_RNDNE_F32 : SOP1_F32_Inst<"s_rndne_f32", froundeven>;
445
446    let FPDPRounding = 1 in
447      def S_CVT_F16_F32 : SOP1_F32_Inst<"s_cvt_f16_f32", fpround, f16, f32>;
448
449    def S_CEIL_F16  : SOP1_F32_Inst<"s_ceil_f16", fceil, f16>;
450    def S_FLOOR_F16 : SOP1_F32_Inst<"s_floor_f16", ffloor, f16>;
451    def S_TRUNC_F16 : SOP1_F32_Inst<"s_trunc_f16", ftrunc, f16>;
452    def S_RNDNE_F16 : SOP1_F32_Inst<"s_rndne_f16", froundeven, f16>;
453  } // End mayRaiseFPException = 1
454} // End SubtargetPredicate = HasSALUFloatInsts, Uses = [MODE]
455  // SchedRW = [WriteSFPU], isReMaterializable = 1
456
457let hasSideEffects = 1 in {
458let has_sdst = 0 in {
459let Uses = [M0] in {
460def S_BARRIER_SIGNAL_M0 : SOP1_Pseudo <"s_barrier_signal m0", (outs), (ins),
461  "", []>{
462  let SchedRW = [WriteBarrier];
463  let isConvergent = 1;
464}
465
466def S_BARRIER_SIGNAL_ISFIRST_M0 : SOP1_Pseudo <"s_barrier_signal_isfirst m0", (outs), (ins),
467  "", []>{
468  let Defs = [SCC];
469  let SchedRW = [WriteBarrier];
470  let isConvergent = 1;
471}
472
473def S_BARRIER_INIT_M0 : SOP1_Pseudo <"s_barrier_init m0", (outs), (ins),
474  "", []>{
475  let SchedRW = [WriteBarrier];
476  let isConvergent = 1;
477}
478
479def S_BARRIER_INIT_IMM : SOP1_Pseudo <"s_barrier_init", (outs),
480  (ins SplitBarrier:$src0), "$src0", []>{
481  let SchedRW = [WriteBarrier];
482  let isConvergent = 1;
483}
484
485def S_BARRIER_JOIN_M0 : SOP1_Pseudo <"s_barrier_join m0", (outs), (ins),
486  "", []>{
487  let SchedRW = [WriteBarrier];
488  let isConvergent = 1;
489}
490
491} // End Uses = [M0]
492
493def S_BARRIER_SIGNAL_IMM : SOP1_Pseudo <"s_barrier_signal", (outs),
494  (ins SplitBarrier:$src0), "$src0", [(int_amdgcn_s_barrier_signal timm:$src0)]>{
495  let SchedRW = [WriteBarrier];
496  let isConvergent = 1;
497}
498
499def S_BARRIER_SIGNAL_ISFIRST_IMM : SOP1_Pseudo <"s_barrier_signal_isfirst", (outs),
500  (ins SplitBarrier:$src0), "$src0", [(set SCC, (int_amdgcn_s_barrier_signal_isfirst timm:$src0))]>{
501  let Defs = [SCC];
502  let SchedRW = [WriteBarrier];
503  let isConvergent = 1;
504}
505
506def S_BARRIER_JOIN_IMM : SOP1_Pseudo <"s_barrier_join", (outs),
507  (ins SplitBarrier:$src0), "$src0", []>{
508  let SchedRW = [WriteBarrier];
509  let isConvergent = 1;
510}
511
512} // End has_sdst = 0
513
514def S_GET_BARRIER_STATE_IMM : SOP1_Pseudo <"s_get_barrier_state", (outs SSrc_b32:$sdst),
515  (ins SplitBarrier:$src0), "$sdst, $src0", []>{
516  let SchedRW = [WriteBarrier];
517  let isConvergent = 1;
518}
519
520def S_GET_BARRIER_STATE_M0 : SOP1_Pseudo <"s_get_barrier_state $sdst, m0", (outs SSrc_b32:$sdst),
521  (ins), "", []>{
522  let Uses = [M0];
523  let SchedRW = [WriteBarrier];
524  let isConvergent = 1;
525}
526} // End hasSideEffects = 1
527
528//===----------------------------------------------------------------------===//
529// SOP2 Instructions
530//===----------------------------------------------------------------------===//
531
532class SOP2_Pseudo<string opName, dag outs, dag ins,
533                  string asmOps, list<dag> pattern=[]> :
534  SOP_Pseudo<opName, outs, ins, " " # asmOps, pattern> {
535
536  let mayLoad = 0;
537  let mayStore = 0;
538  let hasSideEffects = 0;
539  let SALU = 1;
540  let SOP2 = 1;
541  let SchedRW = [WriteSALU];
542  let UseNamedOperandTable = 1;
543
544  let has_sdst = 1;
545
546  // Pseudo instructions have no encodings, but adding this field here allows
547  // us to do:
548  // let sdst = xxx in {
549  // for multiclasses that include both real and pseudo instructions.
550  // field bits<7> sdst = 0;
551}
552
553class SOP2_Real<SOP_Pseudo ps, string name = ps.Mnemonic> :
554  InstSI <ps.OutOperandList, ps.InOperandList,
555          name # ps.AsmOperands> {
556  let SALU = 1;
557  let SOP2 = 1;
558  let isPseudo = 0;
559  let isCodeGenOnly = 0;
560
561  // copy relevant pseudo op flags
562  let SubtargetPredicate   = ps.SubtargetPredicate;
563  let AsmMatchConverter    = ps.AsmMatchConverter;
564  let UseNamedOperandTable = ps.UseNamedOperandTable;
565  let TSFlags              = ps.TSFlags;
566  let SchedRW              = ps.SchedRW;
567  let mayLoad              = ps.mayLoad;
568  let mayStore             = ps.mayStore;
569  let Constraints          = ps.Constraints;
570  let DisableEncoding      = ps.DisableEncoding;
571  let Uses                 = ps.Uses;
572  let Defs                 = ps.Defs;
573  let isConvergent         = ps.isConvergent;
574
575  // encoding
576  bits<7> sdst;
577  bits<8> src0;
578  bits<8> src1;
579  bits<32> imm;
580}
581
582class SOP2_Real32<bits<7> op, SOP_Pseudo ps, string name = ps.Mnemonic> :
583  SOP2_Real<ps, name>, Enc32 {
584  let Inst{7-0}   = src0;
585  let Inst{15-8}  = src1;
586  let Inst{22-16} = !if(ps.has_sdst, sdst, ?);
587  let Inst{29-23} = op;
588  let Inst{31-30} = 0x2; // encoding
589}
590
591class SOP2_Real64<bits<7> op, SOP_Pseudo ps, string name = ps.Mnemonic> :
592  SOP2_Real<ps, name>, Enc64 {
593  let Inst{7-0}   = src0;
594  let Inst{15-8}  = src1;
595  let Inst{22-16} = !if(ps.has_sdst, sdst, ?);
596  let Inst{29-23} = op;
597  let Inst{31-30} = 0x2; // encoding
598  let Inst{63-32} = imm;
599}
600
601class SOP2_F16 <string opName, list<dag> pattern=[]> : SOP2_Pseudo <
602  opName, (outs SReg_32:$sdst), (ins SSrc_f16:$src0, SSrc_f16:$src1),
603  "$sdst, $src0, $src1", pattern
604>;
605
606class SOP2_32 <string opName, list<dag> pattern=[]> : SOP2_Pseudo <
607  opName, (outs SReg_32:$sdst), (ins SSrc_b32:$src0, SSrc_b32:$src1),
608  "$sdst, $src0, $src1", pattern
609>;
610
611class SOP2_F32 <string opName, list<dag> pattern=[]> : SOP2_Pseudo <
612  opName, (outs SReg_32:$sdst), (ins SSrc_f32:$src0, SSrc_f32:$src1),
613  "$sdst, $src0, $src1", pattern
614>;
615
616class SOP2_64 <string opName, list<dag> pattern=[]> : SOP2_Pseudo <
617  opName, (outs SReg_64:$sdst), (ins SSrc_b64:$src0, SSrc_b64:$src1),
618  "$sdst, $src0, $src1", pattern
619>;
620
621class SOP2_64_32 <string opName, list<dag> pattern=[]> : SOP2_Pseudo <
622  opName, (outs SReg_64:$sdst), (ins SSrc_b64:$src0, SSrc_b32:$src1),
623  "$sdst, $src0, $src1", pattern
624>;
625
626class SOP2_64_32_32 <string opName, list<dag> pattern=[]> : SOP2_Pseudo <
627  opName, (outs SReg_64:$sdst), (ins SSrc_b32:$src0, SSrc_b32:$src1),
628  "$sdst, $src0, $src1", pattern
629>;
630
631
632let Defs = [SCC] in { // Carry out goes to SCC
633let isCommutable = 1, isAdd = 1 in {
634def S_ADD_U32 : SOP2_32 <"s_add_u32">;
635def S_ADD_I32 : SOP2_32 <"s_add_i32",
636  [(set i32:$sdst, (UniformBinFrag<add> SSrc_b32:$src0, SSrc_b32:$src1))]
637>;
638} // End isCommutable = 1, isAdd = 1
639
640def S_SUB_U32 : SOP2_32 <"s_sub_u32">;
641def S_SUB_I32 : SOP2_32 <"s_sub_i32",
642  [(set i32:$sdst, (UniformBinFrag<sub> SSrc_b32:$src0, SSrc_b32:$src1))]
643>;
644
645let Uses = [SCC] in { // Carry in comes from SCC
646let isCommutable = 1 in {
647def S_ADDC_U32 : SOP2_32 <"s_addc_u32",
648  [(set i32:$sdst, (UniformBinFrag<adde> (i32 SSrc_b32:$src0), (i32 SSrc_b32:$src1)))]>;
649} // End isCommutable = 1
650
651def S_SUBB_U32 : SOP2_32 <"s_subb_u32",
652  [(set i32:$sdst, (UniformBinFrag<sube> (i32 SSrc_b32:$src0), (i32 SSrc_b32:$src1)))]>;
653} // End Uses = [SCC]
654
655let isCommutable = 1 in {
656def S_MIN_I32 : SOP2_32 <"s_min_i32",
657  [(set i32:$sdst, (UniformBinFrag<smin> i32:$src0, i32:$src1))]
658>;
659def S_MIN_U32 : SOP2_32 <"s_min_u32",
660  [(set i32:$sdst, (UniformBinFrag<umin> i32:$src0, i32:$src1))]
661>;
662def S_MAX_I32 : SOP2_32 <"s_max_i32",
663  [(set i32:$sdst, (UniformBinFrag<smax> i32:$src0, i32:$src1))]
664>;
665def S_MAX_U32 : SOP2_32 <"s_max_u32",
666  [(set i32:$sdst, (UniformBinFrag<umax> i32:$src0, i32:$src1))]
667>;
668} // End isCommutable = 1
669} // End Defs = [SCC]
670
671let SubtargetPredicate = isGFX12Plus in {
672  def S_ADD_U64 : SOP2_64<"s_add_u64">{
673    let isCommutable = 1;
674  }
675
676  def S_SUB_U64 : SOP2_64<"s_sub_u64">;
677
678  def S_MUL_U64 : SOP2_64 <"s_mul_u64",
679    [(set i64:$sdst, (UniformBinFrag<mul> i64:$src0, i64:$src1))]> {
680    let isCommutable = 1;
681  }
682
683  // The higher 32-bits of the inputs contain the sign extension bits.
684  def S_MUL_I64_I32_PSEUDO : SPseudoInstSI <
685    (outs SReg_64:$sdst), (ins SSrc_b64:$src0, SSrc_b64:$src1)
686  >;
687
688  // The higher 32-bits of the inputs are zero.
689  def S_MUL_U64_U32_PSEUDO : SPseudoInstSI <
690    (outs SReg_64:$sdst), (ins SSrc_b64:$src0, SSrc_b64:$src1)
691  >;
692
693} // End SubtargetPredicate = isGFX12Plus
694
695let Uses = [SCC] in {
696  def S_CSELECT_B32 : SOP2_32 <"s_cselect_b32">;
697  def S_CSELECT_B64 : SOP2_64 <"s_cselect_b64">;
698} // End Uses = [SCC]
699
700let Defs = [SCC] in {
701let isCommutable = 1 in {
702def S_AND_B32 : SOP2_32 <"s_and_b32",
703  [(set i32:$sdst, (UniformBinFrag<and> i32:$src0, i32:$src1))]
704>;
705
706def S_AND_B64 : SOP2_64 <"s_and_b64",
707  [(set i64:$sdst, (UniformBinFrag<and> i64:$src0, i64:$src1))]
708>;
709
710def S_OR_B32 : SOP2_32 <"s_or_b32",
711  [(set i32:$sdst, (UniformBinFrag<or> i32:$src0, i32:$src1))]
712>;
713
714def S_OR_B64 : SOP2_64 <"s_or_b64",
715  [(set i64:$sdst, (UniformBinFrag<or> i64:$src0, i64:$src1))]
716>;
717
718def S_XOR_B32 : SOP2_32 <"s_xor_b32",
719  [(set i32:$sdst, (UniformBinFrag<xor> i32:$src0, i32:$src1))]
720>;
721
722def S_XOR_B64 : SOP2_64 <"s_xor_b64",
723  [(set i64:$sdst, (UniformBinFrag<xor> i64:$src0, i64:$src1))]
724>;
725
726def S_XNOR_B32 : SOP2_32 <"s_xnor_b32",
727  [(set i32:$sdst, (UniformUnaryFrag<not> (xor_oneuse i32:$src0, i32:$src1)))]
728>;
729
730def S_XNOR_B64 : SOP2_64 <"s_xnor_b64",
731  [(set i64:$sdst, (UniformUnaryFrag<not> (xor_oneuse i64:$src0, i64:$src1)))]
732>;
733
734def S_NAND_B32 : SOP2_32 <"s_nand_b32",
735  [(set i32:$sdst, (UniformUnaryFrag<not> (and_oneuse i32:$src0, i32:$src1)))]
736>;
737
738def S_NAND_B64 : SOP2_64 <"s_nand_b64",
739  [(set i64:$sdst, (UniformUnaryFrag<not> (and_oneuse i64:$src0, i64:$src1)))]
740>;
741
742def S_NOR_B32 : SOP2_32 <"s_nor_b32",
743  [(set i32:$sdst, (UniformUnaryFrag<not> (or_oneuse i32:$src0, i32:$src1)))]
744>;
745
746def S_NOR_B64 : SOP2_64 <"s_nor_b64",
747  [(set i64:$sdst, (UniformUnaryFrag<not> (or_oneuse i64:$src0, i64:$src1)))]
748>;
749} // End isCommutable = 1
750
751// There are also separate patterns for types other than i32
752def S_ANDN2_B32 : SOP2_32 <"s_andn2_b32",
753  [(set i32:$sdst, (UniformBinFrag<and> i32:$src0, (not i32:$src1)))]
754>;
755
756def S_ANDN2_B64 : SOP2_64 <"s_andn2_b64",
757  [(set i64:$sdst, (UniformBinFrag<and> i64:$src0, (not i64:$src1)))]
758>;
759
760def S_ORN2_B32 : SOP2_32 <"s_orn2_b32",
761  [(set i32:$sdst, (UniformBinFrag<or> i32:$src0, (not i32:$src1)))]
762>;
763
764def S_ORN2_B64 : SOP2_64 <"s_orn2_b64",
765  [(set i64:$sdst, (UniformBinFrag<or> i64:$src0, (not i64:$src1)))]
766>;
767} // End Defs = [SCC]
768
769// Use added complexity so these patterns are preferred to the VALU patterns.
770let AddedComplexity = 1 in {
771
772let Defs = [SCC] in {
773// TODO: b64 versions require VOP3 change since v_lshlrev_b64 is VOP3
774def S_LSHL_B32 : SOP2_32 <"s_lshl_b32",
775  [(set SReg_32:$sdst, (UniformBinFrag<cshl_32> (i32 SSrc_b32:$src0), (i32 SSrc_b32:$src1)))]
776>;
777def S_LSHL_B64 : SOP2_64_32 <"s_lshl_b64",
778  [(set SReg_64:$sdst, (UniformBinFrag<cshl_64> (i64 SSrc_b64:$src0), (i32 SSrc_b32:$src1)))]
779>;
780def S_LSHR_B32 : SOP2_32 <"s_lshr_b32",
781  [(set SReg_32:$sdst, (UniformBinFrag<csrl_32> (i32 SSrc_b32:$src0), (i32 SSrc_b32:$src1)))]
782>;
783def S_LSHR_B64 : SOP2_64_32 <"s_lshr_b64",
784  [(set SReg_64:$sdst, (UniformBinFrag<csrl_64> (i64 SSrc_b64:$src0), (i32 SSrc_b32:$src1)))]
785>;
786def S_ASHR_I32 : SOP2_32 <"s_ashr_i32",
787  [(set SReg_32:$sdst, (UniformBinFrag<csra_32> (i32 SSrc_b32:$src0), (i32 SSrc_b32:$src1)))]
788>;
789def S_ASHR_I64 : SOP2_64_32 <"s_ashr_i64",
790  [(set SReg_64:$sdst, (UniformBinFrag<csra_64> (i64 SSrc_b64:$src0), (i32 SSrc_b32:$src1)))]
791>;
792} // End Defs = [SCC]
793
794let isReMaterializable = 1 in {
795def S_BFM_B32 : SOP2_32 <"s_bfm_b32",
796  [(set i32:$sdst, (UniformBinFrag<AMDGPUbfm> i32:$src0, i32:$src1))]>;
797def S_BFM_B64 : SOP2_64_32_32 <"s_bfm_b64">;
798
799def S_MUL_I32 : SOP2_32 <"s_mul_i32",
800  [(set i32:$sdst, (UniformBinFrag<mul> i32:$src0, i32:$src1))]> {
801  let isCommutable = 1;
802}
803} // End isReMaterializable = 1
804} // End AddedComplexity = 1
805
806let Defs = [SCC] in {
807def S_BFE_U32 : SOP2_32 <"s_bfe_u32">;
808def S_BFE_I32 : SOP2_32 <"s_bfe_i32">;
809def S_BFE_U64 : SOP2_64_32 <"s_bfe_u64">;
810def S_BFE_I64 : SOP2_64_32 <"s_bfe_i64">;
811} // End Defs = [SCC]
812
813def S_CBRANCH_G_FORK : SOP2_Pseudo <
814  "s_cbranch_g_fork", (outs),
815  (ins SCSrc_b64:$src0, SCSrc_b64:$src1),
816  "$src0, $src1"
817> {
818  let has_sdst = 0;
819  let SubtargetPredicate = isGFX6GFX7GFX8GFX9;
820}
821
822let Defs = [SCC] in {
823def S_ABSDIFF_I32 : SOP2_32 <"s_absdiff_i32">;
824} // End Defs = [SCC]
825
826let SubtargetPredicate = isGFX8GFX9 in {
827  def S_RFE_RESTORE_B64 : SOP2_Pseudo <
828    "s_rfe_restore_b64", (outs),
829    (ins SSrc_b64:$src0, SSrc_b32:$src1),
830    "$src0, $src1"
831  > {
832    let hasSideEffects = 1;
833    let has_sdst = 0;
834  }
835}
836
837let SubtargetPredicate = isGFX9Plus in {
838  let isReMaterializable = 1 in {
839    def S_PACK_LL_B32_B16 : SOP2_32<"s_pack_ll_b32_b16">;
840    def S_PACK_LH_B32_B16 : SOP2_32<"s_pack_lh_b32_b16">;
841    def S_PACK_HH_B32_B16 : SOP2_32<"s_pack_hh_b32_b16">;
842  } // End isReMaterializable = 1
843
844  let Defs = [SCC] in {
845    def S_LSHL1_ADD_U32 : SOP2_32<"s_lshl1_add_u32",
846      [(set i32:$sdst, (shl1_add SSrc_b32:$src0, SSrc_b32:$src1))]
847    >;
848    def S_LSHL2_ADD_U32 : SOP2_32<"s_lshl2_add_u32",
849      [(set i32:$sdst, (shl2_add SSrc_b32:$src0, SSrc_b32:$src1))]
850    >;
851    def S_LSHL3_ADD_U32 : SOP2_32<"s_lshl3_add_u32",
852      [(set i32:$sdst, (shl3_add SSrc_b32:$src0, SSrc_b32:$src1))]
853    >;
854    def S_LSHL4_ADD_U32 : SOP2_32<"s_lshl4_add_u32",
855      [(set i32:$sdst, (shl4_add SSrc_b32:$src0, SSrc_b32:$src1))]
856    >;
857  } // End Defs = [SCC]
858
859  let isCommutable = 1, isReMaterializable = 1 in {
860    def S_MUL_HI_U32 : SOP2_32<"s_mul_hi_u32",
861      [(set i32:$sdst, (UniformBinFrag<mulhu> SSrc_b32:$src0, SSrc_b32:$src1))]>;
862    def S_MUL_HI_I32 : SOP2_32<"s_mul_hi_i32",
863      [(set i32:$sdst, (UniformBinFrag<mulhs> SSrc_b32:$src0, SSrc_b32:$src1))]>;
864  } // End isCommutable = 1, isReMaterializable = 1
865} // End SubtargetPredicate = isGFX9Plus
866
867let SubtargetPredicate = isGFX11Plus in {
868  def S_PACK_HL_B32_B16 : SOP2_32<"s_pack_hl_b32_b16">;
869} // End SubtargetPredicate = isGFX11Plus
870
871class SOP2_F32_Inst<string opName, SDPatternOperator Op, ValueType dstVt=f32> :
872  SOP2_F32<opName,
873    [(set dstVt:$sdst, (UniformBinFrag<Op> SSrc_f32:$src0, SSrc_f32:$src1))]>;
874
875class SOP2_F16_Inst<string opName, SDPatternOperator Op> :
876  SOP2_F16<opName,
877    [(set f16:$sdst, (UniformBinFrag<Op> SSrc_f16:$src0, SSrc_f16:$src1))]>;
878
879let SubtargetPredicate = HasSALUFloatInsts, mayRaiseFPException = 1,
880    Uses = [MODE], SchedRW = [WriteSFPU] in {
881  let isReMaterializable = 1 in {
882    let isCommutable = 1 in {
883      def S_ADD_F32 : SOP2_F32_Inst<"s_add_f32", any_fadd>;
884      def S_MIN_F32 : SOP2_F32_Inst<"s_min_f32", fminnum_like>;
885      def S_MAX_F32 : SOP2_F32_Inst<"s_max_f32", fmaxnum_like>;
886      def S_MUL_F32 : SOP2_F32_Inst<"s_mul_f32", any_fmul>;
887
888      let FixedSize = 1 in
889      def S_FMAAK_F32 : SOP2_Pseudo<
890        "s_fmaak_f32", (outs SReg_32:$sdst),
891        (ins SSrc_f32_Deferred:$src0, SSrc_f32_Deferred:$src1, KImmFP32:$imm),
892        "$sdst, $src0, $src1, $imm"
893      >;
894
895      let FPDPRounding = 1 in {
896        def S_ADD_F16 : SOP2_F16_Inst<"s_add_f16", any_fadd>;
897        def S_MUL_F16 : SOP2_F16_Inst<"s_mul_f16", any_fmul>;
898      } // End FPDPRounding
899
900      def S_MIN_F16 : SOP2_F16_Inst<"s_min_f16", fminnum_like>;
901      def S_MAX_F16 : SOP2_F16_Inst<"s_max_f16", fmaxnum_like>;
902    } // End isCommutable = 1
903
904    let FPDPRounding = 1 in
905      def S_SUB_F16 : SOP2_F16_Inst<"s_sub_f16", any_fsub>;
906
907    def S_SUB_F32            : SOP2_F32_Inst<"s_sub_f32", any_fsub>;
908    def S_CVT_PK_RTZ_F16_F32 : SOP2_F32_Inst<"s_cvt_pk_rtz_f16_f32",
909                                             AMDGPUpkrtz_f16_f32, v2f16>;
910
911    let FixedSize = 1 in
912    def S_FMAMK_F32 : SOP2_Pseudo<
913      "s_fmamk_f32", (outs SReg_32:$sdst),
914      (ins SSrc_f32_Deferred:$src0, KImmFP32:$imm, SSrc_f32_Deferred:$src1),
915      "$sdst, $src0, $imm, $src1"
916    >;
917  } // End isReMaterializable = 1
918
919  let Constraints = "$sdst = $src2", DisableEncoding="$src2",
920      isCommutable = 1, AddedComplexity = 20 in {
921    def S_FMAC_F32 : SOP2_Pseudo<
922      "s_fmac_f32", (outs SReg_32:$sdst),
923      (ins SSrc_f32:$src0, SSrc_f32:$src1, SReg_32:$src2),
924      "$sdst, $src0, $src1",
925      [(set f32:$sdst, (UniformTernaryFrag<any_fma> SSrc_f32:$src0, SSrc_f32:$src1, SReg_32:$src2))]
926    >;
927
928    def S_FMAC_F16 : SOP2_Pseudo<
929      "s_fmac_f16", (outs SReg_32:$sdst),
930      (ins SSrc_f16:$src0, SSrc_f16:$src1, SReg_32:$src2),
931      "$sdst, $src0, $src1",
932      [(set f16:$sdst, (UniformTernaryFrag<any_fma> SSrc_f16:$src0, SSrc_f16:$src1, SReg_32:$src2))]
933    >;
934  } // End Constraints = "$sdst = $src2", DisableEncoding="$src2",
935    // isCommutable = 1, AddedComplexity = 20
936} // End SubtargetPredicate = HasSALUFloatInsts, mayRaiseFPException = 1,
937  // Uses = [MODE], SchedRW = [WriteSFPU]
938
939// On GFX12 MIN/MAX instructions do not read MODE register.
940let SubtargetPredicate = isGFX12Plus, mayRaiseFPException = 1, isCommutable = 1,
941    isReMaterializable = 1, SchedRW = [WriteSFPU], AddedComplexity = 17 in {
942  def S_MINIMUM_F32 : SOP2_F32_Inst<"s_minimum_f32", fminimum>;
943  def S_MAXIMUM_F32 : SOP2_F32_Inst<"s_maximum_f32", fmaximum>;
944  def S_MINIMUM_F16 : SOP2_F16_Inst<"s_minimum_f16", fminimum>;
945  def S_MAXIMUM_F16 : SOP2_F16_Inst<"s_maximum_f16", fmaximum>;
946}
947
948//===----------------------------------------------------------------------===//
949// SOPK Instructions
950//===----------------------------------------------------------------------===//
951
952class SOPK_Pseudo <string opName, dag outs, dag ins,
953                   string asmOps, list<dag> pattern=[]> :
954  SOP_Pseudo<opName, outs, ins, " " # asmOps, pattern> {
955  let mayLoad = 0;
956  let mayStore = 0;
957  let hasSideEffects = 0;
958  let SALU = 1;
959  let SOPK = 1;
960  let FixedSize = 1;
961  let SchedRW = [WriteSALU];
962  let UseNamedOperandTable = 1;
963
964  let has_sdst = 1;
965}
966
967class SOPK_Real<SOPK_Pseudo ps, string name = ps.Mnemonic> :
968  InstSI <ps.OutOperandList, ps.InOperandList,
969          name # ps.AsmOperands> {
970  let SALU = 1;
971  let SOPK = 1;
972  let isPseudo = 0;
973  let isCodeGenOnly = 0;
974  let UseNamedOperandTable = 1;
975
976  // copy relevant pseudo op flags
977  let SubtargetPredicate = ps.SubtargetPredicate;
978  let AsmMatchConverter  = ps.AsmMatchConverter;
979  let DisableEncoding    = ps.DisableEncoding;
980  let Constraints        = ps.Constraints;
981  let SchedRW            = ps.SchedRW;
982  let mayLoad            = ps.mayLoad;
983  let mayStore           = ps.mayStore;
984  let isBranch           = ps.isBranch;
985  let isCall             = ps.isCall;
986  let isTerminator       = ps.isTerminator;
987  let isReturn           = ps.isReturn;
988  let isBarrier          = ps.isBarrier;
989  let Uses               = ps.Uses;
990  let Defs               = ps.Defs;
991  let isConvergent       = ps.isConvergent;
992
993  // encoding
994  bits<7>  sdst;
995  bits<16> simm16;
996  bits<32> imm;
997}
998
999class SOPK_Real32<bits<5> op, SOPK_Pseudo ps, string name = ps.Mnemonic> :
1000  SOPK_Real <ps, name>,
1001  Enc32 {
1002  let Inst{15-0}  = simm16;
1003  let Inst{22-16} = !if(ps.has_sdst, sdst, ?);
1004  let Inst{27-23} = op;
1005  let Inst{31-28} = 0xb; //encoding
1006}
1007
1008class SOPK_Real64<bits<5> op, SOPK_Pseudo ps> :
1009  SOPK_Real<ps>,
1010  Enc64 {
1011  let Inst{15-0}  = simm16;
1012  let Inst{22-16} = !if(ps.has_sdst, sdst, ?);
1013  let Inst{27-23} = op;
1014  let Inst{31-28} = 0xb; //encoding
1015  let Inst{63-32} = imm;
1016}
1017
1018class SOPKInstTable <bit is_sopk, string cmpOp = ""> {
1019  bit IsSOPK = is_sopk;
1020  string BaseCmpOp = cmpOp;
1021}
1022
1023class SOPK_32 <string opName, list<dag> pattern=[]> : SOPK_Pseudo <
1024  opName,
1025  (outs SReg_32:$sdst),
1026  (ins s16imm:$simm16),
1027  "$sdst, $simm16",
1028  pattern>;
1029
1030class SOPK_32_BR <string opName, list<dag> pattern=[]> : SOPK_Pseudo <
1031  opName,
1032  (outs),
1033  (ins SOPPBrTarget:$simm16, SReg_32:$sdst),
1034  "$sdst, $simm16",
1035  pattern> {
1036  let Defs = [EXEC];
1037  let Uses = [EXEC];
1038  let isBranch = 1;
1039  let isTerminator = 1;
1040  let SchedRW = [WriteBranch];
1041}
1042
1043class SOPK_SCC <string opName, string base_op, bit isSignExt> : SOPK_Pseudo <
1044  opName,
1045  (outs),
1046  !if(isSignExt,
1047      (ins SReg_32:$sdst, s16imm:$simm16),
1048      (ins SReg_32:$sdst, u16imm:$simm16)),
1049  "$sdst, $simm16">,
1050  SOPKInstTable<1, base_op>{
1051  let Defs = [SCC];
1052}
1053
1054class SOPK_32TIE <string opName, list<dag> pattern=[]> : SOPK_Pseudo <
1055  opName,
1056  (outs SReg_32:$sdst),
1057  (ins SReg_32:$src0, s16imm:$simm16),
1058  "$sdst, $simm16",
1059  pattern
1060>;
1061
1062let isReMaterializable = 1, isMoveImm = 1 in {
1063def S_MOVK_I32 : SOPK_32 <"s_movk_i32">;
1064} // End isReMaterializable = 1
1065let Uses = [SCC] in {
1066def S_CMOVK_I32 : SOPK_32 <"s_cmovk_i32">;
1067}
1068
1069let isCompare = 1 in {
1070
1071// This instruction is disabled for now until we can figure out how to teach
1072// the instruction selector to correctly use the  S_CMP* vs V_CMP*
1073// instructions.
1074//
1075// When this instruction is enabled the code generator sometimes produces this
1076// invalid sequence:
1077//
1078// SCC = S_CMPK_EQ_I32 SGPR0, imm
1079// VCC = COPY SCC
1080// VGPR0 = V_CNDMASK VCC, VGPR0, VGPR1
1081//
1082// def S_CMPK_EQ_I32 : SOPK_SCC <"s_cmpk_eq_i32",
1083//   [(set i1:$dst, (setcc i32:$src0, imm:$src1, SETEQ))]
1084// >;
1085
1086def S_CMPK_EQ_I32 : SOPK_SCC <"s_cmpk_eq_i32", "s_cmp_eq_i32", 1>;
1087def S_CMPK_LG_I32 : SOPK_SCC <"s_cmpk_lg_i32", "s_cmp_lg_i32", 1>;
1088def S_CMPK_GT_I32 : SOPK_SCC <"s_cmpk_gt_i32", "s_cmp_gt_i32", 1>;
1089def S_CMPK_GE_I32 : SOPK_SCC <"s_cmpk_ge_i32", "s_cmp_ge_i32", 1>;
1090def S_CMPK_LT_I32 : SOPK_SCC <"s_cmpk_lt_i32", "s_cmp_lt_i32", 1>;
1091def S_CMPK_LE_I32 : SOPK_SCC <"s_cmpk_le_i32", "s_cmp_le_i32", 1>;
1092
1093def S_CMPK_EQ_U32 : SOPK_SCC <"s_cmpk_eq_u32", "s_cmp_eq_u32", 0>;
1094def S_CMPK_LG_U32 : SOPK_SCC <"s_cmpk_lg_u32", "s_cmp_lg_u32", 0>;
1095def S_CMPK_GT_U32 : SOPK_SCC <"s_cmpk_gt_u32", "s_cmp_gt_u32", 0>;
1096def S_CMPK_GE_U32 : SOPK_SCC <"s_cmpk_ge_u32", "s_cmp_ge_u32", 0>;
1097def S_CMPK_LT_U32 : SOPK_SCC <"s_cmpk_lt_u32", "s_cmp_lt_u32", 0>;
1098def S_CMPK_LE_U32 : SOPK_SCC <"s_cmpk_le_u32", "s_cmp_le_u32", 0>;
1099} // End isCompare = 1
1100
1101let isCommutable = 1, DisableEncoding = "$src0",
1102    Constraints = "$sdst = $src0" in {
1103  let Defs = [SCC] in
1104    def S_ADDK_I32 : SOPK_32TIE <"s_addk_i32">;
1105  def S_MULK_I32 : SOPK_32TIE <"s_mulk_i32">;
1106}
1107
1108let SubtargetPredicate = isGFX6GFX7GFX8GFX9 in
1109def S_CBRANCH_I_FORK : SOPK_Pseudo <
1110  "s_cbranch_i_fork",
1111  (outs), (ins SReg_64:$sdst, SOPPBrTarget:$simm16),
1112  "$sdst, $simm16"
1113>;
1114
1115// This is hasSideEffects to allow its use in readcyclecounter selection.
1116// FIXME: Need to truncate immediate to 16-bits.
1117// FIXME: Should have separate pseudos for known may read MODE and
1118// only read MODE.
1119def S_GETREG_B32 : SOPK_Pseudo <
1120  "s_getreg_b32",
1121  (outs SReg_32:$sdst), (ins hwreg:$simm16),
1122  "$sdst, $simm16",
1123  [(set i32:$sdst, (int_amdgcn_s_getreg (i32 timm:$simm16)))]> {
1124  let hasSideEffects = 1;
1125  let Uses = [MODE];
1126}
1127
1128let Defs = [MODE], Uses = [MODE] in {
1129
1130// FIXME: Need to truncate immediate to 16-bits.
1131class S_SETREG_B32_Pseudo <list<dag> pattern=[]> : SOPK_Pseudo <
1132  "s_setreg_b32",
1133  (outs), (ins SReg_32:$sdst, hwreg:$simm16),
1134  "$simm16, $sdst",
1135  pattern>;
1136
1137def S_SETREG_B32 : S_SETREG_B32_Pseudo <
1138  [(int_amdgcn_s_setreg (i32 SIMM16bit:$simm16), i32:$sdst)]> {
1139  // Use custom inserter to optimize some cases to
1140  // S_DENORM_MODE/S_ROUND_MODE/S_SETREG_B32_mode.
1141  let usesCustomInserter = 1;
1142  let hasSideEffects = 1;
1143}
1144
1145// Variant of SETREG that is guaranteed to only touch FP bits in the MODE
1146// register, so doesn't have unmodeled side effects.
1147def S_SETREG_B32_mode : S_SETREG_B32_Pseudo {
1148  let hasSideEffects = 0;
1149}
1150
1151// FIXME: Not on SI?
1152//def S_GETREG_REGRD_B32 : SOPK_32 <sopk<0x14, 0x13>, "s_getreg_regrd_b32">;
1153
1154class S_SETREG_IMM32_B32_Pseudo : SOPK_Pseudo <
1155  "s_setreg_imm32_b32",
1156  (outs), (ins i32imm:$imm, hwreg:$simm16),
1157  "$simm16, $imm"> {
1158  let Size = 8; // Unlike every other SOPK instruction.
1159  let has_sdst = 0;
1160}
1161
1162def S_SETREG_IMM32_B32 : S_SETREG_IMM32_B32_Pseudo {
1163  let hasSideEffects = 1;
1164}
1165
1166// Variant of SETREG_IMM32 that is guaranteed to only touch FP bits in the MODE
1167// register, so doesn't have unmodeled side effects.
1168def S_SETREG_IMM32_B32_mode : S_SETREG_IMM32_B32_Pseudo {
1169  let hasSideEffects = 0;
1170}
1171
1172} // End Defs = [MODE], Uses = [MODE]
1173
1174class SOPK_WAITCNT<string opName, list<dag> pat=[]> :
1175    SOPK_Pseudo<
1176        opName,
1177        (outs),
1178        (ins SReg_32:$sdst, s16imm:$simm16),
1179        "$sdst, $simm16",
1180        pat> {
1181  let hasSideEffects = 1;
1182  let mayLoad = 1;
1183  let mayStore = 1;
1184  let has_sdst = 1; // First source takes place of sdst in encoding
1185}
1186
1187let SubtargetPredicate = isGFX9Plus in {
1188  def S_CALL_B64 : SOPK_Pseudo<
1189      "s_call_b64",
1190      (outs SReg_64:$sdst),
1191      (ins SOPPBrTarget:$simm16),
1192      "$sdst, $simm16"> {
1193    let isCall = 1;
1194  }
1195} // End SubtargetPredicate = isGFX9Plus
1196
1197def VersionImm : S16ImmOperand {
1198  let DecoderMethod = "decodeVersionImm";
1199}
1200
1201let SubtargetPredicate = isGFX10Plus in {
1202  def S_VERSION : SOPK_Pseudo<
1203      "s_version",
1204      (outs),
1205      (ins VersionImm:$simm16),
1206      "$simm16"> {
1207    let has_sdst = 0;
1208  }
1209} // End SubtargetPredicate = isGFX10Plus
1210
1211let SubtargetPredicate = isGFX10GFX11 in {
1212  def S_SUBVECTOR_LOOP_BEGIN : SOPK_32_BR<"s_subvector_loop_begin">;
1213  def S_SUBVECTOR_LOOP_END   : SOPK_32_BR<"s_subvector_loop_end">;
1214
1215  def S_WAITCNT_VSCNT   : SOPK_WAITCNT<"s_waitcnt_vscnt">;
1216  def S_WAITCNT_VMCNT   : SOPK_WAITCNT<"s_waitcnt_vmcnt">;
1217  def S_WAITCNT_EXPCNT  : SOPK_WAITCNT<"s_waitcnt_expcnt">;
1218  def S_WAITCNT_LGKMCNT : SOPK_WAITCNT<"s_waitcnt_lgkmcnt">;
1219} // End SubtargetPredicate = isGFX10GFX11
1220
1221//===----------------------------------------------------------------------===//
1222// SOPC Instructions
1223//===----------------------------------------------------------------------===//
1224
1225class SOPC_Pseudo<string opName, dag outs, dag ins,
1226                  string asmOps, list<dag> pattern=[]> :
1227  SOP_Pseudo<opName, outs, ins, " " # asmOps, pattern> {
1228  let mayLoad = 0;
1229  let mayStore = 0;
1230  let hasSideEffects = 0;
1231  let SALU = 1;
1232  let SOPC = 1;
1233  let Defs = [SCC];
1234  let SchedRW = [WriteSALU];
1235  let UseNamedOperandTable = 1;
1236}
1237
1238class SOPC_Real<bits<7> op, SOPC_Pseudo ps> :
1239  InstSI <ps.OutOperandList, ps.InOperandList,
1240          ps.Mnemonic # ps.AsmOperands>,
1241  Enc32 {
1242  let SALU = 1;
1243  let SOPC = 1;
1244  let isPseudo = 0;
1245  let isCodeGenOnly = 0;
1246
1247  // copy relevant pseudo op flags
1248  let SubtargetPredicate   = ps.SubtargetPredicate;
1249  let OtherPredicates      = ps.OtherPredicates;
1250  let AsmMatchConverter    = ps.AsmMatchConverter;
1251  let UseNamedOperandTable = ps.UseNamedOperandTable;
1252  let TSFlags              = ps.TSFlags;
1253  let SchedRW              = ps.SchedRW;
1254  let mayLoad              = ps.mayLoad;
1255  let mayStore             = ps.mayStore;
1256  let Uses                 = ps.Uses;
1257  let Defs                 = ps.Defs;
1258  let isConvergent         = ps.isConvergent;
1259
1260  // encoding
1261  bits<8> src0;
1262  bits<8> src1;
1263
1264  let Inst{7-0} = src0;
1265  let Inst{15-8} = src1;
1266  let Inst{22-16} = op;
1267  let Inst{31-23} = 0x17e;
1268}
1269
1270class SOPC_Base <RegisterOperand rc0, RegisterOperand rc1,
1271                 string opName, list<dag> pattern = []> : SOPC_Pseudo <
1272  opName, (outs), (ins rc0:$src0, rc1:$src1),
1273  "$src0, $src1", pattern > {
1274}
1275
1276class SOPC_Helper <RegisterOperand rc, ValueType vt,
1277                    string opName, SDPatternOperator cond> : SOPC_Base <
1278  rc, rc, opName,
1279  [(set SCC, (UniformTernaryFrag<setcc> vt:$src0, vt:$src1, cond))] > {
1280}
1281
1282class SOPC_CMP_32<string opName,
1283                  SDPatternOperator cond = COND_NULL, string revOp = opName>
1284  : SOPC_Helper<SSrc_b32, i32, opName, cond>,
1285    Commutable_REV<revOp, !eq(revOp, opName)>,
1286    SOPKInstTable<0, opName> {
1287  let isCompare = 1;
1288  let isCommutable = 1;
1289}
1290
1291class SOPC_CMP_F32<string opName,
1292                  SDPatternOperator cond = COND_NULL, string revOp = opName>
1293  : SOPC_Helper<SSrc_b32, f32, opName, cond>,
1294    Commutable_REV<revOp, !eq(revOp, opName)>,
1295    SOPKInstTable<0, opName> {
1296  let isCompare = 1;
1297  let isCommutable = 1;
1298  let mayRaiseFPException = 1;
1299  let Uses = [MODE];
1300  let SchedRW = [WriteSFPU];
1301}
1302
1303class SOPC_CMP_F16<string opName,
1304                  SDPatternOperator cond = COND_NULL, string revOp = opName>
1305  : SOPC_Helper<SSrc_b16, f16, opName, cond>,
1306    Commutable_REV<revOp, !eq(revOp, opName)>,
1307    SOPKInstTable<0, opName> {
1308  let isCompare = 1;
1309  let isCommutable = 1;
1310  let mayRaiseFPException = 1;
1311  let Uses = [MODE];
1312  let SchedRW = [WriteSFPU];
1313}
1314
1315class SOPC_CMP_64<string opName,
1316                  SDPatternOperator cond = COND_NULL, string revOp = opName>
1317  : SOPC_Helper<SSrc_b64, i64, opName, cond>,
1318    Commutable_REV<revOp, !eq(revOp, opName)> {
1319  let isCompare = 1;
1320  let isCommutable = 1;
1321}
1322
1323class SOPC_32<string opName, list<dag> pattern = []>
1324  : SOPC_Base<SSrc_b32, SSrc_b32, opName, pattern>;
1325
1326class SOPC_64_32<string opName, list<dag> pattern = []>
1327  : SOPC_Base<SSrc_b64, SSrc_b32, opName, pattern>;
1328
1329def S_CMP_EQ_I32 : SOPC_CMP_32 <"s_cmp_eq_i32">;
1330def S_CMP_LG_I32 : SOPC_CMP_32 <"s_cmp_lg_i32">;
1331def S_CMP_GT_I32 : SOPC_CMP_32 <"s_cmp_gt_i32", COND_SGT>;
1332def S_CMP_GE_I32 : SOPC_CMP_32 <"s_cmp_ge_i32", COND_SGE>;
1333def S_CMP_LT_I32 : SOPC_CMP_32 <"s_cmp_lt_i32", COND_SLT, "s_cmp_gt_i32">;
1334def S_CMP_LE_I32 : SOPC_CMP_32 <"s_cmp_le_i32", COND_SLE, "s_cmp_ge_i32">;
1335def S_CMP_EQ_U32 : SOPC_CMP_32 <"s_cmp_eq_u32", COND_EQ>;
1336def S_CMP_LG_U32 : SOPC_CMP_32 <"s_cmp_lg_u32", COND_NE>;
1337def S_CMP_GT_U32 : SOPC_CMP_32 <"s_cmp_gt_u32", COND_UGT>;
1338def S_CMP_GE_U32 : SOPC_CMP_32 <"s_cmp_ge_u32", COND_UGE>;
1339def S_CMP_LT_U32 : SOPC_CMP_32 <"s_cmp_lt_u32", COND_ULT, "s_cmp_gt_u32">;
1340def S_CMP_LE_U32 : SOPC_CMP_32 <"s_cmp_le_u32", COND_ULE, "s_cmp_ge_u32">;
1341
1342def S_BITCMP0_B32 : SOPC_32 <"s_bitcmp0_b32">;
1343def S_BITCMP1_B32 : SOPC_32 <"s_bitcmp1_b32">;
1344def S_BITCMP0_B64 : SOPC_64_32 <"s_bitcmp0_b64">;
1345def S_BITCMP1_B64 : SOPC_64_32 <"s_bitcmp1_b64">;
1346let SubtargetPredicate = isGFX6GFX7GFX8GFX9 in
1347def S_SETVSKIP : SOPC_32 <"s_setvskip">;
1348
1349let SubtargetPredicate = isGFX8Plus in {
1350def S_CMP_EQ_U64 : SOPC_CMP_64 <"s_cmp_eq_u64", COND_EQ>;
1351def S_CMP_LG_U64 : SOPC_CMP_64 <"s_cmp_lg_u64", COND_NE>;
1352} // End SubtargetPredicate = isGFX8Plus
1353
1354let SubtargetPredicate = HasVGPRIndexMode in {
1355// Setting the GPR index mode is really writing the fields in the mode
1356// register. We don't want to add mode register uses to every
1357// instruction, and it's too complicated to deal with anyway. This is
1358// modeled just as a side effect.
1359def S_SET_GPR_IDX_ON : SOPC_Pseudo <
1360  "s_set_gpr_idx_on" ,
1361  (outs),
1362  (ins SSrc_b32:$src0, GPRIdxMode:$src1),
1363  "$src0, $src1"> {
1364  let Defs = [M0, MODE]; // No scc def
1365  let Uses = [M0, MODE]; // Other bits of mode, m0 unmodified.
1366  let hasSideEffects = 1; // Sets mode.gpr_idx_en
1367  let FixedSize = 1;
1368}
1369}
1370
1371let SubtargetPredicate = HasSALUFloatInsts in {
1372
1373def S_CMP_LT_F32  : SOPC_CMP_F32<"s_cmp_lt_f32", COND_OLT, "s_cmp_gt_f32">;
1374def S_CMP_EQ_F32  : SOPC_CMP_F32<"s_cmp_eq_f32", COND_OEQ>;
1375def S_CMP_LE_F32  : SOPC_CMP_F32<"s_cmp_le_f32", COND_OLE, "s_cmp_ge_f32">;
1376def S_CMP_GT_F32  : SOPC_CMP_F32<"s_cmp_gt_f32", COND_OGT>;
1377def S_CMP_LG_F32  : SOPC_CMP_F32<"s_cmp_lg_f32", COND_ONE>;
1378def S_CMP_GE_F32  : SOPC_CMP_F32<"s_cmp_ge_f32", COND_OGE>;
1379def S_CMP_O_F32   : SOPC_CMP_F32<"s_cmp_o_f32", COND_O>;
1380def S_CMP_U_F32   : SOPC_CMP_F32<"s_cmp_u_f32", COND_UO>;
1381def S_CMP_NGE_F32 : SOPC_CMP_F32<"s_cmp_nge_f32", COND_ULT, "s_cmp_nle_f32">;
1382def S_CMP_NLG_F32 : SOPC_CMP_F32<"s_cmp_nlg_f32", COND_UEQ>;
1383def S_CMP_NGT_F32 : SOPC_CMP_F32<"s_cmp_ngt_f32", COND_ULE, "s_cmp_nlt_f32">;
1384def S_CMP_NLE_F32 : SOPC_CMP_F32<"s_cmp_nle_f32", COND_UGT>;
1385def S_CMP_NEQ_F32 : SOPC_CMP_F32<"s_cmp_neq_f32", COND_UNE>;
1386def S_CMP_NLT_F32 : SOPC_CMP_F32<"s_cmp_nlt_f32", COND_UGE>;
1387
1388def S_CMP_LT_F16  : SOPC_CMP_F16<"s_cmp_lt_f16", COND_OLT, "s_cmp_gt_f16">;
1389def S_CMP_EQ_F16  : SOPC_CMP_F16<"s_cmp_eq_f16", COND_OEQ>;
1390def S_CMP_LE_F16  : SOPC_CMP_F16<"s_cmp_le_f16", COND_OLE, "s_cmp_ge_f16">;
1391def S_CMP_GT_F16  : SOPC_CMP_F16<"s_cmp_gt_f16", COND_OGT>;
1392def S_CMP_LG_F16  : SOPC_CMP_F16<"s_cmp_lg_f16", COND_ONE>;
1393def S_CMP_GE_F16  : SOPC_CMP_F16<"s_cmp_ge_f16", COND_OGE>;
1394def S_CMP_O_F16   : SOPC_CMP_F16<"s_cmp_o_f16", COND_O>;
1395def S_CMP_U_F16   : SOPC_CMP_F16<"s_cmp_u_f16", COND_UO>;
1396def S_CMP_NGE_F16 : SOPC_CMP_F16<"s_cmp_nge_f16", COND_ULT, "s_cmp_nle_f16">;
1397def S_CMP_NLG_F16 : SOPC_CMP_F16<"s_cmp_nlg_f16", COND_UEQ>;
1398def S_CMP_NGT_F16 : SOPC_CMP_F16<"s_cmp_ngt_f16", COND_ULE, "s_cmp_nlt_f16">;
1399def S_CMP_NLE_F16 : SOPC_CMP_F16<"s_cmp_nle_f16", COND_UGT>;
1400def S_CMP_NEQ_F16 : SOPC_CMP_F16<"s_cmp_neq_f16", COND_UNE>;
1401def S_CMP_NLT_F16 : SOPC_CMP_F16<"s_cmp_nlt_f16", COND_UGE>;
1402
1403} // End SubtargetPredicate = HasSALUFloatInsts
1404
1405//===----------------------------------------------------------------------===//
1406// SOPP Instructions
1407//===----------------------------------------------------------------------===//
1408
1409class SOPP_Pseudo<string opName, dag ins,
1410                  string asmOps = "", list<dag> pattern=[],
1411                  string sep = !if(!empty(asmOps), "", " "),
1412                  string keyName = opName> :
1413  SOP_Pseudo<opName, (outs), ins, sep # asmOps, pattern> {
1414  let mayLoad = 0;
1415  let mayStore = 0;
1416  let hasSideEffects = 0;
1417  let SALU = 1;
1418  let SOPP = 1;
1419  let FixedSize = 1;
1420  let SchedRW = [WriteSALU];
1421  let UseNamedOperandTable = 1;
1422  bits <16> simm16;
1423  bits <1> fixed_imm = 0;
1424  string KeyName = keyName;
1425}
1426
1427class SOPPRelaxTable <bit isRelaxed, string keyName, string gfxip> {
1428  bit IsRelaxed = isRelaxed;
1429  string KeyName = keyName # gfxip;
1430}
1431
1432class SOPP_Real<SOPP_Pseudo ps, string name = ps.Mnemonic> :
1433  InstSI <ps.OutOperandList, ps.InOperandList,
1434          name # ps.AsmOperands> {
1435  let SALU = 1;
1436  let SOPP = 1;
1437  let isPseudo = 0;
1438  let isCodeGenOnly = 0;
1439
1440  // copy relevant pseudo op flags
1441  let SubtargetPredicate   = ps.SubtargetPredicate;
1442  let OtherPredicates      = ps.OtherPredicates;
1443  let AsmMatchConverter    = ps.AsmMatchConverter;
1444  let UseNamedOperandTable = ps.UseNamedOperandTable;
1445  let TSFlags              = ps.TSFlags;
1446  let SchedRW              = ps.SchedRW;
1447  let mayLoad              = ps.mayLoad;
1448  let mayStore             = ps.mayStore;
1449  let isTerminator         = ps.isTerminator;
1450  let isReturn             = ps.isReturn;
1451  let isCall               = ps.isCall;
1452  let isBranch             = ps.isBranch;
1453  let isBarrier            = ps.isBarrier;
1454  let Uses                 = ps.Uses;
1455  let Defs                 = ps.Defs;
1456  let isConvergent         = ps.isConvergent;
1457  bits <16> simm16;
1458}
1459
1460class SOPP_Real_32 <bits<7> op, SOPP_Pseudo ps, string name = ps.Mnemonic> : SOPP_Real<ps, name>,
1461Enc32 {
1462  let Inst{15-0} = !if(ps.fixed_imm, ps.simm16, simm16);
1463  let Inst{22-16} = op;
1464  let Inst{31-23} = 0x17f;
1465}
1466
1467class SOPP_Real_64 <bits<7> op, SOPP_Pseudo ps, string name = ps.Mnemonic> : SOPP_Real<ps, name>,
1468Enc64 {
1469  // encoding
1470  let Inst{15-0} = !if(ps.fixed_imm, ps.simm16, simm16);
1471  let Inst{22-16} = op;
1472  let Inst{31-23} = 0x17f;
1473  //effectively a nop
1474  let Inst{47-32} = 0x0;
1475  let Inst{54-48} = 0x0;
1476  let Inst{63-55} = 0x17f;
1477}
1478
1479multiclass SOPP_With_Relaxation <string opName, dag ins,
1480                  string asmOps, list<dag> pattern=[]> {
1481  def "" : SOPP_Pseudo <opName, ins, asmOps, pattern>;
1482  def _pad_s_nop : SOPP_Pseudo <opName # "_pad_s_nop", ins, asmOps, pattern, " ", opName>;
1483}
1484
1485def S_NOP : SOPP_Pseudo<"s_nop" , (ins i16imm:$simm16), "$simm16",
1486  [(int_amdgcn_s_nop timm:$simm16)]> {
1487  let hasSideEffects = 1;
1488}
1489
1490let isTerminator = 1 in {
1491def S_ENDPGM : SOPP_Pseudo<"s_endpgm", (ins Endpgm:$simm16), "$simm16", [], ""> {
1492  let isBarrier = 1;
1493  let isReturn = 1;
1494  let hasSideEffects = 1;
1495}
1496
1497def S_ENDPGM_SAVED : SOPP_Pseudo<"s_endpgm_saved", (ins)> {
1498  let SubtargetPredicate = isGFX8Plus;
1499  let simm16 = 0;
1500  let fixed_imm = 1;
1501  let isBarrier = 1;
1502  let isReturn = 1;
1503}
1504
1505let SubtargetPredicate = isGFX9GFX10GFX11 in {
1506  let isBarrier = 1, isReturn = 1, simm16 = 0, fixed_imm = 1 in {
1507    def S_ENDPGM_ORDERED_PS_DONE :
1508      SOPP_Pseudo<"s_endpgm_ordered_ps_done", (ins)>;
1509  } // End isBarrier = 1, isReturn = 1, simm16 = 0, fixed_imm = 1
1510} // End SubtargetPredicate = isGFX9GFX10GFX11
1511
1512let SubtargetPredicate = isGFX10Plus in {
1513  let isBarrier = 1, isReturn = 1, simm16 = 0, fixed_imm = 1 in {
1514    def S_CODE_END :
1515      SOPP_Pseudo<"s_code_end", (ins)>;
1516  } // End isBarrier = 1, isReturn = 1, simm16 = 0, fixed_imm = 1
1517} // End SubtargetPredicate = isGFX10Plus
1518
1519let isBranch = 1, SchedRW = [WriteBranch] in {
1520let isBarrier = 1 in {
1521defm S_BRANCH : SOPP_With_Relaxation<
1522  "s_branch" , (ins SOPPBrTarget:$simm16), "$simm16",
1523  [(br bb:$simm16)]>;
1524}
1525
1526let Uses = [SCC] in {
1527defm S_CBRANCH_SCC0 : SOPP_With_Relaxation<
1528  "s_cbranch_scc0" , (ins SOPPBrTarget:$simm16),
1529  "$simm16"
1530>;
1531defm S_CBRANCH_SCC1 : SOPP_With_Relaxation <
1532  "s_cbranch_scc1" , (ins SOPPBrTarget:$simm16),
1533  "$simm16"
1534>;
1535} // End Uses = [SCC]
1536
1537let Uses = [VCC] in {
1538defm S_CBRANCH_VCCZ : SOPP_With_Relaxation <
1539  "s_cbranch_vccz" , (ins SOPPBrTarget:$simm16),
1540  "$simm16"
1541>;
1542defm S_CBRANCH_VCCNZ : SOPP_With_Relaxation <
1543  "s_cbranch_vccnz" , (ins SOPPBrTarget:$simm16),
1544  "$simm16"
1545>;
1546} // End Uses = [VCC]
1547
1548let Uses = [EXEC] in {
1549defm S_CBRANCH_EXECZ : SOPP_With_Relaxation <
1550  "s_cbranch_execz" , (ins SOPPBrTarget:$simm16),
1551  "$simm16"
1552>;
1553defm S_CBRANCH_EXECNZ : SOPP_With_Relaxation <
1554  "s_cbranch_execnz" , (ins SOPPBrTarget:$simm16),
1555  "$simm16"
1556>;
1557} // End Uses = [EXEC]
1558
1559defm S_CBRANCH_CDBGSYS : SOPP_With_Relaxation <
1560  "s_cbranch_cdbgsys" , (ins SOPPBrTarget:$simm16),
1561  "$simm16"
1562>;
1563
1564defm S_CBRANCH_CDBGSYS_AND_USER : SOPP_With_Relaxation <
1565  "s_cbranch_cdbgsys_and_user" , (ins SOPPBrTarget:$simm16),
1566  "$simm16"
1567>;
1568
1569defm S_CBRANCH_CDBGSYS_OR_USER : SOPP_With_Relaxation <
1570  "s_cbranch_cdbgsys_or_user" , (ins SOPPBrTarget:$simm16),
1571  "$simm16"
1572>;
1573
1574defm S_CBRANCH_CDBGUSER : SOPP_With_Relaxation <
1575  "s_cbranch_cdbguser" , (ins SOPPBrTarget:$simm16),
1576  "$simm16"
1577>;
1578
1579} // End isBranch = 1
1580} // End isTerminator = 1
1581
1582let hasSideEffects = 1 in {
1583def S_BARRIER : SOPP_Pseudo <"s_barrier", (ins), "",
1584  [(int_amdgcn_s_barrier)]> {
1585  let SchedRW = [WriteBarrier];
1586  let simm16 = 0;
1587  let fixed_imm = 1;
1588  let isConvergent = 1;
1589}
1590
1591def S_BARRIER_WAIT : SOPP_Pseudo <"s_barrier_wait", (ins i16imm:$simm16), "$simm16",
1592  [(int_amdgcn_s_barrier_wait timm:$simm16)]> {
1593  let SchedRW = [WriteBarrier];
1594  let isConvergent = 1;
1595}
1596
1597def S_BARRIER_LEAVE : SOPP_Pseudo <"s_barrier_leave", (ins)> {
1598  let SchedRW = [WriteBarrier];
1599  let simm16 = 0;
1600  let fixed_imm = 1;
1601  let isConvergent = 1;
1602  let Defs = [SCC];
1603}
1604
1605def S_BARRIER_LEAVE_IMM : SOPP_Pseudo <"s_barrier_leave",
1606    (ins i16imm:$simm16), "$simm16", [(int_amdgcn_s_barrier_leave timm:$simm16)]>;
1607
1608def S_WAKEUP : SOPP_Pseudo <"s_wakeup", (ins) > {
1609  let SubtargetPredicate = isGFX8Plus;
1610  let simm16 = 0;
1611  let fixed_imm = 1;
1612  let mayLoad = 1;
1613  let mayStore = 1;
1614}
1615
1616def S_WAITCNT : SOPP_Pseudo <"s_waitcnt" , (ins SWaitCnt:$simm16), "$simm16",
1617    [(int_amdgcn_s_waitcnt timm:$simm16)]>;
1618
1619// "_soft" waitcnts are waitcnts that are either relaxed into their non-soft
1620// counterpart, or completely removed.
1621//
1622// These are inserted by SIMemoryLegalizer to resolve memory dependencies
1623// and later optimized by SIInsertWaitcnts
1624// For example, a S_WAITCNT_soft 0 can be completely removed in a function
1625// that doesn't access memory.
1626def S_WAITCNT_soft : SOPP_Pseudo <"s_soft_waitcnt" , (ins SWaitCnt:$simm16), "$simm16">;
1627def S_WAITCNT_VSCNT_soft : SOPK_WAITCNT<"s_soft_waitcnt_vscnt">;
1628let SubtargetPredicate = isGFX12Plus in {
1629  def S_WAIT_LOADCNT_soft : SOPP_Pseudo <"s_soft_wait_loadcnt", (ins s16imm:$simm16), "$simm16">;
1630  def S_WAIT_STORECNT_soft : SOPP_Pseudo <"s_soft_wait_storecnt", (ins s16imm:$simm16), "$simm16">;
1631let OtherPredicates = [HasImageInsts] in {
1632  def S_WAIT_SAMPLECNT_soft : SOPP_Pseudo <"s_soft_wait_samplecnt", (ins s16imm:$simm16), "$simm16">;
1633  def S_WAIT_BVHCNT_soft : SOPP_Pseudo <"s_soft_wait_bvhcnt", (ins s16imm:$simm16), "$simm16">;
1634} // End OtherPredicates = [HasImageInsts].
1635  def S_WAIT_DSCNT_soft : SOPP_Pseudo <"s_soft_wait_dscnt", (ins s16imm:$simm16), "$simm16">;
1636  def S_WAIT_KMCNT_soft : SOPP_Pseudo <"s_soft_wait_kmcnt", (ins s16imm:$simm16), "$simm16">;
1637}
1638
1639def S_SETHALT : SOPP_Pseudo <"s_sethalt" , (ins i32imm:$simm16), "$simm16",
1640    [(int_amdgcn_s_sethalt timm:$simm16)]>;
1641def S_SETKILL : SOPP_Pseudo <"s_setkill" , (ins i16imm:$simm16), "$simm16">;
1642
1643// On SI the documentation says sleep for approximately 64 * low 2
1644// bits, consistent with the reported maximum of 448. On VI the
1645// maximum reported is 960 cycles, so 960 / 64 = 15 max, so is the
1646// maximum really 15 on VI?
1647def S_SLEEP : SOPP_Pseudo <"s_sleep", (ins i32imm:$simm16),
1648  "$simm16", [(int_amdgcn_s_sleep timm:$simm16)]> {
1649}
1650
1651def S_SLEEP_VAR : SOP1_0_32 <"s_sleep_var", [(int_amdgcn_s_sleep_var SSrc_b32:$src0)]> {
1652  let hasSideEffects = 1;
1653}
1654
1655def S_SETPRIO : SOPP_Pseudo <"s_setprio", (ins i16imm:$simm16), "$simm16",
1656  [(int_amdgcn_s_setprio timm:$simm16)]> {
1657}
1658
1659let Uses = [EXEC, M0] in {
1660def S_SENDMSG : SOPP_Pseudo <"s_sendmsg" , (ins SendMsg:$simm16), "$simm16",
1661  [(int_amdgcn_s_sendmsg (i32 timm:$simm16), M0)]> {
1662}
1663
1664def S_SENDMSGHALT : SOPP_Pseudo <"s_sendmsghalt" , (ins SendMsg:$simm16), "$simm16",
1665  [(int_amdgcn_s_sendmsghalt (i32 timm:$simm16), M0)]> {
1666}
1667
1668} // End Uses = [EXEC, M0]
1669
1670def S_TRAP : SOPP_Pseudo <"s_trap" , (ins i16imm:$simm16), "$simm16"> {
1671  let isTrap = 1;
1672}
1673
1674def S_ICACHE_INV : SOPP_Pseudo <"s_icache_inv", (ins)> {
1675  let simm16 = 0;
1676  let fixed_imm = 1;
1677}
1678def S_INCPERFLEVEL : SOPP_Pseudo <"s_incperflevel", (ins i32imm:$simm16), "$simm16",
1679  [(int_amdgcn_s_incperflevel timm:$simm16)]> {
1680}
1681def S_DECPERFLEVEL : SOPP_Pseudo <"s_decperflevel", (ins i32imm:$simm16), "$simm16",
1682  [(int_amdgcn_s_decperflevel timm:$simm16)]> {
1683}
1684
1685let Uses = [M0] in
1686def S_TTRACEDATA : SOPP_Pseudo <"s_ttracedata", (ins), "",
1687                                [(int_amdgcn_s_ttracedata M0)]> {
1688  let simm16 = 0;
1689  let fixed_imm = 1;
1690}
1691
1692let SubtargetPredicate = HasVGPRIndexMode in {
1693def S_SET_GPR_IDX_OFF : SOPP_Pseudo<"s_set_gpr_idx_off", (ins) > {
1694  let simm16 = 0;
1695  let fixed_imm = 1;
1696  let Defs = [MODE];
1697  let Uses = [MODE];
1698}
1699}
1700} // End hasSideEffects
1701
1702let SubtargetPredicate = HasVGPRIndexMode in {
1703def S_SET_GPR_IDX_MODE : SOPP_Pseudo<"s_set_gpr_idx_mode", (ins GPRIdxMode:$simm16),
1704  "$simm16"> {
1705  let Defs = [M0, MODE];
1706  let Uses = [MODE];
1707}
1708}
1709
1710let SubtargetPredicate = isGFX10Plus in {
1711  def S_INST_PREFETCH :
1712    SOPP_Pseudo<"s_inst_prefetch", (ins s16imm:$simm16), "$simm16">;
1713  def S_CLAUSE :
1714    SOPP_Pseudo<"s_clause", (ins s16imm:$simm16), "$simm16">;
1715  def S_WAIT_IDLE :
1716    SOPP_Pseudo <"s_wait_idle", (ins)> {
1717      let simm16 = 0;
1718      let fixed_imm = 1;
1719    }
1720  def S_WAITCNT_DEPCTR :
1721    SOPP_Pseudo <"s_waitcnt_depctr" , (ins DepCtr:$simm16), "$simm16">;
1722
1723  let hasSideEffects = 0, Uses = [MODE], Defs = [MODE] in {
1724    def S_ROUND_MODE :
1725      SOPP_Pseudo<"s_round_mode", (ins s16imm:$simm16), "$simm16">;
1726    def S_DENORM_MODE :
1727      SOPP_Pseudo<"s_denorm_mode", (ins i32imm:$simm16), "$simm16",
1728      [(SIdenorm_mode (i32 timm:$simm16))]>;
1729  }
1730
1731  let hasSideEffects = 1 in
1732  def S_TTRACEDATA_IMM :
1733    SOPP_Pseudo<"s_ttracedata_imm", (ins s16imm:$simm16), "$simm16",
1734                [(int_amdgcn_s_ttracedata_imm timm:$simm16)]>;
1735} // End SubtargetPredicate = isGFX10Plus
1736
1737let SubtargetPredicate = isGFX11Plus in {
1738let OtherPredicates = [HasExportInsts] in
1739  def S_WAIT_EVENT : SOPP_Pseudo<"s_wait_event", (ins s16imm:$simm16),
1740                                 "$simm16"> {
1741                                   let hasSideEffects = 1;
1742                                 }
1743  def S_DELAY_ALU : SOPP_Pseudo<"s_delay_alu", (ins SDelayALU:$simm16),
1744                                "$simm16">;
1745} // End SubtargetPredicate = isGFX11Plus
1746
1747let SubtargetPredicate = isGFX12Plus, hasSideEffects = 1 in {
1748  def S_WAIT_LOADCNT :
1749    SOPP_Pseudo<"s_wait_loadcnt", (ins s16imm:$simm16), "$simm16",
1750                [(int_amdgcn_s_wait_loadcnt timm:$simm16)]>;
1751  def S_WAIT_LOADCNT_DSCNT :
1752    SOPP_Pseudo<"s_wait_loadcnt_dscnt", (ins s16imm:$simm16), "$simm16">;
1753  def S_WAIT_STORECNT :
1754    SOPP_Pseudo<"s_wait_storecnt", (ins s16imm:$simm16), "$simm16",
1755                [(int_amdgcn_s_wait_storecnt timm:$simm16)]>;
1756  def S_WAIT_STORECNT_DSCNT :
1757    SOPP_Pseudo<"s_wait_storecnt_dscnt", (ins s16imm:$simm16), "$simm16">;
1758let OtherPredicates = [HasImageInsts] in {
1759  def S_WAIT_SAMPLECNT :
1760    SOPP_Pseudo<"s_wait_samplecnt", (ins s16imm:$simm16), "$simm16",
1761                [(int_amdgcn_s_wait_samplecnt timm:$simm16)]>;
1762  def S_WAIT_BVHCNT :
1763    SOPP_Pseudo<"s_wait_bvhcnt", (ins s16imm:$simm16), "$simm16",
1764                [(int_amdgcn_s_wait_bvhcnt timm:$simm16)]>;
1765} // End OtherPredicates = [HasImageInsts].
1766let OtherPredicates = [HasExportInsts] in
1767  def S_WAIT_EXPCNT :
1768    SOPP_Pseudo<"s_wait_expcnt", (ins s16imm:$simm16), "$simm16",
1769                [(int_amdgcn_s_wait_expcnt timm:$simm16)]>;
1770  def S_WAIT_DSCNT :
1771    SOPP_Pseudo<"s_wait_dscnt", (ins s16imm:$simm16), "$simm16",
1772                [(int_amdgcn_s_wait_dscnt timm:$simm16)]>;
1773  def S_WAIT_KMCNT :
1774    SOPP_Pseudo<"s_wait_kmcnt", (ins s16imm:$simm16), "$simm16",
1775                [(int_amdgcn_s_wait_kmcnt timm:$simm16)]>;
1776} // End SubtargetPredicate = isGFX12Plus, hasSideEffects = 1
1777
1778//===----------------------------------------------------------------------===//
1779// SOP1 Patterns
1780//===----------------------------------------------------------------------===//
1781
1782def : GCNPat <
1783  (AMDGPUendpgm),
1784    (S_ENDPGM (i16 0))
1785>;
1786
1787def : GCNPat <
1788  (int_amdgcn_endpgm),
1789    (S_ENDPGM (i16 0))
1790>;
1791
1792def : GCNPat <
1793  (i64 (UniformUnaryFrag<ctpop> i64:$src)),
1794    (i64 (REG_SEQUENCE SReg_64,
1795     (i32 (COPY_TO_REGCLASS (S_BCNT1_I32_B64 $src), SReg_32)), sub0,
1796     (S_MOV_B32 (i32 0)), sub1))
1797>;
1798
1799def : GCNPat <
1800  (i32 (UniformBinFrag<smax> i32:$x, (i32 (ineg i32:$x)))),
1801  (S_ABS_I32 SReg_32:$x)
1802>;
1803
1804def : GCNPat <
1805  (i16 imm:$imm),
1806  (S_MOV_B32 imm:$imm)
1807>;
1808
1809// Same as a 32-bit inreg
1810def : GCNPat<
1811  (i32 (UniformUnaryFrag<sext> i16:$src)),
1812  (S_SEXT_I32_I16 $src)
1813>;
1814
1815let SubtargetPredicate = isNotGFX12Plus in
1816  def : GCNPat <(int_amdgcn_s_wait_event_export_ready), (S_WAIT_EVENT (i16 0))>;
1817let SubtargetPredicate = isGFX12Plus in
1818  def : GCNPat <(int_amdgcn_s_wait_event_export_ready), (S_WAIT_EVENT (i16 2))>;
1819
1820// The first 10 bits of the mode register are the core FP mode on all
1821// subtargets.
1822//
1823// The high bits include additional fields, intermixed with some
1824// non-floating point environment information. We extract the full
1825// register and clear non-relevant bits.
1826//
1827// EXCP_EN covers floating point exceptions, but also some other
1828// non-FP exceptions.
1829//
1830// Bits 12-18 cover the relevant exception mask on all subtargets.
1831//
1832// FIXME: Bit 18 is int_div0, should this be in the FP environment? I
1833// think the only source is v_rcp_iflag_i32.
1834//
1835// On GFX9+:
1836// Bit 23 is the additional FP16_OVFL mode.
1837//
1838// Bits 19, 20, and 21 cover non-FP exceptions and differ between
1839// gfx9/10/11, so we ignore them here.
1840
1841// TODO: Would it be cheaper to emit multiple s_getreg_b32 calls for
1842// the ranges and combine the results?
1843
1844defvar fp_round_mask = !add(!shl(1, 4), -1);
1845defvar fp_denorm_mask = !shl(!add(!shl(1, 4), -1), 4);
1846defvar dx10_clamp_mask = !shl(1, 8);
1847defvar ieee_mode_mask = !shl(1, 9);
1848
1849// Covers fp_round, fp_denorm, dx10_clamp, and IEEE bit.
1850defvar fpmode_mask =
1851  !or(fp_round_mask, fp_denorm_mask, dx10_clamp_mask, ieee_mode_mask);
1852
1853defvar fp_excp_en_mask = !shl(!add(!shl(1, 7), -1), 12);
1854defvar fp16_ovfl = !shl(1, 23);
1855defvar fpmode_mask_gfx6plus = !or(fpmode_mask, fp_excp_en_mask);
1856defvar fpmode_mask_gfx9plus = !or(fpmode_mask_gfx6plus, fp16_ovfl);
1857
1858class GetFPModePat<int fpmode_mask> : GCNPat<
1859  (i32 get_fpmode),
1860  (S_AND_B32 (i32 fpmode_mask),
1861             (S_GETREG_B32 getHwRegImm<
1862                HWREG.MODE, 0,
1863                !add(!logtwo(fpmode_mask), 1)>.ret))
1864>;
1865
1866// TODO: Might be worth moving to custom lowering so the and is
1867// exposed to demanded bits optimizations. Most users probably only
1868// care about the rounding or denorm mode bits. We also can reduce the
1869// demanded read from the getreg immediate.
1870let SubtargetPredicate = isGFX9Plus in {
1871// Last bit = FP16_OVFL
1872def : GetFPModePat<fpmode_mask_gfx9plus>;
1873}
1874
1875// Last bit = EXCP_EN.int_div0
1876let SubtargetPredicate = isNotGFX9Plus in {
1877def : GetFPModePat<fpmode_mask_gfx6plus>;
1878}
1879
1880let SubtargetPredicate = isGFX9GFX10 in
1881def : GCNPat<
1882  (int_amdgcn_pops_exiting_wave_id),
1883  (S_MOV_B32_sideeffects (i32 SRC_POPS_EXITING_WAVE_ID))
1884>;
1885
1886//===----------------------------------------------------------------------===//
1887// SOP2 Patterns
1888//===----------------------------------------------------------------------===//
1889
1890def UniformSelect : PatFrag<
1891  (ops node:$src0, node:$src1),
1892  (select SCC, $src0, $src1),
1893  [{ return !N->isDivergent(); }]
1894>;
1895
1896let AddedComplexity = 20 in {
1897  def : GCNPat<
1898    (i32 (UniformSelect i32:$src0, i32:$src1)),
1899    (S_CSELECT_B32 SSrc_b32:$src0, SSrc_b32:$src1)
1900  >;
1901
1902  // TODO: The predicate should not be necessary, but enabling this pattern for
1903  // all subtargets generates worse code in some cases.
1904  let OtherPredicates = [HasPseudoScalarTrans] in
1905  def : GCNPat<
1906    (f32 (UniformSelect f32:$src0, f32:$src1)),
1907    (S_CSELECT_B32 SSrc_b32:$src0, SSrc_b32:$src1)
1908  >;
1909}
1910
1911// V_ADD_I32_e32/S_ADD_U32 produces carry in VCC/SCC. For the vector
1912// case, the sgpr-copies pass will fix this to use the vector version.
1913def : GCNPat <
1914  (i32 (addc i32:$src0, i32:$src1)),
1915  (S_ADD_U32 $src0, $src1)
1916>;
1917
1918// FIXME: We need to use COPY_TO_REGCLASS to work-around the fact that
1919// REG_SEQUENCE patterns don't support instructions with multiple
1920// outputs.
1921def : GCNPat<
1922  (i64 (UniformUnaryFrag<zext> i16:$src)),
1923    (REG_SEQUENCE SReg_64,
1924      (i32 (COPY_TO_REGCLASS (S_AND_B32 $src, (S_MOV_B32 (i32 0xffff))), SGPR_32)), sub0,
1925      (S_MOV_B32 (i32 0)), sub1)
1926>;
1927
1928def : GCNPat <
1929  (i64 (UniformUnaryFrag<sext> i16:$src)),
1930    (REG_SEQUENCE SReg_64, (i32 (S_SEXT_I32_I16 $src)), sub0,
1931    (i32 (COPY_TO_REGCLASS (S_ASHR_I32 (i32 (S_SEXT_I32_I16 $src)), (S_MOV_B32 (i32 31))), SGPR_32)), sub1)
1932>;
1933
1934def : GCNPat<
1935  (i32 (UniformUnaryFrag<zext> i16:$src)),
1936  (S_AND_B32 (S_MOV_B32 (i32 0xffff)), $src)
1937>;
1938
1939class ScalarNot2Pat<Instruction inst, SDPatternOperator op, ValueType vt,
1940                    SDPatternOperator notnode = !if(vt.isVector, vnot, not)> : GCNPat<
1941  (UniformBinFrag<op> vt:$src0, (notnode vt:$src1)),
1942  (inst getSOPSrcForVT<vt>.ret:$src0, getSOPSrcForVT<vt>.ret:$src1)
1943>;
1944
1945// Match these for some more types
1946// TODO: i1
1947def : ScalarNot2Pat<S_ANDN2_B32, and, i16>;
1948def : ScalarNot2Pat<S_ANDN2_B32, and, v2i16>;
1949def : ScalarNot2Pat<S_ANDN2_B64, and, v4i16>;
1950def : ScalarNot2Pat<S_ANDN2_B64, and, v2i32>;
1951
1952def : ScalarNot2Pat<S_ORN2_B32, or, i16>;
1953def : ScalarNot2Pat<S_ORN2_B32, or, v2i16>;
1954def : ScalarNot2Pat<S_ORN2_B64, or, v4i16>;
1955def : ScalarNot2Pat<S_ORN2_B64, or, v2i32>;
1956
1957//===----------------------------------------------------------------------===//
1958// Target-specific instruction encodings.
1959//===----------------------------------------------------------------------===//
1960
1961class Select<GFXGen Gen, string opName> : SIMCInstr<opName, Gen.Subtarget> {
1962  Predicate AssemblerPredicate = Gen.AssemblerPredicate;
1963  string DecoderNamespace = Gen.DecoderNamespace;
1964}
1965
1966class Select_vi<string opName> : SIMCInstr<opName, SIEncodingFamily.VI> {
1967  Predicate AssemblerPredicate = isGFX8GFX9;
1968  string DecoderNamespace = "GFX8";
1969}
1970
1971class Select_gfx6_gfx7<string opName> : SIMCInstr<opName, SIEncodingFamily.SI> {
1972  Predicate AssemblerPredicate = isGFX6GFX7;
1973  string DecoderNamespace      = "GFX6GFX7";
1974}
1975
1976//===----------------------------------------------------------------------===//
1977//  SOP1 - GFX11, GFX12
1978//===----------------------------------------------------------------------===//
1979
1980multiclass SOP1_Real_gfx11<bits<8> op, string name = !tolower(NAME)> {
1981  defvar ps = !cast<SOP1_Pseudo>(NAME);
1982  def _gfx11 : SOP1_Real<op, ps, name>,
1983               Select<GFX11Gen, ps.PseudoInstr>;
1984  if !ne(ps.Mnemonic, name) then
1985    def : AMDGPUMnemonicAlias<ps.Mnemonic, name> {
1986      let AssemblerPredicate = isGFX11Only;
1987    }
1988}
1989
1990multiclass SOP1_Real_gfx12<bits<8> op, string name = !tolower(NAME)> {
1991  defvar ps = !cast<SOP1_Pseudo>(NAME);
1992  def _gfx12 : SOP1_Real<op, ps, name>,
1993               Select<GFX12Gen, ps.PseudoInstr>;
1994  if !ne(ps.Mnemonic, name) then
1995    def : AMDGPUMnemonicAlias<ps.Mnemonic, name> {
1996      let AssemblerPredicate = isGFX12Plus;
1997    }
1998}
1999
2000multiclass SOP1_M0_Real_gfx12<bits<8> op> {
2001  def _gfx12 : SOP1_Real<op, !cast<SOP1_Pseudo>(NAME)>,
2002               Select<GFX12Gen, !cast<SOP1_Pseudo>(NAME).PseudoInstr> {
2003    let Inst{7-0} = M0_gfx11plus.HWEncoding{7-0}; // Set Src0 encoding to M0
2004  }
2005}
2006
2007multiclass SOP1_IMM_Real_gfx12<bits<8> op> {
2008  defvar ps = !cast<SOP1_Pseudo>(NAME);
2009  def _gfx12 : SOP1_Real<op, ps>,
2010               Select<GFX12Gen, ps.PseudoInstr>;
2011}
2012
2013multiclass SOP1_Real_gfx11_gfx12<bits<8> op, string name = !tolower(NAME)> :
2014  SOP1_Real_gfx11<op, name>, SOP1_Real_gfx12<op, name>;
2015
2016defm S_MOV_B32                    : SOP1_Real_gfx11_gfx12<0x000>;
2017defm S_MOV_B64                    : SOP1_Real_gfx11_gfx12<0x001>;
2018defm S_CMOV_B32                   : SOP1_Real_gfx11_gfx12<0x002>;
2019defm S_CMOV_B64                   : SOP1_Real_gfx11_gfx12<0x003>;
2020defm S_BREV_B32                   : SOP1_Real_gfx11_gfx12<0x004>;
2021defm S_BREV_B64                   : SOP1_Real_gfx11_gfx12<0x005>;
2022defm S_FF1_I32_B32                : SOP1_Real_gfx11_gfx12<0x008, "s_ctz_i32_b32">;
2023defm S_FF1_I32_B64                : SOP1_Real_gfx11_gfx12<0x009, "s_ctz_i32_b64">;
2024defm S_FLBIT_I32_B32              : SOP1_Real_gfx11_gfx12<0x00a, "s_clz_i32_u32">;
2025defm S_FLBIT_I32_B64              : SOP1_Real_gfx11_gfx12<0x00b, "s_clz_i32_u64">;
2026defm S_FLBIT_I32                  : SOP1_Real_gfx11_gfx12<0x00c, "s_cls_i32">;
2027defm S_FLBIT_I32_I64              : SOP1_Real_gfx11_gfx12<0x00d, "s_cls_i32_i64">;
2028defm S_SEXT_I32_I8                : SOP1_Real_gfx11_gfx12<0x00e>;
2029defm S_SEXT_I32_I16               : SOP1_Real_gfx11_gfx12<0x00f>;
2030defm S_BITSET0_B32                : SOP1_Real_gfx11_gfx12<0x010>;
2031defm S_BITSET0_B64                : SOP1_Real_gfx11_gfx12<0x011>;
2032defm S_BITSET1_B32                : SOP1_Real_gfx11_gfx12<0x012>;
2033defm S_BITSET1_B64                : SOP1_Real_gfx11_gfx12<0x013>;
2034defm S_BITREPLICATE_B64_B32       : SOP1_Real_gfx11_gfx12<0x014>;
2035defm S_ABS_I32                    : SOP1_Real_gfx11_gfx12<0x015>;
2036defm S_BCNT0_I32_B32              : SOP1_Real_gfx11_gfx12<0x016>;
2037defm S_BCNT0_I32_B64              : SOP1_Real_gfx11_gfx12<0x017>;
2038defm S_BCNT1_I32_B32              : SOP1_Real_gfx11_gfx12<0x018>;
2039defm S_BCNT1_I32_B64              : SOP1_Real_gfx11_gfx12<0x019>;
2040defm S_QUADMASK_B32               : SOP1_Real_gfx11_gfx12<0x01a>;
2041defm S_QUADMASK_B64               : SOP1_Real_gfx11_gfx12<0x01b>;
2042defm S_WQM_B32                    : SOP1_Real_gfx11_gfx12<0x01c>;
2043defm S_WQM_B64                    : SOP1_Real_gfx11_gfx12<0x01d>;
2044defm S_NOT_B32                    : SOP1_Real_gfx11_gfx12<0x01e>;
2045defm S_NOT_B64                    : SOP1_Real_gfx11_gfx12<0x01f>;
2046defm S_AND_SAVEEXEC_B32           : SOP1_Real_gfx11_gfx12<0x020>;
2047defm S_AND_SAVEEXEC_B64           : SOP1_Real_gfx11_gfx12<0x021>;
2048defm S_OR_SAVEEXEC_B32            : SOP1_Real_gfx11_gfx12<0x022>;
2049defm S_OR_SAVEEXEC_B64            : SOP1_Real_gfx11_gfx12<0x023>;
2050defm S_XOR_SAVEEXEC_B32           : SOP1_Real_gfx11_gfx12<0x024>;
2051defm S_XOR_SAVEEXEC_B64           : SOP1_Real_gfx11_gfx12<0x025>;
2052defm S_NAND_SAVEEXEC_B32          : SOP1_Real_gfx11_gfx12<0x026>;
2053defm S_NAND_SAVEEXEC_B64          : SOP1_Real_gfx11_gfx12<0x027>;
2054defm S_NOR_SAVEEXEC_B32           : SOP1_Real_gfx11_gfx12<0x028>;
2055defm S_NOR_SAVEEXEC_B64           : SOP1_Real_gfx11_gfx12<0x029>;
2056defm S_XNOR_SAVEEXEC_B32          : SOP1_Real_gfx11_gfx12<0x02a>;
2057defm S_ANDN1_SAVEEXEC_B32         : SOP1_Real_gfx11_gfx12<0x02c, "s_and_not0_saveexec_b32">;
2058defm S_ANDN1_SAVEEXEC_B64         : SOP1_Real_gfx11_gfx12<0x02d, "s_and_not0_saveexec_b64">;
2059defm S_ORN1_SAVEEXEC_B32          : SOP1_Real_gfx11_gfx12<0x02e, "s_or_not0_saveexec_b32">;
2060defm S_ORN1_SAVEEXEC_B64          : SOP1_Real_gfx11_gfx12<0x02f, "s_or_not0_saveexec_b64">;
2061defm S_ANDN2_SAVEEXEC_B32         : SOP1_Real_gfx11_gfx12<0x030, "s_and_not1_saveexec_b32">;
2062defm S_ANDN2_SAVEEXEC_B64         : SOP1_Real_gfx11_gfx12<0x031, "s_and_not1_saveexec_b64">;
2063defm S_ORN2_SAVEEXEC_B32          : SOP1_Real_gfx11_gfx12<0x032, "s_or_not1_saveexec_b32">;
2064defm S_ORN2_SAVEEXEC_B64          : SOP1_Real_gfx11_gfx12<0x033, "s_or_not1_saveexec_b64">;
2065defm S_ANDN1_WREXEC_B32           : SOP1_Real_gfx11_gfx12<0x034, "s_and_not0_wrexec_b32">;
2066defm S_ANDN1_WREXEC_B64           : SOP1_Real_gfx11_gfx12<0x035, "s_and_not0_wrexec_b64">;
2067defm S_ANDN2_WREXEC_B32           : SOP1_Real_gfx11_gfx12<0x036, "s_and_not1_wrexec_b32">;
2068defm S_ANDN2_WREXEC_B64           : SOP1_Real_gfx11_gfx12<0x037, "s_and_not1_wrexec_b64">;
2069defm S_MOVRELS_B32                : SOP1_Real_gfx11_gfx12<0x040>;
2070defm S_MOVRELS_B64                : SOP1_Real_gfx11_gfx12<0x041>;
2071defm S_MOVRELD_B32                : SOP1_Real_gfx11_gfx12<0x042>;
2072defm S_MOVRELD_B64                : SOP1_Real_gfx11_gfx12<0x043>;
2073defm S_MOVRELSD_2_B32             : SOP1_Real_gfx11_gfx12<0x044>;
2074defm S_GETPC_B64                  : SOP1_Real_gfx11_gfx12<0x047>;
2075defm S_SETPC_B64                  : SOP1_Real_gfx11_gfx12<0x048>;
2076defm S_SWAPPC_B64                 : SOP1_Real_gfx11_gfx12<0x049>;
2077defm S_RFE_B64                    : SOP1_Real_gfx11_gfx12<0x04a>;
2078defm S_SENDMSG_RTN_B32            : SOP1_Real_gfx11_gfx12<0x04c>;
2079defm S_SENDMSG_RTN_B64            : SOP1_Real_gfx11_gfx12<0x04d>;
2080defm S_BARRIER_SIGNAL_M0          : SOP1_M0_Real_gfx12<0x04e>;
2081defm S_BARRIER_SIGNAL_ISFIRST_M0  : SOP1_M0_Real_gfx12<0x04f>;
2082defm S_GET_BARRIER_STATE_M0       : SOP1_M0_Real_gfx12<0x050>;
2083defm S_BARRIER_INIT_M0            : SOP1_M0_Real_gfx12<0x051>;
2084defm S_BARRIER_JOIN_M0            : SOP1_M0_Real_gfx12<0x052>;
2085defm S_BARRIER_SIGNAL_IMM         : SOP1_IMM_Real_gfx12<0x04e>;
2086defm S_BARRIER_SIGNAL_ISFIRST_IMM : SOP1_IMM_Real_gfx12<0x04f>;
2087defm S_GET_BARRIER_STATE_IMM      : SOP1_IMM_Real_gfx12<0x050>;
2088defm S_BARRIER_INIT_IMM           : SOP1_IMM_Real_gfx12<0x051>;
2089defm S_BARRIER_JOIN_IMM           : SOP1_IMM_Real_gfx12<0x052>;
2090defm S_SLEEP_VAR                  : SOP1_IMM_Real_gfx12<0x058>;
2091
2092//===----------------------------------------------------------------------===//
2093// SOP1 - GFX1150, GFX12
2094//===----------------------------------------------------------------------===//
2095
2096defm S_CEIL_F32          : SOP1_Real_gfx11_gfx12<0x060>;
2097defm S_FLOOR_F32         : SOP1_Real_gfx11_gfx12<0x061>;
2098defm S_TRUNC_F32         : SOP1_Real_gfx11_gfx12<0x062>;
2099defm S_RNDNE_F32         : SOP1_Real_gfx11_gfx12<0x063>;
2100defm S_CVT_F32_I32       : SOP1_Real_gfx11_gfx12<0x064>;
2101defm S_CVT_F32_U32       : SOP1_Real_gfx11_gfx12<0x065>;
2102defm S_CVT_I32_F32       : SOP1_Real_gfx11_gfx12<0x066>;
2103defm S_CVT_U32_F32       : SOP1_Real_gfx11_gfx12<0x067>;
2104defm S_CVT_F16_F32       : SOP1_Real_gfx11_gfx12<0x068>;
2105defm S_CVT_F32_F16       : SOP1_Real_gfx11_gfx12<0x069>;
2106defm S_CVT_HI_F32_F16    : SOP1_Real_gfx11_gfx12<0x06a>;
2107defm S_CEIL_F16          : SOP1_Real_gfx11_gfx12<0x06b>;
2108defm S_FLOOR_F16         : SOP1_Real_gfx11_gfx12<0x06c>;
2109defm S_TRUNC_F16         : SOP1_Real_gfx11_gfx12<0x06d>;
2110defm S_RNDNE_F16         : SOP1_Real_gfx11_gfx12<0x06e>;
2111
2112//===----------------------------------------------------------------------===//
2113// SOP1 - GFX10.
2114//===----------------------------------------------------------------------===//
2115
2116multiclass SOP1_Real_gfx10<bits<8> op> {
2117  defvar ps = !cast<SOP1_Pseudo>(NAME);
2118  def _gfx10 : SOP1_Real<op, ps>,
2119               Select<GFX10Gen, ps.PseudoInstr>;
2120}
2121
2122multiclass SOP1_Real_gfx10_gfx11_gfx12<bits<8> op> :
2123  SOP1_Real_gfx10<op>, SOP1_Real_gfx11_gfx12<op>;
2124
2125defm S_ANDN1_SAVEEXEC_B64   : SOP1_Real_gfx10<0x037>;
2126defm S_ORN1_SAVEEXEC_B64    : SOP1_Real_gfx10<0x038>;
2127defm S_ANDN1_WREXEC_B64     : SOP1_Real_gfx10<0x039>;
2128defm S_ANDN2_WREXEC_B64     : SOP1_Real_gfx10<0x03a>;
2129defm S_BITREPLICATE_B64_B32 : SOP1_Real_gfx10<0x03b>;
2130defm S_AND_SAVEEXEC_B32     : SOP1_Real_gfx10<0x03c>;
2131defm S_OR_SAVEEXEC_B32      : SOP1_Real_gfx10<0x03d>;
2132defm S_XOR_SAVEEXEC_B32     : SOP1_Real_gfx10<0x03e>;
2133defm S_ANDN2_SAVEEXEC_B32   : SOP1_Real_gfx10<0x03f>;
2134defm S_ORN2_SAVEEXEC_B32    : SOP1_Real_gfx10<0x040>;
2135defm S_NAND_SAVEEXEC_B32    : SOP1_Real_gfx10<0x041>;
2136defm S_NOR_SAVEEXEC_B32     : SOP1_Real_gfx10<0x042>;
2137defm S_XNOR_SAVEEXEC_B32    : SOP1_Real_gfx10<0x043>;
2138defm S_ANDN1_SAVEEXEC_B32   : SOP1_Real_gfx10<0x044>;
2139defm S_ORN1_SAVEEXEC_B32    : SOP1_Real_gfx10<0x045>;
2140defm S_ANDN1_WREXEC_B32     : SOP1_Real_gfx10<0x046>;
2141defm S_ANDN2_WREXEC_B32     : SOP1_Real_gfx10<0x047>;
2142defm S_MOVRELSD_2_B32       : SOP1_Real_gfx10<0x049>;
2143
2144//===----------------------------------------------------------------------===//
2145// SOP1 - GFX6, GFX7, GFX10, GFX11.
2146//===----------------------------------------------------------------------===//
2147
2148
2149multiclass SOP1_Real_gfx6_gfx7<bits<8> op> {
2150  defvar ps = !cast<SOP1_Pseudo>(NAME);
2151  def _gfx6_gfx7 : SOP1_Real<op, ps>,
2152                   Select_gfx6_gfx7<ps.PseudoInstr>;
2153}
2154
2155multiclass SOP1_Real_gfx6_gfx7_gfx10<bits<8> op> :
2156  SOP1_Real_gfx6_gfx7<op>, SOP1_Real_gfx10<op>;
2157
2158multiclass SOP1_Real_gfx6_gfx7_gfx10_gfx11_gfx12<bits<8> op> :
2159  SOP1_Real_gfx6_gfx7<op>, SOP1_Real_gfx10_gfx11_gfx12<op>;
2160
2161defm S_CBRANCH_JOIN  : SOP1_Real_gfx6_gfx7<0x032>;
2162
2163defm S_MOV_B32            : SOP1_Real_gfx6_gfx7_gfx10<0x003>;
2164defm S_MOV_B64            : SOP1_Real_gfx6_gfx7_gfx10<0x004>;
2165defm S_CMOV_B32           : SOP1_Real_gfx6_gfx7_gfx10<0x005>;
2166defm S_CMOV_B64           : SOP1_Real_gfx6_gfx7_gfx10<0x006>;
2167defm S_NOT_B32            : SOP1_Real_gfx6_gfx7_gfx10<0x007>;
2168defm S_NOT_B64            : SOP1_Real_gfx6_gfx7_gfx10<0x008>;
2169defm S_WQM_B32            : SOP1_Real_gfx6_gfx7_gfx10<0x009>;
2170defm S_WQM_B64            : SOP1_Real_gfx6_gfx7_gfx10<0x00a>;
2171defm S_BREV_B32           : SOP1_Real_gfx6_gfx7_gfx10<0x00b>;
2172defm S_BREV_B64           : SOP1_Real_gfx6_gfx7_gfx10<0x00c>;
2173defm S_BCNT0_I32_B32      : SOP1_Real_gfx6_gfx7_gfx10<0x00d>;
2174defm S_BCNT0_I32_B64      : SOP1_Real_gfx6_gfx7_gfx10<0x00e>;
2175defm S_BCNT1_I32_B32      : SOP1_Real_gfx6_gfx7_gfx10<0x00f>;
2176defm S_BCNT1_I32_B64      : SOP1_Real_gfx6_gfx7_gfx10<0x010>;
2177defm S_FF0_I32_B32        : SOP1_Real_gfx6_gfx7_gfx10<0x011>;
2178defm S_FF0_I32_B64        : SOP1_Real_gfx6_gfx7_gfx10<0x012>;
2179defm S_FF1_I32_B32        : SOP1_Real_gfx6_gfx7_gfx10<0x013>;
2180defm S_FF1_I32_B64        : SOP1_Real_gfx6_gfx7_gfx10<0x014>;
2181defm S_FLBIT_I32_B32      : SOP1_Real_gfx6_gfx7_gfx10<0x015>;
2182defm S_FLBIT_I32_B64      : SOP1_Real_gfx6_gfx7_gfx10<0x016>;
2183defm S_FLBIT_I32          : SOP1_Real_gfx6_gfx7_gfx10<0x017>;
2184defm S_FLBIT_I32_I64      : SOP1_Real_gfx6_gfx7_gfx10<0x018>;
2185defm S_SEXT_I32_I8        : SOP1_Real_gfx6_gfx7_gfx10<0x019>;
2186defm S_SEXT_I32_I16       : SOP1_Real_gfx6_gfx7_gfx10<0x01a>;
2187defm S_BITSET0_B32        : SOP1_Real_gfx6_gfx7_gfx10<0x01b>;
2188defm S_BITSET0_B64        : SOP1_Real_gfx6_gfx7_gfx10<0x01c>;
2189defm S_BITSET1_B32        : SOP1_Real_gfx6_gfx7_gfx10<0x01d>;
2190defm S_BITSET1_B64        : SOP1_Real_gfx6_gfx7_gfx10<0x01e>;
2191defm S_GETPC_B64          : SOP1_Real_gfx6_gfx7_gfx10<0x01f>;
2192defm S_SETPC_B64          : SOP1_Real_gfx6_gfx7_gfx10<0x020>;
2193defm S_SWAPPC_B64         : SOP1_Real_gfx6_gfx7_gfx10<0x021>;
2194defm S_RFE_B64            : SOP1_Real_gfx6_gfx7_gfx10<0x022>;
2195defm S_AND_SAVEEXEC_B64   : SOP1_Real_gfx6_gfx7_gfx10<0x024>;
2196defm S_OR_SAVEEXEC_B64    : SOP1_Real_gfx6_gfx7_gfx10<0x025>;
2197defm S_XOR_SAVEEXEC_B64   : SOP1_Real_gfx6_gfx7_gfx10<0x026>;
2198defm S_ANDN2_SAVEEXEC_B64 : SOP1_Real_gfx6_gfx7_gfx10<0x027>;
2199defm S_ORN2_SAVEEXEC_B64  : SOP1_Real_gfx6_gfx7_gfx10<0x028>;
2200defm S_NAND_SAVEEXEC_B64  : SOP1_Real_gfx6_gfx7_gfx10<0x029>;
2201defm S_NOR_SAVEEXEC_B64   : SOP1_Real_gfx6_gfx7_gfx10<0x02a>;
2202defm S_XNOR_SAVEEXEC_B64  : SOP1_Real_gfx6_gfx7_gfx10_gfx11_gfx12<0x02b>;
2203defm S_QUADMASK_B32       : SOP1_Real_gfx6_gfx7_gfx10<0x02c>;
2204defm S_QUADMASK_B64       : SOP1_Real_gfx6_gfx7_gfx10<0x02d>;
2205defm S_MOVRELS_B32        : SOP1_Real_gfx6_gfx7_gfx10<0x02e>;
2206defm S_MOVRELS_B64        : SOP1_Real_gfx6_gfx7_gfx10<0x02f>;
2207defm S_MOVRELD_B32        : SOP1_Real_gfx6_gfx7_gfx10<0x030>;
2208defm S_MOVRELD_B64        : SOP1_Real_gfx6_gfx7_gfx10<0x031>;
2209defm S_ABS_I32            : SOP1_Real_gfx6_gfx7_gfx10<0x034>;
2210
2211//===----------------------------------------------------------------------===//
2212// SOP2 - GFX12
2213//===----------------------------------------------------------------------===//
2214
2215multiclass SOP2_Real_gfx12<bits<7> op, string name = !tolower(NAME)> {
2216  defvar ps = !cast<SOP2_Pseudo>(NAME);
2217  def _gfx12 : SOP2_Real32<op, ps, name>,
2218               Select<GFX12Gen, ps.PseudoInstr>;
2219  if !ne(ps.Mnemonic, name) then
2220    def : AMDGPUMnemonicAlias<ps.Mnemonic, name> {
2221      let AssemblerPredicate = isGFX12Plus;
2222    }
2223}
2224
2225defm S_MINIMUM_F32 : SOP2_Real_gfx12<0x04f>;
2226defm S_MAXIMUM_F32 : SOP2_Real_gfx12<0x050>;
2227defm S_MINIMUM_F16 : SOP2_Real_gfx12<0x051>;
2228defm S_MAXIMUM_F16 : SOP2_Real_gfx12<0x052>;
2229
2230//===----------------------------------------------------------------------===//
2231// SOP2 - GFX11, GFX12.
2232//===----------------------------------------------------------------------===//
2233
2234multiclass SOP2_Real_gfx11<bits<7> op, string name = !tolower(NAME)> {
2235  defvar ps = !cast<SOP2_Pseudo>(NAME);
2236  def _gfx11 : SOP2_Real32<op, ps, name>,
2237               Select<GFX11Gen, ps.PseudoInstr>;
2238  if !ne(ps.Mnemonic, name) then
2239    def : AMDGPUMnemonicAlias<ps.Mnemonic, name> {
2240      let AssemblerPredicate = isGFX11Only;
2241    }
2242}
2243
2244multiclass SOP2_Real_gfx11_gfx12<bits<7> op, string name = !tolower(NAME)> :
2245  SOP2_Real_gfx11<op, name>, SOP2_Real_gfx12<op, name>;
2246
2247defm S_ABSDIFF_I32     : SOP2_Real_gfx11_gfx12<0x006>;
2248defm S_LSHL_B32        : SOP2_Real_gfx11_gfx12<0x008>;
2249defm S_LSHL_B64        : SOP2_Real_gfx11_gfx12<0x009>;
2250defm S_LSHR_B32        : SOP2_Real_gfx11_gfx12<0x00a>;
2251defm S_LSHR_B64        : SOP2_Real_gfx11_gfx12<0x00b>;
2252defm S_ASHR_I32        : SOP2_Real_gfx11_gfx12<0x00c>;
2253defm S_ASHR_I64        : SOP2_Real_gfx11_gfx12<0x00d>;
2254defm S_LSHL1_ADD_U32   : SOP2_Real_gfx11_gfx12<0x00e>;
2255defm S_LSHL2_ADD_U32   : SOP2_Real_gfx11_gfx12<0x00f>;
2256defm S_LSHL3_ADD_U32   : SOP2_Real_gfx11_gfx12<0x010>;
2257defm S_LSHL4_ADD_U32   : SOP2_Real_gfx11_gfx12<0x011>;
2258defm S_MIN_I32         : SOP2_Real_gfx11_gfx12<0x012>;
2259defm S_MIN_U32         : SOP2_Real_gfx11_gfx12<0x013>;
2260defm S_MAX_I32         : SOP2_Real_gfx11_gfx12<0x014>;
2261defm S_MAX_U32         : SOP2_Real_gfx11_gfx12<0x015>;
2262defm S_AND_B32         : SOP2_Real_gfx11_gfx12<0x016>;
2263defm S_AND_B64         : SOP2_Real_gfx11_gfx12<0x017>;
2264defm S_OR_B32          : SOP2_Real_gfx11_gfx12<0x018>;
2265defm S_OR_B64          : SOP2_Real_gfx11_gfx12<0x019>;
2266defm S_XOR_B32         : SOP2_Real_gfx11_gfx12<0x01a>;
2267defm S_XOR_B64         : SOP2_Real_gfx11_gfx12<0x01b>;
2268defm S_NAND_B32        : SOP2_Real_gfx11_gfx12<0x01c>;
2269defm S_NAND_B64        : SOP2_Real_gfx11_gfx12<0x01d>;
2270defm S_NOR_B32         : SOP2_Real_gfx11_gfx12<0x01e>;
2271defm S_NOR_B64         : SOP2_Real_gfx11_gfx12<0x01f>;
2272defm S_XNOR_B32        : SOP2_Real_gfx11_gfx12<0x020>;
2273defm S_XNOR_B64        : SOP2_Real_gfx11_gfx12<0x021>;
2274defm S_ANDN2_B32       : SOP2_Real_gfx11_gfx12<0x022, "s_and_not1_b32">;
2275defm S_ANDN2_B64       : SOP2_Real_gfx11_gfx12<0x023, "s_and_not1_b64">;
2276defm S_ORN2_B32        : SOP2_Real_gfx11_gfx12<0x024, "s_or_not1_b32">;
2277defm S_ORN2_B64        : SOP2_Real_gfx11_gfx12<0x025, "s_or_not1_b64">;
2278defm S_BFE_U32         : SOP2_Real_gfx11_gfx12<0x026>;
2279defm S_BFE_I32         : SOP2_Real_gfx11_gfx12<0x027>;
2280defm S_BFE_U64         : SOP2_Real_gfx11_gfx12<0x028>;
2281defm S_BFE_I64         : SOP2_Real_gfx11_gfx12<0x029>;
2282defm S_BFM_B32         : SOP2_Real_gfx11_gfx12<0x02a>;
2283defm S_BFM_B64         : SOP2_Real_gfx11_gfx12<0x02b>;
2284defm S_MUL_I32         : SOP2_Real_gfx11_gfx12<0x02c>;
2285defm S_MUL_HI_U32      : SOP2_Real_gfx11_gfx12<0x02d>;
2286defm S_MUL_HI_I32      : SOP2_Real_gfx11_gfx12<0x02e>;
2287defm S_CSELECT_B32     : SOP2_Real_gfx11_gfx12<0x030>;
2288defm S_CSELECT_B64     : SOP2_Real_gfx11_gfx12<0x031>;
2289defm S_PACK_HL_B32_B16 : SOP2_Real_gfx11_gfx12<0x035>;
2290defm S_ADD_U64         : SOP2_Real_gfx12<0x053, "s_add_nc_u64">;
2291defm S_SUB_U64         : SOP2_Real_gfx12<0x054, "s_sub_nc_u64">;
2292defm S_MUL_U64         : SOP2_Real_gfx12<0x055>;
2293
2294//===----------------------------------------------------------------------===//
2295// SOP2 - GFX1150, GFX12
2296//===----------------------------------------------------------------------===//
2297
2298multiclass SOP2_Real_FMAK_gfx12<bits<7> op> {
2299  def _gfx12 : SOP2_Real64<op, !cast<SOP2_Pseudo>(NAME)>,
2300               Select<GFX12Gen, !cast<SOP2_Pseudo>(NAME).PseudoInstr>;
2301}
2302
2303multiclass SOP2_Real_FMAK_gfx11<bits<7> op> {
2304  def _gfx11 : SOP2_Real64<op, !cast<SOP2_Pseudo>(NAME)>,
2305               Select<GFX11Gen, !cast<SOP2_Pseudo>(NAME).PseudoInstr>;
2306}
2307
2308multiclass SOP2_Real_FMAK_gfx11_gfx12<bits<7> op> :
2309  SOP2_Real_FMAK_gfx11<op>, SOP2_Real_FMAK_gfx12<op>;
2310
2311defm S_ADD_F32            : SOP2_Real_gfx11_gfx12<0x040>;
2312defm S_SUB_F32            : SOP2_Real_gfx11_gfx12<0x041>;
2313defm S_MUL_F32            : SOP2_Real_gfx11_gfx12<0x044>;
2314defm S_FMAAK_F32          : SOP2_Real_FMAK_gfx11_gfx12<0x045>;
2315defm S_FMAMK_F32          : SOP2_Real_FMAK_gfx11_gfx12<0x046>;
2316defm S_FMAC_F32           : SOP2_Real_gfx11_gfx12<0x047>;
2317defm S_CVT_PK_RTZ_F16_F32 : SOP2_Real_gfx11_gfx12<0x048>;
2318defm S_ADD_F16            : SOP2_Real_gfx11_gfx12<0x049>;
2319defm S_SUB_F16            : SOP2_Real_gfx11_gfx12<0x04a>;
2320defm S_MUL_F16            : SOP2_Real_gfx11_gfx12<0x04d>;
2321defm S_FMAC_F16           : SOP2_Real_gfx11_gfx12<0x04e>;
2322
2323//===----------------------------------------------------------------------===//
2324// SOP2 - GFX1150
2325//===----------------------------------------------------------------------===//
2326
2327multiclass SOP2_Real_gfx11_Renamed_gfx12<bits<7> op, string gfx12_name> :
2328  SOP2_Real_gfx11<op>, SOP2_Real_gfx12<op, gfx12_name>;
2329
2330defm S_MIN_F32 : SOP2_Real_gfx11_Renamed_gfx12<0x042, "s_min_num_f32">;
2331defm S_MAX_F32 : SOP2_Real_gfx11_Renamed_gfx12<0x043, "s_max_num_f32">;
2332defm S_MIN_F16 : SOP2_Real_gfx11_Renamed_gfx12<0x04b, "s_min_num_f16">;
2333defm S_MAX_F16 : SOP2_Real_gfx11_Renamed_gfx12<0x04c, "s_max_num_f16">;
2334
2335//===----------------------------------------------------------------------===//
2336// SOP2 - GFX10.
2337//===----------------------------------------------------------------------===//
2338
2339multiclass SOP2_Real_gfx10<bits<7> op> {
2340  defvar ps = !cast<SOP2_Pseudo>(NAME);
2341  def _gfx10 : SOP2_Real32<op, ps>,
2342               Select<GFX10Gen, ps.PseudoInstr>;
2343}
2344
2345multiclass SOP2_Real_gfx10_gfx11_gfx12<bits<7> op> :
2346  SOP2_Real_gfx10<op>, SOP2_Real_gfx11_gfx12<op>;
2347
2348defm S_LSHL1_ADD_U32   : SOP2_Real_gfx10<0x02e>;
2349defm S_LSHL2_ADD_U32   : SOP2_Real_gfx10<0x02f>;
2350defm S_LSHL3_ADD_U32   : SOP2_Real_gfx10<0x030>;
2351defm S_LSHL4_ADD_U32   : SOP2_Real_gfx10<0x031>;
2352defm S_PACK_LL_B32_B16 : SOP2_Real_gfx10_gfx11_gfx12<0x032>;
2353defm S_PACK_LH_B32_B16 : SOP2_Real_gfx10_gfx11_gfx12<0x033>;
2354defm S_PACK_HH_B32_B16 : SOP2_Real_gfx10_gfx11_gfx12<0x034>;
2355defm S_MUL_HI_U32      : SOP2_Real_gfx10<0x035>;
2356defm S_MUL_HI_I32      : SOP2_Real_gfx10<0x036>;
2357
2358//===----------------------------------------------------------------------===//
2359// SOP2 - GFX6, GFX7.
2360//===----------------------------------------------------------------------===//
2361
2362multiclass SOP2_Real_gfx6_gfx7<bits<7> op> {
2363  defvar ps = !cast<SOP2_Pseudo>(NAME);
2364  def _gfx6_gfx7 : SOP2_Real32<op, ps>,
2365                   Select_gfx6_gfx7<ps.PseudoInstr>;
2366}
2367
2368multiclass SOP2_Real_gfx6_gfx7_gfx10<bits<7> op> :
2369  SOP2_Real_gfx6_gfx7<op>, SOP2_Real_gfx10<op>;
2370
2371multiclass SOP2_Real_gfx6_gfx7_gfx10_gfx11_Renamed_gfx12<bits<7> op, string gfx12_name> :
2372  SOP2_Real_gfx6_gfx7<op>, SOP2_Real_gfx10<op>, SOP2_Real_gfx11<op>,
2373  SOP2_Real_gfx12<op, gfx12_name>;
2374
2375defm S_CBRANCH_G_FORK : SOP2_Real_gfx6_gfx7<0x02b>;
2376
2377defm S_ADD_U32     : SOP2_Real_gfx6_gfx7_gfx10_gfx11_Renamed_gfx12<0x000, "s_add_co_u32">;
2378defm S_SUB_U32     : SOP2_Real_gfx6_gfx7_gfx10_gfx11_Renamed_gfx12<0x001, "s_sub_co_u32">;
2379defm S_ADD_I32     : SOP2_Real_gfx6_gfx7_gfx10_gfx11_Renamed_gfx12<0x002, "s_add_co_i32">;
2380defm S_SUB_I32     : SOP2_Real_gfx6_gfx7_gfx10_gfx11_Renamed_gfx12<0x003, "s_sub_co_i32">;
2381defm S_ADDC_U32    : SOP2_Real_gfx6_gfx7_gfx10_gfx11_Renamed_gfx12<0x004, "s_add_co_ci_u32">;
2382defm S_SUBB_U32    : SOP2_Real_gfx6_gfx7_gfx10_gfx11_Renamed_gfx12<0x005, "s_sub_co_ci_u32">;
2383defm S_MIN_I32     : SOP2_Real_gfx6_gfx7_gfx10<0x006>;
2384defm S_MIN_U32     : SOP2_Real_gfx6_gfx7_gfx10<0x007>;
2385defm S_MAX_I32     : SOP2_Real_gfx6_gfx7_gfx10<0x008>;
2386defm S_MAX_U32     : SOP2_Real_gfx6_gfx7_gfx10<0x009>;
2387defm S_CSELECT_B32 : SOP2_Real_gfx6_gfx7_gfx10<0x00a>;
2388defm S_CSELECT_B64 : SOP2_Real_gfx6_gfx7_gfx10<0x00b>;
2389defm S_AND_B32     : SOP2_Real_gfx6_gfx7_gfx10<0x00e>;
2390defm S_AND_B64     : SOP2_Real_gfx6_gfx7_gfx10<0x00f>;
2391defm S_OR_B32      : SOP2_Real_gfx6_gfx7_gfx10<0x010>;
2392defm S_OR_B64      : SOP2_Real_gfx6_gfx7_gfx10<0x011>;
2393defm S_XOR_B32     : SOP2_Real_gfx6_gfx7_gfx10<0x012>;
2394defm S_XOR_B64     : SOP2_Real_gfx6_gfx7_gfx10<0x013>;
2395defm S_ANDN2_B32   : SOP2_Real_gfx6_gfx7_gfx10<0x014>;
2396defm S_ANDN2_B64   : SOP2_Real_gfx6_gfx7_gfx10<0x015>;
2397defm S_ORN2_B32    : SOP2_Real_gfx6_gfx7_gfx10<0x016>;
2398defm S_ORN2_B64    : SOP2_Real_gfx6_gfx7_gfx10<0x017>;
2399defm S_NAND_B32    : SOP2_Real_gfx6_gfx7_gfx10<0x018>;
2400defm S_NAND_B64    : SOP2_Real_gfx6_gfx7_gfx10<0x019>;
2401defm S_NOR_B32     : SOP2_Real_gfx6_gfx7_gfx10<0x01a>;
2402defm S_NOR_B64     : SOP2_Real_gfx6_gfx7_gfx10<0x01b>;
2403defm S_XNOR_B32    : SOP2_Real_gfx6_gfx7_gfx10<0x01c>;
2404defm S_XNOR_B64    : SOP2_Real_gfx6_gfx7_gfx10<0x01d>;
2405defm S_LSHL_B32    : SOP2_Real_gfx6_gfx7_gfx10<0x01e>;
2406defm S_LSHL_B64    : SOP2_Real_gfx6_gfx7_gfx10<0x01f>;
2407defm S_LSHR_B32    : SOP2_Real_gfx6_gfx7_gfx10<0x020>;
2408defm S_LSHR_B64    : SOP2_Real_gfx6_gfx7_gfx10<0x021>;
2409defm S_ASHR_I32    : SOP2_Real_gfx6_gfx7_gfx10<0x022>;
2410defm S_ASHR_I64    : SOP2_Real_gfx6_gfx7_gfx10<0x023>;
2411defm S_BFM_B32     : SOP2_Real_gfx6_gfx7_gfx10<0x024>;
2412defm S_BFM_B64     : SOP2_Real_gfx6_gfx7_gfx10<0x025>;
2413defm S_MUL_I32     : SOP2_Real_gfx6_gfx7_gfx10<0x026>;
2414defm S_BFE_U32     : SOP2_Real_gfx6_gfx7_gfx10<0x027>;
2415defm S_BFE_I32     : SOP2_Real_gfx6_gfx7_gfx10<0x028>;
2416defm S_BFE_U64     : SOP2_Real_gfx6_gfx7_gfx10<0x029>;
2417defm S_BFE_I64     : SOP2_Real_gfx6_gfx7_gfx10<0x02a>;
2418defm S_ABSDIFF_I32 : SOP2_Real_gfx6_gfx7_gfx10<0x02c>;
2419
2420//===----------------------------------------------------------------------===//
2421// SOPK - GFX11, GFX12.
2422//===----------------------------------------------------------------------===//
2423
2424multiclass SOPK_Real32_gfx12<bits<5> op, string name = !tolower(NAME)> {
2425  defvar ps = !cast<SOPK_Pseudo>(NAME);
2426  def _gfx12 : SOPK_Real32<op, ps, name>,
2427               Select<GFX12Gen, ps.PseudoInstr>;
2428  if !ne(ps.Mnemonic, name) then
2429    def : AMDGPUMnemonicAlias<ps.Mnemonic, name> {
2430      let AssemblerPredicate = isGFX12Plus;
2431    }
2432}
2433
2434multiclass SOPK_Real32_gfx11<bits<5> op> {
2435  def _gfx11 : SOPK_Real32<op, !cast<SOPK_Pseudo>(NAME)>,
2436               Select<GFX11Gen, !cast<SOPK_Pseudo>(NAME).PseudoInstr>;
2437}
2438
2439multiclass SOPK_Real64_gfx12<bits<5> op> {
2440  def _gfx12 : SOPK_Real64<op, !cast<SOPK_Pseudo>(NAME)>,
2441               Select<GFX12Gen, !cast<SOPK_Pseudo>(NAME).PseudoInstr>;
2442}
2443
2444multiclass SOPK_Real64_gfx11<bits<5> op> {
2445  def _gfx11 : SOPK_Real64<op, !cast<SOPK_Pseudo>(NAME)>,
2446               Select<GFX11Gen, !cast<SOPK_Pseudo>(NAME).PseudoInstr>;
2447}
2448
2449multiclass SOPK_Real32_gfx11_gfx12<bits<5> op> :
2450  SOPK_Real32_gfx11<op>, SOPK_Real32_gfx12<op>;
2451
2452multiclass SOPK_Real64_gfx11_gfx12<bits<5> op> :
2453  SOPK_Real64_gfx11<op>, SOPK_Real64_gfx12<op>;
2454
2455defm S_GETREG_B32           : SOPK_Real32_gfx11_gfx12<0x011>;
2456defm S_SETREG_B32           : SOPK_Real32_gfx11_gfx12<0x012>;
2457defm S_SETREG_IMM32_B32     : SOPK_Real64_gfx11_gfx12<0x013>;
2458defm S_CALL_B64             : SOPK_Real32_gfx11_gfx12<0x014>;
2459defm S_SUBVECTOR_LOOP_BEGIN : SOPK_Real32_gfx11<0x016>;
2460defm S_SUBVECTOR_LOOP_END   : SOPK_Real32_gfx11<0x017>;
2461defm S_WAITCNT_VSCNT        : SOPK_Real32_gfx11<0x018>;
2462defm S_WAITCNT_VMCNT        : SOPK_Real32_gfx11<0x019>;
2463defm S_WAITCNT_EXPCNT       : SOPK_Real32_gfx11<0x01a>;
2464defm S_WAITCNT_LGKMCNT      : SOPK_Real32_gfx11<0x01b>;
2465
2466//===----------------------------------------------------------------------===//
2467// SOPK - GFX10.
2468//===----------------------------------------------------------------------===//
2469
2470multiclass SOPK_Real32_gfx10<bits<5> op> {
2471  defvar ps = !cast<SOPK_Pseudo>(NAME);
2472  def _gfx10 : SOPK_Real32<op, ps>,
2473               Select<GFX10Gen, ps.PseudoInstr>;
2474}
2475
2476multiclass SOPK_Real64_gfx10<bits<5> op> {
2477  defvar ps = !cast<SOPK_Pseudo>(NAME);
2478  def _gfx10 : SOPK_Real64<op, ps>,
2479               Select<GFX10Gen, ps.PseudoInstr>;
2480}
2481
2482multiclass SOPK_Real32_gfx10_gfx11<bits<5> op> :
2483  SOPK_Real32_gfx10<op>, SOPK_Real32_gfx11<op>;
2484
2485multiclass SOPK_Real32_gfx10_gfx11_gfx12<bits<5> op> :
2486  SOPK_Real32_gfx10<op>, SOPK_Real32_gfx11_gfx12<op>;
2487
2488defm S_VERSION              : SOPK_Real32_gfx10_gfx11_gfx12<0x001>;
2489defm S_CALL_B64             : SOPK_Real32_gfx10<0x016>;
2490defm S_WAITCNT_VSCNT        : SOPK_Real32_gfx10<0x017>;
2491defm S_WAITCNT_VMCNT        : SOPK_Real32_gfx10<0x018>;
2492defm S_WAITCNT_EXPCNT       : SOPK_Real32_gfx10<0x019>;
2493defm S_WAITCNT_LGKMCNT      : SOPK_Real32_gfx10<0x01a>;
2494defm S_SUBVECTOR_LOOP_BEGIN : SOPK_Real32_gfx10<0x01b>;
2495defm S_SUBVECTOR_LOOP_END   : SOPK_Real32_gfx10<0x01c>;
2496
2497//===----------------------------------------------------------------------===//
2498// SOPK - GFX6, GFX7.
2499//===----------------------------------------------------------------------===//
2500
2501multiclass SOPK_Real32_gfx6_gfx7<bits<5> op> {
2502  defvar ps = !cast<SOPK_Pseudo>(NAME);
2503  def _gfx6_gfx7 : SOPK_Real32<op, ps>,
2504                   Select_gfx6_gfx7<ps.PseudoInstr>;
2505}
2506
2507multiclass SOPK_Real64_gfx6_gfx7<bits<5> op> {
2508  defvar ps = !cast<SOPK_Pseudo>(NAME);
2509  def _gfx6_gfx7 : SOPK_Real64<op, ps>,
2510                   Select_gfx6_gfx7<ps.PseudoInstr>;
2511}
2512
2513multiclass SOPK_Real32_gfx6_gfx7_gfx10<bits<5> op> :
2514  SOPK_Real32_gfx6_gfx7<op>, SOPK_Real32_gfx10<op>;
2515
2516multiclass SOPK_Real64_gfx6_gfx7_gfx10<bits<5> op> :
2517  SOPK_Real64_gfx6_gfx7<op>, SOPK_Real64_gfx10<op>;
2518
2519multiclass SOPK_Real32_gfx6_gfx7_gfx10_gfx11<bits<5> op> :
2520  SOPK_Real32_gfx6_gfx7<op>, SOPK_Real32_gfx10_gfx11<op>;
2521
2522multiclass SOPK_Real32_gfx6_gfx7_gfx10_gfx11_gfx12<bits<5> op> :
2523  SOPK_Real32_gfx6_gfx7<op>, SOPK_Real32_gfx10_gfx11_gfx12<op>;
2524
2525multiclass SOPK_Real32_gfx6_gfx7_gfx10_gfx11_Renamed_gfx12<bits<5> op, string gfx12_name> :
2526  SOPK_Real32_gfx6_gfx7<op>, SOPK_Real32_gfx10<op>, SOPK_Real32_gfx11<op>,
2527  SOPK_Real32_gfx12<op, gfx12_name>;
2528
2529defm S_CBRANCH_I_FORK : SOPK_Real32_gfx6_gfx7<0x011>;
2530
2531defm S_MOVK_I32         : SOPK_Real32_gfx6_gfx7_gfx10_gfx11_gfx12<0x000>;
2532defm S_CMOVK_I32        : SOPK_Real32_gfx6_gfx7_gfx10_gfx11_gfx12<0x002>;
2533defm S_CMPK_EQ_I32      : SOPK_Real32_gfx6_gfx7_gfx10_gfx11<0x003>;
2534defm S_CMPK_LG_I32      : SOPK_Real32_gfx6_gfx7_gfx10_gfx11<0x004>;
2535defm S_CMPK_GT_I32      : SOPK_Real32_gfx6_gfx7_gfx10_gfx11<0x005>;
2536defm S_CMPK_GE_I32      : SOPK_Real32_gfx6_gfx7_gfx10_gfx11<0x006>;
2537defm S_CMPK_LT_I32      : SOPK_Real32_gfx6_gfx7_gfx10_gfx11<0x007>;
2538defm S_CMPK_LE_I32      : SOPK_Real32_gfx6_gfx7_gfx10_gfx11<0x008>;
2539defm S_CMPK_EQ_U32      : SOPK_Real32_gfx6_gfx7_gfx10_gfx11<0x009>;
2540defm S_CMPK_LG_U32      : SOPK_Real32_gfx6_gfx7_gfx10_gfx11<0x00a>;
2541defm S_CMPK_GT_U32      : SOPK_Real32_gfx6_gfx7_gfx10_gfx11<0x00b>;
2542defm S_CMPK_GE_U32      : SOPK_Real32_gfx6_gfx7_gfx10_gfx11<0x00c>;
2543defm S_CMPK_LT_U32      : SOPK_Real32_gfx6_gfx7_gfx10_gfx11<0x00d>;
2544defm S_CMPK_LE_U32      : SOPK_Real32_gfx6_gfx7_gfx10_gfx11<0x00e>;
2545defm S_ADDK_I32         : SOPK_Real32_gfx6_gfx7_gfx10_gfx11_Renamed_gfx12<0x00f, "s_addk_co_i32">;
2546defm S_MULK_I32         : SOPK_Real32_gfx6_gfx7_gfx10_gfx11_gfx12<0x010>;
2547defm S_GETREG_B32       : SOPK_Real32_gfx6_gfx7_gfx10<0x012>;
2548defm S_SETREG_B32       : SOPK_Real32_gfx6_gfx7_gfx10<0x013>;
2549defm S_SETREG_IMM32_B32 : SOPK_Real64_gfx6_gfx7_gfx10<0x015>;
2550
2551//===----------------------------------------------------------------------===//
2552// SOPP - GFX12 only.
2553//===----------------------------------------------------------------------===//
2554
2555multiclass SOPP_Real_32_gfx12<bits<7> op, string name = !tolower(NAME)> {
2556  defvar ps = !cast<SOPP_Pseudo>(NAME);
2557  def _gfx12 : SOPP_Real_32<op, ps, name>,
2558               Select<GFX12Gen, ps.PseudoInstr>;
2559  if !ne(ps.Mnemonic, name) then
2560    def : AMDGPUMnemonicAlias<ps.Mnemonic, name> {
2561      let AssemblerPredicate = isGFX12Plus;
2562    }
2563}
2564
2565defm S_BARRIER_WAIT         : SOPP_Real_32_gfx12<0x014>;
2566defm S_BARRIER_LEAVE        : SOPP_Real_32_gfx12<0x015>;
2567defm S_WAIT_LOADCNT         : SOPP_Real_32_gfx12<0x040>;
2568defm S_WAIT_STORECNT        : SOPP_Real_32_gfx12<0x041>;
2569defm S_WAIT_SAMPLECNT       : SOPP_Real_32_gfx12<0x042>;
2570defm S_WAIT_BVHCNT          : SOPP_Real_32_gfx12<0x043>;
2571defm S_WAIT_EXPCNT          : SOPP_Real_32_gfx12<0x044>;
2572defm S_WAIT_DSCNT           : SOPP_Real_32_gfx12<0x046>;
2573defm S_WAIT_KMCNT           : SOPP_Real_32_gfx12<0x047>;
2574defm S_WAIT_LOADCNT_DSCNT   : SOPP_Real_32_gfx12<0x048>;
2575defm S_WAIT_STORECNT_DSCNT  : SOPP_Real_32_gfx12<0x049>;
2576
2577//===----------------------------------------------------------------------===//
2578// SOPP - GFX11, GFX12.
2579//===----------------------------------------------------------------------===//
2580
2581
2582multiclass SOPP_Real_32_gfx11<bits<7> op, string name = !tolower(NAME)> {
2583  defvar ps = !cast<SOPP_Pseudo>(NAME);
2584  def _gfx11 : SOPP_Real_32<op, ps, name>,
2585               Select<GFX11Gen, ps.PseudoInstr>,
2586               SOPPRelaxTable<0, ps.KeyName, "_gfx11">;
2587  if !ne(ps.Mnemonic, name) then
2588    def : AMDGPUMnemonicAlias<ps.Mnemonic, name> {
2589      let AssemblerPredicate = isGFX11Only;
2590    }
2591}
2592
2593multiclass SOPP_Real_64_gfx12<bits<7> op> {
2594  def _gfx12 : SOPP_Real_64<op, !cast<SOPP_Pseudo>(NAME), !cast<SOPP_Pseudo>(NAME).Mnemonic>,
2595               Select<GFX12Gen, !cast<SOPP_Pseudo>(NAME).PseudoInstr>,
2596               SOPPRelaxTable<1, !cast<SOPP_Pseudo>(NAME).KeyName, "_gfx12">;
2597}
2598
2599multiclass SOPP_Real_64_gfx11<bits<7> op> {
2600  def _gfx11 : SOPP_Real_64<op, !cast<SOPP_Pseudo>(NAME), !cast<SOPP_Pseudo>(NAME).Mnemonic>,
2601               Select<GFX11Gen, !cast<SOPP_Pseudo>(NAME).PseudoInstr>,
2602               SOPPRelaxTable<1, !cast<SOPP_Pseudo>(NAME).KeyName, "_gfx11">;
2603}
2604
2605multiclass SOPP_Real_32_gfx11_gfx12<bits<7> op> :
2606  SOPP_Real_32_gfx11<op>, SOPP_Real_32_gfx12<op>;
2607
2608multiclass SOPP_Real_32_gfx11_Renamed_gfx12<bits<7> op, string gfx12_name> :
2609  SOPP_Real_32_gfx11<op>, SOPP_Real_32_gfx12<op, gfx12_name>;
2610
2611multiclass SOPP_Real_With_Relaxation_gfx12<bits<7> op> {
2612  defm "" : SOPP_Real_32_gfx12<op>;
2613  let isCodeGenOnly = 1 in
2614  defm _pad_s_nop : SOPP_Real_64_gfx12<op>;
2615}
2616
2617multiclass SOPP_Real_With_Relaxation_gfx11<bits<7> op> {
2618  defm "" : SOPP_Real_32_gfx11<op>;
2619  let isCodeGenOnly = 1 in
2620  defm _pad_s_nop : SOPP_Real_64_gfx11<op>;
2621}
2622
2623multiclass SOPP_Real_With_Relaxation_gfx11_gfx12<bits<7>op> :
2624  SOPP_Real_With_Relaxation_gfx11<op>, SOPP_Real_With_Relaxation_gfx12<op>;
2625
2626defm S_SETKILL                    : SOPP_Real_32_gfx11_gfx12<0x001>;
2627defm S_SETHALT                    : SOPP_Real_32_gfx11_gfx12<0x002>;
2628defm S_SLEEP                      : SOPP_Real_32_gfx11_gfx12<0x003>;
2629defm S_INST_PREFETCH              : SOPP_Real_32_gfx11<0x004, "s_set_inst_prefetch_distance">;
2630defm S_CLAUSE                     : SOPP_Real_32_gfx11_gfx12<0x005>;
2631defm S_DELAY_ALU                  : SOPP_Real_32_gfx11_gfx12<0x007>;
2632defm S_WAITCNT_DEPCTR             : SOPP_Real_32_gfx11_Renamed_gfx12<0x008, "s_wait_alu">;
2633defm S_WAITCNT                    : SOPP_Real_32_gfx11_gfx12<0x009>;
2634defm S_WAIT_IDLE                  : SOPP_Real_32_gfx11_gfx12<0x00a>;
2635defm S_WAIT_EVENT                 : SOPP_Real_32_gfx11_gfx12<0x00b>;
2636defm S_TRAP                       : SOPP_Real_32_gfx11_gfx12<0x010>;
2637defm S_ROUND_MODE                 : SOPP_Real_32_gfx11_gfx12<0x011>;
2638defm S_DENORM_MODE                : SOPP_Real_32_gfx11_gfx12<0x012>;
2639defm S_BRANCH                     : SOPP_Real_With_Relaxation_gfx11_gfx12<0x020>;
2640defm S_CBRANCH_SCC0               : SOPP_Real_With_Relaxation_gfx11_gfx12<0x021>;
2641defm S_CBRANCH_SCC1               : SOPP_Real_With_Relaxation_gfx11_gfx12<0x022>;
2642defm S_CBRANCH_VCCZ               : SOPP_Real_With_Relaxation_gfx11_gfx12<0x023>;
2643defm S_CBRANCH_VCCNZ              : SOPP_Real_With_Relaxation_gfx11_gfx12<0x024>;
2644defm S_CBRANCH_EXECZ              : SOPP_Real_With_Relaxation_gfx11_gfx12<0x025>;
2645defm S_CBRANCH_EXECNZ             : SOPP_Real_With_Relaxation_gfx11_gfx12<0x026>;
2646defm S_CBRANCH_CDBGSYS            : SOPP_Real_With_Relaxation_gfx11<0x027>;
2647defm S_CBRANCH_CDBGUSER           : SOPP_Real_With_Relaxation_gfx11<0x028>;
2648defm S_CBRANCH_CDBGSYS_OR_USER    : SOPP_Real_With_Relaxation_gfx11<0x029>;
2649defm S_CBRANCH_CDBGSYS_AND_USER   : SOPP_Real_With_Relaxation_gfx11<0x02a>;
2650defm S_ENDPGM                     : SOPP_Real_32_gfx11_gfx12<0x030>;
2651defm S_ENDPGM_SAVED               : SOPP_Real_32_gfx11_gfx12<0x031>;
2652defm S_ENDPGM_ORDERED_PS_DONE     : SOPP_Real_32_gfx11<0x032>;
2653defm S_WAKEUP                     : SOPP_Real_32_gfx11_gfx12<0x034>;
2654defm S_SETPRIO                    : SOPP_Real_32_gfx11_gfx12<0x035>;
2655defm S_SENDMSG                    : SOPP_Real_32_gfx11_gfx12<0x036>;
2656defm S_SENDMSGHALT                : SOPP_Real_32_gfx11_gfx12<0x037>;
2657defm S_INCPERFLEVEL               : SOPP_Real_32_gfx11_gfx12<0x038>;
2658defm S_DECPERFLEVEL               : SOPP_Real_32_gfx11_gfx12<0x039>;
2659defm S_TTRACEDATA                 : SOPP_Real_32_gfx11_gfx12<0x03a>;
2660defm S_TTRACEDATA_IMM             : SOPP_Real_32_gfx11_gfx12<0x03b>;
2661defm S_ICACHE_INV                 : SOPP_Real_32_gfx11_gfx12<0x03c>;
2662
2663defm S_BARRIER                    : SOPP_Real_32_gfx11<0x03d>;
2664
2665//===----------------------------------------------------------------------===//
2666// SOPP - GFX6, GFX7, GFX8, GFX9, GFX10
2667//===----------------------------------------------------------------------===//
2668
2669multiclass SOPP_Real_32_gfx6_gfx7<bits<7> op> {
2670  defvar ps = !cast<SOPP_Pseudo>(NAME);
2671  def _gfx6_gfx7 : SOPP_Real_32<op, ps, !cast<SOPP_Pseudo>(NAME).Mnemonic>,
2672                   Select_gfx6_gfx7<ps.PseudoInstr>,
2673                   SOPPRelaxTable<0, ps.KeyName, "_gfx6_gfx7">;
2674}
2675
2676multiclass SOPP_Real_32_gfx8_gfx9<bits<7> op> {
2677  defvar ps = !cast<SOPP_Pseudo>(NAME);
2678  def _vi : SOPP_Real_32<op, ps>,
2679            Select_vi<ps.PseudoInstr>,
2680            SOPPRelaxTable<0, ps.KeyName, "_vi">;
2681}
2682
2683multiclass SOPP_Real_32_gfx10<bits<7> op> {
2684  defvar ps = !cast<SOPP_Pseudo>(NAME);
2685  def _gfx10 : SOPP_Real_32<op, ps>,
2686               Select<GFX10Gen, ps.PseudoInstr>,
2687               SOPPRelaxTable<0, ps.KeyName, "_gfx10">;
2688}
2689
2690multiclass SOPP_Real_32_gfx8_gfx9_gfx10<bits<7> op> :
2691  SOPP_Real_32_gfx8_gfx9<op>, SOPP_Real_32_gfx10<op>;
2692
2693multiclass SOPP_Real_32_gfx6_gfx7_gfx8_gfx9<bits<7> op> :
2694  SOPP_Real_32_gfx6_gfx7<op>, SOPP_Real_32_gfx8_gfx9<op>;
2695
2696multiclass SOPP_Real_32_gfx6_gfx7_gfx8_gfx9_gfx10<bits<7> op> :
2697  SOPP_Real_32_gfx6_gfx7_gfx8_gfx9<op>, SOPP_Real_32_gfx10<op>;
2698
2699multiclass SOPP_Real_32_gfx6_gfx7_gfx8_gfx9_gfx10_gfx11_gfx12<bits<7> op> :
2700  SOPP_Real_32_gfx6_gfx7_gfx8_gfx9_gfx10<op>, SOPP_Real_32_gfx11_gfx12<op>;
2701
2702multiclass SOPP_Real_32_gfx10_gfx11_gfx12<bits<7> op> :
2703  SOPP_Real_32_gfx10<op>, SOPP_Real_32_gfx11_gfx12<op>;
2704
2705//64 bit encodings, for Relaxation
2706multiclass SOPP_Real_64_gfx6_gfx7<bits<7> op> {
2707  defvar ps = !cast<SOPP_Pseudo>(NAME);
2708  def _gfx6_gfx7 : SOPP_Real_64<op, ps>,
2709                   Select_gfx6_gfx7<ps.PseudoInstr>,
2710                   SOPPRelaxTable<1, ps.KeyName, "_gfx6_gfx7">;
2711}
2712
2713multiclass SOPP_Real_64_gfx8_gfx9<bits<7> op> {
2714  defvar ps = !cast<SOPP_Pseudo>(NAME);
2715  def _vi : SOPP_Real_64<op, ps>,
2716            Select_vi<ps.PseudoInstr>,
2717            SOPPRelaxTable<1, ps.KeyName, "_vi">;
2718}
2719
2720multiclass SOPP_Real_64_gfx10<bits<7> op> {
2721  defvar ps = !cast<SOPP_Pseudo>(NAME);
2722  def _gfx10 : SOPP_Real_64<op, ps>,
2723               Select<GFX10Gen, ps.PseudoInstr>,
2724               SOPPRelaxTable<1, ps.KeyName, "_gfx10">;
2725}
2726
2727multiclass SOPP_Real_64_gfx6_gfx7_gfx8_gfx9<bits<7> op> :
2728  SOPP_Real_64_gfx6_gfx7<op>, SOPP_Real_64_gfx8_gfx9<op>;
2729
2730multiclass SOPP_Real_64_gfx6_gfx7_gfx8_gfx9_gfx10<bits<7> op> :
2731  SOPP_Real_64_gfx6_gfx7_gfx8_gfx9<op>, SOPP_Real_64_gfx10<op>;
2732
2733//relaxation for insts with no operands not implemented
2734multiclass SOPP_Real_With_Relaxation_gfx6_gfx7_gfx8_gfx9_gfx10<bits<7> op> {
2735  defm "" : SOPP_Real_32_gfx6_gfx7_gfx8_gfx9_gfx10<op>;
2736  let isCodeGenOnly = 1 in
2737  defm _pad_s_nop : SOPP_Real_64_gfx6_gfx7_gfx8_gfx9_gfx10<op>;
2738}
2739
2740defm S_NOP                      : SOPP_Real_32_gfx6_gfx7_gfx8_gfx9_gfx10_gfx11_gfx12<0x000>;
2741defm S_ENDPGM                   : SOPP_Real_32_gfx6_gfx7_gfx8_gfx9_gfx10<0x001>;
2742defm S_WAKEUP                   : SOPP_Real_32_gfx8_gfx9_gfx10<0x003>;
2743defm S_BARRIER                  : SOPP_Real_32_gfx6_gfx7_gfx8_gfx9_gfx10<0x00a>;
2744defm S_WAITCNT                  : SOPP_Real_32_gfx6_gfx7_gfx8_gfx9_gfx10<0x00c>;
2745defm S_SETHALT                  : SOPP_Real_32_gfx6_gfx7_gfx8_gfx9_gfx10<0x00d>;
2746defm S_SETKILL                  : SOPP_Real_32_gfx6_gfx7_gfx8_gfx9_gfx10<0x00b>;
2747defm S_SLEEP                    : SOPP_Real_32_gfx6_gfx7_gfx8_gfx9_gfx10<0x00e>;
2748defm S_SETPRIO                  : SOPP_Real_32_gfx6_gfx7_gfx8_gfx9_gfx10<0x00f>;
2749defm S_SENDMSG                  : SOPP_Real_32_gfx6_gfx7_gfx8_gfx9_gfx10<0x010>;
2750defm S_SENDMSGHALT              : SOPP_Real_32_gfx6_gfx7_gfx8_gfx9_gfx10<0x011>;
2751defm S_TRAP                     : SOPP_Real_32_gfx6_gfx7_gfx8_gfx9_gfx10<0x012>;
2752defm S_ICACHE_INV               : SOPP_Real_32_gfx6_gfx7_gfx8_gfx9_gfx10<0x013>;
2753defm S_INCPERFLEVEL             : SOPP_Real_32_gfx6_gfx7_gfx8_gfx9_gfx10<0x014>;
2754defm S_DECPERFLEVEL             : SOPP_Real_32_gfx6_gfx7_gfx8_gfx9_gfx10<0x015>;
2755defm S_TTRACEDATA               : SOPP_Real_32_gfx6_gfx7_gfx8_gfx9_gfx10<0x016>;
2756defm S_ENDPGM_SAVED             : SOPP_Real_32_gfx6_gfx7_gfx8_gfx9_gfx10<0x01B>;
2757defm S_SET_GPR_IDX_OFF          : SOPP_Real_32_gfx8_gfx9<0x01c>;
2758defm S_SET_GPR_IDX_MODE         : SOPP_Real_32_gfx8_gfx9<0x01d>;
2759defm S_ENDPGM_ORDERED_PS_DONE   : SOPP_Real_32_gfx8_gfx9_gfx10<0x01e>;
2760defm S_CODE_END                 : SOPP_Real_32_gfx10_gfx11_gfx12<0x01f>;
2761defm S_INST_PREFETCH            : SOPP_Real_32_gfx10<0x020>;
2762defm S_CLAUSE                   : SOPP_Real_32_gfx10<0x021>;
2763defm S_WAIT_IDLE                : SOPP_Real_32_gfx10<0x022>;
2764defm S_WAITCNT_DEPCTR           : SOPP_Real_32_gfx10<0x023>;
2765defm S_ROUND_MODE               : SOPP_Real_32_gfx10<0x024>;
2766defm S_DENORM_MODE              : SOPP_Real_32_gfx10<0x025>;
2767defm S_TTRACEDATA_IMM           : SOPP_Real_32_gfx10<0x028>;
2768
2769let isBranch = 1 in {
2770defm S_BRANCH                   : SOPP_Real_With_Relaxation_gfx6_gfx7_gfx8_gfx9_gfx10<0x002>;
2771defm S_CBRANCH_SCC0             : SOPP_Real_With_Relaxation_gfx6_gfx7_gfx8_gfx9_gfx10<0x004>;
2772defm S_CBRANCH_SCC1             : SOPP_Real_With_Relaxation_gfx6_gfx7_gfx8_gfx9_gfx10<0x005>;
2773defm S_CBRANCH_VCCZ             : SOPP_Real_With_Relaxation_gfx6_gfx7_gfx8_gfx9_gfx10<0x006>;
2774defm S_CBRANCH_VCCNZ            : SOPP_Real_With_Relaxation_gfx6_gfx7_gfx8_gfx9_gfx10<0x007>;
2775defm S_CBRANCH_EXECZ            : SOPP_Real_With_Relaxation_gfx6_gfx7_gfx8_gfx9_gfx10<0x008>;
2776defm S_CBRANCH_EXECNZ           : SOPP_Real_With_Relaxation_gfx6_gfx7_gfx8_gfx9_gfx10<0x009>;
2777defm S_CBRANCH_CDBGSYS          : SOPP_Real_With_Relaxation_gfx6_gfx7_gfx8_gfx9_gfx10<0x017>;
2778defm S_CBRANCH_CDBGUSER         : SOPP_Real_With_Relaxation_gfx6_gfx7_gfx8_gfx9_gfx10<0x018>;
2779defm S_CBRANCH_CDBGSYS_OR_USER  : SOPP_Real_With_Relaxation_gfx6_gfx7_gfx8_gfx9_gfx10<0x019>;
2780defm S_CBRANCH_CDBGSYS_AND_USER : SOPP_Real_With_Relaxation_gfx6_gfx7_gfx8_gfx9_gfx10<0x01A>;
2781}
2782
2783//===----------------------------------------------------------------------===//
2784// SOPC - GFX11, GFX12.
2785//===----------------------------------------------------------------------===//
2786
2787multiclass SOPC_Real_gfx12<bits<7> op> {
2788  def _gfx12 : SOPC_Real<op, !cast<SOPC_Pseudo>(NAME)>,
2789               Select<GFX12Gen, !cast<SOPC_Pseudo>(NAME).PseudoInstr>;
2790}
2791
2792multiclass SOPC_Real_gfx11<bits<7> op> {
2793  def _gfx11 : SOPC_Real<op, !cast<SOPC_Pseudo>(NAME)>,
2794               Select<GFX11Gen, !cast<SOPC_Pseudo>(NAME).PseudoInstr>;
2795}
2796
2797multiclass SOPC_Real_gfx11_gfx12<bits<7> op> :
2798  SOPC_Real_gfx11<op>, SOPC_Real_gfx12<op>;
2799
2800defm S_CMP_EQ_U64 : SOPC_Real_gfx11_gfx12<0x10>;
2801defm S_CMP_LG_U64 : SOPC_Real_gfx11_gfx12<0x11>;
2802
2803//===----------------------------------------------------------------------===//
2804// SOPC - GFX1150, GFX12
2805//===----------------------------------------------------------------------===//
2806
2807defm S_CMP_LT_F32  : SOPC_Real_gfx11_gfx12<0x41>;
2808defm S_CMP_EQ_F32  : SOPC_Real_gfx11_gfx12<0x42>;
2809defm S_CMP_LE_F32  : SOPC_Real_gfx11_gfx12<0x43>;
2810defm S_CMP_GT_F32  : SOPC_Real_gfx11_gfx12<0x44>;
2811defm S_CMP_LG_F32  : SOPC_Real_gfx11_gfx12<0x45>;
2812defm S_CMP_GE_F32  : SOPC_Real_gfx11_gfx12<0x46>;
2813defm S_CMP_O_F32   : SOPC_Real_gfx11_gfx12<0x47>;
2814defm S_CMP_U_F32   : SOPC_Real_gfx11_gfx12<0x48>;
2815defm S_CMP_NGE_F32 : SOPC_Real_gfx11_gfx12<0x49>;
2816defm S_CMP_NLG_F32 : SOPC_Real_gfx11_gfx12<0x4a>;
2817defm S_CMP_NGT_F32 : SOPC_Real_gfx11_gfx12<0x4b>;
2818defm S_CMP_NLE_F32 : SOPC_Real_gfx11_gfx12<0x4c>;
2819defm S_CMP_NEQ_F32 : SOPC_Real_gfx11_gfx12<0x4d>;
2820defm S_CMP_NLT_F32 : SOPC_Real_gfx11_gfx12<0x4e>;
2821
2822defm S_CMP_LT_F16  : SOPC_Real_gfx11_gfx12<0x51>;
2823defm S_CMP_EQ_F16  : SOPC_Real_gfx11_gfx12<0x52>;
2824defm S_CMP_LE_F16  : SOPC_Real_gfx11_gfx12<0x53>;
2825defm S_CMP_GT_F16  : SOPC_Real_gfx11_gfx12<0x54>;
2826defm S_CMP_LG_F16  : SOPC_Real_gfx11_gfx12<0x55>;
2827defm S_CMP_GE_F16  : SOPC_Real_gfx11_gfx12<0x56>;
2828defm S_CMP_O_F16   : SOPC_Real_gfx11_gfx12<0x57>;
2829defm S_CMP_U_F16   : SOPC_Real_gfx11_gfx12<0x58>;
2830defm S_CMP_NGE_F16 : SOPC_Real_gfx11_gfx12<0x59>;
2831defm S_CMP_NLG_F16 : SOPC_Real_gfx11_gfx12<0x5a>;
2832defm S_CMP_NGT_F16 : SOPC_Real_gfx11_gfx12<0x5b>;
2833defm S_CMP_NLE_F16 : SOPC_Real_gfx11_gfx12<0x5c>;
2834defm S_CMP_NEQ_F16 : SOPC_Real_gfx11_gfx12<0x5d>;
2835defm S_CMP_NLT_F16 : SOPC_Real_gfx11_gfx12<0x5e>;
2836
2837//===----------------------------------------------------------------------===//
2838// SOPC - GFX6, GFX7, GFX8, GFX9, GFX10
2839//===----------------------------------------------------------------------===//
2840
2841multiclass SOPC_Real_gfx6_gfx7<bits<7> op> {
2842  defvar ps = !cast<SOPC_Pseudo>(NAME);
2843  def _gfx6_gfx7 : SOPC_Real<op, ps>,
2844                   Select_gfx6_gfx7<ps.PseudoInstr>;
2845}
2846
2847multiclass SOPC_Real_gfx8_gfx9<bits<7> op> {
2848  defvar ps = !cast<SOPC_Pseudo>(NAME);
2849  def _vi : SOPC_Real<op, ps>,
2850            Select_vi<ps.PseudoInstr>;
2851}
2852
2853multiclass SOPC_Real_gfx10<bits<7> op> {
2854  defvar ps = !cast<SOPC_Pseudo>(NAME);
2855  def _gfx10 : SOPC_Real<op, ps>,
2856               Select<GFX10Gen, ps.PseudoInstr>;
2857}
2858
2859multiclass SOPC_Real_gfx8_gfx9_gfx10<bits<7> op> :
2860  SOPC_Real_gfx8_gfx9<op>, SOPC_Real_gfx10<op>;
2861
2862multiclass SOPC_Real_gfx6_gfx7_gfx8_gfx9<bits<7> op> :
2863  SOPC_Real_gfx6_gfx7<op>, SOPC_Real_gfx8_gfx9<op>;
2864
2865multiclass SOPC_Real_gfx6_gfx7_gfx8_gfx9_gfx10_gfx11_gfx12<bits<7> op> :
2866  SOPC_Real_gfx6_gfx7_gfx8_gfx9<op>, SOPC_Real_gfx10<op>, SOPC_Real_gfx11<op>,
2867  SOPC_Real_gfx12<op>;
2868
2869defm S_CMP_EQ_I32     : SOPC_Real_gfx6_gfx7_gfx8_gfx9_gfx10_gfx11_gfx12<0x00>;
2870defm S_CMP_LG_I32     : SOPC_Real_gfx6_gfx7_gfx8_gfx9_gfx10_gfx11_gfx12<0x01>;
2871defm S_CMP_GT_I32     : SOPC_Real_gfx6_gfx7_gfx8_gfx9_gfx10_gfx11_gfx12<0x02>;
2872defm S_CMP_GE_I32     : SOPC_Real_gfx6_gfx7_gfx8_gfx9_gfx10_gfx11_gfx12<0x03>;
2873defm S_CMP_LT_I32     : SOPC_Real_gfx6_gfx7_gfx8_gfx9_gfx10_gfx11_gfx12<0x04>;
2874defm S_CMP_LE_I32     : SOPC_Real_gfx6_gfx7_gfx8_gfx9_gfx10_gfx11_gfx12<0x05>;
2875defm S_CMP_EQ_U32     : SOPC_Real_gfx6_gfx7_gfx8_gfx9_gfx10_gfx11_gfx12<0x06>;
2876defm S_CMP_LG_U32     : SOPC_Real_gfx6_gfx7_gfx8_gfx9_gfx10_gfx11_gfx12<0x07>;
2877defm S_CMP_GT_U32     : SOPC_Real_gfx6_gfx7_gfx8_gfx9_gfx10_gfx11_gfx12<0x08>;
2878defm S_CMP_GE_U32     : SOPC_Real_gfx6_gfx7_gfx8_gfx9_gfx10_gfx11_gfx12<0x09>;
2879defm S_CMP_LT_U32     : SOPC_Real_gfx6_gfx7_gfx8_gfx9_gfx10_gfx11_gfx12<0x0a>;
2880defm S_CMP_LE_U32     : SOPC_Real_gfx6_gfx7_gfx8_gfx9_gfx10_gfx11_gfx12<0x0b>;
2881defm S_BITCMP0_B32    : SOPC_Real_gfx6_gfx7_gfx8_gfx9_gfx10_gfx11_gfx12<0x0c>;
2882defm S_BITCMP1_B32    : SOPC_Real_gfx6_gfx7_gfx8_gfx9_gfx10_gfx11_gfx12<0x0d>;
2883defm S_BITCMP0_B64    : SOPC_Real_gfx6_gfx7_gfx8_gfx9_gfx10_gfx11_gfx12<0x0e>;
2884defm S_BITCMP1_B64    : SOPC_Real_gfx6_gfx7_gfx8_gfx9_gfx10_gfx11_gfx12<0x0f>;
2885defm S_SETVSKIP       : SOPC_Real_gfx6_gfx7_gfx8_gfx9<0x10>;
2886defm S_SET_GPR_IDX_ON : SOPC_Real_gfx8_gfx9<0x11>;
2887defm S_CMP_EQ_U64     : SOPC_Real_gfx8_gfx9_gfx10<0x12>;
2888defm S_CMP_LG_U64     : SOPC_Real_gfx8_gfx9_gfx10<0x13>;
2889
2890//===----------------------------------------------------------------------===//
2891// GFX8 (VI), GFX9.
2892//===----------------------------------------------------------------------===//
2893
2894class SOP1_Real_vi<bits<8> op, SOP1_Pseudo ps> :
2895  SOP1_Real<op, ps>,
2896  Select_vi<ps.PseudoInstr>;
2897
2898class SOP2_Real_vi<bits<7> op, SOP2_Pseudo ps> :
2899  SOP2_Real32<op, ps>,
2900  Select_vi<ps.PseudoInstr>;
2901
2902class SOPK_Real_vi<bits<5> op, SOPK_Pseudo ps> :
2903  SOPK_Real32<op, ps>,
2904  Select_vi<ps.PseudoInstr>;
2905
2906def S_MOV_B32_vi           : SOP1_Real_vi <0x00, S_MOV_B32>;
2907def S_MOV_B64_vi           : SOP1_Real_vi <0x01, S_MOV_B64>;
2908def S_CMOV_B32_vi          : SOP1_Real_vi <0x02, S_CMOV_B32>;
2909def S_CMOV_B64_vi          : SOP1_Real_vi <0x03, S_CMOV_B64>;
2910def S_NOT_B32_vi           : SOP1_Real_vi <0x04, S_NOT_B32>;
2911def S_NOT_B64_vi           : SOP1_Real_vi <0x05, S_NOT_B64>;
2912def S_WQM_B32_vi           : SOP1_Real_vi <0x06, S_WQM_B32>;
2913def S_WQM_B64_vi           : SOP1_Real_vi <0x07, S_WQM_B64>;
2914def S_BREV_B32_vi          : SOP1_Real_vi <0x08, S_BREV_B32>;
2915def S_BREV_B64_vi          : SOP1_Real_vi <0x09, S_BREV_B64>;
2916def S_BCNT0_I32_B32_vi     : SOP1_Real_vi <0x0a, S_BCNT0_I32_B32>;
2917def S_BCNT0_I32_B64_vi     : SOP1_Real_vi <0x0b, S_BCNT0_I32_B64>;
2918def S_BCNT1_I32_B32_vi     : SOP1_Real_vi <0x0c, S_BCNT1_I32_B32>;
2919def S_BCNT1_I32_B64_vi     : SOP1_Real_vi <0x0d, S_BCNT1_I32_B64>;
2920def S_FF0_I32_B32_vi       : SOP1_Real_vi <0x0e, S_FF0_I32_B32>;
2921def S_FF0_I32_B64_vi       : SOP1_Real_vi <0x0f, S_FF0_I32_B64>;
2922def S_FF1_I32_B32_vi       : SOP1_Real_vi <0x10, S_FF1_I32_B32>;
2923def S_FF1_I32_B64_vi       : SOP1_Real_vi <0x11, S_FF1_I32_B64>;
2924def S_FLBIT_I32_B32_vi     : SOP1_Real_vi <0x12, S_FLBIT_I32_B32>;
2925def S_FLBIT_I32_B64_vi     : SOP1_Real_vi <0x13, S_FLBIT_I32_B64>;
2926def S_FLBIT_I32_vi         : SOP1_Real_vi <0x14, S_FLBIT_I32>;
2927def S_FLBIT_I32_I64_vi     : SOP1_Real_vi <0x15, S_FLBIT_I32_I64>;
2928def S_SEXT_I32_I8_vi       : SOP1_Real_vi <0x16, S_SEXT_I32_I8>;
2929def S_SEXT_I32_I16_vi      : SOP1_Real_vi <0x17, S_SEXT_I32_I16>;
2930def S_BITSET0_B32_vi       : SOP1_Real_vi <0x18, S_BITSET0_B32>;
2931def S_BITSET0_B64_vi       : SOP1_Real_vi <0x19, S_BITSET0_B64>;
2932def S_BITSET1_B32_vi       : SOP1_Real_vi <0x1a, S_BITSET1_B32>;
2933def S_BITSET1_B64_vi       : SOP1_Real_vi <0x1b, S_BITSET1_B64>;
2934def S_GETPC_B64_vi         : SOP1_Real_vi <0x1c, S_GETPC_B64>;
2935def S_SETPC_B64_vi         : SOP1_Real_vi <0x1d, S_SETPC_B64>;
2936def S_SWAPPC_B64_vi        : SOP1_Real_vi <0x1e, S_SWAPPC_B64>;
2937def S_RFE_B64_vi           : SOP1_Real_vi <0x1f, S_RFE_B64>;
2938def S_AND_SAVEEXEC_B64_vi  : SOP1_Real_vi <0x20, S_AND_SAVEEXEC_B64>;
2939def S_OR_SAVEEXEC_B64_vi   : SOP1_Real_vi <0x21, S_OR_SAVEEXEC_B64>;
2940def S_XOR_SAVEEXEC_B64_vi  : SOP1_Real_vi <0x22, S_XOR_SAVEEXEC_B64>;
2941def S_ANDN2_SAVEEXEC_B64_vi: SOP1_Real_vi <0x23, S_ANDN2_SAVEEXEC_B64>;
2942def S_ORN2_SAVEEXEC_B64_vi : SOP1_Real_vi <0x24, S_ORN2_SAVEEXEC_B64>;
2943def S_NAND_SAVEEXEC_B64_vi : SOP1_Real_vi <0x25, S_NAND_SAVEEXEC_B64>;
2944def S_NOR_SAVEEXEC_B64_vi  : SOP1_Real_vi <0x26, S_NOR_SAVEEXEC_B64>;
2945def S_XNOR_SAVEEXEC_B64_vi : SOP1_Real_vi <0x27, S_XNOR_SAVEEXEC_B64>;
2946def S_QUADMASK_B32_vi      : SOP1_Real_vi <0x28, S_QUADMASK_B32>;
2947def S_QUADMASK_B64_vi      : SOP1_Real_vi <0x29, S_QUADMASK_B64>;
2948def S_MOVRELS_B32_vi       : SOP1_Real_vi <0x2a, S_MOVRELS_B32>;
2949def S_MOVRELS_B64_vi       : SOP1_Real_vi <0x2b, S_MOVRELS_B64>;
2950def S_MOVRELD_B32_vi       : SOP1_Real_vi <0x2c, S_MOVRELD_B32>;
2951def S_MOVRELD_B64_vi       : SOP1_Real_vi <0x2d, S_MOVRELD_B64>;
2952def S_CBRANCH_JOIN_vi      : SOP1_Real_vi <0x2e, S_CBRANCH_JOIN>;
2953def S_ABS_I32_vi           : SOP1_Real_vi <0x30, S_ABS_I32>;
2954def S_SET_GPR_IDX_IDX_vi   : SOP1_Real_vi <0x32, S_SET_GPR_IDX_IDX>;
2955
2956def S_ADD_U32_vi           : SOP2_Real_vi <0x00, S_ADD_U32>;
2957def S_ADD_I32_vi           : SOP2_Real_vi <0x02, S_ADD_I32>;
2958def S_SUB_U32_vi           : SOP2_Real_vi <0x01, S_SUB_U32>;
2959def S_SUB_I32_vi           : SOP2_Real_vi <0x03, S_SUB_I32>;
2960def S_ADDC_U32_vi          : SOP2_Real_vi <0x04, S_ADDC_U32>;
2961def S_SUBB_U32_vi          : SOP2_Real_vi <0x05, S_SUBB_U32>;
2962def S_MIN_I32_vi           : SOP2_Real_vi <0x06, S_MIN_I32>;
2963def S_MIN_U32_vi           : SOP2_Real_vi <0x07, S_MIN_U32>;
2964def S_MAX_I32_vi           : SOP2_Real_vi <0x08, S_MAX_I32>;
2965def S_MAX_U32_vi           : SOP2_Real_vi <0x09, S_MAX_U32>;
2966def S_CSELECT_B32_vi       : SOP2_Real_vi <0x0a, S_CSELECT_B32>;
2967def S_CSELECT_B64_vi       : SOP2_Real_vi <0x0b, S_CSELECT_B64>;
2968def S_AND_B32_vi           : SOP2_Real_vi <0x0c, S_AND_B32>;
2969def S_AND_B64_vi           : SOP2_Real_vi <0x0d, S_AND_B64>;
2970def S_OR_B32_vi            : SOP2_Real_vi <0x0e, S_OR_B32>;
2971def S_OR_B64_vi            : SOP2_Real_vi <0x0f, S_OR_B64>;
2972def S_XOR_B32_vi           : SOP2_Real_vi <0x10, S_XOR_B32>;
2973def S_XOR_B64_vi           : SOP2_Real_vi <0x11, S_XOR_B64>;
2974def S_ANDN2_B32_vi         : SOP2_Real_vi <0x12, S_ANDN2_B32>;
2975def S_ANDN2_B64_vi         : SOP2_Real_vi <0x13, S_ANDN2_B64>;
2976def S_ORN2_B32_vi          : SOP2_Real_vi <0x14, S_ORN2_B32>;
2977def S_ORN2_B64_vi          : SOP2_Real_vi <0x15, S_ORN2_B64>;
2978def S_NAND_B32_vi          : SOP2_Real_vi <0x16, S_NAND_B32>;
2979def S_NAND_B64_vi          : SOP2_Real_vi <0x17, S_NAND_B64>;
2980def S_NOR_B32_vi           : SOP2_Real_vi <0x18, S_NOR_B32>;
2981def S_NOR_B64_vi           : SOP2_Real_vi <0x19, S_NOR_B64>;
2982def S_XNOR_B32_vi          : SOP2_Real_vi <0x1a, S_XNOR_B32>;
2983def S_XNOR_B64_vi          : SOP2_Real_vi <0x1b, S_XNOR_B64>;
2984def S_LSHL_B32_vi          : SOP2_Real_vi <0x1c, S_LSHL_B32>;
2985def S_LSHL_B64_vi          : SOP2_Real_vi <0x1d, S_LSHL_B64>;
2986def S_LSHR_B32_vi          : SOP2_Real_vi <0x1e, S_LSHR_B32>;
2987def S_LSHR_B64_vi          : SOP2_Real_vi <0x1f, S_LSHR_B64>;
2988def S_ASHR_I32_vi          : SOP2_Real_vi <0x20, S_ASHR_I32>;
2989def S_ASHR_I64_vi          : SOP2_Real_vi <0x21, S_ASHR_I64>;
2990def S_BFM_B32_vi           : SOP2_Real_vi <0x22, S_BFM_B32>;
2991def S_BFM_B64_vi           : SOP2_Real_vi <0x23, S_BFM_B64>;
2992def S_MUL_I32_vi           : SOP2_Real_vi <0x24, S_MUL_I32>;
2993def S_BFE_U32_vi           : SOP2_Real_vi <0x25, S_BFE_U32>;
2994def S_BFE_I32_vi           : SOP2_Real_vi <0x26, S_BFE_I32>;
2995def S_BFE_U64_vi           : SOP2_Real_vi <0x27, S_BFE_U64>;
2996def S_BFE_I64_vi           : SOP2_Real_vi <0x28, S_BFE_I64>;
2997def S_CBRANCH_G_FORK_vi    : SOP2_Real_vi <0x29, S_CBRANCH_G_FORK>;
2998def S_ABSDIFF_I32_vi       : SOP2_Real_vi <0x2a, S_ABSDIFF_I32>;
2999def S_PACK_LL_B32_B16_vi   : SOP2_Real_vi <0x32, S_PACK_LL_B32_B16>;
3000def S_PACK_LH_B32_B16_vi   : SOP2_Real_vi <0x33, S_PACK_LH_B32_B16>;
3001def S_PACK_HH_B32_B16_vi   : SOP2_Real_vi <0x34, S_PACK_HH_B32_B16>;
3002def S_RFE_RESTORE_B64_vi   : SOP2_Real_vi <0x2b, S_RFE_RESTORE_B64>;
3003
3004def S_MOVK_I32_vi          : SOPK_Real_vi <0x00, S_MOVK_I32>;
3005def S_CMOVK_I32_vi         : SOPK_Real_vi <0x01, S_CMOVK_I32>;
3006def S_CMPK_EQ_I32_vi       : SOPK_Real_vi <0x02, S_CMPK_EQ_I32>;
3007def S_CMPK_LG_I32_vi       : SOPK_Real_vi <0x03, S_CMPK_LG_I32>;
3008def S_CMPK_GT_I32_vi       : SOPK_Real_vi <0x04, S_CMPK_GT_I32>;
3009def S_CMPK_GE_I32_vi       : SOPK_Real_vi <0x05, S_CMPK_GE_I32>;
3010def S_CMPK_LT_I32_vi       : SOPK_Real_vi <0x06, S_CMPK_LT_I32>;
3011def S_CMPK_LE_I32_vi       : SOPK_Real_vi <0x07, S_CMPK_LE_I32>;
3012def S_CMPK_EQ_U32_vi       : SOPK_Real_vi <0x08, S_CMPK_EQ_U32>;
3013def S_CMPK_LG_U32_vi       : SOPK_Real_vi <0x09, S_CMPK_LG_U32>;
3014def S_CMPK_GT_U32_vi       : SOPK_Real_vi <0x0A, S_CMPK_GT_U32>;
3015def S_CMPK_GE_U32_vi       : SOPK_Real_vi <0x0B, S_CMPK_GE_U32>;
3016def S_CMPK_LT_U32_vi       : SOPK_Real_vi <0x0C, S_CMPK_LT_U32>;
3017def S_CMPK_LE_U32_vi       : SOPK_Real_vi <0x0D, S_CMPK_LE_U32>;
3018def S_ADDK_I32_vi          : SOPK_Real_vi <0x0E, S_ADDK_I32>;
3019def S_MULK_I32_vi          : SOPK_Real_vi <0x0F, S_MULK_I32>;
3020def S_CBRANCH_I_FORK_vi    : SOPK_Real_vi <0x10, S_CBRANCH_I_FORK>;
3021def S_GETREG_B32_vi        : SOPK_Real_vi <0x11, S_GETREG_B32>;
3022def S_SETREG_B32_vi        : SOPK_Real_vi <0x12, S_SETREG_B32>;
3023//def S_GETREG_REGRD_B32_vi  : SOPK_Real_vi <0x13, S_GETREG_REGRD_B32>; // see pseudo for comments
3024def S_SETREG_IMM32_B32_vi  : SOPK_Real64<0x14, S_SETREG_IMM32_B32>,
3025                             Select_vi<S_SETREG_IMM32_B32.PseudoInstr>;
3026
3027def S_CALL_B64_vi          : SOPK_Real_vi <0x15, S_CALL_B64>;
3028
3029//===----------------------------------------------------------------------===//
3030// SOP1 - GFX9.
3031//===----------------------------------------------------------------------===//
3032
3033def S_ANDN1_SAVEEXEC_B64_vi   : SOP1_Real_vi<0x33, S_ANDN1_SAVEEXEC_B64>;
3034def S_ORN1_SAVEEXEC_B64_vi    : SOP1_Real_vi<0x34, S_ORN1_SAVEEXEC_B64>;
3035def S_ANDN1_WREXEC_B64_vi     : SOP1_Real_vi<0x35, S_ANDN1_WREXEC_B64>;
3036def S_ANDN2_WREXEC_B64_vi     : SOP1_Real_vi<0x36, S_ANDN2_WREXEC_B64>;
3037def S_BITREPLICATE_B64_B32_vi : SOP1_Real_vi<0x37, S_BITREPLICATE_B64_B32>;
3038
3039//===----------------------------------------------------------------------===//
3040// SOP2 - GFX9.
3041//===----------------------------------------------------------------------===//
3042
3043def S_LSHL1_ADD_U32_vi   : SOP2_Real_vi<0x2e, S_LSHL1_ADD_U32>;
3044def S_LSHL2_ADD_U32_vi   : SOP2_Real_vi<0x2f, S_LSHL2_ADD_U32>;
3045def S_LSHL3_ADD_U32_vi   : SOP2_Real_vi<0x30, S_LSHL3_ADD_U32>;
3046def S_LSHL4_ADD_U32_vi   : SOP2_Real_vi<0x31, S_LSHL4_ADD_U32>;
3047def S_MUL_HI_U32_vi      : SOP2_Real_vi<0x2c, S_MUL_HI_U32>;
3048def S_MUL_HI_I32_vi      : SOP2_Real_vi<0x2d, S_MUL_HI_I32>;
3049