1// RUN: llvm-mc -triple=amdgcn -show-encoding -mcpu=gfx1200 %s | FileCheck --check-prefix=GFX12 %s 2 3v_dot2_f32_bf16 v5, v1, v2, v3 4// GFX12: [0x05,0x40,0x1a,0xcc,0x01,0x05,0x0e,0x1c] 5 6v_dot2_f32_bf16 v5, v1, v2, s3 7// GFX12: [0x05,0x40,0x1a,0xcc,0x01,0x05,0x0e,0x18] 8 9v_dot2_f32_bf16 v5, v255, v255, s105 10// GFX12: [0x05,0x40,0x1a,0xcc,0xff,0xff,0xa7,0x19] 11 12v_dot2_f32_bf16 v5, s1, s2, v255 13// GFX12: [0x05,0x40,0x1a,0xcc,0x01,0x04,0xfc,0x1f] 14 15v_dot2_f32_bf16 v5, s105, s105, m0 16// GFX12: [0x05,0x40,0x1a,0xcc,0x69,0xd2,0xf4,0x19] 17 18v_dot2_f32_bf16 v5, vcc_lo, ttmp15, vcc_lo 19// GFX12: [0x05,0x40,0x1a,0xcc,0x6a,0xf6,0xa8,0x19] 20 21v_dot2_f32_bf16 v5, vcc_hi, 0xfe0b, vcc_hi 22// GFX12: [0x05,0x40,0x1a,0xcc,0x6b,0xfe,0xad,0x19,0x0b,0xfe,0x00,0x00] 23 24v_dot2_f32_bf16 v5, ttmp15, src_scc, ttmp15 25// GFX12: [0x05,0x40,0x1a,0xcc,0x7b,0xfa,0xed,0x19] 26 27v_dot2_f32_bf16 v5, m0, -1, exec_hi 28// GFX12: [0x05,0x40,0x1a,0xcc,0x7d,0x82,0xfd,0x19] 29 30v_dot2_f32_bf16 v5, exec_lo, null, exec_lo 31// GFX12: [0x05,0x40,0x1a,0xcc,0x7e,0xf8,0xf8,0x19] 32 33v_dot2_f32_bf16 v5, exec_hi, exec_lo, null 34// GFX12: [0x05,0x40,0x1a,0xcc,0x7f,0xfc,0xf0,0x19] 35 36v_dot2_f32_bf16 v5, null, exec_hi, -1 37// GFX12: [0x05,0x40,0x1a,0xcc,0x7c,0xfe,0x04,0x1b] 38 39v_dot2_f32_bf16 v5, -1, m0, 0xaf123456 40// GFX12: [0x05,0x40,0x1a,0xcc,0xc1,0xfa,0xfc,0x1b,0x56,0x34,0x12,0xaf] 41 42v_dot2_f32_bf16 v5, src_scc, vcc_lo, src_scc neg_lo:[1,0,0] neg_hi:[1,0,0] 43// GFX12: [0x05,0x41,0x1a,0xcc,0xfd,0xd4,0xf4,0x3b] 44 45v_dot2_f32_bf16 v255, 0xfe0b, vcc_hi, 0.5 neg_lo:[0,0,0] neg_hi:[0,0,0] clamp 46// GFX12: [0xff,0xc0,0x1a,0xcc,0xff,0xd6,0xc0,0x1b,0x0b,0xfe,0x00,0x00] 47 48v_dot2_f32_f16 v5, v1, v2, s3 49// GFX12: [0x05,0x40,0x13,0xcc,0x01,0x05,0x0e,0x18] 50 51v_dot2_f32_f16 v5, v255, s2, s105 52// GFX12: [0x05,0x40,0x13,0xcc,0xff,0x05,0xa4,0x19] 53 54v_dot2_f32_f16 v5, s1, v255, exec_hi 55// GFX12: [0x05,0x40,0x13,0xcc,0x01,0xfe,0xff,0x19] 56 57v_dot2_f32_f16 v5, s105, s105, 
exec_lo 58// GFX12: [0x05,0x40,0x13,0xcc,0x69,0xd2,0xf8,0x19] 59 60v_dot2_f32_f16 v5, vcc_lo, ttmp15, v3 61// GFX12: [0x05,0x40,0x13,0xcc,0x6a,0xf6,0x0c,0x1c] 62 63v_dot2_f32_f16 v5, vcc_hi, 0xfe0b, v255 64// GFX12: [0x05,0x40,0x13,0xcc,0x6b,0xfe,0xfd,0x1f,0x0b,0xfe,0x00,0x00] 65 66v_dot2_f32_f16 v5, ttmp15, src_scc, ttmp15 67// GFX12: [0x05,0x40,0x13,0xcc,0x7b,0xfa,0xed,0x19] 68 69v_dot2_f32_f16 v5, m0, 0.5, m0 70// GFX12: [0x05,0x40,0x13,0xcc,0x7d,0xe0,0xf5,0x19] 71 72v_dot2_f32_f16 v5, exec_lo, -1, vcc_hi 73// GFX12: [0x05,0x40,0x13,0xcc,0x7e,0x82,0xad,0x19] 74 75v_dot2_f32_f16 v5, exec_hi, null, vcc_lo 76// GFX12: [0x05,0x40,0x13,0xcc,0x7f,0xf8,0xa8,0x19] 77 78v_dot2_f32_f16 v5, null, exec_lo, 0xaf123456 79// GFX12: [0x05,0x40,0x13,0xcc,0x7c,0xfc,0xfc,0x1b,0x56,0x34,0x12,0xaf] 80 81v_dot2_f32_f16 v5, -1, exec_hi, src_scc 82// GFX12: [0x05,0x40,0x13,0xcc,0xc1,0xfe,0xf4,0x1b] 83 84v_dot2_f32_f16 v5, 0.5, m0, 0.5 neg_lo:[1,0,0] neg_hi:[1,0,0] 85// GFX12: [0x05,0x41,0x13,0xcc,0xf0,0xfa,0xc0,0x3b] 86 87v_dot2_f32_f16 v5, src_scc, vcc_lo, -1 neg_lo:[0,1,0] neg_hi:[0,1,0] 88// GFX12: [0x05,0x42,0x13,0xcc,0xfd,0xd4,0x04,0x5b] 89 90v_dot2_f32_f16 v255, 0xfe0b, vcc_hi, null neg_lo:[0,0,0] neg_hi:[0,0,0] clamp 91// GFX12: [0xff,0xc0,0x13,0xcc,0xff,0xd6,0xf0,0x19,0x0b,0xfe,0x00,0x00] 92 93v_dot4_i32_iu8 v5, v1, v2, s3 94// GFX12: [0x05,0x40,0x16,0xcc,0x01,0x05,0x0e,0x18] 95 96v_dot4_i32_iu8 v5, v255, s2, s105 97// GFX12: [0x05,0x40,0x16,0xcc,0xff,0x05,0xa4,0x19] 98 99v_dot4_i32_iu8 v5, s1, v255, exec_hi 100// GFX12: [0x05,0x40,0x16,0xcc,0x01,0xfe,0xff,0x19] 101 102v_dot4_i32_iu8 v5, s105, s105, exec_lo 103// GFX12: [0x05,0x40,0x16,0xcc,0x69,0xd2,0xf8,0x19] 104 105v_dot4_i32_iu8 v5, vcc_lo, ttmp15, v3 106// GFX12: [0x05,0x40,0x16,0xcc,0x6a,0xf6,0x0c,0x1c] 107 108v_dot4_i32_iu8 v5, vcc_hi, 0xaf123456, v255 109// GFX12: [0x05,0x40,0x16,0xcc,0x6b,0xfe,0xfd,0x1f,0x56,0x34,0x12,0xaf] 110 111v_dot4_i32_iu8 v5, ttmp15, src_scc, ttmp15 112// GFX12: 
[0x05,0x40,0x16,0xcc,0x7b,0xfa,0xed,0x19] 113 114v_dot4_i32_iu8 v5, m0, 0.5, m0 115// GFX12: [0x05,0x40,0x16,0xcc,0x7d,0xe0,0xf5,0x19] 116 117v_dot4_i32_iu8 v5, exec_lo, -1, vcc_hi 118// GFX12: [0x05,0x40,0x16,0xcc,0x7e,0x82,0xad,0x19] 119 120v_dot4_i32_iu8 v5, exec_hi, null, vcc_lo 121// GFX12: [0x05,0x40,0x16,0xcc,0x7f,0xf8,0xa8,0x19] 122 123v_dot4_i32_iu8 v5, null, exec_lo, 0xaf123456 124// GFX12: [0x05,0x40,0x16,0xcc,0x7c,0xfc,0xfc,0x1b,0x56,0x34,0x12,0xaf] 125 126v_dot4_i32_iu8 v5, -1, exec_hi, src_scc 127// GFX12: [0x05,0x40,0x16,0xcc,0xc1,0xfe,0xf4,0x1b] 128 129v_dot4_i32_iu8 v5, 0.5, m0, 0.5 neg_lo:[1,0,0] 130// GFX12: [0x05,0x40,0x16,0xcc,0xf0,0xfa,0xc0,0x3b] 131 132v_dot4_i32_iu8 v5, src_scc, vcc_lo, -1 neg_lo:[0,1,0] 133// GFX12: [0x05,0x40,0x16,0xcc,0xfd,0xd4,0x04,0x5b] 134 135v_dot4_i32_iu8 v255, 0xaf123456, vcc_hi, null neg_lo:[0,0,0] 136// GFX12: [0xff,0x40,0x16,0xcc,0xff,0xd6,0xf0,0x19,0x56,0x34,0x12,0xaf] 137 138v_dot4_u32_u8 v5, v1, v2, s3 139// GFX12: [0x05,0x40,0x17,0xcc,0x01,0x05,0x0e,0x18] 140 141v_dot4_u32_u8 v5, v255, s2, s105 142// GFX12: [0x05,0x40,0x17,0xcc,0xff,0x05,0xa4,0x19] 143 144v_dot4_u32_u8 v5, s1, v255, exec_hi 145// GFX12: [0x05,0x40,0x17,0xcc,0x01,0xfe,0xff,0x19] 146 147v_dot4_u32_u8 v5, s105, s105, exec_lo 148// GFX12: [0x05,0x40,0x17,0xcc,0x69,0xd2,0xf8,0x19] 149 150v_dot4_u32_u8 v5, vcc_lo, ttmp15, v3 151// GFX12: [0x05,0x40,0x17,0xcc,0x6a,0xf6,0x0c,0x1c] 152 153v_dot4_u32_u8 v5, vcc_hi, 0xaf123456, v255 154// GFX12: [0x05,0x40,0x17,0xcc,0x6b,0xfe,0xfd,0x1f,0x56,0x34,0x12,0xaf] 155 156v_dot4_u32_u8 v5, ttmp15, src_scc, ttmp15 157// GFX12: [0x05,0x40,0x17,0xcc,0x7b,0xfa,0xed,0x19] 158 159v_dot4_u32_u8 v5, m0, 0.5, m0 160// GFX12: [0x05,0x40,0x17,0xcc,0x7d,0xe0,0xf5,0x19] 161 162v_dot4_u32_u8 v5, exec_lo, -1, vcc_hi 163// GFX12: [0x05,0x40,0x17,0xcc,0x7e,0x82,0xad,0x19] 164 165v_dot4_u32_u8 v5, exec_hi, null, vcc_lo 166// GFX12: [0x05,0x40,0x17,0xcc,0x7f,0xf8,0xa8,0x19] 167 168v_dot4_u32_u8 v5, null, exec_lo, 0xaf123456 169// 
GFX12: [0x05,0x40,0x17,0xcc,0x7c,0xfc,0xfc,0x1b,0x56,0x34,0x12,0xaf] 170 171v_dot4_u32_u8 v5, -1, exec_hi, src_scc 172// GFX12: [0x05,0x40,0x17,0xcc,0xc1,0xfe,0xf4,0x1b] 173 174v_dot4_u32_u8 v5, 0.5, m0, 0.5 175// GFX12: [0x05,0x40,0x17,0xcc,0xf0,0xfa,0xc0,0x1b] 176 177v_dot4_u32_u8 v5, src_scc, vcc_lo, -1 178// GFX12: [0x05,0x40,0x17,0xcc,0xfd,0xd4,0x04,0x1b] 179 180v_dot4_u32_u8 v255, 0xaf123456, vcc_hi, null 181// GFX12: [0xff,0x40,0x17,0xcc,0xff,0xd6,0xf0,0x19,0x56,0x34,0x12,0xaf] 182 183v_dot8_i32_iu4 v5, v1, v2, s3 184// GFX12: [0x05,0x40,0x18,0xcc,0x01,0x05,0x0e,0x18] 185 186v_dot8_i32_iu4 v5, v255, s2, s105 187// GFX12: [0x05,0x40,0x18,0xcc,0xff,0x05,0xa4,0x19] 188 189v_dot8_i32_iu4 v5, s1, v255, exec_hi 190// GFX12: [0x05,0x40,0x18,0xcc,0x01,0xfe,0xff,0x19] 191 192v_dot8_i32_iu4 v5, s105, s105, exec_lo 193// GFX12: [0x05,0x40,0x18,0xcc,0x69,0xd2,0xf8,0x19] 194 195v_dot8_i32_iu4 v5, vcc_lo, ttmp15, v3 196// GFX12: [0x05,0x40,0x18,0xcc,0x6a,0xf6,0x0c,0x1c] 197 198v_dot8_i32_iu4 v5, vcc_hi, 0xaf123456, v255 199// GFX12: [0x05,0x40,0x18,0xcc,0x6b,0xfe,0xfd,0x1f,0x56,0x34,0x12,0xaf] 200 201v_dot8_i32_iu4 v5, ttmp15, src_scc, ttmp15 202// GFX12: [0x05,0x40,0x18,0xcc,0x7b,0xfa,0xed,0x19] 203 204v_dot8_i32_iu4 v5, m0, 0.5, m0 205// GFX12: [0x05,0x40,0x18,0xcc,0x7d,0xe0,0xf5,0x19] 206 207v_dot8_i32_iu4 v5, exec_lo, -1, vcc_hi 208// GFX12: [0x05,0x40,0x18,0xcc,0x7e,0x82,0xad,0x19] 209 210v_dot8_i32_iu4 v5, exec_hi, null, vcc_lo 211// GFX12: [0x05,0x40,0x18,0xcc,0x7f,0xf8,0xa8,0x19] 212 213v_dot8_i32_iu4 v5, null, exec_lo, 0xaf123456 214// GFX12: [0x05,0x40,0x18,0xcc,0x7c,0xfc,0xfc,0x1b,0x56,0x34,0x12,0xaf] 215 216v_dot8_i32_iu4 v5, -1, exec_hi, src_scc 217// GFX12: [0x05,0x40,0x18,0xcc,0xc1,0xfe,0xf4,0x1b] 218 219v_dot8_i32_iu4 v5, 0.5, m0, 0.5 neg_lo:[1,0,0] 220// GFX12: [0x05,0x40,0x18,0xcc,0xf0,0xfa,0xc0,0x3b] 221 222v_dot8_i32_iu4 v5, src_scc, vcc_lo, -1 neg_lo:[0,1,0] 223// GFX12: [0x05,0x40,0x18,0xcc,0xfd,0xd4,0x04,0x5b] 224 225v_dot8_i32_iu4 v255, 0xaf123456, 
vcc_hi, null neg_lo:[0,0,0] clamp 226// GFX12: [0xff,0xc0,0x18,0xcc,0xff,0xd6,0xf0,0x19,0x56,0x34,0x12,0xaf] 227 228v_dot8_u32_u4 v5, v1, v2, s3 229// GFX12: [0x05,0x40,0x19,0xcc,0x01,0x05,0x0e,0x18] 230 231v_dot8_u32_u4 v5, v255, s2, s105 232// GFX12: [0x05,0x40,0x19,0xcc,0xff,0x05,0xa4,0x19] 233 234v_dot8_u32_u4 v5, s1, v255, exec_hi 235// GFX12: [0x05,0x40,0x19,0xcc,0x01,0xfe,0xff,0x19] 236 237v_dot8_u32_u4 v5, s105, s105, exec_lo 238// GFX12: [0x05,0x40,0x19,0xcc,0x69,0xd2,0xf8,0x19] 239 240v_dot8_u32_u4 v5, vcc_lo, ttmp15, v3 241// GFX12: [0x05,0x40,0x19,0xcc,0x6a,0xf6,0x0c,0x1c] 242 243v_dot8_u32_u4 v5, vcc_hi, 0xaf123456, v255 244// GFX12: [0x05,0x40,0x19,0xcc,0x6b,0xfe,0xfd,0x1f,0x56,0x34,0x12,0xaf] 245 246v_dot8_u32_u4 v5, ttmp15, src_scc, ttmp15 247// GFX12: [0x05,0x40,0x19,0xcc,0x7b,0xfa,0xed,0x19] 248 249v_dot8_u32_u4 v5, m0, 0.5, m0 250// GFX12: [0x05,0x40,0x19,0xcc,0x7d,0xe0,0xf5,0x19] 251 252v_dot8_u32_u4 v5, exec_lo, -1, vcc_hi 253// GFX12: [0x05,0x40,0x19,0xcc,0x7e,0x82,0xad,0x19] 254 255v_dot8_u32_u4 v5, exec_hi, null, vcc_lo 256// GFX12: [0x05,0x40,0x19,0xcc,0x7f,0xf8,0xa8,0x19] 257 258v_dot8_u32_u4 v5, null, exec_lo, 0xaf123456 259// GFX12: [0x05,0x40,0x19,0xcc,0x7c,0xfc,0xfc,0x1b,0x56,0x34,0x12,0xaf] 260 261v_dot8_u32_u4 v5, -1, exec_hi, src_scc 262// GFX12: [0x05,0x40,0x19,0xcc,0xc1,0xfe,0xf4,0x1b] 263 264v_dot8_u32_u4 v5, 0.5, m0, 0.5 265// GFX12: [0x05,0x40,0x19,0xcc,0xf0,0xfa,0xc0,0x1b] 266 267v_dot8_u32_u4 v5, src_scc, vcc_lo, -1 268// GFX12: [0x05,0x40,0x19,0xcc,0xfd,0xd4,0x04,0x1b] 269 270v_dot8_u32_u4 v255, 0xaf123456, vcc_hi, null clamp 271// GFX12: [0xff,0xc0,0x19,0xcc,0xff,0xd6,0xf0,0x19,0x56,0x34,0x12,0xaf] 272 273v_fma_mix_f32 v5, v1, v2, s3 274// GFX12: [0x05,0x00,0x20,0xcc,0x01,0x05,0x0e,0x00] 275 276v_fma_mix_f32 v5, v255, v255, s105 277// GFX12: [0x05,0x00,0x20,0xcc,0xff,0xff,0xa7,0x01] 278 279v_fma_mix_f32 v5, s1, s2, v3 280// GFX12: [0x05,0x00,0x20,0xcc,0x01,0x04,0x0c,0x04] 281 282v_fma_mix_f32 v5, s105, s105, m0 283// GFX12: 
[0x05,0x00,0x20,0xcc,0x69,0xd2,0xf4,0x01] 284 285v_fma_mix_f32 v5, vcc_lo, ttmp15, ttmp15 286// GFX12: [0x05,0x00,0x20,0xcc,0x6a,0xf6,0xec,0x01] 287 288v_fma_mix_f32 v5, vcc_hi, src_scc, v255 289// GFX12: [0x05,0x00,0x20,0xcc,0x6b,0xfa,0xfd,0x07] 290 291v_fma_mix_f32 v5, |ttmp15|, 0.5, -vcc_hi 292// GFX12: [0x05,0x01,0x20,0xcc,0x7b,0xe0,0xad,0x81] 293 294v_fma_mix_f32 v5, -m0, -1, |vcc_lo| 295// GFX12: [0x05,0x04,0x20,0xcc,0x7d,0x82,0xa9,0x21] 296 297v_fma_mix_f32 v5, -|exec_lo|, null, -|src_scc| 298// GFX12: [0x05,0x05,0x20,0xcc,0x7e,0xf8,0xf4,0xa3] 299 300v_fma_mix_f32 v5, -|exec_hi|, -|exec_lo|, -|exec_lo| op_sel:[1,1,1] op_sel_hi:[1,1,1] 301// GFX12: [0x05,0x7f,0x20,0xcc,0x7f,0xfc,0xf8,0xf9] 302 303v_fma_mix_f32 v5, null, exec_hi, 0.5 op_sel:[0,0,0] op_sel_hi:[0,0,1] 304// GFX12: [0x05,0x40,0x20,0xcc,0x7c,0xfe,0xc0,0x03] 305 306v_fma_mix_f32 v5, -1, -|m0|, -1 op_sel:[1,0,0] op_sel_hi:[0,1,0] 307// GFX12: [0x05,0x0a,0x20,0xcc,0xc1,0xfa,0x04,0x53] 308 309v_fma_mix_f32 v5, 0.5, -|vcc_lo|, -|exec_hi| op_sel:[0,1,0] op_sel_hi:[1,0,0] 310// GFX12: [0x05,0x16,0x20,0xcc,0xf0,0xd4,0xfc,0xc9] 311 312v_fma_mix_f32 v255, -|src_scc|, -|vcc_hi|, null op_sel:[0,0,1] op_sel_hi:[0,0,0] clamp 313// GFX12: [0xff,0xa3,0x20,0xcc,0xfd,0xd6,0xf0,0x61] 314 315v_fma_mixhi_f16 v5, v1, v2, s3 316// GFX12: [0x05,0x00,0x22,0xcc,0x01,0x05,0x0e,0x00] 317 318v_fma_mixhi_f16 v5, v255, v255, s105 319// GFX12: [0x05,0x00,0x22,0xcc,0xff,0xff,0xa7,0x01] 320 321v_fma_mixhi_f16 v5, s1, s2, v3 322// GFX12: [0x05,0x00,0x22,0xcc,0x01,0x04,0x0c,0x04] 323 324v_fma_mixhi_f16 v5, s105, s105, m0 325// GFX12: [0x05,0x00,0x22,0xcc,0x69,0xd2,0xf4,0x01] 326 327v_fma_mixhi_f16 v5, vcc_lo, ttmp15, ttmp15 328// GFX12: [0x05,0x00,0x22,0xcc,0x6a,0xf6,0xec,0x01] 329 330v_fma_mixhi_f16 v5, vcc_hi, src_scc, v255 331// GFX12: [0x05,0x00,0x22,0xcc,0x6b,0xfa,0xfd,0x07] 332 333v_fma_mixhi_f16 v5, |ttmp15|, 0.5, -vcc_hi 334// GFX12: [0x05,0x01,0x22,0xcc,0x7b,0xe0,0xad,0x81] 335 336v_fma_mixhi_f16 v5, -m0, -1, |vcc_lo| 337// 
GFX12: [0x05,0x04,0x22,0xcc,0x7d,0x82,0xa9,0x21] 338 339v_fma_mixhi_f16 v5, -|exec_lo|, null, -|src_scc| 340// GFX12: [0x05,0x05,0x22,0xcc,0x7e,0xf8,0xf4,0xa3] 341 342v_fma_mixhi_f16 v5, -|exec_hi|, -|exec_lo|, -|exec_lo| op_sel:[1,1,1] op_sel_hi:[1,1,1] 343// GFX12: [0x05,0x7f,0x22,0xcc,0x7f,0xfc,0xf8,0xf9] 344 345v_fma_mixhi_f16 v5, null, exec_hi, 0.5 op_sel:[0,0,0] op_sel_hi:[0,0,1] 346// GFX12: [0x05,0x40,0x22,0xcc,0x7c,0xfe,0xc0,0x03] 347 348v_fma_mixhi_f16 v5, -1, -|m0|, -1 op_sel:[1,0,0] op_sel_hi:[0,1,0] 349// GFX12: [0x05,0x0a,0x22,0xcc,0xc1,0xfa,0x04,0x53] 350 351v_fma_mixhi_f16 v5, 0.5, -|vcc_lo|, -|exec_hi| op_sel:[0,1,0] op_sel_hi:[1,0,0] 352// GFX12: [0x05,0x16,0x22,0xcc,0xf0,0xd4,0xfc,0xc9] 353 354v_fma_mixhi_f16 v255, -|src_scc|, -|vcc_hi|, null op_sel:[0,0,1] op_sel_hi:[0,0,0] clamp 355// GFX12: [0xff,0xa3,0x22,0xcc,0xfd,0xd6,0xf0,0x61] 356 357v_fma_mixlo_f16 v5, v1, v2, s3 358// GFX12: [0x05,0x00,0x21,0xcc,0x01,0x05,0x0e,0x00] 359 360v_fma_mixlo_f16 v5, v255, v255, s105 361// GFX12: [0x05,0x00,0x21,0xcc,0xff,0xff,0xa7,0x01] 362 363v_fma_mixlo_f16 v5, s1, s2, v3 364// GFX12: [0x05,0x00,0x21,0xcc,0x01,0x04,0x0c,0x04] 365 366v_fma_mixlo_f16 v5, s105, s105, m0 367// GFX12: [0x05,0x00,0x21,0xcc,0x69,0xd2,0xf4,0x01] 368 369v_fma_mixlo_f16 v5, vcc_lo, ttmp15, ttmp15 370// GFX12: [0x05,0x00,0x21,0xcc,0x6a,0xf6,0xec,0x01] 371 372v_fma_mixlo_f16 v5, vcc_hi, src_scc, v255 373// GFX12: [0x05,0x00,0x21,0xcc,0x6b,0xfa,0xfd,0x07] 374 375v_fma_mixlo_f16 v5, |ttmp15|, 0.5, -vcc_hi 376// GFX12: [0x05,0x01,0x21,0xcc,0x7b,0xe0,0xad,0x81] 377 378v_fma_mixlo_f16 v5, -m0, -1, |vcc_lo| 379// GFX12: [0x05,0x04,0x21,0xcc,0x7d,0x82,0xa9,0x21] 380 381v_fma_mixlo_f16 v5, -|exec_lo|, null, -|src_scc| 382// GFX12: [0x05,0x05,0x21,0xcc,0x7e,0xf8,0xf4,0xa3] 383 384v_fma_mixlo_f16 v5, -|exec_hi|, -|exec_lo|, -|exec_lo| op_sel:[1,1,1] op_sel_hi:[1,1,1] 385// GFX12: [0x05,0x7f,0x21,0xcc,0x7f,0xfc,0xf8,0xf9] 386 387v_fma_mixlo_f16 v5, null, exec_hi, 0.5 op_sel:[0,0,0] 
op_sel_hi:[0,0,1] 388// GFX12: [0x05,0x40,0x21,0xcc,0x7c,0xfe,0xc0,0x03] 389 390v_fma_mixlo_f16 v5, -1, -|m0|, -1 op_sel:[1,0,0] op_sel_hi:[0,1,0] 391// GFX12: [0x05,0x0a,0x21,0xcc,0xc1,0xfa,0x04,0x53] 392 393v_fma_mixlo_f16 v5, 0.5, -|vcc_lo|, -|exec_hi| op_sel:[0,1,0] op_sel_hi:[1,0,0] 394// GFX12: [0x05,0x16,0x21,0xcc,0xf0,0xd4,0xfc,0xc9] 395 396v_fma_mixlo_f16 v255, -|src_scc|, -|vcc_hi|, null op_sel:[0,0,1] op_sel_hi:[0,0,0] clamp 397// GFX12: [0xff,0xa3,0x21,0xcc,0xfd,0xd6,0xf0,0x61] 398 399v_pk_add_f16 v5, v1, v2 400// GFX12: [0x05,0x40,0x0f,0xcc,0x01,0x05,0x02,0x18] 401 402v_pk_add_f16 v5, v255, v255 403// GFX12: [0x05,0x40,0x0f,0xcc,0xff,0xff,0x03,0x18] 404 405v_pk_add_f16 v5, s1, s2 406// GFX12: [0x05,0x40,0x0f,0xcc,0x01,0x04,0x00,0x18] 407 408v_pk_add_f16 v5, s105, s105 409// GFX12: [0x05,0x40,0x0f,0xcc,0x69,0xd2,0x00,0x18] 410 411v_pk_add_f16 v5, vcc_lo, ttmp15 412// GFX12: [0x05,0x40,0x0f,0xcc,0x6a,0xf6,0x00,0x18] 413 414v_pk_add_f16 v5, vcc_hi, 0xfe0b 415// GFX12: [0x05,0x40,0x0f,0xcc,0x6b,0xfe,0x01,0x18,0x0b,0xfe,0x00,0x00] 416 417v_pk_add_f16 v5, ttmp15, src_scc 418// GFX12: [0x05,0x40,0x0f,0xcc,0x7b,0xfa,0x01,0x18] 419 420v_pk_add_f16 v5, m0, 0.5 421// GFX12: [0x05,0x40,0x0f,0xcc,0x7d,0xe0,0x01,0x18] 422 423v_pk_add_f16 v5, exec_lo, -1 424// GFX12: [0x05,0x40,0x0f,0xcc,0x7e,0x82,0x01,0x18] 425 426v_pk_add_f16 v5, exec_hi, null 427// GFX12: [0x05,0x40,0x0f,0xcc,0x7f,0xf8,0x00,0x18] 428 429v_pk_add_f16 v5, null, exec_lo 430// GFX12: [0x05,0x40,0x0f,0xcc,0x7c,0xfc,0x00,0x18] 431 432v_pk_add_f16 v5, -1, exec_hi op_sel:[1,1] op_sel_hi:[0,0] neg_lo:[1,0] neg_hi:[1,0] 433// GFX12: [0x05,0x59,0x0f,0xcc,0xc1,0xfe,0x00,0x20] 434 435v_pk_add_f16 v5, 0.5, m0 op_sel:[0,0] op_sel_hi:[1,1] neg_lo:[0,1] neg_hi:[0,1] 436// GFX12: [0x05,0x42,0x0f,0xcc,0xf0,0xfa,0x00,0x58] 437 438v_pk_add_f16 v5, src_scc, vcc_lo op_sel:[1,0] op_sel_hi:[0,1] neg_lo:[0,0] neg_hi:[0,0] 439// GFX12: [0x05,0x48,0x0f,0xcc,0xfd,0xd4,0x00,0x10] 440 441v_pk_add_f16 v255, 0xfe0b, vcc_hi 
op_sel:[0,1] op_sel_hi:[1,0] neg_lo:[1,1] neg_hi:[1,1] clamp 442// GFX12: [0xff,0xd3,0x0f,0xcc,0xff,0xd6,0x00,0x68,0x0b,0xfe,0x00,0x00] 443 444v_pk_add_i16 v5, v1, v2 445// GFX12: [0x05,0x40,0x02,0xcc,0x01,0x05,0x02,0x18] 446 447v_pk_add_i16 v5, v255, v255 448// GFX12: [0x05,0x40,0x02,0xcc,0xff,0xff,0x03,0x18] 449 450v_pk_add_i16 v5, s1, s2 451// GFX12: [0x05,0x40,0x02,0xcc,0x01,0x04,0x00,0x18] 452 453v_pk_add_i16 v5, s105, s105 454// GFX12: [0x05,0x40,0x02,0xcc,0x69,0xd2,0x00,0x18] 455 456v_pk_add_i16 v5, vcc_lo, ttmp15 457// GFX12: [0x05,0x40,0x02,0xcc,0x6a,0xf6,0x00,0x18] 458 459v_pk_add_i16 v5, vcc_hi, 0xfe0b 460// GFX12: [0x05,0x40,0x02,0xcc,0x6b,0xfe,0x01,0x18,0x0b,0xfe,0x00,0x00] 461 462v_pk_add_i16 v5, ttmp15, src_scc 463// GFX12: [0x05,0x40,0x02,0xcc,0x7b,0xfa,0x01,0x18] 464 465v_pk_add_i16 v5, m0, 0.5 466// GFX12: [0x05,0x40,0x02,0xcc,0x7d,0xe0,0x01,0x18] 467 468v_pk_add_i16 v5, exec_lo, -1 469// GFX12: [0x05,0x40,0x02,0xcc,0x7e,0x82,0x01,0x18] 470 471v_pk_add_i16 v5, exec_hi, null 472// GFX12: [0x05,0x40,0x02,0xcc,0x7f,0xf8,0x00,0x18] 473 474v_pk_add_i16 v5, null, exec_lo 475// GFX12: [0x05,0x40,0x02,0xcc,0x7c,0xfc,0x00,0x18] 476 477v_pk_add_i16 v5, -1, exec_hi op_sel:[1,1] op_sel_hi:[0,0] 478// GFX12: [0x05,0x58,0x02,0xcc,0xc1,0xfe,0x00,0x00] 479 480v_pk_add_i16 v5, 0.5, m0 op_sel:[0,0] op_sel_hi:[1,1] 481// GFX12: [0x05,0x40,0x02,0xcc,0xf0,0xfa,0x00,0x18] 482 483v_pk_add_i16 v5, src_scc, vcc_lo op_sel:[1,0] op_sel_hi:[0,1] 484// GFX12: [0x05,0x48,0x02,0xcc,0xfd,0xd4,0x00,0x10] 485 486v_pk_add_i16 v255, 0xfe0b, vcc_hi op_sel:[0,1] op_sel_hi:[1,0] clamp 487// GFX12: [0xff,0xd0,0x02,0xcc,0xff,0xd6,0x00,0x08,0x0b,0xfe,0x00,0x00] 488 489v_pk_add_u16 v5, v1, v2 490// GFX12: [0x05,0x40,0x0a,0xcc,0x01,0x05,0x02,0x18] 491 492v_pk_add_u16 v5, v255, v255 493// GFX12: [0x05,0x40,0x0a,0xcc,0xff,0xff,0x03,0x18] 494 495v_pk_add_u16 v5, s1, s2 496// GFX12: [0x05,0x40,0x0a,0xcc,0x01,0x04,0x00,0x18] 497 498v_pk_add_u16 v5, s105, s105 499// GFX12: 
[0x05,0x40,0x0a,0xcc,0x69,0xd2,0x00,0x18] 500 501v_pk_add_u16 v5, vcc_lo, ttmp15 502// GFX12: [0x05,0x40,0x0a,0xcc,0x6a,0xf6,0x00,0x18] 503 504v_pk_add_u16 v5, vcc_hi, 0xfe0b 505// GFX12: [0x05,0x40,0x0a,0xcc,0x6b,0xfe,0x01,0x18,0x0b,0xfe,0x00,0x00] 506 507v_pk_add_u16 v5, ttmp15, src_scc 508// GFX12: [0x05,0x40,0x0a,0xcc,0x7b,0xfa,0x01,0x18] 509 510v_pk_add_u16 v5, m0, 0.5 511// GFX12: [0x05,0x40,0x0a,0xcc,0x7d,0xe0,0x01,0x18] 512 513v_pk_add_u16 v5, exec_lo, -1 514// GFX12: [0x05,0x40,0x0a,0xcc,0x7e,0x82,0x01,0x18] 515 516v_pk_add_u16 v5, exec_hi, null 517// GFX12: [0x05,0x40,0x0a,0xcc,0x7f,0xf8,0x00,0x18] 518 519v_pk_add_u16 v5, null, exec_lo 520// GFX12: [0x05,0x40,0x0a,0xcc,0x7c,0xfc,0x00,0x18] 521 522v_pk_add_u16 v5, -1, exec_hi op_sel:[1,1] op_sel_hi:[0,0] 523// GFX12: [0x05,0x58,0x0a,0xcc,0xc1,0xfe,0x00,0x00] 524 525v_pk_add_u16 v5, 0.5, m0 op_sel:[0,0] op_sel_hi:[1,1] 526// GFX12: [0x05,0x40,0x0a,0xcc,0xf0,0xfa,0x00,0x18] 527 528v_pk_add_u16 v5, src_scc, vcc_lo op_sel:[1,0] op_sel_hi:[0,1] 529// GFX12: [0x05,0x48,0x0a,0xcc,0xfd,0xd4,0x00,0x10] 530 531v_pk_add_u16 v255, 0xfe0b, vcc_hi op_sel:[0,1] op_sel_hi:[1,0] clamp 532// GFX12: [0xff,0xd0,0x0a,0xcc,0xff,0xd6,0x00,0x08,0x0b,0xfe,0x00,0x00] 533 534v_pk_ashrrev_i16 v5, v1, v2 535// GFX12: [0x05,0x40,0x06,0xcc,0x01,0x05,0x02,0x18] 536 537v_pk_ashrrev_i16 v5, v255, v255 538// GFX12: [0x05,0x40,0x06,0xcc,0xff,0xff,0x03,0x18] 539 540v_pk_ashrrev_i16 v5, s1, s2 541// GFX12: [0x05,0x40,0x06,0xcc,0x01,0x04,0x00,0x18] 542 543v_pk_ashrrev_i16 v5, s105, s105 544// GFX12: [0x05,0x40,0x06,0xcc,0x69,0xd2,0x00,0x18] 545 546v_pk_ashrrev_i16 v5, vcc_lo, ttmp15 547// GFX12: [0x05,0x40,0x06,0xcc,0x6a,0xf6,0x00,0x18] 548 549v_pk_ashrrev_i16 v5, vcc_hi, 0xfe0b 550// GFX12: [0x05,0x40,0x06,0xcc,0x6b,0xfe,0x01,0x18,0x0b,0xfe,0x00,0x00] 551 552v_pk_ashrrev_i16 v5, ttmp15, src_scc 553// GFX12: [0x05,0x40,0x06,0xcc,0x7b,0xfa,0x01,0x18] 554 555v_pk_ashrrev_i16 v5, m0, 0.5 556// GFX12: [0x05,0x40,0x06,0xcc,0x7d,0xe0,0x01,0x18] 557 
558v_pk_ashrrev_i16 v5, exec_lo, -1 559// GFX12: [0x05,0x40,0x06,0xcc,0x7e,0x82,0x01,0x18] 560 561v_pk_ashrrev_i16 v5, exec_hi, null 562// GFX12: [0x05,0x40,0x06,0xcc,0x7f,0xf8,0x00,0x18] 563 564v_pk_ashrrev_i16 v5, null, exec_lo 565// GFX12: [0x05,0x40,0x06,0xcc,0x7c,0xfc,0x00,0x18] 566 567v_pk_ashrrev_i16 v5, -1, exec_hi op_sel:[1,1] op_sel_hi:[0,0] 568// GFX12: [0x05,0x58,0x06,0xcc,0xc1,0xfe,0x00,0x00] 569 570v_pk_ashrrev_i16 v5, 0.5, m0 op_sel:[0,0] op_sel_hi:[1,1] 571// GFX12: [0x05,0x40,0x06,0xcc,0xf0,0xfa,0x00,0x18] 572 573v_pk_ashrrev_i16 v5, src_scc, vcc_lo op_sel:[1,0] op_sel_hi:[0,1] 574// GFX12: [0x05,0x48,0x06,0xcc,0xfd,0xd4,0x00,0x10] 575 576v_pk_ashrrev_i16 v255, 0xfe0b, vcc_hi op_sel:[0,1] op_sel_hi:[1,0] 577// GFX12: [0xff,0x50,0x06,0xcc,0xff,0xd6,0x00,0x08,0x0b,0xfe,0x00,0x00] 578 579v_pk_fma_f16 v5, v1, v2, s3 580// GFX12: [0x05,0x40,0x0e,0xcc,0x01,0x05,0x0e,0x18] 581 582v_pk_fma_f16 v5, v255, s2, s105 583// GFX12: [0x05,0x40,0x0e,0xcc,0xff,0x05,0xa4,0x19] 584 585v_pk_fma_f16 v5, s1, v255, exec_hi 586// GFX12: [0x05,0x40,0x0e,0xcc,0x01,0xfe,0xff,0x19] 587 588v_pk_fma_f16 v5, s105, s105, exec_lo 589// GFX12: [0x05,0x40,0x0e,0xcc,0x69,0xd2,0xf8,0x19] 590 591v_pk_fma_f16 v5, vcc_lo, ttmp15, v3 592// GFX12: [0x05,0x40,0x0e,0xcc,0x6a,0xf6,0x0c,0x1c] 593 594v_pk_fma_f16 v5, vcc_hi, 0xfe0b, v255 595// GFX12: [0x05,0x40,0x0e,0xcc,0x6b,0xfe,0xfd,0x1f,0x0b,0xfe,0x00,0x00] 596 597v_pk_fma_f16 v5, ttmp15, src_scc, ttmp15 598// GFX12: [0x05,0x40,0x0e,0xcc,0x7b,0xfa,0xed,0x19] 599 600v_pk_fma_f16 v5, m0, 0.5, m0 op_sel_hi:[0,0,0] 601// GFX12: [0x05,0x00,0x0e,0xcc,0x7d,0xe0,0xf5,0x01] 602 603v_pk_fma_f16 v5, exec_lo, -1, vcc_hi op_sel_hi:[0,0,1] 604// GFX12: [0x05,0x40,0x0e,0xcc,0x7e,0x82,0xad,0x01] 605 606v_pk_fma_f16 v5, exec_hi, null, vcc_lo op_sel_hi:[0,1,0] 607// GFX12: [0x05,0x00,0x0e,0xcc,0x7f,0xf8,0xa8,0x11] 608 609v_pk_fma_f16 v5, null, exec_lo, 0xfe0b op_sel:[1,1,1] op_sel_hi:[1,0,0] neg_lo:[1,0,0] neg_hi:[1,0,0] 610// GFX12: 
[0x05,0x39,0x0e,0xcc,0x7c,0xfc,0xfc,0x2b,0x0b,0xfe,0x00,0x00] 611 612v_pk_fma_f16 v5, -1, exec_hi, src_scc op_sel:[0,0,0] op_sel_hi:[1,1,1] neg_lo:[0,1,0] neg_hi:[0,1,0] 613// GFX12: [0x05,0x42,0x0e,0xcc,0xc1,0xfe,0xf4,0x5b] 614 615v_pk_fma_f16 v5, 0.5, m0, 0.5 op_sel:[1,0,0] op_sel_hi:[0,1,1] neg_lo:[0,0,1] neg_hi:[0,0,1] 616// GFX12: [0x05,0x4c,0x0e,0xcc,0xf0,0xfa,0xc0,0x93] 617 618v_pk_fma_f16 v5, src_scc, vcc_lo, -1 op_sel:[0,1,0] op_sel_hi:[1,0,1] neg_lo:[0,0,0] neg_hi:[0,0,0] 619// GFX12: [0x05,0x50,0x0e,0xcc,0xfd,0xd4,0x04,0x0b] 620 621v_pk_fma_f16 v255, 0xfe0b, vcc_hi, null op_sel:[0,0,1] op_sel_hi:[1,1,0] neg_lo:[1,1,1] neg_hi:[1,1,1] clamp 622// GFX12: [0xff,0xa7,0x0e,0xcc,0xff,0xd6,0xf0,0xf9,0x0b,0xfe,0x00,0x00] 623 624v_pk_lshlrev_b16 v5, v1, v2 625// GFX12: [0x05,0x40,0x04,0xcc,0x01,0x05,0x02,0x18] 626 627v_pk_lshlrev_b16 v5, v255, v255 628// GFX12: [0x05,0x40,0x04,0xcc,0xff,0xff,0x03,0x18] 629 630v_pk_lshlrev_b16 v5, s1, s2 631// GFX12: [0x05,0x40,0x04,0xcc,0x01,0x04,0x00,0x18] 632 633v_pk_lshlrev_b16 v5, s105, s105 634// GFX12: [0x05,0x40,0x04,0xcc,0x69,0xd2,0x00,0x18] 635 636v_pk_lshlrev_b16 v5, vcc_lo, ttmp15 637// GFX12: [0x05,0x40,0x04,0xcc,0x6a,0xf6,0x00,0x18] 638 639v_pk_lshlrev_b16 v5, vcc_hi, 0xfe0b 640// GFX12: [0x05,0x40,0x04,0xcc,0x6b,0xfe,0x01,0x18,0x0b,0xfe,0x00,0x00] 641 642v_pk_lshlrev_b16 v5, ttmp15, src_scc 643// GFX12: [0x05,0x40,0x04,0xcc,0x7b,0xfa,0x01,0x18] 644 645v_pk_lshlrev_b16 v5, m0, 0.5 646// GFX12: [0x05,0x40,0x04,0xcc,0x7d,0xe0,0x01,0x18] 647 648v_pk_lshlrev_b16 v5, exec_lo, -1 649// GFX12: [0x05,0x40,0x04,0xcc,0x7e,0x82,0x01,0x18] 650 651v_pk_lshlrev_b16 v5, exec_hi, null 652// GFX12: [0x05,0x40,0x04,0xcc,0x7f,0xf8,0x00,0x18] 653 654v_pk_lshlrev_b16 v5, null, exec_lo 655// GFX12: [0x05,0x40,0x04,0xcc,0x7c,0xfc,0x00,0x18] 656 657v_pk_lshlrev_b16 v5, -1, exec_hi op_sel:[1,1] op_sel_hi:[0,0] 658// GFX12: [0x05,0x58,0x04,0xcc,0xc1,0xfe,0x00,0x00] 659 660v_pk_lshlrev_b16 v5, 0.5, m0 op_sel:[0,0] op_sel_hi:[1,1] 661// GFX12: 
[0x05,0x40,0x04,0xcc,0xf0,0xfa,0x00,0x18] 662 663v_pk_lshlrev_b16 v5, 0x3800, m0 op_sel:[0,0] op_sel_hi:[1,1] 664// GFX12: [0x05,0x40,0x04,0xcc,0xff,0xfa,0x00,0x18,0x00,0x38,0x00,0x00] 665 666v_pk_lshlrev_b16 v5, src_scc, vcc_lo op_sel:[1,0] op_sel_hi:[0,1] 667// GFX12: [0x05,0x48,0x04,0xcc,0xfd,0xd4,0x00,0x10] 668 669v_pk_lshlrev_b16 v255, 0xfe0b, vcc_hi op_sel:[0,1] op_sel_hi:[1,0] 670// GFX12: [0xff,0x50,0x04,0xcc,0xff,0xd6,0x00,0x08,0x0b,0xfe,0x00,0x00] 671 672v_pk_lshrrev_b16 v5, v1, v2 673// GFX12: [0x05,0x40,0x05,0xcc,0x01,0x05,0x02,0x18] 674 675v_pk_lshrrev_b16 v5, v255, v255 676// GFX12: [0x05,0x40,0x05,0xcc,0xff,0xff,0x03,0x18] 677 678v_pk_lshrrev_b16 v5, s1, s2 679// GFX12: [0x05,0x40,0x05,0xcc,0x01,0x04,0x00,0x18] 680 681v_pk_lshrrev_b16 v5, s105, s105 682// GFX12: [0x05,0x40,0x05,0xcc,0x69,0xd2,0x00,0x18] 683 684v_pk_lshrrev_b16 v5, vcc_lo, ttmp15 685// GFX12: [0x05,0x40,0x05,0xcc,0x6a,0xf6,0x00,0x18] 686 687v_pk_lshrrev_b16 v5, vcc_hi, 0xfe0b 688// GFX12: [0x05,0x40,0x05,0xcc,0x6b,0xfe,0x01,0x18,0x0b,0xfe,0x00,0x00] 689 690v_pk_lshrrev_b16 v5, ttmp15, src_scc 691// GFX12: [0x05,0x40,0x05,0xcc,0x7b,0xfa,0x01,0x18] 692 693v_pk_lshrrev_b16 v5, m0, 0.5 694// GFX12: [0x05,0x40,0x05,0xcc,0x7d,0xe0,0x01,0x18] 695 696v_pk_lshrrev_b16 v5, exec_lo, -1 697// GFX12: [0x05,0x40,0x05,0xcc,0x7e,0x82,0x01,0x18] 698 699v_pk_lshrrev_b16 v5, exec_hi, null 700// GFX12: [0x05,0x40,0x05,0xcc,0x7f,0xf8,0x00,0x18] 701 702v_pk_lshrrev_b16 v5, null, exec_lo 703// GFX12: [0x05,0x40,0x05,0xcc,0x7c,0xfc,0x00,0x18] 704 705v_pk_lshrrev_b16 v5, -1, exec_hi op_sel:[1,1] op_sel_hi:[0,0] 706// GFX12: [0x05,0x58,0x05,0xcc,0xc1,0xfe,0x00,0x00] 707 708v_pk_lshrrev_b16 v5, 0.5, m0 op_sel:[0,0] op_sel_hi:[1,1] 709// GFX12: [0x05,0x40,0x05,0xcc,0xf0,0xfa,0x00,0x18] 710 711v_pk_lshrrev_b16 v5, src_scc, vcc_lo op_sel:[1,0] op_sel_hi:[0,1] 712// GFX12: [0x05,0x48,0x05,0xcc,0xfd,0xd4,0x00,0x10] 713 714v_pk_lshrrev_b16 v255, 0xfe0b, vcc_hi op_sel:[0,1] op_sel_hi:[1,0] 715// GFX12: 
[0xff,0x50,0x05,0xcc,0xff,0xd6,0x00,0x08,0x0b,0xfe,0x00,0x00] 716 717v_pk_mad_i16 v5, v1, v2, s3 718// GFX12: [0x05,0x40,0x00,0xcc,0x01,0x05,0x0e,0x18] 719 720v_pk_mad_i16 v5, v255, s2, s105 721// GFX12: [0x05,0x40,0x00,0xcc,0xff,0x05,0xa4,0x19] 722 723v_pk_mad_i16 v5, s1, v255, exec_hi 724// GFX12: [0x05,0x40,0x00,0xcc,0x01,0xfe,0xff,0x19] 725 726v_pk_mad_i16 v5, s105, s105, exec_lo 727// GFX12: [0x05,0x40,0x00,0xcc,0x69,0xd2,0xf8,0x19] 728 729v_pk_mad_i16 v5, vcc_lo, ttmp15, v3 730// GFX12: [0x05,0x40,0x00,0xcc,0x6a,0xf6,0x0c,0x1c] 731 732v_pk_mad_i16 v5, vcc_hi, 0xfe0b, v255 733// GFX12: [0x05,0x40,0x00,0xcc,0x6b,0xfe,0xfd,0x1f,0x0b,0xfe,0x00,0x00] 734 735v_pk_mad_i16 v5, ttmp15, src_scc, ttmp15 736// GFX12: [0x05,0x40,0x00,0xcc,0x7b,0xfa,0xed,0x19] 737 738v_pk_mad_i16 v5, m0, 0.5, m0 op_sel_hi:[0,0,0] 739// GFX12: [0x05,0x00,0x00,0xcc,0x7d,0xe0,0xf5,0x01] 740 741v_pk_mad_i16 v5, exec_lo, -1, vcc_hi op_sel_hi:[0,0,1] 742// GFX12: [0x05,0x40,0x00,0xcc,0x7e,0x82,0xad,0x01] 743 744v_pk_mad_i16 v5, exec_hi, null, vcc_lo op_sel_hi:[0,1,0] 745// GFX12: [0x05,0x00,0x00,0xcc,0x7f,0xf8,0xa8,0x11] 746 747v_pk_mad_i16 v5, null, exec_lo, 0xfe0b op_sel:[1,1,1] op_sel_hi:[1,0,0] 748// GFX12: [0x05,0x38,0x00,0xcc,0x7c,0xfc,0xfc,0x0b,0x0b,0xfe,0x00,0x00] 749 750v_pk_mad_i16 v5, -1, exec_hi, src_scc op_sel:[0,0,0] op_sel_hi:[1,1,1] 751// GFX12: [0x05,0x40,0x00,0xcc,0xc1,0xfe,0xf4,0x1b] 752 753v_pk_mad_i16 v5, 0.5, m0, 0.5 op_sel:[1,0,0] op_sel_hi:[0,1,1] 754// GFX12: [0x05,0x48,0x00,0xcc,0xf0,0xfa,0xc0,0x13] 755 756v_pk_mad_i16 v5, src_scc, vcc_lo, -1 op_sel:[0,1,0] op_sel_hi:[1,0,1] 757// GFX12: [0x05,0x50,0x00,0xcc,0xfd,0xd4,0x04,0x0b] 758 759v_pk_mad_i16 v255, 0xfe0b, vcc_hi, null op_sel:[0,0,1] op_sel_hi:[1,1,0] clamp 760// GFX12: [0xff,0xa0,0x00,0xcc,0xff,0xd6,0xf0,0x19,0x0b,0xfe,0x00,0x00] 761 762v_pk_mad_u16 v5, v1, v2, s3 763// GFX12: [0x05,0x40,0x09,0xcc,0x01,0x05,0x0e,0x18] 764 765v_pk_mad_u16 v5, v255, s2, s105 766// GFX12: [0x05,0x40,0x09,0xcc,0xff,0x05,0xa4,0x19] 
767 768v_pk_mad_u16 v5, s1, v255, exec_hi 769// GFX12: [0x05,0x40,0x09,0xcc,0x01,0xfe,0xff,0x19] 770 771v_pk_mad_u16 v5, s105, s105, exec_lo 772// GFX12: [0x05,0x40,0x09,0xcc,0x69,0xd2,0xf8,0x19] 773 774v_pk_mad_u16 v5, vcc_lo, ttmp15, v3 775// GFX12: [0x05,0x40,0x09,0xcc,0x6a,0xf6,0x0c,0x1c] 776 777v_pk_mad_u16 v5, vcc_hi, 0xfe0b, v255 778// GFX12: [0x05,0x40,0x09,0xcc,0x6b,0xfe,0xfd,0x1f,0x0b,0xfe,0x00,0x00] 779 780v_pk_mad_u16 v5, ttmp15, src_scc, ttmp15 781// GFX12: [0x05,0x40,0x09,0xcc,0x7b,0xfa,0xed,0x19] 782 783v_pk_mad_u16 v5, m0, 0.5, m0 op_sel_hi:[0,0,0] 784// GFX12: [0x05,0x00,0x09,0xcc,0x7d,0xe0,0xf5,0x01] 785 786v_pk_mad_u16 v5, exec_lo, -1, vcc_hi op_sel_hi:[0,0,1] 787// GFX12: [0x05,0x40,0x09,0xcc,0x7e,0x82,0xad,0x01] 788 789v_pk_mad_u16 v5, exec_hi, null, vcc_lo op_sel_hi:[0,1,0] 790// GFX12: [0x05,0x00,0x09,0xcc,0x7f,0xf8,0xa8,0x11] 791 792v_pk_mad_u16 v5, null, exec_lo, 0xfe0b op_sel:[1,1,1] op_sel_hi:[1,0,0] 793// GFX12: [0x05,0x38,0x09,0xcc,0x7c,0xfc,0xfc,0x0b,0x0b,0xfe,0x00,0x00] 794 795v_pk_mad_u16 v5, -1, exec_hi, src_scc op_sel:[0,0,0] op_sel_hi:[1,1,1] 796// GFX12: [0x05,0x40,0x09,0xcc,0xc1,0xfe,0xf4,0x1b] 797 798v_pk_mad_u16 v5, 0.5, m0, 0.5 op_sel:[1,0,0] op_sel_hi:[0,1,1] 799// GFX12: [0x05,0x48,0x09,0xcc,0xf0,0xfa,0xc0,0x13] 800 801v_pk_mad_u16 v5, src_scc, vcc_lo, -1 op_sel:[0,1,0] op_sel_hi:[1,0,1] 802// GFX12: [0x05,0x50,0x09,0xcc,0xfd,0xd4,0x04,0x0b] 803 804v_pk_mad_u16 v255, 0xfe0b, vcc_hi, null op_sel:[0,0,1] op_sel_hi:[1,1,0] clamp 805// GFX12: [0xff,0xa0,0x09,0xcc,0xff,0xd6,0xf0,0x19,0x0b,0xfe,0x00,0x00] 806 807v_pk_max_num_f16 v5, v1, v2 808// GFX12: [0x05,0x40,0x1c,0xcc,0x01,0x05,0x02,0x18] 809 810v_pk_max_num_f16 v5, v255, v255 811// GFX12: [0x05,0x40,0x1c,0xcc,0xff,0xff,0x03,0x18] 812 813v_pk_max_num_f16 v5, s1, s2 814// GFX12: [0x05,0x40,0x1c,0xcc,0x01,0x04,0x00,0x18] 815 816v_pk_max_num_f16 v5, s105, s105 817// GFX12: [0x05,0x40,0x1c,0xcc,0x69,0xd2,0x00,0x18] 818 819v_pk_max_num_f16 v5, vcc_lo, ttmp15 820// GFX12: 
[0x05,0x40,0x1c,0xcc,0x6a,0xf6,0x00,0x18] 821 822v_pk_max_num_f16 v5, vcc_hi, 0xfe0b 823// GFX12: [0x05,0x40,0x1c,0xcc,0x6b,0xfe,0x01,0x18,0x0b,0xfe,0x00,0x00] 824 825v_pk_max_num_f16 v5, ttmp15, src_scc 826// GFX12: [0x05,0x40,0x1c,0xcc,0x7b,0xfa,0x01,0x18] 827 828v_pk_max_num_f16 v5, m0, 0.5 829// GFX12: [0x05,0x40,0x1c,0xcc,0x7d,0xe0,0x01,0x18] 830 831v_pk_max_num_f16 v5, exec_lo, -1 832// GFX12: [0x05,0x40,0x1c,0xcc,0x7e,0x82,0x01,0x18] 833 834v_pk_max_num_f16 v5, exec_hi, null 835// GFX12: [0x05,0x40,0x1c,0xcc,0x7f,0xf8,0x00,0x18] 836 837v_pk_max_num_f16 v5, null, exec_lo 838// GFX12: [0x05,0x40,0x1c,0xcc,0x7c,0xfc,0x00,0x18] 839 840v_pk_max_num_f16 v5, -1, exec_hi op_sel:[1,1] op_sel_hi:[0,0] neg_lo:[1,0] neg_hi:[1,0] 841// GFX12: [0x05,0x59,0x1c,0xcc,0xc1,0xfe,0x00,0x20] 842 843v_pk_max_num_f16 v5, 0.5, m0 op_sel:[0,0] op_sel_hi:[1,1] neg_lo:[0,1] neg_hi:[0,1] 844// GFX12: [0x05,0x42,0x1c,0xcc,0xf0,0xfa,0x00,0x58] 845 846v_pk_max_num_f16 v5, src_scc, vcc_lo op_sel:[1,0] op_sel_hi:[0,1] neg_lo:[0,0] neg_hi:[0,0] 847// GFX12: [0x05,0x48,0x1c,0xcc,0xfd,0xd4,0x00,0x10] 848 849v_pk_max_num_f16 v255, 0xfe0b, vcc_hi op_sel:[0,1] op_sel_hi:[1,0] neg_lo:[1,1] neg_hi:[1,1] clamp 850// GFX12: [0xff,0xd3,0x1c,0xcc,0xff,0xd6,0x00,0x68,0x0b,0xfe,0x00,0x00] 851 852v_pk_max_i16 v5, v1, v2 853// GFX12: [0x05,0x40,0x07,0xcc,0x01,0x05,0x02,0x18] 854 855v_pk_max_i16 v5, v255, v255 856// GFX12: [0x05,0x40,0x07,0xcc,0xff,0xff,0x03,0x18] 857 858v_pk_max_i16 v5, s1, s2 859// GFX12: [0x05,0x40,0x07,0xcc,0x01,0x04,0x00,0x18] 860 861v_pk_max_i16 v5, s105, s105 862// GFX12: [0x05,0x40,0x07,0xcc,0x69,0xd2,0x00,0x18] 863 864v_pk_max_i16 v5, vcc_lo, ttmp15 865// GFX12: [0x05,0x40,0x07,0xcc,0x6a,0xf6,0x00,0x18] 866 867v_pk_max_i16 v5, vcc_hi, 0xfe0b 868// GFX12: [0x05,0x40,0x07,0xcc,0x6b,0xfe,0x01,0x18,0x0b,0xfe,0x00,0x00] 869 870v_pk_max_i16 v5, ttmp15, src_scc 871// GFX12: [0x05,0x40,0x07,0xcc,0x7b,0xfa,0x01,0x18] 872 873v_pk_max_i16 v5, m0, 0.5 874// GFX12: 
[0x05,0x40,0x07,0xcc,0x7d,0xe0,0x01,0x18] 875 876v_pk_max_i16 v5, exec_lo, -1 877// GFX12: [0x05,0x40,0x07,0xcc,0x7e,0x82,0x01,0x18] 878 879v_pk_max_i16 v5, exec_hi, null 880// GFX12: [0x05,0x40,0x07,0xcc,0x7f,0xf8,0x00,0x18] 881 882v_pk_max_i16 v5, null, exec_lo 883// GFX12: [0x05,0x40,0x07,0xcc,0x7c,0xfc,0x00,0x18] 884 885v_pk_max_i16 v5, -1, exec_hi op_sel:[1,1] op_sel_hi:[0,0] 886// GFX12: [0x05,0x58,0x07,0xcc,0xc1,0xfe,0x00,0x00] 887 888v_pk_max_i16 v5, 0.5, m0 op_sel:[0,0] op_sel_hi:[1,1] 889// GFX12: [0x05,0x40,0x07,0xcc,0xf0,0xfa,0x00,0x18] 890 891v_pk_max_i16 v5, src_scc, vcc_lo op_sel:[1,0] op_sel_hi:[0,1] 892// GFX12: [0x05,0x48,0x07,0xcc,0xfd,0xd4,0x00,0x10] 893 894v_pk_max_i16 v255, 0xfe0b, vcc_hi op_sel:[0,1] op_sel_hi:[1,0] 895// GFX12: [0xff,0x50,0x07,0xcc,0xff,0xd6,0x00,0x08,0x0b,0xfe,0x00,0x00] 896 897v_pk_max_u16 v5, v1, v2 898// GFX12: [0x05,0x40,0x0c,0xcc,0x01,0x05,0x02,0x18] 899 900v_pk_max_u16 v5, v255, v255 901// GFX12: [0x05,0x40,0x0c,0xcc,0xff,0xff,0x03,0x18] 902 903v_pk_max_u16 v5, s1, s2 904// GFX12: [0x05,0x40,0x0c,0xcc,0x01,0x04,0x00,0x18] 905 906v_pk_max_u16 v5, s105, s105 907// GFX12: [0x05,0x40,0x0c,0xcc,0x69,0xd2,0x00,0x18] 908 909v_pk_max_u16 v5, vcc_lo, ttmp15 910// GFX12: [0x05,0x40,0x0c,0xcc,0x6a,0xf6,0x00,0x18] 911 912v_pk_max_u16 v5, vcc_hi, 0xfe0b 913// GFX12: [0x05,0x40,0x0c,0xcc,0x6b,0xfe,0x01,0x18,0x0b,0xfe,0x00,0x00] 914 915v_pk_max_u16 v5, ttmp15, src_scc 916// GFX12: [0x05,0x40,0x0c,0xcc,0x7b,0xfa,0x01,0x18] 917 918v_pk_max_u16 v5, m0, 0.5 919// GFX12: [0x05,0x40,0x0c,0xcc,0x7d,0xe0,0x01,0x18] 920 921v_pk_max_u16 v5, exec_lo, -1 922// GFX12: [0x05,0x40,0x0c,0xcc,0x7e,0x82,0x01,0x18] 923 924v_pk_max_u16 v5, exec_hi, null 925// GFX12: [0x05,0x40,0x0c,0xcc,0x7f,0xf8,0x00,0x18] 926 927v_pk_max_u16 v5, null, exec_lo 928// GFX12: [0x05,0x40,0x0c,0xcc,0x7c,0xfc,0x00,0x18] 929 930v_pk_max_u16 v5, -1, exec_hi op_sel:[1,1] op_sel_hi:[0,0] 931// GFX12: [0x05,0x58,0x0c,0xcc,0xc1,0xfe,0x00,0x00] 932 933v_pk_max_u16 v5, 0.5, m0 
op_sel:[0,0] op_sel_hi:[1,1] 934// GFX12: [0x05,0x40,0x0c,0xcc,0xf0,0xfa,0x00,0x18] 935 936v_pk_max_u16 v5, src_scc, vcc_lo op_sel:[1,0] op_sel_hi:[0,1] 937// GFX12: [0x05,0x48,0x0c,0xcc,0xfd,0xd4,0x00,0x10] 938 939v_pk_max_u16 v255, 0xfe0b, vcc_hi op_sel:[0,1] op_sel_hi:[1,0] 940// GFX12: [0xff,0x50,0x0c,0xcc,0xff,0xd6,0x00,0x08,0x0b,0xfe,0x00,0x00] 941 942v_pk_min_num_f16 v5, v1, v2 943// GFX12: [0x05,0x40,0x1b,0xcc,0x01,0x05,0x02,0x18] 944 945v_pk_min_num_f16 v5, v255, v255 946// GFX12: [0x05,0x40,0x1b,0xcc,0xff,0xff,0x03,0x18] 947 948v_pk_min_num_f16 v5, s1, s2 949// GFX12: [0x05,0x40,0x1b,0xcc,0x01,0x04,0x00,0x18] 950 951v_pk_min_num_f16 v5, s105, s105 952// GFX12: [0x05,0x40,0x1b,0xcc,0x69,0xd2,0x00,0x18] 953 954v_pk_min_num_f16 v5, vcc_lo, ttmp15 955// GFX12: [0x05,0x40,0x1b,0xcc,0x6a,0xf6,0x00,0x18] 956 957v_pk_min_num_f16 v5, vcc_hi, 0xfe0b 958// GFX12: [0x05,0x40,0x1b,0xcc,0x6b,0xfe,0x01,0x18,0x0b,0xfe,0x00,0x00] 959 960v_pk_min_num_f16 v5, ttmp15, src_scc 961// GFX12: [0x05,0x40,0x1b,0xcc,0x7b,0xfa,0x01,0x18] 962 963v_pk_min_num_f16 v5, m0, 0.5 964// GFX12: [0x05,0x40,0x1b,0xcc,0x7d,0xe0,0x01,0x18] 965 966v_pk_min_num_f16 v5, exec_lo, -1 967// GFX12: [0x05,0x40,0x1b,0xcc,0x7e,0x82,0x01,0x18] 968 969v_pk_min_num_f16 v5, exec_hi, null 970// GFX12: [0x05,0x40,0x1b,0xcc,0x7f,0xf8,0x00,0x18] 971 972v_pk_min_num_f16 v5, null, exec_lo 973// GFX12: [0x05,0x40,0x1b,0xcc,0x7c,0xfc,0x00,0x18] 974 975v_pk_min_num_f16 v5, -1, exec_hi op_sel:[1,1] op_sel_hi:[0,0] neg_lo:[1,0] neg_hi:[1,0] 976// GFX12: [0x05,0x59,0x1b,0xcc,0xc1,0xfe,0x00,0x20] 977 978v_pk_min_num_f16 v5, 0.5, m0 op_sel:[0,0] op_sel_hi:[1,1] neg_lo:[0,1] neg_hi:[0,1] 979// GFX12: [0x05,0x42,0x1b,0xcc,0xf0,0xfa,0x00,0x58] 980 981v_pk_min_num_f16 v5, src_scc, vcc_lo op_sel:[1,0] op_sel_hi:[0,1] neg_lo:[0,0] neg_hi:[0,0] 982// GFX12: [0x05,0x48,0x1b,0xcc,0xfd,0xd4,0x00,0x10] 983 984v_pk_min_num_f16 v255, 0xfe0b, vcc_hi op_sel:[0,1] op_sel_hi:[1,0] neg_lo:[1,1] neg_hi:[1,1] clamp 985// GFX12: 
[0xff,0xd3,0x1b,0xcc,0xff,0xd6,0x00,0x68,0x0b,0xfe,0x00,0x00] 986 987v_pk_min_i16 v5, v1, v2 988// GFX12: [0x05,0x40,0x08,0xcc,0x01,0x05,0x02,0x18] 989 990v_pk_min_i16 v5, v255, v255 991// GFX12: [0x05,0x40,0x08,0xcc,0xff,0xff,0x03,0x18] 992 993v_pk_min_i16 v5, s1, s2 994// GFX12: [0x05,0x40,0x08,0xcc,0x01,0x04,0x00,0x18] 995 996v_pk_min_i16 v5, s105, s105 997// GFX12: [0x05,0x40,0x08,0xcc,0x69,0xd2,0x00,0x18] 998 999v_pk_min_i16 v5, vcc_lo, ttmp15 1000// GFX12: [0x05,0x40,0x08,0xcc,0x6a,0xf6,0x00,0x18] 1001 1002v_pk_min_i16 v5, vcc_hi, 0xfe0b 1003// GFX12: [0x05,0x40,0x08,0xcc,0x6b,0xfe,0x01,0x18,0x0b,0xfe,0x00,0x00] 1004 1005v_pk_min_i16 v5, ttmp15, src_scc 1006// GFX12: [0x05,0x40,0x08,0xcc,0x7b,0xfa,0x01,0x18] 1007 1008v_pk_min_i16 v5, m0, 0.5 1009// GFX12: [0x05,0x40,0x08,0xcc,0x7d,0xe0,0x01,0x18] 1010 1011v_pk_min_i16 v5, exec_lo, -1 1012// GFX12: [0x05,0x40,0x08,0xcc,0x7e,0x82,0x01,0x18] 1013 1014v_pk_min_i16 v5, exec_hi, null 1015// GFX12: [0x05,0x40,0x08,0xcc,0x7f,0xf8,0x00,0x18] 1016 1017v_pk_min_i16 v5, null, exec_lo 1018// GFX12: [0x05,0x40,0x08,0xcc,0x7c,0xfc,0x00,0x18] 1019 1020v_pk_min_i16 v5, -1, exec_hi op_sel:[1,1] op_sel_hi:[0,0] 1021// GFX12: [0x05,0x58,0x08,0xcc,0xc1,0xfe,0x00,0x00] 1022 1023v_pk_min_i16 v5, 0.5, m0 op_sel:[0,0] op_sel_hi:[1,1] 1024// GFX12: [0x05,0x40,0x08,0xcc,0xf0,0xfa,0x00,0x18] 1025 1026v_pk_min_i16 v5, src_scc, vcc_lo op_sel:[1,0] op_sel_hi:[0,1] 1027// GFX12: [0x05,0x48,0x08,0xcc,0xfd,0xd4,0x00,0x10] 1028 1029v_pk_min_i16 v255, 0xfe0b, vcc_hi op_sel:[0,1] op_sel_hi:[1,0] 1030// GFX12: [0xff,0x50,0x08,0xcc,0xff,0xd6,0x00,0x08,0x0b,0xfe,0x00,0x00] 1031 1032v_pk_min_u16 v5, v1, v2 1033// GFX12: [0x05,0x40,0x0d,0xcc,0x01,0x05,0x02,0x18] 1034 1035v_pk_min_u16 v5, v255, v255 1036// GFX12: [0x05,0x40,0x0d,0xcc,0xff,0xff,0x03,0x18] 1037 1038v_pk_min_u16 v5, s1, s2 1039// GFX12: [0x05,0x40,0x0d,0xcc,0x01,0x04,0x00,0x18] 1040 1041v_pk_min_u16 v5, s105, s105 1042// GFX12: [0x05,0x40,0x0d,0xcc,0x69,0xd2,0x00,0x18] 1043 
1044v_pk_min_u16 v5, vcc_lo, ttmp15 1045// GFX12: [0x05,0x40,0x0d,0xcc,0x6a,0xf6,0x00,0x18] 1046 1047v_pk_min_u16 v5, vcc_hi, 0xfe0b 1048// GFX12: [0x05,0x40,0x0d,0xcc,0x6b,0xfe,0x01,0x18,0x0b,0xfe,0x00,0x00] 1049 1050v_pk_min_u16 v5, ttmp15, src_scc 1051// GFX12: [0x05,0x40,0x0d,0xcc,0x7b,0xfa,0x01,0x18] 1052 1053v_pk_min_u16 v5, m0, 0.5 1054// GFX12: [0x05,0x40,0x0d,0xcc,0x7d,0xe0,0x01,0x18] 1055 1056v_pk_min_u16 v5, exec_lo, -1 1057// GFX12: [0x05,0x40,0x0d,0xcc,0x7e,0x82,0x01,0x18] 1058 1059v_pk_min_u16 v5, exec_hi, null 1060// GFX12: [0x05,0x40,0x0d,0xcc,0x7f,0xf8,0x00,0x18] 1061 1062v_pk_min_u16 v5, null, exec_lo 1063// GFX12: [0x05,0x40,0x0d,0xcc,0x7c,0xfc,0x00,0x18] 1064 1065v_pk_min_u16 v5, -1, exec_hi op_sel:[1,1] op_sel_hi:[0,0] 1066// GFX12: [0x05,0x58,0x0d,0xcc,0xc1,0xfe,0x00,0x00] 1067 1068v_pk_min_u16 v5, 0.5, m0 op_sel:[0,0] op_sel_hi:[1,1] 1069// GFX12: [0x05,0x40,0x0d,0xcc,0xf0,0xfa,0x00,0x18] 1070 1071v_pk_min_u16 v5, src_scc, vcc_lo op_sel:[1,0] op_sel_hi:[0,1] 1072// GFX12: [0x05,0x48,0x0d,0xcc,0xfd,0xd4,0x00,0x10] 1073 1074v_pk_min_u16 v255, 0xfe0b, vcc_hi op_sel:[0,1] op_sel_hi:[1,0] 1075// GFX12: [0xff,0x50,0x0d,0xcc,0xff,0xd6,0x00,0x08,0x0b,0xfe,0x00,0x00] 1076 1077v_pk_mul_f16 v5, v1, v2 1078// GFX12: [0x05,0x40,0x10,0xcc,0x01,0x05,0x02,0x18] 1079 1080v_pk_mul_f16 v5, v255, v255 1081// GFX12: [0x05,0x40,0x10,0xcc,0xff,0xff,0x03,0x18] 1082 1083v_pk_mul_f16 v5, s1, s2 1084// GFX12: [0x05,0x40,0x10,0xcc,0x01,0x04,0x00,0x18] 1085 1086v_pk_mul_f16 v5, s105, s105 1087// GFX12: [0x05,0x40,0x10,0xcc,0x69,0xd2,0x00,0x18] 1088 1089v_pk_mul_f16 v5, vcc_lo, ttmp15 1090// GFX12: [0x05,0x40,0x10,0xcc,0x6a,0xf6,0x00,0x18] 1091 1092v_pk_mul_f16 v5, vcc_hi, 0xfe0b 1093// GFX12: [0x05,0x40,0x10,0xcc,0x6b,0xfe,0x01,0x18,0x0b,0xfe,0x00,0x00] 1094 1095v_pk_mul_f16 v5, ttmp15, src_scc 1096// GFX12: [0x05,0x40,0x10,0xcc,0x7b,0xfa,0x01,0x18] 1097 1098v_pk_mul_f16 v5, m0, 0.5 1099// GFX12: [0x05,0x40,0x10,0xcc,0x7d,0xe0,0x01,0x18] 1100 1101v_pk_mul_f16 v5, 
exec_lo, -1 1102// GFX12: [0x05,0x40,0x10,0xcc,0x7e,0x82,0x01,0x18] 1103 1104v_pk_mul_f16 v5, exec_hi, null 1105// GFX12: [0x05,0x40,0x10,0xcc,0x7f,0xf8,0x00,0x18] 1106 1107v_pk_mul_f16 v5, null, exec_lo 1108// GFX12: [0x05,0x40,0x10,0xcc,0x7c,0xfc,0x00,0x18] 1109 1110v_pk_mul_f16 v5, -1, exec_hi op_sel:[1,1] op_sel_hi:[0,0] neg_lo:[1,0] neg_hi:[1,0] 1111// GFX12: [0x05,0x59,0x10,0xcc,0xc1,0xfe,0x00,0x20] 1112 1113v_pk_mul_f16 v5, 0.5, m0 op_sel:[0,0] op_sel_hi:[1,1] neg_lo:[0,1] neg_hi:[0,1] 1114// GFX12: [0x05,0x42,0x10,0xcc,0xf0,0xfa,0x00,0x58] 1115 1116v_pk_mul_f16 v5, src_scc, vcc_lo op_sel:[1,0] op_sel_hi:[0,1] neg_lo:[0,0] neg_hi:[0,0] 1117// GFX12: [0x05,0x48,0x10,0xcc,0xfd,0xd4,0x00,0x10] 1118 1119v_pk_mul_f16 v255, 0xfe0b, vcc_hi op_sel:[0,1] op_sel_hi:[1,0] neg_lo:[1,1] neg_hi:[1,1] clamp 1120// GFX12: [0xff,0xd3,0x10,0xcc,0xff,0xd6,0x00,0x68,0x0b,0xfe,0x00,0x00] 1121 1122v_pk_mul_lo_u16 v5, v1, v2 1123// GFX12: [0x05,0x40,0x01,0xcc,0x01,0x05,0x02,0x18] 1124 1125v_pk_mul_lo_u16 v5, v255, v255 1126// GFX12: [0x05,0x40,0x01,0xcc,0xff,0xff,0x03,0x18] 1127 1128v_pk_mul_lo_u16 v5, s1, s2 1129// GFX12: [0x05,0x40,0x01,0xcc,0x01,0x04,0x00,0x18] 1130 1131v_pk_mul_lo_u16 v5, s105, s105 1132// GFX12: [0x05,0x40,0x01,0xcc,0x69,0xd2,0x00,0x18] 1133 1134v_pk_mul_lo_u16 v5, vcc_lo, ttmp15 1135// GFX12: [0x05,0x40,0x01,0xcc,0x6a,0xf6,0x00,0x18] 1136 1137v_pk_mul_lo_u16 v5, vcc_hi, 0xfe0b 1138// GFX12: [0x05,0x40,0x01,0xcc,0x6b,0xfe,0x01,0x18,0x0b,0xfe,0x00,0x00] 1139 1140v_pk_mul_lo_u16 v5, ttmp15, src_scc 1141// GFX12: [0x05,0x40,0x01,0xcc,0x7b,0xfa,0x01,0x18] 1142 1143v_pk_mul_lo_u16 v5, m0, 0.5 1144// GFX12: [0x05,0x40,0x01,0xcc,0x7d,0xe0,0x01,0x18] 1145 1146v_pk_mul_lo_u16 v5, exec_lo, -1 1147// GFX12: [0x05,0x40,0x01,0xcc,0x7e,0x82,0x01,0x18] 1148 1149v_pk_mul_lo_u16 v5, exec_hi, null 1150// GFX12: [0x05,0x40,0x01,0xcc,0x7f,0xf8,0x00,0x18] 1151 1152v_pk_mul_lo_u16 v5, null, exec_lo 1153// GFX12: [0x05,0x40,0x01,0xcc,0x7c,0xfc,0x00,0x18] 1154 1155v_pk_mul_lo_u16 
v5, -1, exec_hi op_sel:[1,1] op_sel_hi:[0,0] 1156// GFX12: [0x05,0x58,0x01,0xcc,0xc1,0xfe,0x00,0x00] 1157 1158v_pk_mul_lo_u16 v5, 0.5, m0 op_sel:[0,0] op_sel_hi:[1,1] 1159// GFX12: [0x05,0x40,0x01,0xcc,0xf0,0xfa,0x00,0x18] 1160 1161v_pk_mul_lo_u16 v5, src_scc, vcc_lo op_sel:[1,0] op_sel_hi:[0,1] 1162// GFX12: [0x05,0x48,0x01,0xcc,0xfd,0xd4,0x00,0x10] 1163 1164v_pk_mul_lo_u16 v255, 0xfe0b, vcc_hi op_sel:[0,1] op_sel_hi:[1,0] 1165// GFX12: [0xff,0x50,0x01,0xcc,0xff,0xd6,0x00,0x08,0x0b,0xfe,0x00,0x00] 1166 1167v_pk_sub_i16 v5, v1, v2 1168// GFX12: [0x05,0x40,0x03,0xcc,0x01,0x05,0x02,0x18] 1169 1170v_pk_sub_i16 v5, v255, v255 1171// GFX12: [0x05,0x40,0x03,0xcc,0xff,0xff,0x03,0x18] 1172 1173v_pk_sub_i16 v5, s1, s2 1174// GFX12: [0x05,0x40,0x03,0xcc,0x01,0x04,0x00,0x18] 1175 1176v_pk_sub_i16 v5, s105, s105 1177// GFX12: [0x05,0x40,0x03,0xcc,0x69,0xd2,0x00,0x18] 1178 1179v_pk_sub_i16 v5, vcc_lo, ttmp15 1180// GFX12: [0x05,0x40,0x03,0xcc,0x6a,0xf6,0x00,0x18] 1181 1182v_pk_sub_i16 v5, vcc_hi, 0xfe0b 1183// GFX12: [0x05,0x40,0x03,0xcc,0x6b,0xfe,0x01,0x18,0x0b,0xfe,0x00,0x00] 1184 1185v_pk_sub_i16 v5, ttmp15, src_scc 1186// GFX12: [0x05,0x40,0x03,0xcc,0x7b,0xfa,0x01,0x18] 1187 1188v_pk_sub_i16 v5, m0, 0.5 1189// GFX12: [0x05,0x40,0x03,0xcc,0x7d,0xe0,0x01,0x18] 1190 1191v_pk_sub_i16 v5, exec_lo, -1 1192// GFX12: [0x05,0x40,0x03,0xcc,0x7e,0x82,0x01,0x18] 1193 1194v_pk_sub_i16 v5, exec_hi, null 1195// GFX12: [0x05,0x40,0x03,0xcc,0x7f,0xf8,0x00,0x18] 1196 1197v_pk_sub_i16 v5, null, exec_lo 1198// GFX12: [0x05,0x40,0x03,0xcc,0x7c,0xfc,0x00,0x18] 1199 1200v_pk_sub_i16 v5, -1, exec_hi op_sel:[1,1] op_sel_hi:[0,0] 1201// GFX12: [0x05,0x58,0x03,0xcc,0xc1,0xfe,0x00,0x00] 1202 1203v_pk_sub_i16 v5, 0.5, m0 op_sel:[0,0] op_sel_hi:[1,1] 1204// GFX12: [0x05,0x40,0x03,0xcc,0xf0,0xfa,0x00,0x18] 1205 1206v_pk_sub_i16 v5, src_scc, vcc_lo op_sel:[1,0] op_sel_hi:[0,1] 1207// GFX12: [0x05,0x48,0x03,0xcc,0xfd,0xd4,0x00,0x10] 1208 1209v_pk_sub_i16 v255, 0xfe0b, vcc_hi op_sel:[0,1] op_sel_hi:[1,0] 
clamp 1210// GFX12: [0xff,0xd0,0x03,0xcc,0xff,0xd6,0x00,0x08,0x0b,0xfe,0x00,0x00] 1211 1212v_pk_sub_u16 v5, v1, v2 1213// GFX12: [0x05,0x40,0x0b,0xcc,0x01,0x05,0x02,0x18] 1214 1215v_pk_sub_u16 v5, v255, v255 1216// GFX12: [0x05,0x40,0x0b,0xcc,0xff,0xff,0x03,0x18] 1217 1218v_pk_sub_u16 v5, s1, s2 1219// GFX12: [0x05,0x40,0x0b,0xcc,0x01,0x04,0x00,0x18] 1220 1221v_pk_sub_u16 v5, s105, s105 1222// GFX12: [0x05,0x40,0x0b,0xcc,0x69,0xd2,0x00,0x18] 1223 1224v_pk_sub_u16 v5, vcc_lo, ttmp15 1225// GFX12: [0x05,0x40,0x0b,0xcc,0x6a,0xf6,0x00,0x18] 1226 1227v_pk_sub_u16 v5, vcc_hi, 0xfe0b 1228// GFX12: [0x05,0x40,0x0b,0xcc,0x6b,0xfe,0x01,0x18,0x0b,0xfe,0x00,0x00] 1229 1230v_pk_sub_u16 v5, ttmp15, src_scc 1231// GFX12: [0x05,0x40,0x0b,0xcc,0x7b,0xfa,0x01,0x18] 1232 1233v_pk_sub_u16 v5, m0, 0.5 1234// GFX12: [0x05,0x40,0x0b,0xcc,0x7d,0xe0,0x01,0x18] 1235 1236v_pk_sub_u16 v5, exec_lo, -1 1237// GFX12: [0x05,0x40,0x0b,0xcc,0x7e,0x82,0x01,0x18] 1238 1239v_pk_sub_u16 v5, exec_hi, null 1240// GFX12: [0x05,0x40,0x0b,0xcc,0x7f,0xf8,0x00,0x18] 1241 1242v_pk_sub_u16 v5, null, exec_lo 1243// GFX12: [0x05,0x40,0x0b,0xcc,0x7c,0xfc,0x00,0x18] 1244 1245v_pk_sub_u16 v5, -1, exec_hi op_sel:[1,1] op_sel_hi:[0,0] 1246// GFX12: [0x05,0x58,0x0b,0xcc,0xc1,0xfe,0x00,0x00] 1247 1248v_pk_sub_u16 v5, 0.5, m0 op_sel:[0,0] op_sel_hi:[1,1] 1249// GFX12: [0x05,0x40,0x0b,0xcc,0xf0,0xfa,0x00,0x18] 1250 1251v_pk_sub_u16 v5, src_scc, vcc_lo op_sel:[1,0] op_sel_hi:[0,1] 1252// GFX12: [0x05,0x48,0x0b,0xcc,0xfd,0xd4,0x00,0x10] 1253 1254v_pk_sub_u16 v255, 0xfe0b, vcc_hi op_sel:[0,1] op_sel_hi:[1,0] clamp 1255// GFX12: [0xff,0xd0,0x0b,0xcc,0xff,0xd6,0x00,0x08,0x0b,0xfe,0x00,0x00] 1256 1257v_pk_minimum_f16 v5, v1, v2 1258// GFX12: [0x05,0x40,0x1d,0xcc,0x01,0x05,0x02,0x18] 1259 1260v_pk_minimum_f16 v5, v255, v255 1261// GFX12: [0x05,0x40,0x1d,0xcc,0xff,0xff,0x03,0x18] 1262 1263v_pk_minimum_f16 v5, s1, s2 1264// GFX12: [0x05,0x40,0x1d,0xcc,0x01,0x04,0x00,0x18] 1265 1266v_pk_minimum_f16 v5, s105, s105 1267// GFX12: 
[0x05,0x40,0x1d,0xcc,0x69,0xd2,0x00,0x18] 1268 1269v_pk_minimum_f16 v5, vcc_lo, ttmp15 1270// GFX12: [0x05,0x40,0x1d,0xcc,0x6a,0xf6,0x00,0x18] 1271 1272v_pk_minimum_f16 v5, vcc_hi, 0xfe0b 1273// GFX12: [0x05,0x40,0x1d,0xcc,0x6b,0xfe,0x01,0x18,0x0b,0xfe,0x00,0x00] 1274 1275v_pk_minimum_f16 v5, ttmp15, src_scc 1276// GFX12: [0x05,0x40,0x1d,0xcc,0x7b,0xfa,0x01,0x18] 1277 1278v_pk_minimum_f16 v5, m0, 0.5 1279// GFX12: [0x05,0x40,0x1d,0xcc,0x7d,0xe0,0x01,0x18] 1280 1281v_pk_minimum_f16 v5, exec_lo, -1 1282// GFX12: [0x05,0x40,0x1d,0xcc,0x7e,0x82,0x01,0x18] 1283 1284v_pk_minimum_f16 v5, exec_hi, null 1285// GFX12: [0x05,0x40,0x1d,0xcc,0x7f,0xf8,0x00,0x18] 1286 1287v_pk_minimum_f16 v5, null, exec_lo 1288// GFX12: [0x05,0x40,0x1d,0xcc,0x7c,0xfc,0x00,0x18] 1289 1290v_pk_minimum_f16 v5, -1, exec_hi op_sel:[1,1] op_sel_hi:[0,0] neg_lo:[1,0] neg_hi:[1,0] 1291// GFX12: [0x05,0x59,0x1d,0xcc,0xc1,0xfe,0x00,0x20] 1292 1293v_pk_minimum_f16 v5, 0.5, m0 op_sel:[0,0] op_sel_hi:[1,1] neg_lo:[0,1] neg_hi:[0,1] 1294// GFX12: [0x05,0x42,0x1d,0xcc,0xf0,0xfa,0x00,0x58] 1295 1296v_pk_minimum_f16 v5, src_scc, vcc_lo op_sel:[1,0] op_sel_hi:[0,1] neg_lo:[0,0] neg_hi:[0,0] 1297// GFX12: [0x05,0x48,0x1d,0xcc,0xfd,0xd4,0x00,0x10] 1298 1299v_pk_minimum_f16 v255, 0xfe0b, vcc_hi op_sel:[0,1] op_sel_hi:[1,0] neg_lo:[1,1] neg_hi:[1,1] clamp 1300// GFX12: [0xff,0xd3,0x1d,0xcc,0xff,0xd6,0x00,0x68,0x0b,0xfe,0x00,0x00] 1301 1302v_pk_maximum_f16 v5, v1, v2 1303// GFX12: [0x05,0x40,0x1e,0xcc,0x01,0x05,0x02,0x18] 1304 1305v_pk_maximum_f16 v5, v255, v255 1306// GFX12: [0x05,0x40,0x1e,0xcc,0xff,0xff,0x03,0x18] 1307 1308v_pk_maximum_f16 v5, s1, s2 1309// GFX12: [0x05,0x40,0x1e,0xcc,0x01,0x04,0x00,0x18] 1310 1311v_pk_maximum_f16 v5, s105, s105 1312// GFX12: [0x05,0x40,0x1e,0xcc,0x69,0xd2,0x00,0x18] 1313 1314v_pk_maximum_f16 v5, vcc_lo, ttmp15 1315// GFX12: [0x05,0x40,0x1e,0xcc,0x6a,0xf6,0x00,0x18] 1316 1317v_pk_maximum_f16 v5, vcc_hi, 0xfe0b 1318// GFX12: 
[0x05,0x40,0x1e,0xcc,0x6b,0xfe,0x01,0x18,0x0b,0xfe,0x00,0x00] 1319 1320v_pk_maximum_f16 v5, ttmp15, src_scc 1321// GFX12: [0x05,0x40,0x1e,0xcc,0x7b,0xfa,0x01,0x18] 1322 1323v_pk_maximum_f16 v5, m0, 0.5 1324// GFX12: [0x05,0x40,0x1e,0xcc,0x7d,0xe0,0x01,0x18] 1325 1326v_pk_maximum_f16 v5, exec_lo, -1 1327// GFX12: [0x05,0x40,0x1e,0xcc,0x7e,0x82,0x01,0x18] 1328 1329v_pk_maximum_f16 v5, exec_hi, null 1330// GFX12: [0x05,0x40,0x1e,0xcc,0x7f,0xf8,0x00,0x18] 1331 1332v_pk_maximum_f16 v5, null, exec_lo 1333// GFX12: [0x05,0x40,0x1e,0xcc,0x7c,0xfc,0x00,0x18] 1334 1335v_pk_maximum_f16 v5, -1, exec_hi op_sel:[1,1] op_sel_hi:[0,0] neg_lo:[1,0] neg_hi:[1,0] 1336// GFX12: [0x05,0x59,0x1e,0xcc,0xc1,0xfe,0x00,0x20] 1337 1338v_pk_maximum_f16 v5, 0.5, m0 op_sel:[0,0] op_sel_hi:[1,1] neg_lo:[0,1] neg_hi:[0,1] 1339// GFX12: [0x05,0x42,0x1e,0xcc,0xf0,0xfa,0x00,0x58] 1340 1341v_pk_maximum_f16 v5, src_scc, vcc_lo op_sel:[1,0] op_sel_hi:[0,1] neg_lo:[0,0] neg_hi:[0,0] 1342// GFX12: [0x05,0x48,0x1e,0xcc,0xfd,0xd4,0x00,0x10] 1343 1344v_pk_maximum_f16 v255, 0xfe0b, vcc_hi op_sel:[0,1] op_sel_hi:[1,0] neg_lo:[1,1] neg_hi:[1,1] clamp 1345// GFX12: [0xff,0xd3,0x1e,0xcc,0xff,0xd6,0x00,0x68,0x0b,0xfe,0x00,0x00] 1346 1347v_dot4_f32_fp8_bf8 v0, v1, v2, v3 1348// GFX12: v_dot4_f32_fp8_bf8 v0, v1, v2, v3 ; encoding: [0x00,0x40,0x24,0xcc,0x01,0x05,0x0e,0x1c] 1349 1350v_dot4_f32_fp8_bf8 v0, v1, v2, v3 neg_lo:[0,0,1] 1351// GFX12: v_dot4_f32_fp8_bf8 v0, v1, v2, v3 neg_lo:[0,0,1] ; encoding: [0x00,0x40,0x24,0xcc,0x01,0x05,0x0e,0x9c] 1352 1353v_dot4_f32_fp8_bf8 v0, v1, v2, v3 neg_hi:[0,0,1] 1354// GFX12: v_dot4_f32_fp8_bf8 v0, v1, v2, v3 neg_hi:[0,0,1] ; encoding: [0x00,0x44,0x24,0xcc,0x01,0x05,0x0e,0x1c] 1355 1356v_dot4_f32_fp8_bf8 v0, s0, v2, v3 1357// GFX12: v_dot4_f32_fp8_bf8 v0, s0, v2, v3 ; encoding: [0x00,0x40,0x24,0xcc,0x00,0x04,0x0e,0x1c] 1358 1359v_dot4_f32_fp8_bf8 v0, v1, s0, v3 1360// GFX12: v_dot4_f32_fp8_bf8 v0, v1, s0, v3 ; encoding: [0x00,0x40,0x24,0xcc,0x01,0x01,0x0c,0x1c] 1361 
1362v_dot4_f32_fp8_bf8 v0, v1, v2, s0 1363// GFX12: v_dot4_f32_fp8_bf8 v0, v1, v2, s0 ; encoding: [0x00,0x40,0x24,0xcc,0x01,0x05,0x02,0x18] 1364 1365v_dot4_f32_fp8_bf8 v0, 1.0, v2, v3 1366// GFX12: v_dot4_f32_fp8_bf8 v0, 1.0, v2, v3 ; encoding: [0x00,0x40,0x24,0xcc,0xf2,0x04,0x0e,0x1c] 1367 1368v_dot4_f32_fp8_bf8 v0, v1, 1.0, v3 1369// GFX12: v_dot4_f32_fp8_bf8 v0, v1, 1.0, v3 ; encoding: [0x00,0x40,0x24,0xcc,0x01,0xe5,0x0d,0x1c] 1370 1371v_dot4_f32_fp8_bf8 v0, v1, v2, 1.0 1372// GFX12: v_dot4_f32_fp8_bf8 v0, v1, v2, 1.0 ; encoding: [0x00,0x40,0x24,0xcc,0x01,0x05,0xca,0x1b] 1373 1374v_dot4_f32_fp8_bf8 v0, v1, v2, 1 1375// GFX12: v_dot4_f32_fp8_bf8 v0, v1, v2, 1 ; encoding: [0x00,0x40,0x24,0xcc,0x01,0x05,0x06,0x1a] 1376 1377v_dot4_f32_bf8_fp8 v0, v1, v2, v3 1378// GFX12: v_dot4_f32_bf8_fp8 v0, v1, v2, v3 ; encoding: [0x00,0x40,0x25,0xcc,0x01,0x05,0x0e,0x1c] 1379 1380v_dot4_f32_bf8_fp8 v0, v1, v2, v3 neg_lo:[0,0,1] 1381// GFX12: v_dot4_f32_bf8_fp8 v0, v1, v2, v3 neg_lo:[0,0,1] ; encoding: [0x00,0x40,0x25,0xcc,0x01,0x05,0x0e,0x9c] 1382 1383v_dot4_f32_bf8_fp8 v0, v1, v2, v3 neg_hi:[0,0,1] 1384// GFX12: v_dot4_f32_bf8_fp8 v0, v1, v2, v3 neg_hi:[0,0,1] ; encoding: [0x00,0x44,0x25,0xcc,0x01,0x05,0x0e,0x1c] 1385 1386v_dot4_f32_bf8_fp8 v0, s0, v2, v3 1387// GFX12: v_dot4_f32_bf8_fp8 v0, s0, v2, v3 ; encoding: [0x00,0x40,0x25,0xcc,0x00,0x04,0x0e,0x1c] 1388 1389v_dot4_f32_bf8_fp8 v0, v1, s0, v3 1390// GFX12: v_dot4_f32_bf8_fp8 v0, v1, s0, v3 ; encoding: [0x00,0x40,0x25,0xcc,0x01,0x01,0x0c,0x1c] 1391 1392v_dot4_f32_bf8_fp8 v0, v1, v2, s0 1393// GFX12: v_dot4_f32_bf8_fp8 v0, v1, v2, s0 ; encoding: [0x00,0x40,0x25,0xcc,0x01,0x05,0x02,0x18] 1394 1395v_dot4_f32_bf8_fp8 v0, 1.0, v2, v3 1396// GFX12: v_dot4_f32_bf8_fp8 v0, 1.0, v2, v3 ; encoding: [0x00,0x40,0x25,0xcc,0xf2,0x04,0x0e,0x1c] 1397 1398v_dot4_f32_bf8_fp8 v0, v1, 1.0, v3 1399// GFX12: v_dot4_f32_bf8_fp8 v0, v1, 1.0, v3 ; encoding: [0x00,0x40,0x25,0xcc,0x01,0xe5,0x0d,0x1c] 1400 1401v_dot4_f32_bf8_fp8 v0, v1, v2, 1.0 1402// 
GFX12: v_dot4_f32_bf8_fp8 v0, v1, v2, 1.0 ; encoding: [0x00,0x40,0x25,0xcc,0x01,0x05,0xca,0x1b] 1403 1404v_dot4_f32_bf8_fp8 v0, v1, v2, 1 1405// GFX12: v_dot4_f32_bf8_fp8 v0, v1, v2, 1 ; encoding: [0x00,0x40,0x25,0xcc,0x01,0x05,0x06,0x1a] 1406 1407v_dot4_f32_fp8_fp8 v0, v1, v2, v3 1408// GFX12: v_dot4_f32_fp8_fp8 v0, v1, v2, v3 ; encoding: [0x00,0x40,0x26,0xcc,0x01,0x05,0x0e,0x1c] 1409 1410v_dot4_f32_fp8_fp8 v0, v1, v2, v3 neg_lo:[0,0,1] 1411// GFX12: v_dot4_f32_fp8_fp8 v0, v1, v2, v3 neg_lo:[0,0,1] ; encoding: [0x00,0x40,0x26,0xcc,0x01,0x05,0x0e,0x9c] 1412 1413v_dot4_f32_fp8_fp8 v0, v1, v2, v3 neg_hi:[0,0,1] 1414// GFX12: v_dot4_f32_fp8_fp8 v0, v1, v2, v3 neg_hi:[0,0,1] ; encoding: [0x00,0x44,0x26,0xcc,0x01,0x05,0x0e,0x1c] 1415 1416v_dot4_f32_fp8_fp8 v0, s0, v2, v3 1417// GFX12: v_dot4_f32_fp8_fp8 v0, s0, v2, v3 ; encoding: [0x00,0x40,0x26,0xcc,0x00,0x04,0x0e,0x1c] 1418 1419v_dot4_f32_fp8_fp8 v0, v1, s0, v3 1420// GFX12: v_dot4_f32_fp8_fp8 v0, v1, s0, v3 ; encoding: [0x00,0x40,0x26,0xcc,0x01,0x01,0x0c,0x1c] 1421 1422v_dot4_f32_fp8_fp8 v0, v1, v2, s0 1423// GFX12: v_dot4_f32_fp8_fp8 v0, v1, v2, s0 ; encoding: [0x00,0x40,0x26,0xcc,0x01,0x05,0x02,0x18] 1424 1425v_dot4_f32_fp8_fp8 v0, 1.0, v2, v3 1426// GFX12: v_dot4_f32_fp8_fp8 v0, 1.0, v2, v3 ; encoding: [0x00,0x40,0x26,0xcc,0xf2,0x04,0x0e,0x1c] 1427 1428v_dot4_f32_fp8_fp8 v0, v1, 1.0, v3 1429// GFX12: v_dot4_f32_fp8_fp8 v0, v1, 1.0, v3 ; encoding: [0x00,0x40,0x26,0xcc,0x01,0xe5,0x0d,0x1c] 1430 1431v_dot4_f32_fp8_fp8 v0, v1, v2, 1.0 1432// GFX12: v_dot4_f32_fp8_fp8 v0, v1, v2, 1.0 ; encoding: [0x00,0x40,0x26,0xcc,0x01,0x05,0xca,0x1b] 1433 1434v_dot4_f32_fp8_fp8 v0, v1, v2, 1 1435// GFX12: v_dot4_f32_fp8_fp8 v0, v1, v2, 1 ; encoding: [0x00,0x40,0x26,0xcc,0x01,0x05,0x06,0x1a] 1436 1437v_dot4_f32_bf8_bf8 v0, v1, v2, v3 1438// GFX12: v_dot4_f32_bf8_bf8 v0, v1, v2, v3 ; encoding: [0x00,0x40,0x27,0xcc,0x01,0x05,0x0e,0x1c] 1439 1440v_dot4_f32_bf8_bf8 v0, v1, v2, v3 neg_lo:[0,0,1] 1441// GFX12: v_dot4_f32_bf8_bf8 v0, v1, 
v2, v3 neg_lo:[0,0,1] ; encoding: [0x00,0x40,0x27,0xcc,0x01,0x05,0x0e,0x9c] 1442 1443v_dot4_f32_bf8_bf8 v0, v1, v2, v3 neg_hi:[0,0,1] 1444// GFX12: v_dot4_f32_bf8_bf8 v0, v1, v2, v3 neg_hi:[0,0,1] ; encoding: [0x00,0x44,0x27,0xcc,0x01,0x05,0x0e,0x1c] 1445 1446v_dot4_f32_bf8_bf8 v0, s0, v2, v3 1447// GFX12: v_dot4_f32_bf8_bf8 v0, s0, v2, v3 ; encoding: [0x00,0x40,0x27,0xcc,0x00,0x04,0x0e,0x1c] 1448 1449v_dot4_f32_bf8_bf8 v0, v1, s0, v3 1450// GFX12: v_dot4_f32_bf8_bf8 v0, v1, s0, v3 ; encoding: [0x00,0x40,0x27,0xcc,0x01,0x01,0x0c,0x1c] 1451 1452v_dot4_f32_bf8_bf8 v0, v1, v2, s0 1453// GFX12: v_dot4_f32_bf8_bf8 v0, v1, v2, s0 ; encoding: [0x00,0x40,0x27,0xcc,0x01,0x05,0x02,0x18] 1454 1455v_dot4_f32_bf8_bf8 v0, 1.0, v2, v3 1456// GFX12: v_dot4_f32_bf8_bf8 v0, 1.0, v2, v3 ; encoding: [0x00,0x40,0x27,0xcc,0xf2,0x04,0x0e,0x1c] 1457 1458v_dot4_f32_bf8_bf8 v0, v1, 1.0, v3 1459// GFX12: v_dot4_f32_bf8_bf8 v0, v1, 1.0, v3 ; encoding: [0x00,0x40,0x27,0xcc,0x01,0xe5,0x0d,0x1c] 1460 1461v_dot4_f32_bf8_bf8 v0, v1, v2, 1.0 1462// GFX12: v_dot4_f32_bf8_bf8 v0, v1, v2, 1.0 ; encoding: [0x00,0x40,0x27,0xcc,0x01,0x05,0xca,0x1b] 1463 1464v_dot4_f32_bf8_bf8 v0, v1, v2, 1 1465// GFX12: v_dot4_f32_bf8_bf8 v0, v1, v2, 1 ; encoding: [0x00,0x40,0x27,0xcc,0x01,0x05,0x06,0x1a] 1466