1// REQUIRES: amdgpu-registered-target 2// RUN: %clang_cc1 -emit-llvm -O0 -o - -triple amdgcn %s | FileCheck %s 3// RUN: %clang_cc1 -emit-llvm -O0 -o - -triple spirv64-amd-amdhsa %s | FileCheck %s 4 5typedef float float32 __attribute__((ext_vector_type(32))); 6 7kernel void test_long(int arg0) { 8 long v15_16; 9 // CHECK: call{{.*}} i64 asm sideeffect "v_lshlrev_b64 v[15:16], 0, $0", "={v[15:16]},v" 10 __asm volatile("v_lshlrev_b64 v[15:16], 0, %0" : "={v[15:16]}"(v15_16) : "v"(arg0)); 11} 12 13kernel void test_agpr() { 14 float32 acc_c; 15 float reg_a; 16 float reg_b; 17 float32 reg_c; 18 // CHECK: call{{.*}} <32 x float> asm "v_mfma_f32_32x32x1f32 $0, $1, $2, $3", "=a,v,v,a,~{a0},~{a1},~{a2},~{a3},~{a4},~{a5},~{a6},~{a7},~{a8},~{a9},~{a10},~{a11},~{a12},~{a13},~{a14},~{a15},~{a16},~{a17},~{a18},~{a19},~{a20},~{a21},~{a22},~{a23},~{a24},~{a25},~{a26},~{a27},~{a28},~{a29},~{a30},~{a31}" 19 __asm ("v_mfma_f32_32x32x1f32 %0, %1, %2, %3" 20 : "=a"(acc_c) 21 : "v"(reg_a), "v"(reg_b), "a"(reg_c) 22 : "a0", "a1", "a2", "a3", "a4", "a5", "a6", "a7", 23 "a8", "a9", "a10", "a11", "a12", "a13", "a14", "a15", 24 "a16", "a17", "a18", "a19", "a20", "a21", "a22", "a23", 25 "a24", "a25", "a26", "a27", "a28", "a29", "a30", "a31"); 26 27 // CHECK: call{{.*}} <32 x float> asm sideeffect "v_mfma_f32_32x32x1f32 a[0:31], $0, $1, a[0:31]", "={a[0:31]},v,v,{a[0:31]}" 28 __asm volatile("v_mfma_f32_32x32x1f32 a[0:31], %0, %1, a[0:31]" 29 : "={a[0:31]}"(acc_c) 30 : "v"(reg_a),"v"(reg_b), "{a[0:31]}"(reg_c)); 31 32 // CHECK: call{{.*}} float asm "v_accvgpr_read_b32 $0, $1", "={a1},{a1}" 33 __asm ("v_accvgpr_read_b32 %0, %1" 34 : "={a1}"(reg_a) 35 : "{a1}"(reg_b)); 36} 37 38kernel void test_constraint_DA() { 39 const long x = 0x200000001; 40 int res; 41 // CHECK: call{{.*}} i32 asm sideeffect "v_mov_b32 $0, $1 & 0xFFFFFFFF", "=v,^DA"(i64 8589934593) 42 __asm volatile("v_mov_b32 %0, %1 & 0xFFFFFFFF" : "=v"(res) : "DA"(x)); 43} 44 45kernel void test_constraint_DB() { 46 const long x = 0x200000001; 47 int res; 48 // CHECK: call{{.*}} i32 asm sideeffect "v_mov_b32 $0, $1 & 0xFFFFFFFF", "=v,^DB"(i64 8589934593) 49 __asm volatile("v_mov_b32 %0, %1 & 0xFFFFFFFF" : "=v"(res) : "DB"(x)); 50} 51