1*b43c97c2SEvgenii Kudriashov // RUN: %clang_cc1 %s -flax-vector-conversions=none -ffreestanding -triple=x86_64-unknown-unknown -target-feature +amx-tile \ 2*b43c97c2SEvgenii Kudriashov // RUN: -emit-llvm -o - -Werror -pedantic | FileCheck %s --check-prefixes=CHECK 3*b43c97c2SEvgenii Kudriashov 4*b43c97c2SEvgenii Kudriashov #include <immintrin.h> 5*b43c97c2SEvgenii Kudriashov 6*b43c97c2SEvgenii Kudriashov char buf[1024]; 7*b43c97c2SEvgenii Kudriashov #define STRIDE 32 8*b43c97c2SEvgenii Kudriashov 9*b43c97c2SEvgenii Kudriashov void test_tile_loadd(short row, short col) { 10*b43c97c2SEvgenii Kudriashov //CHECK-LABEL: @test_tile_loadd 11*b43c97c2SEvgenii Kudriashov //CHECK-DAG: call x86_amx @llvm.x86.tileloadd64.internal 12*b43c97c2SEvgenii Kudriashov //CHECK-DAG: call <256 x i32> @llvm.x86.cast.tile.to.vector.v256i32(x86_amx {{%.*}}) 13*b43c97c2SEvgenii Kudriashov __tile1024i a = {row, col}; 14*b43c97c2SEvgenii Kudriashov __tile_loadd(&a, buf, STRIDE); 15*b43c97c2SEvgenii Kudriashov } 16*b43c97c2SEvgenii Kudriashov 17*b43c97c2SEvgenii Kudriashov void test_tile_stream_loadd(short row, short col) { 18*b43c97c2SEvgenii Kudriashov //CHECK-LABEL: @test_tile_stream_loadd 19*b43c97c2SEvgenii Kudriashov //CHECK-DAG: call x86_amx @llvm.x86.tileloaddt164.internal 20*b43c97c2SEvgenii Kudriashov //CHECK-DAG: call <256 x i32> @llvm.x86.cast.tile.to.vector.v256i32(x86_amx {{%.*}}) 21*b43c97c2SEvgenii Kudriashov __tile1024i a = {row, col}; 22*b43c97c2SEvgenii Kudriashov __tile_stream_loadd(&a, buf, STRIDE); 23*b43c97c2SEvgenii Kudriashov } 24*b43c97c2SEvgenii Kudriashov 25*b43c97c2SEvgenii Kudriashov void test_tile_stored(__tile1024i c) { 26*b43c97c2SEvgenii Kudriashov //CHECK-LABEL: @test_tile_stored 27*b43c97c2SEvgenii Kudriashov //CHECK-DAG: call x86_amx @llvm.x86.cast.vector.to.tile.v256i32(<256 x i32> {{%.*}}) 28*b43c97c2SEvgenii Kudriashov //CHECK-DAG: call void @llvm.x86.tilestored64.internal 29*b43c97c2SEvgenii Kudriashov __tile_stored(buf, STRIDE, c); 30*b43c97c2SEvgenii Kudriashov } 31*b43c97c2SEvgenii Kudriashov 32*b43c97c2SEvgenii Kudriashov void test_tile_zero(__tile1024i c) { 33*b43c97c2SEvgenii Kudriashov //CHECK-LABEL: @test_tile_zero 34*b43c97c2SEvgenii Kudriashov //CHECK-DAG: call x86_amx @llvm.x86.tilezero.internal 35*b43c97c2SEvgenii Kudriashov //CHECK-DAG: call <256 x i32> @llvm.x86.cast.tile.to.vector.v256i32(x86_amx {{%.*}}) 36*b43c97c2SEvgenii Kudriashov __tile_zero(&c); 37*b43c97c2SEvgenii Kudriashov } 38