; RUN: opt -S -dxil-intrinsic-expansion -mtriple=dxil-pc-shadermodel6.3-library %s | FileCheck %s --check-prefixes=CHECK,EXPCHECK
; RUN: opt -S -dxil-intrinsic-expansion -dxil-op-lower -mtriple=dxil-pc-shadermodel6.3-library %s | FileCheck %s --check-prefixes=CHECK,DOPCHECK

; Make sure dxil operation function calls for dot are generated for int/uint vectors.
;
; The first RUN line stops after intrinsic expansion and is verified with the
; EXPCHECK prefix (calls to llvm.dx.imad / llvm.dx.umad). The second RUN line
; additionally runs op lowering and is verified with the DOPCHECK prefix
; (calls to dx.op.tertiary with opcode 48 for the signed cases and 49 for the
; unsigned cases). Directives using the plain shared prefix apply to both runs.
;
; In every function the expected shape is the same: the first pair of lanes is
; multiplied with a plain `mul`, and each remaining pair of lanes is folded in
; with one multiply-add call.

; Signed dot product, 2 x i16: one mul followed by one imad.
; CHECK-LABEL: dot_int16_t2
define noundef i16 @dot_int16_t2(<2 x i16> noundef %a, <2 x i16> noundef %b) {
entry:
; CHECK: extractelement <2 x i16> %a, i64 0
; CHECK: extractelement <2 x i16> %b, i64 0
; CHECK: mul i16 %{{.*}}, %{{.*}}
; CHECK: extractelement <2 x i16> %a, i64 1
; CHECK: extractelement <2 x i16> %b, i64 1
; EXPCHECK: call i16 @llvm.dx.imad.i16(i16 %{{.*}}, i16 %{{.*}}, i16 %{{.*}})
; DOPCHECK: call i16 @dx.op.tertiary.i16(i32 48, i16 %{{.*}}, i16 %{{.*}}, i16 %{{.*}}) #[[#ATTR:]]
  ; The overload suffix must describe the <2 x i16> operands and match the
  ; declaration at the bottom of the file.
  %dot = call i16 @llvm.dx.sdot.v2i16(<2 x i16> %a, <2 x i16> %b)
  ret i16 %dot
}

; Signed dot product, 4 x i32: one mul followed by three imad calls.
; CHECK-LABEL: dot_int4
define noundef i32 @dot_int4(<4 x i32> noundef %a, <4 x i32> noundef %b) {
entry:
; CHECK: extractelement <4 x i32> %a, i64 0
; CHECK: extractelement <4 x i32> %b, i64 0
; CHECK: mul i32 %{{.*}}, %{{.*}}
; CHECK: extractelement <4 x i32> %a, i64 1
; CHECK: extractelement <4 x i32> %b, i64 1
; EXPCHECK: call i32 @llvm.dx.imad.i32(i32 %{{.*}}, i32 %{{.*}}, i32 %{{.*}})
; DOPCHECK: call i32 @dx.op.tertiary.i32(i32 48, i32 %{{.*}}, i32 %{{.*}}, i32 %{{.*}}) #[[#ATTR]]
; CHECK: extractelement <4 x i32> %a, i64 2
; CHECK: extractelement <4 x i32> %b, i64 2
; EXPCHECK: call i32 @llvm.dx.imad.i32(i32 %{{.*}}, i32 %{{.*}}, i32 %{{.*}})
; DOPCHECK: call i32 @dx.op.tertiary.i32(i32 48, i32 %{{.*}}, i32 %{{.*}}, i32 %{{.*}}) #[[#ATTR]]
; CHECK: extractelement <4 x i32> %a, i64 3
; CHECK: extractelement <4 x i32> %b, i64 3
; EXPCHECK: call i32 @llvm.dx.imad.i32(i32 %{{.*}}, i32 %{{.*}}, i32 %{{.*}})
; DOPCHECK: call i32 @dx.op.tertiary.i32(i32 48, i32 %{{.*}}, i32 %{{.*}}, i32 %{{.*}}) #[[#ATTR]]
  %dot = call i32 @llvm.dx.sdot.v4i32(<4 x i32> %a, <4 x i32> %b)
  ret i32 %dot
}

; Unsigned dot product, 3 x i16: one mul followed by two umad calls.
; CHECK-LABEL: dot_uint16_t3
define noundef i16 @dot_uint16_t3(<3 x i16> noundef %a, <3 x i16> noundef %b) {
entry:
; CHECK: extractelement <3 x i16> %a, i64 0
; CHECK: extractelement <3 x i16> %b, i64 0
; CHECK: mul i16 %{{.*}}, %{{.*}}
; CHECK: extractelement <3 x i16> %a, i64 1
; CHECK: extractelement <3 x i16> %b, i64 1
; EXPCHECK: call i16 @llvm.dx.umad.i16(i16 %{{.*}}, i16 %{{.*}}, i16 %{{.*}})
; DOPCHECK: call i16 @dx.op.tertiary.i16(i32 49, i16 %{{.*}}, i16 %{{.*}}, i16 %{{.*}}) #[[#ATTR]]
; CHECK: extractelement <3 x i16> %a, i64 2
; CHECK: extractelement <3 x i16> %b, i64 2
; EXPCHECK: call i16 @llvm.dx.umad.i16(i16 %{{.*}}, i16 %{{.*}}, i16 %{{.*}})
; DOPCHECK: call i16 @dx.op.tertiary.i16(i32 49, i16 %{{.*}}, i16 %{{.*}}, i16 %{{.*}}) #[[#ATTR]]
  %dot = call i16 @llvm.dx.udot.v3i16(<3 x i16> %a, <3 x i16> %b)
  ret i16 %dot
}

; Unsigned dot product, 4 x i32: one mul followed by three umad calls.
; CHECK-LABEL: dot_uint4
define noundef i32 @dot_uint4(<4 x i32> noundef %a, <4 x i32> noundef %b) {
entry:
; CHECK: extractelement <4 x i32> %a, i64 0
; CHECK: extractelement <4 x i32> %b, i64 0
; CHECK: mul i32 %{{.*}}, %{{.*}}
; CHECK: extractelement <4 x i32> %a, i64 1
; CHECK: extractelement <4 x i32> %b, i64 1
; EXPCHECK: call i32 @llvm.dx.umad.i32(i32 %{{.*}}, i32 %{{.*}}, i32 %{{.*}})
; DOPCHECK: call i32 @dx.op.tertiary.i32(i32 49, i32 %{{.*}}, i32 %{{.*}}, i32 %{{.*}}) #[[#ATTR]]
; CHECK: extractelement <4 x i32> %a, i64 2
; CHECK: extractelement <4 x i32> %b, i64 2
; EXPCHECK: call i32 @llvm.dx.umad.i32(i32 %{{.*}}, i32 %{{.*}}, i32 %{{.*}})
; DOPCHECK: call i32 @dx.op.tertiary.i32(i32 49, i32 %{{.*}}, i32 %{{.*}}, i32 %{{.*}}) #[[#ATTR]]
; CHECK: extractelement <4 x i32> %a, i64 3
; CHECK: extractelement <4 x i32> %b, i64 3
; EXPCHECK: call i32 @llvm.dx.umad.i32(i32 %{{.*}}, i32 %{{.*}}, i32 %{{.*}})
; DOPCHECK: call i32 @dx.op.tertiary.i32(i32 49, i32 %{{.*}}, i32 %{{.*}}, i32 %{{.*}}) #[[#ATTR]]
  %dot = call i32 @llvm.dx.udot.v4i32(<4 x i32> %a, <4 x i32> %b)
  ret i32 %dot
}

; Unsigned dot product, 2 x i64: one mul followed by one umad.
; NOTE(review): despite the `4` suffix in its name, this function takes
; two-element vectors; the name is kept so the label directive stays valid.
; CHECK-LABEL: dot_uint64_t4
define noundef i64 @dot_uint64_t4(<2 x i64> noundef %a, <2 x i64> noundef %b) {
entry:
; CHECK: extractelement <2 x i64> %a, i64 0
; CHECK: extractelement <2 x i64> %b, i64 0
; CHECK: mul i64 %{{.*}}, %{{.*}}
; CHECK: extractelement <2 x i64> %a, i64 1
; CHECK: extractelement <2 x i64> %b, i64 1
; EXPCHECK: call i64 @llvm.dx.umad.i64(i64 %{{.*}}, i64 %{{.*}}, i64 %{{.*}})
; DOPCHECK: call i64 @dx.op.tertiary.i64(i32 49, i64 %{{.*}}, i64 %{{.*}}, i64 %{{.*}}) #[[#ATTR]]
  %dot = call i64 @llvm.dx.udot.v2i64(<2 x i64> %a, <2 x i64> %b)
  ret i64 %dot
}

; Every lowered dx.op call above must share one attribute group, and that
; group must carry memory(none).
; DOPCHECK: attributes #[[#ATTR]] = {{{.*}} memory(none) {{.*}}}

; Intrinsic declarations; each overload suffix mirrors the vector operand type.
declare i16 @llvm.dx.sdot.v2i16(<2 x i16>, <2 x i16>)
declare i32 @llvm.dx.sdot.v4i32(<4 x i32>, <4 x i32>)
declare i16 @llvm.dx.udot.v3i16(<3 x i16>, <3 x i16>)
declare i32 @llvm.dx.udot.v4i32(<4 x i32>, <4 x i32>)
declare i64 @llvm.dx.udot.v2i64(<2 x i64>, <2 x i64>)