; Source: llvm-project/llvm/test/CodeGen/DirectX/idot.ll (revision 011b618644113996e2c0a8e57db40f89d20878e3)
; Two pipelines are exercised over the same input:
;   1. intrinsic expansion only; the output is matched with the shared CHECK
;      prefix plus the EXPCHECK prefix.
;   2. intrinsic expansion followed by DXIL op lowering; the output is matched
;      with the shared CHECK prefix plus the DOPCHECK prefix.
; RUN: opt -S  -dxil-intrinsic-expansion -mtriple=dxil-pc-shadermodel6.3-library %s | FileCheck %s --check-prefixes=CHECK,EXPCHECK
; RUN: opt -S  -dxil-intrinsic-expansion -dxil-op-lower -mtriple=dxil-pc-shadermodel6.3-library %s | FileCheck %s --check-prefixes=CHECK,DOPCHECK

; Make sure dxil operation function calls for dot are generated for int/uint vectors.

; llvm.dx.sdot on two <2 x i16> operands. Expected shape of the output: lane 0
; of each operand is extracted and multiplied, then lane 1 of each operand is
; extracted and fed to a multiply-add (llvm.dx.imad after expansion, or
; dx.op.tertiary with a leading i32 48 argument after op lowering).
; CHECK-LABEL: dot_int16_t2
define noundef i16 @dot_int16_t2(<2 x i16> noundef %a, <2 x i16> noundef %b) {
entry:
; CHECK: extractelement <2 x i16> %a, i64 0
; CHECK: extractelement <2 x i16> %b, i64 0
; CHECK: mul i16 %{{.*}}, %{{.*}}
; CHECK: extractelement <2 x i16> %a, i64 1
; CHECK: extractelement <2 x i16> %b, i64 1
; EXPCHECK: call i16 @llvm.dx.imad.i16(i16 %{{.*}}, i16 %{{.*}}, i16 %{{.*}})
; The lowered-call check below is the first one in the file, so it is the one
; that captures the attribute-group number (ATTR) reused by every later check.
; DOPCHECK: call i16 @dx.op.tertiary.i16(i32 48, i16 %{{.*}}, i16 %{{.*}}, i16 %{{.*}}) #[[#ATTR:]]
  ; The overload suffix has to describe the operand type: <2 x i16> is v2i16.
  %dot = call i16 @llvm.dx.sdot.v2i16(<2 x i16> %a, <2 x i16> %b)
  ret i16 %dot
}

; llvm.dx.sdot on two <4 x i32> operands. Expected shape of the output: lane 0
; of each operand is extracted and multiplied, then each of lanes 1, 2 and 3 is
; extracted and fed to a multiply-add (llvm.dx.imad after expansion, or
; dx.op.tertiary with a leading i32 48 argument after op lowering).
; CHECK-LABEL: dot_int4
define noundef i32 @dot_int4(<4 x i32> noundef %a, <4 x i32> noundef %b) {
entry:
; Lane 0: plain multiply.
; CHECK: extractelement <4 x i32> %a, i64 0
; CHECK: extractelement <4 x i32> %b, i64 0
; CHECK: mul i32 %{{.*}}, %{{.*}}
; Lane 1: first multiply-add.
; CHECK: extractelement <4 x i32> %a, i64 1
; CHECK: extractelement <4 x i32> %b, i64 1
; EXPCHECK: call i32 @llvm.dx.imad.i32(i32 %{{.*}}, i32 %{{.*}}, i32 %{{.*}})
; DOPCHECK: call i32 @dx.op.tertiary.i32(i32 48, i32 %{{.*}}, i32 %{{.*}}, i32 %{{.*}}) #[[#ATTR]]
; Lane 2: second multiply-add.
; CHECK: extractelement <4 x i32> %a, i64 2
; CHECK: extractelement <4 x i32> %b, i64 2
; EXPCHECK: call i32 @llvm.dx.imad.i32(i32 %{{.*}}, i32 %{{.*}}, i32 %{{.*}})
; DOPCHECK: call i32 @dx.op.tertiary.i32(i32 48, i32 %{{.*}}, i32 %{{.*}}, i32 %{{.*}}) #[[#ATTR]]
; Lane 3: third multiply-add.
; CHECK: extractelement <4 x i32> %a, i64 3
; CHECK: extractelement <4 x i32> %b, i64 3
; EXPCHECK: call i32 @llvm.dx.imad.i32(i32 %{{.*}}, i32 %{{.*}}, i32 %{{.*}})
; DOPCHECK: call i32 @dx.op.tertiary.i32(i32 48, i32 %{{.*}}, i32 %{{.*}}, i32 %{{.*}}) #[[#ATTR]]
  %dot = call i32 @llvm.dx.sdot.v4i32(<4 x i32> %a, <4 x i32> %b)
  ret i32 %dot
}

; llvm.dx.udot on two <3 x i16> operands. Expected shape of the output: lane 0
; of each operand is extracted and multiplied, then each of lanes 1 and 2 is
; extracted and fed to a multiply-add (llvm.dx.umad after expansion, or
; dx.op.tertiary with a leading i32 49 argument after op lowering).
; CHECK-LABEL: dot_uint16_t3
define noundef i16 @dot_uint16_t3(<3 x i16> noundef %a, <3 x i16> noundef %b) {
entry:
; Lane 0: plain multiply.
; CHECK: extractelement <3 x i16> %a, i64 0
; CHECK: extractelement <3 x i16> %b, i64 0
; CHECK: mul i16 %{{.*}}, %{{.*}}
; Lane 1: first multiply-add.
; CHECK: extractelement <3 x i16> %a, i64 1
; CHECK: extractelement <3 x i16> %b, i64 1
; EXPCHECK: call i16 @llvm.dx.umad.i16(i16 %{{.*}}, i16 %{{.*}}, i16 %{{.*}})
; DOPCHECK: call i16 @dx.op.tertiary.i16(i32 49, i16 %{{.*}}, i16 %{{.*}}, i16 %{{.*}}) #[[#ATTR]]
; Lane 2: second multiply-add.
; CHECK: extractelement <3 x i16> %a, i64 2
; CHECK: extractelement <3 x i16> %b, i64 2
; EXPCHECK: call i16 @llvm.dx.umad.i16(i16 %{{.*}}, i16 %{{.*}}, i16 %{{.*}})
; DOPCHECK: call i16 @dx.op.tertiary.i16(i32 49, i16 %{{.*}}, i16 %{{.*}}, i16 %{{.*}}) #[[#ATTR]]
  %dot = call i16 @llvm.dx.udot.v3i16(<3 x i16> %a, <3 x i16> %b)
  ret i16 %dot
}

; llvm.dx.udot on two <4 x i32> operands. Expected shape of the output: lane 0
; of each operand is extracted and multiplied, then each of lanes 1, 2 and 3 is
; extracted and fed to a multiply-add (llvm.dx.umad after expansion, or
; dx.op.tertiary with a leading i32 49 argument after op lowering).
; CHECK-LABEL: dot_uint4
define noundef i32 @dot_uint4(<4 x i32> noundef %a, <4 x i32> noundef %b) {
entry:
; Lane 0: plain multiply.
; CHECK: extractelement <4 x i32> %a, i64 0
; CHECK: extractelement <4 x i32> %b, i64 0
; CHECK: mul i32 %{{.*}}, %{{.*}}
; Lane 1: first multiply-add.
; CHECK: extractelement <4 x i32> %a, i64 1
; CHECK: extractelement <4 x i32> %b, i64 1
; EXPCHECK: call i32 @llvm.dx.umad.i32(i32 %{{.*}}, i32 %{{.*}}, i32 %{{.*}})
; DOPCHECK: call i32 @dx.op.tertiary.i32(i32 49, i32 %{{.*}}, i32 %{{.*}}, i32 %{{.*}}) #[[#ATTR]]
; Lane 2: second multiply-add.
; CHECK: extractelement <4 x i32> %a, i64 2
; CHECK: extractelement <4 x i32> %b, i64 2
; EXPCHECK: call i32 @llvm.dx.umad.i32(i32 %{{.*}}, i32 %{{.*}}, i32 %{{.*}})
; DOPCHECK: call i32 @dx.op.tertiary.i32(i32 49, i32 %{{.*}}, i32 %{{.*}}, i32 %{{.*}}) #[[#ATTR]]
; Lane 3: third multiply-add.
; CHECK: extractelement <4 x i32> %a, i64 3
; CHECK: extractelement <4 x i32> %b, i64 3
; EXPCHECK: call i32 @llvm.dx.umad.i32(i32 %{{.*}}, i32 %{{.*}}, i32 %{{.*}})
; DOPCHECK: call i32 @dx.op.tertiary.i32(i32 49, i32 %{{.*}}, i32 %{{.*}}, i32 %{{.*}}) #[[#ATTR]]
  %dot = call i32 @llvm.dx.udot.v4i32(<4 x i32> %a, <4 x i32> %b)
  ret i32 %dot
}

; llvm.dx.udot on two <2 x i64> operands. Expected shape of the output: lane 0
; of each operand is extracted and multiplied, then lane 1 of each operand is
; extracted and fed to a multiply-add (llvm.dx.umad after expansion, or
; dx.op.tertiary with a leading i32 49 argument after op lowering).
; NOTE: the function name ends in "_t4", but the operands are two-element
; vectors; the name is kept as-is so the label check stays unchanged.
; CHECK-LABEL: dot_uint64_t4
define noundef i64 @dot_uint64_t4(<2 x i64> noundef %a, <2 x i64> noundef %b) {
entry:
; CHECK: extractelement <2 x i64> %a, i64 0
; CHECK: extractelement <2 x i64> %b, i64 0
; CHECK: mul i64 %{{.*}}, %{{.*}}
; CHECK: extractelement <2 x i64> %a, i64 1
; CHECK: extractelement <2 x i64> %b, i64 1
; EXPCHECK: call i64 @llvm.dx.umad.i64(i64 %{{.*}}, i64 %{{.*}}, i64 %{{.*}})
; DOPCHECK: call i64 @dx.op.tertiary.i64(i32 49, i64 %{{.*}}, i64 %{{.*}}, i64 %{{.*}}) #[[#ATTR]]
  %dot = call i64 @llvm.dx.udot.v2i64(<2 x i64> %a, <2 x i64> %b)
  ret i64 %dot
}

; After op lowering, the attribute group referenced by every dx.op.tertiary
; call above must contain memory(none).
; DOPCHECK: attributes #[[#ATTR]] = {{{.*}} memory(none) {{.*}}}

; Declarations of the dot intrinsics called above. Each overload suffix spells
; out the vector operand type (element count, then element type).
declare i16 @llvm.dx.sdot.v2i16(<2 x i16>, <2 x i16>)
declare i32 @llvm.dx.sdot.v4i32(<4 x i32>, <4 x i32>)
declare i16 @llvm.dx.udot.v3i16(<3 x i16>, <3 x i16>)
declare i32 @llvm.dx.udot.v4i32(<4 x i32>, <4 x i32>)
declare i64 @llvm.dx.udot.v2i64(<2 x i64>, <2 x i64>)
