xref: /llvm-project/llvm/test/CodeGen/SPIRV/hlsl-intrinsics/dot4add_u8packed.ll (revision bf30b6c33c17d43402d23f8cade450437fcff800)
1*bf30b6c3SFinn Plummer; RUN: llc -O0 -mtriple=spirv1.5-unknown-unknown %s -o - | FileCheck %s --check-prefixes=CHECK,CHECK-EXP
2*bf30b6c3SFinn Plummer; RUN: llc -O0 -mtriple=spirv1.6-unknown-unknown %s -o - | FileCheck %s --check-prefixes=CHECK,CHECK-DOT
3*bf30b6c3SFinn Plummer; RUN: llc -O0 -mtriple=spirv-unknown-unknown -spirv-ext=+SPV_KHR_integer_dot_product %s -o - | FileCheck %s --check-prefixes=CHECK,CHECK-DOT,CHECK-EXT
4*bf30b6c3SFinn Plummer; RUN: %if spirv-tools %{ llc -verify-machineinstrs -O0 -mtriple=spirv1.5-unknown-unknown %s -o - -filetype=obj | spirv-val %}
5*bf30b6c3SFinn Plummer; RUN: %if spirv-tools %{ llc -verify-machineinstrs -O0 -mtriple=spirv1.6-unknown-unknown %s -o - -filetype=obj | spirv-val %}
6*bf30b6c3SFinn Plummer; RUN: %if spirv-tools %{ llc -verify-machineinstrs -O0 -mtriple=spirv-unknown-unknown -spirv-ext=+SPV_KHR_integer_dot_product %s -o - -filetype=obj | spirv-val %}
7*bf30b6c3SFinn Plummer
8*bf30b6c3SFinn Plummer; CHECK-DOT: OpCapability DotProduct
9*bf30b6c3SFinn Plummer; CHECK-DOT: OpCapability DotProductInput4x8BitPacked
10*bf30b6c3SFinn Plummer; CHECK-EXT: OpExtension "SPV_KHR_integer_dot_product"
11*bf30b6c3SFinn Plummer
12*bf30b6c3SFinn Plummer; CHECK: %[[#int_32:]] = OpTypeInt 32 0
13*bf30b6c3SFinn Plummer; CHECK-EXP-DAG: %[[#int_8:]] = OpTypeInt 8 0
14*bf30b6c3SFinn Plummer; CHECK-EXP-DAG: %[[#zero:]] = OpConstantNull %[[#int_8]]
15*bf30b6c3SFinn Plummer; CHECK-EXP-DAG: %[[#eight:]] = OpConstant %[[#int_8]] 8
16*bf30b6c3SFinn Plummer; CHECK-EXP-DAG: %[[#sixteen:]] = OpConstant %[[#int_8]] 16
17*bf30b6c3SFinn Plummer; CHECK-EXP-DAG: %[[#twentyfour:]] = OpConstant %[[#int_8]] 24
18*bf30b6c3SFinn Plummer
19*bf30b6c3SFinn Plummer; CHECK-LABEL: Begin function test_dot
20*bf30b6c3SFinn Plummerdefine noundef i32 @test_dot(i32 noundef %a, i32 noundef %b, i32 noundef %c) {
21*bf30b6c3SFinn Plummerentry:
22*bf30b6c3SFinn Plummer; CHECK: %[[#A:]] = OpFunctionParameter %[[#int_32]]
23*bf30b6c3SFinn Plummer; CHECK: %[[#B:]] = OpFunctionParameter %[[#int_32]]
24*bf30b6c3SFinn Plummer; CHECK: %[[#C:]] = OpFunctionParameter %[[#int_32]]
25*bf30b6c3SFinn Plummer
26*bf30b6c3SFinn Plummer; Test that we use the dot product op when capabilities allow
27*bf30b6c3SFinn Plummer
28*bf30b6c3SFinn Plummer; CHECK-DOT: %[[#DOT:]] = OpUDot %[[#int_32]] %[[#A]] %[[#B]]
29*bf30b6c3SFinn Plummer; CHECK-DOT: %[[#RES:]] = OpIAdd %[[#int_32]] %[[#DOT]] %[[#C]]
30*bf30b6c3SFinn Plummer
31*bf30b6c3SFinn Plummer; Test expansion is used when spirv dot product capabilities aren't available:
32*bf30b6c3SFinn Plummer
33*bf30b6c3SFinn Plummer; First element of the packed vector
34*bf30b6c3SFinn Plummer; CHECK-EXP: %[[#A0:]] = OpBitFieldUExtract %[[#int_32]] %[[#A]] %[[#zero]] %[[#eight]]
35*bf30b6c3SFinn Plummer; CHECK-EXP: %[[#B0:]] = OpBitFieldUExtract %[[#int_32]] %[[#B]] %[[#zero]] %[[#eight]]
36*bf30b6c3SFinn Plummer; CHECK-EXP: %[[#MUL0:]] = OpIMul %[[#int_32]] %[[#A0]] %[[#B0]]
37*bf30b6c3SFinn Plummer; CHECK-EXP: %[[#MASK0:]] = OpBitFieldUExtract %[[#int_32]] %[[#MUL0]] %[[#zero]] %[[#eight]]
38*bf30b6c3SFinn Plummer; CHECK-EXP: %[[#ACC0:]] = OpIAdd %[[#int_32]] %[[#C]] %[[#MASK0]]
39*bf30b6c3SFinn Plummer
40*bf30b6c3SFinn Plummer; Second element of the packed vector
41*bf30b6c3SFinn Plummer; CHECK-EXP: %[[#A1:]] = OpBitFieldUExtract %[[#int_32]] %[[#A]] %[[#eight]] %[[#eight]]
42*bf30b6c3SFinn Plummer; CHECK-EXP: %[[#B1:]] = OpBitFieldUExtract %[[#int_32]] %[[#B]] %[[#eight]] %[[#eight]]
43*bf30b6c3SFinn Plummer; CHECK-EXP: %[[#MUL1:]] = OpIMul %[[#int_32]] %[[#A1]] %[[#B1]]
44*bf30b6c3SFinn Plummer; CHECK-EXP: %[[#MASK1:]] = OpBitFieldUExtract %[[#int_32]] %[[#MUL1]] %[[#zero]] %[[#eight]]
45*bf30b6c3SFinn Plummer; CHECK-EXP: %[[#ACC1:]] = OpIAdd %[[#int_32]] %[[#ACC0]] %[[#MASK1]]
46*bf30b6c3SFinn Plummer
47*bf30b6c3SFinn Plummer; Third element of the packed vector
48*bf30b6c3SFinn Plummer; CHECK-EXP: %[[#A2:]] = OpBitFieldUExtract %[[#int_32]] %[[#A]] %[[#sixteen]] %[[#eight]]
49*bf30b6c3SFinn Plummer; CHECK-EXP: %[[#B2:]] = OpBitFieldUExtract %[[#int_32]] %[[#B]] %[[#sixteen]] %[[#eight]]
50*bf30b6c3SFinn Plummer; CHECK-EXP: %[[#MUL2:]] = OpIMul %[[#int_32]] %[[#A2]] %[[#B2]]
51*bf30b6c3SFinn Plummer; CHECK-EXP: %[[#MASK2:]] = OpBitFieldUExtract %[[#int_32]] %[[#MUL2]] %[[#zero]] %[[#eight]]
52*bf30b6c3SFinn Plummer; CHECK-EXP: %[[#ACC2:]] = OpIAdd %[[#int_32]] %[[#ACC1]] %[[#MASK2]]
53*bf30b6c3SFinn Plummer
54*bf30b6c3SFinn Plummer; Fourth element of the packed vector
55*bf30b6c3SFinn Plummer; CHECK-EXP: %[[#A3:]] = OpBitFieldUExtract %[[#int_32]] %[[#A]] %[[#twentyfour]] %[[#eight]]
56*bf30b6c3SFinn Plummer; CHECK-EXP: %[[#B3:]] = OpBitFieldUExtract %[[#int_32]] %[[#B]] %[[#twentyfour]] %[[#eight]]
57*bf30b6c3SFinn Plummer; CHECK-EXP: %[[#MUL3:]] = OpIMul %[[#int_32]] %[[#A3]] %[[#B3]]
58*bf30b6c3SFinn Plummer; CHECK-EXP: %[[#MASK3:]] = OpBitFieldUExtract %[[#int_32]] %[[#MUL3]] %[[#zero]] %[[#eight]]
59*bf30b6c3SFinn Plummer
60*bf30b6c3SFinn Plummer; CHECK-EXP: %[[#RES:]] = OpIAdd %[[#int_32]] %[[#ACC2]] %[[#MASK3]]
61*bf30b6c3SFinn Plummer; CHECK: OpReturnValue %[[#RES]]
62*bf30b6c3SFinn Plummer  %spv.dot = call i32 @llvm.spv.dot4add.u8packed(i32 %a, i32 %b, i32 %c)
63*bf30b6c3SFinn Plummer
64*bf30b6c3SFinn Plummer  ret i32 %spv.dot
65*bf30b6c3SFinn Plummer}
66