xref: /llvm-project/llvm/test/Bitcode/amdgpu-unsafe-fp-atomics-upgrade.ll (revision 70feafdb27b45018f5f72e8f1359fdf9889c3f2a)
1*70feafdbSMatt Arsenault; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --check-globals all --version 4
2*70feafdbSMatt Arsenault; RUN: llvm-as < %s | llvm-dis | FileCheck %s
3*70feafdbSMatt Arsenault
4*70feafdbSMatt Arsenault; amdgpu-unsafe-fp-atomics attribute should be removed and replaced
5*70feafdbSMatt Arsenault; with metadata attached to any atomicrmw with floating-point
6*70feafdbSMatt Arsenault; operations.
7*70feafdbSMatt Arsenault
8*70feafdbSMatt Arsenault; Maybe the attribute should be dropped from declarations, but it
9*70feafdbSMatt Arsenault; didn't do anything on one and clang never added it.
10*70feafdbSMatt Arsenaultdeclare void @unsafe_fp_atomics_true_decl() "amdgpu-unsafe-fp-atomics"="true"
11*70feafdbSMatt Arsenaultdeclare void @unsafe_fp_atomics_false_decl() "amdgpu-unsafe-fp-atomics"="false"
12*70feafdbSMatt Arsenault
13*70feafdbSMatt Arsenault; Delete the attribute and replace with the most aggressive metadata possible
14*70feafdbSMatt Arsenaultdefine void @unsafe_fp_atomics_true(ptr addrspace(1) %ptr, float %val, i32 %ival, <2 x half> %vval) "amdgpu-unsafe-fp-atomics"="true" {
15*70feafdbSMatt Arsenault; CHECK-LABEL: define void @unsafe_fp_atomics_true(
16*70feafdbSMatt Arsenault; CHECK-SAME: ptr addrspace(1) [[PTR:%.*]], float [[VAL:%.*]], i32 [[IVAL:%.*]], <2 x half> [[VVAL:%.*]]) {
17*70feafdbSMatt Arsenault; CHECK-NEXT:    [[RMW_FADD:%.*]] = atomicrmw fadd ptr addrspace(1) [[PTR]], float [[VAL]] syncscope("one-as") seq_cst, align 4, !amdgpu.no.fine.grained.host.memory [[META0:![0-9]+]], !amdgpu.no.remote.memory.access [[META0]], !amdgpu.ignore.denormal.mode [[META0]]
18*70feafdbSMatt Arsenault; CHECK-NEXT:    [[RMW_FSUB:%.*]] = atomicrmw fsub ptr addrspace(1) [[PTR]], float [[VAL]] syncscope("one-as") seq_cst, align 4, !amdgpu.no.fine.grained.host.memory [[META0]], !amdgpu.no.remote.memory.access [[META0]], !amdgpu.ignore.denormal.mode [[META0]]
19*70feafdbSMatt Arsenault; CHECK-NEXT:    [[RMW_FMIN:%.*]] = atomicrmw fmin ptr addrspace(1) [[PTR]], float [[VAL]] syncscope("one-as") seq_cst, align 4, !amdgpu.no.fine.grained.host.memory [[META0]], !amdgpu.no.remote.memory.access [[META0]], !amdgpu.ignore.denormal.mode [[META0]]
20*70feafdbSMatt Arsenault; CHECK-NEXT:    [[RMW_FMAX:%.*]] = atomicrmw fmax ptr addrspace(1) [[PTR]], float [[VAL]] syncscope("one-as") seq_cst, align 4, !amdgpu.no.fine.grained.host.memory [[META0]], !amdgpu.no.remote.memory.access [[META0]], !amdgpu.ignore.denormal.mode [[META0]]
21*70feafdbSMatt Arsenault; CHECK-NEXT:    [[RMW_XOR:%.*]] = atomicrmw xor ptr addrspace(1) [[PTR]], i32 [[IVAL]] syncscope("one-as") seq_cst, align 4
22*70feafdbSMatt Arsenault; CHECK-NEXT:    [[RMW_FADD_VECTOR:%.*]] = atomicrmw fadd ptr addrspace(1) [[PTR]], <2 x half> [[VVAL]] syncscope("one-as") seq_cst, align 4, !amdgpu.no.fine.grained.host.memory [[META0]], !amdgpu.no.remote.memory.access [[META0]], !amdgpu.ignore.denormal.mode [[META0]]
23*70feafdbSMatt Arsenault; CHECK-NEXT:    [[RMW_FSUB_VECTOR:%.*]] = atomicrmw fsub ptr addrspace(1) [[PTR]], <2 x half> [[VVAL]] syncscope("one-as") seq_cst, align 4, !amdgpu.no.fine.grained.host.memory [[META0]], !amdgpu.no.remote.memory.access [[META0]], !amdgpu.ignore.denormal.mode [[META0]]
24*70feafdbSMatt Arsenault; CHECK-NEXT:    [[RMW_FMIN_VECTOR:%.*]] = atomicrmw fmin ptr addrspace(1) [[PTR]], <2 x half> [[VVAL]] syncscope("one-as") seq_cst, align 4, !amdgpu.no.fine.grained.host.memory [[META0]], !amdgpu.no.remote.memory.access [[META0]], !amdgpu.ignore.denormal.mode [[META0]]
25*70feafdbSMatt Arsenault; CHECK-NEXT:    [[RMW_FMAX_VECTOR:%.*]] = atomicrmw fmax ptr addrspace(1) [[PTR]], <2 x half> [[VVAL]] syncscope("one-as") seq_cst, align 4, !amdgpu.no.fine.grained.host.memory [[META0]], !amdgpu.no.remote.memory.access [[META0]], !amdgpu.ignore.denormal.mode [[META0]]
26*70feafdbSMatt Arsenault; CHECK-NEXT:    [[RMW_XCHG:%.*]] = atomicrmw xchg ptr addrspace(1) [[PTR]], float [[VAL]] syncscope("one-as") seq_cst, align 4
27*70feafdbSMatt Arsenault; CHECK-NEXT:    ret void
28*70feafdbSMatt Arsenault;
29*70feafdbSMatt Arsenault  %rmw.fadd = atomicrmw fadd ptr addrspace(1) %ptr, float %val syncscope("one-as") seq_cst
30*70feafdbSMatt Arsenault  %rmw.fsub = atomicrmw fsub ptr addrspace(1) %ptr, float %val syncscope("one-as") seq_cst
31*70feafdbSMatt Arsenault  %rmw.fmin = atomicrmw fmin ptr addrspace(1) %ptr, float %val syncscope("one-as") seq_cst
32*70feafdbSMatt Arsenault  %rmw.fmax = atomicrmw fmax ptr addrspace(1) %ptr, float %val syncscope("one-as") seq_cst
33*70feafdbSMatt Arsenault  %rmw.xor = atomicrmw xor ptr addrspace(1) %ptr, i32 %ival syncscope("one-as") seq_cst
34*70feafdbSMatt Arsenault  %rmw.fadd.vector = atomicrmw fadd ptr addrspace(1) %ptr, <2 x half> %vval syncscope("one-as") seq_cst
35*70feafdbSMatt Arsenault  %rmw.fsub.vector = atomicrmw fsub ptr addrspace(1) %ptr, <2 x half> %vval syncscope("one-as") seq_cst
36*70feafdbSMatt Arsenault  %rmw.fmin.vector = atomicrmw fmin ptr addrspace(1) %ptr, <2 x half> %vval syncscope("one-as") seq_cst
37*70feafdbSMatt Arsenault  %rmw.fmax.vector = atomicrmw fmax ptr addrspace(1) %ptr, <2 x half> %vval syncscope("one-as") seq_cst
38*70feafdbSMatt Arsenault
39*70feafdbSMatt Arsenault  ; xchg doesn't need any metadata
40*70feafdbSMatt Arsenault  %rmw.xchg = atomicrmw xchg ptr addrspace(1) %ptr, float %val syncscope("one-as") seq_cst
41*70feafdbSMatt Arsenault  ret void
42*70feafdbSMatt Arsenault}
43*70feafdbSMatt Arsenault
44*70feafdbSMatt Arsenault; Should just delete the effectless attribute if it exists
45*70feafdbSMatt Arsenaultdefine void @unsafe_fp_atomics_false(ptr addrspace(1) %ptr, float %val, i32 %ival, <2 x half> %vval) "amdgpu-unsafe-fp-atomics"="false" {
46*70feafdbSMatt Arsenault; CHECK-LABEL: define void @unsafe_fp_atomics_false(
47*70feafdbSMatt Arsenault; CHECK-SAME: ptr addrspace(1) [[PTR:%.*]], float [[VAL:%.*]], i32 [[IVAL:%.*]], <2 x half> [[VVAL:%.*]]) {
48*70feafdbSMatt Arsenault; CHECK-NEXT:    [[RMW_FADD:%.*]] = atomicrmw fadd ptr addrspace(1) [[PTR]], float [[VAL]] syncscope("one-as") seq_cst, align 4
49*70feafdbSMatt Arsenault; CHECK-NEXT:    [[RMW_FSUB:%.*]] = atomicrmw fsub ptr addrspace(1) [[PTR]], float [[VAL]] syncscope("one-as") seq_cst, align 4
50*70feafdbSMatt Arsenault; CHECK-NEXT:    [[RMW_FMIN:%.*]] = atomicrmw fmin ptr addrspace(1) [[PTR]], float [[VAL]] syncscope("one-as") seq_cst, align 4
51*70feafdbSMatt Arsenault; CHECK-NEXT:    [[RMW_FMAX:%.*]] = atomicrmw fmax ptr addrspace(1) [[PTR]], float [[VAL]] syncscope("one-as") seq_cst, align 4
52*70feafdbSMatt Arsenault; CHECK-NEXT:    [[RMW_XOR:%.*]] = atomicrmw xor ptr addrspace(1) [[PTR]], i32 [[IVAL]] syncscope("one-as") seq_cst, align 4
53*70feafdbSMatt Arsenault; CHECK-NEXT:    [[RMW_FADD_VECTOR:%.*]] = atomicrmw fadd ptr addrspace(1) [[PTR]], <2 x half> [[VVAL]] syncscope("one-as") seq_cst, align 4
54*70feafdbSMatt Arsenault; CHECK-NEXT:    [[RMW_FSUB_VECTOR:%.*]] = atomicrmw fsub ptr addrspace(1) [[PTR]], <2 x half> [[VVAL]] syncscope("one-as") seq_cst, align 4
55*70feafdbSMatt Arsenault; CHECK-NEXT:    [[RMW_FMIN_VECTOR:%.*]] = atomicrmw fmin ptr addrspace(1) [[PTR]], <2 x half> [[VVAL]] syncscope("one-as") seq_cst, align 4
56*70feafdbSMatt Arsenault; CHECK-NEXT:    [[RMW_FMAX_VECTOR:%.*]] = atomicrmw fmax ptr addrspace(1) [[PTR]], <2 x half> [[VVAL]] syncscope("one-as") seq_cst, align 4
57*70feafdbSMatt Arsenault; CHECK-NEXT:    [[RMW_XCHG:%.*]] = atomicrmw xchg ptr addrspace(1) [[PTR]], float [[VAL]] syncscope("one-as") seq_cst, align 4
58*70feafdbSMatt Arsenault; CHECK-NEXT:    ret void
59*70feafdbSMatt Arsenault;
60*70feafdbSMatt Arsenault  %rmw.fadd = atomicrmw fadd ptr addrspace(1) %ptr, float %val syncscope("one-as") seq_cst
61*70feafdbSMatt Arsenault  %rmw.fsub = atomicrmw fsub ptr addrspace(1) %ptr, float %val syncscope("one-as") seq_cst
62*70feafdbSMatt Arsenault  %rmw.fmin = atomicrmw fmin ptr addrspace(1) %ptr, float %val syncscope("one-as") seq_cst
63*70feafdbSMatt Arsenault  %rmw.fmax = atomicrmw fmax ptr addrspace(1) %ptr, float %val syncscope("one-as") seq_cst
64*70feafdbSMatt Arsenault  %rmw.xor = atomicrmw xor ptr addrspace(1) %ptr, i32 %ival syncscope("one-as") seq_cst
65*70feafdbSMatt Arsenault  %rmw.fadd.vector = atomicrmw fadd ptr addrspace(1) %ptr, <2 x half> %vval syncscope("one-as") seq_cst
66*70feafdbSMatt Arsenault  %rmw.fsub.vector = atomicrmw fsub ptr addrspace(1) %ptr, <2 x half> %vval syncscope("one-as") seq_cst
67*70feafdbSMatt Arsenault  %rmw.fmin.vector = atomicrmw fmin ptr addrspace(1) %ptr, <2 x half> %vval syncscope("one-as") seq_cst
68*70feafdbSMatt Arsenault  %rmw.fmax.vector = atomicrmw fmax ptr addrspace(1) %ptr, <2 x half> %vval syncscope("one-as") seq_cst
69*70feafdbSMatt Arsenault
70*70feafdbSMatt Arsenault  ; xchg doesn't need any metadata
71*70feafdbSMatt Arsenault  %rmw.xchg = atomicrmw xchg ptr addrspace(1) %ptr, float %val syncscope("one-as") seq_cst
72*70feafdbSMatt Arsenault  ret void
73*70feafdbSMatt Arsenault}
74*70feafdbSMatt Arsenault
75*70feafdbSMatt Arsenault;.
76*70feafdbSMatt Arsenault; CHECK: attributes #[[ATTR0:[0-9]+]] = { "amdgpu-unsafe-fp-atomics"="true" }
77*70feafdbSMatt Arsenault; CHECK: attributes #[[ATTR1:[0-9]+]] = { "amdgpu-unsafe-fp-atomics"="false" }
78*70feafdbSMatt Arsenault;.
79*70feafdbSMatt Arsenault; CHECK: [[META0]] = !{}
80*70feafdbSMatt Arsenault;.
81