1*70feafdbSMatt Arsenault; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --check-globals all --version 4 2*70feafdbSMatt Arsenault; RUN: llvm-as < %s | llvm-dis | FileCheck %s 3*70feafdbSMatt Arsenault 4*70feafdbSMatt Arsenault; amdgpu-unsafe-fp-atomics attribute should be removed and replaced 5*70feafdbSMatt Arsenault; with metadata attached to any atomicrmw with floating-point 6*70feafdbSMatt Arsenault; operations. 7*70feafdbSMatt Arsenault 8*70feafdbSMatt Arsenault; Maybe the attribute should be dropped from declarations, but it 9*70feafdbSMatt Arsenault; didn't do anything on one and clang never added it. 10*70feafdbSMatt Arsenaultdeclare void @unsafe_fp_atomics_true_decl() "amdgpu-unsafe-fp-atomics"="true" 11*70feafdbSMatt Arsenaultdeclare void @unsafe_fp_atomics_false_decl() "amdgpu-unsafe-fp-atomics"="false" 12*70feafdbSMatt Arsenault 13*70feafdbSMatt Arsenault; Delete the attribute and replace with the most aggressive metadata possible 14*70feafdbSMatt Arsenaultdefine void @unsafe_fp_atomics_true(ptr addrspace(1) %ptr, float %val, i32 %ival, <2 x half> %vval) "amdgpu-unsafe-fp-atomics"="true" { 15*70feafdbSMatt Arsenault; CHECK-LABEL: define void @unsafe_fp_atomics_true( 16*70feafdbSMatt Arsenault; CHECK-SAME: ptr addrspace(1) [[PTR:%.*]], float [[VAL:%.*]], i32 [[IVAL:%.*]], <2 x half> [[VVAL:%.*]]) { 17*70feafdbSMatt Arsenault; CHECK-NEXT: [[RMW_FADD:%.*]] = atomicrmw fadd ptr addrspace(1) [[PTR]], float [[VAL]] syncscope("one-as") seq_cst, align 4, !amdgpu.no.fine.grained.host.memory [[META0:![0-9]+]], !amdgpu.no.remote.memory.access [[META0]], !amdgpu.ignore.denormal.mode [[META0]] 18*70feafdbSMatt Arsenault; CHECK-NEXT: [[RMW_FSUB:%.*]] = atomicrmw fsub ptr addrspace(1) [[PTR]], float [[VAL]] syncscope("one-as") seq_cst, align 4, !amdgpu.no.fine.grained.host.memory [[META0]], !amdgpu.no.remote.memory.access [[META0]], !amdgpu.ignore.denormal.mode [[META0]] 19*70feafdbSMatt Arsenault; CHECK-NEXT: [[RMW_FMIN:%.*]] = atomicrmw fmin ptr addrspace(1) [[PTR]], float [[VAL]] syncscope("one-as") seq_cst, align 4, !amdgpu.no.fine.grained.host.memory [[META0]], !amdgpu.no.remote.memory.access [[META0]], !amdgpu.ignore.denormal.mode [[META0]] 20*70feafdbSMatt Arsenault; CHECK-NEXT: [[RMW_FMAX:%.*]] = atomicrmw fmax ptr addrspace(1) [[PTR]], float [[VAL]] syncscope("one-as") seq_cst, align 4, !amdgpu.no.fine.grained.host.memory [[META0]], !amdgpu.no.remote.memory.access [[META0]], !amdgpu.ignore.denormal.mode [[META0]] 21*70feafdbSMatt Arsenault; CHECK-NEXT: [[RMW_XOR:%.*]] = atomicrmw xor ptr addrspace(1) [[PTR]], i32 [[IVAL]] syncscope("one-as") seq_cst, align 4 22*70feafdbSMatt Arsenault; CHECK-NEXT: [[RMW_FADD_VECTOR:%.*]] = atomicrmw fadd ptr addrspace(1) [[PTR]], <2 x half> [[VVAL]] syncscope("one-as") seq_cst, align 4, !amdgpu.no.fine.grained.host.memory [[META0]], !amdgpu.no.remote.memory.access [[META0]], !amdgpu.ignore.denormal.mode [[META0]] 23*70feafdbSMatt Arsenault; CHECK-NEXT: [[RMW_FSUB_VECTOR:%.*]] = atomicrmw fsub ptr addrspace(1) [[PTR]], <2 x half> [[VVAL]] syncscope("one-as") seq_cst, align 4, !amdgpu.no.fine.grained.host.memory [[META0]], !amdgpu.no.remote.memory.access [[META0]], !amdgpu.ignore.denormal.mode [[META0]] 24*70feafdbSMatt Arsenault; CHECK-NEXT: [[RMW_FMIN_VECTOR:%.*]] = atomicrmw fmin ptr addrspace(1) [[PTR]], <2 x half> [[VVAL]] syncscope("one-as") seq_cst, align 4, !amdgpu.no.fine.grained.host.memory [[META0]], !amdgpu.no.remote.memory.access [[META0]], !amdgpu.ignore.denormal.mode [[META0]] 25*70feafdbSMatt Arsenault; CHECK-NEXT: [[RMW_FMAX_VECTOR:%.*]] = atomicrmw fmax ptr addrspace(1) [[PTR]], <2 x half> [[VVAL]] syncscope("one-as") seq_cst, align 4, !amdgpu.no.fine.grained.host.memory [[META0]], !amdgpu.no.remote.memory.access [[META0]], !amdgpu.ignore.denormal.mode [[META0]] 26*70feafdbSMatt Arsenault; CHECK-NEXT: [[RMW_XCHG:%.*]] = atomicrmw xchg ptr addrspace(1) [[PTR]], float [[VAL]] syncscope("one-as") seq_cst, align 4 27*70feafdbSMatt Arsenault; CHECK-NEXT: ret void 28*70feafdbSMatt Arsenault; 29*70feafdbSMatt Arsenault %rmw.fadd = atomicrmw fadd ptr addrspace(1) %ptr, float %val syncscope("one-as") seq_cst 30*70feafdbSMatt Arsenault %rmw.fsub = atomicrmw fsub ptr addrspace(1) %ptr, float %val syncscope("one-as") seq_cst 31*70feafdbSMatt Arsenault %rmw.fmin = atomicrmw fmin ptr addrspace(1) %ptr, float %val syncscope("one-as") seq_cst 32*70feafdbSMatt Arsenault %rmw.fmax = atomicrmw fmax ptr addrspace(1) %ptr, float %val syncscope("one-as") seq_cst 33*70feafdbSMatt Arsenault %rmw.xor = atomicrmw xor ptr addrspace(1) %ptr, i32 %ival syncscope("one-as") seq_cst 34*70feafdbSMatt Arsenault %rmw.fadd.vector = atomicrmw fadd ptr addrspace(1) %ptr, <2 x half> %vval syncscope("one-as") seq_cst 35*70feafdbSMatt Arsenault %rmw.fsub.vector = atomicrmw fsub ptr addrspace(1) %ptr, <2 x half> %vval syncscope("one-as") seq_cst 36*70feafdbSMatt Arsenault %rmw.fmin.vector = atomicrmw fmin ptr addrspace(1) %ptr, <2 x half> %vval syncscope("one-as") seq_cst 37*70feafdbSMatt Arsenault %rmw.fmax.vector = atomicrmw fmax ptr addrspace(1) %ptr, <2 x half> %vval syncscope("one-as") seq_cst 38*70feafdbSMatt Arsenault 39*70feafdbSMatt Arsenault ; xchg doesn't need any metadata 40*70feafdbSMatt Arsenault %rmw.xchg = atomicrmw xchg ptr addrspace(1) %ptr, float %val syncscope("one-as") seq_cst 41*70feafdbSMatt Arsenault ret void 42*70feafdbSMatt Arsenault} 43*70feafdbSMatt Arsenault 44*70feafdbSMatt Arsenault; Should just delete the effectless attribute if it exists 45*70feafdbSMatt Arsenaultdefine void @unsafe_fp_atomics_false(ptr addrspace(1) %ptr, float %val, i32 %ival, <2 x half> %vval) "amdgpu-unsafe-fp-atomics"="false" { 46*70feafdbSMatt Arsenault; CHECK-LABEL: define void @unsafe_fp_atomics_false( 47*70feafdbSMatt Arsenault; CHECK-SAME: ptr addrspace(1) [[PTR:%.*]], float [[VAL:%.*]], i32 [[IVAL:%.*]], <2 x half> [[VVAL:%.*]]) { 48*70feafdbSMatt Arsenault; CHECK-NEXT: [[RMW_FADD:%.*]] = atomicrmw fadd ptr addrspace(1) [[PTR]], float [[VAL]] syncscope("one-as") seq_cst, align 4 49*70feafdbSMatt Arsenault; CHECK-NEXT: [[RMW_FSUB:%.*]] = atomicrmw fsub ptr addrspace(1) [[PTR]], float [[VAL]] syncscope("one-as") seq_cst, align 4 50*70feafdbSMatt Arsenault; CHECK-NEXT: [[RMW_FMIN:%.*]] = atomicrmw fmin ptr addrspace(1) [[PTR]], float [[VAL]] syncscope("one-as") seq_cst, align 4 51*70feafdbSMatt Arsenault; CHECK-NEXT: [[RMW_FMAX:%.*]] = atomicrmw fmax ptr addrspace(1) [[PTR]], float [[VAL]] syncscope("one-as") seq_cst, align 4 52*70feafdbSMatt Arsenault; CHECK-NEXT: [[RMW_XOR:%.*]] = atomicrmw xor ptr addrspace(1) [[PTR]], i32 [[IVAL]] syncscope("one-as") seq_cst, align 4 53*70feafdbSMatt Arsenault; CHECK-NEXT: [[RMW_FADD_VECTOR:%.*]] = atomicrmw fadd ptr addrspace(1) [[PTR]], <2 x half> [[VVAL]] syncscope("one-as") seq_cst, align 4 54*70feafdbSMatt Arsenault; CHECK-NEXT: [[RMW_FSUB_VECTOR:%.*]] = atomicrmw fsub ptr addrspace(1) [[PTR]], <2 x half> [[VVAL]] syncscope("one-as") seq_cst, align 4 55*70feafdbSMatt Arsenault; CHECK-NEXT: [[RMW_FMIN_VECTOR:%.*]] = atomicrmw fmin ptr addrspace(1) [[PTR]], <2 x half> [[VVAL]] syncscope("one-as") seq_cst, align 4 56*70feafdbSMatt Arsenault; CHECK-NEXT: [[RMW_FMAX_VECTOR:%.*]] = atomicrmw fmax ptr addrspace(1) [[PTR]], <2 x half> [[VVAL]] syncscope("one-as") seq_cst, align 4 57*70feafdbSMatt Arsenault; CHECK-NEXT: [[RMW_XCHG:%.*]] = atomicrmw xchg ptr addrspace(1) [[PTR]], float [[VAL]] syncscope("one-as") seq_cst, align 4 58*70feafdbSMatt Arsenault; CHECK-NEXT: ret void 59*70feafdbSMatt Arsenault; 60*70feafdbSMatt Arsenault %rmw.fadd = atomicrmw fadd ptr addrspace(1) %ptr, float %val syncscope("one-as") seq_cst 61*70feafdbSMatt Arsenault %rmw.fsub = atomicrmw fsub ptr addrspace(1) %ptr, float %val syncscope("one-as") seq_cst 62*70feafdbSMatt Arsenault %rmw.fmin = atomicrmw fmin ptr addrspace(1) %ptr, float %val syncscope("one-as") seq_cst 63*70feafdbSMatt Arsenault %rmw.fmax = atomicrmw fmax ptr addrspace(1) %ptr, float %val syncscope("one-as") seq_cst 64*70feafdbSMatt Arsenault %rmw.xor = atomicrmw xor ptr addrspace(1) %ptr, i32 %ival syncscope("one-as") seq_cst 65*70feafdbSMatt Arsenault %rmw.fadd.vector = atomicrmw fadd ptr addrspace(1) %ptr, <2 x half> %vval syncscope("one-as") seq_cst 66*70feafdbSMatt Arsenault %rmw.fsub.vector = atomicrmw fsub ptr addrspace(1) %ptr, <2 x half> %vval syncscope("one-as") seq_cst 67*70feafdbSMatt Arsenault %rmw.fmin.vector = atomicrmw fmin ptr addrspace(1) %ptr, <2 x half> %vval syncscope("one-as") seq_cst 68*70feafdbSMatt Arsenault %rmw.fmax.vector = atomicrmw fmax ptr addrspace(1) %ptr, <2 x half> %vval syncscope("one-as") seq_cst 69*70feafdbSMatt Arsenault 70*70feafdbSMatt Arsenault ; xchg doesn't need any metadata 71*70feafdbSMatt Arsenault %rmw.xchg = atomicrmw xchg ptr addrspace(1) %ptr, float %val syncscope("one-as") seq_cst 72*70feafdbSMatt Arsenault ret void 73*70feafdbSMatt Arsenault} 74*70feafdbSMatt Arsenault 75*70feafdbSMatt Arsenault;. 76*70feafdbSMatt Arsenault; CHECK: attributes #[[ATTR0:[0-9]+]] = { "amdgpu-unsafe-fp-atomics"="true" } 77*70feafdbSMatt Arsenault; CHECK: attributes #[[ATTR1:[0-9]+]] = { "amdgpu-unsafe-fp-atomics"="false" } 78*70feafdbSMatt Arsenault;. 79*70feafdbSMatt Arsenault; CHECK: [[META0]] = !{} 80*70feafdbSMatt Arsenault;. 81