; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -passes=amdgpu-simplifylib %s | FileCheck %s

; Exercises the amdgpu-simplifylib pass on calls to the mangled `mad` library
; functions declared below. The expected output rewrites each plain call into
; the llvm.fmuladd intrinsic of the same type. The final group of functions
; covers fast-math flags and the minsize, noinline, strictfp and nobuiltin
; attributes; the expected output keeps the library call for the noinline,
; strictfp and nobuiltin cases.

target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5-G1-ni:7:8:9"

; Library entry points under test: one three-operand `mad` declaration per
; element type (float, double, half) in scalar form and in vector widths
; 2, 3, 4, 8 and 16.
declare float @_Z3madfff(float, float, float)
declare <2 x float> @_Z3madDv2_fS_S_(<2 x float>, <2 x float>, <2 x float>)
declare <3 x float> @_Z3madDv3_fS_S_(<3 x float>, <3 x float>, <3 x float>)
declare <4 x float> @_Z3madDv4_fS_S_(<4 x float>, <4 x float>, <4 x float>)
declare <8 x float> @_Z3madDv8_fS_S_(<8 x float>, <8 x float>, <8 x float>)
declare <16 x float> @_Z3madDv16_fS_S_(<16 x float>, <16 x float>, <16 x float>)
declare double @_Z3madddd(double, double, double)
declare <2 x double> @_Z3madDv2_dS_S_(<2 x double>, <2 x double>, <2 x double>)
declare <3 x double> @_Z3madDv3_dS_S_(<3 x double>, <3 x double>, <3 x double>)
declare <4 x double> @_Z3madDv4_dS_S_(<4 x double>, <4 x double>, <4 x double>)
declare <8 x double> @_Z3madDv8_dS_S_(<8 x double>, <8 x double>, <8 x double>)
declare <16 x double> @_Z3madDv16_dS_S_(<16 x double>, <16 x double>, <16 x double>)
declare half @_Z3madDhDhDh(half, half, half)
declare <2 x half> @_Z3madDv2_DhS_S_(<2 x half>, <2 x half>, <2 x half>)
declare <3 x half> @_Z3madDv3_DhS_S_(<3 x half>, <3 x half>, <3 x half>)
declare <4 x half> @_Z3madDv4_DhS_S_(<4 x half>, <4 x half>, <4 x half>)
declare <8 x half> @_Z3madDv8_DhS_S_(<8 x half>, <8 x half>, <8 x half>)
declare <16 x half> @_Z3madDv16_DhS_S_(<16 x half>, <16 x half>, <16 x half>)

; --- float: scalar and vector calls with no flags or attributes ---
; Each call is expected to become llvm.fmuladd on the same operands, keeping
; the `tail` marker.

define float @test_mad_f32(float %x, float %y, float %z) {
; CHECK-LABEL: define float @test_mad_f32
; CHECK-SAME: (float [[X:%.*]], float [[Y:%.*]], float [[Z:%.*]]) {
; CHECK-NEXT:    [[MAD:%.*]] = tail call float @llvm.fmuladd.f32(float [[X]], float [[Y]], float [[Z]])
; CHECK-NEXT:    ret float [[MAD]]
;
  %mad = tail call float @_Z3madfff(float %x, float %y, float %z)
  ret float %mad
}

define <2 x float> @test_mad_v2f32(<2 x float> %x, <2 x float> %y, <2 x float> %z) {
; CHECK-LABEL: define <2 x float> @test_mad_v2f32
; CHECK-SAME: (<2 x float> [[X:%.*]], <2 x float> [[Y:%.*]], <2 x float> [[Z:%.*]]) {
; CHECK-NEXT:    [[MAD:%.*]] = tail call <2 x float> @llvm.fmuladd.v2f32(<2 x float> [[X]], <2 x float> [[Y]], <2 x float> [[Z]])
; CHECK-NEXT:    ret <2 x float> [[MAD]]
;
  %mad = tail call <2 x float> @_Z3madDv2_fS_S_(<2 x float> %x, <2 x float> %y, <2 x float> %z)
  ret <2 x float> %mad
}

define <3 x float> @test_mad_v3f32(<3 x float> %x, <3 x float> %y, <3 x float> %z) {
; CHECK-LABEL: define <3 x float> @test_mad_v3f32
; CHECK-SAME: (<3 x float> [[X:%.*]], <3 x float> [[Y:%.*]], <3 x float> [[Z:%.*]]) {
; CHECK-NEXT:    [[MAD:%.*]] = tail call <3 x float> @llvm.fmuladd.v3f32(<3 x float> [[X]], <3 x float> [[Y]], <3 x float> [[Z]])
; CHECK-NEXT:    ret <3 x float> [[MAD]]
;
  %mad = tail call <3 x float> @_Z3madDv3_fS_S_(<3 x float> %x, <3 x float> %y, <3 x float> %z)
  ret <3 x float> %mad
}

define <4 x float> @test_mad_v4f32(<4 x float> %x, <4 x float> %y, <4 x float> %z) {
; CHECK-LABEL: define <4 x float> @test_mad_v4f32
; CHECK-SAME: (<4 x float> [[X:%.*]], <4 x float> [[Y:%.*]], <4 x float> [[Z:%.*]]) {
; CHECK-NEXT:    [[MAD:%.*]] = tail call <4 x float> @llvm.fmuladd.v4f32(<4 x float> [[X]], <4 x float> [[Y]], <4 x float> [[Z]])
; CHECK-NEXT:    ret <4 x float> [[MAD]]
;
  %mad = tail call <4 x float> @_Z3madDv4_fS_S_(<4 x float> %x, <4 x float> %y, <4 x float> %z)
  ret <4 x float> %mad
}

define <8 x float> @test_mad_v8f32(<8 x float> %x, <8 x float> %y, <8 x float> %z) {
; CHECK-LABEL: define <8 x float> @test_mad_v8f32
; CHECK-SAME: (<8 x float> [[X:%.*]], <8 x float> [[Y:%.*]], <8 x float> [[Z:%.*]]) {
; CHECK-NEXT:    [[MAD:%.*]] = tail call <8 x float> @llvm.fmuladd.v8f32(<8 x float> [[X]], <8 x float> [[Y]], <8 x float> [[Z]])
; CHECK-NEXT:    ret <8 x float> [[MAD]]
;
  %mad = tail call <8 x float> @_Z3madDv8_fS_S_(<8 x float> %x, <8 x float> %y, <8 x float> %z)
  ret <8 x float> %mad
}

define <16 x float> @test_mad_v16f32(<16 x float> %x, <16 x float> %y, <16 x float> %z) {
; CHECK-LABEL: define <16 x float> @test_mad_v16f32
; CHECK-SAME: (<16 x float> [[X:%.*]], <16 x float> [[Y:%.*]], <16 x float> [[Z:%.*]]) {
; CHECK-NEXT:    [[MAD:%.*]] = tail call <16 x float> @llvm.fmuladd.v16f32(<16 x float> [[X]], <16 x float> [[Y]], <16 x float> [[Z]])
; CHECK-NEXT:    ret <16 x float> [[MAD]]
;
  %mad = tail call <16 x float> @_Z3madDv16_fS_S_(<16 x float> %x, <16 x float> %y, <16 x float> %z)
  ret <16 x float> %mad
}

; --- double: same shape as the float group, expecting llvm.fmuladd.*f64 ---

define double @test_mad_f64(double %x, double %y, double %z) {
; CHECK-LABEL: define double @test_mad_f64
; CHECK-SAME: (double [[X:%.*]], double [[Y:%.*]], double [[Z:%.*]]) {
; CHECK-NEXT:    [[MAD:%.*]] = tail call double @llvm.fmuladd.f64(double [[X]], double [[Y]], double [[Z]])
; CHECK-NEXT:    ret double [[MAD]]
;
  %mad = tail call double @_Z3madddd(double %x, double %y, double %z)
  ret double %mad
}

define <2 x double> @test_mad_v2f64(<2 x double> %x, <2 x double> %y, <2 x double> %z) {
; CHECK-LABEL: define <2 x double> @test_mad_v2f64
; CHECK-SAME: (<2 x double> [[X:%.*]], <2 x double> [[Y:%.*]], <2 x double> [[Z:%.*]]) {
; CHECK-NEXT:    [[MAD:%.*]] = tail call <2 x double> @llvm.fmuladd.v2f64(<2 x double> [[X]], <2 x double> [[Y]], <2 x double> [[Z]])
; CHECK-NEXT:    ret <2 x double> [[MAD]]
;
  %mad = tail call <2 x double> @_Z3madDv2_dS_S_(<2 x double> %x, <2 x double> %y, <2 x double> %z)
  ret <2 x double> %mad
}

define <3 x double> @test_mad_v3f64(<3 x double> %x, <3 x double> %y, <3 x double> %z) {
; CHECK-LABEL: define <3 x double> @test_mad_v3f64
; CHECK-SAME: (<3 x double> [[X:%.*]], <3 x double> [[Y:%.*]], <3 x double> [[Z:%.*]]) {
; CHECK-NEXT:    [[MAD:%.*]] = tail call <3 x double> @llvm.fmuladd.v3f64(<3 x double> [[X]], <3 x double> [[Y]], <3 x double> [[Z]])
; CHECK-NEXT:    ret <3 x double> [[MAD]]
;
  %mad = tail call <3 x double> @_Z3madDv3_dS_S_(<3 x double> %x, <3 x double> %y, <3 x double> %z)
  ret <3 x double> %mad
}

define <4 x double> @test_mad_v4f64(<4 x double> %x, <4 x double> %y, <4 x double> %z) {
; CHECK-LABEL: define <4 x double> @test_mad_v4f64
; CHECK-SAME: (<4 x double> [[X:%.*]], <4 x double> [[Y:%.*]], <4 x double> [[Z:%.*]]) {
; CHECK-NEXT:    [[MAD:%.*]] = tail call <4 x double> @llvm.fmuladd.v4f64(<4 x double> [[X]], <4 x double> [[Y]], <4 x double> [[Z]])
; CHECK-NEXT:    ret <4 x double> [[MAD]]
;
  %mad = tail call <4 x double> @_Z3madDv4_dS_S_(<4 x double> %x, <4 x double> %y, <4 x double> %z)
  ret <4 x double> %mad
}

define <8 x double> @test_mad_v8f64(<8 x double> %x, <8 x double> %y, <8 x double> %z) {
; CHECK-LABEL: define <8 x double> @test_mad_v8f64
; CHECK-SAME: (<8 x double> [[X:%.*]], <8 x double> [[Y:%.*]], <8 x double> [[Z:%.*]]) {
; CHECK-NEXT:    [[MAD:%.*]] = tail call <8 x double> @llvm.fmuladd.v8f64(<8 x double> [[X]], <8 x double> [[Y]], <8 x double> [[Z]])
; CHECK-NEXT:    ret <8 x double> [[MAD]]
;
  %mad = tail call <8 x double> @_Z3madDv8_dS_S_(<8 x double> %x, <8 x double> %y, <8 x double> %z)
  ret <8 x double> %mad
}

define <16 x double> @test_mad_v16f64(<16 x double> %x, <16 x double> %y, <16 x double> %z) {
; CHECK-LABEL: define <16 x double> @test_mad_v16f64
; CHECK-SAME: (<16 x double> [[X:%.*]], <16 x double> [[Y:%.*]], <16 x double> [[Z:%.*]]) {
; CHECK-NEXT:    [[MAD:%.*]] = tail call <16 x double> @llvm.fmuladd.v16f64(<16 x double> [[X]], <16 x double> [[Y]], <16 x double> [[Z]])
; CHECK-NEXT:    ret <16 x double> [[MAD]]
;
  %mad = tail call <16 x double> @_Z3madDv16_dS_S_(<16 x double> %x, <16 x double> %y, <16 x double> %z)
  ret <16 x double> %mad
}

; --- half: same shape as the float group, expecting llvm.fmuladd.*f16 ---

define half @test_mad_f16(half %x, half %y, half %z) {
; CHECK-LABEL: define half @test_mad_f16
; CHECK-SAME: (half [[X:%.*]], half [[Y:%.*]], half [[Z:%.*]]) {
; CHECK-NEXT:    [[MAD:%.*]] = tail call half @llvm.fmuladd.f16(half [[X]], half [[Y]], half [[Z]])
; CHECK-NEXT:    ret half [[MAD]]
;
  %mad = tail call half @_Z3madDhDhDh(half %x, half %y, half %z)
  ret half %mad
}

define <2 x half> @test_mad_v2f16(<2 x half> %x, <2 x half> %y, <2 x half> %z) {
; CHECK-LABEL: define <2 x half> @test_mad_v2f16
; CHECK-SAME: (<2 x half> [[X:%.*]], <2 x half> [[Y:%.*]], <2 x half> [[Z:%.*]]) {
; CHECK-NEXT:    [[MAD:%.*]] = tail call <2 x half> @llvm.fmuladd.v2f16(<2 x half> [[X]], <2 x half> [[Y]], <2 x half> [[Z]])
; CHECK-NEXT:    ret <2 x half> [[MAD]]
;
  %mad = tail call <2 x half> @_Z3madDv2_DhS_S_(<2 x half> %x, <2 x half> %y, <2 x half> %z)
  ret <2 x half> %mad
}

define <3 x half> @test_mad_v3f16(<3 x half> %x, <3 x half> %y, <3 x half> %z) {
; CHECK-LABEL: define <3 x half> @test_mad_v3f16
; CHECK-SAME: (<3 x half> [[X:%.*]], <3 x half> [[Y:%.*]], <3 x half> [[Z:%.*]]) {
; CHECK-NEXT:    [[MAD:%.*]] = tail call <3 x half> @llvm.fmuladd.v3f16(<3 x half> [[X]], <3 x half> [[Y]], <3 x half> [[Z]])
; CHECK-NEXT:    ret <3 x half> [[MAD]]
;
  %mad = tail call <3 x half> @_Z3madDv3_DhS_S_(<3 x half> %x, <3 x half> %y, <3 x half> %z)
  ret <3 x half> %mad
}

define <4 x half> @test_mad_v4f16(<4 x half> %x, <4 x half> %y, <4 x half> %z) {
; CHECK-LABEL: define <4 x half> @test_mad_v4f16
; CHECK-SAME: (<4 x half> [[X:%.*]], <4 x half> [[Y:%.*]], <4 x half> [[Z:%.*]]) {
; CHECK-NEXT:    [[MAD:%.*]] = tail call <4 x half> @llvm.fmuladd.v4f16(<4 x half> [[X]], <4 x half> [[Y]], <4 x half> [[Z]])
; CHECK-NEXT:    ret <4 x half> [[MAD]]
;
  %mad = tail call <4 x half> @_Z3madDv4_DhS_S_(<4 x half> %x, <4 x half> %y, <4 x half> %z)
  ret <4 x half> %mad
}

define <8 x half> @test_mad_v8f16(<8 x half> %x, <8 x half> %y, <8 x half> %z) {
; CHECK-LABEL: define <8 x half> @test_mad_v8f16
; CHECK-SAME: (<8 x half> [[X:%.*]], <8 x half> [[Y:%.*]], <8 x half> [[Z:%.*]]) {
; CHECK-NEXT:    [[MAD:%.*]] = tail call <8 x half> @llvm.fmuladd.v8f16(<8 x half> [[X]], <8 x half> [[Y]], <8 x half> [[Z]])
; CHECK-NEXT:    ret <8 x half> [[MAD]]
;
  %mad = tail call <8 x half> @_Z3madDv8_DhS_S_(<8 x half> %x, <8 x half> %y, <8 x half> %z)
  ret <8 x half> %mad
}

define <16 x half> @test_mad_v16f16(<16 x half> %x, <16 x half> %y, <16 x half> %z) {
; CHECK-LABEL: define <16 x half> @test_mad_v16f16
; CHECK-SAME: (<16 x half> [[X:%.*]], <16 x half> [[Y:%.*]], <16 x half> [[Z:%.*]]) {
; CHECK-NEXT:    [[MAD:%.*]] = tail call <16 x half> @llvm.fmuladd.v16f16(<16 x half> [[X]], <16 x half> [[Y]], <16 x half> [[Z]])
; CHECK-NEXT:    ret <16 x half> [[MAD]]
;
  %mad = tail call <16 x half> @_Z3madDv16_DhS_S_(<16 x half> %x, <16 x half> %y, <16 x half> %z)
  ret <16 x half> %mad
}

; --- fast-math flags and attributes on the scalar float call ---

; The `fast` flag on the library call is expected to carry over to the
; llvm.fmuladd call.
define float @test_mad_f32_fast(float %x, float %y, float %z) {
; CHECK-LABEL: define float @test_mad_f32_fast
; CHECK-SAME: (float [[X:%.*]], float [[Y:%.*]], float [[Z:%.*]]) {
; CHECK-NEXT:    [[MAD:%.*]] = tail call fast float @llvm.fmuladd.f32(float [[X]], float [[Y]], float [[Z]])
; CHECK-NEXT:    ret float [[MAD]]
;
  %mad = tail call fast float @_Z3madfff(float %x, float %y, float %z)
  ret float %mad
}

; The call site carries attribute group #1 (noinline). The expected output
; keeps the call to @_Z3madfff rather than rewriting it to the intrinsic.
define float @test_mad_f32_noinline(float %x, float %y, float %z) {
; CHECK-LABEL: define float @test_mad_f32_noinline
; CHECK-SAME: (float [[X:%.*]], float [[Y:%.*]], float [[Z:%.*]]) {
; CHECK-NEXT:    [[MAD:%.*]] = tail call fast float @_Z3madfff(float [[X]], float [[Y]], float [[Z]]) #[[ATTR3:[0-9]+]]
; CHECK-NEXT:    ret float [[MAD]]
;
  %mad = tail call fast float @_Z3madfff(float %x, float %y, float %z) #1
  ret float %mad
}

; The enclosing function is minsize (#0). The call is still expected to be
; rewritten to llvm.fmuladd with the `fast` flag kept.
define float @test_mad_f32_fast_minsize(float %x, float %y, float %z) #0 {
; CHECK-LABEL: define float @test_mad_f32_fast_minsize
; CHECK-SAME: (float [[X:%.*]], float [[Y:%.*]], float [[Z:%.*]]) #[[ATTR0:[0-9]+]] {
; CHECK-NEXT:    [[MAD:%.*]] = tail call fast float @llvm.fmuladd.f32(float [[X]], float [[Y]], float [[Z]])
; CHECK-NEXT:    ret float [[MAD]]
;
  %mad = tail call fast float @_Z3madfff(float %x, float %y, float %z)
  ret float %mad
}

; Both the enclosing function and the call site are strictfp (#2). The
; expected output keeps the call to @_Z3madfff. Despite "fast" in the function
; name, the call carries only the nsz and nnan flags (printed as `nnan nsz` in
; the expected output), not `fast`.
define float @test_mad_f32_fast_strictfp(float %x, float %y, float %z) #2 {
; CHECK-LABEL: define float @test_mad_f32_fast_strictfp
; CHECK-SAME: (float [[X:%.*]], float [[Y:%.*]], float [[Z:%.*]]) #[[ATTR1:[0-9]+]] {
; CHECK-NEXT:    [[MAD:%.*]] = tail call nnan nsz float @_Z3madfff(float [[X]], float [[Y]], float [[Z]]) #[[ATTR1]]
; CHECK-NEXT:    ret float [[MAD]]
;
  %mad = tail call nsz nnan float @_Z3madfff(float %x, float %y, float %z) #2
  ret float %mad
}

; The call site carries attribute group #3 (nobuiltin). The expected output
; keeps the call to @_Z3madfff rather than rewriting it to the intrinsic.
define float @test_mad_f32_fast_nobuiltin(float %x, float %y, float %z) {
; CHECK-LABEL: define float @test_mad_f32_fast_nobuiltin
; CHECK-SAME: (float [[X:%.*]], float [[Y:%.*]], float [[Z:%.*]]) {
; CHECK-NEXT:    [[MAD:%.*]] = tail call fast float @_Z3madfff(float [[X]], float [[Y]], float [[Z]]) #[[ATTR4:[0-9]+]]
; CHECK-NEXT:    ret float [[MAD]]
;
  %mad = tail call fast float @_Z3madfff(float %x, float %y, float %z) #3
  ret float %mad
}

; Attribute groups referenced by the functions and call sites above.
attributes #0 = { minsize }
attributes #1 = { noinline }
attributes #2 = { strictfp }
attributes #3 = { nobuiltin }