Home
last modified time | relevance | path

Searched full:rsqrt (Results 1 – 25 of 179) sorted by relevance

12345678

/llvm-project/clang/test/CodeGenHLSL/builtins/
H A Drsqrt.hlsl21 // NATIVE_HALF: %hlsl.rsqrt = call reassoc nnan ninf nsz arcp afn half @llvm.[[TARGET]].rsqrt.f16(
22 // NATIVE_HALF: ret half %hlsl.rsqrt
24 // NO_HALF: %hlsl.rsqrt = call reassoc nnan ninf nsz arcp afn float @llvm.[[TARGET]].rsqrt.f32(
25 // NO_HALF: ret float %hlsl.rsqrt
26 half test_rsqrt_half(half p0) { return rsqrt(p0); }
28 // NATIVE_HALF: %hlsl.rsqrt = call reassoc nnan ninf nsz arcp afn <2 x half> @llvm.[[TARGET]].rsqrt.v2f16
29 // NATIVE_HALF: ret <2 x half> %hlsl.rsqrt
[all...]
/llvm-project/llvm/test/CodeGen/SPIRV/hlsl-intrinsics/
H A Drsqrt.ll18 %elt.rsqrt = call float @llvm.spv.rsqrt.f32(float %a)
19 ret float %elt.rsqrt
26 %elt.rsqrt = call half @llvm.spv.rsqrt.f16(half %a)
27 ret half %elt.rsqrt
34 %elt.rsqrt = call double @llvm.spv.rsqrt.f64(double %a)
35 ret double %elt.rsqrt
42 %elt.rsqrt
[all...]
/llvm-project/llvm/test/CodeGen/NVPTX/
H A Drsqrt-opt.ll3 ; RUN: llc < %s -mtriple=nvptx64 -nvptx-rsqrt-approx-opt=0 | FileCheck %s --check-prefixes CHECK,CHECK-APPROX-NOOPT,CHECK-SQRT-NOOPT
7 ; RUN: %if ptxas %{ llc < %s -mtriple=nvptx64 -nvptx-rsqrt-approx-opt=0 | %ptxas-verify %}
12 ; CHECK-APPROX-OPT: rsqrt.approx.f32
16 %rsqrt = fdiv float 1.0, %sqrt
17 ret float %rsqrt
21 ; CHECK-APPROX-OPT: rsqrt.approx.ftz.f32
25 %rsqrt = fdiv float 1.0, %sqrt
26 ret float %rsqrt
31 ; CHECK-SQRT-OPT: rsqrt.approx.f32
35 %rsqrt
[all...]
H A Drsqrt.ll6 ; CHECK: rsqrt.approx.f32
7 %call = call float @llvm.nvvm.rsqrt.approx.f(float %in)
13 ; CHECK: rsqrt.approx.f64
14 %call = call double @llvm.nvvm.rsqrt.approx.d(double %in)
20 ; CHECK: rsqrt.approx.ftz.f32
21 %call = tail call float @llvm.nvvm.rsqrt.approx.ftz.f(float %in)
27 ; CHECK: rsqrt.approx.ftz.f64
28 %call = tail call double @llvm.nvvm.rsqrt.approx.ftz.d(double %in)
32 declare float @llvm.nvvm.rsqrt.approx.ftz.f(float)
33 declare double @llvm.nvvm.rsqrt
[all...]
H A Dsqrt-approx.ll17 ; CHECK: rsqrt.approx.f32
25 ; CHECK: rsqrt.approx.ftz.f32
33 ; CHECK: rsqrt.approx.f64
41 ; There's no rsqrt.approx.ftz.f64 instruction; we just use the non-ftz version.
42 ; CHECK: rsqrt.approx.f64
88 ; reciprocal(rsqrt.approx.f64(x)). There's no non-ftz approximate reciprocal,
90 ; CHECK: rsqrt.approx.f64
106 ; CHECK: rsqrt.approx.f64
112 ; -- refined sqrt and rsqrt --
114 ; The sqrt and rsqrt refinemen
[all...]
H A Dfast-math.ll62 ; reciprocal(rsqrt(x)) for sqrt(x), and emit a vanilla divide.
74 ; CHECK: rsqrt.approx.f64
83 ; CHECK-LABEL: rsqrt(
84 ; CHECK-NOT: rsqrt.approx
86 ; CHECK-NOT: rsqrt.approx
87 define float @rsqrt(float %a) {
96 ; CHECK: rsqrt.approx.f32
108 ; CHECK: rsqrt.approx.ftz.f32
/llvm-project/llvm/test/CodeGen/DirectX/
H A Drsqrt.ll4 ; Make sure dxil operation function calls for rsqrt are generated for float and half.
14 %dx.rsqrt = call float @llvm.dx.rsqrt.f32(float %a)
15 ret float %dx.rsqrt
26 %dx.rsqrt = call half @llvm.dx.rsqrt.f16(half %a)
27 ret half %dx.rsqrt
49 %2 = call <4 x float> @llvm.dx.rsqrt.v4f32(<4 x float> %a)
55 declare half @llvm.dx.rsqrt.f16(half)
56 declare float @llvm.dx.rsqrt
[all...]
H A Drsqrt_error.ll3 ; DXIL operation rsqrt does not support double overload type
5 ; CHECK-SAME: Cannot create RSqrt operation: Invalid overload type
13 %dx.rsqrt = call double @llvm.dx.rsqrt.f64(double %0)
14 ret double %dx.rsqrt
/llvm-project/llvm/test/Transforms/InstCombine/
H A Dfmul-sqrt.ll97 %rsqrt = fdiv fast double 1.0, %sqrt
98 %squared = fmul fast double %rsqrt, %rsqrt
105 ; CHECK-NEXT: [[RSQRT:%.*]] = fdiv double 1.000000e+00, [[SQRT]]
107 ; CHECK-NEXT: store double [[RSQRT]], ptr [[P:%.*]], align 8
111 %rsqrt = fdiv double 1.0, %sqrt
112 %res = fmul reassoc nsz double %rsqrt, %x
113 store double %rsqrt, ptr %p
121 ; CHECK-NEXT: [[RSQRT:%.*]] = fdiv fast <2 x float> splat (float 1.000000e+00), [[SQRT]]
123 ; CHECK-NEXT: store <2 x float> [[RSQRT]], pt
[all...]
/llvm-project/mlir/test/mlir-cpu-runner/X86Vector/
H A Dmath-polynomial-approx-avx2.mlir
/llvm-project/libclc/generic/lib/math/
H A Drsqrt.cl4 _CLC_OVERLOAD _CLC_DEF float rsqrt(float x)
9 _CLC_UNARY_VECTORIZE(_CLC_OVERLOAD _CLC_DEF, float, rsqrt, float);
15 _CLC_OVERLOAD _CLC_DEF double rsqrt(double x)
20 _CLC_UNARY_VECTORIZE(_CLC_OVERLOAD _CLC_DEF, double, rsqrt, double);
/llvm-project/libclc/r600/lib/math/
H A Drsqrt.cl4 _CLC_OVERLOAD _CLC_DEF float rsqrt(float x)
9 _CLC_UNARY_VECTORIZE(_CLC_OVERLOAD _CLC_DEF, float, rsqrt, float);
15 _CLC_OVERLOAD _CLC_DEF double rsqrt(double x)
20 _CLC_UNARY_VECTORIZE(_CLC_OVERLOAD _CLC_DEF, double, rsqrt, double);
/llvm-project/libclc/generic/lib/geometric/
H A Dnormalize.cl46 return p * rsqrt(l2);
66 return p * rsqrt(l2);
86 return p * rsqrt(l2);
114 return p * rsqrt(l2);
134 return p * rsqrt(l2);
154 return p * rsqrt(l2);
/llvm-project/clang/test/CodeGen/PowerPC/
H A Dbuiltins-ppc-fastmath.c45 // CHECK-NEXT: [[RSQRT:%.*]] = fdiv fast <4 x float> splat (float 1.000000e+00), [[TMP1]]
47 // CHECK-NEXT: [[ADD:%.*]] = fadd <4 x float> [[RSQRT]], [[TMP2]]
57 // CHECK-NEXT: [[RSQRT:%.*]] = fdiv fast <2 x double> splat (double 1.000000e+00), [[TMP1]]
59 // CHECK-NEXT: [[ADD:%.*]] = fadd <2 x double> [[RSQRT]], [[TMP2]]
/llvm-project/llvm/test/CodeGen/X86/
H A Dextractps.ll16 … call <4 x float> @llvm.x86.sse.rsqrt.ss( <4 x float> %2 ) ; <<4 x float>>:3 [#uses=1]
31 … call <4 x float> @llvm.x86.sse.rsqrt.ss( <4 x float> %2 ) ; <<4 x float>>:3 [#uses=1]
37 declare <4 x float> @llvm.x86.sse.rsqrt.ss(<4 x float>) nounwind readnone
/llvm-project/llvm/test/Transforms/Reassociate/
H A Dfactorize-again.ll9 ; CHECK-NEXT: [[TMP4:%.*]] = call float @llvm.rsqrt.f32(float undef)
22 %4 = call float @llvm.rsqrt.f32(float undef)
41 declare float @llvm.rsqrt.f32(float) #1
/llvm-project/mlir/test/Conversion/MathToLLVM/
H A Dmath-to-llvm.mlir152 // CHECK-LABEL: func @rsqrt(
154 func.func @rsqrt(%arg0 : f32) {
158 %0 = math.rsqrt %arg0 : f32
250 %0 = math.rsqrt %arg0 : f64
262 %0 = math.rsqrt %arg0 fastmath<fast> : f64
274 %0 = math.rsqrt %arg0 : vector<4xf32>
286 %0 = math.rsqrt %arg0 : vector<[4]xf32>
298 %0 = math.rsqrt %arg0 fastmath<fast> : vector<4xf32>
310 %0 = math.rsqrt %arg0 fastmath<fast> : vector<[4]xf32>
323 %0 = math.rsqrt %arg0 : vector<4x3xf32>
[all …]
/llvm-project/libclc/test/
H A Drsqrt.cl4 x[1] = rsqrt(x[0]);
5 y[1] = rsqrt(y[0]);
/llvm-project/mlir/test/Integration/Dialect/Vector/CPU/X86Vector/
H A Drsqrt.mlir10 %r = x86vector.avx.rsqrt %v : vector<8xf32>
11 …// `rsqrt` may produce slightly different results on Intel and AMD machines: accept both results h…
/llvm-project/mlir/test/Dialect/Complex/
H A Dops.mlir80 // CHECK: complex.rsqrt %[[C]] : complex<f32>
81 %rsqrt = complex.rsqrt %complex : complex<f32>
/llvm-project/mlir/test/Conversion/MathToSPIRV/
H A Dmath-to-opencl-spirv.mlir33 // CHECK: spirv.CL.rsqrt %{{.*}}: f32
34 %9 = math.rsqrt %arg0 : f32
82 // CHECK: spirv.CL.rsqrt %{{.*}}: vector<3xf32>
83 %9 = math.rsqrt %arg0 : vector<3xf32>
/llvm-project/mlir/test/Dialect/Math/
H A Dpolynomial-approximation.mlir562 // We only approximate rsqrt for vectors and when the AVX2 option is enabled.
565 // CHECK: math.rsqrt
566 // AVX2: math.rsqrt
568 %0 = math.rsqrt %arg0 : f32
573 // CHECK: math.rsqrt
584 // AVX2: %[[VAL_9:.*]] = x86vector.avx.rsqrt %[[VAL_0]] : vector<8xf32>
592 %0 = math.rsqrt %arg0 : vector<8xf32>
599 // CHECK: math.rsqrt
601 // AVX2: math.rsqrt
603 %0 = math.rsqrt
[all...]
H A Dops.mlir187 // CHECK-LABEL: func @rsqrt(
189 func.func @rsqrt(%f: f32, %v: vector<4xf32>, %t: tensor<4x4x?xf32>) {
190 // CHECK: %{{.*}} = math.rsqrt %[[F]] : f32
191 %0 = math.rsqrt %f : f32
192 // CHECK: %{{.*}} = math.rsqrt %[[V]] : vector<4xf32>
193 %1 = math.rsqrt %v : vector<4xf32>
194 // CHECK: %{{.*}} = math.rsqrt %[[T]] : tensor<4x4x?xf32>
195 %2 = math.rsqrt %t : tensor<4x4x?xf32>
/llvm-project/llvm/test/CodeGen/X86/GlobalISel/
H A Dregbankselect-sse-intrinsics.ll128 …; CHECK-NEXT: [[INT:%[0-9]+]]:vecr(<4 x s32>) = G_INTRINSIC intrinsic(@llvm.x86.sse.rsqrt.ps), […
132 %res = call <4 x float> @llvm.x86.sse.rsqrt.ps(<4 x float> %a0) ; <<4 x float>> [#uses=1]
136 declare <4 x float> @llvm.x86.sse.rsqrt.ps(<4 x float>) nounwind readnone
145 …; CHECK-NEXT: [[INT:%[0-9]+]]:vecr(<4 x s32>) = G_INTRINSIC intrinsic(@llvm.x86.sse.rsqrt.ss), […
149 %res = call <4 x float> @llvm.x86.sse.rsqrt.ss(<4 x float> %a0) ; <<4 x float>> [#uses=1]
153 declare <4 x float> @llvm.x86.sse.rsqrt.ss(<4 x float>) nounwind readnone
/llvm-project/libc/docs/
H A Dc23.rst

12345678