// polynomial used for __v_log2f(x)
//
// Copyright (c) 2022-2024, Arm Limited.
// SPDX-License-Identifier: MIT OR Apache-2.0 WITH LLVM-exception

// Sollya script: computes the single-precision coefficients of a polynomial
// approximating log2(1+x) on [a;b] with minimal relative error, then prints
// the achieved relative error, the interval and the coefficients.

deg = 9; // poly degree
a = -1/3;
b = 1/3;

ln2 = evaluate(log(2),0);
// 1/ln(2) rounded to single precision; used both to scale the target
// function and as the fixed constant term of the polynomial below.
invln2 = single(1/ln2);

// find log2(1+x)/x polynomial with minimal relative error
// (minimal relative error polynomial for log2(1+x) is the same * x)
deg = deg-1; // because of /x

// f = log2(1+x)/x; using taylor series
// The series sum_{i=0..60} (-x)^i/(i+1) is log(1+x)/x truncated after 61
// terms; on |x| <= 1/3 the truncation error is below 1e-30.
// Note that f is scaled by the single-rounded invln2 rather than the exact
// 1/ln(2), so f(0) equals the fixed constant term of poly exactly.
f = 0;
for i from 0 to 60 do { f = f + (-x)^i/(i+1); };
f = f * invln2;

// return p that minimizes |f(x) - poly(x) - x^d*p(x)|/|f(x)|
// poly: polynomial made of the coefficients fixed so far (degrees < d)
// d:    degree of the lowest coefficient that is still free
// The result has degree deg-d. It is obtained as a weighted remez problem:
// approximate 1 - poly/f by p with weight x^d/f, which is the relative
// error expression above divided through by f.
approx = proc(poly,d) {
  return remez(1 - poly(x)/f(x), deg-d, [a;b], x^d/f(x), 1e-10);
};

// first coeff is fixed, iteratively find optimal single prec coeffs
// Each pass re-optimises all remaining coefficients given the ones already
// rounded, rounds the result to single precision (SG), and keeps only its
// lowest-order coefficient as the coefficient of x^i.
poly = invln2;
for i from 1 to deg do {
  p = roundcoefficients(approx(poly,i), [|SG ...|]);
  poly = poly + x^i*coeff(p,0);
};

display = hexadecimal;
print("rel error:", accurateinfnorm(1-poly(x)/f(x), [a;b], 30));
print("in [",a,b,"]");
print("coeffs:");
// A bare expression statement is echoed by Sollya, so this prints each
// coefficient from degree 0 up to deg.
for i from 0 to deg do coeff(poly,i);