xref: /aosp_15_r20/external/llvm-libc/src/math/generic/sincosf16_utils.h (revision 71db0c75aadcf003ffe3238005f61d7618a3fead)
1*71db0c75SAndroid Build Coastguard Worker //===-- Collection of utils for sinf16/cosf16 -------------------*- C++ -*-===//
2*71db0c75SAndroid Build Coastguard Worker //
3*71db0c75SAndroid Build Coastguard Worker // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4*71db0c75SAndroid Build Coastguard Worker // See https://llvm.org/LICENSE.txt for license information.
5*71db0c75SAndroid Build Coastguard Worker // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6*71db0c75SAndroid Build Coastguard Worker //
7*71db0c75SAndroid Build Coastguard Worker //===----------------------------------------------------------------------===//
8*71db0c75SAndroid Build Coastguard Worker 
9*71db0c75SAndroid Build Coastguard Worker #ifndef LLVM_LIBC_SRC_MATH_GENERIC_SINCOSF16_UTILS_H
10*71db0c75SAndroid Build Coastguard Worker #define LLVM_LIBC_SRC_MATH_GENERIC_SINCOSF16_UTILS_H
11*71db0c75SAndroid Build Coastguard Worker 
12*71db0c75SAndroid Build Coastguard Worker #include "src/__support/FPUtil/FPBits.h"
13*71db0c75SAndroid Build Coastguard Worker #include "src/__support/FPUtil/PolyEval.h"
14*71db0c75SAndroid Build Coastguard Worker #include "src/__support/FPUtil/nearest_integer.h"
15*71db0c75SAndroid Build Coastguard Worker #include "src/__support/common.h"
16*71db0c75SAndroid Build Coastguard Worker #include "src/__support/macros/config.h"
17*71db0c75SAndroid Build Coastguard Worker 
18*71db0c75SAndroid Build Coastguard Worker namespace LIBC_NAMESPACE_DECL {
19*71db0c75SAndroid Build Coastguard Worker 
20*71db0c75SAndroid Build Coastguard Worker // Lookup table for sin(k * pi / 32) with k = 0, ..., 63.
21*71db0c75SAndroid Build Coastguard Worker // Table is generated with Sollya as follows:
22*71db0c75SAndroid Build Coastguard Worker // > display = hexadecimmal;
23*71db0c75SAndroid Build Coastguard Worker // > for k from 0 to 63 do { round(sin(k * pi/32), SG, RN); };
24*71db0c75SAndroid Build Coastguard Worker constexpr float SIN_K_PI_OVER_32[64] = {
25*71db0c75SAndroid Build Coastguard Worker     0x0.0p0,        0x1.917a6cp-4,  0x1.8f8b84p-3,  0x1.294062p-2,
26*71db0c75SAndroid Build Coastguard Worker     0x1.87de2ap-2,  0x1.e2b5d4p-2,  0x1.1c73b4p-1,  0x1.44cf32p-1,
27*71db0c75SAndroid Build Coastguard Worker     0x1.6a09e6p-1,  0x1.8bc806p-1,  0x1.a9b662p-1,  0x1.c38b3p-1,
28*71db0c75SAndroid Build Coastguard Worker     0x1.d906bcp-1,  0x1.e9f416p-1,  0x1.f6297cp-1,  0x1.fd88dap-1,
29*71db0c75SAndroid Build Coastguard Worker     0x1p0,          0x1.fd88dap-1,  0x1.f6297cp-1,  0x1.e9f416p-1,
30*71db0c75SAndroid Build Coastguard Worker     0x1.d906bcp-1,  0x1.c38b3p-1,   0x1.a9b662p-1,  0x1.8bc806p-1,
31*71db0c75SAndroid Build Coastguard Worker     0x1.6a09e6p-1,  0x1.44cf32p-1,  0x1.1c73b4p-1,  0x1.e2b5d4p-2,
32*71db0c75SAndroid Build Coastguard Worker     0x1.87de2ap-2,  0x1.294062p-2,  0x1.8f8b84p-3,  0x1.917a6cp-4,
33*71db0c75SAndroid Build Coastguard Worker     0x0.0p0,        -0x1.917a6cp-4, -0x1.8f8b84p-3, -0x1.294062p-2,
34*71db0c75SAndroid Build Coastguard Worker     -0x1.87de2ap-2, -0x1.e2b5d4p-2, -0x1.1c73b4p-1, -0x1.44cf32p-1,
35*71db0c75SAndroid Build Coastguard Worker     -0x1.6a09e6p-1, -0x1.8bc806p-1, -0x1.a9b662p-1, -0x1.c38b3p-1,
36*71db0c75SAndroid Build Coastguard Worker     -0x1.d906bcp-1, -0x1.e9f416p-1, -0x1.f6297ep-1, -0x1.fd88dap-1,
37*71db0c75SAndroid Build Coastguard Worker     -0x1p0,         -0x1.fd88dap-1, -0x1.f6297cp-1, -0x1.e9f416p-1,
38*71db0c75SAndroid Build Coastguard Worker     -0x1.d906bcp-1, -0x1.c38b3p-1,  -0x1.a9b662p-1, -0x1.8bc806p-1,
39*71db0c75SAndroid Build Coastguard Worker     -0x1.6a09e6p-1, -0x1.44cf32p-1, -0x1.1c73b4p-1, -0x1.e2b5d4p-2,
40*71db0c75SAndroid Build Coastguard Worker     -0x1.87de2ap-2, -0x1.294062p-2, -0x1.8f8b84p-3, -0x1.917a6cp-4};
41*71db0c75SAndroid Build Coastguard Worker 
range_reduction_sincospif16(float x,float & y)42*71db0c75SAndroid Build Coastguard Worker LIBC_INLINE int32_t range_reduction_sincospif16(float x, float &y) {
43*71db0c75SAndroid Build Coastguard Worker   float kf = fputil::nearest_integer(x * 32);
44*71db0c75SAndroid Build Coastguard Worker   y = fputil::multiply_add<float>(x, 32.0, -kf);
45*71db0c75SAndroid Build Coastguard Worker 
46*71db0c75SAndroid Build Coastguard Worker   return static_cast<int32_t>(kf);
47*71db0c75SAndroid Build Coastguard Worker }
48*71db0c75SAndroid Build Coastguard Worker 
sincospif16_eval(float xf,float & sin_k,float & cos_k,float & sin_y,float & cosm1_y)49*71db0c75SAndroid Build Coastguard Worker LIBC_INLINE void sincospif16_eval(float xf, float &sin_k, float &cos_k,
50*71db0c75SAndroid Build Coastguard Worker                                   float &sin_y, float &cosm1_y) {
51*71db0c75SAndroid Build Coastguard Worker   float y;
52*71db0c75SAndroid Build Coastguard Worker   int32_t k = range_reduction_sincospif16(xf, y);
53*71db0c75SAndroid Build Coastguard Worker 
54*71db0c75SAndroid Build Coastguard Worker   sin_k = SIN_K_PI_OVER_32[k & 63];
55*71db0c75SAndroid Build Coastguard Worker   cos_k = SIN_K_PI_OVER_32[(k + 16) & 63];
56*71db0c75SAndroid Build Coastguard Worker 
57*71db0c75SAndroid Build Coastguard Worker   // Recall, after range reduction, -0.5 <= y <= 0.5. For very small values of
58*71db0c75SAndroid Build Coastguard Worker   // y, calculating sin(y * p/32) can be inaccurate. Generating a polynomial for
59*71db0c75SAndroid Build Coastguard Worker   // sin(y * p/32)/y instead significantly reduces the relative errors.
60*71db0c75SAndroid Build Coastguard Worker   float ysq = y * y;
61*71db0c75SAndroid Build Coastguard Worker 
62*71db0c75SAndroid Build Coastguard Worker   // Degree-6 minimax even polynomial for sin(y*pi/32)/y generated by Sollya
63*71db0c75SAndroid Build Coastguard Worker   // with:
64*71db0c75SAndroid Build Coastguard Worker   // > Q = fpminimax(sin(y * pi/32)/y, [|0, 2, 4, 6|], [|SG...|], [0, 0.5]);
65*71db0c75SAndroid Build Coastguard Worker   sin_y = y * fputil::polyeval(ysq, 0x1.921fb6p-4f, -0x1.4aeabcp-13f,
66*71db0c75SAndroid Build Coastguard Worker                                0x1.a03354p-21f, -0x1.ad02d2p-20f);
67*71db0c75SAndroid Build Coastguard Worker 
68*71db0c75SAndroid Build Coastguard Worker   // Degree-6 minimax even polynomial for cos(y*pi/32) generated by Sollya
69*71db0c75SAndroid Build Coastguard Worker   // with:
70*71db0c75SAndroid Build Coastguard Worker   // > P = fpminimax(cos(y * pi/32), [|0, 2, 4, 6|],[|1, SG...|], [0, 0.5]);
71*71db0c75SAndroid Build Coastguard Worker   cosm1_y = ysq * fputil::polyeval(ysq, -0x1.3bd3ccp-8f, 0x1.03a61ap-18f,
72*71db0c75SAndroid Build Coastguard Worker                                    0x1.a6f7a2p-29f);
73*71db0c75SAndroid Build Coastguard Worker }
74*71db0c75SAndroid Build Coastguard Worker 
75*71db0c75SAndroid Build Coastguard Worker } // namespace LIBC_NAMESPACE_DECL
76*71db0c75SAndroid Build Coastguard Worker 
77*71db0c75SAndroid Build Coastguard Worker #endif // LLVM_LIBC_SRC_MATH_GENERIC_SINCOSF16_UTILS_H
78