xref: /aosp_15_r20/external/llvm-libc/src/math/generic/tanpif16.cpp (revision 71db0c75aadcf003ffe3238005f61d7618a3fead)
1*71db0c75SAndroid Build Coastguard Worker //===-- Half-precision tanpif function ------------------------------------===//
2*71db0c75SAndroid Build Coastguard Worker //
3*71db0c75SAndroid Build Coastguard Worker // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4*71db0c75SAndroid Build Coastguard Worker // See https://llvm.org/LICENSE.txt for license information.
5*71db0c75SAndroid Build Coastguard Worker // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6*71db0c75SAndroid Build Coastguard Worker //
7*71db0c75SAndroid Build Coastguard Worker //===----------------------------------------------------------------------===//
8*71db0c75SAndroid Build Coastguard Worker 
9*71db0c75SAndroid Build Coastguard Worker #include "src/math/tanpif16.h"
10*71db0c75SAndroid Build Coastguard Worker #include "hdr/errno_macros.h"
11*71db0c75SAndroid Build Coastguard Worker #include "hdr/fenv_macros.h"
12*71db0c75SAndroid Build Coastguard Worker #include "sincosf16_utils.h"
13*71db0c75SAndroid Build Coastguard Worker #include "src/__support/FPUtil/FEnvImpl.h"
14*71db0c75SAndroid Build Coastguard Worker #include "src/__support/FPUtil/FPBits.h"
15*71db0c75SAndroid Build Coastguard Worker #include "src/__support/FPUtil/cast.h"
16*71db0c75SAndroid Build Coastguard Worker #include "src/__support/FPUtil/except_value_utils.h"
17*71db0c75SAndroid Build Coastguard Worker #include "src/__support/FPUtil/multiply_add.h"
18*71db0c75SAndroid Build Coastguard Worker #include "src/__support/macros/optimization.h"
19*71db0c75SAndroid Build Coastguard Worker 
20*71db0c75SAndroid Build Coastguard Worker namespace LIBC_NAMESPACE_DECL {
21*71db0c75SAndroid Build Coastguard Worker 
22*71db0c75SAndroid Build Coastguard Worker constexpr size_t N_EXCEPTS = 21;
23*71db0c75SAndroid Build Coastguard Worker 
24*71db0c75SAndroid Build Coastguard Worker constexpr fputil::ExceptValues<float16, N_EXCEPTS> TANF16_EXCEPTS{{
25*71db0c75SAndroid Build Coastguard Worker     // (input, RZ output, RU offset, RD offset, RN offset)
26*71db0c75SAndroid Build Coastguard Worker     {0x07f2, 0x0e3d, 1, 0, 0}, {0x086a, 0x0eee, 1, 0, 1},
27*71db0c75SAndroid Build Coastguard Worker     {0x08db, 0x0fa0, 1, 0, 0}, {0x094c, 0x1029, 1, 0, 0},
28*71db0c75SAndroid Build Coastguard Worker     {0x0b10, 0x118c, 1, 0, 0}, {0x1ce0, 0x23a8, 1, 0, 1},
29*71db0c75SAndroid Build Coastguard Worker     {0x1235, 0x18e0, 1, 0, 0}, {0x2579, 0x2c4e, 1, 0, 0},
30*71db0c75SAndroid Build Coastguard Worker     {0x28b2, 0x2f68, 1, 0, 1}, {0x2a43, 0x30f4, 1, 0, 1},
31*71db0c75SAndroid Build Coastguard Worker     {0x31b7, 0x3907, 1, 0, 0}, {0x329d, 0x3a12, 1, 0, 1},
32*71db0c75SAndroid Build Coastguard Worker     {0x34f1, 0x3dd7, 1, 0, 0}, {0x3658, 0x41ee, 1, 0, 0},
33*71db0c75SAndroid Build Coastguard Worker     {0x38d4, 0xc1ee, 0, 1, 0}, {0x3d96, 0x41ee, 1, 0, 0},
34*71db0c75SAndroid Build Coastguard Worker     {0x3e6a, 0xc1ee, 0, 1, 0}, {0x40cb, 0x41ee, 1, 0, 0},
35*71db0c75SAndroid Build Coastguard Worker     {0x4135, 0xc1ee, 0, 1, 0}, {0x42cb, 0x41ee, 1, 0, 0},
36*71db0c75SAndroid Build Coastguard Worker     {0x4335, 0xc1ee, 0, 1, 0},
37*71db0c75SAndroid Build Coastguard Worker }};
38*71db0c75SAndroid Build Coastguard Worker 
39*71db0c75SAndroid Build Coastguard Worker LLVM_LIBC_FUNCTION(float16, tanpif16, (float16 x)) {
40*71db0c75SAndroid Build Coastguard Worker   using FPBits = typename fputil::FPBits<float16>;
41*71db0c75SAndroid Build Coastguard Worker   FPBits xbits(x);
42*71db0c75SAndroid Build Coastguard Worker 
43*71db0c75SAndroid Build Coastguard Worker   uint16_t x_u = xbits.uintval();
44*71db0c75SAndroid Build Coastguard Worker   uint16_t x_abs = x_u & 0x7fff;
45*71db0c75SAndroid Build Coastguard Worker 
46*71db0c75SAndroid Build Coastguard Worker   // Handle exceptional values
47*71db0c75SAndroid Build Coastguard Worker   if (LIBC_UNLIKELY(x_abs <= 0x4335)) {
48*71db0c75SAndroid Build Coastguard Worker     if (LIBC_UNLIKELY(x_abs == 0U))
49*71db0c75SAndroid Build Coastguard Worker       return x;
50*71db0c75SAndroid Build Coastguard Worker 
51*71db0c75SAndroid Build Coastguard Worker     bool x_sign = x_u >> 15;
52*71db0c75SAndroid Build Coastguard Worker     if (auto r = TANF16_EXCEPTS.lookup_odd(x_abs, x_sign);
53*71db0c75SAndroid Build Coastguard Worker         LIBC_UNLIKELY(r.has_value()))
54*71db0c75SAndroid Build Coastguard Worker       return r.value();
55*71db0c75SAndroid Build Coastguard Worker   }
56*71db0c75SAndroid Build Coastguard Worker 
57*71db0c75SAndroid Build Coastguard Worker   // Numbers greater or equal to 2^10 are integers, or infinity, or NaN
58*71db0c75SAndroid Build Coastguard Worker   if (LIBC_UNLIKELY(x_abs >= 0x6400)) {
59*71db0c75SAndroid Build Coastguard Worker     // Check for NaN or infinity values
60*71db0c75SAndroid Build Coastguard Worker     if (LIBC_UNLIKELY(x_abs >= 0x7c00)) {
61*71db0c75SAndroid Build Coastguard Worker       if (x_abs == 0x7c00) {
62*71db0c75SAndroid Build Coastguard Worker         fputil::set_errno_if_required(EDOM);
63*71db0c75SAndroid Build Coastguard Worker         fputil::raise_except_if_required(FE_INVALID);
64*71db0c75SAndroid Build Coastguard Worker       }
65*71db0c75SAndroid Build Coastguard Worker 
66*71db0c75SAndroid Build Coastguard Worker       return x + FPBits::quiet_nan().get_val();
67*71db0c75SAndroid Build Coastguard Worker     }
68*71db0c75SAndroid Build Coastguard Worker 
69*71db0c75SAndroid Build Coastguard Worker     return FPBits::zero(xbits.sign()).get_val();
70*71db0c75SAndroid Build Coastguard Worker   }
71*71db0c75SAndroid Build Coastguard Worker   // Range reduction:
72*71db0c75SAndroid Build Coastguard Worker   // For |x| > 1/32, we perform range reduction as follows:
73*71db0c75SAndroid Build Coastguard Worker   // Find k and y such that:
74*71db0c75SAndroid Build Coastguard Worker   //   x = (k + y) * 1/32
75*71db0c75SAndroid Build Coastguard Worker   //   k is an integer
76*71db0c75SAndroid Build Coastguard Worker   //   |y| < 0.5
77*71db0c75SAndroid Build Coastguard Worker   //
78*71db0c75SAndroid Build Coastguard Worker   // This is done by performing:
79*71db0c75SAndroid Build Coastguard Worker   //   k = round(x * 32)
80*71db0c75SAndroid Build Coastguard Worker   //   y = x * 32 - k
81*71db0c75SAndroid Build Coastguard Worker   //
82*71db0c75SAndroid Build Coastguard Worker   // Once k and y are computed, we then deduce the answer by tthe formula:
83*71db0c75SAndroid Build Coastguard Worker   // tan(x) = sin(x) / cos(x)
84*71db0c75SAndroid Build Coastguard Worker   //        = (sin_y * cos_k + cos_y * sin_k) / (cos_y * cos_k - sin_y * sin_k)
85*71db0c75SAndroid Build Coastguard Worker   float xf = x;
86*71db0c75SAndroid Build Coastguard Worker   float sin_k, cos_k, sin_y, cosm1_y;
87*71db0c75SAndroid Build Coastguard Worker   sincospif16_eval(xf, sin_k, cos_k, sin_y, cosm1_y);
88*71db0c75SAndroid Build Coastguard Worker 
89*71db0c75SAndroid Build Coastguard Worker   if (LIBC_UNLIKELY(sin_y == 0 && cos_k == 0)) {
90*71db0c75SAndroid Build Coastguard Worker     fputil::set_errno_if_required(EDOM);
91*71db0c75SAndroid Build Coastguard Worker     fputil::raise_except_if_required(FE_DIVBYZERO);
92*71db0c75SAndroid Build Coastguard Worker 
93*71db0c75SAndroid Build Coastguard Worker     int16_t x_mp5_u = static_cast<int16_t>(x - 0.5);
94*71db0c75SAndroid Build Coastguard Worker     return ((x_mp5_u & 0x1) ? -1 : 1) * FPBits::inf().get_val();
95*71db0c75SAndroid Build Coastguard Worker   }
96*71db0c75SAndroid Build Coastguard Worker 
97*71db0c75SAndroid Build Coastguard Worker   using fputil::multiply_add;
98*71db0c75SAndroid Build Coastguard Worker   return fputil::cast<float16>(
99*71db0c75SAndroid Build Coastguard Worker       multiply_add(sin_y, cos_k, multiply_add(cosm1_y, sin_k, sin_k)) /
100*71db0c75SAndroid Build Coastguard Worker       multiply_add(sin_y, -sin_k, multiply_add(cosm1_y, cos_k, cos_k)));
101*71db0c75SAndroid Build Coastguard Worker }
102*71db0c75SAndroid Build Coastguard Worker 
103*71db0c75SAndroid Build Coastguard Worker } // namespace LIBC_NAMESPACE_DECL
104