1*71db0c75SAndroid Build Coastguard Worker //===-- Single-precision cospi function -----------------------------------===// 2*71db0c75SAndroid Build Coastguard Worker // 3*71db0c75SAndroid Build Coastguard Worker // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 4*71db0c75SAndroid Build Coastguard Worker // See https://llvm.org/LICENSE.txt for license information. 5*71db0c75SAndroid Build Coastguard Worker // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 6*71db0c75SAndroid Build Coastguard Worker // 7*71db0c75SAndroid Build Coastguard Worker //===----------------------------------------------------------------------===// 8*71db0c75SAndroid Build Coastguard Worker 9*71db0c75SAndroid Build Coastguard Worker #include "src/math/cospif.h" 10*71db0c75SAndroid Build Coastguard Worker #include "sincosf_utils.h" 11*71db0c75SAndroid Build Coastguard Worker #include "src/__support/FPUtil/FEnvImpl.h" 12*71db0c75SAndroid Build Coastguard Worker #include "src/__support/FPUtil/FPBits.h" 13*71db0c75SAndroid Build Coastguard Worker #include "src/__support/FPUtil/multiply_add.h" 14*71db0c75SAndroid Build Coastguard Worker #include "src/__support/common.h" 15*71db0c75SAndroid Build Coastguard Worker #include "src/__support/macros/config.h" 16*71db0c75SAndroid Build Coastguard Worker #include "src/__support/macros/optimization.h" // LIBC_UNLIKELY 17*71db0c75SAndroid Build Coastguard Worker #include "src/__support/macros/properties/cpu_features.h" // LIBC_TARGET_CPU_HAS_FMA 18*71db0c75SAndroid Build Coastguard Worker 19*71db0c75SAndroid Build Coastguard Worker namespace LIBC_NAMESPACE_DECL { 20*71db0c75SAndroid Build Coastguard Worker 21*71db0c75SAndroid Build Coastguard Worker LLVM_LIBC_FUNCTION(float, cospif, (float x)) { 22*71db0c75SAndroid Build Coastguard Worker using FPBits = typename fputil::FPBits<float>; 23*71db0c75SAndroid Build Coastguard Worker 24*71db0c75SAndroid Build Coastguard Worker FPBits xbits(x); 25*71db0c75SAndroid Build Coastguard Worker xbits.set_sign(Sign::POS); 26*71db0c75SAndroid Build Coastguard Worker 27*71db0c75SAndroid Build Coastguard Worker uint32_t x_abs = xbits.uintval(); 28*71db0c75SAndroid Build Coastguard Worker double xd = static_cast<double>(xbits.get_val()); 29*71db0c75SAndroid Build Coastguard Worker 30*71db0c75SAndroid Build Coastguard Worker // Range reduction: 31*71db0c75SAndroid Build Coastguard Worker // For |x| > 1/32, we perform range reduction as follows: 32*71db0c75SAndroid Build Coastguard Worker // Find k and y such that: 33*71db0c75SAndroid Build Coastguard Worker // x = (k + y) * 1/32 34*71db0c75SAndroid Build Coastguard Worker // k is an integer 35*71db0c75SAndroid Build Coastguard Worker // |y| < 0.5 36*71db0c75SAndroid Build Coastguard Worker // 37*71db0c75SAndroid Build Coastguard Worker // This is done by performing: 38*71db0c75SAndroid Build Coastguard Worker // k = round(x * 32) 39*71db0c75SAndroid Build Coastguard Worker // y = x * 32 - k 40*71db0c75SAndroid Build Coastguard Worker // 41*71db0c75SAndroid Build Coastguard Worker // Once k and y are computed, we then deduce the answer by the cosine of sum 42*71db0c75SAndroid Build Coastguard Worker // formula: 43*71db0c75SAndroid Build Coastguard Worker // cospi(x) = cos((k + y)*pi/32) 44*71db0c75SAndroid Build Coastguard Worker // = cos(y*pi/32) * cos(k*pi/32) - sin(y*pi/32) * sin(k*pi/32) 45*71db0c75SAndroid Build Coastguard Worker // The values of sin(k*pi/32) and cos(k*pi/32) for k = 0..63 are precomputed 46*71db0c75SAndroid Build Coastguard Worker // and stored using a vector of 32 doubles. Sin(y*pi/32) and cos(y*pi/32) are 47*71db0c75SAndroid Build Coastguard Worker // computed using degree-7 and degree-6 minimax polynomials generated by 48*71db0c75SAndroid Build Coastguard Worker // Sollya respectively. 49*71db0c75SAndroid Build Coastguard Worker 50*71db0c75SAndroid Build Coastguard Worker // The exhautive test passes for smaller values 51*71db0c75SAndroid Build Coastguard Worker if (LIBC_UNLIKELY(x_abs < 0x38A2'F984U)) { 52*71db0c75SAndroid Build Coastguard Worker 53*71db0c75SAndroid Build Coastguard Worker #if defined(LIBC_TARGET_CPU_HAS_FMA) 54*71db0c75SAndroid Build Coastguard Worker return fputil::multiply_add(xbits.get_val(), -0x1.0p-25f, 1.0f); 55*71db0c75SAndroid Build Coastguard Worker #else 56*71db0c75SAndroid Build Coastguard Worker return static_cast<float>(fputil::multiply_add(xd, -0x1.0p-25, 1.0)); 57*71db0c75SAndroid Build Coastguard Worker #endif // LIBC_TARGET_CPU_HAS_FMA 58*71db0c75SAndroid Build Coastguard Worker } 59*71db0c75SAndroid Build Coastguard Worker 60*71db0c75SAndroid Build Coastguard Worker // Numbers greater or equal to 2^23 are always integers or NaN 61*71db0c75SAndroid Build Coastguard Worker if (LIBC_UNLIKELY(x_abs >= 0x4B00'0000)) { 62*71db0c75SAndroid Build Coastguard Worker 63*71db0c75SAndroid Build Coastguard Worker if (LIBC_UNLIKELY(x_abs < 0x4B80'0000)) { 64*71db0c75SAndroid Build Coastguard Worker return (x_abs & 0x1) ? -1.0f : 1.0f; 65*71db0c75SAndroid Build Coastguard Worker } 66*71db0c75SAndroid Build Coastguard Worker 67*71db0c75SAndroid Build Coastguard Worker // x is inf or nan. 68*71db0c75SAndroid Build Coastguard Worker if (LIBC_UNLIKELY(x_abs >= 0x7f80'0000U)) { 69*71db0c75SAndroid Build Coastguard Worker if (x_abs == 0x7f80'0000U) { 70*71db0c75SAndroid Build Coastguard Worker fputil::set_errno_if_required(EDOM); 71*71db0c75SAndroid Build Coastguard Worker fputil::raise_except_if_required(FE_INVALID); 72*71db0c75SAndroid Build Coastguard Worker } 73*71db0c75SAndroid Build Coastguard Worker return x + FPBits::quiet_nan().get_val(); 74*71db0c75SAndroid Build Coastguard Worker } 75*71db0c75SAndroid Build Coastguard Worker 76*71db0c75SAndroid Build Coastguard Worker return 1.0f; 77*71db0c75SAndroid Build Coastguard Worker } 78*71db0c75SAndroid Build Coastguard Worker 79*71db0c75SAndroid Build Coastguard Worker // Combine the results with the sine of sum formula: 80*71db0c75SAndroid Build Coastguard Worker // cos(pi * x) = cos((k + y)*pi/32) 81*71db0c75SAndroid Build Coastguard Worker // = cos(y*pi/32) * cos(k*pi/32) - sin(y*pi/32) * sin(k*pi/32) 82*71db0c75SAndroid Build Coastguard Worker // = (cosm1_y + 1) * cos_k - sin_y * sin_k 83*71db0c75SAndroid Build Coastguard Worker // = (cosm1_y * cos_k + cos_k) - sin_y * sin_k 84*71db0c75SAndroid Build Coastguard Worker double sin_k, cos_k, sin_y, cosm1_y; 85*71db0c75SAndroid Build Coastguard Worker 86*71db0c75SAndroid Build Coastguard Worker sincospif_eval(xd, sin_k, cos_k, sin_y, cosm1_y); 87*71db0c75SAndroid Build Coastguard Worker 88*71db0c75SAndroid Build Coastguard Worker if (LIBC_UNLIKELY(sin_y == 0 && cos_k == 0)) { 89*71db0c75SAndroid Build Coastguard Worker return 0.0f; 90*71db0c75SAndroid Build Coastguard Worker } 91*71db0c75SAndroid Build Coastguard Worker 92*71db0c75SAndroid Build Coastguard Worker return static_cast<float>(fputil::multiply_add( 93*71db0c75SAndroid Build Coastguard Worker sin_y, -sin_k, fputil::multiply_add(cosm1_y, cos_k, cos_k))); 94*71db0c75SAndroid Build Coastguard Worker } 95*71db0c75SAndroid Build Coastguard Worker 96*71db0c75SAndroid Build Coastguard Worker } // namespace LIBC_NAMESPACE_DECL 97