[libc-commits] [libc] [libc][math][c23] implement C23 math function asinpif16 (PR #146226)
via libc-commits
libc-commits at lists.llvm.org
Mon Jul 14 10:51:28 PDT 2025
================
@@ -0,0 +1,151 @@
+//===-- Half-precision asinpif16(x) function ------------------------------===//
+//
+// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
+// See https://llvm.org/LICENSE.txt for license information.
+// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception.
+//
+//===----------------------------------------------------------------------===//
+
+#include "src/math/asinpif16.h"
+#include "hdr/errno_macros.h"
+#include "hdr/fenv_macros.h"
+#include "src/__support/FPUtil/FEnvImpl.h"
+#include "src/__support/FPUtil/FPBits.h"
+#include "src/__support/FPUtil/PolyEval.h"
+#include "src/__support/FPUtil/cast.h"
+#include "src/__support/FPUtil/except_value_utils.h"
+#include "src/__support/FPUtil/multiply_add.h"
+#include "src/__support/FPUtil/sqrt.h"
+#include "src/__support/macros/optimization.h"
+
+namespace LIBC_NAMESPACE_DECL {
+
+#ifndef LIBC_MATH_HAS_SKIP_ACCURATE_PASS
+static constexpr size_t N_ASINPIF16_EXCEPTS = 3; // entries in the table below
+// Checked via lookup(x_uint) in asinpif16 before the polynomial evaluation.
+static constexpr fputil::ExceptValues<float16, N_ASINPIF16_EXCEPTS>
+ ASINPIF16_EXCEPTS{{
+ // (input_hex, RZ_output_hex, RU_offset, RD_offset, RN_offset)
+ // x = 0.0, asinpif16(0.0) = 0.0
+ {0x0000, 0x0000, 0, 0, 0},
+ // NOTE(review): RZ/RU/RD/RN presumably name rounding modes -- confirm.
+ // x = 0x1.004p-3, asinpif16(x) = 0x1.47p-5 (RZ)
+ {0x3001U, 0x291cU, 1U, 0U, 1U},
+ // x = 0x1.0bp-1, asinpif16(x) = 0x1.658p-3 (RZ)
+ {0x382cU, 0x3196U, 1U, 0U, 0U},
+ }};
+
+#endif // !LIBC_MATH_HAS_SKIP_ACCURATE_PASS
+
+LLVM_LIBC_FUNCTION(float16, asinpif16, (float16 x)) {
+ using FPBits = fputil::FPBits<float16>;
+
+ FPBits xbits(x);
+ uint16_t x_uint = xbits.uintval();
+ bool is_neg = xbits.is_neg();
+ float16 x_abs = xbits.abs().get_val();
+
+ auto signed_result = [is_neg](auto r) -> auto { return is_neg ? -r : r; };
+
+ if (LIBC_UNLIKELY(x_abs > 1.0f16)) {
+ // asinpif16(NaN) = NaN
+ if (xbits.is_nan()) {
+ if (xbits.is_signaling_nan()) {
+ fputil::raise_except_if_required(FE_INVALID);
+ return FPBits::quiet_nan().get_val();
+ }
+ return x;
+ }
+
+ // 1 < |x| <= +inf
+ fputil::raise_except_if_required(FE_INVALID);
+ fputil::set_errno_if_required(EDOM);
+
+ return FPBits::quiet_nan().get_val();
+ }
+
+#ifndef LIBC_MATH_HAS_SKIP_ACCURATE_PASS
+ // exceptional values
+ if (auto r = ASINPIF16_EXCEPTS.lookup(x_uint); LIBC_UNLIKELY(r.has_value()))
+ return r.value();
+#endif // !LIBC_MATH_HAS_SKIP_ACCURATE_PASS
+
+ // the coefficients for the polynomial approximation of asin(x)/pi in the
+ // range [0, 0.5] extracted using python-sympy
+ //
+ // Python code to generate the coefficients:
+ // > from sympy import *
+ // > import math
+ // > x = symbols('x')
+ // > print(series(asin(x)/math.pi, x, 0, 21))
+ //
+ // OUTPUT:
+ //
+ // 0.318309886183791*x + 0.0530516476972984*x**3 + 0.0238732414637843*x**5 +
+ // 0.0142102627760621*x**7 + 0.00967087327815336*x**9 +
+ // 0.00712127941391293*x**11 + 0.00552355646848375*x**13 +
+ // 0.00444514782463692*x**15 + 0.00367705242846804*x**17 +
+ // 0.00310721681820837*x**19 + O(x**21)
+ //
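+ // Only the first 8 terms (through x**15) are used below. The first omitted
+ // term, 0.00367705242846804*x**17, is about 2.8e-8 at x = 0.5, so the
+ // truncation error on [0, 0.5] is far larger than 0.0000000000000001,
+ // though still small relative to half-precision resolution.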
+ constexpr double POLY_COEFFS[10] = {
+ 0x1.45f306dc9c889p-2, // x^1
+ 0x1.b2995e7b7b5fdp-5, // x^3
+ 0x1.8723a1d588a36p-6, // x^5
+ 0x1.d1a452f20430dp-7, // x^7
+ 0x1.3ce52a3a09f61p-7, // x^9
+ 0x1.d2b33e303d375p-8, // x^11
+ 0x1.69fde663c674fp-8, // x^13
+ 0x1.235134885f19bp-8, // x^15
+ };
+ // polynomial evaluation using horner's method
+ // work only for |x| in [0, 0.5]
+ auto asinpi_polyeval = [](double x) -> double {
+ return x * fputil::polyeval(x * x, POLY_COEFFS[0], POLY_COEFFS[1],
+ POLY_COEFFS[2], POLY_COEFFS[3], POLY_COEFFS[4],
+ POLY_COEFFS[5], POLY_COEFFS[6], POLY_COEFFS[7]);
+ };
+
+ // if |x| <= 0.5:
+ if (LIBC_UNLIKELY(x_abs <= 0.5f16)) {
----------------
overmighty wrote:
Same here. On targets without any hardware support for float16, this causes a call to the compiler runtime's half->single-precision conversion function.
https://github.com/llvm/llvm-project/pull/146226
More information about the libc-commits
mailing list