[libc-commits] [libc] [llvm] [libc][math][c23] Add acosbf16 math function (PR #184633)

via libc-commits libc-commits at lists.llvm.org
Sat Jun 6 08:47:28 PDT 2026


================
@@ -0,0 +1,94 @@
+//===-- Implementation header for acosbf16 ----------------------*- C++ -*-===//
+//
+// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
+// See https://llvm.org/LICENSE.txt for license information.
+// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
+//
+//===----------------------------------------------------------------------===//
+
+#ifndef LLVM_LIBC_SRC___SUPPORT_MATH_ACOSBF16_H
+#define LLVM_LIBC_SRC___SUPPORT_MATH_ACOSBF16_H
+
+#include "src/__support/FPUtil/FEnvImpl.h"
+#include "src/__support/FPUtil/FPBits.h"
+#include "src/__support/FPUtil/bfloat16.h"
+#include "src/__support/FPUtil/cast.h"
+#include "src/__support/FPUtil/multiply_add.h"
+#include "src/__support/FPUtil/sqrt.h"
+#include "src/__support/macros/optimization.h"
+#include "src/__support/math/inv_trigf_utils.h"
+
+namespace LIBC_NAMESPACE_DECL {
+namespace math {
+
+LIBC_INLINE bfloat16 acosbf16(bfloat16 x) {
+  // Generated by Sollya using the following command:
+  // > display = hexadecimal;
+  // > round(pi/2, SG, RN);
+  constexpr float PI_2 = 0x1.921fb6p0f;
+  // > round(pi, SG, RN);
+  constexpr float PI = 0x1.921fb6p1;
+
+  using FPBits = fputil::FPBits<bfloat16>;
+  FPBits xbits(x);
+
+  uint16_t x_u = xbits.uintval();
+  uint16_t x_abs = x_u & 0x7fff;
+  bool sign = (x_u >> 15);
+  float xf = x;
+
+  float xf_abs = (xf < 0 ? -xf : xf);
+  float x_sq = xf_abs * xf_abs;
+
+  // case 1: |x| <= 0.5
+  if (x_abs <= 0x3F00) {
+    // |x| = {0}
+    if (LIBC_UNLIKELY(x_abs == 0))
+      return fputil::cast<bfloat16>(PI_2);
+
+    float xp = fputil::cast<float>(inv_trigf_utils_internal::asin_eval(x_sq));
+    float result = xf * fputil::multiply_add(x_sq, xp, 1.0f);
+    return fputil::cast<bfloat16>(PI_2 - result);
+  }
+
+  // case 2: 0.5 < |x| <= 1.0
+  if (x_abs <= 0x3F80) {
+    // |x| = {1}
+    if (x_abs == 0x3F80) {
+      if (sign)
+        return fputil::cast<bfloat16>(PI);
+      else
+        return fputil::cast<bfloat16>(0.0f);
+    }
+
+    // using reduction for acos:
+    // acos(|x|) = 2*asin(sqrt((1 - |x|)/2)),
+    // and acos(x) = acos(|x|) for x >= 0, pi - acos(|x|) for x < 0
+    float t = fputil::multiply_add<float>(xf_abs, -0.5f, 0.5f);
+    float t_sqrt = fputil::sqrt<float>(t);
+    float tp = fputil::cast<float>(inv_trigf_utils_internal::asin_eval(t));
+    float asin_sqrt_t = t_sqrt * (fputil::multiply_add(t, tp, 1.0f));
+
+    return fputil::cast<bfloat16>(
+        (sign) ? fputil::multiply_add(asin_sqrt_t, -2.0f, PI)
+               : 2 * asin_sqrt_t);
----------------
lntue wrote:

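Use `2.0f` instead of the integer literal `2` in `2 * asin_sqrt_t`, so the expression uses a `float` literal like the other constants in this function.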

https://github.com/llvm/llvm-project/pull/184633


More information about the libc-commits mailing list