xref: /freebsd/contrib/arm-optimized-routines/math/aarch64/sve/acoshf.c (revision f3087bef11543b42e0d69b708f367097a4118d24)
1*f3087befSAndrew Turner /*
2*f3087befSAndrew Turner  * Single-precision SVE acosh(x) function.
3*f3087befSAndrew Turner  * Copyright (c) 2023-2024, Arm Limited.
4*f3087befSAndrew Turner  * SPDX-License-Identifier: MIT OR Apache-2.0 WITH LLVM-exception
5*f3087befSAndrew Turner  */
6*f3087befSAndrew Turner 
7*f3087befSAndrew Turner #include "sv_math.h"
8*f3087befSAndrew Turner #include "test_sig.h"
9*f3087befSAndrew Turner #include "test_defs.h"
10*f3087befSAndrew Turner 
/* Bit pattern of 1.0f in IEEE-754 binary32; subtracted from the raw bits of
   the input so that x == 1 maps to offset 0.  */
11*f3087befSAndrew Turner #define One 0x3f800000
/* Unsigned offset (relative to One) at which the input reaches 0x1p64;
   offsets at or above this value are treated as special lanes.  */
12*f3087befSAndrew Turner #define Thres 0x20000000 /* asuint(0x1p64) - One.  */
13*f3087befSAndrew Turner 
14*f3087befSAndrew Turner #include "sv_log1pf_inline.h"
15*f3087befSAndrew Turner 
16*f3087befSAndrew Turner static svfloat32_t NOINLINE
special_case(svfloat32_t xm1,svfloat32_t tmp,svbool_t special)17*f3087befSAndrew Turner special_case (svfloat32_t xm1, svfloat32_t tmp, svbool_t special)
18*f3087befSAndrew Turner {
19*f3087befSAndrew Turner   svfloat32_t x = svadd_x (svptrue_b32 (), xm1, 1.0f);
20*f3087befSAndrew Turner   svfloat32_t y = sv_log1pf_inline (tmp, svptrue_b32 ());
21*f3087befSAndrew Turner   return sv_call_f32 (acoshf, x, y, special);
22*f3087befSAndrew Turner }
23*f3087befSAndrew Turner 
24*f3087befSAndrew Turner /* Single-precision SVE acosh(x) routine. Implements the same algorithm as
25*f3087befSAndrew Turner    vector acoshf and log1p.
26*f3087befSAndrew Turner 
27*f3087befSAndrew Turner    Maximum error is 2.47 ULPs:
28*f3087befSAndrew Turner    SV_NAME_F1 (acosh) (0x1.01ca76p+0) got 0x1.e435a6p-4
29*f3087befSAndrew Turner 				     want 0x1.e435a2p-4.  */
SV_NAME_F1(acosh)30*f3087befSAndrew Turner svfloat32_t SV_NAME_F1 (acosh) (svfloat32_t x, const svbool_t pg)
31*f3087befSAndrew Turner {
32*f3087befSAndrew Turner   svuint32_t ix = svreinterpret_u32 (x);
33*f3087befSAndrew Turner   svbool_t special = svcmpge (pg, svsub_x (pg, ix, One), Thres);
34*f3087befSAndrew Turner 
35*f3087befSAndrew Turner   svfloat32_t xm1 = svsub_x (pg, x, 1.0f);
36*f3087befSAndrew Turner   svfloat32_t u = svmul_x (pg, xm1, svadd_x (pg, x, 1.0f));
37*f3087befSAndrew Turner   svfloat32_t tmp = svadd_x (pg, xm1, svsqrt_x (pg, u));
38*f3087befSAndrew Turner 
39*f3087befSAndrew Turner   if (unlikely (svptest_any (pg, special)))
40*f3087befSAndrew Turner     return special_case (xm1, tmp, special);
41*f3087befSAndrew Turner   return sv_log1pf_inline (tmp, pg);
42*f3087befSAndrew Turner }
43*f3087befSAndrew Turner 
/* Test-harness registrations for SV_NAME_F1 (acosh).  The TEST_* macros and
   CLOSE_SVE_ATTR are not defined in this file (presumably they come from
   test_sig.h, test_defs.h and sv_math.h -- confirm).
   NOTE(review): the 1.97 given to TEST_ULP is exactly 0.5 below the 2.47 ULP
   maximum quoted on the routine, so the harness bound presumably excludes
   the 0.5 ULP rounding term -- confirm against the harness.
   The TEST_INTERVAL ranges split at 1 and 0x1p64, the same boundaries the
   routine uses to flag special lanes, and also include negative inputs; the
   last argument is presumably the number of samples.  */
44*f3087befSAndrew Turner TEST_SIG (SV, F, 1, acosh, 1.0, 10.0)
45*f3087befSAndrew Turner TEST_ULP (SV_NAME_F1 (acosh), 1.97)
46*f3087befSAndrew Turner TEST_DISABLE_FENV (SV_NAME_F1 (acosh))
47*f3087befSAndrew Turner TEST_INTERVAL (SV_NAME_F1 (acosh), 0, 1, 500)
48*f3087befSAndrew Turner TEST_INTERVAL (SV_NAME_F1 (acosh), 1, 0x1p64, 100000)
49*f3087befSAndrew Turner TEST_INTERVAL (SV_NAME_F1 (acosh), 0x1p64, inf, 1000)
50*f3087befSAndrew Turner TEST_INTERVAL (SV_NAME_F1 (acosh), -0, -inf, 1000)
51*f3087befSAndrew Turner CLOSE_SVE_ATTR
52