diff options
author | Szabolcs Nagy <szabolcs.nagy@arm.com> | 2019-08-09 15:39:09 +0100 |
---|---|---|
committer | Szabolcs Nagy <szabolcs.nagy@arm.com> | 2019-10-14 11:58:53 +0100 |
commit | c5cba8528da13fe0d647dbd0f80d0cf21434b224 (patch) | |
tree | fe2dfbc6732ee358a011073e39adf4d36c71a86a /math/test/ulp.c | |
parent | c280e49d7b1d1987e75de0e0e57a63ee7167ad5f (diff) | |
download | arm-optimized-routines-c5cba8528da13fe0d647dbd0f80d0cf21434b224.tar.gz |
Add vector sinf and cosf
The polynomials were produced by searching the coefficient space using
heuristics and ideas from https://arxiv.org/abs/1508.03211
The worst-case error is 1.886 ulp, large inputs (> 2^20) and other
special cases use scalar sinf and cosf.
Diffstat (limited to 'math/test/ulp.c')
-rw-r--r-- | math/test/ulp.c | 14 |
1 files changed, 14 insertions, 0 deletions
diff --git a/math/test/ulp.c b/math/test/ulp.c index 2ffba9b..4eb9d85 100644 --- a/math/test/ulp.c +++ b/math/test/ulp.c @@ -223,15 +223,21 @@ static const double dv[2] = {1.0, -INFINITY}; static inline v_float argf(float x) { return (v_float){x,x,x,fv[secondcall]}; } static inline v_double argd(double x) { return (v_double){x,dv[secondcall]}; } +static float v_sinf(float x) { return __v_sinf(argf(x))[0]; } +static float v_cosf(float x) { return __v_cosf(argf(x))[0]; } static float v_expf_1u(float x) { return __v_expf_1u(argf(x))[0]; } static float v_expf(float x) { return __v_expf(argf(x))[0]; } static float v_logf(float x) { return __v_logf(argf(x))[0]; } static double v_exp(double x) { return __v_exp(argd(x))[0]; } #ifdef __vpcs +static float vn_sinf(float x) { return __vn_sinf(argf(x))[0]; } +static float vn_cosf(float x) { return __vn_cosf(argf(x))[0]; } static float vn_expf_1u(float x) { return __vn_expf_1u(argf(x))[0]; } static float vn_expf(float x) { return __vn_expf(argf(x))[0]; } static float vn_logf(float x) { return __vn_logf(argf(x))[0]; } static double vn_exp(double x) { return __vn_exp(argd(x))[0]; } +static float Z_sinf(float x) { return _ZGVnN4v_sinf(argf(x))[0]; } +static float Z_cosf(float x) { return _ZGVnN4v_cosf(argf(x))[0]; } static float Z_expf(float x) { return _ZGVnN4v_expf(argf(x))[0]; } static float Z_logf(float x) { return _ZGVnN4v_logf(argf(x))[0]; } static double Z_exp(double x) { return _ZGVnN2v_exp(argd(x))[0]; } @@ -293,20 +299,28 @@ static const struct fun fun[] = { D1 (log) D1 (log2) D2 (pow) + F (__s_sinf, __s_sinf, sin, mpfr_sin, 1, 1, f1, 0) + F (__s_cosf, __s_cosf, cos, mpfr_cos, 1, 1, f1, 0) F (__s_expf_1u, __s_expf_1u, exp, mpfr_exp, 1, 1, f1, 0) F (__s_expf, __s_expf, exp, mpfr_exp, 1, 1, f1, 0) F (__s_logf, __s_logf, log, mpfr_log, 1, 1, f1, 0) F (__s_exp, __s_exp, expl, mpfr_exp, 1, 0, d1, 0) #if __aarch64__ + F (__v_sinf, v_sinf, sin, mpfr_sin, 1, 1, f1, 1) + F (__v_cosf, v_cosf, cos, mpfr_cos, 1, 1, f1, 1) F (__v_expf_1u, v_expf_1u, exp, mpfr_exp, 1, 1, f1, 1) F (__v_expf, v_expf, exp, mpfr_exp, 1, 1, f1, 1) F (__v_logf, v_logf, log, mpfr_log, 1, 1, f1, 1) F (__v_exp, v_exp, expl, mpfr_exp, 1, 0, d1, 1) #ifdef __vpcs + F (__vn_sinf, vn_sinf, sin, mpfr_sin, 1, 1, f1, 1) + F (__vn_cosf, vn_cosf, cos, mpfr_cos, 1, 1, f1, 1) F (__vn_expf_1u, vn_expf_1u, exp, mpfr_exp, 1, 1, f1, 1) F (__vn_expf, vn_expf, exp, mpfr_exp, 1, 1, f1, 1) F (__vn_logf, vn_logf, log, mpfr_log, 1, 1, f1, 1) F (__vn_exp, vn_exp, expl, mpfr_exp, 1, 0, d1, 1) + F (_ZGVnN4v_sinf, Z_sinf, sin, mpfr_sin, 1, 1, f1, 1) + F (_ZGVnN4v_cosf, Z_cosf, cos, mpfr_cos, 1, 1, f1, 1) F (_ZGVnN4v_expf, Z_expf, exp, mpfr_exp, 1, 1, f1, 1) F (_ZGVnN4v_logf, Z_logf, log, mpfr_log, 1, 1, f1, 1) F (_ZGVnN2v_exp, Z_exp, expl, mpfr_exp, 1, 0, d1, 1) |