Add vector exp2f

Same design as in expf. Worst-case error of __v_exp2f and __v_exp2f_1u is 1.96 and 0.88 ulp respectively. It is not clear if round/convert instructions are better or +- Shift. For expf the latter, for exp2f the former seems more consistently faster, but both options are kept in the code for now.
author: Szabolcs Nagy <szabolcs.nagy@arm.com> 2019-10-14 15:21:28 +0100
committer: Szabolcs Nagy <szabolcs.nagy@arm.com> 2019-11-05 18:38:51 +0000
commit: 69170e15cc2a10d7883e2fb40fb4437052febc13 (patch)
tree: 80a149cd724906606532751fab4ff870ad750930 /math/test/ulp.c
parent: 65464ec60ba73d113c8bd1632708014fa82dc9c6 (diff)
download: arm-optimized-routines-69170e15cc2a10d7883e2fb40fb4437052febc13.tar.gz
1 files changed, 12 insertions, 0 deletions
diff --git a/math/test/ulp.c b/math/test/ulp.c
index 60d89bf..ffe3501 100644
--- a/math/test/ulp.c
+++ b/math/test/ulp.c
@@ -227,6 +227,8 @@ static float v_sinf(float x) { return __v_sinf(argf(x))[0]; }
 static float v_cosf(float x) { return __v_cosf(argf(x))[0]; }
 static float v_expf_1u(float x) { return __v_expf_1u(argf(x))[0]; }
 static float v_expf(float x) { return __v_expf(argf(x))[0]; }
+static float v_exp2f_1u(float x) { return __v_exp2f_1u(argf(x))[0]; }
+static float v_exp2f(float x) { return __v_exp2f(argf(x))[0]; }
 static float v_logf(float x) { return __v_logf(argf(x))[0]; }
 static float v_powf(float x, float y) { return __v_powf(argf(x),argf(y))[0]; }
 static double v_sin(double x) { return __v_sin(argd(x))[0]; }
@@ -238,6 +240,8 @@ static float vn_sinf(float x) { return __vn_sinf(argf(x))[0]; }
 static float vn_cosf(float x) { return __vn_cosf(argf(x))[0]; }
 static float vn_expf_1u(float x) { return __vn_expf_1u(argf(x))[0]; }
 static float vn_expf(float x) { return __vn_expf(argf(x))[0]; }
+static float vn_exp2f_1u(float x) { return __vn_exp2f_1u(argf(x))[0]; }
+static float vn_exp2f(float x) { return __vn_exp2f(argf(x))[0]; }
 static float vn_logf(float x) { return __vn_logf(argf(x))[0]; }
 static float vn_powf(float x, float y) { return __vn_powf(argf(x),argf(y))[0]; }
 static double vn_sin(double x) { return __vn_sin(argd(x))[0]; }
@@ -247,6 +251,7 @@ static double vn_log(double x) { return __vn_log(argd(x))[0]; }
 static float Z_sinf(float x) { return _ZGVnN4v_sinf(argf(x))[0]; }
 static float Z_cosf(float x) { return _ZGVnN4v_cosf(argf(x))[0]; }
 static float Z_expf(float x) { return _ZGVnN4v_expf(argf(x))[0]; }
+static float Z_exp2f(float x) { return _ZGVnN4v_exp2f(argf(x))[0]; }
 static float Z_logf(float x) { return _ZGVnN4v_logf(argf(x))[0]; }
 static float Z_powf(float x, float y) { return _ZGVnN4vv_powf(argf(x),argf(y))[0]; }
 static double Z_sin(double x) { return _ZGVnN2v_sin(argd(x))[0]; }
@@ -315,6 +320,8 @@ static const struct fun fun[] = {
  F (__s_cosf, __s_cosf, cos, mpfr_cos, 1, 1, f1, 0)
  F (__s_expf_1u, __s_expf_1u, exp, mpfr_exp, 1, 1, f1, 0)
  F (__s_expf, __s_expf, exp, mpfr_exp, 1, 1, f1, 0)
+ F (__s_exp2f_1u, __s_exp2f_1u, exp2, mpfr_exp2, 1, 1, f1, 0)
+ F (__s_exp2f, __s_exp2f, exp2, mpfr_exp2, 1, 1, f1, 0)
  F (__s_powf, __s_powf, pow, mpfr_pow, 2, 1, f2, 0)
  F (__s_logf, __s_logf, log, mpfr_log, 1, 1, f1, 0)
  F (__s_sin, __s_sin, sinl, mpfr_sin, 1, 0, d1, 0)
@@ -326,6 +333,8 @@ static const struct fun fun[] = {
  F (__v_cosf, v_cosf, cos, mpfr_cos, 1, 1, f1, 1)
  F (__v_expf_1u, v_expf_1u, exp, mpfr_exp, 1, 1, f1, 1)
  F (__v_expf, v_expf, exp, mpfr_exp, 1, 1, f1, 1)
+ F (__v_exp2f_1u, v_exp2f_1u, exp2, mpfr_exp2, 1, 1, f1, 1)
+ F (__v_exp2f, v_exp2f, exp2, mpfr_exp2, 1, 1, f1, 1)
  F (__v_logf, v_logf, log, mpfr_log, 1, 1, f1, 1)
  F (__v_powf, v_powf, pow, mpfr_pow, 2, 1, f2, 1)
  F (__v_sin, v_sin, sinl, mpfr_sin, 1, 0, d1, 1)
@@ -337,6 +346,8 @@ static const struct fun fun[] = {
  F (__vn_cosf, vn_cosf, cos, mpfr_cos, 1, 1, f1, 1)
  F (__vn_expf_1u, vn_expf_1u, exp, mpfr_exp, 1, 1, f1, 1)
  F (__vn_expf, vn_expf, exp, mpfr_exp, 1, 1, f1, 1)
+ F (__vn_exp2f_1u, vn_exp2f_1u, exp2, mpfr_exp2, 1, 1, f1, 1)
+ F (__vn_exp2f, vn_exp2f, exp2, mpfr_exp2, 1, 1, f1, 1)
  F (__vn_logf, vn_logf, log, mpfr_log, 1, 1, f1, 1)
  F (__vn_powf, vn_powf, pow, mpfr_pow, 2, 1, f2, 1)
  F (__vn_sin, vn_sin, sinl, mpfr_sin, 1, 0, d1, 1)
@@ -346,6 +357,7 @@ static const struct fun fun[] = {
  F (_ZGVnN4v_sinf, Z_sinf, sin, mpfr_sin, 1, 1, f1, 1)
  F (_ZGVnN4v_cosf, Z_cosf, cos, mpfr_cos, 1, 1, f1, 1)
  F (_ZGVnN4v_expf, Z_expf, exp, mpfr_exp, 1, 1, f1, 1)
+ F (_ZGVnN4v_exp2f, Z_exp2f, exp2, mpfr_exp2, 1, 1, f1, 1)
  F (_ZGVnN4v_logf, Z_logf, log, mpfr_log, 1, 1, f1, 1)
  F (_ZGVnN4vv_powf, Z_powf, pow, mpfr_pow, 2, 1, f2, 1)
  F (_ZGVnN2v_sin, Z_sin, sinl, mpfr_sin, 1, 0, d1, 1)
author	Szabolcs Nagy <szabolcs.nagy@arm.com>	2019-10-14 15:21:28 +0100
committer	Szabolcs Nagy <szabolcs.nagy@arm.com>	2019-11-05 18:38:51 +0000
commit	69170e15cc2a10d7883e2fb40fb4437052febc13 (patch)
tree	80a149cd724906606532751fab4ff870ad750930 /math/test/ulp.c
parent	65464ec60ba73d113c8bd1632708014fa82dc9c6 (diff)
download	arm-optimized-routines-69170e15cc2a10d7883e2fb40fb4437052febc13.tar.gz