/*
 * ULP error checking tool for math functions.
 *
 * Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
 * See https://llvm.org/LICENSE.txt for license information.
 * SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
 */

#include <ctype.h>
#include <fenv.h>
#include <float.h>
#include <math.h>
#include <stdint.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include "mathlib.h"

/* Build-time configuration.  Both switches may be predefined on the
   compiler command line; the values below are only defaults.  */

/* Don't depend on mpfr by default.  */
#ifndef USE_MPFR
# define USE_MPFR 0
#endif
#if USE_MPFR
# include <mpfr.h>
#endif

#ifndef WANT_VMATH
/* Enable the build of vector math code.  */
# define WANT_VMATH 1
#endif

/* Bit-level reinterpretation helpers.  Each one stores its argument in a
   union and reads it back through the member of the other type, so the bit
   pattern is kept unchanged and no numeric conversion takes place.  */

/* Return the 64-bit pattern that represents the double F.  */
static inline uint64_t
asuint64 (double f)
{
  union
  {
    double f;
    uint64_t i;
  } u = {f};
  return u.i;
}

/* Return the double whose representation is the 64-bit pattern I.  */
static inline double
asdouble (uint64_t i)
{
  union
  {
    uint64_t i;
    double f;
  } u = {i};
  return u.f;
}

/* Return the 32-bit pattern that represents the float F.  */
static inline uint32_t
asuint (float f)
{
  union
  {
    float f;
    uint32_t i;
  } u = {f};
  return u.i;
}

/* Return the float whose representation is the 32-bit pattern I.  */
static inline float
asfloat (uint32_t i)
{
  union
  {
    uint32_t i;
    float f;
  } u = {i};
  return u.f;
}

/* State of the pseudo-random generator.  It starts from a fixed value, so
   every run produces the same sequence.  */
static uint64_t seed = 0x0123456789abcdef;

/* Advance the generator state and return the next 64-bit pseudo-random
   value.  The state update is a multiply-and-add that wraps modulo 2^64;
   the returned value is the new state with its high half xored into its
   low half.  */
static uint64_t
rand64 (void)
{
  seed = 6364136223846793005ull * seed + 1;
  return seed ^ (seed >> 32);
}

/* Uniform random in [0,n].  */
static uint64_t
randn (uint64_t n)
{
  uint64_t r, m;

  if (n == 0)
    return 0;
  /* From here on n is the number of distinct results, not the maximum.  */
  n++;
  /* n wrapped to 0: the caller asked for the full 64-bit range.  */
  if (n == 0)
    return rand64 ();
  /* Rejection sampling.  r - m is the largest multiple of n not above r and
     -n is 2^64 - n in unsigned arithmetic, so the test accepts r only when
     the whole group [r - m, r - m + n) fits below 2^64.  That keeps every
     remainder equally likely.  */
  for (;;)
    {
      r = rand64 ();
      m = r % n;
      if (r - m <= -n)
        return m;
    }
}

/* Input generator state.  All ranges are expressed on the integer bit
   patterns of the floating-point inputs, not on their numeric values.  */
struct gen
{
  uint64_t start;  /* Bit pattern of the first value of the first argument.  */
  uint64_t len;    /* Size of the first range: last pattern minus start.  */
  uint64_t start2; /* Bit pattern of the first value of the second argument.  */
  uint64_t len2;   /* Size of the second range.  */
  uint64_t off;    /* Current offset from start (single argument sampling).  */
  uint64_t step;   /* Base increment of off (single argument sampling).  */
  uint64_t cnt;    /* Number of samples requested.  */
};

/* Argument bundles, one per combination of precision (f = float,
   d = double) and arity (1 or 2).  x is the first argument and x2 the
   second.  */
struct args_f1
{
  float x;
};

struct args_f2
{
  float x;
  float x2;
};

struct args_d1
{
  double x;
};

struct args_d2
{
  double x;
  double x2;
};

/* result = y + tail*2^ulpexp.
   NOTE(review): ex and ex_may are not used in this file; presumably they
   hold floating-point exception flags consumed by ulp.h - confirm there.  */
struct ret_f
{
  float y;
  double tail;
  int ulpexp;
  int ex;
  int ex_may;
};

/* Same layout as struct ret_f, with a double result.  */
struct ret_d
{
  double y;
  double tail;
  int ulpexp;
  int ex;
  int ex_may;
};

static inline uint64_t
|
|
next1 (struct gen *g)
|
|
{
|
|
/* For single argument use randomized incremental steps,
|
|
that produce dense sampling without collisions and allow
|
|
testing all inputs in a range. */
|
|
uint64_t r = g->start + g->off;
|
|
g->off += g->step + randn (g->step / 2);
|
|
if (g->off > g->len)
|
|
g->off -= g->len; /* hack. */
|
|
return r;
|
|
}
|
|
|
|
static inline uint64_t
|
|
next2 (uint64_t *x2, struct gen *g)
|
|
{
|
|
/* For two arguments use uniform random sampling. */
|
|
uint64_t r = g->start + randn (g->len);
|
|
*x2 = g->start2 + randn (g->len2);
|
|
return r;
|
|
}
|
|
|
|
static struct args_f1
|
|
next_f1 (void *g)
|
|
{
|
|
return (struct args_f1){asfloat (next1 (g))};
|
|
}
|
|
|
|
static struct args_f2
|
|
next_f2 (void *g)
|
|
{
|
|
uint64_t x2;
|
|
uint64_t x = next2 (&x2, g);
|
|
return (struct args_f2){asfloat (x), asfloat (x2)};
|
|
}
|
|
|
|
static struct args_d1
|
|
next_d1 (void *g)
|
|
{
|
|
return (struct args_d1){asdouble (next1 (g))};
|
|
}
|
|
|
|
static struct args_d2
|
|
next_d2 (void *g)
|
|
{
|
|
uint64_t x2;
|
|
uint64_t x = next2 (&x2, g);
|
|
return (struct args_d2){asdouble (x), asdouble (x2)};
|
|
}
|
|
|
|
/* Run configuration, filled in by main from the command line.  */
struct conf
{
  int r;                /* Rounding mode as an FE_* constant.  */
  int rc;               /* Rounding mode letter from -r: n, u, d or z.  */
  int quiet;            /* Set by -q.  */
  int mpfr;             /* Set by -m, or forced when long double has no
                           extra precision over double.  */
  int fenv;             /* Cleared by -f.  */
  unsigned long long n; /* Number of samples, copied from the generator.  */
  double softlim;       /* Value of -l (soft ULP limit), default 0.  */
  double errlim;        /* Value of -e (ULP limit), default INFINITY.  */
};

/* Wrappers for sincos. */
|
|
static float sincosf_sinf(float x) {(void)cosf(x); return sinf(x);}
|
|
static float sincosf_cosf(float x) {(void)sinf(x); return cosf(x);}
|
|
static double sincos_sin(double x) {(void)cos(x); return sin(x);}
|
|
static double sincos_cos(double x) {(void)sin(x); return cos(x);}
|
|
#if USE_MPFR
|
|
static int sincos_mpfr_sin(mpfr_t y, const mpfr_t x, mpfr_rnd_t r) { mpfr_cos(y,x,r); return mpfr_sin(y,x,r); }
|
|
static int sincos_mpfr_cos(mpfr_t y, const mpfr_t x, mpfr_rnd_t r) { mpfr_sin(y,x,r); return mpfr_cos(y,x,r); }
|
|
#endif
|
|
|
|
/* A bit of a hack: call vector functions twice with the same
   input in lane 0 but a different value in other lanes: once
   with an in-range value and then with a special case value.  */
static int secondcall;

/* Wrappers for vector functions.  Each wrapper builds a vector argument with
   the scalar input in lane 0, calls the vector routine and returns lane 0 of
   the result.  The last lane is filled from fv/dv, indexed by secondcall:
   1.0 when it is 0 and -INFINITY when it is 1.  */
#if __aarch64__ && WANT_VMATH
typedef __f32x4_t v_float;
typedef __f64x2_t v_double;
static const float fv[2] = {1.0f, -INFINITY};
static const double dv[2] = {1.0, -INFINITY};
static inline v_float argf(float x) { return (v_float){x,x,x,fv[secondcall]}; }
static inline v_double argd(double x) { return (v_double){x,dv[secondcall]}; }

static float v_sinf(float x) { return __v_sinf(argf(x))[0]; }
static float v_cosf(float x) { return __v_cosf(argf(x))[0]; }
static float v_expf_1u(float x) { return __v_expf_1u(argf(x))[0]; }
static float v_expf(float x) { return __v_expf(argf(x))[0]; }
static float v_exp2f_1u(float x) { return __v_exp2f_1u(argf(x))[0]; }
static float v_exp2f(float x) { return __v_exp2f(argf(x))[0]; }
static float v_logf(float x) { return __v_logf(argf(x))[0]; }
static float v_powf(float x, float y) { return __v_powf(argf(x),argf(y))[0]; }
static double v_sin(double x) { return __v_sin(argd(x))[0]; }
static double v_cos(double x) { return __v_cos(argd(x))[0]; }
static double v_exp(double x) { return __v_exp(argd(x))[0]; }
static double v_log(double x) { return __v_log(argd(x))[0]; }
static double v_pow(double x, double y) { return __v_pow(argd(x),argd(y))[0]; }
#ifdef __vpcs
static float vn_sinf(float x) { return __vn_sinf(argf(x))[0]; }
static float vn_cosf(float x) { return __vn_cosf(argf(x))[0]; }
static float vn_expf_1u(float x) { return __vn_expf_1u(argf(x))[0]; }
static float vn_expf(float x) { return __vn_expf(argf(x))[0]; }
static float vn_exp2f_1u(float x) { return __vn_exp2f_1u(argf(x))[0]; }
static float vn_exp2f(float x) { return __vn_exp2f(argf(x))[0]; }
static float vn_logf(float x) { return __vn_logf(argf(x))[0]; }
static float vn_powf(float x, float y) { return __vn_powf(argf(x),argf(y))[0]; }
static double vn_sin(double x) { return __vn_sin(argd(x))[0]; }
static double vn_cos(double x) { return __vn_cos(argd(x))[0]; }
static double vn_exp(double x) { return __vn_exp(argd(x))[0]; }
static double vn_log(double x) { return __vn_log(argd(x))[0]; }
static double vn_pow(double x, double y) { return __vn_pow(argd(x),argd(y))[0]; }
static float Z_sinf(float x) { return _ZGVnN4v_sinf(argf(x))[0]; }
static float Z_cosf(float x) { return _ZGVnN4v_cosf(argf(x))[0]; }
static float Z_expf(float x) { return _ZGVnN4v_expf(argf(x))[0]; }
static float Z_exp2f(float x) { return _ZGVnN4v_exp2f(argf(x))[0]; }
static float Z_logf(float x) { return _ZGVnN4v_logf(argf(x))[0]; }
static float Z_powf(float x, float y) { return _ZGVnN4vv_powf(argf(x),argf(y))[0]; }
static double Z_sin(double x) { return _ZGVnN2v_sin(argd(x))[0]; }
static double Z_cos(double x) { return _ZGVnN2v_cos(argd(x))[0]; }
static double Z_exp(double x) { return _ZGVnN2v_exp(argd(x))[0]; }
static double Z_log(double x) { return _ZGVnN2v_log(argd(x))[0]; }
static double Z_pow(double x, double y) { return _ZGVnN2vv_pow(argd(x),argd(y))[0]; }
#endif
#endif

/* Description of one function that can be tested.  In each union only the
   member that matches the precision and arity is meaningful: f1/f2 for
   float functions of one/two arguments, d1/d2 for double functions.  */
struct fun
{
  const char *name; /* Name accepted on the command line.  */
  int arity;        /* Number of arguments: 1 or 2.  */
  int singleprec;   /* Nonzero for float functions, zero for double.  */
  int twice;        /* Set for the vector wrappers in the table below.
                       NOTE(review): presumably requests the second call
                       described at secondcall - confirm in ulp.h.  */
  /* The function under test.  */
  union
  {
    float (*f1) (float);
    float (*f2) (float, float);
    double (*d1) (double);
    double (*d2) (double, double);
  } fun;
  /* Reference implementation in the next wider type: double for float
     functions, long double for double functions.  */
  union
  {
    double (*f1) (double);
    double (*f2) (double, double);
    long double (*d1) (long double);
    long double (*d2) (long double, long double);
  } fun_long;
#if USE_MPFR
  /* Reference implementation based on mpfr.  */
  union
  {
    int (*f1) (mpfr_t, const mpfr_t, mpfr_rnd_t);
    int (*f2) (mpfr_t, const mpfr_t, const mpfr_t, mpfr_rnd_t);
    int (*d1) (mpfr_t, const mpfr_t, mpfr_rnd_t);
    int (*d2) (mpfr_t, const mpfr_t, const mpfr_t, mpfr_rnd_t);
  } fun_mpfr;
#endif
};

static const struct fun fun[] = {
|
|
#if USE_MPFR
|
|
# define F(x, x_wrap, x_long, x_mpfr, a, s, t, twice) \
|
|
{#x, a, s, twice, {.t = x_wrap}, {.t = x_long}, {.t = x_mpfr}},
|
|
#else
|
|
# define F(x, x_wrap, x_long, x_mpfr, a, s, t, twice) \
|
|
{#x, a, s, twice, {.t = x_wrap}, {.t = x_long}},
|
|
#endif
|
|
#define F1(x) F (x##f, x##f, x, mpfr_##x, 1, 1, f1, 0)
|
|
#define F2(x) F (x##f, x##f, x, mpfr_##x, 2, 1, f2, 0)
|
|
#define D1(x) F (x, x, x##l, mpfr_##x, 1, 0, d1, 0)
|
|
#define D2(x) F (x, x, x##l, mpfr_##x, 2, 0, d2, 0)
|
|
F1 (sin)
|
|
F1 (cos)
|
|
F (sincosf_sinf, sincosf_sinf, sincos_sin, sincos_mpfr_sin, 1, 1, f1, 0)
|
|
F (sincosf_cosf, sincosf_cosf, sincos_cos, sincos_mpfr_cos, 1, 1, f1, 0)
|
|
F1 (exp)
|
|
F1 (exp2)
|
|
F1 (log)
|
|
F1 (log2)
|
|
F2 (pow)
|
|
D1 (exp)
|
|
D1 (exp2)
|
|
D1 (log)
|
|
D1 (log2)
|
|
D2 (pow)
|
|
#if WANT_VMATH
|
|
F (__s_sinf, __s_sinf, sin, mpfr_sin, 1, 1, f1, 0)
|
|
F (__s_cosf, __s_cosf, cos, mpfr_cos, 1, 1, f1, 0)
|
|
F (__s_expf_1u, __s_expf_1u, exp, mpfr_exp, 1, 1, f1, 0)
|
|
F (__s_expf, __s_expf, exp, mpfr_exp, 1, 1, f1, 0)
|
|
F (__s_exp2f_1u, __s_exp2f_1u, exp2, mpfr_exp2, 1, 1, f1, 0)
|
|
F (__s_exp2f, __s_exp2f, exp2, mpfr_exp2, 1, 1, f1, 0)
|
|
F (__s_powf, __s_powf, pow, mpfr_pow, 2, 1, f2, 0)
|
|
F (__s_logf, __s_logf, log, mpfr_log, 1, 1, f1, 0)
|
|
F (__s_sin, __s_sin, sinl, mpfr_sin, 1, 0, d1, 0)
|
|
F (__s_cos, __s_cos, cosl, mpfr_cos, 1, 0, d1, 0)
|
|
F (__s_exp, __s_exp, expl, mpfr_exp, 1, 0, d1, 0)
|
|
F (__s_log, __s_log, logl, mpfr_log, 1, 0, d1, 0)
|
|
F (__s_pow, __s_pow, powl, mpfr_pow, 2, 0, d2, 0)
|
|
#if __aarch64__
|
|
F (__v_sinf, v_sinf, sin, mpfr_sin, 1, 1, f1, 1)
|
|
F (__v_cosf, v_cosf, cos, mpfr_cos, 1, 1, f1, 1)
|
|
F (__v_expf_1u, v_expf_1u, exp, mpfr_exp, 1, 1, f1, 1)
|
|
F (__v_expf, v_expf, exp, mpfr_exp, 1, 1, f1, 1)
|
|
F (__v_exp2f_1u, v_exp2f_1u, exp2, mpfr_exp2, 1, 1, f1, 1)
|
|
F (__v_exp2f, v_exp2f, exp2, mpfr_exp2, 1, 1, f1, 1)
|
|
F (__v_logf, v_logf, log, mpfr_log, 1, 1, f1, 1)
|
|
F (__v_powf, v_powf, pow, mpfr_pow, 2, 1, f2, 1)
|
|
F (__v_sin, v_sin, sinl, mpfr_sin, 1, 0, d1, 1)
|
|
F (__v_cos, v_cos, cosl, mpfr_cos, 1, 0, d1, 1)
|
|
F (__v_exp, v_exp, expl, mpfr_exp, 1, 0, d1, 1)
|
|
F (__v_log, v_log, logl, mpfr_log, 1, 0, d1, 1)
|
|
F (__v_pow, v_pow, powl, mpfr_pow, 2, 0, d2, 1)
|
|
#ifdef __vpcs
|
|
F (__vn_sinf, vn_sinf, sin, mpfr_sin, 1, 1, f1, 1)
|
|
F (__vn_cosf, vn_cosf, cos, mpfr_cos, 1, 1, f1, 1)
|
|
F (__vn_expf_1u, vn_expf_1u, exp, mpfr_exp, 1, 1, f1, 1)
|
|
F (__vn_expf, vn_expf, exp, mpfr_exp, 1, 1, f1, 1)
|
|
F (__vn_exp2f_1u, vn_exp2f_1u, exp2, mpfr_exp2, 1, 1, f1, 1)
|
|
F (__vn_exp2f, vn_exp2f, exp2, mpfr_exp2, 1, 1, f1, 1)
|
|
F (__vn_logf, vn_logf, log, mpfr_log, 1, 1, f1, 1)
|
|
F (__vn_powf, vn_powf, pow, mpfr_pow, 2, 1, f2, 1)
|
|
F (__vn_sin, vn_sin, sinl, mpfr_sin, 1, 0, d1, 1)
|
|
F (__vn_cos, vn_cos, cosl, mpfr_cos, 1, 0, d1, 1)
|
|
F (__vn_exp, vn_exp, expl, mpfr_exp, 1, 0, d1, 1)
|
|
F (__vn_log, vn_log, logl, mpfr_log, 1, 0, d1, 1)
|
|
F (__vn_pow, vn_pow, powl, mpfr_pow, 2, 0, d2, 1)
|
|
F (_ZGVnN4v_sinf, Z_sinf, sin, mpfr_sin, 1, 1, f1, 1)
|
|
F (_ZGVnN4v_cosf, Z_cosf, cos, mpfr_cos, 1, 1, f1, 1)
|
|
F (_ZGVnN4v_expf, Z_expf, exp, mpfr_exp, 1, 1, f1, 1)
|
|
F (_ZGVnN4v_exp2f, Z_exp2f, exp2, mpfr_exp2, 1, 1, f1, 1)
|
|
F (_ZGVnN4v_logf, Z_logf, log, mpfr_log, 1, 1, f1, 1)
|
|
F (_ZGVnN4vv_powf, Z_powf, pow, mpfr_pow, 2, 1, f2, 1)
|
|
F (_ZGVnN2v_sin, Z_sin, sinl, mpfr_sin, 1, 0, d1, 1)
|
|
F (_ZGVnN2v_cos, Z_cos, cosl, mpfr_cos, 1, 0, d1, 1)
|
|
F (_ZGVnN2v_exp, Z_exp, expl, mpfr_exp, 1, 0, d1, 1)
|
|
F (_ZGVnN2v_log, Z_log, logl, mpfr_log, 1, 0, d1, 1)
|
|
F (_ZGVnN2vv_pow, Z_pow, powl, mpfr_pow, 2, 0, d2, 1)
|
|
#endif
|
|
#endif
|
|
#endif
|
|
#undef F
|
|
#undef F1
|
|
#undef F2
|
|
#undef D1
|
|
#undef D2
|
|
{0}};
|
|
|
|
/* Boilerplate for generic calls.  */

/* Return the binary exponent of one unit in the last place of the float X.
   The biased exponent field is read from bits 23..30; a field of 0 (zero or
   subnormal input) is treated as 1, so such inputs share the scale of the
   smallest normal binade.  The bias (0x7f) and the 23 fraction bits are
   then subtracted.  */
static inline int
ulpscale_f (float x)
{
  int e = asuint (x) >> 23 & 0xff;
  if (!e)
    e++;
  return e - 0x7f - 23;
}

/* Double counterpart of ulpscale_f: exponent field in bits 52..62, bias
   0x3ff, 52 fraction bits.  */
static inline int
ulpscale_d (double x)
{
  int e = asuint64 (x) >> 52 & 0x7ff;
  if (!e)
    e++;
  return e - 0x3ff - 52;
}

static inline float
|
|
call_f1 (const struct fun *f, struct args_f1 a)
|
|
{
|
|
return f->fun.f1 (a.x);
|
|
}
|
|
static inline float
|
|
call_f2 (const struct fun *f, struct args_f2 a)
|
|
{
|
|
return f->fun.f2 (a.x, a.x2);
|
|
}
|
|
|
|
static inline double
|
|
call_d1 (const struct fun *f, struct args_d1 a)
|
|
{
|
|
return f->fun.d1 (a.x);
|
|
}
|
|
static inline double
|
|
call_d2 (const struct fun *f, struct args_d2 a)
|
|
{
|
|
return f->fun.d2 (a.x, a.x2);
|
|
}
|
|
static inline double
|
|
call_long_f1 (const struct fun *f, struct args_f1 a)
|
|
{
|
|
return f->fun_long.f1 (a.x);
|
|
}
|
|
static inline double
|
|
call_long_f2 (const struct fun *f, struct args_f2 a)
|
|
{
|
|
return f->fun_long.f2 (a.x, a.x2);
|
|
}
|
|
static inline long double
|
|
call_long_d1 (const struct fun *f, struct args_d1 a)
|
|
{
|
|
return f->fun_long.d1 (a.x);
|
|
}
|
|
static inline long double
|
|
call_long_d2 (const struct fun *f, struct args_d2 a)
|
|
{
|
|
return f->fun_long.d2 (a.x, a.x2);
|
|
}
|
|
static inline void
|
|
printcall_f1 (const struct fun *f, struct args_f1 a)
|
|
{
|
|
printf ("%s(%a)", f->name, a.x);
|
|
}
|
|
static inline void
|
|
printcall_f2 (const struct fun *f, struct args_f2 a)
|
|
{
|
|
printf ("%s(%a, %a)", f->name, a.x, a.x2);
|
|
}
|
|
static inline void
|
|
printcall_d1 (const struct fun *f, struct args_d1 a)
|
|
{
|
|
printf ("%s(%a)", f->name, a.x);
|
|
}
|
|
static inline void
|
|
printcall_d2 (const struct fun *f, struct args_d2 a)
|
|
{
|
|
printf ("%s(%a, %a)", f->name, a.x, a.x2);
|
|
}
|
|
static inline void
|
|
printgen_f1 (const struct fun *f, struct gen *gen)
|
|
{
|
|
printf ("%s in [%a;%a]", f->name, asfloat (gen->start),
|
|
asfloat (gen->start + gen->len));
|
|
}
|
|
static inline void
|
|
printgen_f2 (const struct fun *f, struct gen *gen)
|
|
{
|
|
printf ("%s in [%a;%a] x [%a;%a]", f->name, asfloat (gen->start),
|
|
asfloat (gen->start + gen->len), asfloat (gen->start2),
|
|
asfloat (gen->start2 + gen->len2));
|
|
}
|
|
static inline void
|
|
printgen_d1 (const struct fun *f, struct gen *gen)
|
|
{
|
|
printf ("%s in [%a;%a]", f->name, asdouble (gen->start),
|
|
asdouble (gen->start + gen->len));
|
|
}
|
|
static inline void
|
|
printgen_d2 (const struct fun *f, struct gen *gen)
|
|
{
|
|
printf ("%s in [%a;%a] x [%a;%a]", f->name, asdouble (gen->start),
|
|
asdouble (gen->start + gen->len), asdouble (gen->start2),
|
|
asdouble (gen->start2 + gen->len2));
|
|
}
|
|
|
|
/* Apply f to every argument stored in the argument bundle a and combine the
   results with the binary operator op.  For the one argument variants op is
   unused.  The bundle expression is parenthesized so that any expression
   can be passed for a.  */
#define reduce_f1(a, f, op) (f ((a).x))
#define reduce_f2(a, f, op) (f ((a).x) op f ((a).x2))
#define reduce_d1(a, f, op) (f ((a).x))
#define reduce_d2(a, f, op) (f ((a).x) op f ((a).x2))

/* Nonzero when NaNs use the IEEE 754-2008 encoding, in which the top
   fraction bit is set for quiet NaNs and clear for signaling NaNs.  Define
   it to 0 for targets that use the opposite convention.  */
#ifndef IEEE_754_2008_SNAN
# define IEEE_754_2008_SNAN 1
#endif

/* Return nonzero if the float X is a signaling NaN.  */
static inline int
issignaling_f (float x)
{
  uint32_t ix = asuint (x);
  /* Opposite convention: exponent all ones and top fraction bit set.  */
  if (!IEEE_754_2008_SNAN)
    return (ix & 0x7fc00000) == 0x7fc00000;
  /* Flipping the top fraction bit moves signaling NaNs above 0x7fc00000
     and moves quiet NaNs and infinity to or below it.  The doubling
     discards the sign bit.  */
  return 2 * (ix ^ 0x00400000) > 2u * 0x7fc00000;
}

/* Return nonzero if the double X is a signaling NaN.  Same tests as
   issignaling_f on the 64-bit layout.  */
static inline int
issignaling_d (double x)
{
  uint64_t ix = asuint64 (x);
  if (!IEEE_754_2008_SNAN)
    return (ix & 0x7ff8000000000000) == 0x7ff8000000000000;
  return 2 * (ix ^ 0x0008000000000000) > 2 * 0x7ff8000000000000ULL;
}

#if USE_MPFR
/* Map the <fenv.h> rounding mode R to the matching mpfr rounding mode.
   Returns -1 if R is none of the four modes handled.  */
static mpfr_rnd_t
rmap (int r)
{
  switch (r)
    {
    case FE_TONEAREST:
      return MPFR_RNDN;
    case FE_TOWARDZERO:
      return MPFR_RNDZ;
    case FE_UPWARD:
      return MPFR_RNDU;
    case FE_DOWNWARD:
      return MPFR_RNDD;
    }
  return -1;
}

/* Precision and exponent parameters for float (_f) and double (_d).
   prec_f and prec_d size the mpfr inputs in the call_mpfr_* helpers below.
   NOTE(review): the other macros are not used in this file; presumably
   ulp.h consumes them - confirm there.  */
#define prec_mpfr_f 50
#define prec_mpfr_d 80
#define prec_f 24
#define prec_d 53
#define emin_f -148
#define emin_d -1073
#define emax_f 128
#define emax_d 1024

/* Evaluate the mpfr reference of F on the arguments in A with rounding
   mode R.  The result is stored in Y and the value returned by the mpfr
   function is passed through.  Inputs are held in mpfr variables of
   prec_f (float) or prec_d (double) bits.  */
static inline int
call_mpfr_f1 (mpfr_t y, const struct fun *f, struct args_f1 a, mpfr_rnd_t r)
{
  MPFR_DECL_INIT (x, prec_f);
  mpfr_set_flt (x, a.x, MPFR_RNDN);
  return f->fun_mpfr.f1 (y, x, r);
}

static inline int
call_mpfr_f2 (mpfr_t y, const struct fun *f, struct args_f2 a, mpfr_rnd_t r)
{
  MPFR_DECL_INIT (x, prec_f);
  MPFR_DECL_INIT (x2, prec_f);
  mpfr_set_flt (x, a.x, MPFR_RNDN);
  mpfr_set_flt (x2, a.x2, MPFR_RNDN);
  return f->fun_mpfr.f2 (y, x, x2, r);
}

static inline int
call_mpfr_d1 (mpfr_t y, const struct fun *f, struct args_d1 a, mpfr_rnd_t r)
{
  MPFR_DECL_INIT (x, prec_d);
  mpfr_set_d (x, a.x, MPFR_RNDN);
  return f->fun_mpfr.d1 (y, x, r);
}

static inline int
call_mpfr_d2 (mpfr_t y, const struct fun *f, struct args_d2 a, mpfr_rnd_t r)
{
  MPFR_DECL_INIT (x, prec_d);
  MPFR_DECL_INIT (x2, prec_d);
  mpfr_set_d (x, a.x, MPFR_RNDN);
  mpfr_set_d (x2, a.x2, MPFR_RNDN);
  return f->fun_mpfr.d2 (y, x, x2, r);
}
#endif

/* Per-precision names for the template in ulp.h.  A name of the form
   name_f or name_d is what RT (name) expands to for float and double
   respectively.  */
#define float_f float
#define double_f double
#define copysign_f copysignf
#define nextafter_f nextafterf
#define fabs_f fabsf
#define asuint_f asuint
#define asfloat_f asfloat
#define scalbn_f scalbnf
#define lscalbn_f scalbn
#define halfinf_f 0x1p127f
#define min_normal_f 0x1p-126f

#define float_d double
#define double_d long double
#define copysign_d copysign
#define nextafter_d nextafter
#define fabs_d fabs
#define asuint_d asuint64
#define asfloat_d asdouble
#define scalbn_d scalbn
#define lscalbn_d scalbnl
#define halfinf_d 0x1p1023
#define min_normal_d 0x1p-1022

/* Instantiate ulp.h four times.  RT (x) appends the precision suffix
   (_f or _d) and T (x) appends precision plus arity (_f1, _f2, _d1, _d2).
   NOTE(review): NEW_RT is defined before each precision group and never
   undefined here; presumably ulp.h tests and undefines it - confirm.  */
#define NEW_RT
#define RT(x) x##_f
#define T(x) x##_f1
#include "ulp.h"
#undef T
#define T(x) x##_f2
#include "ulp.h"
#undef T
#undef RT

#define NEW_RT
#define RT(x) x##_d
#define T(x) x##_d1
#include "ulp.h"
#undef T
#define T(x) x##_d2
#include "ulp.h"
#undef T
#undef RT

static void
|
|
usage (void)
|
|
{
|
|
puts ("./ulp [-q] [-m] [-f] [-r nudz] [-l soft-ulplimit] [-e ulplimit] func "
|
|
"lo [hi [x lo2 hi2] [count]]");
|
|
puts ("Compares func against a higher precision implementation in [lo; hi].");
|
|
puts ("-q: quiet.");
|
|
puts ("-m: use mpfr even if faster method is available.");
|
|
puts ("-f: disable fenv testing (rounding modes and exceptions).");
|
|
puts ("Supported func:");
|
|
for (const struct fun *f = fun; f->name; f++)
|
|
printf ("\t%s\n", f->name);
|
|
exit (1);
|
|
}
|
|
|
|
static int
|
|
cmp (const struct fun *f, struct gen *gen, const struct conf *conf)
|
|
{
|
|
int r = 1;
|
|
if (f->arity == 1 && f->singleprec)
|
|
r = cmp_f1 (f, gen, conf);
|
|
else if (f->arity == 2 && f->singleprec)
|
|
r = cmp_f2 (f, gen, conf);
|
|
else if (f->arity == 1 && !f->singleprec)
|
|
r = cmp_d1 (f, gen, conf);
|
|
else if (f->arity == 2 && !f->singleprec)
|
|
r = cmp_d2 (f, gen, conf);
|
|
else
|
|
usage ();
|
|
return r;
|
|
}
|
|
|
|
/* Convert the command line argument S to the bit pattern of a float
   (SINGLEPREC nonzero) or of a double (SINGLEPREC zero).

   An optional leading '+' or '-' is consumed first; '-' selects the sign
   bit of the chosen format.  The rest of S is read in one of two ways:
   - "0x..." without a binary exponent is taken as the raw bit pattern and
     the sign bit is flipped in it;
   - anything else, including hexadecimal floating-point literals such as
     0x1p-3 or 0x1P-3, is converted with strtof/strtod and the sign bit is
     or-ed in.
   No input validation is done: text that cannot be converted yields the
   pattern of whatever the conversion function returns.  */
static uint64_t
getnum (const char *s, int singleprec)
{
  uint64_t sign = 0;

  if (s[0] == '+')
    s++;
  else if (s[0] == '-')
    {
      sign = singleprec ? 1ULL << 31 : 1ULL << 63;
      s++;
    }
  /* 0xXXXX is treated as bit representation, '-' flips the sign bit.  A
     hexadecimal floating-point literal is told apart by its exponent
     marker, which may be spelled 'p' or 'P'.  The cast keeps the tolower
     argument in the range the <ctype.h> functions require.  */
  if (s[0] == '0' && tolower ((unsigned char) s[1]) == 'x'
      && strchr (s, 'p') == 0 && strchr (s, 'P') == 0)
    return sign ^ strtoull (s, 0, 0);
  /* Otherwise assume it's a floating-point literal.  */
  return sign
         | (singleprec ? asuint (strtof (s, 0)) : asuint64 (strtod (s, 0)));
}

static void
|
|
parsegen (struct gen *g, int argc, char *argv[], const struct fun *f)
|
|
{
|
|
int singleprec = f->singleprec;
|
|
int arity = f->arity;
|
|
uint64_t a, b, a2, b2, n;
|
|
if (argc < 1)
|
|
usage ();
|
|
b = a = getnum (argv[0], singleprec);
|
|
n = 0;
|
|
if (argc > 1 && strcmp (argv[1], "x") == 0)
|
|
{
|
|
argc -= 2;
|
|
argv += 2;
|
|
}
|
|
else if (argc > 1)
|
|
{
|
|
b = getnum (argv[1], singleprec);
|
|
if (argc > 2 && strcmp (argv[2], "x") == 0)
|
|
{
|
|
argc -= 3;
|
|
argv += 3;
|
|
}
|
|
}
|
|
b2 = a2 = getnum (argv[0], singleprec);
|
|
if (argc > 1)
|
|
b2 = getnum (argv[1], singleprec);
|
|
if (argc > 2)
|
|
n = strtoull (argv[2], 0, 0);
|
|
if (argc > 3)
|
|
usage ();
|
|
//printf("ab %lx %lx ab2 %lx %lx n %lu\n", a, b, a2, b2, n);
|
|
if (arity == 1)
|
|
{
|
|
g->start = a;
|
|
g->len = b - a;
|
|
if (n - 1 > b - a)
|
|
n = b - a + 1;
|
|
g->off = 0;
|
|
g->step = n ? (g->len + 1) / n : 1;
|
|
g->start2 = g->len2 = 0;
|
|
g->cnt = n;
|
|
}
|
|
else if (arity == 2)
|
|
{
|
|
g->start = a;
|
|
g->len = b - a;
|
|
g->off = g->step = 0;
|
|
g->start2 = a2;
|
|
g->len2 = b2 - a2;
|
|
g->cnt = n;
|
|
}
|
|
else
|
|
usage ();
|
|
}
|
|
|
|
int
|
|
main (int argc, char *argv[])
|
|
{
|
|
const struct fun *f;
|
|
struct gen gen;
|
|
struct conf conf;
|
|
conf.rc = 'n';
|
|
conf.quiet = 0;
|
|
conf.mpfr = 0;
|
|
conf.fenv = 1;
|
|
conf.softlim = 0;
|
|
conf.errlim = INFINITY;
|
|
for (;;)
|
|
{
|
|
argc--;
|
|
argv++;
|
|
if (argc < 1)
|
|
usage ();
|
|
if (argv[0][0] != '-')
|
|
break;
|
|
switch (argv[0][1])
|
|
{
|
|
case 'e':
|
|
argc--;
|
|
argv++;
|
|
if (argc < 1)
|
|
usage ();
|
|
conf.errlim = strtod (argv[0], 0);
|
|
break;
|
|
case 'f':
|
|
conf.fenv = 0;
|
|
break;
|
|
case 'l':
|
|
argc--;
|
|
argv++;
|
|
if (argc < 1)
|
|
usage ();
|
|
conf.softlim = strtod (argv[0], 0);
|
|
break;
|
|
case 'm':
|
|
conf.mpfr = 1;
|
|
break;
|
|
case 'q':
|
|
conf.quiet = 1;
|
|
break;
|
|
case 'r':
|
|
conf.rc = argv[0][2];
|
|
if (!conf.rc)
|
|
{
|
|
argc--;
|
|
argv++;
|
|
if (argc < 1)
|
|
usage ();
|
|
conf.rc = argv[0][0];
|
|
}
|
|
break;
|
|
default:
|
|
usage ();
|
|
}
|
|
}
|
|
switch (conf.rc)
|
|
{
|
|
case 'n':
|
|
conf.r = FE_TONEAREST;
|
|
break;
|
|
case 'u':
|
|
conf.r = FE_UPWARD;
|
|
break;
|
|
case 'd':
|
|
conf.r = FE_DOWNWARD;
|
|
break;
|
|
case 'z':
|
|
conf.r = FE_TOWARDZERO;
|
|
break;
|
|
default:
|
|
usage ();
|
|
}
|
|
for (f = fun; f->name; f++)
|
|
if (strcmp (argv[0], f->name) == 0)
|
|
break;
|
|
if (!f->name)
|
|
usage ();
|
|
if (!f->singleprec && LDBL_MANT_DIG == DBL_MANT_DIG)
|
|
conf.mpfr = 1; /* Use mpfr if long double has no extra precision. */
|
|
if (!USE_MPFR && conf.mpfr)
|
|
{
|
|
puts ("mpfr is not available.");
|
|
return 0;
|
|
}
|
|
argc--;
|
|
argv++;
|
|
parsegen (&gen, argc, argv, f);
|
|
conf.n = gen.cnt;
|
|
return cmp (f, &gen, &conf);
|
|
}
|