diff options
Diffstat (limited to 'pl/math/math_config.h')
-rw-r--r-- | pl/math/math_config.h | 624 |
1 files changed, 0 insertions, 624 deletions
diff --git a/pl/math/math_config.h b/pl/math/math_config.h deleted file mode 100644 index c3dd8f2db8c7..000000000000 --- a/pl/math/math_config.h +++ /dev/null @@ -1,624 +0,0 @@ -/* - * Configuration for math routines. - * - * Copyright (c) 2017-2023, Arm Limited. - * SPDX-License-Identifier: MIT OR Apache-2.0 WITH LLVM-exception - */ - -#ifndef _MATH_CONFIG_H -#define _MATH_CONFIG_H - -#include <math.h> -#include <stdint.h> - -#ifndef WANT_ROUNDING -/* If defined to 1, return correct results for special cases in non-nearest - rounding modes (logf (1.0f) returns 0.0f with FE_DOWNWARD rather than - -0.0f). This may be set to 0 if there is no fenv support or if math - functions only get called in round to nearest mode. */ -# define WANT_ROUNDING 1 -#endif -#ifndef WANT_ERRNO -/* If defined to 1, set errno in math functions according to ISO C. Many math - libraries do not set errno, so this is 0 by default. It may need to be - set to 1 if math.h has (math_errhandling & MATH_ERRNO) != 0. */ -# define WANT_ERRNO 0 -#endif -#ifndef WANT_SIMD_EXCEPT -/* If defined to 1, trigger fp exceptions in vector routines, consistently with - behaviour expected from the corresponding scalar routine. */ -# define WANT_SIMD_EXCEPT 0 -#endif - -/* Compiler can inline round as a single instruction. */ -#ifndef HAVE_FAST_ROUND -# if __aarch64__ -# define HAVE_FAST_ROUND 1 -# else -# define HAVE_FAST_ROUND 0 -# endif -#endif - -/* Compiler can inline lround, but not (long)round(x). */ -#ifndef HAVE_FAST_LROUND -# if __aarch64__ && (100 * __GNUC__ + __GNUC_MINOR__) >= 408 \ - && __NO_MATH_ERRNO__ -# define HAVE_FAST_LROUND 1 -# else -# define HAVE_FAST_LROUND 0 -# endif -#endif - -/* Compiler can inline fma as a single instruction. */ -#ifndef HAVE_FAST_FMA -# if defined FP_FAST_FMA || __aarch64__ -# define HAVE_FAST_FMA 1 -# else -# define HAVE_FAST_FMA 0 -# endif -#endif - -/* Provide *_finite symbols and some of the glibc hidden symbols - so libmathlib can be used with binaries compiled against glibc - to interpose math functions with both static and dynamic linking. */ -#ifndef USE_GLIBC_ABI -# if __GNUC__ -# define USE_GLIBC_ABI 1 -# else -# define USE_GLIBC_ABI 0 -# endif -#endif - -/* Optionally used extensions. */ -#ifdef __GNUC__ -# define HIDDEN __attribute__ ((__visibility__ ("hidden"))) -# define NOINLINE __attribute__ ((noinline)) -# define UNUSED __attribute__ ((unused)) -# define likely(x) __builtin_expect (!!(x), 1) -# define unlikely(x) __builtin_expect (x, 0) -# if __GNUC__ >= 9 -# define attribute_copy(f) __attribute__ ((copy (f))) -# else -# define attribute_copy(f) -# endif -# define strong_alias(f, a) \ - extern __typeof (f) a __attribute__ ((alias (#f))) attribute_copy (f); -# define hidden_alias(f, a) \ - extern __typeof (f) a __attribute__ ((alias (#f), visibility ("hidden"))) \ - attribute_copy (f); -#else -# define HIDDEN -# define NOINLINE -# define UNUSED -# define likely(x) (x) -# define unlikely(x) (x) -#endif - -/* Return ptr but hide its value from the compiler so accesses through it - cannot be optimized based on the contents. */ -#define ptr_barrier(ptr) \ - ({ \ - __typeof (ptr) __ptr = (ptr); \ - __asm("" : "+r"(__ptr)); \ - __ptr; \ - }) - -/* Symbol renames to avoid libc conflicts. */ -#define __math_oflowf arm_math_oflowf -#define __math_uflowf arm_math_uflowf -#define __math_may_uflowf arm_math_may_uflowf -#define __math_divzerof arm_math_divzerof -#define __math_oflow arm_math_oflow -#define __math_uflow arm_math_uflow -#define __math_may_uflow arm_math_may_uflow -#define __math_divzero arm_math_divzero -#define __math_invalidf arm_math_invalidf -#define __math_invalid arm_math_invalid -#define __math_check_oflow arm_math_check_oflow -#define __math_check_uflow arm_math_check_uflow -#define __math_check_oflowf arm_math_check_oflowf -#define __math_check_uflowf arm_math_check_uflowf - -#if HAVE_FAST_ROUND -/* When set, the roundtoint and converttoint functions are provided with - the semantics documented below. */ -# define TOINT_INTRINSICS 1 - -/* Round x to nearest int in all rounding modes, ties have to be rounded - consistently with converttoint so the results match. If the result - would be outside of [-2^31, 2^31-1] then the semantics is unspecified. */ -static inline double_t -roundtoint (double_t x) -{ - return round (x); -} - -/* Convert x to nearest int in all rounding modes, ties have to be rounded - consistently with roundtoint. If the result is not representible in an - int32_t then the semantics is unspecified. */ -static inline int32_t -converttoint (double_t x) -{ -# if HAVE_FAST_LROUND - return lround (x); -# else - return (long) round (x); -# endif -} -#endif - -static inline uint32_t -asuint (float f) -{ - union - { - float f; - uint32_t i; - } u = { f }; - return u.i; -} - -static inline float -asfloat (uint32_t i) -{ - union - { - uint32_t i; - float f; - } u = { i }; - return u.f; -} - -static inline uint64_t -asuint64 (double f) -{ - union - { - double f; - uint64_t i; - } u = { f }; - return u.i; -} - -static inline double -asdouble (uint64_t i) -{ - union - { - uint64_t i; - double f; - } u = { i }; - return u.f; -} - -#ifndef IEEE_754_2008_SNAN -# define IEEE_754_2008_SNAN 1 -#endif -static inline int -issignalingf_inline (float x) -{ - uint32_t ix = asuint (x); - if (!IEEE_754_2008_SNAN) - return (ix & 0x7fc00000) == 0x7fc00000; - return 2 * (ix ^ 0x00400000) > 2u * 0x7fc00000; -} - -static inline int -issignaling_inline (double x) -{ - uint64_t ix = asuint64 (x); - if (!IEEE_754_2008_SNAN) - return (ix & 0x7ff8000000000000) == 0x7ff8000000000000; - return 2 * (ix ^ 0x0008000000000000) > 2 * 0x7ff8000000000000ULL; -} - -#if __aarch64__ && __GNUC__ -/* Prevent the optimization of a floating-point expression. */ -static inline float -opt_barrier_float (float x) -{ - __asm__ __volatile__ ("" : "+w" (x)); - return x; -} -static inline double -opt_barrier_double (double x) -{ - __asm__ __volatile__ ("" : "+w" (x)); - return x; -} -/* Force the evaluation of a floating-point expression for its side-effect. */ -static inline void -force_eval_float (float x) -{ - __asm__ __volatile__ ("" : "+w" (x)); -} -static inline void -force_eval_double (double x) -{ - __asm__ __volatile__ ("" : "+w" (x)); -} -#else -static inline float -opt_barrier_float (float x) -{ - volatile float y = x; - return y; -} -static inline double -opt_barrier_double (double x) -{ - volatile double y = x; - return y; -} -static inline void -force_eval_float (float x) -{ - volatile float y UNUSED = x; -} -static inline void -force_eval_double (double x) -{ - volatile double y UNUSED = x; -} -#endif - -/* Evaluate an expression as the specified type, normally a type - cast should be enough, but compilers implement non-standard - excess-precision handling, so when FLT_EVAL_METHOD != 0 then - these functions may need to be customized. */ -static inline float -eval_as_float (float x) -{ - return x; -} -static inline double -eval_as_double (double x) -{ - return x; -} - -/* Error handling tail calls for special cases, with a sign argument. - The sign of the return value is set if the argument is non-zero. */ - -/* The result overflows. */ -HIDDEN float __math_oflowf (uint32_t); -/* The result underflows to 0 in nearest rounding mode. */ -HIDDEN float __math_uflowf (uint32_t); -/* The result underflows to 0 in some directed rounding mode only. */ -HIDDEN float __math_may_uflowf (uint32_t); -/* Division by zero. */ -HIDDEN float __math_divzerof (uint32_t); -/* The result overflows. */ -HIDDEN double __math_oflow (uint32_t); -/* The result underflows to 0 in nearest rounding mode. */ -HIDDEN double __math_uflow (uint32_t); -/* The result underflows to 0 in some directed rounding mode only. */ -HIDDEN double __math_may_uflow (uint32_t); -/* Division by zero. */ -HIDDEN double __math_divzero (uint32_t); - -/* Error handling using input checking. */ - -/* Invalid input unless it is a quiet NaN. */ -HIDDEN float __math_invalidf (float); -/* Invalid input unless it is a quiet NaN. */ -HIDDEN double __math_invalid (double); - -/* Error handling using output checking, only for errno setting. */ - -/* Check if the result overflowed to infinity. */ -HIDDEN double __math_check_oflow (double); -/* Check if the result underflowed to 0. */ -HIDDEN double __math_check_uflow (double); - -/* Check if the result overflowed to infinity. */ -static inline double -check_oflow (double x) -{ - return WANT_ERRNO ? __math_check_oflow (x) : x; -} - -/* Check if the result underflowed to 0. */ -static inline double -check_uflow (double x) -{ - return WANT_ERRNO ? __math_check_uflow (x) : x; -} - -/* Check if the result overflowed to infinity. */ -HIDDEN float __math_check_oflowf (float); -/* Check if the result underflowed to 0. */ -HIDDEN float __math_check_uflowf (float); - -/* Check if the result overflowed to infinity. */ -static inline float -check_oflowf (float x) -{ - return WANT_ERRNO ? __math_check_oflowf (x) : x; -} - -/* Check if the result underflowed to 0. */ -static inline float -check_uflowf (float x) -{ - return WANT_ERRNO ? __math_check_uflowf (x) : x; -} - -extern const struct erff_data -{ - struct - { - float erf, scale; - } tab[513]; -} __erff_data HIDDEN; - -extern const struct sv_erff_data -{ - float erf[513]; - float scale[513]; -} __sv_erff_data HIDDEN; - -extern const struct erfcf_data -{ - struct - { - float erfc, scale; - } tab[645]; -} __erfcf_data HIDDEN; - -/* Data for logf and log10f. */ -#define LOGF_TABLE_BITS 4 -#define LOGF_POLY_ORDER 4 -extern const struct logf_data -{ - struct - { - double invc, logc; - } tab[1 << LOGF_TABLE_BITS]; - double ln2; - double invln10; - double poly[LOGF_POLY_ORDER - 1]; /* First order coefficient is 1. */ -} __logf_data HIDDEN; - -/* Data for low accuracy log10 (with 1/ln(10) included in coefficients). */ -#define LOG10_TABLE_BITS 7 -#define LOG10_POLY_ORDER 6 -#define LOG10_POLY1_ORDER 12 -extern const struct log10_data -{ - double ln2hi; - double ln2lo; - double invln10; - double poly[LOG10_POLY_ORDER - 1]; /* First coefficient is 1/log(10). */ - double poly1[LOG10_POLY1_ORDER - 1]; - struct - { - double invc, logc; - } tab[1 << LOG10_TABLE_BITS]; -#if !HAVE_FAST_FMA - struct - { - double chi, clo; - } tab2[1 << LOG10_TABLE_BITS]; -#endif -} __log10_data HIDDEN; - -#define EXP_TABLE_BITS 7 -#define EXP_POLY_ORDER 5 -/* Use polynomial that is optimized for a wider input range. This may be - needed for good precision in non-nearest rounding and !TOINT_INTRINSICS. */ -#define EXP_POLY_WIDE 0 -/* Use close to nearest rounding toint when !TOINT_INTRINSICS. This may be - needed for good precision in non-nearest rouning and !EXP_POLY_WIDE. */ -#define EXP_USE_TOINT_NARROW 0 -#define EXP2_POLY_ORDER 5 -#define EXP2_POLY_WIDE 0 -extern const struct exp_data -{ - double invln2N; - double shift; - double negln2hiN; - double negln2loN; - double poly[4]; /* Last four coefficients. */ - double exp2_shift; - double exp2_poly[EXP2_POLY_ORDER]; - uint64_t tab[2 * (1 << EXP_TABLE_BITS)]; -} __exp_data HIDDEN; - -/* Copied from math/v_exp.h for use in vector exp_tail. */ -#define V_EXP_TAIL_TABLE_BITS 8 -extern const uint64_t __v_exp_tail_data[1 << V_EXP_TAIL_TABLE_BITS] HIDDEN; - -/* Copied from math/v_exp.h for use in vector exp2. */ -#define V_EXP_TABLE_BITS 7 -extern const uint64_t __v_exp_data[1 << V_EXP_TABLE_BITS] HIDDEN; - -extern const struct erf_data -{ - struct - { - double erf, scale; - } tab[769]; -} __erf_data HIDDEN; - -extern const struct sv_erf_data -{ - double erf[769]; - double scale[769]; -} __sv_erf_data HIDDEN; - -extern const struct erfc_data -{ - struct - { - double erfc, scale; - } tab[3488]; -} __erfc_data HIDDEN; - -#define ATAN_POLY_NCOEFFS 20 -extern const struct atan_poly_data -{ - double poly[ATAN_POLY_NCOEFFS]; -} __atan_poly_data HIDDEN; - -#define ATANF_POLY_NCOEFFS 8 -extern const struct atanf_poly_data -{ - float poly[ATANF_POLY_NCOEFFS]; -} __atanf_poly_data HIDDEN; - -#define ASINHF_NCOEFFS 8 -extern const struct asinhf_data -{ - float coeffs[ASINHF_NCOEFFS]; -} __asinhf_data HIDDEN; - -#define LOG_TABLE_BITS 7 -#define LOG_POLY_ORDER 6 -#define LOG_POLY1_ORDER 12 -extern const struct log_data -{ - double ln2hi; - double ln2lo; - double poly[LOG_POLY_ORDER - 1]; /* First coefficient is 1. */ - double poly1[LOG_POLY1_ORDER - 1]; - struct - { - double invc, logc; - } tab[1 << LOG_TABLE_BITS]; -#if !HAVE_FAST_FMA - struct - { - double chi, clo; - } tab2[1 << LOG_TABLE_BITS]; -#endif -} __log_data HIDDEN; - -#define ASINH_NCOEFFS 18 -extern const struct asinh_data -{ - double poly[ASINH_NCOEFFS]; -} __asinh_data HIDDEN; - -#define LOG1P_NCOEFFS 19 -extern const struct log1p_data -{ - double coeffs[LOG1P_NCOEFFS]; -} __log1p_data HIDDEN; - -#define LOG1PF_2U5 -#define LOG1PF_NCOEFFS 9 -extern const struct log1pf_data -{ - float coeffs[LOG1PF_NCOEFFS]; -} __log1pf_data HIDDEN; - -#define TANF_P_POLY_NCOEFFS 6 -/* cotan approach needs order 3 on [0, pi/4] to reach <3.5ulps. */ -#define TANF_Q_POLY_NCOEFFS 4 -extern const struct tanf_poly_data -{ - float poly_tan[TANF_P_POLY_NCOEFFS]; - float poly_cotan[TANF_Q_POLY_NCOEFFS]; -} __tanf_poly_data HIDDEN; - -#define V_LOG2_TABLE_BITS 7 -extern const struct v_log2_data -{ - double poly[5]; - double invln2; - struct - { - double invc, log2c; - } table[1 << V_LOG2_TABLE_BITS]; -} __v_log2_data HIDDEN; - -#define V_LOG10_TABLE_BITS 7 -extern const struct v_log10_data -{ - double poly[5]; - double invln10, log10_2; - struct - { - double invc, log10c; - } table[1 << V_LOG10_TABLE_BITS]; -} __v_log10_data HIDDEN; - -/* Some data for SVE powf's internal exp and log. */ -#define V_POWF_EXP2_TABLE_BITS 5 -#define V_POWF_EXP2_N (1 << V_POWF_EXP2_TABLE_BITS) -#define V_POWF_LOG2_TABLE_BITS 5 -#define V_POWF_LOG2_N (1 << V_POWF_LOG2_TABLE_BITS) -extern const struct v_powf_data -{ - double invc[V_POWF_LOG2_N]; - double logc[V_POWF_LOG2_N]; - uint64_t scale[V_POWF_EXP2_N]; -} __v_powf_data HIDDEN; - -#define V_LOG_POLY_ORDER 6 -#define V_LOG_TABLE_BITS 7 -extern const struct v_log_data -{ - /* Shared data for vector log and log-derived routines (e.g. asinh). */ - double poly[V_LOG_POLY_ORDER - 1]; - double ln2; - struct - { - double invc, logc; - } table[1 << V_LOG_TABLE_BITS]; -} __v_log_data HIDDEN; - -#define EXPM1F_POLY_ORDER 5 -extern const float __expm1f_poly[EXPM1F_POLY_ORDER] HIDDEN; - -#define EXPF_TABLE_BITS 5 -#define EXPF_POLY_ORDER 3 -extern const struct expf_data -{ - uint64_t tab[1 << EXPF_TABLE_BITS]; - double invln2_scaled; - double poly_scaled[EXPF_POLY_ORDER]; -} __expf_data HIDDEN; - -#define EXPM1_POLY_ORDER 11 -extern const double __expm1_poly[EXPM1_POLY_ORDER] HIDDEN; - -extern const struct cbrtf_data -{ - float poly[4]; - float table[5]; -} __cbrtf_data HIDDEN; - -extern const struct cbrt_data -{ - double poly[4]; - double table[5]; -} __cbrt_data HIDDEN; - -#define ASINF_POLY_ORDER 4 -extern const float __asinf_poly[ASINF_POLY_ORDER + 1] HIDDEN; - -#define ASIN_POLY_ORDER 11 -extern const double __asin_poly[ASIN_POLY_ORDER + 1] HIDDEN; - -/* Some data for AdvSIMD and SVE pow's internal exp and log. */ -#define V_POW_EXP_TABLE_BITS 8 -extern const struct v_pow_exp_data -{ - double poly[3]; - double n_over_ln2, ln2_over_n_hi, ln2_over_n_lo, shift; - uint64_t sbits[1 << V_POW_EXP_TABLE_BITS]; -} __v_pow_exp_data HIDDEN; - -#define V_POW_LOG_TABLE_BITS 7 -extern const struct v_pow_log_data -{ - double poly[7]; /* First coefficient is 1. */ - double ln2_hi, ln2_lo; - double invc[1 << V_POW_LOG_TABLE_BITS]; - double logc[1 << V_POW_LOG_TABLE_BITS]; - double logctail[1 << V_POW_LOG_TABLE_BITS]; -} __v_pow_log_data HIDDEN; - -#endif |