Userland/Libraries/LibC/math.cpp

/*
 * Copyright (c) 2018-2020, Andreas Kling <kling@serenityos.org>
 * Copyright (c) 2021, Mițca Dumitru <dumitru0mitca@gmail.com>
 * Copyright (c) 2022, the SerenityOS developers.
 * Copyright (c) 2022, Leon Albrecht <leon.a@serenityos.org>
 *
 * SPDX-License-Identifier: BSD-2-Clause
 */

#include <AK/BuiltinWrappers.h>
#include <AK/FloatingPoint.h>
#if ARCH(X86_64)
#    include <AK/FPControl.h>
#endif
#include <AK/Math.h>
#include <AK/Platform.h>
#include <AK/StdLibExtras.h>
#include <assert.h>
#include <fenv.h>
#include <math.h>
#include <stdint.h>

#if defined(AK_COMPILER_CLANG)
#    pragma clang diagnostic push
#    pragma clang diagnostic ignored "-Wdouble-promotion"
#endif

template<size_t>
constexpr double e_to_power();
template<>
constexpr double e_to_power<0>() { return 1; }
template<size_t exponent>
constexpr double e_to_power() { return M_E * e_to_power<exponent - 1>(); }

template<size_t>
constexpr size_t factorial();
template<>
constexpr size_t factorial<0>() { return 1; }
template<size_t value>
constexpr size_t factorial() { return value * factorial<value - 1>(); }

template<size_t>
constexpr size_t product_even();
template<>
constexpr size_t product_even<2>() { return 2; }
template<size_t value>
constexpr size_t product_even() { return value * product_even<value - 2>(); }

template<size_t>
constexpr size_t product_odd();
template<>
constexpr size_t product_odd<1>() { return 1; }
template<size_t value>
constexpr size_t product_odd() { return value * product_odd<value - 2>(); }

enum class RoundingMode {
    ToZero = FE_TOWARDZERO,
    Up = FE_UPWARD,
    Down = FE_DOWNWARD,
    ToEven = FE_TONEAREST,
    // Round to nearest, ties away from zero.
    ToMaxMagnitude = FE_TOMAXMAGNITUDE,
};

// This is much branchier than it really needs to be
template<typename FloatType>
static FloatType internal_to_integer(FloatType x, RoundingMode rounding_mode)
{
    if (!isfinite(x))
        return x;

    using Extractor = FloatExtractor<decltype(x)>;
    // Most component types are larger than int.
    constexpr auto zero = static_cast<Extractor::ComponentType>(0);
    constexpr auto one = static_cast<Extractor::ComponentType>(1);
    Extractor extractor;
    extractor.d = x;

    auto unbiased_exponent = extractor.exponent - Extractor::exponent_bias;

    bool has_half_fraction = false;
    bool has_nonhalf_fraction = false;
    if (unbiased_exponent < 0) {
        // it was easier to special case [0..1) as it saves us from
        // handling subnormals, underflows, etc
        if (unbiased_exponent == -1) {
            has_half_fraction = true;
        }

        has_nonhalf_fraction = unbiased_exponent < -1 || extractor.mantissa != 0;
        extractor.mantissa = 0;
        extractor.exponent = 0;
    } else {
        if (unbiased_exponent >= Extractor::mantissa_bits)
            return x;

        auto dead_bitcount = Extractor::mantissa_bits - unbiased_exponent;
        // Avoid shifting by the integer type's size since that's UB.
        auto dead_mask = dead_bitcount == sizeof(typename Extractor::ComponentType) * 8 ? ~zero : (one << dead_bitcount) - 1;
        auto dead_bits = extractor.mantissa & dead_mask;
        extractor.mantissa &= ~dead_mask;
#ifdef AK_HAS_FLOAT_80
        if constexpr (IsSame<f80, FloatType>) {
            // x86 80-bit extended floating point requires the top mantissa bit to always be 1, or we get a special Intel NaN.
            if (extractor.mantissa == 0)
                extractor.mantissa = one << (Extractor::mantissa_bits - 1);
        }
#endif

        auto nonhalf_fraction_mask = dead_mask >> 1;
        has_nonhalf_fraction = (dead_bits & nonhalf_fraction_mask) != 0;
        has_half_fraction = (dead_bits & ~nonhalf_fraction_mask) != 0;
    }

    bool should_round = false;
    switch (rounding_mode) {
    case RoundingMode::ToEven:
        should_round = has_half_fraction;
        break;
    case RoundingMode::Up:
        if (!extractor.sign)
            should_round = has_nonhalf_fraction || has_half_fraction;
        break;
    case RoundingMode::Down:
        if (extractor.sign)
            should_round = has_nonhalf_fraction || has_half_fraction;
        break;
    case RoundingMode::ToZero:
        break;
    case RoundingMode::ToMaxMagnitude:
        should_round = true;
        break;
    }

    if (should_round) {
        // We could do this ourselves, but this saves us from manually
        // handling overflow.
        if (extractor.sign)
            extractor.d -= static_cast<FloatType>(1.0);
        else
            extractor.d += static_cast<FloatType>(1.0);
    }

    return extractor.d;
}

// This is much branchier than it really needs to be
template<typename FloatType>
static FloatType internal_nextafter(FloatType x, bool up)
{
    if (!isfinite(x))
        return x;
    using Extractor = FloatExtractor<decltype(x)>;
    Extractor extractor;
    extractor.d = x;
    if (x == 0) {
        if (!extractor.sign) {
            extractor.mantissa = 1;
            extractor.sign = !up;
            return extractor.d;
        }
        if (up) {
            extractor.sign = false;
            extractor.mantissa = 1;
            return extractor.d;
        }
        extractor.mantissa = 1;
        extractor.sign = up != extractor.sign;
        return extractor.d;
    }
    if (up != extractor.sign) {
        extractor.mantissa++;
        if (!extractor.mantissa) {
            // no need to normalize the mantissa as we just hit a power
            // of two.
            extractor.exponent++;
            if (extractor.exponent == Extractor::exponent_max) {
                extractor.exponent = Extractor::exponent_max - 1;
                extractor.mantissa = Extractor::mantissa_max;
            }
        }
        return extractor.d;
    }

    if (!extractor.mantissa) {
        if (extractor.exponent) {
            extractor.exponent--;
            extractor.mantissa = Extractor::mantissa_max;
        } else {
            extractor.d = 0;
        }
        return extractor.d;
    }

    extractor.mantissa--;
    if (extractor.mantissa != Extractor::mantissa_max)
        return extractor.d;
    if (extractor.exponent) {
        extractor.exponent--;
        // normalize
        extractor.mantissa <<= 1;
    } else {
        if (extractor.sign) {
            // Negative infinity
            extractor.mantissa = 0;
            extractor.exponent = Extractor::exponent_max;
        }
    }
    return extractor.d;
}

template<typename FloatT>
static int internal_ilogb(FloatT x) NOEXCEPT
{
    if (x == 0)
        return FP_ILOGB0;

    if (isnan(x))
        return FP_ILOGNAN;

    if (!isfinite(x))
        return INT_MAX;

    using Extractor = FloatExtractor<FloatT>;

    Extractor extractor;
    extractor.d = x;

    return (int)extractor.exponent - Extractor::exponent_bias;
}

template<typename FloatT>
static FloatT internal_modf(FloatT x, FloatT* intpart) NOEXCEPT
{
    FloatT integer_part = internal_to_integer(x, RoundingMode::ToZero);
    *intpart = integer_part;
    auto fraction = x - integer_part;
    if (signbit(fraction) != signbit(x))
        fraction = -fraction;
    return fraction;
}

template<typename FloatT>
static FloatT internal_scalbn(FloatT x, int exponent) NOEXCEPT
{
    if (x == 0 || !isfinite(x) || isnan(x) || exponent == 0)
        return x;

    using Extractor = FloatExtractor<FloatT>;
    Extractor extractor;
    extractor.d = x;

    if (extractor.exponent != 0) {
        extractor.exponent = clamp((int)extractor.exponent + exponent, 0, (int)Extractor::exponent_max);
        return extractor.d;
    }

    unsigned leading_mantissa_zeroes = extractor.mantissa == 0 ? 32 : count_leading_zeroes(extractor.mantissa);
    int shift = min((int)leading_mantissa_zeroes, exponent);
    exponent = max(exponent - shift, 0);

    extractor.exponent <<= shift;
    extractor.exponent = exponent + 1;

    return extractor.d;
}

template<typename FloatT>
static FloatT internal_copysign(FloatT x, FloatT y) NOEXCEPT
{
    using Extractor = FloatExtractor<FloatT>;
    Extractor ex, ey;
    ex.d = x;
    ey.d = y;
    ex.sign = ey.sign;
    return ex.d;
}

template<typename FloatT>
static FloatT internal_gamma(FloatT x) NOEXCEPT
{
    if (isnan(x))
        return (FloatT)NAN;

    if (x == (FloatT)0.0)
        return signbit(x) ? (FloatT)-INFINITY : (FloatT)INFINITY;

    if (x < (FloatT)0 && (rintl(x) == x || isinf(x)))
        return (FloatT)NAN;

    if (isinf(x))
        return (FloatT)INFINITY;

    using Extractor = FloatExtractor<FloatT>;
    // These constants were obtained through use of WolframAlpha
    constexpr long long max_integer_whose_factorial_fits = (Extractor::mantissa_bits == FloatExtractor<long double>::mantissa_bits ? 20 : (Extractor::mantissa_bits == FloatExtractor<double>::mantissa_bits ? 18 : (Extractor::mantissa_bits == FloatExtractor<float>::mantissa_bits ? 10 : 0)));
    static_assert(max_integer_whose_factorial_fits != 0, "internal_gamma needs to be aware of the integer factorial that fits in this floating point type.");
    if ((int)x == x && x <= max_integer_whose_factorial_fits + 1) {
        long long result = 1;
        for (long long cursor = 2; cursor < (long long)x; cursor++)
            result *= cursor;
        return (FloatT)result;
    }

    // Stirling approximation
    return sqrtl(2.0 * M_PIl / static_cast<long double>(x)) * powl(static_cast<long double>(x) / M_El, static_cast<long double>(x));
}

extern "C" {

float nanf(char const* s) NOEXCEPT
{
    return __builtin_nanf(s);
}

double nan(char const* s) NOEXCEPT
{
    return __builtin_nan(s);
}

long double nanl(char const* s) NOEXCEPT
{
    return __builtin_nanl(s);
}

#define MAKE_AK_BACKED1(name)                     \
    long double name##l(long double arg) NOEXCEPT \
    {                                             \
        return AK::name<long double>(arg);        \
    }                                             \
    double name(double arg) NOEXCEPT              \
    {                                             \
        return AK::name<double>(arg);             \
    }                                             \
    float name##f(float arg) NOEXCEPT             \
    {                                             \
        return AK::name<float>(arg);              \
    }
#define MAKE_AK_BACKED2(name)                                        \
    long double name##l(long double arg1, long double arg2) NOEXCEPT \
    {                                                                \
        return AK::name<long double>(arg1, arg2);                    \
    }                                                                \
    double name(double arg1, double arg2) NOEXCEPT                   \
    {                                                                \
        return AK::name<double>(arg1, arg2);                         \
    }                                                                \
    float name##f(float arg1, float arg2) NOEXCEPT                   \
    {                                                                \
        return AK::name<float>(arg1, arg2);                          \
    }

MAKE_AK_BACKED1(sin);
MAKE_AK_BACKED1(cos);
MAKE_AK_BACKED1(tan);
MAKE_AK_BACKED1(asin);
MAKE_AK_BACKED1(acos);
MAKE_AK_BACKED1(atan);
MAKE_AK_BACKED1(sinh);
MAKE_AK_BACKED1(cosh);
MAKE_AK_BACKED1(tanh);
MAKE_AK_BACKED1(asinh);
MAKE_AK_BACKED1(acosh);
MAKE_AK_BACKED1(atanh);
MAKE_AK_BACKED1(sqrt);
MAKE_AK_BACKED1(cbrt);
MAKE_AK_BACKED1(log);
MAKE_AK_BACKED1(log2);
MAKE_AK_BACKED1(log10);
MAKE_AK_BACKED1(exp);
MAKE_AK_BACKED1(exp2);
MAKE_AK_BACKED1(fabs);

MAKE_AK_BACKED2(atan2);
MAKE_AK_BACKED2(hypot);
MAKE_AK_BACKED2(fmod);
MAKE_AK_BACKED2(pow);
MAKE_AK_BACKED2(remainder);

long double truncl(long double x) NOEXCEPT
{
#if ARCH(X86_64)
    if (fabsl(x) < LONG_LONG_MAX) {
        // This is 1.6 times faster than the implementation using the "internal_to_integer"
        // helper (on x86_64)
        // https://quick-bench.com/q/xBmxuY8am9qibSYVna90Y6PIvqA
        u64 temp;
        asm(
            "fisttpq %[temp]\n"
            "fildq %[temp]"
            : "+t"(x)
            : [temp] "m"(temp));
        return x;
    }
#endif

    return internal_to_integer(x, RoundingMode::ToZero);
}

double trunc(double x) NOEXCEPT
{
#if ARCH(X86_64)
    if (fabs(x) < LONG_LONG_MAX) {
        u64 temp;
        asm(
            "fisttpq %[temp]\n"
            "fildq %[temp]"
            : "+t"(x)
            : [temp] "m"(temp));
        return x;
    }
#elif ARCH(RISCV64)
    if (fabs(x) < LONG_LONG_MAX) {
        i64 output;
        asm("fcvt.l.d %0, %1, rtz"
            : "=r"(output)
            : "f"(x));
        return static_cast<double>(output);
    }
#endif

    return internal_to_integer(x, RoundingMode::ToZero);
}

float truncf(float x) NOEXCEPT
{
#if ARCH(X86_64)
    if (fabsf(x) < LONG_LONG_MAX) {
        u64 temp;
        asm(
            "fisttpq %[temp]\n"
            "fildq %[temp]"
            : "+t"(x)
            : [temp] "m"(temp));
        return x;
    }
#elif ARCH(RISCV64)
    if (fabsf(x) < LONG_LONG_MAX) {
        i64 output;
        asm("fcvt.l.s %0, %1, rtz"
            : "=r"(output)
            : "f"(x));
        return static_cast<float>(output);
    }
#endif

    return internal_to_integer(x, RoundingMode::ToZero);
}

long double rintl(long double value)
{
#if ARCH(AARCH64)
    (void)value;
    TODO_AARCH64();
#elif ARCH(RISCV64)
    (void)value;
    TODO_RISCV64();
#elif ARCH(X86_64)
    long double res;
    asm(
        "frndint\n"
        : "=t"(res)
        : "0"(value));
    return res;
#else
#    error "Unknown architecture"
#endif
}
double rint(double value)
{
#if ARCH(AARCH64)
    (void)value;
    TODO_AARCH64();
#elif ARCH(RISCV64)
    i64 output;
    // FIXME: This saturates at 64-bit integer boundaries; see Table 11.4 (RISC-V Unprivileged ISA V20191213)
    asm("fcvt.l.d %0, %1, dyn"
        : "=r"(output)
        : "f"(value));
    return static_cast<double>(output);
#elif ARCH(X86_64)
    double res;
    asm(
        "frndint\n"
        : "=t"(res)
        : "0"(value));
    return res;
#else
#    error "Unknown architecture"
#endif
}
float rintf(float value)
{
#if ARCH(AARCH64)
    (void)value;
    TODO_AARCH64();
#elif ARCH(RISCV64)
    i64 output;
    // FIXME: This saturates at 64-bit integer boundaries; see Table 11.4 (RISC-V Unprivileged ISA V20191213)
    asm("fcvt.l.s %0, %1, dyn"
        : "=r"(output)
        : "f"(value));
    return static_cast<float>(output);
#elif ARCH(X86_64)
    float res;
    asm(
        "frndint\n"
        : "=t"(res)
        : "0"(value));
    return res;
#else
#    error "Unknown architecture"
#endif
}

long lrintl(long double value)
{
#if ARCH(AARCH64)
    (void)value;
    TODO_AARCH64();
#elif ARCH(RISCV64)
    (void)value;
    TODO_RISCV64();
#elif ARCH(X86_64)
    long res;
    asm(
        "fistpl %0\n"
        : "+m"(res)
        : "t"(value)
        : "st");
    return res;
#else
#    error "Unknown architecture"
#endif
}
long lrint(double value)
{
#if ARCH(AARCH64)
    (void)value;
    TODO_AARCH64();
#elif ARCH(RISCV64)
    i64 output;
    // FIXME: This saturates at 64-bit integer boundaries; see Table 11.4 (RISC-V Unprivileged ISA V20191213)
    asm("fcvt.l.d %0, %1, dyn"
        : "=r"(output)
        : "f"(value));
    return output;
#elif ARCH(X86_64)
    long res;
    asm(
        "fistpl %0\n"
        : "+m"(res)
        : "t"(value)
        : "st");
    return res;
#else
#    error "Unknown architecture"
#endif
}
long lrintf(float value)
{
#if ARCH(AARCH64)
    (void)value;
    TODO_AARCH64();
#elif ARCH(RISCV64)
    i64 output;
    // FIXME: This saturates at 64-bit integer boundaries; see Table 11.4 (RISC-V Unprivileged ISA V20191213)
    asm("fcvt.l.s %0, %1, dyn"
        : "=r"(output)
        : "f"(value));
    return output;
#elif ARCH(X86_64)
    long res;
    asm(
        "fistpl %0\n"
        : "+m"(res)
        : "t"(value)
        : "st");
    return res;
#else
#    error "Unknown architecture"
#endif
}

long long llrintl(long double value)
{
#if ARCH(AARCH64)
    (void)value;
    TODO_AARCH64();
#elif ARCH(RISCV64)
    // NOTE: RISC-V LP64 specifies long long == long.
    return static_cast<long long>(lrintl(value));
#elif ARCH(X86_64)
    long long res;
    asm(
        "fistpq %0\n"
        : "+m"(res)
        : "t"(value)
        : "st");
    return res;
#else
#    error "Unknown architecture"
#endif
}
long long llrint(double value)
{
#if ARCH(AARCH64)
    (void)value;
    TODO_AARCH64();
#elif ARCH(RISCV64)
    // NOTE: RISC-V LP64 specifies long long == long.
    return static_cast<long long>(lrint(value));
#elif ARCH(X86_64)
    long long res;
    asm(
        "fistpq %0\n"
        : "+m"(res)
        : "t"(value)
        : "st");
    return res;
#else
#    error "Unknown architecture"
#endif
}
long long llrintf(float value)
{
#if ARCH(AARCH64)
    (void)value;
    TODO_AARCH64();
#elif ARCH(RISCV64)
    // NOTE: RISC-V LP64 specifies long long == long.
    return static_cast<long long>(lrintf(value));
#elif ARCH(X86_64)
    long long res;
    asm(
        "fistpq %0\n"
        : "+m"(res)
        : "t"(value)
        : "st");
    return res;
#else
#    error "Unknown architecture"
#endif
}

// On systems where FLT_RADIX == 2, ldexp is equivalent to scalbn
long double ldexpl(long double x, int exp) NOEXCEPT
{
    return internal_scalbn(x, exp);
}

double ldexp(double x, int exp) NOEXCEPT
{
    return internal_scalbn(x, exp);
}

float ldexpf(float x, int exp) NOEXCEPT
{
    return internal_scalbn(x, exp);
}

[[maybe_unused]] static long double ampsin(long double angle) NOEXCEPT
{
    long double looped_angle = fmodl(M_PI + angle, M_PI * 2) - M_PI;
    long double looped_angle_squared = looped_angle * looped_angle;

    long double quadratic_term;
    if (looped_angle > 0) {
        quadratic_term = -looped_angle_squared;
    } else {
        quadratic_term = looped_angle_squared;
    }

    long double linear_term = M_PI * looped_angle;

    return quadratic_term + linear_term;
}

int ilogbl(long double x) NOEXCEPT
{
    return internal_ilogb(x);
}

int ilogb(double x) NOEXCEPT
{
    return internal_ilogb(x);
}

int ilogbf(float x) NOEXCEPT
{
    return internal_ilogb(x);
}

long double logbl(long double x) NOEXCEPT
{
    return ilogbl(x);
}

double logb(double x) NOEXCEPT
{
    return ilogb(x);
}

float logbf(float x) NOEXCEPT
{
    return ilogbf(x);
}

double frexp(double x, int* exp) NOEXCEPT
{
    *exp = (x == 0) ? 0 : (1 + ilogb(x));
    return scalbn(x, -(*exp));
}

float frexpf(float x, int* exp) NOEXCEPT
{
    *exp = (x == 0) ? 0 : (1 + ilogbf(x));
    return scalbnf(x, -(*exp));
}

long double frexpl(long double x, int* exp) NOEXCEPT
{
    *exp = (x == 0) ? 0 : (1 + ilogbl(x));
    return scalbnl(x, -(*exp));
}

double round(double x) NOEXCEPT
{
#if ARCH(RISCV64)
    if (fabs(x) < LONG_LONG_MAX) {
        i64 output;
        asm("fcvt.l.d %0, %1, rmm"
            : "=r"(output)
            : "f"(x));
        return static_cast<double>(output);
    }
#endif

    return internal_to_integer(x, RoundingMode::ToEven);
}

float roundf(float x) NOEXCEPT
{
#if ARCH(RISCV64)
    if (fabsf(x) < LONG_LONG_MAX) {
        i64 output;
        asm("fcvt.l.s %0, %1, rmm"
            : "=r"(output)
            : "f"(x));
        return static_cast<float>(output);
    }
#endif

    return internal_to_integer(x, RoundingMode::ToEven);
}

long double roundl(long double value) NOEXCEPT
{
    return internal_to_integer(value, RoundingMode::ToEven);
}

long lroundf(float value) NOEXCEPT
{
#if ARCH(RISCV64)
    i64 output;
    asm("fcvt.l.s %0, %1, rmm"
        : "=r"(output)
        : "f"(value));
    return output;
#endif

    return internal_to_integer(value, RoundingMode::ToEven);
}

long lround(double value) NOEXCEPT
{
#if ARCH(RISCV64)
    i64 output;
    asm("fcvt.l.d %0, %1, rmm"
        : "=r"(output)
        : "f"(value));
    return output;
#endif

    return internal_to_integer(value, RoundingMode::ToEven);
}

long lroundl(long double value) NOEXCEPT
{
    return internal_to_integer(value, RoundingMode::ToEven);
}

long long llroundf(float value) NOEXCEPT
{
#if ARCH(RISCV64)
    i64 output;
    asm("fcvt.l.s %0, %1, rmm"
        : "=r"(output)
        : "f"(value));
    return output;
#endif

    return internal_to_integer(value, RoundingMode::ToEven);
}

long long llround(double value) NOEXCEPT
{
#if ARCH(RISCV64)
    i64 output;
    asm("fcvt.l.d %0, %1, rmm"
        : "=r"(output)
        : "f"(value));
    return output;
#endif

    return internal_to_integer(value, RoundingMode::ToEven);
}

long long llroundd(long double value) NOEXCEPT
{
    return internal_to_integer(value, RoundingMode::ToEven);
}

float floorf(float value) NOEXCEPT
{
#if ARCH(RISCV64)
    if (fabsf(value) < LONG_LONG_MAX) {
        i64 output;
        asm("fcvt.l.s %0, %1, rdn"
            : "=r"(output)
            : "f"(value));
        return static_cast<float>(output);
    }
#elif ARCH(X86_64)
    AK::X87RoundingModeScope scope { AK::RoundingMode::DOWN };
    asm("frndint"
        : "+t"(value));
    return value;
#endif
    return internal_to_integer(value, RoundingMode::Down);
}

double floor(double value) NOEXCEPT
{
#if ARCH(RISCV64)
    if (fabs(value) < LONG_LONG_MAX) {
        i64 output;
        asm("fcvt.l.d %0, %1, rdn"
            : "=r"(output)
            : "f"(value));
        return static_cast<double>(output);
    }
#elif ARCH(X86_64)
    AK::X87RoundingModeScope scope { AK::RoundingMode::DOWN };
    asm("frndint"
        : "+t"(value));
    return value;
#endif
    return internal_to_integer(value, RoundingMode::Down);
}

long double floorl(long double value) NOEXCEPT
{
#if ARCH(X86_64)
    AK::X87RoundingModeScope scope { AK::RoundingMode::DOWN };
    asm("frndint"
        : "+t"(value));
    return value;
#endif
    return internal_to_integer(value, RoundingMode::Down);
}

float ceilf(float value) NOEXCEPT
{
#if ARCH(RISCV64)
    if (fabsf(value) < LONG_LONG_MAX) {
        i64 output;
        asm("fcvt.l.s %0, %1, rup"
            : "=r"(output)
            : "f"(value));
        return static_cast<float>(output);
    }
#elif ARCH(X86_64)
    AK::X87RoundingModeScope scope { AK::RoundingMode::UP };
    asm("frndint"
        : "+t"(value));
    return value;
#endif
    return internal_to_integer(value, RoundingMode::Up);
}

double ceil(double value) NOEXCEPT
{
#if ARCH(RISCV64)
    if (fabs(value) < LONG_LONG_MAX) {
        i64 output;
        asm("fcvt.l.d %0, %1, rup"
            : "=r"(output)
            : "f"(value));
        return static_cast<double>(output);
    }
#elif ARCH(X86_64)
    AK::X87RoundingModeScope scope { AK::RoundingMode::UP };
    asm("frndint"
        : "+t"(value));
    return value;
#endif
    return internal_to_integer(value, RoundingMode::Up);
}

long double ceill(long double value) NOEXCEPT
{
#if ARCH(X86_64)
    AK::X87RoundingModeScope scope { AK::RoundingMode::UP };
    asm("frndint"
        : "+t"(value));
    return value;
#endif
    return internal_to_integer(value, RoundingMode::Up);
}

long double modfl(long double x, long double* intpart) NOEXCEPT
{
    return internal_modf(x, intpart);
}

double modf(double x, double* intpart) NOEXCEPT
{
    return internal_modf(x, intpart);
}

float modff(float x, float* intpart) NOEXCEPT
{
    return internal_modf(x, intpart);
}

double gamma(double x) NOEXCEPT
{
    // Stirling approximation
    return sqrt(2.0 * M_PI / x) * pow(x / M_E, x);
}

long double tgammal(long double value) NOEXCEPT
{
    return internal_gamma(value);
}

double tgamma(double value) NOEXCEPT
{
    return internal_gamma(value);
}

float tgammaf(float value) NOEXCEPT
{
    return internal_gamma(value);
}

int signgam = 0;

long double lgammal(long double value) NOEXCEPT
{
    return lgammal_r(value, &signgam);
}

double lgamma(double value) NOEXCEPT
{
    return lgamma_r(value, &signgam);
}

float lgammaf(float value) NOEXCEPT
{
    return lgammaf_r(value, &signgam);
}

long double lgammal_r(long double value, int* sign) NOEXCEPT
{
    if (value == 1.0 || value == 2.0)
        return 0.0;
    if (isinf(value) || value == 0.0)
        return INFINITY;
    long double result = logl(internal_gamma(value));
    *sign = signbit(result) ? -1 : 1;
    return result;
}

double lgamma_r(double value, int* sign) NOEXCEPT
{
    if (value == 1.0 || value == 2.0)
        return 0.0;
    if (isinf(value) || value == 0.0)
        return INFINITY;
    double result = log(internal_gamma(value));
    *sign = signbit(result) ? -1 : 1;
    return result;
}

float lgammaf_r(float value, int* sign) NOEXCEPT
{
    if (value == 1.0f || value == 2.0f)
        return 0.0;
    if (isinf(value) || value == 0.0f)
        return INFINITY;
    float result = logf(internal_gamma(value));
    *sign = signbit(result) ? -1 : 1;
    return result;
}

long double expm1l(long double x) NOEXCEPT
{
    return expl(x) - 1;
}

double expm1(double x) NOEXCEPT
{
    return exp(x) - 1;
}

float expm1f(float x) NOEXCEPT
{
    return expf(x) - 1;
}

long double log1pl(long double x) NOEXCEPT
{
    return logl(1 + x);
}

double log1p(double x) NOEXCEPT
{
    return log(1 + x);
}

float log1pf(float x) NOEXCEPT
{
    return logf(1 + x);
}

long double erfl(long double x) NOEXCEPT
{
    // algorithm taken from Abramowitz and Stegun (no. 26.2.17)
    long double t = 1 / (1 + 0.47047l * fabsl(x));
    long double poly = t * (0.3480242l + t * (-0.958798l + t * 0.7478556l));
    long double answer = 1 - poly * expl(-x * x);
    if (x < 0)
        return -answer;

    return answer;
}

double erf(double x) NOEXCEPT
{
    return (double)erfl(x);
}

float erff(float x) NOEXCEPT
{
    return (float)erf(x);
}

long double erfcl(long double x) NOEXCEPT
{
    return 1 - erfl(x);
}

double erfc(double x) NOEXCEPT
{
    return 1 - erf(x);
}

float erfcf(float x) NOEXCEPT
{
    return 1 - erff(x);
}

double nextafter(double x, double target) NOEXCEPT
{
    if (x == target)
        return target;
    return internal_nextafter(x, target >= x);
}

float nextafterf(float x, float target) NOEXCEPT
{
    if (x == target)
        return target;
    return internal_nextafter(x, target >= x);
}

long double nextafterl(long double x, long double target) NOEXCEPT
{
    return internal_nextafter(x, target >= x);
}

double nexttoward(double x, long double target) NOEXCEPT
{
    if (x == target)
        return target;
    return internal_nextafter(x, target >= x);
}

float nexttowardf(float x, long double target) NOEXCEPT
{
    if (x == target)
        return target;
    return internal_nextafter(x, target >= x);
}

long double nexttowardl(long double x, long double target) NOEXCEPT
{
    if (x == target)
        return target;
    return internal_nextafter(x, target >= x);
}

float copysignf(float x, float y) NOEXCEPT
{
    return internal_copysign(x, y);
}

double copysign(double x, double y) NOEXCEPT
{
    return internal_copysign(x, y);
}

long double copysignl(long double x, long double y) NOEXCEPT
{
    return internal_copysign(x, y);
}

float scalbnf(float x, int exponent) NOEXCEPT
{
    return internal_scalbn(x, exponent);
}

double scalbn(double x, int exponent) NOEXCEPT
{
    return internal_scalbn(x, exponent);
}

long double scalbnl(long double x, int exponent) NOEXCEPT
{
    return internal_scalbn(x, exponent);
}

float scalbnlf(float x, long exponent) NOEXCEPT
{
    return internal_scalbn(x, exponent);
}

double scalbln(double x, long exponent) NOEXCEPT
{
    return internal_scalbn(x, exponent);
}

long double scalblnl(long double x, long exponent) NOEXCEPT
{
    return internal_scalbn(x, exponent);
}

long double fmaxl(long double x, long double y) NOEXCEPT
{
    if (isnan(x))
        return y;
    if (isnan(y))
        return x;

    return x > y ? x : y;
}

double fmax(double x, double y) NOEXCEPT
{
    if (isnan(x))
        return y;
    if (isnan(y))
        return x;

    return x > y ? x : y;
}

float fmaxf(float x, float y) NOEXCEPT
{
    if (isnan(x))
        return y;
    if (isnan(y))
        return x;

    return x > y ? x : y;
}

long double fminl(long double x, long double y) NOEXCEPT
{
    if (isnan(x))
        return y;
    if (isnan(y))
        return x;

    return x < y ? x : y;
}

double fmin(double x, double y) NOEXCEPT
{
    if (isnan(x))
        return y;
    if (isnan(y))
        return x;

    return x < y ? x : y;
}

float fminf(float x, float y) NOEXCEPT
{
    if (isnan(x))
        return y;
    if (isnan(y))
        return x;

    return x < y ? x : y;
}

// https://pubs.opengroup.org/onlinepubs/9699919799/functions/fma.html
long double fmal(long double x, long double y, long double z) NOEXCEPT
{
    return (x * y) + z;
}

double fma(double x, double y, double z) NOEXCEPT
{
    return (x * y) + z;
}

float fmaf(float x, float y, float z) NOEXCEPT
{
    return (x * y) + z;
}

long double nearbyintl(long double value) NOEXCEPT
{
    return internal_to_integer(value, RoundingMode { fegetround() });
}

double nearbyint(double value) NOEXCEPT
{
    return internal_to_integer(value, RoundingMode { fegetround() });
}

float nearbyintf(float value) NOEXCEPT
{
    return internal_to_integer(value, RoundingMode { fegetround() });
}
}

#if defined(AK_COMPILER_CLANG)
#    pragma clang diagnostic pop
#endif