blob: 91814bda7dd7edaa9adce42e8b71e9d2e4c6e1c7 [file] [log] [blame]
//===-- Utility class to manipulate fixed point numbers. --*- C++ -*-=========//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
#ifndef LLVM_LIBC_SRC___SUPPORT_FIXED_POINT_FX_BITS_H
#define LLVM_LIBC_SRC___SUPPORT_FIXED_POINT_FX_BITS_H
#include "include/llvm-libc-macros/stdfix-macros.h"
#include "src/__support/CPP/algorithm.h"
#include "src/__support/CPP/bit.h"
#include "src/__support/CPP/limits.h" // numeric_limits
#include "src/__support/CPP/type_traits.h"
#include "src/__support/libc_assert.h"
#include "src/__support/macros/attributes.h" // LIBC_INLINE
#include "src/__support/macros/config.h" // LIBC_NAMESPACE_DECL
#include "src/__support/macros/null_check.h" // LIBC_CRASH_ON_VALUE
#include "src/__support/macros/optimization.h" // LIBC_UNLIKELY
#include "src/__support/math_extras.h"
#include "fx_rep.h"
#ifdef LIBC_COMPILER_HAS_FIXED_POINT
namespace LIBC_NAMESPACE_DECL {
namespace fixed_point {
template <typename T> struct FXBits {
private:
using fx_rep = FXRep<T>;
using StorageType = typename fx_rep::StorageType;
StorageType value;
static_assert(fx_rep::FRACTION_LEN > 0);
static constexpr size_t FRACTION_OFFSET = 0; // Just for completeness
static constexpr size_t INTEGRAL_OFFSET =
fx_rep::INTEGRAL_LEN == 0 ? 0 : fx_rep::FRACTION_LEN;
static constexpr size_t SIGN_OFFSET =
fx_rep::SIGN_LEN == 0
? 0
: ((sizeof(StorageType) * CHAR_BIT) - fx_rep::SIGN_LEN);
static constexpr StorageType FRACTION_MASK =
mask_trailing_ones<StorageType, fx_rep::FRACTION_LEN>()
<< FRACTION_OFFSET;
static constexpr StorageType INTEGRAL_MASK =
mask_trailing_ones<StorageType, fx_rep::INTEGRAL_LEN>()
<< INTEGRAL_OFFSET;
static constexpr StorageType SIGN_MASK =
(fx_rep::SIGN_LEN == 0 ? 0 : StorageType(1) << SIGN_OFFSET);
// mask for <integral | fraction>
static constexpr StorageType VALUE_MASK = INTEGRAL_MASK | FRACTION_MASK;
// mask for <sign | integral | fraction>
static constexpr StorageType TOTAL_MASK = SIGN_MASK | VALUE_MASK;
public:
LIBC_INLINE constexpr FXBits() = default;
template <typename XType> LIBC_INLINE constexpr explicit FXBits(XType x) {
using Unqual = typename cpp::remove_cv_t<XType>;
if constexpr (cpp::is_same_v<Unqual, T>) {
value = cpp::bit_cast<StorageType>(x);
} else if constexpr (cpp::is_same_v<Unqual, StorageType>) {
value = x;
} else {
// We don't want accidental type promotions/conversions, so we require
// exact type match.
static_assert(cpp::always_false<XType>);
}
}
LIBC_INLINE constexpr StorageType get_fraction() {
return (value & FRACTION_MASK) >> FRACTION_OFFSET;
}
LIBC_INLINE constexpr StorageType get_integral() {
return (value & INTEGRAL_MASK) >> INTEGRAL_OFFSET;
}
// returns complete bitstring representation the fixed point number
// the bitstring is of the form: padding | sign | integral | fraction
LIBC_INLINE constexpr StorageType get_bits() {
return (value & TOTAL_MASK) >> FRACTION_OFFSET;
}
// TODO: replace bool with Sign
LIBC_INLINE constexpr bool get_sign() {
return static_cast<bool>((value & SIGN_MASK) >> SIGN_OFFSET);
}
// This represents the effective negative exponent applied to this number
LIBC_INLINE constexpr int get_exponent() { return fx_rep::FRACTION_LEN; }
LIBC_INLINE constexpr void set_fraction(StorageType fraction) {
value = (value & (~FRACTION_MASK)) |
((fraction << FRACTION_OFFSET) & FRACTION_MASK);
}
LIBC_INLINE constexpr void set_integral(StorageType integral) {
value = (value & (~INTEGRAL_MASK)) |
((integral << INTEGRAL_OFFSET) & INTEGRAL_MASK);
}
// TODO: replace bool with Sign
LIBC_INLINE constexpr void set_sign(bool sign) {
value = (value & (~SIGN_MASK)) |
((static_cast<StorageType>(sign) << SIGN_OFFSET) & SIGN_MASK);
}
LIBC_INLINE constexpr T get_val() const { return cpp::bit_cast<T>(value); }
};
// Bit-wise operations are not available for fixed point types yet.
template <typename T>
LIBC_INLINE constexpr cpp::enable_if_t<cpp::is_fixed_point_v<T>, T>
bit_and(T x, T y) {
using BitType = typename FXRep<T>::StorageType;
BitType x_bit = cpp::bit_cast<BitType>(x);
BitType y_bit = cpp::bit_cast<BitType>(y);
// For some reason, bit_cast cannot deduce BitType from the input.
return cpp::bit_cast<T, BitType>(x_bit & y_bit);
}
template <typename T>
LIBC_INLINE constexpr cpp::enable_if_t<cpp::is_fixed_point_v<T>, T>
bit_or(T x, T y) {
using BitType = typename FXRep<T>::StorageType;
BitType x_bit = cpp::bit_cast<BitType>(x);
BitType y_bit = cpp::bit_cast<BitType>(y);
// For some reason, bit_cast cannot deduce BitType from the input.
return cpp::bit_cast<T, BitType>(x_bit | y_bit);
}
template <typename T>
LIBC_INLINE constexpr cpp::enable_if_t<cpp::is_fixed_point_v<T>, T>
bit_not(T x) {
using BitType = typename FXRep<T>::StorageType;
BitType x_bit = cpp::bit_cast<BitType>(x);
// For some reason, bit_cast cannot deduce BitType from the input.
return cpp::bit_cast<T, BitType>(static_cast<BitType>(~x_bit));
}
template <typename T> LIBC_INLINE constexpr T abs(T x) {
using FXRep = FXRep<T>;
if constexpr (FXRep::SIGN_LEN == 0)
return x;
else {
if (LIBC_UNLIKELY(x == FXRep::MIN()))
return FXRep::MAX();
return (x < FXRep::ZERO() ? -x : x);
}
}
// Round-to-nearest, tie-to-(+Inf)
template <typename T> LIBC_INLINE constexpr T round(T x, int n) {
using FXRep = FXRep<T>;
if (LIBC_UNLIKELY(n < 0))
n = 0;
if (LIBC_UNLIKELY(n >= FXRep::FRACTION_LEN))
return x;
T round_bit = FXRep::EPS() << (FXRep::FRACTION_LEN - n - 1);
// Check for overflow.
if (LIBC_UNLIKELY(FXRep::MAX() - round_bit < x))
return FXRep::MAX();
T all_ones = bit_not(FXRep::ZERO());
int shift = FXRep::FRACTION_LEN - n;
T rounding_mask =
(shift == FXRep::TOTAL_LEN) ? FXRep::ZERO() : (all_ones << shift);
return bit_and((x + round_bit), rounding_mask);
}
// count leading sign bits
// TODO: support fixed_point_padding
template <typename T>
LIBC_INLINE constexpr cpp::enable_if_t<cpp::is_fixed_point_v<T>, int>
countls(T f) {
using FXRep = FXRep<T>;
using BitType = typename FXRep::StorageType;
using FXBits = FXBits<T>;
if constexpr (FXRep::SIGN_LEN > 0) {
if (f < 0)
f = bit_not(f);
}
BitType value_bits = FXBits(f).get_bits();
return cpp::countl_zero(value_bits) - FXRep::SIGN_LEN;
}
// fixed-point to integer conversion
template <typename T, typename XType>
LIBC_INLINE constexpr cpp::enable_if_t<cpp::is_fixed_point_v<T>, XType>
bitsfx(T f) {
return cpp::bit_cast<XType, T>(f);
}
// divide the two fixed-point types and return an integer result
template <typename T, typename XType>
LIBC_INLINE constexpr cpp::enable_if_t<cpp::is_fixed_point_v<T>, XType>
idiv(T x, T y) {
using FXBits = FXBits<T>;
using FXRep = FXRep<T>;
using CompType = typename FXRep::CompType;
// If the value of the second operand of the / operator is zero, the
// behavior is undefined. Ref: ISO/IEC TR 18037:2008(E) p.g. 16
LIBC_CRASH_ON_VALUE(y, FXRep::ZERO());
CompType x_comp = static_cast<CompType>(FXBits(x).get_bits());
CompType y_comp = static_cast<CompType>(FXBits(y).get_bits());
// If an integer result of one of these functions overflows, the behavior is
// undefined. Ref: ISO/IEC TR 18037:2008(E) p.g. 16
CompType result = x_comp / y_comp;
return static_cast<XType>(result);
}
LIBC_INLINE long accum nrstep(long accum d, long accum x0) {
auto v = x0 * (2.lk - (d * x0));
return v;
}
// Divide the two integers and return a fixed_point value
//
// For reference, see:
// https://en.wikipedia.org/wiki/Division_algorithm#Newton%E2%80%93Raphson_division
// https://stackoverflow.com/a/9231996
template <typename XType> LIBC_INLINE constexpr XType divi(int n, int d) {
// If the value of the second operand of the / operator is zero, the
// behavior is undefined. Ref: ISO/IEC TR 18037:2008(E) p.g. 16
LIBC_CRASH_ON_VALUE(d, 0);
if (LIBC_UNLIKELY(n == 0)) {
return FXRep<XType>::ZERO();
}
auto is_power_of_two = [](int n) { return (n > 0) && ((n & (n - 1)) == 0); };
long accum max_val = static_cast<long accum>(FXRep<XType>::MAX());
long accum min_val = static_cast<long accum>(FXRep<XType>::MIN());
if (is_power_of_two(cpp::abs(d))) {
int k = cpp::countr_zero<uint32_t>(static_cast<uint32_t>(cpp::abs(d)));
constexpr int F = FXRep<XType>::FRACTION_LEN;
int64_t scaled_n = static_cast<int64_t>(n) << F;
int64_t res64 = scaled_n >> k;
constexpr int TOTAL_BITS = sizeof(XType) * 8;
const int64_t max_limit = (1LL << (TOTAL_BITS - 1)) - 1;
const int64_t min_limit = -(1LL << (TOTAL_BITS - 1));
if (res64 > max_limit) {
return FXRep<XType>::MAX();
} else if (res64 < min_limit) {
return FXRep<XType>::MIN();
}
long accum res_accum =
static_cast<long accum>(res64) / static_cast<long accum>(1 << F);
res_accum = (d < 0) ? static_cast<long accum>(-1) * res_accum : res_accum;
if (res_accum > max_val) {
return FXRep<XType>::MAX();
} else if (res_accum < min_val) {
return FXRep<XType>::MIN();
}
return static_cast<XType>(res_accum);
}
bool result_is_negative = ((n < 0) != (d < 0));
int64_t n64 = static_cast<int64_t>(n);
int64_t d64 = static_cast<int64_t>(d);
uint64_t nv = static_cast<uint64_t>(n64 < 0 ? -n64 : n64);
uint64_t dv = static_cast<uint64_t>(d64 < 0 ? -d64 : d64);
if (d == INT_MIN) {
nv <<= 1;
dv >>= 1;
}
uint32_t clz = cpp::countl_zero<uint32_t>(static_cast<uint32_t>(dv)) - 1;
uint64_t scaled_val = dv << clz;
// Scale denominator to be in the range of [0.5,1]
FXBits<long accum> d_scaled{scaled_val};
uint64_t scaled_val_n = nv << clz;
// Scale the numerator as much as the denominator to maintain correctness of
// the original equation
FXBits<long accum> n_scaled{scaled_val_n};
long accum n_scaled_val = n_scaled.get_val();
long accum d_scaled_val = d_scaled.get_val();
// x0 = (48/17) - (32/17) * d_n
long accum a = 0x2.d89d89d8p0lk; // 48/17 = 2.8235294...
long accum b = 0x1.e1e1e1e1p0lk; // 32/17 = 1.8823529...
// Error of the initial approximation, as derived
// from the wikipedia article is
// E0 = 1/17 = 0.059 (5.9%)
long accum initial_approx = a - (b * d_scaled_val);
// Since, 0.5 <= d_scaled_val <= 1.0, 0.9412 <= initial_approx <= 1.88235
LIBC_ASSERT((initial_approx >= 0x0.78793dd9p0lk) &&
(initial_approx <= 0x1.f0f0d845p0lk));
// Each newton-raphson iteration will square the error, due
// to quadratic convergence. So,
// E1 = (0.059)^2 = 0.0034
long accum val = nrstep(d_scaled_val, initial_approx);
if constexpr (FXRep<XType>::FRACTION_LEN > 8) {
// E2 = 0.0000121
val = nrstep(d_scaled_val, val);
if constexpr (FXRep<XType>::FRACTION_LEN > 16) {
// E3 = 1.468e−10
val = nrstep(d_scaled_val, val);
}
}
long accum res = n_scaled_val * val;
if (result_is_negative) {
res *= static_cast<long accum>(-1);
}
// Per clause 7.18a.6.1, saturate values on overflow
if (res > max_val) {
return FXRep<XType>::MAX();
} else if (res < min_val) {
return FXRep<XType>::MIN();
} else {
return static_cast<XType>(res);
}
}
} // namespace fixed_point
} // namespace LIBC_NAMESPACE_DECL
#endif // LIBC_COMPILER_HAS_FIXED_POINT
#endif // LLVM_LIBC_SRC___SUPPORT_FIXED_POINT_FX_BITS_H