use util::*;
use super::float::ExtendedFloat;
use super::mantissa::Mantissa;
use super::shift::*;
#[inline]
pub(crate) fn round_nearest<M>(fp: &mut ExtendedFloat<M>, shift: i32)
-> (bool, bool)
where M: Mantissa
{
let mask: M = lower_n_mask(as_cast(shift));
let halfway: M = lower_n_halfway(as_cast(shift));
let truncated_bits = fp.mant & mask;
let is_above = truncated_bits > halfway;
let is_halfway = truncated_bits == halfway;
overflowing_shr(fp, shift);
(is_above, is_halfway)
}
#[inline]
pub(crate) fn tie_even<M>(fp: &mut ExtendedFloat<M>, is_above: bool, is_halfway: bool)
where M: Mantissa
{
let is_odd = fp.mant & M::ONE == M::ONE;
if is_above || (is_odd && is_halfway) {
fp.mant += M::ONE;
}
}
#[inline]
pub(crate) fn round_nearest_tie_even<M>(fp: &mut ExtendedFloat<M>, shift: i32)
where M: Mantissa
{
let (is_above, is_halfway) = round_nearest(fp, shift);
tie_even(fp, is_above, is_halfway);
}
#[inline]
pub(crate) fn tie_away_zero<M>(fp: &mut ExtendedFloat<M>, is_above: bool, is_halfway: bool)
where M: Mantissa
{
if is_above || is_halfway {
fp.mant += M::ONE;
}
}
#[inline]
pub(crate) fn round_nearest_tie_away_zero<M>(fp: &mut ExtendedFloat<M>, shift: i32)
where M: Mantissa
{
let (is_above, is_halfway) = round_nearest(fp, shift);
tie_away_zero(fp, is_above, is_halfway);
}
#[inline]
pub(crate) fn round_toward<M>(fp: &mut ExtendedFloat<M>, shift: i32)
-> bool
where M: Mantissa
{
let mask: M = lower_n_mask(as_cast(shift));
let truncated_bits = fp.mant & mask;
overflowing_shr(fp, shift);
truncated_bits != M::ZERO
}
#[inline]
pub(crate) fn upward<M>(fp: &mut ExtendedFloat<M>, is_truncated: bool)
where M: Mantissa
{
if is_truncated {
fp.mant += M::ONE;
}
}
#[inline]
pub(crate) fn round_upward<M>(fp: &mut ExtendedFloat<M>, shift: i32)
where M: Mantissa
{
let is_truncated = round_toward(fp, shift);
upward(fp, is_truncated);
}
#[inline]
pub(crate) fn downard<M>(_: &mut ExtendedFloat<M>, _: bool)
where M: Mantissa
{}
#[inline]
pub(crate) fn round_downward<M>(fp: &mut ExtendedFloat<M>, shift: i32)
where M: Mantissa
{
let is_truncated = round_toward(fp, shift);
downard(fp, is_truncated);
}
pub trait FloatRounding<M: Mantissa>: Float {
const DEFAULT_SHIFT: i32;
const CARRY_MASK: M;
}
macro_rules! float_rounding_f32 {
($($t:tt)*) => ($(
impl FloatRounding<$t> for f32 {
const DEFAULT_SHIFT: i32 = $t::FULL - f32::MANTISSA_SIZE - 1;
const CARRY_MASK: $t = 0x1000000;
}
)*)
}
#[cfg(has_i128)]
float_rounding_f32! { u64 u128 }
#[cfg(not(has_i128))]
float_rounding_f32! { u64 }
macro_rules! float_rounding_f64 {
($($t:tt)*) => ($(
impl FloatRounding<$t> for f64 {
const DEFAULT_SHIFT: i32 = $t::FULL - f64::MANTISSA_SIZE - 1;
const CARRY_MASK: $t = 0x20000000000000;
}
)*)
}
#[cfg(has_i128)]
float_rounding_f64! { u64 u128 }
#[cfg(not(has_i128))]
float_rounding_f64! { u64 }
#[inline]
pub(crate) fn round_to_float<T, M, Cb>(fp: &mut ExtendedFloat<M>, cb: Cb)
where T: FloatRounding<M>,
M: Mantissa,
Cb: FnOnce(&mut ExtendedFloat<M>, i32)
{
let final_exp = fp.exp + T::DEFAULT_SHIFT;
if final_exp < T::DENORMAL_EXPONENT {
let diff = T::DENORMAL_EXPONENT - fp.exp;
if diff <= M::FULL {
cb(fp, diff);
} else {
fp.mant = M::ZERO;
fp.exp = 0;
}
} else {
cb(fp, T::DEFAULT_SHIFT);
}
if fp.mant & T::CARRY_MASK == T::CARRY_MASK {
shr(fp, 1);
}
}
#[inline]
pub(crate) fn avoid_overflow<T, M>(fp: &mut ExtendedFloat<M>)
where T: FloatRounding<M>,
M: Mantissa
{
if fp.exp >= T::MAX_EXPONENT {
let diff = fp.exp - T::MAX_EXPONENT;
if diff <= T::MANTISSA_SIZE {
let bit = as_cast(T::MANTISSA_SIZE+1);
let n = as_cast(diff+1);
let mask: M = internal_n_mask(bit, n);
if (fp.mant & mask).is_zero() {
let shift = diff + 1;
shl(fp, shift);
}
}
}
}
#[inline]
pub(crate) fn round_to_native<T, M, Cb>(fp: &mut ExtendedFloat<M>, cb: Cb)
where T: FloatRounding<M>,
M: Mantissa,
Cb: FnOnce(&mut ExtendedFloat<M>, i32)
{
fp.normalize();
round_to_float::<T, M, _>(fp, cb);
avoid_overflow::<T, M>(fp);
}
#[inline]
#[allow(unused_variables)]
pub(crate) fn internal_rounding(kind: RoundingKind, sign: Sign)
-> RoundingKind
{
#[cfg(not(feature = "rounding"))] {
RoundingKind::NearestTieEven
}
#[cfg(feature = "rounding")] {
match sign {
Sign::Positive => {
match kind {
RoundingKind::TowardPositiveInfinity => RoundingKind::Upward,
RoundingKind::TowardNegativeInfinity => RoundingKind::Downward,
RoundingKind::TowardZero => RoundingKind::Downward,
_ => kind,
}
},
Sign::Negative => {
match kind {
RoundingKind::TowardPositiveInfinity => RoundingKind::Downward,
RoundingKind::TowardNegativeInfinity => RoundingKind::Upward,
RoundingKind::TowardZero => RoundingKind::Downward,
_ => kind,
}
},
}
}
}
#[cfg(feature = "correct")]
#[inline]
#[allow(unused_variables)]
pub(crate) fn global_rounding(sign: Sign) -> RoundingKind {
#[cfg(not(feature = "rounding"))] {
RoundingKind::NearestTieEven
}
#[cfg(feature = "rounding")] {
unsafe {
internal_rounding(FLOAT_ROUNDING, sign)
}
}
}
#[cfg(test)]
mod tests {
use float::ExtendedFloat80;
use super::*;
#[test]
fn round_nearest_test() {
let mut fp = ExtendedFloat80 { mant: 0x60, exp: 0 };
let (above, halfway) = round_nearest(&mut fp, 6);
assert!(!above);
assert!(halfway);
assert_eq!(fp.mant, 1);
let mut fp = ExtendedFloat80 { mant: 0x61, exp: 0 };
let (above, halfway) = round_nearest(&mut fp, 6);
assert!(above);
assert!(!halfway);
assert_eq!(fp.mant, 1);
let mut fp = ExtendedFloat80 { mant: 0x5F, exp: 0 };
let (above, halfway) = round_nearest(&mut fp, 6);
assert!(!above);
assert!(!halfway);
assert_eq!(fp.mant, 1);
}
#[test]
fn round_nearest_tie_even_test() {
let mut fp = ExtendedFloat80 { mant: 0x60, exp: 0 };
round_nearest_tie_even(&mut fp, 6);
assert_eq!(fp.mant, 2);
let mut fp = ExtendedFloat80 { mant: 0x20, exp: 0 };
round_nearest_tie_even(&mut fp, 6);
assert_eq!(fp.mant, 0);
let mut fp = ExtendedFloat80 { mant: 0x61, exp: 0 };
round_nearest_tie_even(&mut fp, 6);
assert_eq!(fp.mant, 2);
let mut fp = ExtendedFloat80 { mant: 0x21, exp: 0 };
round_nearest_tie_even(&mut fp, 6);
assert_eq!(fp.mant, 1);
let mut fp = ExtendedFloat80 { mant: 0x5F, exp: 0 };
round_nearest_tie_even(&mut fp, 6);
assert_eq!(fp.mant, 1);
let mut fp = ExtendedFloat80 { mant: 0x1F, exp: 0 };
round_nearest_tie_even(&mut fp, 6);
assert_eq!(fp.mant, 0);
}
#[test]
fn round_nearest_tie_away_zero_test() {
let mut fp = ExtendedFloat80 { mant: 0x60, exp: 0 };
round_nearest_tie_away_zero(&mut fp, 6);
assert_eq!(fp.mant, 2);
let mut fp = ExtendedFloat80 { mant: 0x20, exp: 0 };
round_nearest_tie_away_zero(&mut fp, 6);
assert_eq!(fp.mant, 1);
let mut fp = ExtendedFloat80 { mant: 0x61, exp: 0 };
round_nearest_tie_away_zero(&mut fp, 6);
assert_eq!(fp.mant, 2);
let mut fp = ExtendedFloat80 { mant: 0x21, exp: 0 };
round_nearest_tie_away_zero(&mut fp, 6);
assert_eq!(fp.mant, 1);
let mut fp = ExtendedFloat80 { mant: 0x5F, exp: 0 };
round_nearest_tie_away_zero(&mut fp, 6);
assert_eq!(fp.mant, 1);
let mut fp = ExtendedFloat80 { mant: 0x1F, exp: 0 };
round_nearest_tie_away_zero(&mut fp, 6);
assert_eq!(fp.mant, 0);
}
#[test]
fn round_upward_test() {
let mut fp = ExtendedFloat80 { mant: 0x00, exp: 0 };
round_upward(&mut fp, 6);
assert_eq!(fp.mant, 0);
let mut fp = ExtendedFloat80 { mant: 0x40, exp: 0 };
round_upward(&mut fp, 6);
assert_eq!(fp.mant, 1);
let mut fp = ExtendedFloat80 { mant: 0x60, exp: 0 };
round_upward(&mut fp, 6);
assert_eq!(fp.mant, 2);
let mut fp = ExtendedFloat80 { mant: 0x70, exp: 0 };
round_upward(&mut fp, 6);
assert_eq!(fp.mant, 2);
}
#[test]
fn round_downward_test() {
let mut fp = ExtendedFloat80 { mant: 0x00, exp: 0 };
round_downward(&mut fp, 6);
assert_eq!(fp.mant, 0);
let mut fp = ExtendedFloat80 { mant: 0x40, exp: 0 };
round_downward(&mut fp, 6);
assert_eq!(fp.mant, 1);
let mut fp = ExtendedFloat80 { mant: 0x60, exp: 0 };
round_downward(&mut fp, 6);
assert_eq!(fp.mant, 1);
let mut fp = ExtendedFloat80 { mant: 0x70, exp: 0 };
round_downward(&mut fp, 6);
assert_eq!(fp.mant, 1);
}
#[test]
fn round_to_float_test() {
let mut fp = ExtendedFloat80 { mant: 1<<63, exp: f64::DENORMAL_EXPONENT - 15 };
round_to_float::<f64, _, _>(&mut fp, round_nearest_tie_even);
assert_eq!(fp.mant, 1<<48);
assert_eq!(fp.exp, f64::DENORMAL_EXPONENT);
let mut fp = ExtendedFloat80 { mant: 0x8000000000000400, exp: -63 };
round_to_float::<f64, _, _>(&mut fp, round_nearest_tie_even);
assert_eq!(fp.mant, 1<<52);
assert_eq!(fp.exp, -52);
let mut fp = ExtendedFloat80 { mant: 0x8000000000000C00, exp: -63 };
round_to_float::<f64, _, _>(&mut fp, round_nearest_tie_even);
assert_eq!(fp.mant, (1<<52) + 2);
assert_eq!(fp.exp, -52);
let mut fp = ExtendedFloat80 { mant: 0x8000000000000401, exp: -63 };
round_to_float::<f64, _, _>(&mut fp, round_nearest_tie_even);
assert_eq!(fp.mant, (1<<52)+1);
assert_eq!(fp.exp, -52);
let mut fp = ExtendedFloat80 { mant: 0x8000000000000C01, exp: -63 };
round_to_float::<f64, _, _>(&mut fp, round_nearest_tie_even);
assert_eq!(fp.mant, (1<<52) + 2);
assert_eq!(fp.exp, -52);
let mut fp = ExtendedFloat80 { mant: 0x80000000000003FF, exp: -63 };
round_to_float::<f64, _, _>(&mut fp, round_nearest_tie_even);
assert_eq!(fp.mant, 1<<52);
assert_eq!(fp.exp, -52);
let mut fp = ExtendedFloat80 { mant: 0x8000000000000BFF, exp: -63 };
round_to_float::<f64, _, _>(&mut fp, round_nearest_tie_even);
assert_eq!(fp.mant, (1<<52) + 1);
assert_eq!(fp.exp, -52);
}
#[test]
fn avoid_overflow_test() {
let mut fp = ExtendedFloat80 { mant: 0xFFFFFFFFFFFF, exp: f64::MAX_EXPONENT + 5 };
avoid_overflow::<f64, _>(&mut fp);
assert_eq!(fp.mant, 0xFFFFFFFFFFFF);
assert_eq!(fp.exp, f64::MAX_EXPONENT+5);
let mut fp = ExtendedFloat80 { mant: 0xFFFFFFFFFFFF, exp: f64::MAX_EXPONENT + 4 };
avoid_overflow::<f64, _>(&mut fp);
assert_eq!(fp.mant, 0x1FFFFFFFFFFFE0);
assert_eq!(fp.exp, f64::MAX_EXPONENT-1);
}
#[test]
fn round_to_native_test() {
let mut fp = ExtendedFloat80 { mant: 0xFFFFFFFFFFFF, exp: f64::MAX_EXPONENT + 4 };
round_to_native::<f64, _, _>(&mut fp, round_nearest_tie_even);
assert_eq!(fp.mant, 0x1FFFFFFFFFFFE0);
assert_eq!(fp.exp, f64::MAX_EXPONENT-1);
let mut fp = ExtendedFloat80 { mant: 1, exp: f64::DENORMAL_EXPONENT +48 };
round_to_native::<f64, _, _>(&mut fp, round_nearest_tie_even);
assert_eq!(fp.mant, 1<<48);
assert_eq!(fp.exp, f64::DENORMAL_EXPONENT);
let mut fp = ExtendedFloat80 { mant: 0x400000000000020, exp: -58 };
round_to_native::<f64, _, _>(&mut fp, round_nearest_tie_even);
assert_eq!(fp.mant, 1<<52);
assert_eq!(fp.exp, -52);
let mut fp = ExtendedFloat80 { mant: 0x400000000000060, exp: -58 };
round_to_native::<f64, _, _>(&mut fp, round_nearest_tie_even);
assert_eq!(fp.mant, (1<<52) + 2);
assert_eq!(fp.exp, -52);
let mut fp = ExtendedFloat80 { mant: 0x400000000000021, exp: -58 };
round_to_native::<f64, _, _>(&mut fp, round_nearest_tie_even);
assert_eq!(fp.mant, (1<<52)+1);
assert_eq!(fp.exp, -52);
let mut fp = ExtendedFloat80 { mant: 0x400000000000061, exp: -58 };
round_to_native::<f64, _, _>(&mut fp, round_nearest_tie_even);
assert_eq!(fp.mant, (1<<52) + 2);
assert_eq!(fp.exp, -52);
let mut fp = ExtendedFloat80 { mant: 0x40000000000001F, exp: -58 };
round_to_native::<f64, _, _>(&mut fp, round_nearest_tie_even);
assert_eq!(fp.mant, 1<<52);
assert_eq!(fp.exp, -52);
let mut fp = ExtendedFloat80 { mant: 0x40000000000005F, exp: -58 };
round_to_native::<f64, _, _>(&mut fp, round_nearest_tie_even);
assert_eq!(fp.mant, (1<<52) + 1);
assert_eq!(fp.exp, -52);
let mut fp = ExtendedFloat80 { exp: -1139, mant: 18446744073709550712 };
round_to_native::<f64, _, _>(&mut fp, round_nearest_tie_even);
assert_eq!(fp.mant, 0);
assert_eq!(fp.exp, 0);
let mut fp = ExtendedFloat80 { exp: -1139, mant: 18446744073709551460 };
round_to_native::<f64, _, _>(&mut fp, round_nearest_tie_even);
assert_eq!(fp.mant, 0);
assert_eq!(fp.exp, 0);
let mut fp = ExtendedFloat80 { exp: -1138, mant: 9223372036854776103 };
round_to_native::<f64, _, _>(&mut fp, round_nearest_tie_even);
assert_eq!(fp.mant, 1);
assert_eq!(fp.exp, -1074);
}
}