# Source code for gfloat.round

# Copyright (c) 2024 Graphcore Ltd. All rights reserved.

import math

import numpy as np

from .types import FormatInfo, RoundMode


def _isodd(v: int) -> bool:
    return v & 0x1 == 1


[docs]def round_float(
    fi: FormatInfo,
    v: float,
    rnd: RoundMode = RoundMode.TiesToEven,
    sat: bool = False,
    srbits: int = -1,
    srnumbits: int = 0,
) -> float:
    """
    Round input to the given :py:class:`FormatInfo`, given rounding mode and saturation flag

    An input NaN will convert to a NaN in the target.
    An input Infinity will convert to the largest float if :paramref:`sat`,
    otherwise to an Inf, if present, otherwise to a NaN.
    Negative zero will be returned if the format has negative zero, otherwise zero.

    Args:
      fi (FormatInfo): Describes the target format
      v (float): Input value to be rounded
      rnd (RoundMode): Rounding mode to use
      sat (bool): Saturation flag: if True, round overflowed values to `fi.max`
      srbits (int): Bits to use for stochastic rounding if rnd == Stochastic.
      srnumbits (int): How many bits are in srbits.  Implies srbits < 2**srnumbits.

    Returns:
      A float which is one of the values in the format.

    Raises:
       ValueError: The target format cannot represent the input
             (e.g. converting a `NaN`, or an `Inf` when the target has no
             `NaN` or `Inf`, and :paramref:`sat` is false)
       ValueError: Inconsistent arguments, e.g. srnumbits >= 2**srnumbits
    """

    # Constants
    p = fi.precision
    bias = fi.expBias

    if rnd in (RoundMode.Stochastic, RoundMode.StochasticFast):
        if srbits >= 2**srnumbits:
            raise ValueError(f"srnumbits={srnumbits} >= 2**srnumbits={2**srnumbits}")

    if np.isnan(v):
        if fi.num_nans == 0:
            raise ValueError(f"No NaN in format {fi}")

        # Note that this does not preserve the NaN payload
        return np.nan

    # Extract sign
    sign = np.signbit(v) and fi.is_signed
    vpos = -v if sign else v

    if np.isinf(vpos):
        result = np.inf

    elif vpos == 0:
        result = 0

    else:
        # Extract exponent
        expval = int(np.floor(np.log2(vpos)))

        # Effective precision, accounting for right shift for subnormal values
        if fi.has_subnormals:
            expval = max(expval, 1 - bias)

        # Lift to "integer * 2^e"
        expval = expval - p + 1

        # use ldexp instead of vpos*2**-expval to avoid overflow
        fsignificand = math.ldexp(vpos, -expval)

        # Round
        isignificand = math.floor(fsignificand)
        delta = fsignificand - isignificand

        code_is_odd = (
            _isodd(isignificand)
            if fi.precision > 1
            else (isignificand != 0 and _isodd(expval + bias))
        )

        match rnd:
            case RoundMode.TowardZero:
                should_round_away = False
            case RoundMode.TowardPositive:
                should_round_away = not sign and delta > 0
            case RoundMode.TowardNegative:
                should_round_away = sign and delta > 0
            case RoundMode.TiesToAway:
                should_round_away = delta >= 0.5
            case RoundMode.TiesToEven:
                should_round_away = delta > 0.5 or (delta == 0.5 and code_is_odd)
            case RoundMode.Stochastic:
                ## RTNE delta to srbits
                d = delta * 2.0**srnumbits
                floord = np.floor(d).astype(np.int64)
                d = floord + (
                    (d - floord > 0.5) or ((d - floord == 0.5) and _isodd(floord))
                )

                should_round_away = d > srbits
            case RoundMode.StochasticOdd:
                ## RTNE delta to srbits
                d = delta * 2.0**srnumbits
                floord = np.floor(d).astype(np.int64)
                d = floord + (
                    (d - floord > 0.5) or ((d - floord == 0.5) and ~_isodd(floord))
                )

                should_round_away = d > srbits
            case RoundMode.StochasticFast:
                should_round_away = delta > (0.5 + srbits) * 2.0**-srnumbits
            case RoundMode.StochasticFastest:
                should_round_away = delta > srbits * 2.0**-srnumbits

        if should_round_away:
            # This may increase isignificand to 2**p,
            # which would require special casing in encode,
            # but not here, where we reconstruct a rounded value.
            isignificand += 1

        # Reconstruct rounded result to float
        result = isignificand * (2.0**expval)

    if result == 0:
        if sign and fi.has_nz:
            return -0.0
        else:
            return 0.0

    # Overflow
    amax = -fi.min if sign else fi.max
    if result > amax:
        if (
            sat
            or (rnd == RoundMode.TowardNegative and not sign and np.isfinite(v))
            or (rnd == RoundMode.TowardPositive and sign and np.isfinite(v))
            or (rnd == RoundMode.TowardZero and np.isfinite(v))
        ):
            result = amax
        else:
            if fi.has_infs:
                result = np.inf
            elif fi.num_nans > 0:
                result = np.nan
            else:
                raise ValueError(f"No Infs or NaNs in format {fi}, and sat=False")

    # Set sign
    if sign:
        result = -result

    return result