// Extracted from doxygen/APFloat_8cpp_source.html

//===-- APFloat.cpp - Implement APFloat class -----------------------------===//

//

// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

// See https://llvm.org/LICENSE.txt for license information.

// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

//

//===----------------------------------------------------------------------===//

//

// This file implements a class to represent arbitrary precision floating

// point values and provide a variety of arithmetic operations on them.

//

//===----------------------------------------------------------------------===//


#include "llvm/ADT/APFloat.h"

#include "llvm/ADT/APSInt.h"

#include "llvm/ADT/ArrayRef.h"

#include "llvm/ADT/FloatingPointMode.h"

#include "llvm/ADT/FoldingSet.h"

#include "llvm/ADT/Hashing.h"

#include "llvm/ADT/STLExtras.h"

#include "llvm/ADT/StringExtras.h"

#include "llvm/ADT/StringRef.h"

#include "llvm/Config/llvm-config.h"

#include "llvm/Support/Debug.h"

#include "llvm/Support/Error.h"

#include "llvm/Support/MathExtras.h"

#include "llvm/Support/raw_ostream.h"

#include <cstring>

#include <limits.h>


// Forwards METHOD_CALL to U.IEEE or U.Double, depending on which layout
// getSemantics() selects, and returns the result from the enclosing function.
// Any other semantics reaches llvm_unreachable.
//
// Every line of the definition must end in a continuation backslash that is
// immediately followed by the next line of the body: a blank line after a
// backslash terminates the macro and leaves the rest of the body as stray
// file-scope statements.
#define APFLOAT_DISPATCH_ON_SEMANTICS(METHOD_CALL)                             \
  do {                                                                         \
    if (usesLayout<IEEEFloat>(getSemantics()))                                 \
      return U.IEEE.METHOD_CALL;                                               \
    if (usesLayout<DoubleAPFloat>(getSemantics()))                             \
      return U.Double.METHOD_CALL;                                             \
    llvm_unreachable("Unexpected semantics");                                  \
  } while (false)


using namespace llvm;


/// A macro used to combine two fcCategory enums into one key which can be used

/// in a switch statement to classify how the interaction of two APFloat's

/// categories affects an operation.

///

/// The key is `_lhs * 4 + _rhs`, so distinct pairs only produce distinct keys
/// while both category values lie in the range [0, 4).
/// NOTE(review): the fcCategory enumerator values are declared outside this
/// file -- confirm they stay within that range.
///

/// TODO: If clang source code is ever allowed to use constexpr in its own

/// codebase, change this into a static inline function.

#define PackCategoriesIntoKey(_lhs, _rhs) ((_lhs) * 4 + (_rhs))


/* Assumed in hexadecimal significand parsing, and conversion to

   hexadecimal strings.  One hexadecimal digit covers four bits, so a part
   must hold a whole number of digits.  */

static_assert(APFloatBase::integerPartWidth % 4 == 0, "Part width must be divisible by 4!");


namespace llvm {


// How the nonfinite values Inf and NaN are represented.


enum class fltNonfiniteBehavior {

  // Represents standard IEEE 754 behavior. A value is nonfinite if the

  // exponent field is all 1s. In such cases, a value is Inf if the

  // significand bits are all zero, and NaN otherwise.

  IEEE754,


  // This behavior is present in the Float8ExMyFN* types (Float8E4M3FN,

  // Float8E5M2FNUZ, Float8E4M3FNUZ, and Float8E4M3B11FNUZ) and in
  // Float8E8M0FNU. There is no

  // representation for Inf, and operations that would ordinarily produce Inf

  // produce NaN instead.

  // The details of the NaN representation(s) in this form are determined by the

  // `fltNanEncoding` enum. We treat all NaNs as quiet, as the available

  // encodings do not distinguish between signalling and quiet NaN.

  NanOnly,


  // This behavior is present in Float6E3M2FN, Float6E2M3FN, and

  // Float4E2M1FN types, which do not support Inf or NaN values.

  FiniteOnly,

};


// How NaN values are represented. This is currently only used in combination

// with fltNonfiniteBehavior::NanOnly, and using a variant other than IEEE

// while having IEEE non-finite behavior is liable to lead to unexpected

// results.


enum class fltNanEncoding {

  // Represents the standard IEEE behavior where a value is NaN if its

  // exponent is all 1s and the significand is non-zero.

  IEEE,


  // Represents the behavior in the Float8E4M3FN floating point type where NaN

  // is represented by having the exponent and mantissa set to all 1s.

  // This behavior matches the FP8 E4M3 type described in

  // https://arxiv.org/abs/2209.05433. We treat both signed and unsigned NaNs

  // as non-signalling, although the paper does not state whether the NaN

  // values are signalling or not.

  AllOnes,


  // Represents the behavior in Float8E{5,4}M{2,3}FNUZ floating point types

  // where NaN is represented by a sign bit of 1 and all 0s in the exponent

  // and mantissa (i.e. the negative zero encoding in an IEEE float). Since

  // there is only one NaN value, it is treated as quiet NaN. This matches the

  // behavior described in https://arxiv.org/abs/2206.02915 .

  NegativeZero,

};


/* Represents floating point arithmetic semantics.

   The sem* constants in this file are built with positional aggregate
   initializers, so the member order below is significant; members left out
   of an initializer keep the default values given here.  */


struct fltSemantics {

  /* The largest E such that 2^E is representable; this matches the

     definition of IEEE 754.  */

  APFloatBase::ExponentType maxExponent;


  /* The smallest E such that 2^E is a normalized number; this

     matches the definition of IEEE 754.  */

  APFloatBase::ExponentType minExponent;


  /* Number of bits in the significand.  This includes the integer

     bit.  */

  unsigned int precision;


  /* Number of bits actually used in the semantics. */

  unsigned int sizeInBits;


  /* How Inf and NaN are represented, if at all; defaults to IEEE 754.  */
  fltNonfiniteBehavior nonFiniteBehavior = fltNonfiniteBehavior::IEEE754;


  /* Which bit pattern encodes NaN; defaults to the IEEE encoding.  */
  fltNanEncoding nanEncoding = fltNanEncoding::IEEE;


  /* Whether this semantics has an encoding for Zero */

  bool hasZero = true;


  /* Whether this semantics can represent signed values */

  bool hasSignedRepr = true;


  /* Whether the sign bit of this semantics is the most significant bit */

  bool hasSignBitInMSB = true;

};


// Definitions of the supported semantics.  Each initializer lists, in order:
//   {maxExponent, minExponent, precision, sizeInBits,
//    nonFiniteBehavior, nanEncoding, hasZero, hasSignedRepr, hasSignBitInMSB}
// Trailing members that are not spelled out keep the defaults declared in
// fltSemantics.
constexpr fltSemantics APFloatBase::semIEEEhalf = {15, -14, 11, 16};

constexpr fltSemantics APFloatBase::semBFloat = {127, -126, 8, 16};

constexpr fltSemantics APFloatBase::semIEEEsingle = {127, -126, 24, 32};

constexpr fltSemantics APFloatBase::semIEEEdouble = {1023, -1022, 53, 64};

constexpr fltSemantics APFloatBase::semIEEEquad = {16383, -16382, 113, 128};

constexpr fltSemantics APFloatBase::semFloat8E5M2 = {15, -14, 3, 8};

constexpr fltSemantics APFloatBase::semFloat8E5M2FNUZ = {

    15, -15, 3, 8, fltNonfiniteBehavior::NanOnly, fltNanEncoding::NegativeZero};

constexpr fltSemantics APFloatBase::semFloat8E4M3 = {7, -6, 4, 8};

constexpr fltSemantics APFloatBase::semFloat8E4M3FN = {

    8, -6, 4, 8, fltNonfiniteBehavior::NanOnly, fltNanEncoding::AllOnes};

constexpr fltSemantics APFloatBase::semFloat8E4M3FNUZ = {

    7, -7, 4, 8, fltNonfiniteBehavior::NanOnly, fltNanEncoding::NegativeZero};

constexpr fltSemantics APFloatBase::semFloat8E4M3B11FNUZ = {

    4, -10, 4, 8, fltNonfiniteBehavior::NanOnly, fltNanEncoding::NegativeZero};

constexpr fltSemantics APFloatBase::semFloat8E3M4 = {3, -2, 5, 8};

constexpr fltSemantics APFloatBase::semFloatTF32 = {127, -126, 11, 19};

// The only semantics here that overrides hasZero, hasSignedRepr and
// hasSignBitInMSB.
constexpr fltSemantics APFloatBase::semFloat8E8M0FNU = {

    127,

    -127,

    1,

    8,

    fltNonfiniteBehavior::NanOnly,

    fltNanEncoding::AllOnes,

    false, // hasZero

    false, // hasSignedRepr

    false}; // hasSignBitInMSB


constexpr fltSemantics APFloatBase::semFloat6E3M2FN = {

    4, -2, 3, 6, fltNonfiniteBehavior::FiniteOnly};

constexpr fltSemantics APFloatBase::semFloat6E2M3FN = {

    2, 0, 4, 6, fltNonfiniteBehavior::FiniteOnly};

constexpr fltSemantics APFloatBase::semFloat4E2M1FN = {

    2, 0, 2, 4, fltNonfiniteBehavior::FiniteOnly};

constexpr fltSemantics APFloatBase::semX87DoubleExtended = {16383, -16382, 64,

                                                            80};

// Placeholder semantics with every numeric member zero.
constexpr fltSemantics APFloatBase::semBogus = {0, 0, 0, 0};

constexpr fltSemantics APFloatBase::semPPCDoubleDouble = {-1, 0, 0, 128};

constexpr fltSemantics APFloatBase::semPPCDoubleDoubleLegacy = {

    1023, -1022 + 53, 53 + 53, 128};


/// Returns the semantics object that corresponds to the enumerator \p S.
///
/// Every case returns the result of the accessor with the matching name.  The
/// switch deliberately has no default label; a value that matches none of the
/// cases falls through to llvm_unreachable.
const llvm::fltSemantics &APFloatBase::EnumToSemantics(Semantics S) {

  switch (S) {

  case S_IEEEhalf:

    return IEEEhalf();

  case S_BFloat:

    return BFloat();

  case S_IEEEsingle:

    return IEEEsingle();

  case S_IEEEdouble:

    return IEEEdouble();

  case S_IEEEquad:

    return IEEEquad();

  case S_PPCDoubleDouble:

    return PPCDoubleDouble();

  case S_PPCDoubleDoubleLegacy:

    return PPCDoubleDoubleLegacy();

  case S_Float8E5M2:

    return Float8E5M2();

  case S_Float8E5M2FNUZ:

    return Float8E5M2FNUZ();

  case S_Float8E4M3:

    return Float8E4M3();

  case S_Float8E4M3FN:

    return Float8E4M3FN();

  case S_Float8E4M3FNUZ:

    return Float8E4M3FNUZ();

  case S_Float8E4M3B11FNUZ:

    return Float8E4M3B11FNUZ();

  case S_Float8E3M4:

    return Float8E3M4();

  case S_FloatTF32:

    return FloatTF32();

  case S_Float8E8M0FNU:

    return Float8E8M0FNU();

  case S_Float6E3M2FN:

    return Float6E3M2FN();

  case S_Float6E2M3FN:

    return Float6E2M3FN();

  case S_Float4E2M1FN:

    return Float4E2M1FN();

  case S_x87DoubleExtended:

    return x87DoubleExtended();

  }

  llvm_unreachable("Unrecognised floating semantics");

}


/// Maps a semantics object back to its Semantics enumerator.
///
/// The lookup is by identity: the address of \p Sem is compared against the
/// object returned by each semantics accessor in turn.  A reference that
/// matches none of them reaches llvm_unreachable.
APFloatBase::Semantics
APFloatBase::SemanticsToEnum(const llvm::fltSemantics &Sem) {
  const llvm::fltSemantics *const Candidate = &Sem;

  if (Candidate == &llvm::APFloat::IEEEhalf())
    return S_IEEEhalf;
  if (Candidate == &llvm::APFloat::BFloat())
    return S_BFloat;
  if (Candidate == &llvm::APFloat::IEEEsingle())
    return S_IEEEsingle;
  if (Candidate == &llvm::APFloat::IEEEdouble())
    return S_IEEEdouble;
  if (Candidate == &llvm::APFloat::IEEEquad())
    return S_IEEEquad;
  if (Candidate == &llvm::APFloat::PPCDoubleDouble())
    return S_PPCDoubleDouble;
  if (Candidate == &llvm::APFloat::PPCDoubleDoubleLegacy())
    return S_PPCDoubleDoubleLegacy;
  if (Candidate == &llvm::APFloat::Float8E5M2())
    return S_Float8E5M2;
  if (Candidate == &llvm::APFloat::Float8E5M2FNUZ())
    return S_Float8E5M2FNUZ;
  if (Candidate == &llvm::APFloat::Float8E4M3())
    return S_Float8E4M3;
  if (Candidate == &llvm::APFloat::Float8E4M3FN())
    return S_Float8E4M3FN;
  if (Candidate == &llvm::APFloat::Float8E4M3FNUZ())
    return S_Float8E4M3FNUZ;
  if (Candidate == &llvm::APFloat::Float8E4M3B11FNUZ())
    return S_Float8E4M3B11FNUZ;
  if (Candidate == &llvm::APFloat::Float8E3M4())
    return S_Float8E3M4;
  if (Candidate == &llvm::APFloat::FloatTF32())
    return S_FloatTF32;
  if (Candidate == &llvm::APFloat::Float8E8M0FNU())
    return S_Float8E8M0FNU;
  if (Candidate == &llvm::APFloat::Float6E3M2FN())
    return S_Float6E3M2FN;
  if (Candidate == &llvm::APFloat::Float6E2M3FN())
    return S_Float6E2M3FN;
  if (Candidate == &llvm::APFloat::Float4E2M1FN())
    return S_Float4E2M1FN;
  if (Candidate == &llvm::APFloat::x87DoubleExtended())
    return S_x87DoubleExtended;

  llvm_unreachable("Unknown floating semantics");
}


/// Returns true when the exponent range and the precision of \p A both fit
/// within those of \p B: A's maximum exponent is no larger, its minimum
/// exponent no smaller, and its precision no greater.
bool APFloatBase::isRepresentableBy(const fltSemantics &A,
                                    const fltSemantics &B) {
  if (A.maxExponent > B.maxExponent)
    return false;
  if (A.minExponent < B.minExponent)
    return false;
  return A.precision <= B.precision;
}


/* A tight upper bound on number of parts required to hold the value

   pow(5, power) is


     power * 815 / (351 * integerPartWidth) + 1


   However, whilst the result may require only this many parts,

   because we are multiplying two values to get it, the

   multiplication may require an extra part with the excess part

   being zero (consider the trivial case of 1 * 1, tcFullMultiply

   requires two parts to hold the single-part result).  So we add an

   extra one to guarantee enough space whilst multiplying.  */

// Largest maxExponent among the semantics defined in this file
// (semIEEEquad and semX87DoubleExtended).
const unsigned int maxExponent = 16383;

// Largest precision among the semantics defined in this file (semIEEEquad).
const unsigned int maxPrecision = 113;

// Largest power of five the bound below is sized for.
const unsigned int maxPowerOfFiveExponent = maxExponent + maxPrecision - 1;

// The bound from the formula above plus the extra part for multiplication,
// hence the leading 2 rather than 1.
const unsigned int maxPowerOfFiveParts =

    2 +

    ((maxPowerOfFiveExponent * 815) / (351 * APFloatBase::integerPartWidth));


/// Returns the precision of \p semantics: the number of significand bits,
/// including the integer bit.
unsigned int APFloatBase::semanticsPrecision(const fltSemantics &semantics) {

  return semantics.precision;

}


/// Returns the maxExponent member of \p semantics, i.e. the largest E such
/// that 2^E is representable.
APFloatBase::ExponentType


APFloatBase::semanticsMaxExponent(const fltSemantics &semantics) {

  return semantics.maxExponent;

}


/// Returns the minExponent member of \p semantics, i.e. the smallest E such
/// that 2^E is a normalized number.
APFloatBase::ExponentType


APFloatBase::semanticsMinExponent(const fltSemantics &semantics) {

  return semantics.minExponent;

}


/// Returns the sizeInBits member of \p semantics: the number of bits actually
/// used by the format.
unsigned int APFloatBase::semanticsSizeInBits(const fltSemantics &semantics) {

  return semantics.sizeInBits;

}


/// Returns the minimum integer bit width able to hold the largest value of
/// \p semantics.
///
/// The largest value is pow(2, MaxExponent) * (1 + MaxFraction), which needs
/// one bit more than MaxExponent.  When \p isSigned is true a further bit is
/// reserved for the sign.
unsigned int APFloatBase::semanticsIntSizeInBits(const fltSemantics &semantics,
                                                 bool isSigned) {
  const unsigned int MagnitudeBits = semanticsMaxExponent(semantics) + 1;
  return isSigned ? MagnitudeBits + 1 : MagnitudeBits;
}


/// Returns whether \p semantics has an encoding for zero (its hasZero flag).
bool APFloatBase::semanticsHasZero(const fltSemantics &semantics) {

  return semantics.hasZero;

}


/// Returns whether \p semantics can represent signed values (its
/// hasSignedRepr flag).
bool APFloatBase::semanticsHasSignedRepr(const fltSemantics &semantics) {

  return semantics.hasSignedRepr;

}


/// Returns whether \p semantics can represent infinity.  Of the three
/// fltNonfiniteBehavior variants only IEEE754 has an Inf encoding.
bool APFloatBase::semanticsHasInf(const fltSemantics &semantics) {

  return semantics.nonFiniteBehavior == fltNonfiniteBehavior::IEEE754;

}


/// Returns whether \p semantics can represent NaN, which is the case for
/// every fltNonfiniteBehavior variant except FiniteOnly.
bool APFloatBase::semanticsHasNaN(const fltSemantics &semantics) {

  return semantics.nonFiniteBehavior != fltNonfiniteBehavior::FiniteOnly;

}


/// Returns true when the enumerator of \p semantics compares less than or
/// equal to S_IEEEquad.
/// NOTE(review): which formats that covers depends on the declaration order of
/// the Semantics enum, which is not visible in this file -- confirm there.
bool APFloatBase::isIEEELikeFP(const fltSemantics &semantics) {

  // Keep in sync with Type::isIEEELikeFPTy

  return SemanticsToEnum(semantics) <= S_IEEEquad;

}


/// Returns whether the sign bit of \p semantics is its most significant bit
/// (its hasSignBitInMSB flag).
bool APFloatBase::hasSignBitInMSB(const fltSemantics &semantics) {

  return semantics.hasSignBitInMSB;

}


/// Returns true when \p Dst has a strictly larger exponent range than \p Src
/// on both ends and at least as much precision.
bool APFloatBase::isRepresentableAsNormalIn(const fltSemantics &Src,
                                            const fltSemantics &Dst) {
  // The destination exponent range must be strictly larger in both
  // directions.
  const bool DstRangeIsWider = Dst.maxExponent > Src.maxExponent &&
                               Dst.minExponent < Src.minExponent;

  // If the mantissa is long enough, the result value could still be denormal
  // with a larger exponent range.
  //
  // FIXME: This condition is probably not accurate but also shouldn't be a
  // practical concern with existing types.
  const bool DstHoldsMantissa = Dst.precision >= Src.precision;

  return DstRangeIsWider && DstHoldsMantissa;
}


/// Returns the sizeInBits member of \p Sem; same value as
/// semanticsSizeInBits.
unsigned APFloatBase::getSizeInBits(const fltSemantics &Sem) {

  return Sem.sizeInBits;

}


/// Returns the exponent value used for zero in \p semantics: one below the
/// minimum exponent.
static constexpr APFloatBase::ExponentType


exponentZero(const fltSemantics &semantics) {

  return semantics.minExponent - 1;

}


/// Returns the exponent value used for infinity in \p semantics: one above
/// the maximum exponent.
static constexpr APFloatBase::ExponentType


exponentInf(const fltSemantics &semantics) {

  return semantics.maxExponent + 1;

}


/// Returns the exponent value used for NaN in \p semantics.
///
/// For NanOnly semantics the result depends on the encoding: the
/// NegativeZero encoding uses the zero exponent, and any other encoding with
/// a signed representation uses the maximum exponent.  Everything else uses
/// one above the maximum exponent.
static constexpr APFloatBase::ExponentType
exponentNaN(const fltSemantics &semantics) {
  const bool IsNanOnly =
      semantics.nonFiniteBehavior == fltNonfiniteBehavior::NanOnly;

  if (IsNanOnly && semantics.nanEncoding == fltNanEncoding::NegativeZero)
    return exponentZero(semantics);
  if (IsNanOnly && semantics.hasSignedRepr)
    return semantics.maxExponent;
  return semantics.maxExponent + 1;
}


/* A bunch of private, handy routines.  */


/// Wraps the message \p Err in a StringError carrying
/// inconvertibleErrorCode() and returns it as an Error.
static inline Error createError(const Twine &Err) {

  return make_error<StringError>(Err, inconvertibleErrorCode());

}


/// Returns the number of integerParts needed to hold \p bits bits: the bit
/// count divided by the part width, rounded up, and never less than one.
static constexpr inline unsigned int partCountForBits(unsigned int bits) {
  const unsigned int width = APFloatBase::integerPartWidth;
  const unsigned int roundedUp = (bits + width - 1) / width;
  return roundedUp < 1u ? 1u : roundedUp;
}


/* Map a character code to its decimal digit value.  Results in the range
   0U-9U are digits; because the subtraction is unsigned, every other
   character produces a value >= 10U.  */
static inline unsigned int decDigitValue(unsigned int c) {
  const unsigned int zero = '0';
  return c - zero;
}


/* Return the value of a decimal exponent of the form
   [+-]ddddddd.

   An empty range, or a range holding only a sign, is treated as an exponent
   of 0.  Any non-digit character after the optional sign yields an
   "Invalid character in exponent" error.

   If the exponent overflows, returns a large exponent with the
   appropriate sign; the characters after the point of overflow are not
   examined.  */
static Expected<int> readExponent(StringRef::iterator begin,
                                  StringRef::iterator end) {
  const unsigned int overlargeExponent = 24000;  /* FIXME.  */
  StringRef::iterator p = begin;

  // Treat no exponent as 0 to match binutils
  if (p == end || ((*p == '-' || *p == '+') && (p + 1) == end))
    return 0;

  const bool isNegative = (*p == '-');
  // A sign with nothing after it was handled above, so at least one
  // character is guaranteed to follow the sign here.
  if (*p == '-' || *p == '+')
    ++p;

  unsigned int absExponent = decDigitValue(*p++);
  if (absExponent >= 10U)
    return createError("Invalid character in exponent");

  for (; p != end; ++p) {
    const unsigned int value = decDigitValue(*p);
    if (value >= 10U)
      return createError("Invalid character in exponent");

    absExponent = absExponent * 10U + value;
    // Saturate rather than risk wrapping on very long digit strings.
    if (absExponent >= overlargeExponent) {
      absExponent = overlargeExponent;
      break;
    }
  }

  return isNegative ? -static_cast<int>(absExponent)
                    : static_cast<int>(absExponent);
}


/* Parse a decimal exponent of the form [+-]ddd from [P, END) and add
   EXPONENTADJUSTMENT to it.

   An empty range, or a sign with nothing after it, is an error, as is any
   non-digit character met while parsing.  The result saturates to the
   range [-32768, 32767]: if the parsed magnitude, the adjustment, or their
   sum falls outside it, the function returns -32768 when the exponent text
   was negative and 32767 otherwise.  Characters after the point where the
   magnitude overflows are not examined.  */
static Expected<int> totalExponent(StringRef::iterator p,
                                   StringRef::iterator end,
                                   int exponentAdjustment) {
  constexpr int largest = 32767;
  constexpr int smallest = -32768;

  if (p == end)
    return createError("Exponent has no digits");

  const bool negative = (*p == '-');
  if (negative || *p == '+') {
    ++p;
    if (p == end)
      return createError("Exponent has no digits");
  }

  int magnitude = 0;
  bool saturated = false;
  while (p != end) {
    const unsigned int digit = decDigitValue(*p);
    if (digit >= 10U)
      return createError("Invalid character in exponent");

    magnitude = magnitude * 10 + digit;
    if (magnitude > largest) {
      saturated = true;
      break;
    }
    ++p;
  }

  if (exponentAdjustment > largest || exponentAdjustment < smallest)
    saturated = true;

  int exponent = 0;
  if (!saturated) {
    exponent = (negative ? -magnitude : magnitude) + exponentAdjustment;
    saturated = exponent > largest || exponent < smallest;
  }

  if (saturated)
    return negative ? smallest : largest;
  return exponent;
}


/// Skips leading '0' characters in [begin, end), then at most one '.', then
/// any '0' characters that follow it.
///
/// \p dot receives the position of that '.', or \p end if none was consumed.
/// Returns the first character not skipped.  A range consisting of a lone
/// "." is rejected with "Significand has no digits".
static Expected<StringRef::iterator>
skipLeadingZeroesAndAnyDot(StringRef::iterator begin, StringRef::iterator end,
                           StringRef::iterator *dot) {
  const auto pastZeroes = [end](StringRef::iterator it) {
    while (it != end && *it == '0')
      ++it;
    return it;
  };

  *dot = end;
  StringRef::iterator cursor = pastZeroes(begin);
  if (cursor == end || *cursor != '.')
    return cursor;

  *dot = cursor;
  if (end - begin == 1)
    return createError("Significand has no digits");

  return pastZeroes(cursor + 1);
}


/* Given a normal decimal floating point number of the form


     dddd.dddd[eE][+-]ddd


   where the decimal point and exponent are optional, fill out the

   structure D.  Exponent is appropriate if the significand is

   treated as an integer, and normalizedExponent if the significand

   is taken to have the decimal point after a single leading

   non-zero digit.


   If the value is zero, D->firstSigDigit points to a non-digit, and

   the return exponent is zero.

*/


struct decimalInfo {

  /* First significant digit of the significand, after leading zeroes and
     any decimal point among them have been skipped.  */
  const char *firstSigDigit;

  /* Last significant digit of the significand, once trailing zeroes have
     been dropped.  */
  const char *lastSigDigit;

  /* Decimal exponent when the significant digits are read as an integer.  */
  int exponent;

  /* Decimal exponent when the decimal point follows the first significant
     digit.  */
  int normalizedExponent;

};


/* Parse the decimal number in [BEGIN, END) and fill out D.

   Returns an error if the significand holds more than one '.', contains a
   character that is neither a digit, '.', nor the 'e'/'E' that starts the
   exponent, has no digits before the exponent marker, or if the exponent
   itself fails to parse.  */
static Error interpretDecimal(StringRef::iterator begin,

                              StringRef::iterator end, decimalInfo *D) {

  StringRef::iterator dot = end;


  auto PtrOrErr = skipLeadingZeroesAndAnyDot(begin, end, &dot);

  if (!PtrOrErr)

    return PtrOrErr.takeError();

  StringRef::iterator p = *PtrOrErr;


  D->firstSigDigit = p;

  D->exponent = 0;

  D->normalizedExponent = 0;


  /* Scan the remaining significand digits, remembering where the single
     permitted decimal point is; stop at the first other non-digit.  */
  for (; p != end; ++p) {

    if (*p == '.') {

      if (dot != end)

        return createError("String contains multiple dots");

      dot = p++;

      if (p == end)

        break;

    }

    if (decDigitValue(*p) >= 10U)

      break;

  }


  /* Anything left over must be an exponent.  */
  if (p != end) {

    if (*p != 'e' && *p != 'E')

      return createError("Invalid character in significand");

    if (p == begin)

      return createError("Significand has no digits");

    /* A lone "." in front of the exponent marker.  */
    if (dot != end && p - begin == 1)

      return createError("Significand has no digits");


    /* p points to the first non-digit in the string */

    auto ExpOrErr = readExponent(p + 1, end);

    if (!ExpOrErr)

      return ExpOrErr.takeError();

    D->exponent = *ExpOrErr;


    /* Implied decimal point?  */

    if (dot == end)

      dot = p;

  }


  /* If number is all zeroes accept any exponent.  */

  if (p != D->firstSigDigit) {

    /* Drop insignificant trailing zeroes.  */

    if (p != begin) {

      /* The inner loop steps back over zeroes; the outer loop repeats it
         when the character reached is the decimal point.  */
      do

        do

          p--;

        while (p != begin && *p == '0');

      while (p != begin && *p == '.');

    }


    /* Adjust the exponents for any decimal point.  */

    D->exponent += static_cast<APFloat::ExponentType>((dot - p) - (dot > p));

    D->normalizedExponent = (D->exponent +

              static_cast<APFloat::ExponentType>((p - D->firstSigDigit)

                                      - (dot > D->firstSigDigit && dot < p)));

  }


  D->lastSigDigit = p;

  return Error::success();

}


/* Classify the fraction that is lost when a hexadecimal number is
   truncated.  DIGITVALUE is the first discarded hex digit and P points to
   the character after it.

   Any first digit other than 0 or 8 settles the answer at once.  Otherwise
   the following '0' and '.' characters are skipped: if the next character
   is not a hex digit the fraction is exactly zero (first digit 0) or
   exactly one half (first digit 8), and if it is a hex digit the fraction
   is slightly larger.  Reaching END while skipping is an error.  */
static Expected<lostFraction>
trailingHexadecimalFraction(StringRef::iterator p, StringRef::iterator end,
                            unsigned int digitValue) {
  if (digitValue != 0 && digitValue != 8)
    return digitValue > 8 ? lfMoreThanHalf : lfLessThanHalf;

  // The first digit is 0 or 8, so later digits decide the result.
  const bool firstDigitIsZero = (digitValue == 0);

  for (; p != end; ++p)
    if (*p != '0' && *p != '.')
      break;

  if (p == end)
    return createError("Invalid trailing hexadecimal fraction!");

  const bool noFurtherDigit = (hexDigitValue(*p) == UINT_MAX);
  if (noFurtherDigit)
    return firstDigitIsZero ? lfExactlyZero : lfExactlyHalf;
  return firstDigitIsZero ? lfLessThanHalf : lfMoreThanHalf;
}


/* Classify the fraction that would be lost if the bignum PARTS, made of
   PARTCOUNT parts, were truncated by dropping its least significant BITS
   bits.  */
static lostFraction
lostFractionThroughTruncation(const APFloatBase::integerPart *parts,
                              unsigned int partCount,
                              unsigned int bits)
{
  const unsigned int lowestSetBit = APInt::tcLSB(parts, partCount);

  /* Nothing set among the dropped bits.  Note this is guaranteed true if
     bits == 0, or if tcLSB returned UINT_MAX.  */
  if (bits <= lowestSetBit)
    return lfExactlyZero;

  /* Only the topmost dropped bit is set.  */
  if (bits == lowestSetBit + 1)
    return lfExactlyHalf;

  /* Otherwise the topmost dropped bit, when it lies inside the bignum,
     decides between more and less than half.  */
  const unsigned int totalBits = partCount * APFloatBase::integerPartWidth;
  if (bits > totalBits || !APInt::tcExtractBit(parts, bits - 1))
    return lfLessThanHalf;

  return lfMoreThanHalf;
}


/* Shift the PARTS-part bignum DST right by BITS bits in place and return
   the fraction lost by doing so.  The lost fraction is computed before the
   shift, while the bits are still present.  */
static lostFraction
shiftRight(APFloatBase::integerPart *dst, unsigned int parts, unsigned int bits)
{
  const lostFraction discarded =
      lostFractionThroughTruncation(dst, parts, bits);
  APInt::tcShiftRight(dst, parts, bits);
  return discarded;
}


/* Combine the effect of two lost fractions.  A non-zero LESSSIGNIFICANT
   fraction nudges an exact MORESIGNIFICANT result upwards: exactly zero
   becomes less than half and exactly half becomes more than half.  Every
   other combination returns MORESIGNIFICANT unchanged.  */
static lostFraction
combineLostFractions(lostFraction moreSignificant,
                     lostFraction lessSignificant)
{
  if (lessSignificant == lfExactlyZero)
    return moreSignificant;

  switch (moreSignificant) {
  case lfExactlyZero:
    return lfLessThanHalf;
  case lfExactlyHalf:
    return lfMoreThanHalf;
  default:
    return moreSignificant;
  }
}


/* Returns a bound, in half-ulps, that is strictly greater than the error of
   a product of two floating point numbers whose own errors are at most
   HUERR1 and HUERR2 half-ulps.  INEXACTMULTIPLY says whether the
   multiplication itself was inexact.

   See "How to Read Floating Point Numbers Accurately" by William D
   Clinger.  */
static unsigned int
HUerrBound(bool inexactMultiply, unsigned int HUerr1, unsigned int HUerr2)
{
  assert(HUerr1 < 2 || HUerr2 < 2 || (HUerr1 + HUerr2 < 8));

  const unsigned int inexact = inexactMultiply ? 1U : 0U;
  const unsigned int operandError = HUerr1 + HUerr2;

  /* With exact operands only the multiplication can contribute:
     <= inexactMultiply half-ulps.  */
  if (operandError == 0)
    return 2 * inexact;

  return inexact + 2 * operandError;
}


/* The number of ulps from the boundary (zero, or half if ISNEAREST)

   when the least significant BITS are truncated.  BITS cannot be

   zero.

   Distances that do not fit the cases handled below are reported as the
   all-ones value, meaning "a lot".  */

static APFloatBase::integerPart


ulpsFromBoundary(const APFloatBase::integerPart *parts, unsigned int bits,

                 bool isNearest) {

  unsigned int count, partBits;

  APFloatBase::integerPart part, boundary;


  assert(bits != 0);


  /* COUNT is the index of the part holding the highest truncated bit, and
     PARTBITS the number of truncated bits that lie within that part.  */
  bits--;

  count = bits / APFloatBase::integerPartWidth;

  partBits = bits % APFloatBase::integerPartWidth + 1;


  /* The truncated bits of the top part, with the bits above them masked
     off.  */
  part = parts[count] & (~(APFloatBase::integerPart) 0 >> (APFloatBase::integerPartWidth - partBits));


  /* The boundary is the highest truncated bit alone (one half) when
     rounding to nearest, and zero otherwise.  */
  if (isNearest)

    boundary = (APFloatBase::integerPart) 1 << (partBits - 1);

  else

    boundary = 0;


  /* Everything truncated lives in one part: return the smaller of the two
     wrapped unsigned differences, i.e. the absolute distance.  */
  if (count == 0) {

    if (part - boundary <= boundary - part)

      return part - boundary;

    else

      return boundary - part;

  }


  if (part == boundary) {

    /* The top part sits exactly on the boundary, so parts count-1 down to 1
       must all be zero for the distance to fit in parts[0].  */
    while (--count)

      if (parts[count])

        return ~(APFloatBase::integerPart) 0; /* A lot.  */


    return parts[0];

  } else if (part == boundary - 1) {

    /* The top part is one below the boundary, so parts count-1 down to 1
       must be all ones; the distance is then the negation of parts[0].  */
    while (--count)

      if (~parts[count])

        return ~(APFloatBase::integerPart) 0; /* A lot.  */


    return -parts[0];

  }


  return ~(APFloatBase::integerPart) 0; /* A lot.  */

}


/* Place pow(5, power) in DST, and return the number of parts used.

   DST must be at least one part larger than size of the answer.

   The low three bits of POWER are looked up in a table; the remaining bits
   are handled by binary exponentiation, repeatedly squaring pow(5, 8).  */

static unsigned int


powerOf5(APFloatBase::integerPart *dst, unsigned int power) {

  static const APFloatBase::integerPart firstEightPowers[] = { 1, 5, 25, 125, 625, 3125, 15625, 78125 };

  /* Holds the successive squarings back to back, starting with
     pow(5, 8).  */
  APFloatBase::integerPart pow5s[maxPowerOfFiveParts * 2 + 5];

  pow5s[0] = 78125 * 5;


  /* Number of parts in the power that POW5 currently refers to.  */
  unsigned int partsCount = 1;

  APFloatBase::integerPart scratch[maxPowerOfFiveParts], *p1, *p2, *pow5;

  unsigned int result;

  assert(power <= maxExponent);


  /* P1 holds the running product and P2 is the multiplication target; the
     two are swapped after every multiplication.  */
  p1 = dst;

  p2 = scratch;


  *p1 = firstEightPowers[power & 7];

  power >>= 3;


  /* Number of parts in the running product.  */
  result = 1;

  pow5 = pow5s;


  for (unsigned int n = 0; power; power >>= 1, n++) {

    /* Calculate pow(5,pow(2,n+3)) if we haven't yet.  The previous power
       occupies the PARTSCOUNT parts just below POW5; square it into
       POW5.  */

    if (n != 0) {

      APInt::tcFullMultiply(pow5, pow5 - partsCount, pow5 - partsCount,

                            partsCount, partsCount);

      partsCount *= 2;

      /* Drop the top part if the square did not need it.  */
      if (pow5[partsCount - 1] == 0)

        partsCount--;

    }


    if (power & 1) {

      APFloatBase::integerPart *tmp;


      APInt::tcFullMultiply(p2, p1, pow5, result, partsCount);

      result += partsCount;

      if (p2[result - 1] == 0)

        result--;


      /* The product is now in p2 with RESULT parts.  Swap the pointers so
         that p1 refers to it and p2 becomes scratch

         space.  */

      tmp = p1;

      p1 = p2;

      p2 = tmp;

    }


    /* Step past the power just used so the next squaring lands after it.  */
    pow5 += partsCount;

  }


  /* An odd number of swaps leaves the answer in SCRATCH; copy it out.  */
  if (p1 != dst)

    APInt::tcAssign(dst, p1, result);


  return result;

}


/* Hexadecimal digit tables indexed by nibble value.  Zero at the end to
   avoid modular arithmetic when adding one; used

   when rounding up during hexadecimal output.  */

static const char hexDigitsLower[] = "0123456789abcdef0";

static const char hexDigitsUpper[] = "0123456789ABCDEF0";

/* Spellings of infinity and NaN, in lower and upper case.  */
static const char infinityL[] = "infinity";

static const char infinityU[] = "INFINITY";

static const char NaNL[] = "nan";

static const char NaNU[] = "NAN";


/* Write the COUNT most significant nibbles of PART to DST as hexadecimal
   characters taken from HEXDIGITCHARS, most significant nibble first.
   Exactly COUNT characters are written and no terminator is added.
   Returns COUNT.  */
static unsigned int
partAsHex (char *dst, APFloatBase::integerPart part, unsigned int count,
           const char *hexDigitChars)
{
  assert(count != 0 && count <= APFloatBase::integerPartWidth / 4);

  /* Discard the low nibbles that are not printed.  */
  part >>= (APFloatBase::integerPartWidth - 4 * count);

  /* Fill from the right: the lowest remaining nibble is the last
     character.  */
  for (unsigned int pos = count; pos != 0; part >>= 4)
    dst[--pos] = hexDigitChars[part & 0xf];

  return count;
}


/* Write N to DST as an unsigned decimal integer, without a terminating
   NUL.  Returns a pointer just past the last character written.  */
static char *
writeUnsignedDecimal (char *dst, unsigned int n)
{
  /* Count the digits first so they can be stored straight into place.  */
  unsigned int digits = 1;
  for (unsigned int rest = n / 10; rest != 0; rest /= 10)
    ++digits;

  char *const finish = dst + digits;

  /* Emit the least significant digit first, walking backwards.  */
  for (char *out = finish; out != dst; n /= 10)
    *--out = '0' + n % 10;

  return finish;
}


/* Write VALUE to DST as a signed decimal integer: a leading '-' for
   negative values, then the magnitude.  Returns a pointer just past the
   last character written.  */
static char *
writeSignedDecimal (char *dst, int value)
{
  if (value >= 0)
    return writeUnsignedDecimal(dst, value);

  *dst++ = '-';
  /* Negate after converting to unsigned so the most negative int is
     handled as well.  */
  return writeUnsignedDecimal(dst, -static_cast<unsigned>(value));
}


// Compute the ULP of the input using a definition from:
// Jean-Michel Muller. On the definition of ulp(x). [Research Report] RR-5504,
// LIP RR-2005-09, INRIA, LIP. 2005, pp.16. inria-00070503
//
// NaN yields a quiet NaN and infinity yields infinity.  Zero, denormals and
// the smallest normalized value all yield the smallest value of the
// semantics.  Any other value yields one scaled by its exponent minus
// (precision - 1); that exponent is lowered by one first whenever
// getExactLog2() reports something other than INT_MIN.
static APFloat harrisonUlp(const APFloat &X) {
  const fltSemantics &Sem = X.getSemantics();
  const auto Category = X.getCategory();

  if (Category == APFloat::fcNaN)
    return APFloat::getQNaN(Sem);
  if (Category == APFloat::fcInfinity)
    return APFloat::getInf(Sem);
  if (Category == APFloat::fcZero || X.isDenormal() ||
      X.isSmallestNormalized())
    return APFloat::getSmallest(Sem);

  int Exp = ilogb(X);
  const bool HasExactLog2 = X.getExactLog2() != INT_MIN;
  if (HasExactLog2)
    --Exp;

  return scalbn(APFloat::getOne(Sem), Exp - (Sem.precision - 1),
                APFloat::rmNearestTiesToEven);
}


namespace detail {

/* Constructors.  */

/// Adopts \p ourSemantics and, when the significand needs more than one
/// part, allocates the array that holds it.  The parts are left
/// uninitialized.
void IEEEFloat::initialize(const fltSemantics *ourSemantics) {
  semantics = ourSemantics;

  // partCount() must be read after the semantics have been stored.
  const unsigned int numParts = partCount();
  if (numParts > 1)
    significand.parts = new integerPart[numParts];
}


/// Releases the significand array when needsCleanup() reports that one is
/// owned; otherwise does nothing.
void IEEEFloat::freeSignificand() {
  if (!needsCleanup())
    return;
  delete[] significand.parts;
}


void IEEEFloat::assign(const IEEEFloat &rhs) {

  assert(semantics == rhs.semantics);


  sign = rhs.sign;

  category = rhs.category;

  exponent = rhs.exponent;

  if (isFiniteNonZero() || category == fcNaN)

    copySignificand(rhs);

}


void IEEEFloat::copySignificand(const IEEEFloat &rhs) {

  assert(isFiniteNonZero() || category == fcNaN);

  assert(rhs.partCount() >= partCount());


  APInt::tcAssign(significandParts(), rhs.significandParts(),

                  partCount());

}


/* Make this number a NaN.

   SNaN selects a signalling rather than a quiet NaN, Negative sets the
   sign, and FILL, when non-null, supplies the payload bits of the
   significand.  For NanOnly semantics the request is overridden: the
   result is always quiet and the payload is fixed by the NaN encoding.

   Must not be called for semantics without NaN, nor with Negative set for
   semantics without a signed representation.  */


void IEEEFloat::makeNaN(bool SNaN, bool Negative, const APInt *fill) {

  if (semantics->nonFiniteBehavior == fltNonfiniteBehavior::FiniteOnly)

    llvm_unreachable("This floating point format does not support NaN");


  if (Negative && !semantics->hasSignedRepr)

    llvm_unreachable(

        "This floating point format does not support signed values");


  category = fcNaN;

  sign = Negative;

  exponent = exponentNaN();


  integerPart *significand = significandParts();

  unsigned numParts = partCount();


  APInt fill_storage;

  if (semantics->nonFiniteBehavior == fltNonfiniteBehavior::NanOnly) {

    // NaN-only types do not distinguish signalling and quiet NaN, so

    // make them all quiet.

    SNaN = false;

    if (semantics->nanEncoding == fltNanEncoding::NegativeZero) {

      // The single NaN of this encoding has the sign set and a zero payload.
      sign = true;

      fill_storage = APInt::getZero(semantics->precision - 1);

    } else {

      fill_storage = APInt::getAllOnes(semantics->precision - 1);

    }

    fill = &fill_storage;

  }


  // Set the significand bits to the fill.  Start from zero when there is no
  // fill or when it is too short to cover every part.

  if (!fill || fill->getNumWords() < numParts)

    APInt::tcSet(significand, 0, numParts);

  if (fill) {

    APInt::tcAssign(significand, fill->getRawData(),

                    std::min(fill->getNumWords(), numParts));


    // Zero out the excess bits of the significand, keeping only the low
    // precision - 1 bits of the fill.

    unsigned bitsToPreserve = semantics->precision - 1;

    unsigned part = bitsToPreserve / 64;

    bitsToPreserve %= 64;

    significand[part] &= ((1ULL << bitsToPreserve) - 1);

    for (part++; part != numParts; ++part)

      significand[part] = 0;

  }


  // The quiet bit is the second bit from the top of the significand, or bit
  // 0 when the precision is below two.
  unsigned QNaNBit =

      (semantics->precision >= 2) ? (semantics->precision - 2) : 0;


  if (SNaN) {

    // We always have to clear the QNaN bit to make it an SNaN.

    APInt::tcClearBit(significand, QNaNBit);


    // If there are no bits set in the payload, we have to set

    // *something* to make it a NaN instead of an infinity;

    // conventionally, this is the next bit down from the QNaN bit.

    if (APInt::tcIsZero(significand, numParts))

      APInt::tcSetBit(significand, QNaNBit - 1);

  } else if (semantics->nanEncoding == fltNanEncoding::NegativeZero) {

    // The only NaN is a quiet NaN, and it has no bits set in the significand.

    // Do nothing.

  } else {

    // We always have to set the QNaN bit to make it a QNaN.

    APInt::tcSetBit(significand, QNaNBit);

  }


  // For x87 extended precision, we want to make a NaN, not a

  // pseudo-NaN.  Maybe we should expose the ability to make

  // pseudo-NaNs?

  if (semantics == &APFloatBase::semX87DoubleExtended)

    APInt::tcSetBit(significand, QNaNBit + 1);

}


/// Copy assignment.  Self-assignment is a no-op.  When the semantics differ,
/// the significand storage is released and set up again for the semantics of
/// \p rhs before the value is copied.
IEEEFloat &IEEEFloat::operator=(const IEEEFloat &rhs) {
  if (this == &rhs)
    return *this;

  const bool sameSemantics = (semantics == rhs.semantics);
  if (!sameSemantics) {
    freeSignificand();
    initialize(rhs.semantics);
  }

  assign(rhs);
  return *this;
}


/// Move assignment.  Releases the significand this object currently owns,
/// takes over every field of \p rhs (including its significand storage), and
/// leaves \p rhs with the bogus semantics so that it no longer refers to
/// that storage.
///
/// Self-move is a no-op, matching the copy assignment operator.  Without the
/// guard the object would free its own significand, keep the stale pointer,
/// and end up with the bogus semantics.
IEEEFloat &IEEEFloat::operator=(IEEEFloat &&rhs) {
  if (this == &rhs)
    return *this;

  freeSignificand();

  semantics = rhs.semantics;
  significand = rhs.significand;
  exponent = rhs.exponent;
  category = rhs.category;
  sign = rhs.sign;

  rhs.semantics = &APFloatBase::semBogus;
  return *this;
}


/// Returns true for a finite non-zero value that sits at the minimum exponent
/// and whose integer bit (bit precision - 1 of the significand) is clear.
bool IEEEFloat::isDenormal() const {
  if (!isFiniteNonZero())
    return false;
  if (exponent != semantics->minExponent)
    return false;

  const unsigned IntegerBit = semantics->precision - 1;
  return APInt::tcExtractBit(significandParts(), IntegerBit) == 0;
}


/// Returns true if this is the smallest-magnitude value of the format: the
/// smallest denormal, i.e. a finite non-zero number at the minimum exponent
/// whose significand is exactly 1 (its most significant set bit is bit 0).
bool IEEEFloat::isSmallest() const {
  if (!isFiniteNonZero() || exponent != semantics->minExponent)
    return false;
  return significandMSB() == 0;
}


/// Returns true for an fcNormal value at the minimum exponent whose
/// significand has only its most significant (integer) bit set.
bool IEEEFloat::isSmallestNormalized() const {
  if (getCategory() != fcNormal)
    return false;
  if (exponent != semantics->minExponent)
    return false;
  return isSignificandAllZerosExceptMSB();
}


/// Computes the number of "high" bits of the top significand word that the
/// significand-inspection helpers fill in or mask off: the bits of the
/// precision-sized part array that lie above the fraction.
unsigned int IEEEFloat::getNumHighBits() const {
  const unsigned int Precision = semantics->precision;
  const unsigned int TotalBits =
      partCountForBits(Precision) * integerPartWidth;

  // With a precision of more than one bit, the top (integer) bit is counted
  // as a high bit as well, hence the extra one. With a precision of exactly
  // one, that single bit is the precision bit itself rather than a fraction
  // bit, so nothing extra is added.
  if (Precision > 1)
    return TotalBits - Precision + 1;
  return TotalBits - Precision;
}


bool IEEEFloat::isSignificandAllOnes() const {

  // Test if the significand excluding the integral bit is all ones. This allows

  // us to test for binade boundaries.

  const integerPart *Parts = significandParts();

  const unsigned PartCount = partCountForBits(semantics->precision);

  for (unsigned i = 0; i < PartCount - 1; i++)

    if (~Parts[i])

      return false;


  // Set the unused high bits to all ones when we compare.

  const unsigned NumHighBits = getNumHighBits();

  assert(NumHighBits <= integerPartWidth && NumHighBits > 0 &&

         "Can not have more high bits to fill than integerPartWidth");

  const integerPart HighBitFill =

    ~integerPart(0) << (integerPartWidth - NumHighBits);

  if ((semantics->precision <= 1) || (~(Parts[PartCount - 1] | HighBitFill)))

    return false;


  return true;

}


bool IEEEFloat::isSignificandAllOnesExceptLSB() const {

  // Test if the significand excluding the integral bit is all ones except for

  // the least significant bit.

  const integerPart *Parts = significandParts();


  if (Parts[0] & 1)

    return false;


  const unsigned PartCount = partCountForBits(semantics->precision);

  for (unsigned i = 0; i < PartCount - 1; i++) {

    if (~Parts[i] & ~unsigned{!i})

      return false;

  }


  // Set the unused high bits to all ones when we compare.

  const unsigned NumHighBits = getNumHighBits();

  assert(NumHighBits <= integerPartWidth && NumHighBits > 0 &&

         "Can not have more high bits to fill than integerPartWidth");

  const integerPart HighBitFill = ~integerPart(0)

                                  << (integerPartWidth - NumHighBits);

  if (~(Parts[PartCount - 1] | HighBitFill | 0x1))

    return false;


  return true;

}


bool IEEEFloat::isSignificandAllZeros() const {

  // Test if the significand excluding the integral bit is all zeros. This

  // allows us to test for binade boundaries.

  const integerPart *Parts = significandParts();

  const unsigned PartCount = partCountForBits(semantics->precision);


  for (unsigned i = 0; i < PartCount - 1; i++)

    if (Parts[i])

      return false;


  // Compute how many bits are used in the final word.

  const unsigned NumHighBits = getNumHighBits();

  assert(NumHighBits < integerPartWidth && "Can not have more high bits to "

         "clear than integerPartWidth");

  const integerPart HighBitMask = ~integerPart(0) >> NumHighBits;


  if ((semantics->precision > 1) && (Parts[PartCount - 1] & HighBitMask))

    return false;


  return true;

}


bool IEEEFloat::isSignificandAllZerosExceptMSB() const {

  const integerPart *Parts = significandParts();

  const unsigned PartCount = partCountForBits(semantics->precision);


  for (unsigned i = 0; i < PartCount - 1; i++) {

    if (Parts[i])

      return false;

  }


  const unsigned NumHighBits = getNumHighBits();

  const integerPart MSBMask = integerPart(1)

                              << (integerPartWidth - NumHighBits);

  return ((semantics->precision <= 1) || (Parts[PartCount - 1] == MSBMask));

}


/// Returns true if this is the largest-magnitude finite value of the format.
bool IEEEFloat::isLargest() const {
  const bool AtMaxExp =
      isFiniteNonZero() && exponent == semantics->maxExponent;
  const bool NaNIsAllOnes =
      semantics->nonFiniteBehavior == fltNonfiniteBehavior::NanOnly &&
      semantics->nanEncoding == fltNanEncoding::AllOnes;

  // Ordinary case: the largest value has the maximum exponent and an all-ones
  // significand.
  if (!NaNIsAllOnes)
    return AtMaxExp && isSignificandAllOnes();

  // NaN-only formats with an all-ones NaN encoding: the largest value has the
  // maximum exponent and a significand that is all ones except the LSB. If
  // the format has no significand, the exponent test alone decides.
  if (AtMaxExp && APFloat::hasSignificand(*semantics))
    return isSignificandAllOnesExceptLSB();
  return AtMaxExp;
}


bool IEEEFloat::isInteger() const {

  // This could be made more efficient; I'm going for obviously correct.

  if (!isFinite()) return false;

  IEEEFloat truncated = *this;

  truncated.roundToIntegral(rmTowardZero);

  return compare(truncated) == cmpEqual;

}


bool IEEEFloat::bitwiseIsEqual(const IEEEFloat &rhs) const {

  if (this == &rhs)

    return true;

  if (semantics != rhs.semantics ||

      category != rhs.category ||

      sign != rhs.sign)

    return false;

  if (category==fcZero || category==fcInfinity)

    return true;


  if (isFiniteNonZero() && exponent != rhs.exponent)

    return false;


  return std::equal(significandParts(), significandParts() + partCount(),

                    rhs.significandParts());

}


/// Constructs a non-negative value from the integer \p value: the integer is
/// placed in the lowest significand part with exponent precision - 1, then
/// the result is normalized with round-to-nearest-even.
IEEEFloat::IEEEFloat(const fltSemantics &ourSemantics, integerPart value) {
  initialize(&ourSemantics);

  // Significand: all zero except the lowest part, which holds the integer.
  zeroSignificand();
  significandParts()[0] = value;

  category = fcNormal;
  sign = 0;
  exponent = ourSemantics.precision - 1;

  normalize(rmNearestTiesToEven, lfExactlyZero);
}


/// Constructs the default value for \p ourSemantics: positive zero when the
/// format has a zero, otherwise the smallest normalized value.
IEEEFloat::IEEEFloat(const fltSemantics &ourSemantics) {
  initialize(&ourSemantics);

  // A format without a zero (e.g. Float8E8M0FNU) has no encoding for it, and
  // its all-zero encoding is a valid normal value, namely the smallest
  // normalized one. That value is the closest stand-in for zero, so build it
  // (category fcNormal) rather than calling makeZero (category fcZero).
  if (ourSemantics.hasZero)
    makeZero(false);
  else
    makeSmallestNormalized(false);
}


// Although tagged "uninitialized", this constructor delegates to the
// semantics-only constructor and so produces a fully formed value. The copy
// constructor may later inspect `category`, which therefore must never hold
// garbage. The tag argument itself is not used.
IEEEFloat::IEEEFloat(const fltSemantics &ourSemantics, uninitializedTag tag)
    : IEEEFloat(ourSemantics) {}


/// Copy constructor: initialize this object for \p rhs's semantics, then
/// assign \p rhs's value to it.
IEEEFloat::IEEEFloat(const IEEEFloat &rhs) {
  initialize(rhs.semantics);
  assign(rhs);
}


/// Move constructor, implemented in terms of move assignment. The object
/// starts out with semBogus semantics before the assignment runs.
/// NOTE(review): presumably this gives the freeSignificand() call made by
/// move assignment a well-defined state to inspect; confirm.
IEEEFloat::IEEEFloat(IEEEFloat &&rhs) : semantics(&APFloatBase::semBogus) {
  *this = std::move(rhs);
}


/// Destructor: frees the significand.
IEEEFloat::~IEEEFloat() {
  freeSignificand();
}


/// Number of integerPart words used for the significand: enough to hold
/// precision + 1 bits.
unsigned int IEEEFloat::partCount() const {
  const unsigned int StoredBits = semantics->precision + 1;
  return partCountForBits(StoredBits);
}


/// Const overload: forwards to the non-const accessor and returns its result
/// as a pointer to const.
const APFloat::integerPart *IEEEFloat::significandParts() const {
  IEEEFloat *Self = const_cast<IEEEFloat *>(this);
  return Self->significandParts();
}


/// Returns a pointer to the significand words: the `parts` array when more
/// than one part is needed, otherwise the address of the single inline `part`.
APFloat::integerPart *IEEEFloat::significandParts() {
  return partCount() > 1 ? significand.parts : &significand.part;
}


void IEEEFloat::zeroSignificand() {

  APInt::tcSet(significandParts(), 0, partCount());

}


/* Increment an fcNormal floating point number's significand.  */

void IEEEFloat::incrementSignificand() {

  integerPart carry;


  carry = APInt::tcIncrement(significandParts(), partCount());


  /* Our callers should never cause us to overflow.  */

  assert(carry == 0);

  (void)carry;

}


/* Add the significand of RHS to ours in place, with no incoming carry.  Both
   operands must share semantics and exponent.  Returns the carry flag.  */
APFloat::integerPart IEEEFloat::addSignificand(const IEEEFloat &rhs) {
  assert(semantics == rhs.semantics);
  assert(exponent == rhs.exponent);

  integerPart *const Dst = significandParts();
  return APInt::tcAdd(Dst, rhs.significandParts(), 0, partCount());
}


/* Subtract the significand of RHS from ours in place, taking BORROW as the
   incoming borrow flag.  Both operands must share semantics and exponent.
   Returns the outgoing borrow flag.  */
APFloat::integerPart IEEEFloat::subtractSignificand(const IEEEFloat &rhs,
                                                    integerPart borrow) {
  assert(semantics == rhs.semantics);
  assert(exponent == rhs.exponent);

  integerPart *const Dst = significandParts();
  return APInt::tcSubtract(Dst, rhs.significandParts(), borrow, partCount());
}


/* Multiply our significand by the significand of RHS, leaving the product in
   *this and adjusting the exponent to match.  Unless IGNOREADDEND is true
   (or ADDEND.isNonZero() is false), ADDEND is added on to the full-precision
   result of the multiplication before it is narrowed back to PRECISION bits.
   Returns the lost fraction.  The result is not necessarily normalized; see
   the note before the final right shift.  */
lostFraction IEEEFloat::multiplySignificand(const IEEEFloat &rhs,
                                            IEEEFloat addend,
                                            bool ignoreAddend) {
  unsigned int omsb;        // One, not zero, based MSB.
  unsigned int partsCount, newPartsCount, precision;
  integerPart *lhsSignificand;
  integerPart scratch[4];
  integerPart *fullSignificand;
  lostFraction lost_fraction;
  bool ignored;

  assert(semantics == rhs.semantics);

  precision = semantics->precision;

  // Allocate space for twice as many bits as the original significand, plus one
  // extra bit for the addition to overflow into.
  newPartsCount = partCountForBits(precision * 2 + 1);

  // Up to four parts fit in the local scratch array; anything larger is
  // heap-allocated here and deleted again just before returning.
  if (newPartsCount > 4)
    fullSignificand = new integerPart[newPartsCount];
  else
    fullSignificand = scratch;

  lhsSignificand = significandParts();
  partsCount = partCount();

  APInt::tcFullMultiply(fullSignificand, lhsSignificand,
                        rhs.significandParts(), partsCount, partsCount);

  lost_fraction = lfExactlyZero;
  omsb = APInt::tcMSB(fullSignificand, newPartsCount) + 1;
  exponent += rhs.exponent;

  // Assume the operands involved in the multiplication are single-precision
  // FP, and the two multiplicands are:
  //   *this = a23 . a22 ... a0 * 2^e1
  //     rhs = b23 . b22 ... b0 * 2^e2
  // the result of multiplication is:
  //   *this = c48 c47 c46 . c45 ... c0 * 2^(e1+e2)
  // Note that there are three significant bits at the left-hand side of the
  // radix point: two for the multiplication, and an overflow bit for the
  // addition (that will always be zero at this point). Move the radix point
  // toward left by two bits, and adjust exponent accordingly.
  exponent += 2;

  if (!ignoreAddend && addend.isNonZero()) {
    // The intermediate result of the multiplication has "2 * precision"
    // significant bits; adjust the addend to be consistent with the mul
    // result.
    //
    // For the duration of this block *this is temporarily re-pointed at the
    // wide product (fullSignificand) under a widened local semantics; the
    // saved significand and semantics are restored at the end of the block.
    Significand savedSignificand = significand;
    const fltSemantics *savedSemantics = semantics;
    fltSemantics extendedSemantics;
    opStatus status;
    unsigned int extendedPrecision;

    // Normalize our MSB to one below the top bit to allow for overflow.
    extendedPrecision = 2 * precision + 1;
    if (omsb != extendedPrecision - 1) {
      assert(extendedPrecision > omsb);
      APInt::tcShiftLeft(fullSignificand, newPartsCount,
                         (extendedPrecision - 1) - omsb);
      exponent -= (extendedPrecision - 1) - omsb;
    }

    /* Create new semantics.  */
    extendedSemantics = *semantics;
    extendedSemantics.precision = extendedPrecision;

    // A single-part significand is stored inline, so copy the value in;
    // otherwise simply point at the wide buffer.
    if (newPartsCount == 1)
      significand.part = fullSignificand[0];
    else
      significand.parts = fullSignificand;
    semantics = &extendedSemantics;

    // Make a copy so we can convert it to the extended semantics.
    // Note that we cannot convert the addend directly, as the extendedSemantics
    // is a local variable (which we take a reference to).
    IEEEFloat extendedAddend(addend);
    status = extendedAddend.convert(extendedSemantics, APFloat::rmTowardZero,
                                    &ignored);
    assert(status == APFloat::opOK);
    (void)status;

    // Shift the significand of the addend right by one bit. This guarantees
    // that the high bit of the significand is zero (same as fullSignificand),
    // so the addition will overflow (if it does overflow at all) into the top bit.
    lost_fraction = extendedAddend.shiftSignificandRight(1);
    assert(lost_fraction == lfExactlyZero &&
           "Lost precision while shifting addend for fused-multiply-add.");

    lost_fraction = addOrSubtractSignificand(extendedAddend, false);

    /* Restore our state.  */
    // In the single-part case the sum lives in the inline part, so copy it
    // back into the wide buffer before restoring the saved significand.
    if (newPartsCount == 1)
      fullSignificand[0] = significand.part;
    significand = savedSignificand;
    semantics = savedSemantics;

    omsb = APInt::tcMSB(fullSignificand, newPartsCount) + 1;
  }

  // Convert the result having "2 * precision" significant bits back to the one
  // having "precision" significant bits by moving the radix point and
  // adjusting the exponent to compensate. The statement below subtracts
  // "precision + 1"; combined with the "exponent += 2" above, the net
  // exponent adjustment for the radix-point moves is -(precision - 1).
  exponent -= precision + 1;

  // In case MSB resides at the left-hand side of radix point, shift the
  // mantissa right by some amount to make sure the MSB reside right before
  // the radix point (i.e. "MSB . rest-significant-bits").
  //
  // Note that the result is not normalized when "omsb < precision". So, the
  // caller needs to call IEEEFloat::normalize() if normalized value is
  // expected.
  if (omsb > precision) {
    unsigned int bits, significantParts;
    lostFraction lf;

    bits = omsb - precision;
    significantParts = partCountForBits(omsb);
    lf = shiftRight(fullSignificand, significantParts, bits);
    lost_fraction = combineLostFractions(lf, lost_fraction);
    exponent += bits;
  }

  // Copy the low partsCount parts of the wide result back into *this.
  APInt::tcAssign(lhsSignificand, fullSignificand, partsCount);

  if (newPartsCount > 4)
    delete [] fullSignificand;

  return lost_fraction;
}


/// Multiplies our significand by that of \p rhs without any addend, by
/// forwarding to the three-argument overload. Returns the lost fraction.
lostFraction IEEEFloat::multiplySignificand(const IEEEFloat &rhs) {
  // The placeholder addend is a default-constructed value of our semantics.
  // When the semantics has a zero, that value is a zero (category fcZero).
  // When the semantics has no zero, the addend has to be flagged explicitly
  // as one to ignore.
  const bool SkipAddend = !semantics->hasZero;
  return multiplySignificand(rhs, IEEEFloat(*semantics), SkipAddend);
}


/* Divide our significand by the significand of RHS using bit-at-a-time long
   division, leaving the quotient in *this and adjusting the exponent to
   match.  Returns the lost fraction.  */
lostFraction IEEEFloat::divideSignificand(const IEEEFloat &rhs) {
  unsigned int bit, i, partsCount;
  const integerPart *rhsSignificand;
  integerPart *lhsSignificand, *dividend, *divisor;
  integerPart scratch[4];
  lostFraction lost_fraction;

  assert(semantics == rhs.semantics);

  lhsSignificand = significandParts();
  rhsSignificand = rhs.significandParts();
  partsCount = partCount();

  // One buffer holds both working copies: the dividend in the first
  // partsCount parts and the divisor in the next partsCount.  Up to two parts
  // each fit in the local scratch array; larger sizes are heap-allocated and
  // deleted before returning.
  if (partsCount > 2)
    dividend = new integerPart[partsCount * 2];
  else
    dividend = scratch;

  divisor = dividend + partsCount;

  /* Copy the dividend and divisor as they will be modified in-place.  Our own
     significand is cleared at the same time so the quotient bits can be set
     into it below.  */
  for (i = 0; i < partsCount; i++) {
    dividend[i] = lhsSignificand[i];
    divisor[i] = rhsSignificand[i];
    lhsSignificand[i] = 0;
  }

  exponent -= rhs.exponent;

  unsigned int precision = semantics->precision;

  /* Normalize the divisor.  */
  bit = precision - APInt::tcMSB(divisor, partsCount) - 1;
  if (bit) {
    exponent += bit;
    APInt::tcShiftLeft(divisor, partsCount, bit);
  }

  /* Normalize the dividend.  */
  bit = precision - APInt::tcMSB(dividend, partsCount) - 1;
  if (bit) {
    exponent -= bit;
    APInt::tcShiftLeft(dividend, partsCount, bit);
  }

  /* Ensure the dividend >= divisor initially for the loop below.
     Incidentally, this means that the division loop below is
     guaranteed to set the integer bit to one.  */
  if (APInt::tcCompare(dividend, divisor, partsCount) < 0) {
    exponent--;
    APInt::tcShiftLeft(dividend, partsCount, 1);
    assert(APInt::tcCompare(dividend, divisor, partsCount) >= 0);
  }

  /* Long division.  Produces one quotient bit per iteration, from bit
     PRECISION - 1 down to bit 0.  */
  for (bit = precision; bit; bit -= 1) {
    if (APInt::tcCompare(dividend, divisor, partsCount) >= 0) {
      APInt::tcSubtract(dividend, divisor, 0, partsCount);
      APInt::tcSetBit(lhsSignificand, bit - 1);
    }

    APInt::tcShiftLeft(dividend, partsCount, 1);
  }

  /* Figure out the lost fraction by comparing the remaining (already
     doubled) dividend against the divisor.  */
  int cmp = APInt::tcCompare(dividend, divisor, partsCount);

  if (cmp > 0)
    lost_fraction = lfMoreThanHalf;
  else if (cmp == 0)
    lost_fraction = lfExactlyHalf;
  else if (APInt::tcIsZero(dividend, partsCount))
    lost_fraction = lfExactlyZero;
  else
    lost_fraction = lfLessThanHalf;

  if (partsCount > 2)
    delete [] dividend;

  return lost_fraction;
}


unsigned int IEEEFloat::significandMSB() const {

  return APInt::tcMSB(significandParts(), partCount());

}


unsigned int IEEEFloat::significandLSB() const {

  return APInt::tcLSB(significandParts(), partCount());

}


/* Shift the significand right BITS bits and add BITS to the exponent.
   Returns the fraction lost by the shift.  Note that a zero result is NOT
   normalized to fcZero.  */
lostFraction IEEEFloat::shiftSignificandRight(unsigned int bits) {
  /* Our exponent should not overflow.  */
  assert((ExponentType) (exponent + bits) >= exponent);
  exponent += bits;

  integerPart *Words = significandParts();
  return shiftRight(Words, partCount(), bits);
}


/* Shift the significand left BITS bits and subtract BITS from the exponent.
   A shift of zero bits is a no-op.  The shifted significand must not become
   zero; this is asserted.  */
void IEEEFloat::shiftSignificandLeft(unsigned int bits) {
  assert(bits < semantics->precision ||
         (semantics->precision == 1 && bits <= 1));

  if (bits == 0)
    return;

  unsigned int partsCount = partCount();
  APInt::tcShiftLeft(significandParts(), partsCount, bits);
  exponent -= bits;

  assert(!APInt::tcIsZero(significandParts(), partsCount));
}


/// Compares the magnitudes of two finite non-zero values that share
/// semantics: the exponents decide first, and on a tie the significands are
/// compared as unsigned bignums.
APFloat::cmpResult IEEEFloat::compareAbsoluteValue(const IEEEFloat &rhs) const {
  assert(semantics == rhs.semantics);
  assert(isFiniteNonZero());
  assert(rhs.isFiniteNonZero());

  int Delta = exponent - rhs.exponent;

  /* Equal exponents: fall back to an unsigned bignum comparison of the
     significands.  */
  if (Delta == 0)
    Delta = APInt::tcCompare(significandParts(), rhs.significandParts(),
                             partCount());

  if (Delta > 0)
    return cmpGreaterThan;
  if (Delta < 0)
    return cmpLessThan;
  return cmpEqual;
}


/* Set the least significant BITS bits of the PARTS-word bignum DST and clear
   all the remaining bits.  */
static void tcSetLeastSignificantBits(APInt::WordType *dst, unsigned parts,
                                      unsigned bits) {
  const APInt::WordType Full = ~(APInt::WordType)0;
  unsigned Idx = 0;

  /* Whole words that lie entirely within the low BITS bits.  */
  for (; bits > APInt::APINT_BITS_PER_WORD;
       bits -= APInt::APINT_BITS_PER_WORD)
    dst[Idx++] = Full;

  /* The last word that receives set bits, possibly only partly filled.  */
  if (bits != 0)
    dst[Idx++] = Full >> (APInt::APINT_BITS_PER_WORD - bits);

  /* Everything above is cleared.  */
  for (; Idx < parts; ++Idx)
    dst[Idx] = 0;
}


/* Handle overflow.  Sign is preserved.  Depending on the rounding mode and
   on what non-finite values the format has, we become infinity (or NaN for
   NaN-only formats) or the largest finite number.  */
APFloat::opStatus IEEEFloat::handleOverflow(roundingMode rounding_mode) {
  const bool HasNonFinite =
      semantics->nonFiniteBehavior != fltNonfiniteBehavior::FiniteOnly;
  const bool NanOnly =
      semantics->nonFiniteBehavior == fltNonfiniteBehavior::NanOnly;

  /* Does this rounding mode round the overflowed value away from zero?  */
  const bool RoundsAway = rounding_mode == rmNearestTiesToEven ||
                          rounding_mode == rmNearestTiesToAway ||
                          (rounding_mode == rmTowardPositive && !sign) ||
                          (rounding_mode == rmTowardNegative && sign);

  if (HasNonFinite && RoundsAway) {
    /* Formats without an infinity produce a NaN instead.  */
    if (NanOnly)
      makeNaN(false, sign);
    else
      category = fcInfinity;
    return static_cast<opStatus>(opOverflow | opInexact);
  }

  /* Otherwise we become the largest finite number.  */
  category = fcNormal;
  exponent = semantics->maxExponent;

  integerPart *Words = significandParts();
  tcSetLeastSignificantBits(Words, partCount(), semantics->precision);

  /* When NaN is the all-ones encoding, clear the lowest significand bit.  */
  if (NanOnly && semantics->nanEncoding == fltNanEncoding::AllOnes)
    APInt::tcClearBit(Words, 0);

  return opInexact;
}


/* Decides whether a truncated value has to be rounded away from zero (i.e.
   have its significand increased), given the rounding mode, the fraction
   that was lost, and BIT, the position of the new LSB.  This routine must
   work for fcZero of both signs, and fcNormal numbers.  */
bool IEEEFloat::roundAwayFromZero(roundingMode rounding_mode,
                                  lostFraction lost_fraction,
                                  unsigned int bit) const {
  /* NaNs and infinities should not have lost fractions.  */
  assert(isFiniteNonZero() || category == fcZero);

  /* Current callers never pass this so we don't handle it.  */
  assert(lost_fraction != lfExactlyZero);

  switch (rounding_mode) {
  case rmTowardZero:
    return false;

  case rmTowardPositive:
    return !sign;

  case rmTowardNegative:
    return sign;

  case rmNearestTiesToAway:
    return lost_fraction == lfExactlyHalf || lost_fraction == lfMoreThanHalf;

  case rmNearestTiesToEven:
    if (lost_fraction == lfMoreThanHalf)
      return true;

    /* Less than half always rounds down.  An exact tie on a zero does too,
       because our zeroes don't have a significand to test.  */
    if (lost_fraction != lfExactlyHalf || category == fcZero)
      return false;

    /* Exact tie: round away only if that makes the new LSB even, i.e. if it
       is currently set.  */
    return APInt::tcExtractBit(significandParts(), bit);

  default:
    break;
  }
  llvm_unreachable("Invalid rounding mode found");
}


/* Normalize a finite non-zero number and round it according to
   ROUNDING_MODE, taking into account LOST_FRACTION, the fraction already
   lost by the caller.  The significand is shifted so that its MSB sits at
   bit PRECISION where the exponent range allows it.  Overflow is delegated
   to handleOverflow, and results that end up with no set bits are
   canonicalized as zero.  Returns the resulting status flags.  Values that
   are not finite non-zero are returned unchanged with opOK.  */
APFloat::opStatus IEEEFloat::normalize(roundingMode rounding_mode,
                                       lostFraction lost_fraction) {
  unsigned int omsb;                /* One, not zero, based MSB.  */
  int exponentChange;

  if (!isFiniteNonZero())
    return opOK;

  /* Before rounding normalize the exponent of fcNormal numbers.  */
  omsb = significandMSB() + 1;

  // Only skip this `if` if the value is exactly zero.
  if (omsb || lost_fraction != lfExactlyZero) {
    /* OMSB is numbered from 1.  We want to place it in the integer
       bit numbered PRECISION if possible, with a compensating change in
       the exponent.  */
    exponentChange = omsb - semantics->precision;

    /* If the resulting exponent is too high, overflow according to
       the rounding mode.  */
    if (exponent + exponentChange > semantics->maxExponent)
      return handleOverflow(rounding_mode);

    /* Subnormal numbers have exponent minExponent, and their MSB
       is forced based on that.  */
    if (exponent + exponentChange < semantics->minExponent)
      exponentChange = semantics->minExponent - exponent;

    /* Shifting left is easy as we don't lose precision.  */
    if (exponentChange < 0) {
      assert(lost_fraction == lfExactlyZero);

      shiftSignificandLeft(-exponentChange);

      return opOK;
    }

    if (exponentChange > 0) {
      lostFraction lf;

      /* Shift right and capture any new lost fraction.  */
      lf = shiftSignificandRight(exponentChange);

      lost_fraction = combineLostFractions(lf, lost_fraction);

      /* Keep OMSB up-to-date.  */
      if (omsb > (unsigned) exponentChange)
        omsb -= exponentChange;
      else
        omsb = 0;
    }
  }

  // The all-ones values is an overflow if NaN is all ones. If NaN is
  // represented by negative zero, then it is a valid finite value.
  if (semantics->nonFiniteBehavior == fltNonfiniteBehavior::NanOnly &&
      semantics->nanEncoding == fltNanEncoding::AllOnes &&
      exponent == semantics->maxExponent && isSignificandAllOnes())
    return handleOverflow(rounding_mode);

  /* Now round the number according to rounding_mode given the lost
     fraction.  */

  /* As specified in IEEE 754, since we do not trap we do not report
     underflow for exact results.  */
  if (lost_fraction == lfExactlyZero) {
    /* Canonicalize zeroes.  */
    if (omsb == 0) {
      category = fcZero;
      // Formats that encode NaN as negative zero only have a positive zero.
      if (semantics->nanEncoding == fltNanEncoding::NegativeZero)
        sign = false;
      // Formats without a zero use the smallest normalized value instead.
      if (!semantics->hasZero)
        makeSmallestNormalized(false);
    }

    return opOK;
  }

  /* Increment the significand if we're rounding away from zero.  */
  if (roundAwayFromZero(rounding_mode, lost_fraction, 0)) {
    // No set bits at all: the increment below produces the smallest
    // denormal, which lives at the minimum exponent.
    if (omsb == 0)
      exponent = semantics->minExponent;

    incrementSignificand();
    omsb = significandMSB() + 1;

    /* Did the significand increment overflow?  */
    if (omsb == (unsigned) semantics->precision + 1) {
      /* Renormalize by incrementing the exponent and shifting our
         significand right one.  However if we already have the
         maximum exponent we overflow to infinity.  */
      if (exponent == semantics->maxExponent)
        // Invoke overflow handling with a rounding mode that will guarantee
        // that the result gets turned into the correct infinity representation.
        // This is needed instead of just setting the category to infinity to
        // account for 8-bit floating point types that have no inf, only NaN.
        return handleOverflow(sign ? rmTowardNegative : rmTowardPositive);

      shiftSignificandRight(1);

      return opInexact;
    }

    // The all-ones values is an overflow if NaN is all ones. If NaN is
    // represented by negative zero, then it is a valid finite value.
    if (semantics->nonFiniteBehavior == fltNonfiniteBehavior::NanOnly &&
        semantics->nanEncoding == fltNanEncoding::AllOnes &&
        exponent == semantics->maxExponent && isSignificandAllOnes())
      return handleOverflow(rounding_mode);
  }

  /* The normal case - we were and are not denormal, and any
     significand increment above didn't overflow.  */
  if (omsb == semantics->precision)
    return opInexact;

  /* From here on the result is a denormal, or a denormal that was rounded
     down to zero (omsb == 0).  */
  assert(omsb < semantics->precision);

  /* Canonicalize zeroes.  */
  if (omsb == 0) {
    category = fcZero;
    // Formats that encode NaN as negative zero only have a positive zero.
    if (semantics->nanEncoding == fltNanEncoding::NegativeZero)
      sign = false;
    // This condition handles the case where the semantics
    // does not have zero but uses the all-zero encoding
    // to represent the smallest normal value.
    if (!semantics->hasZero)
      makeSmallestNormalized(false);
  }

  /* The fcZero case is a denormal that underflowed to zero.  */
  return (opStatus) (opUnderflow | opInexact);
}


/* Handle the operand-category combinations of an addition (SUBTRACT false)
   or subtraction (SUBTRACT true) of RHS that need no significand arithmetic,
   updating *this in place and returning the operation status.  The
   (fcNormal, fcNormal) combination is not resolved here; see the last
   case.  */
APFloat::opStatus IEEEFloat::addOrSubtractSpecials(const IEEEFloat &rhs,
                                                   bool subtract) {
  switch (PackCategoriesIntoKey(category, rhs.category)) {
  default:
    llvm_unreachable(nullptr);

  // Only RHS is a NaN: the result takes RHS's value, then goes through the
  // common NaN handling below.
  case PackCategoriesIntoKey(fcZero, fcNaN):
  case PackCategoriesIntoKey(fcNormal, fcNaN):
  case PackCategoriesIntoKey(fcInfinity, fcNaN):
    assign(rhs);
    [[fallthrough]];
  // *this is (now) a NaN.  A signaling NaN is quieted and reported as an
  // invalid operation; otherwise the operation is only invalid if RHS is
  // signaling.
  case PackCategoriesIntoKey(fcNaN, fcZero):
  case PackCategoriesIntoKey(fcNaN, fcNormal):
  case PackCategoriesIntoKey(fcNaN, fcInfinity):
  case PackCategoriesIntoKey(fcNaN, fcNaN):
    if (isSignaling()) {
      makeQuiet();
      return opInvalidOp;
    }
    return rhs.isSignaling() ? opInvalidOp : opOK;

  // *this is left unchanged for these combinations.
  case PackCategoriesIntoKey(fcNormal, fcZero):
  case PackCategoriesIntoKey(fcInfinity, fcNormal):
  case PackCategoriesIntoKey(fcInfinity, fcZero):
    return opOK;

  // Finite op infinity: the result is an infinity whose sign is RHS's sign,
  // flipped when subtracting.
  case PackCategoriesIntoKey(fcNormal, fcInfinity):
  case PackCategoriesIntoKey(fcZero, fcInfinity):
    category = fcInfinity;
    sign = rhs.sign ^ subtract;
    return opOK;

  // Zero op normal: the result is RHS, with its sign flipped when
  // subtracting.
  case PackCategoriesIntoKey(fcZero, fcNormal):
    assign(rhs);
    sign = rhs.sign ^ subtract;
    return opOK;

  case PackCategoriesIntoKey(fcZero, fcZero):
    /* Sign depends on rounding mode; handled by caller.  */
    return opOK;

  case PackCategoriesIntoKey(fcInfinity, fcInfinity):
    /* Differently signed infinities can only be validly
       subtracted.  */
    if (((sign ^ rhs.sign)!=0) != subtract) {
      makeNaN();
      return opInvalidOp;
    }

    return opOK;

  // NOTE(review): opDivByZero cannot be a genuine status of an addition, so
  // it presumably serves as a marker telling the caller that both operands
  // are normal and significand arithmetic is required -- confirm against the
  // callers.
  case PackCategoriesIntoKey(fcNormal, fcNormal):
    return opDivByZero;
  }
}


/* Add or subtract two normal numbers.  The significand of RHS is added to or
   subtracted from ours after the two have been aligned to a common exponent;
   the sign of *this is flipped when the magnitude subtraction ends up
   reversed.  Returns the fraction lost while aligning the operands.  */
lostFraction IEEEFloat::addOrSubtractSignificand(const IEEEFloat &rhs,
                                                 bool subtract) {
  integerPart carry = 0;
  lostFraction lost_fraction;
  int bits;

  /* Determine if the operation on the absolute values is effectively
     an addition or subtraction.  */
  subtract ^= static_cast<bool>(sign ^ rhs.sign);

  /* Are we bigger exponent-wise than the RHS?  */
  bits = exponent - rhs.exponent;

  /* Subtraction is more subtle than one might naively expect.  */
  if (subtract) {
    if ((bits < 0) && !semantics->hasSignedRepr)
      llvm_unreachable(
          "This floating point format does not support signed values");

    IEEEFloat temp_rhs(rhs);
    // Records which operand was shifted right and therefore which side the
    // lost fraction belongs to.
    bool lost_fraction_is_from_rhs = false;

    // Align the operands.  The operand with the smaller exponent is shifted
    // right by one bit less than the exponent difference and the other one
    // is shifted left by one bit.
    if (bits == 0)
      lost_fraction = lfExactlyZero;
    else if (bits > 0) {
      lost_fraction = temp_rhs.shiftSignificandRight(bits - 1);
      lost_fraction_is_from_rhs = true;
      shiftSignificandLeft(1);
    } else {
      lost_fraction = shiftSignificandRight(-bits - 1);
      temp_rhs.shiftSignificandLeft(1);
    }

    // Should we reverse the subtraction.
    cmpResult cmp_result = compareAbsoluteValue(temp_rhs);
    if (cmp_result == cmpLessThan) {
      // Reversed subtraction (rhs - this): a borrow is needed when the lost
      // fraction came from *this, which is the operand being subtracted.
      bool borrow =
          lost_fraction != lfExactlyZero && !lost_fraction_is_from_rhs;
      if (borrow) {
        // The lost fraction is being subtracted, borrow from the significand
        // and invert `lost_fraction`.
        if (lost_fraction == lfLessThanHalf)
          lost_fraction = lfMoreThanHalf;
        else if (lost_fraction == lfMoreThanHalf)
          lost_fraction = lfLessThanHalf;
      }
      carry = temp_rhs.subtractSignificand(*this, borrow);
      copySignificand(temp_rhs);
      sign = !sign;
    } else if (cmp_result == cmpGreaterThan) {
      // Straight subtraction (this - rhs): a borrow is needed when the lost
      // fraction came from rhs, which is the operand being subtracted.
      bool borrow = lost_fraction != lfExactlyZero && lost_fraction_is_from_rhs;
      if (borrow) {
        // The lost fraction is being subtracted, borrow from the significand
        // and invert `lost_fraction`.
        if (lost_fraction == lfLessThanHalf)
          lost_fraction = lfMoreThanHalf;
        else if (lost_fraction == lfMoreThanHalf)
          lost_fraction = lfLessThanHalf;
      }
      carry = subtractSignificand(temp_rhs, borrow);
    } else { // cmpEqual
      zeroSignificand();
      if (lost_fraction != lfExactlyZero && lost_fraction_is_from_rhs) {
        // rhs is slightly larger due to the lost fraction, flip the sign.
        sign = !sign;
      }
    }

    /* The code above is intended to ensure that no borrow is
       necessary.  */
    assert(!carry);
    (void)carry;
  } else {
    // Effective addition: shift the operand with the smaller exponent right
    // by the full exponent difference, then add.
    if (bits > 0) {
      IEEEFloat temp_rhs(rhs);

      lost_fraction = temp_rhs.shiftSignificandRight(bits);
      carry = addSignificand(temp_rhs);
    } else {
      lost_fraction = shiftSignificandRight(-bits);
      carry = addSignificand(rhs);
    }

    /* We have a guard bit; generating a carry cannot happen.  */
    assert(!carry);
    (void)carry;
  }

  return lost_fraction;
}


/* Handle the operand-category combinations of a multiplication by RHS,
   updating the category (and for NaNs the value and sign) of *this in place
   and returning the operation status.  For (fcNormal, fcNormal) nothing is
   changed and opOK is returned.  */
APFloat::opStatus IEEEFloat::multiplySpecials(const IEEEFloat &rhs) {
  switch (PackCategoriesIntoKey(category, rhs.category)) {
  default:
    llvm_unreachable(nullptr);

  // Only RHS is a NaN: take RHS's value.  The sign is cleared here so that
  // the xor in the shared code below leaves exactly RHS's sign.
  case PackCategoriesIntoKey(fcZero, fcNaN):
  case PackCategoriesIntoKey(fcNormal, fcNaN):
  case PackCategoriesIntoKey(fcInfinity, fcNaN):
    assign(rhs);
    sign = false;
    [[fallthrough]];
  // *this is (now) a NaN.  A signaling NaN is quieted and reported as an
  // invalid operation; otherwise the operation is only invalid if RHS is
  // signaling.
  // NOTE(review): the xor below presumably undoes a sign ^= rhs.sign that the
  // caller applied before calling this function -- confirm against the
  // caller.
  case PackCategoriesIntoKey(fcNaN, fcZero):
  case PackCategoriesIntoKey(fcNaN, fcNormal):
  case PackCategoriesIntoKey(fcNaN, fcInfinity):
  case PackCategoriesIntoKey(fcNaN, fcNaN):
    sign ^= rhs.sign; // restore the original sign
    if (isSignaling()) {
      makeQuiet();
      return opInvalidOp;
    }
    return rhs.isSignaling() ? opInvalidOp : opOK;

  // Infinity times a non-zero, non-NaN value is infinity.
  case PackCategoriesIntoKey(fcNormal, fcInfinity):
  case PackCategoriesIntoKey(fcInfinity, fcNormal):
  case PackCategoriesIntoKey(fcInfinity, fcInfinity):
    category = fcInfinity;
    return opOK;

  // Zero times a finite value is zero.
  case PackCategoriesIntoKey(fcZero, fcNormal):
  case PackCategoriesIntoKey(fcNormal, fcZero):
  case PackCategoriesIntoKey(fcZero, fcZero):
    category = fcZero;
    return opOK;

  // Zero times infinity is an invalid operation and yields a NaN.
  case PackCategoriesIntoKey(fcZero, fcInfinity):
  case PackCategoriesIntoKey(fcInfinity, fcZero):
    makeNaN();
    return opInvalidOp;

  // Two normal operands: nothing to do here.
  case PackCategoriesIntoKey(fcNormal, fcNormal):
    return opOK;
  }
}


/// Resolve every division whose result is decided by the operand categories
/// alone. A (normal, normal) pair is left untouched and reports opOK so that
/// the caller can divide the significands itself.
///
/// \returns opInvalidOp for signaling NaNs, infinity / infinity and
/// zero / zero; opDivByZero for a finite non-zero value divided by zero;
/// opOK otherwise.
APFloat::opStatus IEEEFloat::divideSpecials(const IEEEFloat &rhs) {
  const bool lhsIsNaN = category == fcNaN;
  const bool rhsIsNaN = rhs.category == fcNaN;

  if (lhsIsNaN || rhsIsNaN) {
    if (!lhsIsNaN) {
      // Only the right-hand operand is a NaN: take it over completely.
      assign(rhs);
      sign = false;
    }
    sign ^= rhs.sign; // restore the original sign
    if (isSignaling()) {
      makeQuiet();
      return opInvalidOp;
    }
    if (rhs.isSignaling())
      return opInvalidOp;
    return opOK;
  }

  switch (PackCategoriesIntoKey(category, rhs.category)) {
  case PackCategoriesIntoKey(fcNormal, fcNormal):
    // Nothing special; the caller performs the real division.
    return opOK;

  case PackCategoriesIntoKey(fcZero, fcZero):
  case PackCategoriesIntoKey(fcInfinity, fcInfinity):
    makeNaN();
    return opInvalidOp;

  case PackCategoriesIntoKey(fcNormal, fcZero):
    // Formats with only NaNs as non-finite values get a NaN instead of an
    // infinity.
    if (semantics->nonFiniteBehavior == fltNonfiniteBehavior::NanOnly)
      makeNaN(false, sign);
    else
      category = fcInfinity;
    return opDivByZero;

  case PackCategoriesIntoKey(fcNormal, fcInfinity):
    category = fcZero;
    return opOK;

  case PackCategoriesIntoKey(fcZero, fcNormal):
  case PackCategoriesIntoKey(fcZero, fcInfinity):
  case PackCategoriesIntoKey(fcInfinity, fcNormal):
  case PackCategoriesIntoKey(fcInfinity, fcZero):
    // The left-hand value already is the result.
    return opOK;

  default:
    llvm_unreachable(nullptr);
  }
}


/// Resolve every mod() operand pair whose result is decided by the
/// categories alone. A (normal, normal) pair is left untouched and reports
/// opOK.
///
/// \returns opInvalidOp for signaling NaNs, for an infinite left-hand side
/// and for a zero right-hand side; opOK otherwise.
APFloat::opStatus IEEEFloat::modSpecials(const IEEEFloat &rhs) {
  const bool lhsIsNaN = category == fcNaN;
  const bool rhsIsNaN = rhs.category == fcNaN;

  if (lhsIsNaN || rhsIsNaN) {
    // When only the right-hand operand is a NaN it becomes the result.
    if (!lhsIsNaN)
      assign(rhs);
    if (isSignaling()) {
      makeQuiet();
      return opInvalidOp;
    }
    if (rhs.isSignaling())
      return opInvalidOp;
    return opOK;
  }

  switch (PackCategoriesIntoKey(category, rhs.category)) {
  case PackCategoriesIntoKey(fcNormal, fcNormal):
    return opOK;

  case PackCategoriesIntoKey(fcZero, fcZero):
  case PackCategoriesIntoKey(fcNormal, fcZero):
  case PackCategoriesIntoKey(fcInfinity, fcZero):
  case PackCategoriesIntoKey(fcInfinity, fcNormal):
  case PackCategoriesIntoKey(fcInfinity, fcInfinity):
    makeNaN();
    return opInvalidOp;

  case PackCategoriesIntoKey(fcZero, fcNormal):
  case PackCategoriesIntoKey(fcZero, fcInfinity):
  case PackCategoriesIntoKey(fcNormal, fcInfinity):
    // The left-hand value already is the result.
    return opOK;

  default:
    llvm_unreachable(nullptr);
  }
}


/// Resolve every remainder() operand pair whose result is decided by the
/// categories alone.
///
/// \returns opInvalidOp for signaling NaNs, for an infinite left-hand side
/// and for a zero right-hand side; opOK for the remaining special pairs; and
/// opDivByZero as a marker meaning "both operands are normal, nothing was
/// done".
APFloat::opStatus IEEEFloat::remainderSpecials(const IEEEFloat &rhs) {
  const bool lhsIsNaN = category == fcNaN;
  const bool rhsIsNaN = rhs.category == fcNaN;

  if (lhsIsNaN || rhsIsNaN) {
    // When only the right-hand operand is a NaN it becomes the result.
    if (!lhsIsNaN)
      assign(rhs);
    if (isSignaling()) {
      makeQuiet();
      return opInvalidOp;
    }
    if (rhs.isSignaling())
      return opInvalidOp;
    return opOK;
  }

  switch (PackCategoriesIntoKey(category, rhs.category)) {
  case PackCategoriesIntoKey(fcNormal, fcNormal):
    return opDivByZero; // fake status, indicating this is not a special case

  case PackCategoriesIntoKey(fcZero, fcZero):
  case PackCategoriesIntoKey(fcNormal, fcZero):
  case PackCategoriesIntoKey(fcInfinity, fcZero):
  case PackCategoriesIntoKey(fcInfinity, fcNormal):
  case PackCategoriesIntoKey(fcInfinity, fcInfinity):
    makeNaN();
    return opInvalidOp;

  case PackCategoriesIntoKey(fcZero, fcNormal):
  case PackCategoriesIntoKey(fcZero, fcInfinity):
  case PackCategoriesIntoKey(fcNormal, fcInfinity):
    // The left-hand value already is the result.
    return opOK;

  default:
    llvm_unreachable(nullptr);
  }
}


/* Change sign.  */


/// Flip the sign bit, except for zeros and NaNs in formats that encode NaN
/// as negative zero: there the sign of those values cannot change.
void IEEEFloat::changeSign() {
  const bool signIsFixed =
      semantics->nanEncoding == fltNanEncoding::NegativeZero &&
      (isZero() || isNaN());
  if (!signIsFixed)
    sign = !sign;
}


/* Normalized addition or subtraction.  */

/// Add rhs to, or subtract rhs from, this value and normalize the result.
///
/// \param rhs           the other operand.
/// \param rounding_mode rounding applied when normalizing.
/// \param subtract      true to compute this - rhs, false for this + rhs.
/// \returns the status of the operation.
APFloat::opStatus IEEEFloat::addOrSubtract(const IEEEFloat &rhs,
                                           roundingMode rounding_mode,
                                           bool subtract) {
  opStatus status = addOrSubtractSpecials(rhs, subtract);

  /* opDivByZero is the marker for "not a simple case".  */
  if (status == opDivByZero) {
    const lostFraction discarded = addOrSubtractSignificand(rhs, subtract);
    status = normalize(rounding_mode, discarded);

    /* Can only be zero if we lost no fraction.  */
    assert(category != fcZero || discarded == lfExactlyZero);
  }

  if (category != fcZero)
    return status;

  /* If two numbers add (exactly) to zero, IEEE 754 decrees it is a
     positive zero unless rounding to minus infinity, except that
     adding two like-signed zeroes gives that zero.  */
  if (rhs.category != fcZero || (sign == rhs.sign) == subtract)
    sign = (rounding_mode == rmTowardNegative);

  // NaN-in-negative-zero means zeros need to be normalized to +0.
  if (semantics->nanEncoding == fltNanEncoding::NegativeZero)
    sign = false;

  return status;
}


/* Normalized addition.  */


/// Compute this + rhs in place, rounding with rounding_mode.
APFloat::opStatus IEEEFloat::add(const IEEEFloat &rhs,
                                 roundingMode rounding_mode) {
  const bool isSubtraction = false;
  return addOrSubtract(rhs, rounding_mode, isSubtraction);
}


/* Normalized subtraction.  */


/// Compute this - rhs in place, rounding with rounding_mode.
APFloat::opStatus IEEEFloat::subtract(const IEEEFloat &rhs,
                                      roundingMode rounding_mode) {
  const bool isSubtraction = true;
  return addOrSubtract(rhs, rounding_mode, isSubtraction);
}


/* Normalized multiply.  */


/// Compute this * rhs in place, rounding with rounding_mode.
///
/// \returns the status of the operation; opInexact is added whenever the
/// significand multiplication discarded a non-zero fraction.
APFloat::opStatus IEEEFloat::multiply(const IEEEFloat &rhs,
                                      roundingMode rounding_mode) {
  // The sign of a product is the XOR of the operand signs.
  sign ^= rhs.sign;
  opStatus status = multiplySpecials(rhs);

  // Formats that encode NaN as negative zero only have a positive zero.
  if (isZero() && semantics->nanEncoding == fltNanEncoding::NegativeZero)
    sign = false;

  if (!isFiniteNonZero())
    return status;

  const lostFraction discarded = multiplySignificand(rhs);
  status = normalize(rounding_mode, discarded);
  if (discarded != lfExactlyZero)
    status = static_cast<opStatus>(status | opInexact);

  return status;
}


/* Normalized divide.  */


/// Compute this / rhs in place, rounding with rounding_mode.
///
/// \returns the status of the operation; opInexact is added whenever the
/// significand division discarded a non-zero fraction.
APFloat::opStatus IEEEFloat::divide(const IEEEFloat &rhs,
                                    roundingMode rounding_mode) {
  // The sign of a quotient is the XOR of the operand signs.
  sign ^= rhs.sign;
  opStatus status = divideSpecials(rhs);

  // Formats that encode NaN as negative zero only have a positive zero.
  if (isZero() && semantics->nanEncoding == fltNanEncoding::NegativeZero)
    sign = false;

  if (!isFiniteNonZero())
    return status;

  const lostFraction discarded = divideSignificand(rhs);
  status = normalize(rounding_mode, discarded);
  if (discarded != lfExactlyZero)
    status = static_cast<opStatus>(status | opInexact);

  return status;
}


/* Normalized remainder.  */


// Computes the remainder of *this with respect to rhs in place. Special

// category combinations are resolved by remainderSpecials(); opDivByZero from

// that helper is the marker for the (normal, normal) case handled below.

APFloat::opStatus IEEEFloat::remainder(const IEEEFloat &rhs) {

  opStatus fs;

  unsigned int origSign = sign;


  // First handle the special cases.

  fs = remainderSpecials(rhs);

  if (fs != opDivByZero)

    return fs;


  fs = opOK;


  // Make sure the current value is less than twice the denom. If the addition

  // did not succeed (an overflow has happened), this means that the finite

  // value we currently possess must be less than twice the denom (as we are

  // using the same semantics).

  IEEEFloat P2 = rhs;

  if (P2.add(rhs, rmNearestTiesToEven) == opOK) {

    fs = mod(P2);

    assert(fs == opOK);

  }


  // Let's work with absolute numbers.

  IEEEFloat P = rhs;

  P.sign = false;

  sign = false;


  //

  // To calculate the remainder we use the following scheme.

  //

  // The remainder is defined as follows:

  //

  // remainder = numer - rquot * denom = x - r * p

  //

  // Where r is the result of: x/p, rounded toward the nearest integral value

  // (with halfway cases rounded toward the even number).

  //

  // Currently, (after x mod 2p):

  // r is the number of 2p's present inside x, which is inherently, an even

  // number of p's.

  //

  // We may split the remaining calculation into 4 options:

  // - if x < 0.5p then we round to the nearest number which is 0, and are done.

  // - if x == 0.5p then we round to the nearest even number which is 0, and we

  //   are done as well.

  // - if 0.5p < x < p then we round to nearest number which is 1, and we have

  //   to subtract 1p at least once.

  // - if x >= p then we must subtract p at least once, as x must be a

  //   remainder.

  //

  // By now, we were done, or we added 1 to r, which is in turn now an odd

  // number.

  //

  // We can now split the remaining calculation to the following 3 options:

  // - if x < 0.5p then we round to the nearest number which is 0, and are done.

  // - if x == 0.5p then we round to the nearest even number. As r is odd, we

  //   must round up to the next even number. so we must subtract p once more.

  // - if x > 0.5p (and inherently x < p) then we must round r up to the next

  //   integral, and subtract p once more.

  //


  // Extend the semantics to prevent an overflow/underflow or inexact result.

  bool losesInfo;

  fltSemantics extendedSemantics = *semantics;

  extendedSemantics.maxExponent++;

  extendedSemantics.minExponent--;

  extendedSemantics.precision += 2;


  IEEEFloat VEx = *this;

  fs = VEx.convert(extendedSemantics, rmNearestTiesToEven, &losesInfo);

  assert(fs == opOK && !losesInfo);

  IEEEFloat PEx = P;

  fs = PEx.convert(extendedSemantics, rmNearestTiesToEven, &losesInfo);

  assert(fs == opOK && !losesInfo);


  // It is simpler to work with 2x instead of 0.5p, and we do not need to lose

  // any fraction.

  fs = VEx.add(VEx, rmNearestTiesToEven);

  assert(fs == opOK);


  // VEx holds 2x here, so this tests x > 0.5p.

  if (VEx.compare(PEx) == cmpGreaterThan) {

    fs = subtract(P, rmNearestTiesToEven);

    assert(fs == opOK);


    // Make VEx = this.add(this), but because we have different semantics, we do

    // not want to `convert` again, so we just subtract PEx twice (which equals

    // to the desired value).

    fs = VEx.subtract(PEx, rmNearestTiesToEven);

    assert(fs == opOK);

    fs = VEx.subtract(PEx, rmNearestTiesToEven);

    assert(fs == opOK);


    // Second step of the scheme above: subtract p once more when x >= 0.5p.

    cmpResult result = VEx.compare(PEx);

    if (result == cmpGreaterThan || result == cmpEqual) {

      fs = subtract(P, rmNearestTiesToEven);

      assert(fs == opOK);

    }

  }


  if (isZero()) {

    sign = origSign;    // IEEE754 requires this

    if (semantics->nanEncoding == fltNanEncoding::NegativeZero)

      // But some 8-bit floats only have positive 0.

      sign = false;

  }


  else

    // The work above was done on absolute values; fold the original sign back

    // into the result.

    sign ^= origSign;

  return fs;

}


/* Normalized llvm frem (C fmod). */


/// Compute the C fmod-style remainder of this by rhs in place (the result
/// keeps the sign of the dividend).
///
/// Special category combinations are settled by modSpecials(); otherwise a
/// scaled copy of rhs is subtracted repeatedly until the magnitude of this
/// value drops below that of rhs.
APFloat::opStatus IEEEFloat::mod(const IEEEFloat &rhs) {
  opStatus status = modSpecials(rhs);
  const unsigned int savedSign = sign;

  for (;;) {
    if (!isFiniteNonZero() || !rhs.isFiniteNonZero())
      break;
    if (compareAbsoluteValue(rhs) == cmpLessThan)
      break;

    const int exponentGap = ilogb(*this) - ilogb(rhs);
    IEEEFloat scaledDivisor = scalbn(rhs, exponentGap, rmNearestTiesToEven);
    // The scaled divisor can overflow to NaN with
    // fltNonfiniteBehavior::NanOnly, so explicitly check for it. It may also
    // exceed the current magnitude; in both cases scale one step less.
    if (scaledDivisor.isNaN() ||
        compareAbsoluteValue(scaledDivisor) == cmpLessThan)
      scaledDivisor = scalbn(rhs, exponentGap - 1, rmNearestTiesToEven);
    scaledDivisor.sign = sign;

    status = subtract(scaledDivisor, rmNearestTiesToEven);

    // When the semantics supports zero, leaving the loop is handled by the
    // 'isFiniteNonZero' category check at the top. However, when the
    // semantics does not have 'fcZero' and we have reached the minimum
    // possible value (and any further subtract will underflow to the same
    // value), explicitly provide an exit path here.
    if (!semantics->hasZero && this->isSmallest())
      break;

    assert(status == opOK);
  }

  if (isZero()) {
    // fmod requires a zero result to carry the sign of the dividend, unless
    // the format only has a positive zero.
    if (semantics->nanEncoding == fltNanEncoding::NegativeZero)
      sign = false;
    else
      sign = savedSign;
  }
  return status;
}


/* Normalized fused-multiply-add.  */


/// Compute this * multiplicand + addend in place, rounding with
/// rounding_mode.
///
/// \returns the status of the operation.
APFloat::opStatus IEEEFloat::fusedMultiplyAdd(const IEEEFloat &multiplicand,
                                              const IEEEFloat &addend,
                                              roundingMode rounding_mode) {
  /* Post-multiplication sign, before addition.  */
  sign ^= multiplicand.sign;

  /* If and only if all arguments are normal do we need to do an
     extended-precision calculation.  */
  const bool needsExtendedPrecision = isFiniteNonZero() &&
                                      multiplicand.isFiniteNonZero() &&
                                      addend.isFinite();

  if (!needsExtendedPrecision) {
    opStatus status = multiplySpecials(multiplicand);

    /* The status can only be opOK or opInvalidOp.  There is no more work
       to do in the latter case.  The IEEE-754R standard says it is
       implementation-defined in this case whether, if ADDEND is a
       quiet NaN, we raise invalid op; this implementation does so.

       If we need to do the addition we can do so with normal
       precision.  */
    if (status == opOK)
      status = addOrSubtract(addend, rounding_mode, false);
    return status;
  }

  const lostFraction discarded = multiplySignificand(multiplicand, addend);
  opStatus status = normalize(rounding_mode, discarded);
  if (discarded != lfExactlyZero)
    status = static_cast<opStatus>(status | opInexact);

  /* If two numbers add (exactly) to zero, IEEE 754 decrees it is a
     positive zero unless rounding to minus infinity, except that
     adding two like-signed zeroes gives that zero.  */
  if (category == fcZero && !(status & opUnderflow) && sign != addend.sign) {
    sign = (rounding_mode == rmTowardNegative);
    if (semantics->nanEncoding == fltNanEncoding::NegativeZero)
      sign = false;
  }

  return status;
}


/* Rounding-mode correct round to integral value.  */


/// Round this value in place to an integral value according to
/// rounding_mode.
///
/// \returns opInvalidOp for a signaling NaN (which is quieted), otherwise
/// the status of the rounding addition (opOK when nothing had to be
/// rounded).
APFloat::opStatus IEEEFloat::roundToIntegral(roundingMode rounding_mode) {
  // [IEEE Std 754-2008 6.1]: operations on infinite operands are usually
  // exact and therefore signal no exceptions.
  // [IEEE Std 754-2008 6.3]: the sign of the result of the roundToIntegral
  // operations is the sign of the first or only operand, so a zero is
  // returned unchanged.
  if (isInfinity() || isZero())
    return opOK;

  if (isNaN()) {
    // [IEEE Std 754-2008 6.2]: for an operation with quiet NaN inputs the
    // result shall be a quiet NaN which should be one of the input NaNs, and
    // no exception is signaled.
    if (!isSignaling())
      return opOK;

    // [IEEE Std 754-2008 6.2]: a signaling NaN signals the invalid operation
    // exception, and under default exception handling the delivered result
    // shall be a quiet NaN.
    makeQuiet();
    return opInvalidOp;
  }

  const unsigned precision = APFloat::semanticsPrecision(*semantics);

  // If the exponent is large enough, we know that this value is already
  // integral, and the arithmetic below would potentially cause it to saturate
  // to +/-Inf.  Bail out early instead.
  if (exponent + 1 >= static_cast<int>(precision))
    return opOK;

  // The algorithm here is quite simple: we add 2^(p-1), where p is the
  // precision of our format, and then subtract it back off again.  The choice
  // of rounding modes for the addition/subtraction determines the rounding mode
  // for our integral rounding as well.
  // NOTE: When the input value is negative, we do subtraction followed by
  // addition instead.
  APInt IntegerConstant(NextPowerOf2(precision), 1);
  IntegerConstant <<= precision - 1;
  IEEEFloat MagicConstant(*semantics);
  opStatus status = MagicConstant.convertFromAPInt(IntegerConstant, false,
                                                   rmNearestTiesToEven);
  assert(status == opOK);
  MagicConstant.sign = sign;

  // Remember the input sign so that a zero result can be given the correct
  // sign afterwards.
  const bool wasNegative = isNegative();

  status = add(MagicConstant, rounding_mode);

  // Current value and 'MagicConstant' are both integers, so the result of the
  // subtraction is always exact according to Sterbenz' lemma.
  subtract(MagicConstant, rounding_mode);

  // Restore the input sign.
  if (wasNegative != isNegative())
    changeSign();

  return status;
}


/* Comparison requires normalized numbers.  */


/// Compare this value with rhs; both must share the same semantics.
///
/// \returns cmpUnordered if either operand is a NaN, otherwise
/// cmpLessThan, cmpEqual or cmpGreaterThan. Zeros compare equal regardless
/// of sign.
APFloat::cmpResult IEEEFloat::compare(const IEEEFloat &rhs) const {
  assert(semantics == rhs.semantics);

  switch (PackCategoriesIntoKey(category, rhs.category)) {
  default:
    llvm_unreachable(nullptr);

  case PackCategoriesIntoKey(fcNaN, fcZero):
  case PackCategoriesIntoKey(fcNaN, fcNormal):
  case PackCategoriesIntoKey(fcNaN, fcInfinity):
  case PackCategoriesIntoKey(fcNaN, fcNaN):
  case PackCategoriesIntoKey(fcZero, fcNaN):
  case PackCategoriesIntoKey(fcNormal, fcNaN):
  case PackCategoriesIntoKey(fcInfinity, fcNaN):
    return cmpUnordered;

  // The left-hand side has the strictly larger magnitude, so its sign alone
  // decides the ordering.
  case PackCategoriesIntoKey(fcInfinity, fcNormal):
  case PackCategoriesIntoKey(fcInfinity, fcZero):
  case PackCategoriesIntoKey(fcNormal, fcZero):
    return sign ? cmpLessThan : cmpGreaterThan;

  // The right-hand side has the strictly larger magnitude, so its sign alone
  // decides the ordering.
  case PackCategoriesIntoKey(fcNormal, fcInfinity):
  case PackCategoriesIntoKey(fcZero, fcInfinity):
  case PackCategoriesIntoKey(fcZero, fcNormal):
    return rhs.sign ? cmpGreaterThan : cmpLessThan;

  case PackCategoriesIntoKey(fcInfinity, fcInfinity):
    if (sign == rhs.sign)
      return cmpEqual;
    return sign ? cmpLessThan : cmpGreaterThan;

  case PackCategoriesIntoKey(fcZero, fcZero):
    return cmpEqual;

  case PackCategoriesIntoKey(fcNormal, fcNormal):
    break;
  }

  /* Two normal numbers.  With different signs the negative one is smaller.  */
  if (sign != rhs.sign)
    return sign ? cmpLessThan : cmpGreaterThan;

  /* Same sign: compare absolute values; invert the result if negative.  */
  const cmpResult magnitudeOrder = compareAbsoluteValue(rhs);
  if (!sign)
    return magnitudeOrder;
  if (magnitudeOrder == cmpLessThan)
    return cmpGreaterThan;
  if (magnitudeOrder == cmpGreaterThan)
    return cmpLessThan;
  return magnitudeOrder;
}


/// IEEEFloat::convert - convert a value of one floating point type to another.

/// The return value corresponds to the IEEE754 exceptions.  *losesInfo

/// records whether the transformation lost information, i.e. whether

/// converting the result back to the original type will produce the

/// original value (this is almost the same as return value==opOK, but there

/// are edge cases where this is not so).


APFloat::opStatus IEEEFloat::convert(const fltSemantics &toSemantics,

                                     roundingMode rounding_mode,

                                     bool *losesInfo) {

  lostFraction lostFraction;

  unsigned int newPartCount, oldPartCount;

  opStatus fs;

  int shift;

  const fltSemantics &fromSemantics = *semantics;

  // Sample the signaling state now; it is consulted again after `semantics`

  // has been switched to toSemantics.

  bool is_signaling = isSignaling();


  lostFraction = lfExactlyZero;

  newPartCount = partCountForBits(toSemantics.precision + 1);

  oldPartCount = partCount();

  // Difference in precision: positive when the target is wider (the

  // significand is shifted left below), negative when it is narrower (the

  // significand is shifted right below).

  shift = toSemantics.precision - fromSemantics.precision;


  bool X86SpecialNan = false;

  if (&fromSemantics == &APFloatBase::semX87DoubleExtended &&

      &toSemantics != &APFloatBase::semX87DoubleExtended && category == fcNaN &&

      (!(*significandParts() & 0x8000000000000000ULL) ||

       !(*significandParts() & 0x4000000000000000ULL))) {

    // x86 has some unusual NaNs which cannot be represented in any other

    // format; note them here.

    X86SpecialNan = true;

  }


  // If this is a truncation of a denormal number, and the target semantics

  // has larger exponent range than the source semantics (this can happen

  // when truncating from PowerPC double-double to double format), the

  // right shift could lose result mantissa bits.  Adjust exponent instead

  // of performing excessive shift.

  // Also do a similar trick in case shifting denormal would produce zero

  // significand as this case isn't handled correctly by normalize.

  if (shift < 0 && isFiniteNonZero()) {

    int omsb = significandMSB() + 1;

    int exponentChange = omsb - fromSemantics.precision;

    if (exponent + exponentChange < toSemantics.minExponent)

      exponentChange = toSemantics.minExponent - exponent;

    exponentChange = std::max(exponentChange, shift);

    if (exponentChange < 0) {

      shift -= exponentChange;

      exponent += exponentChange;

    } else if (omsb <= -shift) {

      exponentChange = omsb + shift - 1; // leave at least one bit set

      shift -= exponentChange;

      exponent += exponentChange;

    }

  }


  // If this is a truncation, perform the shift before we narrow the storage.

  if (shift < 0 && (isFiniteNonZero() ||

                    (category == fcNaN && semantics->nonFiniteBehavior !=

                                              fltNonfiniteBehavior::NanOnly)))

    lostFraction = shiftRight(significandParts(), oldPartCount, -shift);


  // Fix the storage so it can hold to new value.

  if (newPartCount > oldPartCount) {

    // The new type requires more storage; make it available.

    integerPart *newParts;

    newParts = new integerPart[newPartCount];

    APInt::tcSet(newParts, 0, newPartCount);

    if (isFiniteNonZero() || category==fcNaN)

      APInt::tcAssign(newParts, significandParts(), oldPartCount);

    freeSignificand();

    significand.parts = newParts;

  } else if (newPartCount == 1 && oldPartCount != 1) {

    // Switch to built-in storage for a single part.

    integerPart newPart = 0;

    if (isFiniteNonZero() || category==fcNaN)

      newPart = significandParts()[0];

    freeSignificand();

    significand.part = newPart;

  }


  // Now that we have the right storage, switch the semantics.

  semantics = &toSemantics;


  // If this is an extension, perform the shift now that the storage is

  // available.

  if (shift > 0 && (isFiniteNonZero() || category==fcNaN))

    APInt::tcShiftLeft(significandParts(), newPartCount, shift);


  if (isFiniteNonZero()) {

    fs = normalize(rounding_mode, lostFraction);

    *losesInfo = (fs != opOK);

  } else if (category == fcNaN) {

    if (semantics->nonFiniteBehavior == fltNonfiniteBehavior::NanOnly) {

      *losesInfo =

          fromSemantics.nonFiniteBehavior != fltNonfiniteBehavior::NanOnly;

      makeNaN(false, sign);

      return is_signaling ? opInvalidOp : opOK;

    }


    // If NaN is negative zero, we need to create a new NaN to avoid converting

    // NaN to -Inf.

    if (fromSemantics.nanEncoding == fltNanEncoding::NegativeZero &&

        semantics->nanEncoding != fltNanEncoding::NegativeZero)

      makeNaN(false, false);


    *losesInfo = lostFraction != lfExactlyZero || X86SpecialNan;


    // For x87 extended precision, we want to make a NaN, not a special NaN if

    // the input wasn't special either.

    if (!X86SpecialNan && semantics == &APFloatBase::semX87DoubleExtended)

      APInt::tcSetBit(significandParts(), semantics->precision - 1);


    // Convert of sNaN creates qNaN and raises an exception (invalid op).

    // This also guarantees that a sNaN does not become Inf on a truncation

    // that loses all payload bits.

    if (is_signaling) {

      makeQuiet();

      fs = opInvalidOp;

    } else {

      fs = opOK;

    }

  } else if (category == fcInfinity &&

             semantics->nonFiniteBehavior == fltNonfiniteBehavior::NanOnly) {

    // The target format has no infinity, so the value becomes a NaN and the

    // conversion is reported as lossy.

    makeNaN(false, sign);

    *losesInfo = true;

    fs = opInexact;

  } else if (category == fcZero &&

             semantics->nanEncoding == fltNanEncoding::NegativeZero) {

    // Negative zero loses info, but positive zero doesn't.

    *losesInfo =

        fromSemantics.nanEncoding != fltNanEncoding::NegativeZero && sign;

    fs = *losesInfo ? opInexact : opOK;

    // NaN is negative zero means -0 -> +0, which can lose information

    sign = false;

  } else {

    *losesInfo = false;

    fs = opOK;

  }


  // A zero in a target format without a zero encoding is replaced through

  // makeSmallestNormalized(false).

  if (category == fcZero && !semantics->hasZero)

    makeSmallestNormalized(false);

  return fs;

}


/* Convert a floating point number to an integer according to the

   rounding mode.  If the rounded integer value is out of range this

   returns an invalid operation exception and the contents of the

   destination parts are unspecified.  If the rounded value is in

   range but the floating point number is not the exact integer, the C

   standard doesn't require an inexact exception to be raised.  IEEE

   854 does require it so we do that.


   Note that for conversions to integer type the C standard requires

   round-to-zero to always be used.  */

APFloat::opStatus IEEEFloat::convertToSignExtendedInteger(

    MutableArrayRef<integerPart> parts, unsigned int width, bool isSigned,

    roundingMode rounding_mode, bool *isExact) const {

  lostFraction lost_fraction;

  const integerPart *src;

  unsigned int dstPartsCount, truncatedBits;


  // Pessimistic default; only the zero case and the exact exit at the end of

  // the function set this to true.

  *isExact = false;


  /* Handle the three special cases first.  */

  if (category == fcInfinity || category == fcNaN)

    return opInvalidOp;


  dstPartsCount = partCountForBits(width);

  assert(dstPartsCount <= parts.size() && "Integer too big");


  if (category == fcZero) {

    APInt::tcSet(parts.data(), 0, dstPartsCount);

    // Negative zero can't be represented as an int.

    *isExact = !sign;

    return opOK;

  }


  src = significandParts();


  /* Step 1: place our absolute value, with any fraction truncated, in

     the destination.  */

  if (exponent < 0) {

    /* Our absolute value is less than one; truncate everything.  */

    APInt::tcSet(parts.data(), 0, dstPartsCount);

    /* For exponent -1 the integer bit represents .5, look at that.

       For smaller exponents leftmost truncated bit is 0. */

    truncatedBits = semantics->precision -1U - exponent;

  } else {

    /* We want the most significant (exponent + 1) bits; the rest are

       truncated.  */

    unsigned int bits = exponent + 1U;


    /* Hopelessly large in magnitude?  */

    if (bits > width)

      return opInvalidOp;


    if (bits < semantics->precision) {

      /* We truncate (semantics->precision - bits) bits.  */

      truncatedBits = semantics->precision - bits;

      APInt::tcExtract(parts.data(), dstPartsCount, src, bits, truncatedBits);

    } else {

      /* We want at least as many bits as are available.  */

      APInt::tcExtract(parts.data(), dstPartsCount, src, semantics->precision,

                       0);

      APInt::tcShiftLeft(parts.data(), dstPartsCount,

                         bits - semantics->precision);

      truncatedBits = 0;

    }

  }


  /* Step 2: work out any lost fraction, and increment the absolute

     value if we would round away from zero.  */

  if (truncatedBits) {

    lost_fraction = lostFractionThroughTruncation(src, partCount(),

                                                  truncatedBits);

    if (lost_fraction != lfExactlyZero &&

        roundAwayFromZero(rounding_mode, lost_fraction, truncatedBits)) {

      if (APInt::tcIncrement(parts.data(), dstPartsCount))

        return opInvalidOp;     /* Overflow.  */

    }

  } else {

    lost_fraction = lfExactlyZero;

  }


  /* Step 3: check if we fit in the destination.  */

  // omsb is the one-based position of the most significant set bit of the

  // magnitude now stored in parts.

  unsigned int omsb = APInt::tcMSB(parts.data(), dstPartsCount) + 1;


  if (sign) {

    if (!isSigned) {

      /* Negative numbers cannot be represented as unsigned.  */

      if (omsb != 0)

        return opInvalidOp;

    } else {

      /* It takes omsb bits to represent the unsigned integer value.

         We lose a bit for the sign, but care is needed as the

         maximally negative integer is a special case.  */

      if (omsb == width &&

          APInt::tcLSB(parts.data(), dstPartsCount) + 1 != omsb)

        return opInvalidOp;


      /* This case can happen because of rounding.  */

      if (omsb > width)

        return opInvalidOp;

    }


    // The magnitude fits; negate it across all dstPartsCount parts.

    APInt::tcNegate (parts.data(), dstPartsCount);

  } else {

    // A non-negative value may use all width bits of an unsigned destination

    // but only width - 1 bits of a signed one.

    if (omsb >= width + !isSigned)

      return opInvalidOp;

  }


  if (lost_fraction == lfExactlyZero) {

    *isExact = true;

    return opOK;

  }

  return opInexact;

}


/* Same as convertToSignExtendedInteger, except we provide

   deterministic values in case of an invalid operation exception,

   namely zero for NaNs and the minimal or maximal value respectively

   for underflow or overflow.

   The *isExact output tells whether the result is exact, in the sense

   that converting it back to the original floating point type produces

   the original value.  This is almost equivalent to result==opOK,

   except for negative zeroes.

*/

APFloat::opStatus
IEEEFloat::convertToInteger(MutableArrayRef<integerPart> parts,
                            unsigned int width, bool isSigned,
                            roundingMode rounding_mode, bool *isExact) const {
  const opStatus status = convertToSignExtendedInteger(
      parts, width, isSigned, rounding_mode, isExact);

  // Any outcome other than an invalid operation already left a well-defined
  // value in parts.
  if (status != opInvalidOp)
    return status;

  const unsigned int dstPartsCount = partCountForBits(width);
  assert(dstPartsCount <= parts.size() && "Integer too big");

  // Number of low bits to set: none for a NaN (result zero), the single bit
  // that is then shifted into the sign position for a negative value headed
  // to a signed destination, or every value bit for a positive overflow.
  unsigned int onesCount;
  if (category == fcNaN)
    onesCount = 0;
  else if (sign)
    onesCount = isSigned;
  else
    onesCount = width - isSigned;

  tcSetLeastSignificantBits(parts.data(), dstPartsCount, onesCount);
  if (sign && isSigned)
    APInt::tcShiftLeft(parts.data(), dstPartsCount, width - 1);

  return status;
}


/* Convert an unsigned integer SRC to a floating point number,

   rounding according to ROUNDING_MODE.  The sign of the floating

   point number is not modified.  */

APFloat::opStatus IEEEFloat::convertFromUnsignedParts(
    const integerPart *src, unsigned int srcCount, roundingMode rounding_mode) {
  category = fcNormal;

  // One-based position of the most significant set bit of SRC.
  const unsigned int srcBits = APInt::tcMSB(src, srcCount) + 1;
  integerPart *const dst = significandParts();
  const unsigned int dstCount = partCount();
  const unsigned int precision = semantics->precision;

  /* We want the most significant PRECISION bits of SRC.  There may not
     be that many; extract what we can.  */
  lostFraction lost_fraction = lfExactlyZero;
  if (srcBits < precision) {
    // Everything fits; nothing is truncated.
    exponent = precision - 1;
    APInt::tcExtract(dst, dstCount, src, srcBits, 0);
  } else {
    // Keep the top PRECISION bits and record what the dropped low bits were.
    const unsigned int droppedBits = srcBits - precision;
    exponent = srcBits - 1;
    lost_fraction = lostFractionThroughTruncation(src, srcCount, droppedBits);
    APInt::tcExtract(dst, dstCount, src, precision, droppedBits);
  }

  return normalize(rounding_mode, lost_fraction);
}


/* Set this number from the integer VAL, rounding according to
   ROUNDING_MODE.  When ISSIGNED is true and VAL is negative, the sign is
   set and the magnitude (-VAL) is converted; otherwise VAL is converted
   as an unsigned quantity and the sign is cleared.  */
APFloat::opStatus IEEEFloat::convertFromAPInt(const APInt &Val, bool isSigned,
                                              roundingMode rounding_mode) {
  const bool negative = isSigned && Val.isNegative();
  const APInt magnitude = negative ? -Val : Val;

  sign = negative;

  /* Negation keeps the bit width, so VAL's word count still describes
     the magnitude's storage.  */
  return convertFromUnsignedParts(magnitude.getRawData(), Val.getNumWords(),
                                  rounding_mode);
}


/* Parse the hexadecimal significand and binary exponent in S into this
   number, rounding according to ROUNDING_MODE.  convertFromString calls
   this with the text that follows any sign and the "0x"/"0X" prefix.

   Returns an Error when the text is malformed (multiple dots, missing
   exponent, no significand digits, an unexpected character, or a failure
   reported by one of the helper parsers); otherwise returns the status
   produced by normalize().  */
Expected<APFloat::opStatus>
IEEEFloat::convertFromHexadecimalString(StringRef s,
                                        roundingMode rounding_mode) {
  lostFraction lost_fraction = lfExactlyZero;

  category = fcNormal;
  zeroSignificand();
  exponent = 0;

  integerPart *significand = significandParts();
  unsigned partsCount = partCount();
  // Digits are stored from the top of the significand downwards; bitPos is
  // the bit offset just above the next nibble to be written and reaches zero
  // once the significand is full.
  unsigned bitPos = partsCount * integerPartWidth;
  bool computedTrailingFraction = false;

  // Skip leading zeroes and any (hexa)decimal point.
  StringRef::iterator begin = s.begin();
  StringRef::iterator end = s.end();
  StringRef::iterator dot;
  auto PtrOrErr = skipLeadingZeroesAndAnyDot(begin, end, &dot);
  if (!PtrOrErr)
    return PtrOrErr.takeError();
  StringRef::iterator p = *PtrOrErr;
  StringRef::iterator firstSignificantDigit = p;

  while (p != end) {
    integerPart hex_value;

    if (*p == '.') {
      // dot == end is used as the "no dot seen yet" marker.
      if (dot != end)
        return createError("String contains multiple dots");
      dot = p++;
      continue;
    }

    hex_value = hexDigitValue(*p);
    // Stop at the first character that is not a hexadecimal digit; it is
    // validated as the exponent marker after the loop.
    if (hex_value == UINT_MAX)
      break;

    p++;

    // Store the number while we have space.
    if (bitPos) {
      bitPos -= 4;
      hex_value <<= bitPos % integerPartWidth;
      significand[bitPos / integerPartWidth] |= hex_value;
    } else if (!computedTrailingFraction) {
      // The significand is full: classify the remaining digits once as the
      // lost fraction.  Later digits are still consumed by the loop but are
      // otherwise ignored.
      auto FractOrErr = trailingHexadecimalFraction(p, end, hex_value);
      if (!FractOrErr)
        return FractOrErr.takeError();
      lost_fraction = *FractOrErr;
      computedTrailingFraction = true;
    }
  }

  /* Hex floats require an exponent but not a hexadecimal point.  */
  if (p == end)
    return createError("Hex strings require an exponent");
  if (*p != 'p' && *p != 'P')
    return createError("Invalid character in significand");
  if (p == begin)
    return createError("Significand has no digits");
  // A lone "." in front of the exponent is not a significand either.
  if (dot != end && p - begin == 1)
    return createError("Significand has no digits");

  /* Ignore the exponent if we are zero.  */
  if (p != firstSignificantDigit) {
    int expAdjustment;

    /* Implicit hexadecimal point?  */
    if (dot == end)
      dot = p;

    /* Calculate the exponent adjustment implicit in the number of
       significant digits.  */
    expAdjustment = static_cast<int>(dot - firstSignificantDigit);
    // When the dot precedes the first significant digit the distance also
    // counts the dot character itself; compensate for it.
    if (expAdjustment < 0)
      expAdjustment++;
    expAdjustment = expAdjustment * 4 - 1;

    /* Adjust for writing the significand starting at the most
       significant nibble.  */
    expAdjustment += semantics->precision;
    expAdjustment -= partsCount * integerPartWidth;

    /* Adjust for the given exponent.  */
    auto ExpOrErr = totalExponent(p + 1, end, expAdjustment);
    if (!ExpOrErr)
      return ExpOrErr.takeError();
    exponent = *ExpOrErr;
  }

  return normalize(rounding_mode, lost_fraction);
}


/* Set this number to the value DECSIGPARTS * 10^EXP, where DECSIGPARTS is
   an unsigned integer of SIGPARTCOUNT parts, rounded according to
   ROUNDING_MODE.

   The product (or quotient, for negative EXP) with 5^|EXP| is computed in
   a temporary, wider format.  If the accumulated error bound (HUerr, in
   half-ulps) could change the rounding decision, the working width is
   doubled and the computation is repeated.  Returns the status produced
   by normalize().  */
APFloat::opStatus
IEEEFloat::roundSignificandWithExponent(const integerPart *decSigParts,
                                        unsigned sigPartCount, int exp,
                                        roundingMode rounding_mode) {
  unsigned int parts, pow5PartCount;
  // Scratch semantics for the intermediate computation; its precision is
  // overwritten on every loop iteration below.
  fltSemantics calcSemantics = { 32767, -32767, 0, 0 };
  integerPart pow5Parts[maxPowerOfFiveParts];
  bool isNearest;

  isNearest = (rounding_mode == rmNearestTiesToEven ||
               rounding_mode == rmNearestTiesToAway);

  // Initial working width: the target precision plus some headroom.
  parts = partCountForBits(semantics->precision + 11);

  /* Calculate pow(5, abs(exp)).  */
  pow5PartCount = powerOf5(pow5Parts, exp >= 0 ? exp: -exp);

  // Retry with twice the working width until the result is known to round
  // correctly; the only exit is the return inside the loop.
  for (;; parts *= 2) {
    opStatus sigStatus, powStatus;
    unsigned int excessPrecision, truncatedBits;

    calcSemantics.precision = parts * integerPartWidth - 1;
    excessPrecision = calcSemantics.precision - semantics->precision;
    truncatedBits = excessPrecision;

    IEEEFloat decSig(calcSemantics, uninitialized);
    decSig.makeZero(sign);
    IEEEFloat pow5(calcSemantics);

    sigStatus = decSig.convertFromUnsignedParts(decSigParts, sigPartCount,
                                                rmNearestTiesToEven);
    powStatus = pow5.convertFromUnsignedParts(pow5Parts, pow5PartCount,
                                              rmNearestTiesToEven);
    /* Add exp, as 10^n = 5^n * 2^n.  */
    decSig.exponent += exp;

    lostFraction calcLostFraction;
    integerPart HUerr, HUdistance;
    unsigned int powHUerr;

    if (exp >= 0) {
      /* multiplySignificand leaves the precision-th bit set to 1.  */
      calcLostFraction = decSig.multiplySignificand(pow5);
      powHUerr = powStatus != opOK;
    } else {
      calcLostFraction = decSig.divideSignificand(pow5);
      /* Denormal numbers have less precision.  */
      if (decSig.exponent < semantics->minExponent) {
        excessPrecision += (semantics->minExponent - decSig.exponent);
        // truncatedBits keeps the unclamped count for the lost-fraction
        // computation; excessPrecision is clamped to the working width.
        truncatedBits = excessPrecision;
        excessPrecision = std::min(excessPrecision, calcSemantics.precision);
      }
      /* Extra half-ulp lost in reciprocal of exponent.  */
      powHUerr = (powStatus == opOK && calcLostFraction == lfExactlyZero) ? 0:2;
    }

    /* Both multiplySignificand and divideSignificand return the
       result with the integer bit set.  */
    assert(APInt::tcExtractBit
           (decSig.significandParts(), calcSemantics.precision - 1) == 1);

    HUerr = HUerrBound(calcLostFraction != lfExactlyZero, sigStatus != opOK,
                       powHUerr);
    HUdistance = 2 * ulpsFromBoundary(decSig.significandParts(),
                                      excessPrecision, isNearest);

    /* Are we guaranteed to round correctly if we truncate?  */
    if (HUdistance >= HUerr) {
      APInt::tcExtract(significandParts(), partCount(), decSig.significandParts(),
                       calcSemantics.precision - excessPrecision,
                       excessPrecision);
      /* Take the exponent of decSig.  If we tcExtract-ed less bits
         above we must adjust our exponent to compensate for the
         implicit right shift.  */
      exponent = (decSig.exponent + semantics->precision
                  - (calcSemantics.precision - excessPrecision));
      calcLostFraction = lostFractionThroughTruncation(decSig.significandParts(),
                                                       decSig.partCount(),
                                                       truncatedBits);
      return normalize(rounding_mode, calcLostFraction);
    }
  }
}


/* Parse the decimal floating point text STR into this number, rounding
   according to ROUNDING_MODE.  convertFromString calls this with any
   leading sign already removed.

   Zero inputs and exponents that obviously overflow or underflow are
   handled without building the significand.  Otherwise the significant
   digits are accumulated into a temporary bignum that is handed to
   roundSignificandWithExponent.  Returns an Error if interpretDecimal
   fails or a non-digit is found in the significand.  */
Expected<APFloat::opStatus>
IEEEFloat::convertFromDecimalString(StringRef str, roundingMode rounding_mode) {
  decimalInfo D;
  opStatus fs;

  /* Scan the text.  */
  StringRef::iterator p = str.begin();
  if (Error Err = interpretDecimal(p, str.end(), &D))
    return std::move(Err);

  /* Handle the quick cases.  First the case of no significant digits,
     i.e. zero, and then exponents that are obviously too large or too
     small.  Writing L for log 10 / log 2, a number d.ddddd*10^exp
     definitely overflows if

           (exp - 1) * L >= maxExponent

     and definitely underflows to zero where

           (exp + 1) * L <= minExponent - precision

     With integer arithmetic the tightest bounds for L are

           93/28 < L < 196/59            [ numerator <= 256 ]
           42039/12655 < L < 28738/8651  [ numerator <= 65536 ]
  */

  // Test if we have a zero number allowing for strings with no null terminators
  // and zero decimals with non-zero exponents.
  //
  // We computed firstSigDigit by ignoring all zeros and dots. Thus if
  // D.firstSigDigit equals str.end(), every digit must be a zero and there can
  // be at most one dot. On the other hand, if we have a zero with a non-zero
  // exponent, then we know that D.firstSigDigit will be non-numeric.
  if (D.firstSigDigit == str.end() || decDigitValue(*D.firstSigDigit) >= 10U) {
    category = fcZero;
    fs = opOK;
    // Formats that use the negative-zero encoding for NaN get a positive zero.
    if (semantics->nanEncoding == fltNanEncoding::NegativeZero)
      sign = false;
    // Formats without a zero get the smallest normalized value instead.
    if (!semantics->hasZero)
      makeSmallestNormalized(false);

    /* Check whether the normalized exponent is high enough to overflow
       max during the log-rebasing in the max-exponent check below. */
  } else if (D.normalizedExponent - 1 > INT_MAX / 42039) {
    fs = handleOverflow(rounding_mode);

  /* If it wasn't, then it also wasn't high enough to overflow max
     during the log-rebasing in the min-exponent check.  Check that it
     won't overflow min in either check, then perform the min-exponent
     check. */
  } else if (D.normalizedExponent - 1 < INT_MIN / 42039 ||
             (D.normalizedExponent + 1) * 28738 <=
               8651 * (semantics->minExponent - (int) semantics->precision)) {
    /* Underflow to zero and round.  */
    category = fcNormal;
    zeroSignificand();
    fs = normalize(rounding_mode, lfLessThanHalf);

  /* We can finally safely perform the max-exponent check. */
  } else if ((D.normalizedExponent - 1) * 42039
             >= 12655 * semantics->maxExponent) {
    /* Overflow and round.  */
    fs = handleOverflow(rounding_mode);
  } else {
    integerPart *decSignificand;
    unsigned int partCount;

    /* A tight upper bound on number of bits required to hold an
       N-digit decimal integer is N * 196 / 59.  Allocate enough space
       to hold the full significand, and an extra part required by
       tcMultiplyPart.  */
    partCount = static_cast<unsigned int>(D.lastSigDigit - D.firstSigDigit) + 1;
    partCount = partCountForBits(1 + 196 * partCount / 59);
    // Manually owned buffer: every exit path below must delete[] it.
    decSignificand = new integerPart[partCount + 1];
    // From here on partCount is the number of parts of decSignificand that
    // are currently in use.
    partCount = 0;

    /* Convert to binary efficiently - we do almost all multiplication
       in an integerPart.  When this would overflow do we do a single
       bignum multiplication, and then revert again to multiplication
       in an integerPart.  */
    do {
      integerPart decValue, val, multiplier;

      val = 0;
      multiplier = 1;

      do {
        if (*p == '.') {
          p++;
          if (p == str.end()) {
            break;
          }
        }
        decValue = decDigitValue(*p++);
        if (decValue >= 10U) {
          delete[] decSignificand;
          return createError("Invalid character in significand");
        }
        multiplier *= 10;
        val = val * 10 + decValue;
        /* The maximum number that can be multiplied by ten with any
           digit added without overflowing an integerPart.  */
      } while (p <= D.lastSigDigit && multiplier <= (~ (integerPart) 0 - 9) / 10);

      /* Multiply out the current part.  */
      APInt::tcMultiplyPart(decSignificand, decSignificand, multiplier, val,
                            partCount, partCount + 1, false);

      /* If we used another part (likely but not guaranteed), increase
         the count.  */
      if (decSignificand[partCount])
        partCount++;
    } while (p <= D.lastSigDigit);

    category = fcNormal;
    fs = roundSignificandWithExponent(decSignificand, partCount,
                                      D.exponent, rounding_mode);

    delete [] decSignificand;
  }

  return fs;
}


/* Try to interpret STR as one of the special values: an infinity
   ("inf", "INFINITY", "+Inf", or "-" followed by "inf"/"INFINITY"/"Inf")
   or a NaN ("nan"/"NaN", optionally preceded by "-" and/or an "s"/"S"
   signaling marker, and optionally followed by a payload).

   A NaN payload may be wrapped in parentheses and is parsed as
   hexadecimal with a "0x"/"0X" prefix, octal with a leading "0", and
   decimal otherwise.

   Returns true and sets this number if STR was recognised; returns false
   otherwise.  */
bool IEEEFloat::convertFromStringSpecials(StringRef str) {
  const size_t MIN_NAME_SIZE = 3;

  if (str.size() < MIN_NAME_SIZE)
    return false;

  if (str == "inf" || str == "INFINITY" || str == "+Inf") {
    makeInf(false);
    return true;
  }

  bool IsNegative = str.consume_front("-");
  if (IsNegative) {
    if (str.size() < MIN_NAME_SIZE)
      return false;

    if (str == "inf" || str == "INFINITY" || str == "Inf") {
      makeInf(true);
      return true;
    }
  }

  // If we have a 's' (or 'S') prefix, then this is a Signaling NaN.
  bool IsSignaling = str.consume_front_insensitive("s");
  if (IsSignaling) {
    if (str.size() < MIN_NAME_SIZE)
      return false;
  }

  if (str.consume_front("nan") || str.consume_front("NaN")) {
    // A NaN without payload.
    if (str.empty()) {
      makeNaN(IsSignaling, IsNegative);
      return true;
    }

    // Allow the payload to be inside parentheses.
    if (str.front() == '(') {
      // Parentheses should be balanced (and not empty).
      if (str.size() <= 2 || str.back() != ')')
        return false;

      str = str.slice(1, str.size() - 1);
    }

    // Determine the payload number's radix.
    unsigned Radix = 10;
    if (str[0] == '0') {
      // Compare against both cases explicitly instead of calling tolower():
      // passing a plain char that may be negative to tolower() is undefined,
      // and its result depends on the current locale.  This also matches the
      // "0x"/"0X" test in convertFromString.
      if (str.size() > 1 && (str[1] == 'x' || str[1] == 'X')) {
        str = str.drop_front(2);
        Radix = 16;
      } else {
        Radix = 8;
      }
    }

    // Parse the payload and make the NaN.
    APInt Payload;
    if (!str.getAsInteger(Radix, Payload)) {
      makeNaN(IsSignaling, IsNegative, &Payload);
      return true;
    }
  }

  return false;
}


/* Parse the text STR into this number, rounding according to
   ROUNDING_MODE.  Special values are tried first via
   convertFromStringSpecials.  Otherwise an optional leading '+' or '-' is
   consumed and the remainder is dispatched to the hexadecimal parser
   (when it starts with "0x"/"0X") or to the decimal parser.  Returns an
   Error for an empty string, a lone sign, or a bare hexadecimal prefix.  */
Expected<APFloat::opStatus>
IEEEFloat::convertFromString(StringRef str, roundingMode rounding_mode) {
  if (str.empty())
    return createError("Invalid string length");

  // Infinities and NaNs are recognised separately.
  if (convertFromStringSpecials(str))
    return opOK;

  /* Record the sign carried by the first character.  */
  const char lead = str.front();
  sign = (lead == '-');
  if (sign && !semantics->hasSignedRepr)
    llvm_unreachable(
        "This floating point format does not support signed values");

  /* Strip an explicit sign; something must remain after it.  */
  StringRef body = str;
  if (lead == '-' || lead == '+') {
    body = str.drop_front();
    if (body.empty())
      return createError("String has no digits");
  }

  const bool hasHexPrefix =
      body.size() >= 2 && body[0] == '0' && (body[1] == 'x' || body[1] == 'X');
  if (!hasHexPrefix)
    return convertFromDecimalString(body, rounding_mode);

  /* A prefix with nothing after it is not a number.  */
  if (body.size() == 2)
    return createError("Invalid string");

  return convertFromHexadecimalString(body.drop_front(2), rounding_mode);
}


/* Write the hexadecimal text form of this number to DST, in the C99
   shape [-]0xh.hhhhp[+-]d, and NUL-terminate it.  DST must be large
   enough.  The return value is the number of characters written, not
   counting the terminating NUL.

   UPPERCASE selects upper case output; otherwise lower case is used.

   HEXDIGITS is the total number of hexadecimal digits to produce, with
   the value rounded if necessary.  A HEXDIGITS of 0 asks for the minimal
   number of digits that represents the value precisely.  The hexadecimal
   point is omitted when nothing would follow it.

   The decimal exponent is always printed and has at least one digit.
   Zero values display an exponent of zero.  Infinities and NaNs appear
   as "infinity" or "nan" respectively.

   These rules follow C99, which leaves the choice of leading hexadecimal
   digit open.  This implementation picks whatever keeps the exponent as
   stored, so the exponent stays within the IEEE format range and the
   leading digit is 0 (denormals), 1 (normal numbers) or 2 (normal
   numbers rounded away from zero with all other digits zero).
*/

unsigned int IEEEFloat::convertToHexString(char *dst, unsigned int hexDigits,
                                           bool upperCase,
                                           roundingMode rounding_mode) const {
  char *const start = dst;
  char *out = dst;

  if (sign)
    *out++ = '-';

  switch (category) {
  case fcInfinity: {
    const char *text = upperCase ? infinityU : infinityL;
    memcpy(out, text, sizeof infinityU - 1);
    out += sizeof infinityL - 1;
    break;
  }

  case fcNaN: {
    const char *text = upperCase ? NaNU : NaNL;
    memcpy(out, text, sizeof NaNU - 1);
    out += sizeof NaNU - 1;
    break;
  }

  case fcZero: {
    *out++ = '0';
    *out++ = upperCase ? 'X' : 'x';
    *out++ = '0';
    /* Any requested digits beyond the first are zeroes after the point.  */
    if (hexDigits > 1) {
      const unsigned int fractionZeroes = hexDigits - 1;
      *out++ = '.';
      memset(out, '0', fractionZeroes);
      out += fractionZeroes;
    }
    *out++ = upperCase ? 'P' : 'p';
    *out++ = '0';
    break;
  }

  case fcNormal:
    out = convertNormalToHexString(out, hexDigits, upperCase, rounding_mode);
    break;
  }

  *out = 0;

  return static_cast<unsigned int>(out - start);
}


/* Does the hard work of outputting the correctly rounded hexadecimal
   form of a normal floating point number with the specified number of
   hexadecimal digits.  If HEXDIGITS is zero the minimum number of
   digits necessary to print the value precisely is output.

   Writes "0x" (or "0X"), the digits, and the 'p'/'P' exponent starting at
   DST, and returns the pointer produced by writeSignedDecimal after the
   exponent has been written.  No terminating NUL is written here; the
   caller adds it.  */
char *IEEEFloat::convertNormalToHexString(char *dst, unsigned int hexDigits,
                                          bool upperCase,
                                          roundingMode rounding_mode) const {
  unsigned int count, valueBits, shift, partsCount, outputDigits;
  const char *hexDigitChars;
  const integerPart *significand;
  char *p;
  bool roundUp;

  *dst++ = '0';
  *dst++ = upperCase ? 'X': 'x';

  roundUp = false;
  hexDigitChars = upperCase ? hexDigitsUpper: hexDigitsLower;

  significand = significandParts();
  partsCount = partCount();

  /* +3 because the first digit only uses the single integer bit, so
     we have 3 virtual zero most-significant-bits.  */
  valueBits = semantics->precision + 3;
  // Left shift that aligns the top of the (virtually padded) value with the
  // top of an integerPart.
  shift = integerPartWidth - valueBits % integerPartWidth;

  /* The natural number of digits required ignoring trailing
     insignificant zeroes.  */
  outputDigits = (valueBits - significandLSB () + 3) / 4;

  /* hexDigits of zero means use the required number for the
     precision.  Otherwise, see if we are truncating.  If we are,
     find out if we need to round away from zero.  */
  if (hexDigits) {
    if (hexDigits < outputDigits) {
      /* We are dropping non-zero bits, so need to check how to round.
         "bits" is the number of dropped bits.  */
      unsigned int bits;
      lostFraction fraction;

      bits = valueBits - hexDigits * 4;
      fraction = lostFractionThroughTruncation (significand, partsCount, bits);
      roundUp = roundAwayFromZero(rounding_mode, fraction, bits);
    }
    outputDigits = hexDigits;
  }

  /* Write the digits consecutively, and start writing in the location
     of the hexadecimal point.  We move the most significant digit
     left and add the hexadecimal point later.  */
  p = ++dst;

  // Number of integerParts needed to hold valueBits; this can be one more
  // than partsCount, which is handled as an imaginary zero part below.
  count = (valueBits + integerPartWidth - 1) / integerPartWidth;

  while (outputDigits && count) {
    integerPart part;

    /* Put the most significant integerPartWidth bits in "part".  */
    if (--count == partsCount)
      part = 0;  /* An imaginary higher zero part.  */
    else
      part = significand[count] << shift;

    // Fill the low bits of "part" from the next lower significand part.
    if (count && shift)
      part |= significand[count - 1] >> (integerPartWidth - shift);

    /* Convert as much of "part" to hexdigits as we can.  */
    unsigned int curDigits = integerPartWidth / 4;

    curDigits = std::min(curDigits, outputDigits);
    dst += partAsHex (dst, part, curDigits, hexDigitChars);
    outputDigits -= curDigits;
  }

  if (roundUp) {
    char *q = dst;

    /* Note that hexDigitChars has a trailing '0'.  */
    // Increment the last digit, carrying leftwards while a digit wraps
    // around to '0'.
    do {
      q--;
      *q = hexDigitChars[hexDigitValue (*q) + 1];
    } while (*q == '0');
    assert(q >= p);
  } else {
    /* Add trailing zeroes.  */
    memset (dst, '0', outputDigits);
    dst += outputDigits;
  }

  /* Move the most significant digit to before the point, and if there
     is something after the decimal point add it.  This must come
     after rounding above.  */
  p[-1] = p[0];
  if (dst -1 == p)
    dst--;
  else
    p[0] = '.';

  /* Finally output the exponent.  */
  *dst++ = upperCase ? 'P': 'p';

  return writeSignedDecimal (dst, exponent);
}


/// Compute a hash of \p Arg.  Finite non-zero values hash their category,
/// sign, precision, exponent and significand parts.  All other values hash
/// only their category, sign and precision, with the sign of a NaN fixed at
/// zero.
hash_code hash_value(const IEEEFloat &Arg) {
  const uint8_t categoryByte = (uint8_t)Arg.category;

  if (Arg.isFiniteNonZero()) {
    // Normal floats need their exponent and significand hashed.
    const auto *const firstPart = Arg.significandParts();
    const auto *const pastLastPart = firstPart + Arg.partCount();
    return hash_combine(categoryByte, (uint8_t)Arg.sign,
                        Arg.semantics->precision, Arg.exponent,
                        hash_combine_range(firstPart, pastLastPart));
  }

  // NaN has no sign, fix it at zero.
  const uint8_t signByte = Arg.isNaN() ? (uint8_t)0 : (uint8_t)Arg.sign;
  return hash_combine(categoryByte, signByte, Arg.semantics->precision);
}


// Conversion from APFloat to/from host float/double.  It may eventually be

// possible to eliminate these and have everybody deal with APFloats, but that

// will take a while.  This approach will not easily extend to long double.

// Current implementation requires integerPartWidth==64, which is correct at

// the moment but could be made more general.


// Denormals have exponent minExponent in APFloat, but minExponent-1 in

// the actual IEEE representations.  We compensate for that here.


/// Build the 80-bit pattern of an x87 double-extended value: word 0 holds
/// the 64-bit significand, and word 1 holds the 15-bit biased exponent with
/// the sign in bit 15.
APInt IEEEFloat::convertF80LongDoubleAPFloatToAPInt() const {
  assert(semantics ==
         (const llvm::fltSemantics *)&APFloatBase::semX87DoubleExtended);
  assert(partCount()==2);

  constexpr uint64_t IntegerBit = 0x8000000000000000ULL;
  constexpr uint64_t AllOnesExponent = 0x7fff;

  // Zero is the default; the remaining categories overwrite these.
  uint64_t biasedExponent = 0;
  uint64_t significandBits = 0;

  if (isFiniteNonZero()) {
    biasedExponent = exponent + 16383; // bias
    significandBits = significandParts()[0];
    // A value stored with the minimum exponent but without its integer bit
    // is a denormal, which is encoded with a zero exponent field.
    const bool integerBitClear = (significandBits & IntegerBit) == 0;
    if (biasedExponent == 1 && integerBitClear)
      biasedExponent = 0;
  } else if (category == fcInfinity) {
    biasedExponent = AllOnesExponent;
    significandBits = IntegerBit;
  } else if (category != fcZero) {
    assert(category == fcNaN && "Unknown category");
    biasedExponent = AllOnesExponent;
    significandBits = significandParts()[0];
  }

  const uint64_t signField = (uint64_t)(sign & 1) << 15;

  uint64_t words[2];
  words[0] = significandBits;
  words[1] = signField | (biasedExponent & AllOnesExponent);
  return APInt(80, words);
}


/// Build the 128-bit pattern of a legacy PPC double-double value as two
/// IEEE doubles: word 0 is this value converted to double, and word 1 is
/// the double holding the remainder (or zero when the first conversion
/// loses no information or yields a non-finite or zero result).
APInt IEEEFloat::convertPPCDoubleDoubleLegacyAPFloatToAPInt() const {
  assert(semantics ==
         (const llvm::fltSemantics *)&APFloatBase::semPPCDoubleDoubleLegacy);
  assert(partCount()==2);

  uint64_t words[2];
  opStatus fs;
  bool losesInfo;

  // Convert number to double.  To avoid spurious underflows, we re-
  // normalize against the "double" minExponent first, and only *then*
  // truncate the mantissa.  The result of that second conversion
  // may be inexact, but should never underflow.
  // Declare fltSemantics before APFloat that uses it (and
  // saves pointer to it) to ensure correct destruction order.
  fltSemantics extendedSemantics = *semantics;
  extendedSemantics.minExponent = APFloatBase::semIEEEdouble.minExponent;
  IEEEFloat extended(*this);
  fs = extended.convert(extendedSemantics, rmNearestTiesToEven, &losesInfo);
  assert(fs == opOK && !losesInfo);
  // fs is only read by the asserts; the cast silences unused-variable
  // warnings when asserts are compiled out.
  (void)fs;

  IEEEFloat u(extended);
  fs = u.convert(APFloatBase::semIEEEdouble, rmNearestTiesToEven, &losesInfo);
  assert(fs == opOK || fs == opInexact);
  (void)fs;
  // High double: the value rounded to double precision.
  words[0] = *u.convertDoubleAPFloatToAPInt().getRawData();

  // If conversion was exact or resulted in a special case, we're done;
  // just set the second double to zero.  Otherwise, re-convert back to
  // the extended format and compute the difference.  This now should
  // convert exactly to double.
  if (u.isFiniteNonZero() && losesInfo) {
    fs = u.convert(extendedSemantics, rmNearestTiesToEven, &losesInfo);
    assert(fs == opOK && !losesInfo);
    (void)fs;

    IEEEFloat v(extended);
    v.subtract(u, rmNearestTiesToEven);
    fs = v.convert(APFloatBase::semIEEEdouble, rmNearestTiesToEven, &losesInfo);
    assert(fs == opOK && !losesInfo);
    (void)fs;
    // Low double: what the high double could not represent.
    words[1] = *v.convertDoubleAPFloatToAPInt().getRawData();
  } else {
    words[1] = 0;
  }

  return APInt(128, words);
}


/// Build the bit pattern of this value for the semantics \p S, which must
/// be the semantics of this object.  The result is S.sizeInBits wide and is
/// assembled from the trailing significand bits, the biased exponent field
/// and the sign bit.  Categories that \p S cannot represent hit
/// llvm_unreachable.
template <const fltSemantics &S>
APInt IEEEFloat::convertIEEEFloatToAPInt() const {
  assert(semantics == &S);
  // Float8E8M0FNU uses a bias of -minExponent; every other format handled
  // here uses -(minExponent - 1).
  const int bias = (semantics == &APFloatBase::semFloat8E8M0FNU)
                       ? -S.minExponent
                       : -(S.minExponent - 1);
  constexpr unsigned int trailing_significand_bits = S.precision - 1;
  // Index of the significand part, and the mask within that part, that hold
  // the integer bit.
  constexpr int integer_bit_part = trailing_significand_bits / integerPartWidth;
  constexpr integerPart integer_bit =
      integerPart{1} << (trailing_significand_bits % integerPartWidth);
  constexpr uint64_t significand_mask = integer_bit - 1;
  // With no trailing significand bits the exponent field spans every bit of
  // the format; otherwise it is what remains after the sign and significand.
  constexpr unsigned int exponent_bits =
      trailing_significand_bits ? (S.sizeInBits - 1 - trailing_significand_bits)
                                : S.sizeInBits;
  static_assert(exponent_bits < 64);
  constexpr uint64_t exponent_mask = (uint64_t{1} << exponent_bits) - 1;

  uint64_t myexponent;
  std::array<integerPart, partCountForBits(trailing_significand_bits)>
      mysignificand;

  if (isFiniteNonZero()) {
    myexponent = exponent + bias;
    std::copy_n(significandParts(), mysignificand.size(),
                mysignificand.begin());
    if (myexponent == 1 &&
        !(significandParts()[integer_bit_part] & integer_bit))
      myexponent = 0; // denormal
  } else if (category == fcZero) {
    if (!S.hasZero)
      llvm_unreachable("semantics does not support zero!");
    myexponent = ::exponentZero(S) + bias;
    mysignificand.fill(0);
  } else if (category == fcInfinity) {
    if (S.nonFiniteBehavior == fltNonfiniteBehavior::NanOnly ||
        S.nonFiniteBehavior == fltNonfiniteBehavior::FiniteOnly)
      llvm_unreachable("semantics don't support inf!");
    myexponent = ::exponentInf(S) + bias;
    mysignificand.fill(0);
  } else {
    assert(category == fcNaN && "Unknown category!");
    if (S.nonFiniteBehavior == fltNonfiniteBehavior::FiniteOnly)
      llvm_unreachable("semantics don't support NaN!");
    myexponent = ::exponentNaN(S) + bias;
    std::copy_n(significandParts(), mysignificand.size(),
                mysignificand.begin());
  }
  std::array<uint64_t, (S.sizeInBits + 63) / 64> words;
  // Copy the significand into the low words; words_iter marks the first
  // word that was not written by the copy.
  auto words_iter =
      std::copy_n(mysignificand.begin(), mysignificand.size(), words.begin());
  if constexpr (significand_mask != 0 || trailing_significand_bits == 0) {
    // Clear the integer bit.
    words[mysignificand.size() - 1] &= significand_mask;
  }
  // Zero whatever words the significand copy did not reach.
  std::fill(words_iter, words.end(), uint64_t{0});
  constexpr size_t last_word = words.size() - 1;
  // The sign and exponent fields are OR-ed into the most significant word.
  uint64_t shifted_sign = static_cast<uint64_t>(sign & 1)
                          << ((S.sizeInBits - 1) % 64);
  words[last_word] |= shifted_sign;
  uint64_t shifted_exponent = (myexponent & exponent_mask)
                              << (trailing_significand_bits % 64);
  words[last_word] |= shifted_exponent;
  // Single-word formats use the APInt(numBits, value) constructor.
  if constexpr (last_word == 0) {
    return APInt(S.sizeInBits, words[0]);
  }
  return APInt(S.sizeInBits, words);
}


/// Bit pattern of this value under the semIEEEquad semantics; asserts that
/// the significand occupies two parts.
APInt IEEEFloat::convertQuadrupleAPFloatToAPInt() const {
  assert(partCount() == 2);
  return convertIEEEFloatToAPInt<APFloatBase::semIEEEquad>();
}


/// Bit pattern of this value under the semIEEEdouble semantics; asserts that
/// the significand occupies a single part.
APInt IEEEFloat::convertDoubleAPFloatToAPInt() const {
  assert(partCount()==1);
  return convertIEEEFloatToAPInt<APFloatBase::semIEEEdouble>();
}


/// Bit pattern of this value under the semIEEEsingle semantics; asserts that
/// the significand occupies a single part.
APInt IEEEFloat::convertFloatAPFloatToAPInt() const {
  assert(partCount()==1);
  return convertIEEEFloatToAPInt<APFloatBase::semIEEEsingle>();
}


/// Bit pattern of this value under the semBFloat semantics; asserts that the
/// significand occupies a single part.
APInt IEEEFloat::convertBFloatAPFloatToAPInt() const {
  assert(partCount() == 1);
  return convertIEEEFloatToAPInt<APFloatBase::semBFloat>();
}


/// Bit pattern of this value under the semIEEEhalf semantics; asserts that
/// the significand occupies a single part.
APInt IEEEFloat::convertHalfAPFloatToAPInt() const {
  assert(partCount()==1);
  // Name the semantics the same way as the sibling converters do.  The
  // former APFloatBase::APFloatBase:: spelling named the same object through
  // the injected class name.
  return convertIEEEFloatToAPInt<APFloatBase::semIEEEhalf>();
}


/// Bit pattern of this value under the semFloat8E5M2 semantics; asserts that
/// the significand occupies a single part.
APInt IEEEFloat::convertFloat8E5M2APFloatToAPInt() const {
  assert(partCount() == 1);
  return convertIEEEFloatToAPInt<APFloatBase::semFloat8E5M2>();
}


/// Bit pattern of this value under the semFloat8E5M2FNUZ semantics; asserts
/// that the significand occupies a single part.
APInt IEEEFloat::convertFloat8E5M2FNUZAPFloatToAPInt() const {
  assert(partCount() == 1);
  return convertIEEEFloatToAPInt<APFloatBase::semFloat8E5M2FNUZ>();
}


/// Bit pattern of this value under the semFloat8E4M3 semantics; asserts that
/// the significand occupies a single part.
APInt IEEEFloat::convertFloat8E4M3APFloatToAPInt() const {
  assert(partCount() == 1);
  return convertIEEEFloatToAPInt<APFloatBase::semFloat8E4M3>();
}


/// Bit pattern of this value under the semFloat8E4M3FN semantics; asserts
/// that the significand occupies a single part.
APInt IEEEFloat::convertFloat8E4M3FNAPFloatToAPInt() const {
  assert(partCount() == 1);
  return convertIEEEFloatToAPInt<APFloatBase::semFloat8E4M3FN>();
}


/// Bit pattern of this value under the semFloat8E4M3FNUZ semantics; asserts
/// that the significand occupies a single part.
APInt IEEEFloat::convertFloat8E4M3FNUZAPFloatToAPInt() const {
  assert(partCount() == 1);
  return convertIEEEFloatToAPInt<APFloatBase::semFloat8E4M3FNUZ>();
}


/// Bit pattern of this value under the semFloat8E4M3B11FNUZ semantics;
/// asserts that the significand occupies a single part.
APInt IEEEFloat::convertFloat8E4M3B11FNUZAPFloatToAPInt() const {
  assert(partCount() == 1);
  return convertIEEEFloatToAPInt<APFloatBase::semFloat8E4M3B11FNUZ>();
}


/// Bit pattern of this value under the semFloat8E3M4 semantics; asserts that
/// the significand occupies a single part.
APInt IEEEFloat::convertFloat8E3M4APFloatToAPInt() const {
  assert(partCount() == 1);
  return convertIEEEFloatToAPInt<APFloatBase::semFloat8E3M4>();
}


/// Bit pattern of this value under the semFloatTF32 semantics; asserts that
/// the significand occupies a single part.
APInt IEEEFloat::convertFloatTF32APFloatToAPInt() const {
  assert(partCount() == 1);
  return convertIEEEFloatToAPInt<APFloatBase::semFloatTF32>();
}


/// Bit pattern of this value under the semFloat8E8M0FNU semantics; asserts
/// that the significand occupies a single part.
APInt IEEEFloat::convertFloat8E8M0FNUAPFloatToAPInt() const {
  assert(partCount() == 1);
  return convertIEEEFloatToAPInt<APFloatBase::semFloat8E8M0FNU>();
}


/// Bit pattern of this value under the semFloat6E3M2FN semantics; asserts
/// that the significand occupies a single part.
APInt IEEEFloat::convertFloat6E3M2FNAPFloatToAPInt() const {
  assert(partCount() == 1);
  return convertIEEEFloatToAPInt<APFloatBase::semFloat6E3M2FN>();
}


/// Bit pattern of this value under the semFloat6E2M3FN semantics; asserts
/// that the significand occupies a single part.
APInt IEEEFloat::convertFloat6E2M3FNAPFloatToAPInt() const {
  assert(partCount() == 1);
  return convertIEEEFloatToAPInt<APFloatBase::semFloat6E2M3FN>();
}


/// Bit pattern of this value under the semFloat4E2M1FN semantics; asserts
/// that the significand occupies a single part.
APInt IEEEFloat::convertFloat4E2M1FNAPFloatToAPInt() const {
  assert(partCount() == 1);
  return convertIEEEFloatToAPInt<APFloatBase::semFloat4E2M1FN>();
}


// This function creates an APInt that is just a bit map of the floating

// point constant as it would appear in memory.  It is not a conversion,

// and treating the result as a normal integer is unlikely to be useful.


APInt IEEEFloat::bitcastToAPInt() const {
  // True when this value's semantics object is exactly \p Candidate. The
  // comparison is by address, so only the canonical APFloatBase semantics
  // objects ever match.
  const auto usesSemantics = [this](const fltSemantics &Candidate) {
    return semantics == &Candidate;
  };

  // IEEE interchange formats, bfloat and the PowerPC double-double format.
  if (usesSemantics(APFloatBase::semIEEEhalf))
    return convertHalfAPFloatToAPInt();
  if (usesSemantics(APFloatBase::semBFloat))
    return convertBFloatAPFloatToAPInt();
  if (usesSemantics(APFloatBase::semIEEEsingle))
    return convertFloatAPFloatToAPInt();
  if (usesSemantics(APFloatBase::semIEEEdouble))
    return convertDoubleAPFloatToAPInt();
  if (usesSemantics(APFloatBase::semIEEEquad))
    return convertQuadrupleAPFloatToAPInt();
  if (usesSemantics(APFloatBase::semPPCDoubleDoubleLegacy))
    return convertPPCDoubleDoubleLegacyAPFloatToAPInt();

  // 8-bit formats.
  if (usesSemantics(APFloatBase::semFloat8E5M2))
    return convertFloat8E5M2APFloatToAPInt();
  if (usesSemantics(APFloatBase::semFloat8E5M2FNUZ))
    return convertFloat8E5M2FNUZAPFloatToAPInt();
  if (usesSemantics(APFloatBase::semFloat8E4M3))
    return convertFloat8E4M3APFloatToAPInt();
  if (usesSemantics(APFloatBase::semFloat8E4M3FN))
    return convertFloat8E4M3FNAPFloatToAPInt();
  if (usesSemantics(APFloatBase::semFloat8E4M3FNUZ))
    return convertFloat8E4M3FNUZAPFloatToAPInt();
  if (usesSemantics(APFloatBase::semFloat8E4M3B11FNUZ))
    return convertFloat8E4M3B11FNUZAPFloatToAPInt();
  if (usesSemantics(APFloatBase::semFloat8E3M4))
    return convertFloat8E3M4APFloatToAPInt();

  // TF32, the exponent-only E8M0 format, and the 6-bit and 4-bit formats.
  if (usesSemantics(APFloatBase::semFloatTF32))
    return convertFloatTF32APFloatToAPInt();
  if (usesSemantics(APFloatBase::semFloat8E8M0FNU))
    return convertFloat8E8M0FNUAPFloatToAPInt();
  if (usesSemantics(APFloatBase::semFloat6E3M2FN))
    return convertFloat6E3M2FNAPFloatToAPInt();
  if (usesSemantics(APFloatBase::semFloat6E2M3FN))
    return convertFloat6E2M3FNAPFloatToAPInt();
  if (usesSemantics(APFloatBase::semFloat4E2M1FN))
    return convertFloat4E2M1FNAPFloatToAPInt();

  // x87 double-extended is the only format left.
  assert(semantics ==
             (const llvm::fltSemantics *)&APFloatBase::semX87DoubleExtended &&
         "unknown format!");
  return convertF80LongDoubleAPFloatToAPInt();
}


float IEEEFloat::convertToFloat() const {

  assert(semantics == (const llvm::fltSemantics *)&APFloatBase::semIEEEsingle &&

         "Float semantics are not IEEEsingle");

  APInt api = bitcastToAPInt();

  return api.bitsToFloat();

}


double IEEEFloat::convertToDouble() const {

  assert(semantics == (const llvm::fltSemantics *)&APFloatBase::semIEEEdouble &&

         "Float semantics are not IEEEdouble");

  APInt api = bitcastToAPInt();

  return api.bitsToDouble();

}


#ifdef HAS_IEE754_FLOAT128
/// Returns this value as a host float128. Only valid for IEEEquad semantics,
/// which is asserted. Compiled only when HAS_IEE754_FLOAT128 is defined.
float128 IEEEFloat::convertToQuad() const {
  assert(semantics == (const llvm::fltSemantics *)&APFloatBase::semIEEEquad &&
         "Float semantics are not IEEEquads");
  // Take the bit pattern and reinterpret it as a float128.
  return bitcastToAPInt().bitsToQuad();
}
#endif


/// Integer bit is explicit in this format.  Intel hardware (387 and later)

/// does not support these bit patterns:

///  exponent = all 1's, integer bit 0, significand 0 ("pseudoinfinity")

///  exponent = all 1's, integer bit 0, significand nonzero ("pseudoNaN")

///  exponent neither 0 nor all 1's, integer bit 0 ("unnormal")

///  exponent = 0, integer bit 1 ("pseudodenormal")

/// At the moment, the first three are treated as NaNs, the last one as Normal.

void IEEEFloat::initFromF80LongDoubleAPInt(const APInt &api) {

  uint64_t i1 = api.getRawData()[0];

  uint64_t i2 = api.getRawData()[1];

  uint64_t myexponent = (i2 & 0x7fff);

  uint64_t mysignificand = i1;

  uint8_t myintegerbit = mysignificand >> 63;


  initialize(&APFloatBase::semX87DoubleExtended);

  assert(partCount()==2);


  sign = static_cast<unsigned int>(i2>>15);

  if (myexponent == 0 && mysignificand == 0) {

    makeZero(sign);

  } else if (myexponent==0x7fff && mysignificand==0x8000000000000000ULL) {

    makeInf(sign);

  } else if ((myexponent == 0x7fff && mysignificand != 0x8000000000000000ULL) ||

             (myexponent != 0x7fff && myexponent != 0 && myintegerbit == 0)) {

    category = fcNaN;

    exponent = exponentNaN();

    significandParts()[0] = mysignificand;

    significandParts()[1] = 0;

  } else {

    category = fcNormal;

    exponent = myexponent - 16383;

    significandParts()[0] = mysignificand;

    significandParts()[1] = 0;

    if (myexponent==0)          // denormal

      exponent = -16382;

  }

}


/// Initializes this value from a 128-bit PPC double-double bit pattern: the
/// first 64-bit word is loaded as a double and widened to the legacy
/// double-double semantics, then the second word is added in unless the first
/// was zero, infinite or NaN.
void IEEEFloat::initFromPPCDoubleDoubleLegacyAPInt(const APInt &api) {
  const uint64_t *Words = api.getRawData();
  const uint64_t FirstDoubleBits = Words[0];
  const uint64_t SecondDoubleBits = Words[1];
  bool losesInfo;

  // Load the first double, then widen it to our format.
  initFromDoubleAPInt(APInt(64, FirstDoubleBits));
  opStatus fs = convert(APFloatBase::semPPCDoubleDoubleLegacy,
                        rmNearestTiesToEven, &losesInfo);
  assert(fs == opOK && !losesInfo);
  (void)fs;

  // Special values are fully described by the first double.
  if (!isFiniteNonZero())
    return;

  // Otherwise widen the second double the same way and add it in.
  IEEEFloat v(APFloatBase::semIEEEdouble, APInt(64, SecondDoubleBits));
  fs = v.convert(APFloatBase::semPPCDoubleDoubleLegacy, rmNearestTiesToEven,
                 &losesInfo);
  assert(fs == opOK && !losesInfo);
  (void)fs;

  add(v, rmNearestTiesToEven);
}


// The E8M0 format has the following characteristics:

// It is an 8-bit unsigned format with only exponents (no actual significand).

// No encodings for {zero, infinities or denorms}.

// NaN is represented by all 1's.

// Bias is 127.

void IEEEFloat::initFromFloat8E8M0FNUAPInt(const APInt &api) {

  const uint64_t exponent_mask = 0xff;

  uint64_t val = api.getRawData()[0];

  uint64_t myexponent = (val & exponent_mask);


  initialize(&APFloatBase::semFloat8E8M0FNU);

  assert(partCount() == 1);


  // This format has unsigned representation only

  sign = 0;


  // Set the significand

  // This format does not have any significand but the 'Pth' precision bit is

  // always set to 1 for consistency in APFloat's internal representation.

  uint64_t mysignificand = 1;

  significandParts()[0] = mysignificand;


  // This format can either have a NaN or fcNormal

  // All 1's i.e. 255 is a NaN

  if (val == exponent_mask) {

    category = fcNaN;

    exponent = exponentNaN();

    return;

  }

  // Handle fcNormal...

  category = fcNormal;

  exponent = myexponent - 127; // 127 is bias

}

/// Initializes this value from the bit pattern \p api, decoded according to
/// the semantics \p S (a compile-time template argument).
///
/// The pattern is split into sign, biased exponent and trailing significand,
/// then classified as infinity, NaN, zero, denormal or normal depending on
/// S.nonFiniteBehavior and S.nanEncoding. \p api must be exactly S.sizeInBits
/// wide (asserted).
template <const fltSemantics &S>

void IEEEFloat::initFromIEEEAPInt(const APInt &api) {

  assert(api.getBitWidth() == S.sizeInBits);

  // Position of the integer bit inside the highest significand part.
  constexpr integerPart integer_bit = integerPart{1}

                                      << ((S.precision - 1) % integerPartWidth);

  // Selects the trailing-significand bits that sit below the integer bit in
  // that part.
  constexpr uint64_t significand_mask = integer_bit - 1;

  constexpr unsigned int trailing_significand_bits = S.precision - 1;

  constexpr unsigned int stored_significand_parts =

      partCountForBits(trailing_significand_bits);

  // Everything that is neither the sign bit nor trailing significand is
  // exponent.
  constexpr unsigned int exponent_bits =

      S.sizeInBits - 1 - trailing_significand_bits;

  static_assert(exponent_bits < 64);

  constexpr uint64_t exponent_mask = (uint64_t{1} << exponent_bits) - 1;

  constexpr int bias = -(S.minExponent - 1);


  // Copy the bits of the significand. We need to clear out the exponent and

  // sign bit in the last word.

  std::array<integerPart, stored_significand_parts> mysignificand;

  std::copy_n(api.getRawData(), mysignificand.size(), mysignificand.begin());

  // A zero mask would wipe the whole part, so masking is skipped in that case.
  if constexpr (significand_mask != 0) {

    mysignificand[mysignificand.size() - 1] &= significand_mask;

  }


  // We assume the last word holds the sign bit, the exponent, and potentially

  // some of the trailing significand field.

  uint64_t last_word = api.getRawData()[api.getNumWords() - 1];

  uint64_t myexponent =

      (last_word >> (trailing_significand_bits % 64)) & exponent_mask;


  initialize(&S);

  assert(partCount() == mysignificand.size());


  // The sign is the topmost bit of the encoding.
  sign = static_cast<unsigned int>(last_word >> ((S.sizeInBits - 1) % 64));


  bool all_zero_significand =

      llvm::all_of(mysignificand, [](integerPart bits) { return bits == 0; });


  bool is_zero = myexponent == 0 && all_zero_significand;


  // Infinity is only recognized for semantics with IEEE754 non-finite
  // behavior.
  if constexpr (S.nonFiniteBehavior == fltNonfiniteBehavior::IEEE754) {

    if (myexponent - bias == ::exponentInf(S) && all_zero_significand) {

      makeInf(sign);

      return;

    }

  }


  bool is_nan = false;


  // How a NaN is recognized depends on the NaN encoding of the semantics.
  if constexpr (S.nanEncoding == fltNanEncoding::IEEE) {

    // NaN exponent with a non-zero trailing significand.
    is_nan = myexponent - bias == ::exponentNaN(S) && !all_zero_significand;

  } else if constexpr (S.nanEncoding == fltNanEncoding::AllOnes) {

    // NaN exponent with every trailing significand bit set.
    bool all_ones_significand =

        std::all_of(mysignificand.begin(), mysignificand.end() - 1,

                    [](integerPart bits) { return bits == ~integerPart{0}; }) &&

        (!significand_mask ||

         mysignificand[mysignificand.size() - 1] == significand_mask);

    is_nan = myexponent - bias == ::exponentNaN(S) && all_ones_significand;

  } else if constexpr (S.nanEncoding == fltNanEncoding::NegativeZero) {

    // The bit pattern that would otherwise be negative zero is the NaN.
    is_nan = is_zero && sign;

  }


  if (is_nan) {

    category = fcNaN;

    exponent = ::exponentNaN(S);

    // The trailing significand is copied over as-is.
    std::copy_n(mysignificand.begin(), mysignificand.size(),

                significandParts());

    return;

  }


  if (is_zero) {

    makeZero(sign);

    return;

  }


  category = fcNormal;

  exponent = myexponent - bias;

  std::copy_n(mysignificand.begin(), mysignificand.size(), significandParts());

  // Denormals use the minimum exponent and keep the integer bit clear; every
  // other value gets the integer bit set explicitly.
  if (myexponent == 0) // denormal

    exponent = S.minExponent;

  else

    significandParts()[mysignificand.size()-1] |= integer_bit; // integer bit

}


/// Initializes this value from the bits in \p api using IEEEquad semantics, by
/// forwarding to initFromIEEEAPInt.
void IEEEFloat::initFromQuadrupleAPInt(const APInt &api) {

  initFromIEEEAPInt<APFloatBase::semIEEEquad>(api);

}


/// Initializes this value from the bits in \p api using IEEEdouble semantics,
/// by forwarding to initFromIEEEAPInt.
void IEEEFloat::initFromDoubleAPInt(const APInt &api) {

  initFromIEEEAPInt<APFloatBase::semIEEEdouble>(api);

}


/// Initializes this value from the bits in \p api using IEEEsingle semantics,
/// by forwarding to initFromIEEEAPInt.
void IEEEFloat::initFromFloatAPInt(const APInt &api) {

  initFromIEEEAPInt<APFloatBase::semIEEEsingle>(api);

}


/// Initializes this value from the bits in \p api using BFloat semantics, by
/// forwarding to initFromIEEEAPInt.
void IEEEFloat::initFromBFloatAPInt(const APInt &api) {

  initFromIEEEAPInt<APFloatBase::semBFloat>(api);

}


/// Initializes this value from the bits in \p api using IEEEhalf semantics, by
/// forwarding to initFromIEEEAPInt.
void IEEEFloat::initFromHalfAPInt(const APInt &api) {

  initFromIEEEAPInt<APFloatBase::semIEEEhalf>(api);

}


/// Initializes this value from the bits in \p api using Float8E5M2 semantics,
/// by forwarding to initFromIEEEAPInt.
void IEEEFloat::initFromFloat8E5M2APInt(const APInt &api) {

  initFromIEEEAPInt<APFloatBase::semFloat8E5M2>(api);

}


/// Initializes this value from the bits in \p api using Float8E5M2FNUZ
/// semantics, by forwarding to initFromIEEEAPInt.
void IEEEFloat::initFromFloat8E5M2FNUZAPInt(const APInt &api) {

  initFromIEEEAPInt<APFloatBase::semFloat8E5M2FNUZ>(api);

}


/// Initializes this value from the bits in \p api using Float8E4M3 semantics,
/// by forwarding to initFromIEEEAPInt.
void IEEEFloat::initFromFloat8E4M3APInt(const APInt &api) {

  initFromIEEEAPInt<APFloatBase::semFloat8E4M3>(api);

}


/// Initializes this value from the bits in \p api using Float8E4M3FN
/// semantics, by forwarding to initFromIEEEAPInt.
void IEEEFloat::initFromFloat8E4M3FNAPInt(const APInt &api) {

  initFromIEEEAPInt<APFloatBase::semFloat8E4M3FN>(api);

}


/// Initializes this value from the bits in \p api using Float8E4M3FNUZ
/// semantics, by forwarding to initFromIEEEAPInt.
void IEEEFloat::initFromFloat8E4M3FNUZAPInt(const APInt &api) {

  initFromIEEEAPInt<APFloatBase::semFloat8E4M3FNUZ>(api);

}


/// Initializes this value from the bits in \p api using Float8E4M3B11FNUZ
/// semantics, by forwarding to initFromIEEEAPInt.
void IEEEFloat::initFromFloat8E4M3B11FNUZAPInt(const APInt &api) {

  initFromIEEEAPInt<APFloatBase::semFloat8E4M3B11FNUZ>(api);

}


/// Initializes this value from the bits in \p api using Float8E3M4 semantics,
/// by forwarding to initFromIEEEAPInt.
void IEEEFloat::initFromFloat8E3M4APInt(const APInt &api) {

  initFromIEEEAPInt<APFloatBase::semFloat8E3M4>(api);

}


/// Initializes this value from the bits in \p api using FloatTF32 semantics,
/// by forwarding to initFromIEEEAPInt.
void IEEEFloat::initFromFloatTF32APInt(const APInt &api) {

  initFromIEEEAPInt<APFloatBase::semFloatTF32>(api);

}


/// Initializes this value from the bits in \p api using Float6E3M2FN
/// semantics, by forwarding to initFromIEEEAPInt.
void IEEEFloat::initFromFloat6E3M2FNAPInt(const APInt &api) {

  initFromIEEEAPInt<APFloatBase::semFloat6E3M2FN>(api);

}


/// Initializes this value from the bits in \p api using Float6E2M3FN
/// semantics, by forwarding to initFromIEEEAPInt.
void IEEEFloat::initFromFloat6E2M3FNAPInt(const APInt &api) {

  initFromIEEEAPInt<APFloatBase::semFloat6E2M3FN>(api);

}


/// Initializes this value from the bits in \p api using Float4E2M1FN
/// semantics, by forwarding to initFromIEEEAPInt.
void IEEEFloat::initFromFloat4E2M1FNAPInt(const APInt &api) {

  initFromIEEEAPInt<APFloatBase::semFloat4E2M1FN>(api);

}


/// Treat api as containing the bits of a floating point number.

void IEEEFloat::initFromAPInt(const fltSemantics *Sem, const APInt &api) {
  assert(api.getBitWidth() == Sem->sizeInBits);

  // Pick the format-specific initializer by comparing \p Sem against the
  // address of each known semantics object.
  if (Sem == &APFloatBase::semIEEEhalf)
    initFromHalfAPInt(api);
  else if (Sem == &APFloatBase::semBFloat)
    initFromBFloatAPInt(api);
  else if (Sem == &APFloatBase::semIEEEsingle)
    initFromFloatAPInt(api);
  else if (Sem == &APFloatBase::semIEEEdouble)
    initFromDoubleAPInt(api);
  else if (Sem == &APFloatBase::semX87DoubleExtended)
    initFromF80LongDoubleAPInt(api);
  else if (Sem == &APFloatBase::semIEEEquad)
    initFromQuadrupleAPInt(api);
  else if (Sem == &APFloatBase::semPPCDoubleDoubleLegacy)
    initFromPPCDoubleDoubleLegacyAPInt(api);
  else if (Sem == &APFloatBase::semFloat8E5M2)
    initFromFloat8E5M2APInt(api);
  else if (Sem == &APFloatBase::semFloat8E5M2FNUZ)
    initFromFloat8E5M2FNUZAPInt(api);
  else if (Sem == &APFloatBase::semFloat8E4M3)
    initFromFloat8E4M3APInt(api);
  else if (Sem == &APFloatBase::semFloat8E4M3FN)
    initFromFloat8E4M3FNAPInt(api);
  else if (Sem == &APFloatBase::semFloat8E4M3FNUZ)
    initFromFloat8E4M3FNUZAPInt(api);
  else if (Sem == &APFloatBase::semFloat8E4M3B11FNUZ)
    initFromFloat8E4M3B11FNUZAPInt(api);
  else if (Sem == &APFloatBase::semFloat8E3M4)
    initFromFloat8E3M4APInt(api);
  else if (Sem == &APFloatBase::semFloatTF32)
    initFromFloatTF32APInt(api);
  else if (Sem == &APFloatBase::semFloat8E8M0FNU)
    initFromFloat8E8M0FNUAPInt(api);
  else if (Sem == &APFloatBase::semFloat6E3M2FN)
    initFromFloat6E3M2FNAPInt(api);
  else if (Sem == &APFloatBase::semFloat6E2M3FN)
    initFromFloat6E2M3FNAPInt(api);
  else if (Sem == &APFloatBase::semFloat4E2M1FN)
    initFromFloat4E2M1FNAPInt(api);
  else
    llvm_unreachable("unsupported semantics");
}


/// Make this number the largest magnitude normal number in the given

/// semantics.


void IEEEFloat::makeLargest(bool Negative) {

  if (Negative && !semantics->hasSignedRepr)

    llvm_unreachable(

        "This floating point format does not support signed values");

  // We want (in interchange format):

  //   sign = {Negative}

  //   exponent = 1..10

  //   significand = 1..1

  category = fcNormal;

  sign = Negative;

  exponent = semantics->maxExponent;


  // Use memset to set all but the highest integerPart to all ones.

  integerPart *significand = significandParts();

  unsigned PartCount = partCount();

  memset(significand, 0xFF, sizeof(integerPart)*(PartCount - 1));


  // Set the high integerPart especially setting all unused top bits for

  // internal consistency.

  const unsigned NumUnusedHighBits =

    PartCount*integerPartWidth - semantics->precision;

  significand[PartCount - 1] = (NumUnusedHighBits < integerPartWidth)

                                   ? (~integerPart(0) >> NumUnusedHighBits)

                                   : 0;

  if (semantics->nonFiniteBehavior == fltNonfiniteBehavior::NanOnly &&

      semantics->nanEncoding == fltNanEncoding::AllOnes &&

      (semantics->precision > 1))

    significand[0] &= ~integerPart(1);

}


/// Make this number the smallest magnitude denormal number in the given

/// semantics.


void IEEEFloat::makeSmallest(bool Negative) {
  if (Negative && !semantics->hasSignedRepr)
    llvm_unreachable(
        "This floating point format does not support signed values");

  // Internally: minimum exponent, significand 0..01, requested sign.
  APInt::tcSet(significandParts(), 1, partCount());
  exponent = semantics->minExponent;
  sign = Negative;
  category = fcNormal;
}


/// Make this number the smallest magnitude normalized number in the given
/// semantics: minimum exponent with only the integer bit of the significand
/// set.
void IEEEFloat::makeSmallestNormalized(bool Negative) {
  if (Negative && !semantics->hasSignedRepr)
    llvm_unreachable(
        "This floating point format does not support signed values");

  const unsigned IntegerBitIndex = semantics->precision - 1;

  category = fcNormal;
  // Clear the significand, then set just the integer bit (10..0).
  zeroSignificand();
  sign = Negative;
  exponent = semantics->minExponent;
  APInt::tcSetBit(significandParts(), IntegerBitIndex);
}


/// Constructs a value with semantics \p Sem from the bit pattern in \p API;
/// all of the work is done by initFromAPInt.
IEEEFloat::IEEEFloat(const fltSemantics &Sem, const APInt &API) {

  initFromAPInt(&Sem, API);

}


/// Constructs an IEEEsingle value from the bit pattern of the host float \p f.
IEEEFloat::IEEEFloat(float f) {

  initFromAPInt(&APFloatBase::semIEEEsingle, APInt::floatToBits(f));

}


/// Constructs an IEEEdouble value from the bit pattern of the host double
/// \p d.
IEEEFloat::IEEEFloat(double d) {

  initFromAPInt(&APFloatBase::semIEEEdouble, APInt::doubleToBits(d));

}


namespace {

  /// Appends the characters of \p Str to the end of \p Buffer.
  void append(SmallVectorImpl<char> &Buffer, StringRef Str) {
    const char *const First = Str.begin();
    const char *const Last = Str.end();
    Buffer.append(First, Last);
  }


  /// Removes data from the given significand until it is no more

  /// precise than is required for the desired precision.

  void AdjustToPrecision(APInt &significand,
                         int &exp, unsigned FormatPrecision) {
    const unsigned ActiveBits = significand.getActiveBits();

    // 196/59 is a very slight overestimate of lg_2(10).
    const unsigned BitsNeeded = (FormatPrecision * 196 + 58) / 59;
    if (ActiveBits <= BitsNeeded)
      return;

    // Whole decimal digits that can be dropped from the low end.
    const unsigned DigitsToDrop = (ActiveBits - BitsNeeded) * 59 / 196;
    if (DigitsToDrop == 0)
      return;

    exp += DigitsToDrop;

    // Build 10^DigitsToDrop by repeated squaring.
    const unsigned Width = significand.getBitWidth();
    APInt Divisor(Width, 1);
    APInt PowerOfTen(Width, 10);
    for (unsigned Remaining = DigitsToDrop;;) {
      if (Remaining & 1)
        Divisor *= PowerOfTen;
      Remaining >>= 1;
      if (Remaining == 0)
        break;
      PowerOfTen *= PowerOfTen;
    }

    significand = significand.udiv(Divisor);

    // Shrink the significand to exactly its active bit count.
    significand = significand.trunc(significand.getActiveBits());
  }


  /// Rounds the decimal digit string in \p buffer (least significant digit
  /// first) to at most \p FormatPrecision digits, dropping the discarded
  /// low-order digits and adding the number dropped to \p exp.
  void AdjustToPrecision(SmallVectorImpl<char> &buffer,
                         int &exp, unsigned FormatPrecision) {
    const unsigned Size = buffer.size();
    if (Size <= FormatPrecision)
      return;

    // The most significant figures are the last ones in the buffer, so the
    // digits to keep start at this index.
    unsigned Keep = Size - FormatPrecision;

    // FIXME: this probably shouldn't use 'round half up'.
    const bool RoundUp = buffer[Keep - 1] >= '5';

    if (!RoundUp) {
      // Rounding down is a plain truncation, but trailing zeros of the kept
      // digits are dropped as well.
      while (Keep < Size && buffer[Keep] == '0')
        ++Keep;
    } else {
      // Rounding up is a decimal add-with-carry. Each '9' we carry through
      // would become a trailing zero, so it is dropped instead.
      unsigned Pos = Keep;
      while (Pos != Size && buffer[Pos] == '9') {
        ++Keep;
        ++Pos;
      }
      if (Pos != Size)
        buffer[Pos]++;

      // If the carry ran through every digit, a single '1' is all that is
      // left.
      if (Keep == Size) {
        exp += Keep;
        buffer.clear();
        buffer.push_back('1');
        return;
      }
    }

    exp += Keep;
    buffer.erase(&buffer[0], &buffer[Keep]);
  }


  /// Appends the decimal text for the value significand * 2^exp to \p Str.
  ///
  /// \param Str output buffer; characters are only appended.
  /// \param isNeg when true a leading '-' is emitted.
  /// \param exp binary exponent applied to \p significand.
  /// \param significand integer significand; its bit width is taken as the
  ///        precision of the format.
  /// \param FormatPrecision maximum number of decimal digits; 0 means derive
  ///        it from the significand's bit width.
  /// \param FormatMaxPadding 0 forces scientific notation; otherwise it bounds
  ///        how many padding zeros plain notation may use.
  /// \param TruncateZero selects 'E' over 'e' for the exponent marker and
  ///        turns off the zero padding of the fraction and the exponent.
  void toStringImpl(SmallVectorImpl<char> &Str, const bool isNeg, int exp,

                    APInt significand, unsigned FormatPrecision,

                    unsigned FormatMaxPadding, bool TruncateZero) {

    const int semanticsPrecision = significand.getBitWidth();


    if (isNeg)

      Str.push_back('-');


    // Set FormatPrecision if zero.  We want to do this before we

    // truncate trailing zeros, as those are part of the precision.

    if (!FormatPrecision) {

      // We use enough digits so the number can be round-tripped back to an

      // APFloat. The formula comes from "How to Print Floating-Point Numbers

      // Accurately" by Steele and White.

      // FIXME: Using a formula based purely on the precision is conservative;

      // we can print fewer digits depending on the actual value being printed.


      // FormatPrecision = 2 + floor(significandBits / lg_2(10))

      FormatPrecision = 2 + semanticsPrecision * 59 / 196;

    }


    // Ignore trailing binary zeros.

    int trailingZeros = significand.countr_zero();

    exp += trailingZeros;

    significand.lshrInPlace(trailingZeros);


    // Change the exponent from 2^e to 10^e.

    if (exp == 0) {

      // Nothing to do.

    } else if (exp > 0) {

      // Just shift left.

      significand = significand.zext(semanticsPrecision + exp);

      significand <<= exp;

      exp = 0;

    } else { /* exp < 0 */

      int texp = -exp;


      // We transform this using the identity:

      //   (N)(2^-e) == (N)(5^e)(10^-e)

      // This means we have to multiply N (the significand) by 5^e.

      // To avoid overflow, we have to operate on numbers large

      // enough to store N * 5^e:

      //   log2(N * 5^e) == log2(N) + e * log2(5)

      //                 <= semantics->precision + e * 137 / 59

      //   (log_2(5) ~ 2.321928 < 2.322034 ~ 137/59)


      unsigned precision = semanticsPrecision + (137 * texp + 136) / 59;


      // Multiply significand by 5^e.

      //   N * 5^0101 == N * 5^(1*1) * 5^(0*2) * 5^(1*4) * 5^(0*8)

      significand = significand.zext(precision);

      APInt five_to_the_i(precision, 5);

      while (true) {

        if (texp & 1)

          significand *= five_to_the_i;


        texp >>= 1;

        if (!texp)

          break;

        five_to_the_i *= five_to_the_i;

      }

    }


    // From here on, exp is a power-of-ten exponent.
    AdjustToPrecision(significand, exp, FormatPrecision);


    // Decimal digits of the significand, least significant digit first.
    SmallVector<char, 256> buffer;


    // Fill the buffer.

    unsigned precision = significand.getBitWidth();

    if (precision < 4) {

      // We need enough precision to store the value 10.

      precision = 4;

      significand = significand.zext(precision);

    }

    APInt ten(precision, 10);

    APInt digit(precision, 0);


    bool inTrail = true;

    while (significand != 0) {

      // digit <- significand % 10

      // significand <- significand / 10

      APInt::udivrem(significand, ten, significand, digit);


      unsigned d = digit.getZExtValue();


      // Drop trailing zeros.

      if (inTrail && !d)

        exp++;

      else {

        buffer.push_back((char) ('0' + d));

        inTrail = false;

      }

    }


    assert(!buffer.empty() && "no characters in buffer!");


    // Drop down to FormatPrecision.

    // TODO: don't do more precise calculations above than are required.

    AdjustToPrecision(buffer, exp, FormatPrecision);


    unsigned NDigits = buffer.size();


    // Check whether we should use scientific notation.

    bool FormatScientific;

    if (!FormatMaxPadding)

      FormatScientific = true;

    else {

      if (exp >= 0) {

        // 765e3 --> 765000

        //              ^^^

        // But we shouldn't make the number look more precise than it is.

        FormatScientific = ((unsigned) exp > FormatMaxPadding ||

                            NDigits + (unsigned) exp > FormatPrecision);

      } else {

        // Power of the most significant digit.

        int MSD = exp + (int) (NDigits - 1);

        if (MSD >= 0) {

          // 765e-2 == 7.65

          FormatScientific = false;

        } else {

          // 765e-5 == 0.00765

          //           ^ ^^

          FormatScientific = ((unsigned) -MSD) > FormatMaxPadding;

        }

      }

    }


    // Scientific formatting is pretty straightforward.

    if (FormatScientific) {

      // Re-base the exponent on the leading digit, which is printed before
      // the decimal point.
      exp += (NDigits - 1);


      Str.push_back(buffer[NDigits-1]);

      Str.push_back('.');

      if (NDigits == 1 && TruncateZero)

        Str.push_back('0');

      else

        for (unsigned I = 1; I != NDigits; ++I)

          Str.push_back(buffer[NDigits-1-I]);

      // Fill with zeros up to FormatPrecision.

      if (!TruncateZero && FormatPrecision > NDigits - 1)

        Str.append(FormatPrecision - NDigits + 1, '0');

      // For !TruncateZero we use lower 'e'.

      Str.push_back(TruncateZero ? 'E' : 'e');


      Str.push_back(exp >= 0 ? '+' : '-');

      if (exp < 0)

        exp = -exp;

      // Exponent digits are produced least significant first and emitted in
      // reverse below.
      SmallVector<char, 6> expbuf;

      do {

        expbuf.push_back((char) ('0' + (exp % 10)));

        exp /= 10;

      } while (exp);

      // Exponent always at least two digits if we do not truncate zeros.

      if (!TruncateZero && expbuf.size() < 2)

        expbuf.push_back('0');

      for (unsigned I = 0, E = expbuf.size(); I != E; ++I)

        Str.push_back(expbuf[E-1-I]);

      return;

    }


    // Non-scientific, positive exponents.

    if (exp >= 0) {

      for (unsigned I = 0; I != NDigits; ++I)

        Str.push_back(buffer[NDigits-1-I]);

      for (unsigned I = 0; I != (unsigned) exp; ++I)

        Str.push_back('0');

      return;

    }


    // Non-scientific, negative exponents.


    // The number of digits to the left of the decimal point.

    int NWholeDigits = exp + (int) NDigits;


    unsigned I = 0;

    if (NWholeDigits > 0) {

      for (; I != (unsigned) NWholeDigits; ++I)

        Str.push_back(buffer[NDigits-I-1]);

      Str.push_back('.');

    } else {

      // No whole digits: emit "0." followed by the zeros that sit between the
      // decimal point and the first significant digit.
      unsigned NZeros = 1 + (unsigned) -NWholeDigits;


      Str.push_back('0');

      Str.push_back('.');

      for (unsigned Z = 1; Z != NZeros; ++Z)

        Str.push_back('0');

    }


    // Remaining (fractional) digits, most significant first.
    for (; I != NDigits; ++I)

      Str.push_back(buffer[NDigits-I-1]);


  }

} // namespace


/// Appends a textual form of this value to \p Str. Infinities, NaN and zero
/// are written directly; finite non-zero values are decomposed into an integer
/// significand and a binary exponent and handed to toStringImpl.
void IEEEFloat::toString(SmallVectorImpl<char> &Str, unsigned FormatPrecision,
                         unsigned FormatMaxPadding, bool TruncateZero) const {
  if (category == fcInfinity) {
    append(Str, isNegative() ? "-Inf" : "+Inf");
    return;
  }

  if (category == fcNaN) {
    append(Str, "NaN");
    return;
  }

  if (category == fcZero) {
    if (isNegative())
      Str.push_back('-');

    // A non-zero padding budget means plain notation: just "0".
    if (FormatMaxPadding) {
      Str.push_back('0');
      return;
    }

    // Otherwise zero is written in scientific notation.
    if (TruncateZero) {
      append(Str, "0.0E+0");
      return;
    }

    append(Str, "0.0");
    if (FormatPrecision > 1)
      Str.append(FormatPrecision - 1, '0');
    append(Str, "e+00");
    return;
  }

  // fcNormal: split the number into an APInt significand and an exponent
  // scaled so that the significand is an integer.
  const unsigned Precision = semantics->precision;
  const int exp = exponent - (static_cast<int>(Precision) - 1);
  APInt significand(
      Precision, ArrayRef(significandParts(), partCountForBits(Precision)));

  toStringImpl(Str, isNegative(), exp, significand, FormatPrecision,
               FormatMaxPadding, TruncateZero);
}


int IEEEFloat::getExactLog2Abs() const {

  if (!isFinite() || isZero())

    return INT_MIN;


  const integerPart *Parts = significandParts();

  const int PartCount = partCountForBits(semantics->precision);


  int PopCount = 0;

  for (int i = 0; i < PartCount; ++i) {

    PopCount += llvm::popcount(Parts[i]);

    if (PopCount > 1)

      return INT_MIN;

  }


  if (exponent != semantics->minExponent)

    return exponent;


  int CountrParts = 0;

  for (int i = 0; i < PartCount;

       ++i, CountrParts += APInt::APINT_BITS_PER_WORD) {

    if (Parts[i] != 0) {

      return exponent - semantics->precision + CountrParts +

             llvm::countr_zero(Parts[i]) + 1;

    }

  }


  llvm_unreachable("didn't find the set bit");

}


bool IEEEFloat::isSignaling() const {

  if (!isNaN())

    return false;

  if (semantics->nonFiniteBehavior == fltNonfiniteBehavior::NanOnly ||

      semantics->nonFiniteBehavior == fltNonfiniteBehavior::FiniteOnly)

    return false;


  // IEEE-754R 2008 6.2.1: A signaling NaN bit string should be encoded with the

  // first bit of the trailing significand being 0.

  return !APInt::tcExtractBit(significandParts(), semantics->precision - 2);

}


/// IEEE-754R 2008 5.3.1: nextUp/nextDown.

///

/// *NOTE* since nextDown(x) = -nextUp(-x), we only implement nextUp with

/// appropriate sign switching before/after the computation.


APFloat::opStatus IEEEFloat::next(bool nextDown) {

  // Returns opOK, or opInvalidOp when the input was a signaling NaN.

  // If we are performing nextDown, swap sign so we have -x.

  if (nextDown)

    changeSign();


  // Compute nextUp(x)

  opStatus result = opOK;


  // Handle each float category separately.

  switch (category) {

  case fcInfinity:

    // nextUp(+inf) = +inf

    if (!isNegative())

      break;

    // nextUp(-inf) = -getLargest()

    makeLargest(true);

    break;

  case fcNaN:

    // IEEE-754R 2008 6.2 Par 2: nextUp(sNaN) = qNaN. Set Invalid flag.

    // IEEE-754R 2008 6.2: nextUp(qNaN) = qNaN. Must be identity so we do not

    //                     change the payload.

    if (isSignaling()) {

      result = opInvalidOp;

      // For consistency, propagate the sign of the sNaN to the qNaN.

      makeNaN(false, isNegative(), nullptr);

    }

    break;

  case fcZero:

    // nextUp(pm 0) = +getSmallest()

    makeSmallest(false);

    break;

  case fcNormal:

    // nextUp(-getSmallest()) = -0

    if (isSmallest() && isNegative()) {

      APInt::tcSet(significandParts(), 0, partCount());

      category = fcZero;

      exponent = 0;

      // With the NegativeZero NaN encoding the result has to be +0.
      if (semantics->nanEncoding == fltNanEncoding::NegativeZero)

        sign = false;

      // Formats without a zero get the smallest normalized positive value
      // instead.
      if (!semantics->hasZero)

        makeSmallestNormalized(false);

      break;

    }


    if (isLargest() && !isNegative()) {

      if (semantics->nonFiniteBehavior == fltNonfiniteBehavior::NanOnly) {

        // nextUp(getLargest()) == NAN

        makeNaN();

        break;

      } else if (semantics->nonFiniteBehavior ==

                 fltNonfiniteBehavior::FiniteOnly) {

        // nextUp(getLargest()) == getLargest()

        break;

      } else {

        // nextUp(getLargest()) == INFINITY

        APInt::tcSet(significandParts(), 0, partCount());

        category = fcInfinity;

        exponent = semantics->maxExponent + 1;

        break;

      }

    }


    // nextUp(normal) == normal + inc.

    if (isNegative()) {

      // If we are negative, we need to decrement the significand.


      // We only cross a binade boundary that requires adjusting the exponent

      // if:

      //   1. exponent != semantics->minExponent. This implies we are not in the

      //   smallest binade or are dealing with denormals.

      //   2. Our significand excluding the integral bit is all zeros.

      bool WillCrossBinadeBoundary =

        exponent != semantics->minExponent && isSignificandAllZeros();


      // Decrement the significand.

      //

      // We always do this since:

      //   1. If we are dealing with a non-binade decrement, by definition we

      //   just decrement the significand.

      //   2. If we are dealing with a normal -> normal binade decrement, since

      //   we have an explicit integral bit the fact that all bits but the

      //   integral bit are zero implies that subtracting one will yield a

      //   significand with 0 integral bit and 1 in all other spots. Thus we

      //   must just adjust the exponent and set the integral bit to 1.

      //   3. If we are dealing with a normal -> denormal binade decrement,

      //   since we set the integral bit to 0 when we represent denormals, we

      //   just decrement the significand.

      integerPart *Parts = significandParts();

      APInt::tcDecrement(Parts, partCount());


      if (WillCrossBinadeBoundary) {

        // Our result is a normal number. Do the following:

        // 1. Set the integral bit to 1.

        // 2. Decrement the exponent.

        APInt::tcSetBit(Parts, semantics->precision - 1);

        exponent--;

      }

    } else {

      // If we are positive, we need to increment the significand.


      // We only cross a binade boundary that requires adjusting the exponent if

      // the input is not a denormal and all of said input's significand bits

      // are set. If all of said conditions are true: clear the significand, set

      // the integral bit to 1, and increment the exponent. If we have a

      // denormal always increment since moving denormals and the numbers in the

      // smallest normal binade have the same exponent in our representation.

      // If there are only exponents, any increment always crosses the

      // BinadeBoundary.

      bool WillCrossBinadeBoundary = !APFloat::hasSignificand(*semantics) ||

                                     (!isDenormal() && isSignificandAllOnes());


      if (WillCrossBinadeBoundary) {

        integerPart *Parts = significandParts();

        APInt::tcSet(Parts, 0, partCount());

        APInt::tcSetBit(Parts, semantics->precision - 1);

        assert(exponent != semantics->maxExponent &&

               "We can not increment an exponent beyond the maxExponent allowed"

               " by the given floating point semantics.");

        exponent++;

      } else {

        incrementSignificand();

      }

    }

    break;

  }


  // If we are performing nextDown, swap sign so we have -nextUp(-x)

  if (nextDown)

    changeSign();


  return result;

}


/// Returns the exponent value used for NaN under this value's semantics, as
/// computed by the file-level ::exponentNaN helper.
APFloatBase::ExponentType IEEEFloat::exponentNaN() const {

  return ::exponentNaN(*semantics);

}


/// Returns the exponent value used for infinity under this value's semantics,
/// as computed by the file-level ::exponentInf helper.
APFloatBase::ExponentType IEEEFloat::exponentInf() const {

  return ::exponentInf(*semantics);

}


/// Returns the exponent value used for zero under this value's semantics, as
/// computed by the file-level ::exponentZero helper.
APFloatBase::ExponentType IEEEFloat::exponentZero() const {

  return ::exponentZero(*semantics);

}


void IEEEFloat::makeInf(bool Negative) {

  if (semantics->nonFiniteBehavior == fltNonfiniteBehavior::FiniteOnly)

    llvm_unreachable("This floating point format does not support Inf");


  if (semantics->nonFiniteBehavior == fltNonfiniteBehavior::NanOnly) {

    // There is no Inf, so make NaN instead.

    makeNaN(false, Negative);

    return;

  }

  category = fcInfinity;

  sign = Negative;

  exponent = exponentInf();

  APInt::tcSet(significandParts(), 0, partCount());

}


/// Turns this value into a zero whose sign bit is \p Negative.
///
/// Formats without a zero (semantics->hasZero is false) reach
/// llvm_unreachable. When the format's NaN encoding is NegativeZero the sign
/// is forced positive.
void IEEEFloat::makeZero(bool Negative) {
  if (!semantics->hasZero)
    llvm_unreachable("This floating point format does not support Zero");

  // The bit pattern 0b10000...000 encodes NaN in NegativeZero formats, so a
  // requested negative zero is merged into positive zero.
  const bool NegativeZeroIsNaN =
      semantics->nanEncoding == fltNanEncoding::NegativeZero;

  category = fcZero;
  sign = NegativeZeroIsNaN ? false : Negative;
  exponent = exponentZero();
  APInt::tcSet(significandParts(), 0, partCount());
}


/// Sets significand bit (precision - 2) of a NaN, which the callers in this
/// file use to quiet it. Does nothing for NanOnly formats. Must only be
/// called on a NaN.
void IEEEFloat::makeQuiet() {
  assert(isNaN());
  if (semantics->nonFiniteBehavior == fltNonfiniteBehavior::NanOnly)
    return;

  const unsigned QuietBit = semantics->precision - 2;
  APInt::tcSetBit(significandParts(), QuietBit);
}


int ilogb(const IEEEFloat &Arg) {

  if (Arg.isNaN())

    return APFloat::IEK_NaN;

  if (Arg.isZero())

    return APFloat::IEK_Zero;

  if (Arg.isInfinity())

    return APFloat::IEK_Inf;

  if (!Arg.isDenormal())

    return Arg.exponent;


  IEEEFloat Normalized(Arg);

  int SignificandBits = Arg.getSemantics().precision - 1;


  Normalized.exponent += SignificandBits;

  Normalized.normalize(APFloat::rmNearestTiesToEven, lfExactlyZero);

  return Normalized.exponent - SignificandBits;

}


/// Returns \p X with \p Exp added to its exponent, renormalized using
/// \p RoundingMode. A NaN result is passed through makeQuiet().
IEEEFloat scalbn(IEEEFloat X, int Exp, roundingMode RoundingMode) {
  const fltSemantics &Sem = X.getSemantics();
  auto MaxExp = Sem.maxExponent;
  auto MinExp = Sem.minExponent;

  // A wildly out-of-scale Exp would overflow when added to X.exponent, so it
  // is clamped first. The clamp range must be wide enough not to change the
  // result: it spans the distance between the largest possible exponent and
  // the normalized exponent of half the smallest denormal.
  int SignificandBits = Sem.precision - 1;
  int MaxIncrement = MaxExp - (MinExp - SignificandBits) + 1;

  // Clamp to one past the range ends to let normalize handle overflow.
  const int ClampedExp = std::clamp(Exp, -MaxIncrement - 1, MaxIncrement);
  X.exponent += ClampedExp;
  X.normalize(RoundingMode, lfExactlyZero);

  if (X.isNaN())
    X.makeQuiet();
  return X;
}


/// Splits \p Val into a fraction (returned) and an exponent (stored in
/// \p Exp).
///
/// For NaN the result is a quieted copy and \p Exp is APFloat::IEK_NaN. For
/// infinity the result is \p Val and \p Exp is APFloat::IEK_Inf. For zero
/// \p Exp is 0. Otherwise \p Exp is ilogb(Val) + 1 and the result is
/// scalbn(Val, -Exp, RM).
IEEEFloat frexp(const IEEEFloat &Val, int &Exp, roundingMode RM) {
  Exp = ilogb(Val);

  switch (Exp) {
  case APFloat::IEK_NaN: {
    // Quiet signalling nans.
    IEEEFloat Quiet(Val);
    Quiet.makeQuiet();
    return Quiet;
  }
  case APFloat::IEK_Inf:
    return Val;
  case APFloat::IEK_Zero:
    Exp = 0;
    break;
  default:
    // 1 is added because frexp is defined to return a normalized fraction in
    // +/-[0.5, 1.0), rather than the usual +/-[1.0, 2.0).
    Exp = Exp + 1;
    break;
  }

  return scalbn(Val, -Exp, RM);
}


/// Constructs a double-double with semantics \p S. Both components are
/// allocated as a two-element APFloat array, each built from
/// APFloat(semIEEEdouble). \p S must be semPPCDoubleDouble (asserted).
DoubleAPFloat::DoubleAPFloat(const fltSemantics &S)
    : Semantics(&S),
      Floats(new APFloat[2]{APFloat(APFloatBase::semIEEEdouble),
                            APFloat(APFloatBase::semIEEEdouble)}) {
  assert(Semantics == &APFloatBase::semPPCDoubleDouble);
}


/// Constructs a double-double with semantics \p S whose two components are
/// built with the `uninitialized` tag. \p S must be semPPCDoubleDouble
/// (asserted).
DoubleAPFloat::DoubleAPFloat(const fltSemantics &S, uninitializedTag)
    : Semantics(&S), Floats(new APFloat[2]{
                         APFloat(APFloatBase::semIEEEdouble, uninitialized),
                         APFloat(APFloatBase::semIEEEdouble, uninitialized)}) {
  assert(Semantics == &APFloatBase::semPPCDoubleDouble);
}


/// Constructs a double-double with semantics \p S. The first component is
/// APFloat(semIEEEdouble, I) and the second is APFloat(semIEEEdouble).
/// \p S must be semPPCDoubleDouble (asserted).
DoubleAPFloat::DoubleAPFloat(const fltSemantics &S, integerPart I)
    : Semantics(&S),
      Floats(new APFloat[2]{APFloat(APFloatBase::semIEEEdouble, I),
                            APFloat(APFloatBase::semIEEEdouble)}) {
  assert(Semantics == &APFloatBase::semPPCDoubleDouble);
}


/// Constructs a double-double from a bit pattern: raw word 0 of \p I becomes
/// the bits of the first component and raw word 1 the bits of the second.
/// This mirrors the word order produced by bitcastToAPInt().
/// \p S must be semPPCDoubleDouble (asserted).
///
/// NOTE(review): \p I must provide at least two 64-bit words (presumably it is
/// always 128 bits wide); the width is not checked here -- confirm at callers.
DoubleAPFloat::DoubleAPFloat(const fltSemantics &S, const APInt &I)
    : Semantics(&S),
      Floats(new APFloat[2]{
          APFloat(APFloatBase::semIEEEdouble, APInt(64, I.getRawData()[0])),
          APFloat(APFloatBase::semIEEEdouble, APInt(64, I.getRawData()[1]))}) {
  assert(Semantics == &APFloatBase::semPPCDoubleDouble);
}


/// Constructs a double-double with semantics \p S by moving \p First and
/// \p Second into the first and second components respectively.
/// \p S must be semPPCDoubleDouble and both components must have
/// semIEEEdouble semantics (all asserted).
DoubleAPFloat::DoubleAPFloat(const fltSemantics &S, APFloat &&First,
                             APFloat &&Second)
    : Semantics(&S),
      Floats(new APFloat[2]{std::move(First), std::move(Second)}) {
  assert(Semantics == &APFloatBase::semPPCDoubleDouble);
  assert(&Floats[0].getSemantics() == &APFloatBase::semIEEEdouble);
  assert(&Floats[1].getSemantics() == &APFloatBase::semIEEEdouble);
}


/// Copy constructor. Allocates a fresh two-element array holding copies of
/// RHS's components, or leaves Floats null when RHS.Floats is null (e.g. a
/// moved-from source). The copied semantics must be semPPCDoubleDouble
/// (asserted).
DoubleAPFloat::DoubleAPFloat(const DoubleAPFloat &RHS)
    : Semantics(RHS.Semantics),
      Floats(RHS.Floats ? new APFloat[2]{APFloat(RHS.Floats[0]),
                                         APFloat(RHS.Floats[1])}
                        : nullptr) {
  assert(Semantics == &APFloatBase::semPPCDoubleDouble);
}


/// Move constructor. Takes over RHS's semantics pointer and component array,
/// then leaves RHS with semBogus semantics and a null Floats. The semantics
/// taken over must be semPPCDoubleDouble (asserted).
DoubleAPFloat::DoubleAPFloat(DoubleAPFloat &&RHS)
    : Semantics(RHS.Semantics), Floats(RHS.Floats) {
  assert(Semantics == &APFloatBase::semPPCDoubleDouble);

  // Detach the source so it no longer refers to the array now held here.
  RHS.Floats = nullptr;
  RHS.Semantics = &APFloatBase::semBogus;
}


/// Copy assignment.
///
/// When both sides share semantics and RHS has components, the two components
/// are assigned element-wise, reusing the existing array. Otherwise, unless
/// this is a self-assignment, the object is destroyed and copy-constructed in
/// place from \p RHS.
DoubleAPFloat &DoubleAPFloat::operator=(const DoubleAPFloat &RHS) {
  const bool CanAssignInPlace = Semantics == RHS.Semantics && RHS.Floats;
  if (CanAssignInPlace) {
    for (unsigned Idx = 0; Idx != 2; ++Idx)
      Floats[Idx] = RHS.Floats[Idx];
    return *this;
  }

  if (this == &RHS)
    return *this;

  this->~DoubleAPFloat();
  new (this) DoubleAPFloat(RHS);
  return *this;
}


// Computes the pair (Hi, Lo) for the sum X + Y such that:
// 1. abs(Lo) <= ulp(Hi)/2
// 2. Hi == RTNE(Hi + Lo)
// 3. Hi + Lo == X + Y
//
// Precondition: log2(X) >= log2(Y).
//
// A non-finite X is returned unchanged, paired with a positive zero.
static std::pair<APFloat, APFloat> fastTwoSum(APFloat X, APFloat Y) {
  if (X.isFinite()) {
    APFloat Hi = X + Y;
    // Lo is the part of Y that did not make it into Hi.
    APFloat Lo = Y - (Hi - X);
    return {Hi, Lo};
  }
  return {X, APFloat::getZero(X.getSemantics(), /*Negative=*/false)};
}


// Implement addition, subtraction, multiplication and division based on:
// "Software for Doubled-Precision Floating-Point Computations",
// by Seppo Linnainmaa, ACM TOMS vol 7 no 3, September 1981, pages 272-283.
//
// addImpl adds the double-double operands (a, aa) and (c, cc) and stores the
// sum into Floats[0] / Floats[1]. addWithSpecial passes each operand's
// Floats[0] as a / c and Floats[1] as aa / cc. The return value is the
// bitwise OR of the statuses of the component operations, except on the two
// paths noted below where the accumulated status is reset or dropped.
APFloat::opStatus DoubleAPFloat::addImpl(const APFloat &a, const APFloat &aa,
                                         const APFloat &c, const APFloat &cc,
                                         roundingMode RM) {
  int Status = opOK;
  // z = a + c
  APFloat z = a;
  Status |= z.add(c, RM);
  if (!z.isFinite()) {
    // Not finite and not infinite: a + c is NaN. Store it with a zero low
    // part.
    if (!z.isInfinity()) {
      Floats[0] = std::move(z);
      Floats[1].makeZero(/* Neg = */ false);
      return (opStatus)Status;
    }
    // a + c is infinite. Discard the status gathered so far and redo the sum
    // starting from the low parts, adding the high part of smaller magnitude
    // before the larger one.
    Status = opOK;
    auto AComparedToC = a.compareAbsoluteValue(c);
    z = cc;
    Status |= z.add(aa, RM);
    if (AComparedToC == APFloat::cmpGreaterThan) {
      // z = cc + aa + c + a;
      Status |= z.add(c, RM);
      Status |= z.add(a, RM);
    } else {
      // z = cc + aa + a + c;
      Status |= z.add(a, RM);
      Status |= z.add(c, RM);
    }
    // Still not finite after reordering: that is the result.
    if (!z.isFinite()) {
      Floats[0] = std::move(z);
      Floats[1].makeZero(/* Neg = */ false);
      return (opStatus)Status;
    }
    Floats[0] = z;
    // zz = aa + cc
    APFloat zz = aa;
    Status |= zz.add(cc, RM);
    if (AComparedToC == APFloat::cmpGreaterThan) {
      // Floats[1] = a - z + c + zz;
      Floats[1] = a;
      Status |= Floats[1].subtract(z, RM);
      Status |= Floats[1].add(c, RM);
      Status |= Floats[1].add(zz, RM);
    } else {
      // Floats[1] = c - z + a + zz;
      Floats[1] = c;
      Status |= Floats[1].subtract(z, RM);
      Status |= Floats[1].add(a, RM);
      Status |= Floats[1].add(zz, RM);
    }
  } else {
    // q = a - z;
    APFloat q = a;
    Status |= q.subtract(z, RM);

    // zz = q + c + (a - (q + z)) + aa + cc;
    // Compute a - (q + z) as -((q + z) - a) to avoid temporary copies.
    auto zz = q;
    Status |= zz.add(c, RM);
    Status |= q.add(z, RM);
    Status |= q.subtract(a, RM);
    q.changeSign();
    Status |= zz.add(q, RM);
    Status |= zz.add(aa, RM);
    Status |= zz.add(cc, RM);
    // The correction term is +0: z alone is the result.
    // NOTE(review): this path returns opOK and drops whatever was accumulated
    // in Status -- confirm that is intentional.
    if (zz.isZero() && !zz.isNegative()) {
      Floats[0] = std::move(z);
      Floats[1].makeZero(/* Neg = */ false);
      return opOK;
    }
    // Floats[0] = z + zz
    Floats[0] = z;
    Status |= Floats[0].add(zz, RM);
    if (!Floats[0].isFinite()) {
      Floats[1].makeZero(/* Neg = */ false);
      return (opStatus)Status;
    }
    // Floats[1] = z - Floats[0] + zz
    Floats[1] = std::move(z);
    Status |= Floats[1].subtract(Floats[0], RM);
    Status |= Floats[1].add(zz, RM);
  }
  return (opStatus)Status;
}


/// Computes LHS + RHS into \p Out, handling NaN, zero and infinity operands
/// before delegating the normal + normal case to addImpl.
///
/// \p Out may be the same object as \p LHS (add() calls it that way). That is
/// safe because every category is read before \p Out is written, and each
/// special-case write is followed immediately by a return.
///
/// \returns opInvalidOp for infinities of opposite sign (result is NaN), opOK
/// for every other special case, and addImpl's status otherwise.
APFloat::opStatus DoubleAPFloat::addWithSpecial(const DoubleAPFloat &LHS,
                                                const DoubleAPFloat &RHS,
                                                DoubleAPFloat &Out,
                                                roundingMode RM) {
  const auto LHSCat = LHS.getCategory();
  const auto RHSCat = RHS.getCategory();

  // A NaN operand is propagated as-is; LHS wins when both are NaN.
  if (LHSCat == fcNaN || RHSCat == fcNaN) {
    Out = LHSCat == fcNaN ? LHS : RHS;
    return opOK;
  }

  // Adding zero yields the other operand; a zero LHS is checked first.
  if (LHSCat == fcZero || RHSCat == fcZero) {
    Out = LHSCat == fcZero ? RHS : LHS;
    return opOK;
  }

  const bool LHSIsInf = LHSCat == fcInfinity;
  const bool RHSIsInf = RHSCat == fcInfinity;

  // Infinities of opposite sign cancel into NaN.
  if (LHSIsInf && RHSIsInf && LHS.isNegative() != RHS.isNegative()) {
    Out.makeNaN(false, Out.isNegative(), nullptr);
    return opInvalidOp;
  }

  // Any remaining infinity dominates; LHS wins when both are infinite.
  if (LHSIsInf || RHSIsInf) {
    Out = LHSIsInf ? LHS : RHS;
    return opOK;
  }

  assert(LHS.getCategory() == fcNormal && RHS.getCategory() == fcNormal);

  // Copy the components so addImpl may overwrite Out even when it aliases an
  // operand.
  APFloat A(LHS.Floats[0]), AA(LHS.Floats[1]), C(RHS.Floats[0]),
      CC(RHS.Floats[1]);
  assert(&A.getSemantics() == &APFloatBase::semIEEEdouble);
  assert(&AA.getSemantics() == &APFloatBase::semIEEEdouble);
  assert(&C.getSemantics() == &APFloatBase::semIEEEdouble);
  assert(&CC.getSemantics() == &APFloatBase::semIEEEdouble);
  assert(&Out.Floats[0].getSemantics() == &APFloatBase::semIEEEdouble);
  assert(&Out.Floats[1].getSemantics() == &APFloatBase::semIEEEdouble);
  return Out.addImpl(A, AA, C, CC, RM);
}


/// In-place addition: *this += RHS using rounding mode \p RM. Delegates to
/// addWithSpecial with *this as both the left operand and the output.
APFloat::opStatus DoubleAPFloat::add(const DoubleAPFloat &RHS,
                                     roundingMode RM) {
  DoubleAPFloat &Self = *this;
  return addWithSpecial(Self, RHS, Self, RM);
}


/// In-place subtraction: *this -= RHS using rounding mode \p RM.
///
/// Implemented as -((-*this) + RHS): the sign of *this is flipped, RHS is
/// added, and the sign is flipped back.
///
/// \returns the status reported by the underlying add().
APFloat::opStatus DoubleAPFloat::subtract(const DoubleAPFloat &RHS,
                                          roundingMode RM) {
  // The sign-flip trick below mutates *this before reading RHS. If RHS is the
  // same object (X.subtract(X)), RHS would be negated too and the result
  // would be 2*X rather than X - X. Work from a snapshot in that case.
  if (this == &RHS) {
    const DoubleAPFloat RHSCopy(RHS);
    return subtract(RHSCopy, RM);
  }

  changeSign();
  auto Ret = add(RHS, RM);
  changeSign();
  return Ret;
}


/// In-place multiplication: *this *= RHS using rounding mode \p RM.
///
/// Special operands are resolved first:
///  - a NaN operand is propagated unchanged (LHS wins if both are NaN);
///  - zero * infinity produces NaN and reports opInvalidOp, matching how
///    addWithSpecial reports infinity - infinity;
///  - any other product involving a zero is a zero, and any other product
///    involving an infinity is an infinity; in both cases the result is
///    negative exactly when the operand signs differ.
///
/// The normal * normal case follows the doubled-precision scheme cited on
/// addImpl.
///
/// \returns the bitwise OR of the statuses of the component operations, or
/// the special-case status described above.
APFloat::opStatus DoubleAPFloat::multiply(const DoubleAPFloat &RHS,
                                          APFloat::roundingMode RM) {
  const auto &LHS = *this;
  auto &Out = *this;
  /* Interesting observation: For special categories, finding the lowest
     common ancestor of the following layered graph gives the correct
     return category:

        NaN
       /   \
     Zero  Inf
       \   /
       Normal

     e.g. NaN * NaN = NaN
          Zero * Inf = NaN
          Normal * Zero = Zero
          Normal * Inf = Inf
  */
  // Out aliases LHS (and possibly RHS), so read everything needed from the
  // operands before Out is written.
  const auto LHSCat = LHS.getCategory();
  const auto RHSCat = RHS.getCategory();
  if (LHSCat == fcNaN) {
    Out = LHS;
    return opOK;
  }
  if (RHSCat == fcNaN) {
    Out = RHS;
    return opOK;
  }
  if ((LHSCat == fcZero && RHSCat == fcInfinity) ||
      (LHSCat == fcInfinity && RHSCat == fcZero)) {
    Out.makeNaN(false, false, nullptr);
    return opInvalidOp;
  }

  // The sign of a product is the XOR of the operand signs. Copying one
  // operand wholesale would ignore the other operand's sign (e.g. it would
  // make -2 * +inf positive).
  const bool ProductIsNegative = LHS.isNegative() != RHS.isNegative();
  if (LHSCat == fcZero || RHSCat == fcZero) {
    Out.makeZero(ProductIsNegative);
    return opOK;
  }
  if (LHSCat == fcInfinity || RHSCat == fcInfinity) {
    Out.makeInf(ProductIsNegative);
    return opOK;
  }
  assert(LHS.getCategory() == fcNormal && RHS.getCategory() == fcNormal &&
         "Special cases not handled exhaustively");

  int Status = opOK;
  // (A, B) is this operand's (high, low) pair; (C, D) is RHS's.
  APFloat A = Floats[0], B = Floats[1], C = RHS.Floats[0], D = RHS.Floats[1];
  // t = a * c
  APFloat T = A;
  Status |= T.multiply(C, RM);
  // A zero or non-finite high product is the whole result.
  if (!T.isFiniteNonZero()) {
    Floats[0] = T;
    Floats[1].makeZero(/* Neg = */ false);
    return (opStatus)Status;
  }

  // tau = fmsub(a, c, t), that is -fmadd(-a, c, t).
  APFloat Tau = A;
  T.changeSign();
  Status |= Tau.fusedMultiplyAdd(C, T, RM);
  T.changeSign();
  {
    // v = a * d
    APFloat V = A;
    Status |= V.multiply(D, RM);
    // w = b * c
    APFloat W = B;
    Status |= W.multiply(C, RM);
    Status |= V.add(W, RM);
    // tau += v + w
    Status |= Tau.add(V, RM);
  }
  // u = t + tau
  APFloat U = T;
  Status |= U.add(Tau, RM);

  Floats[0] = U;
  if (!U.isFinite()) {
    Floats[1].makeZero(/* Neg = */ false);
  } else {
    // Floats[1] = (t - u) + tau
    Status |= T.subtract(U, RM);
    Status |= T.add(Tau, RM);
    Floats[1] = T;
  }
  return (opStatus)Status;
}


/// In-place division: *this /= RHS using rounding mode \p RM.
///
/// Both operands are reinterpreted bit-for-bit as semPPCDoubleDoubleLegacy
/// values, divided there, and the quotient's bits are stored back into *this.
APFloat::opStatus DoubleAPFloat::divide(const DoubleAPFloat &RHS,
                                        APFloat::roundingMode RM) {
  assert(Semantics == &APFloatBase::semPPCDoubleDouble &&
         "Unexpected Semantics");
  const fltSemantics &Legacy = APFloatBase::semPPCDoubleDoubleLegacy;

  APFloat Quotient(Legacy, bitcastToAPInt());
  const APFloat Divisor(Legacy, RHS.bitcastToAPInt());
  const auto Status = Quotient.divide(Divisor, RM);

  *this =
      DoubleAPFloat(APFloatBase::semPPCDoubleDouble, Quotient.bitcastToAPInt());
  return Status;
}


/// In-place remainder of *this with respect to \p RHS.
///
/// Both operands are reinterpreted bit-for-bit as semPPCDoubleDoubleLegacy
/// values, APFloat::remainder is applied there, and the result's bits are
/// stored back into *this.
APFloat::opStatus DoubleAPFloat::remainder(const DoubleAPFloat &RHS) {
  assert(Semantics == &APFloatBase::semPPCDoubleDouble &&
         "Unexpected Semantics");
  const fltSemantics &Legacy = APFloatBase::semPPCDoubleDoubleLegacy;

  APFloat Result(Legacy, bitcastToAPInt());
  const APFloat Divisor(Legacy, RHS.bitcastToAPInt());
  const auto Status = Result.remainder(Divisor);

  *this =
      DoubleAPFloat(APFloatBase::semPPCDoubleDouble, Result.bitcastToAPInt());
  return Status;
}


/// In-place modulo of *this with respect to \p RHS.
///
/// Both operands are reinterpreted bit-for-bit as semPPCDoubleDoubleLegacy
/// values, APFloat::mod is applied there, and the result's bits are stored
/// back into *this.
APFloat::opStatus DoubleAPFloat::mod(const DoubleAPFloat &RHS) {
  assert(Semantics == &APFloatBase::semPPCDoubleDouble &&
         "Unexpected Semantics");
  const fltSemantics &Legacy = APFloatBase::semPPCDoubleDoubleLegacy;

  APFloat Result(Legacy, bitcastToAPInt());
  const APFloat Divisor(Legacy, RHS.bitcastToAPInt());
  const auto Status = Result.mod(Divisor);

  *this =
      DoubleAPFloat(APFloatBase::semPPCDoubleDouble, Result.bitcastToAPInt());
  return Status;
}


/// In-place fused multiply-add: *this = *this * Multiplicand + Addend, using
/// rounding mode \p RM.
///
/// All three operands are reinterpreted bit-for-bit as
/// semPPCDoubleDoubleLegacy values, the operation is performed there, and the
/// result's bits are stored back into *this.
APFloat::opStatus
DoubleAPFloat::fusedMultiplyAdd(const DoubleAPFloat &Multiplicand,
                                const DoubleAPFloat &Addend,
                                APFloat::roundingMode RM) {
  assert(Semantics == &APFloatBase::semPPCDoubleDouble &&
         "Unexpected Semantics");
  const fltSemantics &Legacy = APFloatBase::semPPCDoubleDoubleLegacy;

  APFloat Result(Legacy, bitcastToAPInt());
  const APFloat LegacyMultiplicand(Legacy, Multiplicand.bitcastToAPInt());
  const APFloat LegacyAddend(Legacy, Addend.bitcastToAPInt());
  const auto Status =
      Result.fusedMultiplyAdd(LegacyMultiplicand, LegacyAddend, RM);

  *this =
      DoubleAPFloat(APFloatBase::semPPCDoubleDouble, Result.bitcastToAPInt());
  return Status;
}


/// Rounds this double-double to an integral value in place, using rounding
/// mode \p RM.
///
/// \returns the status of rounding the high component when the result is
/// determined by it (non-finite or zero Hi, zero Lo, or non-integral Hi);
/// otherwise the status of rounding the low component.
APFloat::opStatus DoubleAPFloat::roundToIntegral(APFloat::roundingMode RM) {
  assert(Semantics == &APFloatBase::semPPCDoubleDouble &&
         "Unexpected Semantics");
  const APFloat &Hi = getFirst();
  const APFloat &Lo = getSecond();

  // Round a copy of Hi: the original is still needed for comparisons below.
  APFloat RoundedHi = Hi;
  const opStatus HiStatus = RoundedHi.roundToIntegral(RM);

  // We can reduce the problem to just the high part if the input:
  // 1. Represents a non-finite value.
  // 2. Has a component which is zero.
  if (!Hi.isFiniteNonZero() || Lo.isZero()) {
    Floats[0] = std::move(RoundedHi);
    Floats[1].makeZero(/*Neg=*/false);
    return HiStatus;
  }

  // Adjust `Rounded` in the direction of `TieBreaker` if `ToRound` was at a
  // halfway point.
  auto RoundToNearestHelper = [](APFloat ToRound, APFloat Rounded,
                                 APFloat TieBreaker) {
    // RoundingError tells us which direction we rounded:
    //   - RoundingError > 0: we rounded up.
    //   - RoundingError < 0: we rounded down.
    // Sterbenz' lemma ensures that RoundingError is exact.
    const APFloat RoundingError = Rounded - ToRound;
    // Only step when the tie was broken away from the side TieBreaker points
    // to; the step is one unit in TieBreaker's direction.
    if (TieBreaker.isNonZero() &&
        TieBreaker.isNegative() != RoundingError.isNegative() &&
        abs(RoundingError).isExactlyValue(0.5))
      Rounded.add(
          APFloat::getOne(Rounded.getSemantics(), TieBreaker.isNegative()),
          rmNearestTiesToEven);
    return Rounded;
  };

  // Case 1: Hi is not an integer.
  // Special cases are for rounding modes that are sensitive to ties.
  if (RoundedHi != Hi) {
    // We need to consider the case where Hi was between two integers and the
    // rounding mode broke the tie when, in fact, Lo may have had a different
    // sign than Hi.
    if (RM == rmNearestTiesToAway || RM == rmNearestTiesToEven)
      RoundedHi = RoundToNearestHelper(Hi, RoundedHi, Lo);

    Floats[0] = std::move(RoundedHi);
    Floats[1].makeZero(/*Neg=*/false);
    return HiStatus;
  }

  // Case 2: Hi is an integer.
  // Special cases are for rounding modes which are rounding towards or away from zero.
  RoundingMode LoRoundingMode;
  if (RM == rmTowardZero)
    // When our input is positive, we want the Lo component rounded toward
    // negative infinity to get the smallest result magnitude. Likewise,
    // negative inputs want the Lo component rounded toward positive infinity.
    LoRoundingMode = isNegative() ? rmTowardPositive : rmTowardNegative;
  else
    LoRoundingMode = RM;

  APFloat RoundedLo = Lo;
  const opStatus LoStatus = RoundedLo.roundToIntegral(LoRoundingMode);
  if (LoRoundingMode == rmNearestTiesToAway)
    // We need to consider the case where Lo was between two integers and the
    // rounding mode broke the tie when, in fact, Hi may have had a different
    // sign than Lo.
    RoundedLo = RoundToNearestHelper(Lo, RoundedLo, Hi);

  // We must ensure that the final result has no overlap between the two APFloat values.
  std::tie(RoundedHi, RoundedLo) = fastTwoSum(RoundedHi, RoundedLo);

  Floats[0] = std::move(RoundedHi);
  Floats[1] = std::move(RoundedLo);
  return LoStatus;
}


/// Flips the sign of both components.
void DoubleAPFloat::changeSign() {
  for (unsigned Idx = 0; Idx != 2; ++Idx)
    Floats[Idx].changeSign();
}


/// Compares |*this| with |RHS|.
///
/// The high components decide unless their magnitudes are equal. In that case
/// the low components act as corrections: a low part with the same sign as
/// its high part enlarges the magnitude (Hi+|Lo|), one with the opposite sign
/// shrinks it (Hi-|Lo|).
APFloat::cmpResult
DoubleAPFloat::compareAbsoluteValue(const DoubleAPFloat &RHS) const {
  const APFloat &ThisHi = Floats[0];
  const APFloat &ThisLo = Floats[1];
  const APFloat &OtherHi = RHS.Floats[0];
  const APFloat &OtherLo = RHS.Floats[1];

  // The high parts dominate whenever their magnitudes differ.
  const cmpResult HiOrder = ThisHi.compareAbsoluteValue(OtherHi);
  if (HiOrder != cmpEqual)
    return HiOrder;

  // From here on |this->Hi| == |RHS.Hi|.
  const bool ThisLoIsZero = ThisLo.isZero();
  const bool OtherLoIsZero = OtherLo.isZero();

  // Two zero low parts are equal regardless of their signs.
  if (ThisLoIsZero && OtherLoIsZero)
    return cmpEqual;

  // "Shrinks" means Hi and Lo have opposite signs, so |Hi+Lo| = |Hi|-|Lo|.
  const bool ThisShrinks = ThisHi.isNegative() != ThisLo.isNegative();
  const bool OtherShrinks = OtherHi.isNegative() != OtherLo.isNegative();

  // Only RHS has a correction: |Hi| vs. |Hi| -/+ |RHS.Lo|.
  if (ThisLoIsZero)
    return OtherShrinks ? cmpGreaterThan : cmpLessThan;

  // Either only 'this' has a correction, or the two corrections pull in
  // opposite directions. In both situations the direction of 'this' decides.
  if (OtherLoIsZero || ThisShrinks != OtherShrinks)
    return ThisShrinks ? cmpLessThan : cmpGreaterThan;

  // Both corrections pull the same way, so their magnitudes decide.
  const cmpResult LoOrder = ThisLo.compareAbsoluteValue(OtherLo);
  if (!ThisShrinks)
    return LoOrder;

  // Both shrink: the larger |Lo| yields the smaller overall magnitude.
  switch (LoOrder) {
  case cmpLessThan:
    return cmpGreaterThan;
  case cmpGreaterThan:
    return cmpLessThan;
  default:
    return LoOrder;
  }
}


/// The category of a double-double is the category of its first component.
APFloat::fltCategory DoubleAPFloat::getCategory() const {
  const APFloat &Hi = Floats[0];
  return Hi.getCategory();
}


bool DoubleAPFloat::isNegative() const { return Floats[0].isNegative(); }


void DoubleAPFloat::makeInf(bool Neg) {

  Floats[0].makeInf(Neg);

  Floats[1].makeZero(/* Neg = */ false);

}


void DoubleAPFloat::makeZero(bool Neg) {

  Floats[0].makeZero(Neg);

  Floats[1].makeZero(/* Neg = */ false);

}


/// Sets this value to the fixed pair of IEEE-double bit patterns below and
/// negates both components when \p Neg is true.
void DoubleAPFloat::makeLargest(bool Neg) {
  assert(Semantics == &APFloatBase::semPPCDoubleDouble &&
         "Unexpected Semantics");
  // Raw IEEE-double encodings of the two components.
  const uint64_t HiBits = 0x7fefffffffffffffull;
  const uint64_t LoBits = 0x7c8ffffffffffffeull;

  Floats[0] = APFloat(APFloatBase::semIEEEdouble, APInt(64, HiBits));
  Floats[1] = APFloat(APFloatBase::semIEEEdouble, APInt(64, LoBits));

  if (!Neg)
    return;
  changeSign();
}


void DoubleAPFloat::makeSmallest(bool Neg) {

  assert(Semantics == &APFloatBase::semPPCDoubleDouble &&

         "Unexpected Semantics");

  Floats[0].makeSmallest(Neg);

  Floats[1].makeZero(/* Neg = */ false);

}


void DoubleAPFloat::makeSmallestNormalized(bool Neg) {

  assert(Semantics == &APFloatBase::semPPCDoubleDouble &&

         "Unexpected Semantics");

  Floats[0] =

      APFloat(APFloatBase::semIEEEdouble, APInt(64, 0x0360000000000000ull));

  if (Neg)

    Floats[0].changeSign();

  Floats[1].makeZero(/* Neg = */ false);

}


void DoubleAPFloat::makeNaN(bool SNaN, bool Neg, const APInt *fill) {

  Floats[0].makeNaN(SNaN, Neg, fill);

  Floats[1].makeZero(/* Neg = */ false);

}


/// Lexicographic comparison: the first components decide unless they compare
/// equal, in which case the second components decide.
APFloat::cmpResult DoubleAPFloat::compare(const DoubleAPFloat &RHS) const {
  const auto HiOrder = Floats[0].compare(RHS.Floats[0]);
  // |Float[0]| > |Float[1]|
  if (HiOrder != APFloat::cmpEqual)
    return HiOrder;
  return Floats[1].compare(RHS.Floats[1]);
}


/// Returns true when both components are bitwise equal to the corresponding
/// components of \p RHS.
bool DoubleAPFloat::bitwiseIsEqual(const DoubleAPFloat &RHS) const {
  if (!Floats[0].bitwiseIsEqual(RHS.Floats[0]))
    return false;
  return Floats[1].bitwiseIsEqual(RHS.Floats[1]);
}


/// Hashes a double-double by combining the hashes of its two components. An
/// object without components (null Floats, as left behind by the move
/// constructor) hashes its Semantics pointer instead.
hash_code hash_value(const DoubleAPFloat &Arg) {
  if (!Arg.Floats)
    return hash_combine(Arg.Semantics);

  const hash_code HiHash = hash_value(Arg.Floats[0]);
  const hash_code LoHash = hash_value(Arg.Floats[1]);
  return hash_combine(HiHash, LoHash);
}


/// Returns the 128-bit pattern of this value: raw word 0 holds the bits of
/// the first component and raw word 1 the bits of the second.
APInt DoubleAPFloat::bitcastToAPInt() const {
  assert(Semantics == &APFloatBase::semPPCDoubleDouble &&
         "Unexpected Semantics");
  const uint64_t HiWord = Floats[0].bitcastToAPInt().getRawData()[0];
  const uint64_t LoWord = Floats[1].bitcastToAPInt().getRawData()[0];

  uint64_t Words[] = {HiWord, LoWord};
  return APInt(128, Words);
}


/// Parses \p S with rounding mode \p RM into this value.
///
/// Parsing is done on a semPPCDoubleDoubleLegacy temporary whose bits are
/// then stored into *this. The store happens whatever the parse returned.
Expected<APFloat::opStatus> DoubleAPFloat::convertFromString(StringRef S,
                                                             roundingMode RM) {
  assert(Semantics == &APFloatBase::semPPCDoubleDouble &&
         "Unexpected Semantics");
  APFloat Parsed(APFloatBase::semPPCDoubleDoubleLegacy);
  auto Status = Parsed.convertFromString(S, RM);

  *this =
      DoubleAPFloat(APFloatBase::semPPCDoubleDouble, Parsed.bitcastToAPInt());
  return Status;
}


// The double-double lattice of values corresponds to numbers which obey:
// - abs(lo) <= 1/2 * ulp(hi)
// - roundTiesToEven(hi + lo) == hi
//
// nextUp must choose the smallest output > input that follows these rules.
// nextDown must choose the largest output < input that follows these rules.
//
// Steps this value in place to the adjacent lattice value: upwards when
// nextDown is false, downwards when it is true. Returns opInvalidOp when the
// input is a signaling NaN (which is replaced by a quiet NaN) and opOK
// otherwise.
APFloat::opStatus DoubleAPFloat::next(bool nextDown) {
  assert(Semantics == &APFloatBase::semPPCDoubleDouble &&
         "Unexpected Semantics");
  // nextDown(x) = -nextUp(-x)
  if (nextDown) {
    changeSign();
    APFloat::opStatus Result = next(/*nextDown=*/false);
    changeSign();
    return Result;
  }
  switch (getCategory()) {
  case fcInfinity:
    // nextUp(+inf) = +inf
    // nextUp(-inf) = -getLargest()
    if (isNegative())
      makeLargest(true);
    return opOK;

  case fcNaN:
    // IEEE-754R 2008 6.2 Par 2: nextUp(sNaN) = qNaN. Set Invalid flag.
    // IEEE-754R 2008 6.2: nextUp(qNaN) = qNaN. Must be identity so we do not
    //                     change the payload.
    if (getFirst().isSignaling()) {
      // For consistency, propagate the sign of the sNaN to the qNaN.
      makeNaN(false, isNegative(), nullptr);
      return opInvalidOp;
    }
    return opOK;

  case fcZero:
    // nextUp(pm 0) = +getSmallest()
    makeSmallest(false);
    return opOK;

  case fcNormal:
    break;
  }

  const APFloat &HiOld = getFirst();
  const APFloat &LoOld = getSecond();

  // First candidate: keep Hi and step only the low component upwards.
  APFloat NextLo = LoOld;
  NextLo.next(/*nextDown=*/false);

  // We want to admit values where:
  // 1. abs(Lo) <= ulp(Hi)/2
  // 2. Hi == RTNE(Hi + lo)
  auto InLattice = [](const APFloat &Hi, const APFloat &Lo) {
    return Hi + Lo == Hi;
  };

  // Check if (HiOld, nextUp(LoOld)) is in the lattice.
  if (InLattice(HiOld, NextLo)) {
    // Yes, the result is (HiOld, nextUp(LoOld)).
    Floats[1] = std::move(NextLo);

    // TODO: Because we currently rely on semPPCDoubleDoubleLegacy, our maximum
    // value is defined to have exactly 106 bits of precision. This limitation
    // results in semPPCDoubleDouble being unable to reach its maximum canonical
    // value.
    DoubleAPFloat Largest{*Semantics, uninitialized};
    Largest.makeLargest(/*Neg=*/false);
    // Anything beyond makeLargest() is treated as having overflowed.
    if (compare(Largest) == cmpGreaterThan)
      makeInf(/*Neg=*/false);

    return opOK;
  }

  // Now we need to handle the cases where (HiOld, nextUp(LoOld)) is not the
  // correct result. We know the new hi component will be nextUp(HiOld) but our
  // lattice rules make it a little ambiguous what the correct NextLo must be.
  APFloat NextHi = HiOld;
  NextHi.next(/*nextDown=*/false);

  // nextUp(getLargest()) == INFINITY
  if (NextHi.isInfinity()) {
    makeInf(/*Neg=*/false);
    return opOK;
  }

  // IEEE 754-2019 5.3.1:
  // "If x is the negative number of least magnitude in x's format, nextUp(x) is
  // -0."
  if (NextHi.isZero()) {
    makeZero(/*Neg=*/true);
    return opOK;
  }

  // abs(NextLo) must be <= ulp(NextHi)/2. We want NextLo to be as close to
  // negative infinity as possible.
  NextLo = neg(scalbn(harrisonUlp(NextHi), -1, rmTowardZero));
  if (!InLattice(NextHi, NextLo))
    // RTNE may mean that Lo must be < ulp(NextHi) / 2 so we bump NextLo.
    NextLo.next(/*nextDown=*/false);

  Floats[0] = std::move(NextHi);
  Floats[1] = std::move(NextLo);

  return opOK;
}


/// Converts this double-double to a \p Width-bit integer written into
/// \p Input, rounding with \p RM.
///
/// \param Input    destination words.
/// \param Width    bit width of the destination integer.
/// \param IsSigned whether the destination is a signed integer.
/// \param RM       rounding mode used to make the value integral.
/// \param IsExact  set to whether the conversion was exact; it is written
///                 unconditionally, so it must not be null.
/// \returns opInvalidOp when the value cannot be represented; otherwise the
/// status of the underlying conversion or rounding, as noted on each path.
APFloat::opStatus DoubleAPFloat::convertToSignExtendedInteger(
    MutableArrayRef<integerPart> Input, unsigned int Width, bool IsSigned,
    roundingMode RM, bool *IsExact) const {
  assert(Semantics == &APFloatBase::semPPCDoubleDouble &&
         "Unexpected Semantics");

  // If Hi is not finite, or Lo is zero, the value is entirely represented
  // by Hi. Delegate to the simpler single-APFloat conversion.
  if (!getFirst().isFiniteNonZero() || getSecond().isZero())
    return getFirst().convertToInteger(Input, Width, IsSigned, RM, IsExact);

  // First, round the full double-double value to an integral value. This
  // simplifies the rest of the function, as we no longer need to consider
  // fractional parts.
  *IsExact = false;
  DoubleAPFloat Integral = *this;
  const opStatus RoundStatus = Integral.roundToIntegral(RM);
  if (RoundStatus == opInvalidOp)
    return opInvalidOp;
  const APFloat &IntegralHi = Integral.getFirst();
  const APFloat &IntegralLo = Integral.getSecond();

  // If rounding results in either component being zero, the sum is trivial.
  // Delegate to the simpler single-APFloat conversion.
  bool HiIsExact;
  if (IntegralHi.isZero() || IntegralLo.isZero()) {
    const opStatus HiStatus =
        IntegralHi.convertToInteger(Input, Width, IsSigned, RM, &HiIsExact);
    // The conversion from an integer-valued float to an APInt may fail if the
    // result would be out of range.  Regardless, taking this path is only
    // possible if rounding occurred during the initial `roundToIntegral`.
    return HiStatus == opOK ? opInexact : HiStatus;
  }

  // A negative number cannot be represented by an unsigned integer.
  // Since a double-double is canonical, if Hi is negative, the sum is negative.
  if (!IsSigned && IntegralHi.isNegative())
    return opInvalidOp;

  // Handle the special boundary case where |Hi| is exactly the power of two
  // that marks the edge of the integer's range (e.g., 2^63 for int64_t). In
  // this situation, Hi itself won't fit, but the sum Hi + Lo might.
  // `PositiveOverflowWidth` is the bit number for this boundary (N-1 for
  // signed, N for unsigned).
  bool LoIsExact;
  const int HiExactLog2 = IntegralHi.getExactLog2Abs();
  const unsigned PositiveOverflowWidth = IsSigned ? Width - 1 : Width;
  if (HiExactLog2 >= 0 &&
      static_cast<unsigned>(HiExactLog2) == PositiveOverflowWidth) {
    // If Hi and Lo have the same sign, |Hi + Lo| > |Hi|, so the sum is
    // guaranteed to overflow. E.g., for uint128_t, (2^128, 1) overflows.
    if (IntegralHi.isNegative() == IntegralLo.isNegative())
      return opInvalidOp;

    // If the signs differ, the sum will fit. We can compute the result using
    // properties of two's complement arithmetic without a wide intermediate
    // integer. E.g., for uint128_t, (2^128, -1) should be 2^128 - 1.
    const opStatus LoStatus = IntegralLo.convertToInteger(
        Input, Width, /*IsSigned=*/true, RM, &LoIsExact);
    if (LoStatus == opInvalidOp)
      return opInvalidOp;

    // Adjust the bit pattern of Lo to account for Hi's value:
    //  - For unsigned (Hi=2^Width): `2^Width + Lo` in `Width`-bit
    //    arithmetic is equivalent to just `Lo`. The conversion of `Lo` above
    //    already produced the correct final bit pattern.
    //  - For signed (Hi=2^(Width-1)): The sum `2^(Width-1) + Lo` (where Lo<0)
    //    can be computed by taking the two's complement pattern for `Lo` and
    //    clearing the sign bit.
    if (IsSigned && !IntegralHi.isNegative())
      APInt::tcClearBit(Input.data(), PositiveOverflowWidth);
    // Exact only if the initial rounding to integral changed nothing.
    *IsExact = RoundStatus == opOK;
    return RoundStatus;
  }

  // Convert Hi into an integer.  This may not fit but that is OK: we know that
  // Hi + Lo would not fit either in this situation.
  const opStatus HiStatus = IntegralHi.convertToInteger(
      Input, Width, IsSigned, rmTowardZero, &HiIsExact);
  if (HiStatus == opInvalidOp)
    return HiStatus;

  // Convert Lo into a temporary integer of the same width.
  APSInt LoResult{Width, /*isUnsigned=*/!IsSigned};
  const opStatus LoStatus =
      IntegralLo.convertToInteger(LoResult, rmTowardZero, &LoIsExact);
  if (LoStatus == opInvalidOp)
    return LoStatus;

  // Add Lo to Hi. This addition is guaranteed not to overflow because of the
  // double-double canonicalization rule (`|Lo| <= ulp(Hi)/2`). The only case
  // where the sum could cross the integer type's boundary is when Hi is a
  // power of two, which is handled by the special case block above.
  APInt::tcAdd(Input.data(), LoResult.getRawData(), /*carry=*/0, Input.size());

  // Exact only if the initial rounding to integral changed nothing.
  *IsExact = RoundStatus == opOK;
  return RoundStatus;
}


/// Converts this value to a \p Width-bit integer in \p Input by calling
/// convertToSignExtendedInteger.
///
/// When that reports opInvalidOp, \p Input is overwritten with a fallback
/// value: zero for NaN, otherwise the low (Width - IsSigned) bits set for
/// non-negative values, and for negative values a single low bit (signed
/// only) that is then shifted up to bit Width - 1.
///
/// \returns the status from convertToSignExtendedInteger.
APFloat::opStatus
DoubleAPFloat::convertToInteger(MutableArrayRef<integerPart> Input,
                                unsigned int Width, bool IsSigned,
                                roundingMode RM, bool *IsExact) const {
  const opStatus FS =
      convertToSignExtendedInteger(Input, Width, IsSigned, RM, IsExact);
  if (FS != opInvalidOp)
    return FS;

  const unsigned DstPartsCount = partCountForBits(Width);
  assert(DstPartsCount <= Input.size() && "Integer too big");

  const bool Negative = isNegative();

  // Number of low bits to set in the fallback pattern.
  unsigned Bits = 0;
  if (getCategory() != fcNaN)
    Bits = Negative ? IsSigned : Width - IsSigned;

  tcSetLeastSignificantBits(Input.data(), DstPartsCount, Bits);
  // For signed negative values, move the single set bit into the sign
  // position.
  if (Negative && IsSigned)
    APInt::tcShiftLeft(Input.data(), DstPartsCount, Width - 1);

  return FS;
}


/// Replace this value with the result of an overflow under rounding mode
/// \p RM, keeping the sign the object currently has.
///
/// Depending on \p RM and the current sign, the value becomes either an
/// infinity or the largest finite value:
///   - rmTowardZero:      always the largest finite value.
///   - rmTowardNegative:  -infinity if negative, else +largest.
///   - rmTowardPositive:  -largest if negative, else +infinity.
///   - nearest modes:     infinity.
///
/// \returns opInexact, with opOverflow added when the high component ended up
///          non-finite.
APFloat::opStatus DoubleAPFloat::handleOverflow(roundingMode RM) {
  // Capture the sign before the value is overwritten.
  const bool Neg = isNegative();

  bool SaturateToInfinity = false;
  switch (RM) {
  case APFloat::rmTowardZero:
    SaturateToInfinity = false;
    break;
  case APFloat::rmTowardNegative:
    SaturateToInfinity = Neg;
    break;
  case APFloat::rmTowardPositive:
    SaturateToInfinity = !Neg;
    break;
  case APFloat::rmNearestTiesToAway:
  case APFloat::rmNearestTiesToEven:
    SaturateToInfinity = true;
    break;
  default:
    llvm_unreachable("Invalid rounding mode found");
  }

  if (SaturateToInfinity)
    makeInf(/*Neg=*/Neg);
  else
    makeLargest(/*Neg=*/Neg);

  // Overflow is only flagged when the result is not finite.
  return getFirst().isFinite()
             ? opInexact
             : static_cast<opStatus>(opInexact | opOverflow);
}


/// Set this value from the unsigned multi-word integer \p Src.
///
/// The conversion proceeds in stages: Hi is the round-to-nearest-even
/// approximation of the integer, the exact integer difference between the
/// source and Hi is converted into Lo (with a rounding mode derived from
/// \p RM), and the pair is renormalized with fastTwoSum().
///
/// \param Src      words of the source integer, interpreted as unsigned.
/// \param SrcCount number of words in \p Src.
/// \param RM       requested rounding mode.
/// \returns opOK for a zero source, the result of handleOverflow() when the
///          value does not fit, and otherwise the status of converting the
///          error term into Lo.
APFloat::opStatus DoubleAPFloat::convertFromUnsignedParts(
    const integerPart *Src, unsigned int SrcCount, roundingMode RM) {
  // Find the most significant bit of the source integer. APInt::tcMSB returns
  // UINT_MAX for a zero value.
  const unsigned SrcMSB = APInt::tcMSB(Src, SrcCount);
  if (SrcMSB == UINT_MAX) {
    // The source integer is 0.
    makeZero(/*Neg=*/false);
    return opOK;
  }

  // Create a minimally-sized APInt to represent the source value.
  const unsigned SrcBitWidth = SrcMSB + 1;
  APSInt SrcInt{APInt{/*numBits=*/SrcBitWidth, ArrayRef(Src, SrcCount)},
                /*isUnsigned=*/true};

  // Stage 1: Initial Approximation.
  // Convert the source integer SrcInt to the Hi part of the DoubleAPFloat.
  // We use round-to-nearest because it minimizes the initial error, which is
  // crucial for the subsequent steps.
  APFloat Hi{getFirst().getSemantics()};
  Hi.convertFromAPInt(SrcInt, /*IsSigned=*/false, rmNearestTiesToEven);

  // If the first approximation already overflows, the number is too large.
  // NOTE: The underlying semantics are *more* conservative when choosing to
  // overflow because their notion of ULP is much larger. As such, it is always
  // safe to overflow at the DoubleAPFloat level if the APFloat overflows.
  // NOTE(review): handleOverflow() picks its result from isNegative() of
  // *this, which has not been assigned yet at this point and so still holds
  // whatever value the object had before the call -- confirm that callers
  // always arrive here with a non-negative value.
  if (!Hi.isFinite())
    return handleOverflow(RM);

  // Stage 2: Exact Error Calculation.
  // Calculate the exact error of the first approximation: Error = SrcInt - Hi.
  // This is done by converting Hi back to an integer and subtracting it from
  // the original source.
  bool HiAsIntIsExact;
  // Create an integer representation of Hi. Its width is determined by the
  // exponent of Hi, ensuring it's just large enough for Hi to be represented
  // accurately when converted back to an integer. This width can exceed
  // SrcBitWidth if the conversion to Hi rounded up to a power of two.
  APSInt HiAsInt{static_cast<uint32_t>(ilogb(Hi) + 1), /*isUnsigned=*/true};
  Hi.convertToInteger(HiAsInt, rmNearestTiesToEven, &HiAsIntIsExact);
  const APInt Error = SrcInt.zext(HiAsInt.getBitWidth()) - HiAsInt;

  // Stage 3: Error Approximation and Rounding.
  // Convert the integer error into the Lo part of the DoubleAPFloat. This step
  // captures the remainder of the original number. The rounding mode for this
  // conversion (LoRM) may need to be adjusted from the user-requested RM to
  // ensure the final sum (Hi + Lo) rounds correctly.
  roundingMode LoRM = RM;
  // Adjustments are only necessary when the initial approximation Hi was an
  // overestimate, making the Error negative.
  if (Error.isNegative()) {
    if (RM == rmNearestTiesToAway) {
      // For rmNearestTiesToAway, a tie should round away from zero. Since
      // SrcInt is positive, this means rounding toward +infinity.
      // A standard conversion of a negative Error would round ties toward
      // -infinity, causing the final sum Hi + Lo to be smaller. To
      // counteract this, we detect the tie case and override the rounding
      // mode for Lo to rmTowardPositive.
      const unsigned ErrorActiveBits = Error.getSignificantBits() - 1;
      const unsigned LoPrecision = getSecond().getSemantics().precision;
      if (ErrorActiveBits > LoPrecision) {
        const unsigned RoundingBoundary = ErrorActiveBits - LoPrecision;
        // A tie occurs when the bits to be truncated are of the form 100...0.
        // This is detected by checking if the number of trailing zeros is
        // exactly one less than the number of bits being truncated.
        if (Error.countTrailingZeros() == RoundingBoundary - 1)
          LoRM = rmTowardPositive;
      }
    } else if (RM == rmTowardZero) {
      // For rmTowardZero, the final positive result must be truncated (rounded
      // down). When Hi is an overestimate, Error is negative. A standard
      // rmTowardZero conversion of Error would make it *less* negative,
      // effectively rounding the final sum Hi + Lo *up*. To ensure the sum
      // rounds down correctly, we force Lo to round toward -infinity.
      LoRM = rmTowardNegative;
    }
  }

  APFloat Lo{getSecond().getSemantics()};
  opStatus Status = Lo.convertFromAPInt(Error, /*IsSigned=*/true, LoRM);

  // Renormalize the pair (Hi, Lo) into a canonical DoubleAPFloat form where the
  // components do not overlap. fastTwoSum performs this operation.
  std::tie(Hi, Lo) = fastTwoSum(Hi, Lo);
  Floats[0] = std::move(Hi);
  Floats[1] = std::move(Lo);

  // A final check for overflow is needed because fastTwoSum can cause a
  // carry-out from Lo that pushes Hi to infinity.
  if (!getFirst().isFinite())
    return handleOverflow(RM);

  // The largest DoubleAPFloat must be canonical. Values which are larger are
  // not canonical and are equivalent to overflow.
  if (getFirst().isFiniteNonZero() && Floats[0].isLargest()) {
    DoubleAPFloat Largest{*Semantics};
    Largest.makeLargest(/*Neg=*/false);
    if (compare(Largest) == APFloat::cmpGreaterThan)
      return handleOverflow(RM);
  }

  // The final status of the operation is determined by the conversion of the
  // error term. If Lo could represent Error exactly, the entire conversion
  // is exact. Otherwise, it's inexact.
  return Status;
}


/// Set this value from the integer \p Input, rounding according to \p RM when
/// the integer cannot be represented exactly.
///
/// A negative signed input is handled by converting its magnitude as an
/// unsigned integer and flipping the sign of the result afterwards.
///
/// \param Input    the integer to convert.
/// \param IsSigned whether \p Input is to be interpreted as a signed value.
/// \param RM       requested rounding mode, expressed relative to the real
///                 (signed) value of \p Input.
/// \returns the status reported by convertFromUnsignedParts().
APFloat::opStatus DoubleAPFloat::convertFromAPInt(const APInt &Input,
                                                  bool IsSigned,
                                                  roundingMode RM) {
  const bool NegateInput = IsSigned && Input.isNegative();
  APInt API = Input;
  roundingMode MagnitudeRM = RM;
  if (NegateInput) {
    API.negate();
    // The magnitude is converted as a positive number and negated afterwards.
    // Negation mirrors the number line, so rounding the final (negative)
    // value toward -infinity means rounding its magnitude toward +infinity,
    // and vice versa. Passing RM through unchanged would invert the two
    // directed modes (and pick the wrong saturation value on overflow).
    // rmTowardZero and the round-to-nearest modes are symmetric under
    // negation and need no adjustment.
    if (RM == rmTowardNegative)
      MagnitudeRM = rmTowardPositive;
    else if (RM == rmTowardPositive)
      MagnitudeRM = rmTowardNegative;
  }

  const APFloat::opStatus Status = convertFromUnsignedParts(
      API.getRawData(), API.getNumWords(), MagnitudeRM);
  if (NegateInput)
    changeSign();
  return Status;
}


unsigned int DoubleAPFloat::convertToHexString(char *DST,

                                               unsigned int HexDigits,

                                               bool UpperCase,

                                               roundingMode RM) const {

  assert(Semantics == &APFloatBase::semPPCDoubleDouble &&

         "Unexpected Semantics");

  return APFloat(APFloatBase::semPPCDoubleDoubleLegacy, bitcastToAPInt())

      .convertToHexString(DST, HexDigits, UpperCase, RM);

}


/// Report whether this value is treated as denormal.
///
/// Only values of category fcNormal qualify. Such a value is denormal when
/// either component is denormal, or when adding the two components does not
/// give back the high component.
bool DoubleAPFloat::isDenormal() const {
  if (getCategory() != fcNormal)
    return false;

  if (Floats[0].isDenormal() || Floats[1].isDenormal())
    return true;

  // (double)(Hi + Lo) == Hi defines a normal number.
  return Floats[0] != Floats[0] + Floats[1];
}


bool DoubleAPFloat::isSmallest() const {

  if (getCategory() != fcNormal)

    return false;

  DoubleAPFloat Tmp(*this);

  Tmp.makeSmallest(this->isNegative());

  return Tmp.compare(*this) == cmpEqual;

}


bool DoubleAPFloat::isSmallestNormalized() const {

  if (getCategory() != fcNormal)

    return false;


  DoubleAPFloat Tmp(*this);

  Tmp.makeSmallestNormalized(this->isNegative());

  return Tmp.compare(*this) == cmpEqual;

}


bool DoubleAPFloat::isLargest() const {

  if (getCategory() != fcNormal)

    return false;

  DoubleAPFloat Tmp(*this);

  Tmp.makeLargest(this->isNegative());

  return Tmp.compare(*this) == cmpEqual;

}


/// Report whether both components of this value are integers.
bool DoubleAPFloat::isInteger() const {
  assert(Semantics == &APFloatBase::semPPCDoubleDouble &&
         "Unexpected Semantics");
  // The low component is only consulted when the high one is an integer.
  if (!Floats[0].isInteger())
    return false;
  return Floats[1].isInteger();
}


/// Append a textual rendering of this value to \p Str.
///
/// The value is reinterpreted, via its bit pattern, as an APFloat with the
/// legacy PPC double-double semantics, and all formatting parameters are
/// forwarded unchanged to that object's toString().
void DoubleAPFloat::toString(SmallVectorImpl<char> &Str,
                             unsigned FormatPrecision,
                             unsigned FormatMaxPadding,
                             bool TruncateZero) const {
  assert(Semantics == &APFloatBase::semPPCDoubleDouble &&
         "Unexpected Semantics");
  const APFloat Legacy(APFloatBase::semPPCDoubleDoubleLegacy,
                       bitcastToAPInt());
  Legacy.toString(Str, FormatPrecision, FormatMaxPadding, TruncateZero);
}


/// Return the exact base-2 logarithm of the absolute value, or INT_MIN.
///
/// For Hi + Lo to be a power of two, Hi must be a power of two and Lo must be
/// zero. A non-zero Lo therefore yields INT_MIN immediately; otherwise the
/// answer is whatever the high component reports.
int DoubleAPFloat::getExactLog2Abs() const {
  return getSecond().isNonZero() ? INT_MIN : getFirst().getExactLog2Abs();
}


int ilogb(const DoubleAPFloat &Arg) {

  const APFloat &Hi = Arg.getFirst();

  const APFloat &Lo = Arg.getSecond();

  int IlogbResult = ilogb(Hi);

  // Zero and non-finite values can delegate to ilogb(Hi).

  if (Arg.getCategory() != fcNormal)

    return IlogbResult;

  // If Lo can't change the binade, we can delegate to ilogb(Hi).

  if (Lo.isZero() || Hi.isNegative() == Lo.isNegative())

    return IlogbResult;

  if (Hi.getExactLog2Abs() == INT_MIN)

    return IlogbResult;

  // Numbers of the form 2^a - 2^b or -2^a + 2^b are almost powers of two but

  // get nudged out of the binade by the low component.

  return IlogbResult - 1;

}


/// Scale a double-double value by 2^Exp.
///
/// Each component is scaled independently with the same exponent and rounding
/// mode, and the two results are assembled into a new DoubleAPFloat.
DoubleAPFloat scalbn(const DoubleAPFloat &Arg, int Exp,
                     APFloat::roundingMode RM) {
  assert(Arg.Semantics == &APFloatBase::PPCDoubleDouble() &&
         "Unexpected Semantics");
  APFloat ScaledHigh = scalbn(Arg.Floats[0], Exp, RM);
  APFloat ScaledLow = scalbn(Arg.Floats[1], Exp, RM);
  return DoubleAPFloat(APFloatBase::PPCDoubleDouble(), std::move(ScaledHigh),
                       std::move(ScaledLow));
}


/// Decompose a double-double value into a fraction and a power-of-two
/// exponent.
///
/// \param Arg the value to decompose; must use the PPCDoubleDouble semantics.
/// \param Exp receives the exponent. It is set to 0 for zero and is left at
///            the ilogb() sentinel (IEK_NaN / IEK_Inf) for NaN and infinity.
/// \param RM  rounding mode used when scaling the components.
/// \returns for NaN a copy whose high component has been passed through
///          makeQuiet(); for infinity and zero \p Arg unchanged; otherwise a
///          value built from both components scaled by 2^-Exp.
DoubleAPFloat frexp(const DoubleAPFloat &Arg, int &Exp,
                    APFloat::roundingMode RM) {
  assert(Arg.Semantics == &APFloatBase::PPCDoubleDouble() &&
         "Unexpected Semantics");

  // Get the unbiased exponent e of the number, where |Arg| = m * 2^e for m in
  // [1.0, 2.0).
  Exp = ilogb(Arg);

  // For NaNs, quiet any signaling NaN and return the result, as per standard
  // practice.
  if (Exp == APFloat::IEK_NaN) {
    DoubleAPFloat Quiet{Arg};
    Quiet.getFirst() = Quiet.getFirst().makeQuiet();
    return Quiet;
  }

  // For infinity, return it unchanged. The exponent remains IEK_Inf.
  if (Exp == APFloat::IEK_Inf)
    return Arg;

  // For zero, the fraction is zero and the standard requires the exponent be 0.
  if (Exp == APFloat::IEK_Zero) {
    Exp = 0;
    return Arg;
  }

  const APFloat &Hi = Arg.getFirst();
  const APFloat &Lo = Arg.getSecond();

  // frexp requires the fraction's absolute value to be in [0.5, 1.0).
  // ilogb provides an exponent for an absolute value in [1.0, 2.0).
  // Increment the exponent to ensure the fraction is in the correct range.
  ++Exp;

  const bool SignsDisagree = Hi.isNegative() != Lo.isNegative();
  // Second starts out as an unscaled copy of Lo and is only rescaled when Lo
  // is finite and non-zero.
  APFloat Second = Lo;
  if (Arg.getCategory() == APFloat::fcNormal && Lo.isFiniteNonZero()) {
    roundingMode LoRoundingMode;
    // The interpretation of rmTowardZero depends on the sign of the combined
    // Arg rather than the sign of the component.
    if (RM == rmTowardZero)
      LoRoundingMode = Arg.isNegative() ? rmTowardPositive : rmTowardNegative;
    // For rmNearestTiesToAway, we face a similar problem. If signs disagree,
    // Lo is a correction *toward* zero relative to Hi. Rounding Lo
    // "away from zero" based on its own sign would move the value in the
    // wrong direction. As a safe proxy, we use rmNearestTiesToEven, which is
    // direction-agnostic. We only need to bother with this if Lo is scaled
    // down.
    else if (RM == rmNearestTiesToAway && SignsDisagree && Exp > 0)
      LoRoundingMode = rmNearestTiesToEven;
    else
      LoRoundingMode = RM;
    Second = scalbn(Lo, -Exp, LoRoundingMode);
    // The rmNearestTiesToEven proxy is correct most of the time, but it
    // differs from rmNearestTiesToAway when the scaled value of Lo is an
    // exact midpoint.
    // NOTE: This is morally equivalent to roundTiesTowardZero.
    if (RM == rmNearestTiesToAway && LoRoundingMode == rmNearestTiesToEven) {
      // Re-scale the result back to check if rounding occurred.
      const APFloat RecomposedLo = scalbn(Second, Exp, rmNearestTiesToEven);
      if (RecomposedLo != Lo) {
        // RoundingError tells us which direction we rounded:
        //   - RoundingError > 0: we rounded up.
        //   - RoundingError < 0: we rounded down.
        const APFloat RoundingError = RecomposedLo - Lo;
        // Determine if scalbn(Lo, -Exp) landed exactly on a midpoint.
        // We do this by checking if the absolute rounding error is exactly
        // half a ULP of the result.
        const APFloat UlpOfSecond = harrisonUlp(Second);
        const APFloat ScaledUlpOfSecond =
            scalbn(UlpOfSecond, Exp - 1, rmNearestTiesToEven);
        const bool IsMidpoint = abs(RoundingError) == ScaledUlpOfSecond;
        const bool RoundedLoAway =
            Second.isNegative() == RoundingError.isNegative();
        // The sign of Hi and Lo disagree and we rounded Lo away: we must
        // decrease the magnitude of Second to increase the magnitude of
        // First+Second.
        if (IsMidpoint && RoundedLoAway)
          Second.next(/*nextDown=*/!Second.isNegative());
      }
    }
    // Handle a tricky edge case where Arg is slightly less than a power of two
    // (e.g., Arg = 2^k - epsilon). In this situation:
    // 1. Hi is 2^k, and Lo is a small negative value -epsilon.
    // 2. ilogb(Arg) correctly returns k-1.
    // 3. Our initial Exp becomes (k-1) + 1 = k.
    // 4. Scaling Hi (2^k) by 2^-k would yield a magnitude of 1.0 and
    //    scaling Lo by 2^-k would yield zero. This would make the result 1.0
    //    which is an invalid fraction, as the required interval is [0.5, 1.0).
    // We detect this specific case by checking if Hi is a power of two and if
    // the scaled Lo underflowed to zero. The fix: Increment Exp to k+1. This
    // adjusts the scale factor, causing Hi to be scaled to 0.5, which is a
    // valid fraction.
    if (Second.isZero() && SignsDisagree && Hi.getExactLog2Abs() != INT_MIN)
      ++Exp;
  }

  // Hi is scaled last so that it sees the final, possibly adjusted, exponent.
  APFloat First = scalbn(Hi, -Exp, RM);
  return DoubleAPFloat(APFloatBase::PPCDoubleDouble(), std::move(First),
                       std::move(Second));
}


} // namespace detail


/// Construct the storage from an IEEEFloat, using the layout selected by
/// \p Semantics.
///
/// For an IEEEFloat layout, \p F is moved straight into the IEEE member. For
/// a DoubleAPFloat layout, \p F becomes the first component and the second
/// component is a default-constructed IEEE double.
APFloat::Storage::Storage(IEEEFloat F, const fltSemantics &Semantics) {
  if (usesLayout<IEEEFloat>(Semantics)) {
    new (&IEEE) IEEEFloat(std::move(F));
  } else if (usesLayout<DoubleAPFloat>(Semantics)) {
    // Grab the semantics before F is moved from.
    const fltSemantics &FirstSemantics = F.getSemantics();
    new (&Double)
        DoubleAPFloat(Semantics, APFloat(std::move(F), FirstSemantics),
                      APFloat(APFloatBase::IEEEdouble()));
  } else {
    llvm_unreachable("Unexpected semantics");
  }
}


/// Parse \p Str into this value using rounding mode \p RM.
///
/// The call is forwarded to the implementation object that matches the
/// current semantics' layout (IEEEFloat or DoubleAPFloat).
Expected<APFloat::opStatus> APFloat::convertFromString(StringRef Str,
                                                       roundingMode RM) {
  if (usesLayout<IEEEFloat>(getSemantics()))
    return U.IEEE.convertFromString(Str, RM);
  if (usesLayout<DoubleAPFloat>(getSemantics()))
    return U.Double.convertFromString(Str, RM);
  llvm_unreachable("Unexpected semantics");
}


/// Hash an APFloat by hashing the implementation object that matches its
/// semantics' layout.
hash_code hash_value(const APFloat &Arg) {
  const auto &Sem = Arg.getSemantics();
  if (APFloat::usesLayout<detail::IEEEFloat>(Sem))
    return hash_value(Arg.U.IEEE);
  if (APFloat::usesLayout<detail::DoubleAPFloat>(Sem))
    return hash_value(Arg.U.Double);
  llvm_unreachable("Unexpected semantics");
}


/// Construct a value with the given semantics by parsing the string \p S with
/// round-to-nearest-even.
///
/// A parse failure trips the assertion in builds with assertions enabled; the
/// error is consumed afterwards in every build.
APFloat::APFloat(const fltSemantics &Semantics, StringRef S)
    : APFloat(Semantics) {
  auto ParseResult = convertFromString(S, rmNearestTiesToEven);
  assert(ParseResult && "Invalid floating point representation");
  // Take the error out of the Expected and discard it explicitly.
  consumeError(ParseResult.takeError());
}


/// Map this value onto the matching FPClassTest bit.
///
/// Zero, normal, denormal and infinite values are classified by sign; any
/// remaining value is asserted to be a NaN and classified as signaling or
/// quiet.
FPClassTest APFloat::classify() const {
  // Choose between the negative and positive flavour of a class.
  const auto BySign = [this](FPClassTest IfNegative, FPClassTest IfPositive) {
    return isNegative() ? IfNegative : IfPositive;
  };

  if (isZero())
    return BySign(fcNegZero, fcPosZero);
  if (isNormal())
    return BySign(fcNegNormal, fcPosNormal);
  if (isDenormal())
    return BySign(fcNegSubnormal, fcPosSubnormal);
  if (isInfinity())
    return BySign(fcNegInf, fcPosInf);

  assert(isNaN() && "Other class of FP constant");
  return isSignaling() ? fcSNan : fcQNan;
}


/// Determine whether this value has an exact, normal reciprocal and
/// optionally return it.
///
/// \param Inv if non-null, receives the reciprocal on success.
/// \returns true only when this value is a finite, non-zero, non-denormal
///          power of two whose reciprocal is itself exactly representable and
///          not denormal.
bool APFloat::getExactInverse(APFloat *Inv) const {
  // Zero, infinity and NaN have no useful inverse. Subnormal inputs are
  // rejected as well; they may behave differently under FTZ/DAZ runtime
  // behavior.
  if (!isFiniteNonZero() || isDenormal())
    return false;

  // A binary floating-point number x = M / 2^k has the inverse 2^k / M, which
  // is only a dyadic rational (and therefore representable) when M is itself
  // a power of two -- i.e. when x is a power of two. getExactLog2Abs() yields
  // the exponent for powers of two and INT_MIN for everything else.
  const int Log2 = getExactLog2Abs();
  if (Log2 == INT_MIN)
    return false;

  // The inverse of +/- 2^Log2 is +/- 2^(-Log2): scale a correctly signed 1.0
  // by the negated exponent.
  const int InverseLog2 = -Log2;
  APFloat Candidate =
      scalbn(APFloat::getOne(getSemantics(), /*Negative=*/isNegative()),
             InverseLog2, rmTowardZero);

  // scalbn may have rounded (overflow or underflow) if the new exponent is
  // out of range, so confirm the result is still the expected power of two.
  // Also refuse a subnormal reciprocal: multiplying by one is not safe on all
  // platforms and may be slower than a normal division.
  if (Candidate.getExactLog2Abs() != InverseLog2 || Candidate.isDenormal())
    return false;

  assert(Candidate.isFiniteNonZero());

  if (Inv != nullptr)
    *Inv = std::move(Candidate);

  return true;
}


/// Convert this value in place to \p ToSemantics.
///
/// \param ToSemantics target semantics.
/// \param RM          rounding mode for the conversion.
/// \param losesInfo   written by the conversion; set to false when source and
///                    target semantics are the same object.
/// \returns opOK when no conversion is needed, otherwise the status of the
///          underlying IEEEFloat conversion.
APFloat::opStatus APFloat::convert(const fltSemantics &ToSemantics,
                                   roundingMode RM, bool *losesInfo) {
  // Same semantics object: nothing to do.
  if (&getSemantics() == &ToSemantics) {
    *losesInfo = false;
    return opOK;
  }

  const bool FromIEEE = usesLayout<IEEEFloat>(getSemantics());
  const bool ToIEEE = usesLayout<IEEEFloat>(ToSemantics);

  // IEEE -> IEEE: plain in-place conversion.
  if (FromIEEE && ToIEEE)
    return U.IEEE.convert(ToSemantics, RM, losesInfo);

  // IEEE -> double-double: convert to the legacy double-double format first,
  // then rebuild this object from the resulting bit pattern.
  if (FromIEEE && usesLayout<DoubleAPFloat>(ToSemantics)) {
    assert(&ToSemantics == &APFloatBase::semPPCDoubleDouble);
    const opStatus Status =
        U.IEEE.convert(APFloatBase::semPPCDoubleDoubleLegacy, RM, losesInfo);
    *this = APFloat(ToSemantics, U.IEEE.bitcastToAPInt());
    return Status;
  }

  // double-double -> IEEE: convert the IEEEFloat returned by getIEEE() and
  // re-wrap it with the target semantics.
  if (usesLayout<DoubleAPFloat>(getSemantics()) && ToIEEE) {
    const opStatus Status = getIEEE().convert(ToSemantics, RM, losesInfo);
    *this = APFloat(std::move(getIEEE()), ToSemantics);
    return Status;
  }

  llvm_unreachable("Unexpected semantics");
}


/// Build the value whose bit pattern, for the width given by
/// Semantics.sizeInBits, consists entirely of ones.
APFloat APFloat::getAllOnesValue(const fltSemantics &Semantics) {
  const APInt AllOnes = APInt::getAllOnes(Semantics.sizeInBits);
  return APFloat(Semantics, AllOnes);
}


/// Write the default string rendering of this value to \p OS.
void APFloat::print(raw_ostream &OS) const {
  // Render into a small local buffer first, then emit it in one go.
  SmallVector<char, 16> Text;
  toString(Text);
  OS << Text;
}


#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)


/// Debug helper: print this value followed by a newline to the debug stream.
LLVM_DUMP_METHOD void APFloat::dump() const {
  auto &Out = dbgs();
  print(Out);
  Out << '\n';
}


#endif


/// Add this value's bit pattern to the folding-set node ID \p NID.
void APFloat::Profile(FoldingSetNodeID &NID) const {
  const auto Bits = bitcastToAPInt();
  NID.Add(Bits);
}


/// Convert this value to an integer stored in \p result.
///
/// The bit width and signedness of the conversion are taken from \p result.
/// The conversion writes into a scratch word buffer that is then assigned
/// back to \p result.
///
/// \param result        in: desired width and signedness; out: the integer.
/// \param rounding_mode rounding mode for the conversion.
/// \param isExact       forwarded to the word-based convertToInteger().
/// \returns the status of the word-based conversion.
APFloat::opStatus APFloat::convertToInteger(APSInt &result,
                                            roundingMode rounding_mode,
                                            bool *isExact) const {
  const unsigned Width = result.getBitWidth();
  SmallVector<uint64_t, 4> Words(result.getNumWords());

  const opStatus Status = convertToInteger(Words, Width, result.isSigned(),
                                           rounding_mode, isExact);

  // Assigning an APInt keeps the original signed-ness of result.
  result = APInt(Width, Words);
  return Status;
}


double APFloat::convertToDouble() const {

  if (&getSemantics() ==

      (const llvm::fltSemantics *)&APFloatBase::semIEEEdouble)

    return getIEEE().convertToDouble();

  assert(isRepresentableBy(getSemantics(), semIEEEdouble) &&

         "Float semantics is not representable by IEEEdouble");

  APFloat Temp = *this;

  bool LosesInfo;

  opStatus St =

      Temp.convert(APFloatBase::semIEEEdouble, rmNearestTiesToEven, &LosesInfo);

  assert(!(St & opInexact) && !LosesInfo && "Unexpected imprecision");

  (void)St;

  return Temp.getIEEE().convertToDouble();

}


#ifdef HAS_IEE754_FLOAT128

/// Return this value as a host float128.
///
/// Values that already use IEEE quad semantics are converted directly. Other
/// semantics must be representable by IEEE quad (asserted); they are
/// converted through a temporary copy, and that conversion is asserted to be
/// exact.
float128 APFloat::convertToQuad() const {
  const bool AlreadyQuad =
      &getSemantics() == (const llvm::fltSemantics *)&APFloatBase::semIEEEquad;
  if (AlreadyQuad)
    return getIEEE().convertToQuad();

  assert(isRepresentableBy(getSemantics(), semIEEEquad) &&
         "Float semantics is not representable by IEEEquad");

  // Convert a copy so that this object is left untouched.
  APFloat Converted = *this;
  bool LosesInfo;
  [[maybe_unused]] const opStatus Status = Converted.convert(
      APFloatBase::semIEEEquad, rmNearestTiesToEven, &LosesInfo);
  assert(!(Status & opInexact) && !LosesInfo && "Unexpected imprecision");
  return Converted.getIEEE().convertToQuad();
}

#endif


float APFloat::convertToFloat() const {

  if (&getSemantics() ==

      (const llvm::fltSemantics *)&APFloatBase::semIEEEsingle)

    return getIEEE().convertToFloat();

  assert(isRepresentableBy(getSemantics(), semIEEEsingle) &&

         "Float semantics is not representable by IEEEsingle");

  APFloat Temp = *this;

  bool LosesInfo;

  opStatus St =

      Temp.convert(APFloatBase::semIEEEsingle, rmNearestTiesToEven, &LosesInfo);

  assert(!(St & opInexact) && !LosesInfo && "Unexpected imprecision");

  (void)St;

  return Temp.getIEEE().convertToFloat();

}


/// Destroy whichever member is selected by the layout of the stored
/// semantics.
APFloat::Storage::~Storage() {
  if (usesLayout<IEEEFloat>(*semantics)) {
    IEEE.~IEEEFloat();
  } else if (usesLayout<DoubleAPFloat>(*semantics)) {
    Double.~DoubleAPFloat();
  } else {
    llvm_unreachable("Unexpected semantics");
  }
}


/// Copy-construct the storage: placement-new a copy of whichever member of
/// \p RHS is selected by the layout of its semantics.
APFloat::Storage::Storage(const APFloat::Storage &RHS) {
  if (usesLayout<IEEEFloat>(*RHS.semantics)) {
    new (this) IEEEFloat(RHS.IEEE);
  } else if (usesLayout<DoubleAPFloat>(*RHS.semantics)) {
    new (this) DoubleAPFloat(RHS.Double);
  } else {
    llvm_unreachable("Unexpected semantics");
  }
}


/// Move-construct the storage: placement-new from whichever member of \p RHS
/// is selected by the layout of its semantics, moving out of that member.
APFloat::Storage::Storage(APFloat::Storage &&RHS) {
  if (usesLayout<IEEEFloat>(*RHS.semantics)) {
    new (this) IEEEFloat(std::move(RHS.IEEE));
  } else if (usesLayout<DoubleAPFloat>(*RHS.semantics)) {
    new (this) DoubleAPFloat(std::move(RHS.Double));
  } else {
    llvm_unreachable("Unexpected semantics");
  }
}


/// Copy-assign the storage.
///
/// When both sides use the same layout, the matching member is assigned
/// directly. Otherwise (and unless this is self-assignment) the current
/// contents are destroyed and the storage is copy-constructed anew from
/// \p RHS.
APFloat::Storage &APFloat::Storage::operator=(const APFloat::Storage &RHS) {
  const bool BothIEEE = usesLayout<IEEEFloat>(*semantics) &&
                        usesLayout<IEEEFloat>(*RHS.semantics);
  if (BothIEEE) {
    IEEE = RHS.IEEE;
    return *this;
  }

  const bool BothDouble = usesLayout<DoubleAPFloat>(*semantics) &&
                          usesLayout<DoubleAPFloat>(*RHS.semantics);
  if (BothDouble) {
    Double = RHS.Double;
    return *this;
  }

  // Layouts differ: rebuild in place, guarding against self-assignment.
  if (this != &RHS) {
    this->~Storage();
    new (this) Storage(RHS);
  }
  return *this;
}


/// Move-assign the storage.
///
/// When both sides use the same layout, the matching member is move-assigned
/// directly. Otherwise (and unless this is self-assignment) the current
/// contents are destroyed and the storage is move-constructed anew from
/// \p RHS.
APFloat::Storage &APFloat::Storage::operator=(APFloat::Storage &&RHS) {
  const bool BothIEEE = usesLayout<IEEEFloat>(*semantics) &&
                        usesLayout<IEEEFloat>(*RHS.semantics);
  if (BothIEEE) {
    IEEE = std::move(RHS.IEEE);
    return *this;
  }

  const bool BothDouble = usesLayout<DoubleAPFloat>(*semantics) &&
                          usesLayout<DoubleAPFloat>(*RHS.semantics);
  if (BothDouble) {
    Double = std::move(RHS.Double);
    return *this;
  }

  // Layouts differ: rebuild in place, guarding against self-assignment.
  if (this != &RHS) {
    this->~Storage();
    new (this) Storage(std::move(RHS));
  }
  return *this;
}


} // namespace llvm


#undef APFLOAT_DISPATCH_ON_SEMANTICS

assert
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")

PackCategoriesIntoKey
#define PackCategoriesIntoKey(_lhs, _rhs)
A macro used to combine two fcCategory enums into one key which can be used in a switch statement to ...
Definition APFloat.cpp:48

APFloat.h
This file declares a class to represent arbitrary precision floating point values and provide a varie...

APFLOAT_DISPATCH_ON_SEMANTICS
#define APFLOAT_DISPATCH_ON_SEMANTICS(METHOD_CALL)
Definition APFloat.h:26

APSInt.h
This file implements the APSInt class, which is a simple class that represents an arbitrary sized int...

false
Function Alias Analysis false
Definition AliasAnalysis.cpp:734

aa
aa
Definition AliasAnalysis.cpp:733

ArrayRef.h

A
static GCRegistry::Add< ErlangGC > A("erlang", "erlang-compatible garbage collector")

D
static GCRegistry::Add< StatepointGC > D("statepoint-example", "an example strategy for statepoint")

E
static GCRegistry::Add< CoreCLRGC > E("coreclr", "CoreCLR-compatible GC")

B
static GCRegistry::Add< OcamlGC > B("ocaml", "ocaml 3.10-compatible GC")

LLVM_DUMP_METHOD
#define LLVM_DUMP_METHOD
Mark debug helper function definitions like dump() that should not be stripped from debug builds.
Definition Compiler.h:638

isNeg
static bool isNeg(Value *V)
Returns true if the operation is a negation of V, and it works for both integers and floats.
Definition ComplexDeinterleavingPass.cpp:612

isSigned
static bool isSigned(unsigned int Opcode)
Definition ExpandLargeDivRem.cpp:52

FloatingPointMode.h
Utilities for dealing with flags related to floating point properties and mode controls.

FoldingSet.h
This file defines a hash set that can be used to remove duplication of nodes in a graph.

Hashing.h

isZero
static bool isZero(Value *V, const DataLayout &DL, DominatorTree *DT, AssumptionCache *AC)
Definition Lint.cpp:539

F
#define F(x, y, z)
Definition MD5.cpp:54

I
#define I(x, y, z)
Definition MD5.cpp:57

MathExtras.h

T
#define T
Definition Mips16ISelLowering.cpp:315

P
#define P(N)

if
if(PassOpts->AAPipeline)
Definition PassBuilderBindings.cpp:64

STLExtras.h
This file contains some templates that are useful if you are working with the STL at all.

StringExtras.h
This file contains some functions that are useful when dealing with strings.

StringRef.h

Debug.h

Y
static TableGen::Emitter::Opt Y("gen-skeleton-entry", EmitSkeleton, "Generate example skeleton entry")

X
static TableGen::Emitter::OptClass< SkeletonEmitter > X("gen-skeleton-class", "Generate example skeleton class")

initialize
static void initialize(TargetLibraryInfoImpl &TLI, const Triple &T, const llvm::StringTable &StandardNames, VectorLibrary VecLib)
Initialize the set of available library functions based on the specified target triple.
Definition TargetLibraryInfo.cpp:901

RHS
Value * RHS
Definition X86PartialReduction.cpp:81

LHS
Value * LHS
Definition X86PartialReduction.cpp:80

Input
The Input class is used to parse a yaml document into in-memory structs and vectors.
Definition YAMLTraits.h:1313

llvm::APFloatBase
Definition APFloat.h:149

llvm::APFloatBase::IEEEsingle
static const fltSemantics & IEEEsingle()
Definition APFloat.h:296

llvm::APFloatBase::Float8E4M3FN
static const fltSemantics & Float8E4M3FN()
Definition APFloat.h:306

llvm::APFloatBase::EnumToSemantics
static LLVM_ABI const llvm::fltSemantics & EnumToSemantics(Semantics S)
Definition APFloat.cpp:174

llvm::APFloatBase::semanticsHasInf
static LLVM_ABI bool semanticsHasInf(const fltSemantics &)
Definition APFloat.cpp:323

llvm::APFloatBase::cmpResult
cmpResult
IEEE-754R 5.11: Floating Point Comparison Relations.
Definition APFloat.h:334

llvm::APFloatBase::cmpEqual
@ cmpEqual
Definition APFloat.h:336

llvm::APFloatBase::cmpGreaterThan
@ cmpGreaterThan
Definition APFloat.h:337

llvm::APFloatBase::rmTowardZero
static constexpr roundingMode rmTowardZero
Definition APFloat.h:348

llvm::APFloatBase::semanticsMinExponent
static LLVM_ABI ExponentType semanticsMinExponent(const fltSemantics &)
Definition APFloat.cpp:298

llvm::APFloatBase::roundingMode
llvm::RoundingMode roundingMode
IEEE-754R 4.3: Rounding-direction attributes.
Definition APFloat.h:342

llvm::APFloatBase::BFloat
static const fltSemantics & BFloat()
Definition APFloat.h:295

llvm::APFloatBase::IEEEquad
static const fltSemantics & IEEEquad()
Definition APFloat.h:298

llvm::APFloatBase::semanticsSizeInBits
static LLVM_ABI unsigned int semanticsSizeInBits(const fltSemantics &)
Definition APFloat.cpp:301

llvm::APFloatBase::Float8E8M0FNU
static const fltSemantics & Float8E8M0FNU()
Definition APFloat.h:313

llvm::APFloatBase::semanticsHasSignedRepr
static LLVM_ABI bool semanticsHasSignedRepr(const fltSemantics &)
Definition APFloat.cpp:319

llvm::APFloatBase::IEEEdouble
static const fltSemantics & IEEEdouble()
Definition APFloat.h:297

llvm::APFloatBase::getSizeInBits
static LLVM_ABI unsigned getSizeInBits(const fltSemantics &Sem)
Returns the size of the floating point number (in bits) in the given semantics.
Definition APFloat.cpp:354

llvm::APFloatBase::x87DoubleExtended
static const fltSemantics & x87DoubleExtended()
Definition APFloat.h:317

llvm::APFloatBase::rmTowardNegative
static constexpr roundingMode rmTowardNegative
Definition APFloat.h:347

llvm::APFloatBase::rmNearestTiesToEven
static constexpr roundingMode rmNearestTiesToEven
Definition APFloat.h:344

llvm::APFloatBase::hasSignBitInMSB
static LLVM_ABI bool hasSignBitInMSB(const fltSemantics &)
Definition APFloat.cpp:336

llvm::APFloatBase::semanticsMaxExponent
static LLVM_ABI ExponentType semanticsMaxExponent(const fltSemantics &)
Definition APFloat.cpp:294

llvm::APFloatBase::APFloat
friend class APFloat
Definition APFloat.h:291

llvm::APFloatBase::semanticsPrecision
static LLVM_ABI unsigned int semanticsPrecision(const fltSemantics &)
Definition APFloat.cpp:290

llvm::APFloatBase::semanticsHasNaN
static LLVM_ABI bool semanticsHasNaN(const fltSemantics &)
Definition APFloat.cpp:327

llvm::APFloatBase::SemanticsToEnum
static LLVM_ABI Semantics SemanticsToEnum(const llvm::fltSemantics &Sem)
Definition APFloat.cpp:221

llvm::APFloatBase::ExponentType
int32_t ExponentType
A signed type to represent a floating point numbers unbiased exponent.
Definition APFloat.h:155

llvm::APFloatBase::integerPartWidth
static constexpr unsigned integerPartWidth
Definition APFloat.h:152

llvm::APFloatBase::PPCDoubleDoubleLegacy
static const fltSemantics & PPCDoubleDoubleLegacy()
Definition APFloat.h:300

llvm::APFloatBase::integerPart
APInt::WordType integerPart
Definition APFloat.h:151

llvm::APFloatBase::semanticsHasZero
static LLVM_ABI bool semanticsHasZero(const fltSemantics &)
Definition APFloat.cpp:315

llvm::APFloatBase::isRepresentableAsNormalIn
static LLVM_ABI bool isRepresentableAsNormalIn(const fltSemantics &Src, const fltSemantics &Dst)
Definition APFloat.cpp:340

llvm::APFloatBase::Float8E5M2FNUZ
static const fltSemantics & Float8E5M2FNUZ()
Definition APFloat.h:304

llvm::APFloatBase::Float8E4M3FNUZ
static const fltSemantics & Float8E4M3FNUZ()
Definition APFloat.h:307

llvm::APFloatBase::rmTowardPositive
static constexpr roundingMode rmTowardPositive
Definition APFloat.h:346

llvm::APFloatBase::IEEEhalf
static const fltSemantics & IEEEhalf()
Definition APFloat.h:294

llvm::APFloatBase::Float4E2M1FN
static const fltSemantics & Float4E2M1FN()
Definition APFloat.h:316

llvm::APFloatBase::Float6E2M3FN
static const fltSemantics & Float6E2M3FN()
Definition APFloat.h:315

llvm::APFloatBase::IEK_NaN
@ IEK_NaN
Definition APFloat.h:385

llvm::APFloatBase::IEK_Inf
@ IEK_Inf
Definition APFloat.h:386

llvm::APFloatBase::IEK_Zero
@ IEK_Zero
Definition APFloat.h:384

llvm::APFloatBase::Float8E4M3
static const fltSemantics & Float8E4M3()
Definition APFloat.h:305

llvm::APFloatBase::Float8E4M3B11FNUZ
static const fltSemantics & Float8E4M3B11FNUZ()
Definition APFloat.h:308

llvm::APFloatBase::isRepresentableBy
static LLVM_ABI bool isRepresentableBy(const fltSemantics &A, const fltSemantics &B)
Definition APFloat.cpp:266

llvm::APFloatBase::Float8E3M4
static const fltSemantics & Float8E3M4()
Definition APFloat.h:311

llvm::APFloatBase::isIEEELikeFP
static LLVM_ABI bool isIEEELikeFP(const fltSemantics &)
Definition APFloat.cpp:331

llvm::APFloatBase::Float8E5M2
static const fltSemantics & Float8E5M2()
Definition APFloat.h:303

llvm::APFloatBase::fltCategory
fltCategory
Category of internally-represented number.
Definition APFloat.h:370

llvm::APFloatBase::fcZero
@ fcZero
Definition APFloat.h:374

llvm::APFloatBase::fcNaN
@ fcNaN
Definition APFloat.h:372

llvm::APFloatBase::fcInfinity
@ fcInfinity
Definition APFloat.h:371

llvm::APFloatBase::fcNormal
@ fcNormal
Definition APFloat.h:373

llvm::APFloatBase::rmNearestTiesToAway
static constexpr roundingMode rmNearestTiesToAway
Definition APFloat.h:349

llvm::APFloatBase::PPCDoubleDouble
static const fltSemantics & PPCDoubleDouble()
Definition APFloat.h:299

llvm::APFloatBase::Semantics
Semantics
Definition APFloat.h:159

llvm::APFloatBase::S_Float6E2M3FN
@ S_Float6E2M3FN
Definition APFloat.h:253

llvm::APFloatBase::S_IEEEsingle
@ S_IEEEsingle
Definition APFloat.h:162

llvm::APFloatBase::S_Float8E4M3FNUZ
@ S_Float8E4M3FNUZ
Definition APFloat.h:224

llvm::APFloatBase::S_IEEEhalf
@ S_IEEEhalf
Definition APFloat.h:160

llvm::APFloatBase::S_BFloat
@ S_BFloat
Definition APFloat.h:161

llvm::APFloatBase::S_Float8E5M2
@ S_Float8E5M2
Definition APFloat.h:202

llvm::APFloatBase::S_PPCDoubleDouble
@ S_PPCDoubleDouble
Definition APFloat.h:174

llvm::APFloatBase::S_Float8E4M3
@ S_Float8E4M3
Definition APFloat.h:212

llvm::APFloatBase::S_Float4E2M1FN
@ S_Float4E2M1FN
Definition APFloat.h:257

llvm::APFloatBase::S_IEEEquad
@ S_IEEEquad
Definition APFloat.h:164

llvm::APFloatBase::S_Float6E3M2FN
@ S_Float6E3M2FN
Definition APFloat.h:249

llvm::APFloatBase::S_Float8E4M3FN
@ S_Float8E4M3FN
Definition APFloat.h:217

llvm::APFloatBase::S_FloatTF32
@ S_FloatTF32
Definition APFloat.h:238

llvm::APFloatBase::S_x87DoubleExtended
@ S_x87DoubleExtended
Definition APFloat.h:259

llvm::APFloatBase::S_Float8E5M2FNUZ
@ S_Float8E5M2FNUZ
Definition APFloat.h:209

llvm::APFloatBase::S_Float8E4M3B11FNUZ
@ S_Float8E4M3B11FNUZ
Definition APFloat.h:231

llvm::APFloatBase::S_Float8E3M4
@ S_Float8E3M4
Definition APFloat.h:234

llvm::APFloatBase::S_IEEEdouble
@ S_IEEEdouble
Definition APFloat.h:163

llvm::APFloatBase::S_PPCDoubleDoubleLegacy
@ S_PPCDoubleDoubleLegacy
Definition APFloat.h:199

llvm::APFloatBase::S_Float8E8M0FNU
@ S_Float8E8M0FNU
Definition APFloat.h:245

llvm::APFloatBase::Float6E3M2FN
static const fltSemantics & Float6E3M2FN()
Definition APFloat.h:314

llvm::APFloatBase::opStatus
opStatus
IEEE-754R 7: Default exception handling.
Definition APFloat.h:360

llvm::APFloatBase::opOK
@ opOK
Definition APFloat.h:361

llvm::APFloatBase::opInexact
@ opInexact
Definition APFloat.h:366

llvm::APFloatBase::FloatTF32
static const fltSemantics & FloatTF32()
Definition APFloat.h:312

llvm::APFloatBase::semanticsIntSizeInBits
static LLVM_ABI unsigned int semanticsIntSizeInBits(const fltSemantics &, bool)
Definition APFloat.cpp:304

llvm::APFloat
Definition APFloat.h:940

llvm::APFloat::getQNaN
static APFloat getQNaN(const fltSemantics &Sem, bool Negative=false, const APInt *payload=nullptr)
Factory for QNaN values.
Definition APFloat.h:1102

llvm::APFloat::Profile
LLVM_ABI void Profile(FoldingSetNodeID &NID) const
Used to insert APFloat objects, or objects that contain APFloat objects, into FoldingSets.
Definition APFloat.cpp:6096

llvm::APFloat::divide
opStatus divide(const APFloat &RHS, roundingMode RM)
Definition APFloat.h:1190

llvm::APFloat::isFiniteNonZero
bool isFiniteNonZero() const
Definition APFloat.h:1441

llvm::APFloat::convert
LLVM_ABI opStatus convert(const fltSemantics &ToSemantics, roundingMode RM, bool *losesInfo)
Definition APFloat.cpp:6053

llvm::APFloat::getExactLog2Abs
LLVM_READONLY int getExactLog2Abs() const
Definition APFloat.h:1479

llvm::APFloat::isNegative
bool isNegative() const
Definition APFloat.h:1431

llvm::APFloat::getExactInverse
LLVM_ABI bool getExactInverse(APFloat *Inv) const
If this value is normal and has an exact, normal, multiplicative inverse, store it in inv and return ...
Definition APFloat.cpp:5995

llvm::APFloat::DoubleAPFloat
friend DoubleAPFloat
Definition APFloat.h:1495

llvm::APFloat::convertToDouble
LLVM_ABI double convertToDouble() const
Converts this APFloat to host double value.
Definition APFloat.cpp:6112

llvm::APFloat::toString
void toString(SmallVectorImpl< char > &Str, unsigned FormatPrecision=0, unsigned FormatMaxPadding=3, bool TruncateZero=true) const
Definition APFloat.h:1460

llvm::APFloat::isNormal
bool isNormal() const
Definition APFloat.h:1435

llvm::APFloat::isDenormal
bool isDenormal() const
Definition APFloat.h:1432

llvm::APFloat::add
opStatus add(const APFloat &RHS, roundingMode RM)
Definition APFloat.h:1163

llvm::APFloat::getAllOnesValue
static LLVM_ABI APFloat getAllOnesValue(const fltSemantics &Semantics)
Returns a float which is bitcast from an integer value with all bits set.
Definition APFloat.cpp:6079

llvm::APFloat::hash_value
LLVM_ABI friend hash_code hash_value(const APFloat &Arg)
See friend declarations above.
Definition APFloat.cpp:5967

llvm::APFloat::getSemantics
const fltSemantics & getSemantics() const
Definition APFloat.h:1439

llvm::APFloat::isFinite
bool isFinite() const
Definition APFloat.h:1436

llvm::APFloat::isNaN
bool isNaN() const
Definition APFloat.h:1429

llvm::APFloat::getOne
static APFloat getOne(const fltSemantics &Sem, bool Negative=false)
Factory for Positive and Negative One.
Definition APFloat.h:1070

llvm::APFloat::convertToHexString
unsigned int convertToHexString(char *DST, unsigned int HexDigits, bool UpperCase, roundingMode RM) const
Definition APFloat.h:1421

llvm::APFloat::convertToFloat
LLVM_ABI float convertToFloat() const
Converts this APFloat to host float value.
Definition APFloat.cpp:6143

llvm::APFloat::isSignaling
bool isSignaling() const
Definition APFloat.h:1433

llvm::APFloat::fusedMultiplyAdd
opStatus fusedMultiplyAdd(const APFloat &Multiplicand, const APFloat &Addend, roundingMode RM)
Definition APFloat.h:1217

llvm::APFloat::remainder
opStatus remainder(const APFloat &RHS)
Definition APFloat.h:1199

llvm::APFloat::isZero
bool isZero() const
Definition APFloat.h:1427

llvm::APFloat::bitcastToAPInt
APInt bitcastToAPInt() const
Definition APFloat.h:1335

llvm::APFloat::convertToInteger
opStatus convertToInteger(MutableArrayRef< integerPart > Input, unsigned int Width, bool IsSigned, roundingMode RM, bool *IsExact) const
Definition APFloat.h:1314

llvm::APFloat::next
opStatus next(bool nextDown)
Definition APFloat.h:1236

llvm::APFloat::getInf
static APFloat getInf(const fltSemantics &Sem, bool Negative=false)
Factory for Positive and Negative Infinity.
Definition APFloat.h:1080

llvm::APFloat::scalbn
friend APFloat scalbn(APFloat X, int Exp, roundingMode RM)

llvm::APFloat::getSmallest
static APFloat getSmallest(const fltSemantics &Sem, bool Negative=false)
Returns the smallest (by magnitude) finite number in the given semantics.
Definition APFloat.h:1130

llvm::APFloat::classify
LLVM_ABI FPClassTest classify() const
Return the FPClassTest which will return true for the value.
Definition APFloat.cpp:5982

llvm::APFloat::mod
opStatus mod(const APFloat &RHS)
Definition APFloat.h:1208

llvm::APFloat::convertFromString
LLVM_ABI Expected< opStatus > convertFromString(StringRef, roundingMode)
Definition APFloat.cpp:5962

llvm::APFloat::IEEEFloat
friend IEEEFloat
Definition APFloat.h:1494

llvm::APFloat::dump
LLVM_DUMP_METHOD void dump() const
Definition APFloat.cpp:6090

llvm::APFloat::print
LLVM_ABI void print(raw_ostream &) const
Definition APFloat.cpp:6083

llvm::APFloat::roundToIntegral
opStatus roundToIntegral(roundingMode RM)
Definition APFloat.h:1230

llvm::APFloat::hasSignificand
static bool hasSignificand(const fltSemantics &Sem)
Returns true if the given semantics has actual significand.
Definition APFloat.h:1155

llvm::APFloat::getZero
static APFloat getZero(const fltSemantics &Sem, bool Negative=false)
Factory for Positive and Negative Zero.
Definition APFloat.h:1061

llvm::APFloat::isInfinity
bool isInfinity() const
Definition APFloat.h:1428

llvm::APInt
Class for arbitrary precision integers.
Definition APInt.h:78

llvm::APInt::udiv
LLVM_ABI APInt udiv(const APInt &RHS) const
Unsigned division operation.
Definition APInt.cpp:1573

llvm::APInt::tcSetBit
static LLVM_ABI void tcSetBit(WordType *, unsigned bit)
Set the given bit of a bignum. Zero-based.
Definition APInt.cpp:2368

llvm::APInt::getAllOnes
static APInt getAllOnes(unsigned numBits)
Return an APInt of a specified width with all bits set.
Definition APInt.h:235

llvm::APInt::tcSet
static LLVM_ABI void tcSet(WordType *, WordType, unsigned)
Sets the least significant part of a bignum to the input value, and zeroes out higher parts.
Definition APInt.cpp:2340

llvm::APInt::udivrem
static LLVM_ABI void udivrem(const APInt &LHS, const APInt &RHS, APInt &Quotient, APInt &Remainder)
Dual division/remainder interface.
Definition APInt.cpp:1758

llvm::APInt::tcExtractBit
static LLVM_ABI int tcExtractBit(const WordType *, unsigned bit)
Extract the given bit of a bignum; returns 0 or 1. Zero-based.
Definition APInt.cpp:2363

llvm::APInt::zext
LLVM_ABI APInt zext(unsigned width) const
Zero extend to a new width.
Definition APInt.cpp:1012

llvm::APInt::tcAdd
static LLVM_ABI WordType tcAdd(WordType *, const WordType *, WordType carry, unsigned)
DST += RHS + CARRY where CARRY is zero or one. Returns the carry flag.
Definition APInt.cpp:2442

llvm::APInt::tcExtract
static LLVM_ABI void tcExtract(WordType *, unsigned dstCount, const WordType *, unsigned srcBits, unsigned srcLSB)
Copy the bit vector of width srcBITS from SRC, starting at bit srcLSB, to DST, of dstCOUNT parts,...
Definition APInt.cpp:2412

llvm::APInt::getActiveBits
unsigned getActiveBits() const
Compute the number of active bits in the value.
Definition APInt.h:1513

llvm::APInt::trunc
LLVM_ABI APInt trunc(unsigned width) const
Truncate to new width.
Definition APInt.cpp:936

llvm::APInt::tcCompare
static LLVM_ABI int tcCompare(const WordType *, const WordType *, unsigned)
Comparison (unsigned) of two bignums.
Definition APInt.cpp:2752

llvm::APInt::floatToBits
static APInt floatToBits(float V)
Converts a float to APInt bits.
Definition APInt.h:1753

llvm::APInt::WordType
uint64_t WordType
Definition APInt.h:80

llvm::APInt::tcAssign
static LLVM_ABI void tcAssign(WordType *, const WordType *, unsigned)
Assign one bignum to another.
Definition APInt.cpp:2348

llvm::APInt::getBitWidth
unsigned getBitWidth() const
Return the number of bits in the APInt.
Definition APInt.h:1489

llvm::APInt::tcShiftRight
static LLVM_ABI void tcShiftRight(WordType *, unsigned Words, unsigned Count)
Shift a bignum right Count bits.
Definition APInt.cpp:2726

llvm::APInt::tcFullMultiply
static LLVM_ABI void tcFullMultiply(WordType *, const WordType *, const WordType *, unsigned, unsigned)
DST = LHS * RHS, where DST has width the sum of the widths of the operands.
Definition APInt.cpp:2632

llvm::APInt::getNumWords
unsigned getNumWords() const
Get the number of words.
Definition APInt.h:1496

llvm::APInt::isNegative
bool isNegative() const
Determine sign of this APInt.
Definition APInt.h:330

llvm::APInt::tcClearBit
static LLVM_ABI void tcClearBit(WordType *, unsigned bit)
Clear the given bit of a bignum. Zero-based.
Definition APInt.cpp:2373

llvm::APInt::negate
void negate()
Negate this APInt in place.
Definition APInt.h:1469

llvm::APInt::tcDecrement
static WordType tcDecrement(WordType *dst, unsigned parts)
Decrement a bignum in-place. Return the borrow flag.
Definition APInt.h:1919

llvm::APInt::countr_zero
unsigned countr_zero() const
Count the number of trailing zero bits.
Definition APInt.h:1640

llvm::APInt::tcLSB
static LLVM_ABI unsigned tcLSB(const WordType *, unsigned n)
Returns the bit number of the least significant set bit of a number.
Definition APInt.cpp:2379

llvm::APInt::tcShiftLeft
static LLVM_ABI void tcShiftLeft(WordType *, unsigned Words, unsigned Count)
Shift a bignum left Count bits.
Definition APInt.cpp:2699

llvm::APInt::tcIsZero
static LLVM_ABI bool tcIsZero(const WordType *, unsigned)
Returns true if a bignum is zero, false otherwise.
Definition APInt.cpp:2354

llvm::APInt::tcMSB
static LLVM_ABI unsigned tcMSB(const WordType *parts, unsigned n)
Returns the bit number of the most significant set bit of a number.
Definition APInt.cpp:2392

llvm::APInt::bitsToFloat
float bitsToFloat() const
Converts APInt bits to a float.
Definition APInt.h:1737

llvm::APInt::tcMultiplyPart
static LLVM_ABI int tcMultiplyPart(WordType *dst, const WordType *src, WordType multiplier, WordType carry, unsigned srcParts, unsigned dstParts, bool add)
DST += SRC * MULTIPLIER + PART if add is true; DST = SRC * MULTIPLIER + PART if add is false.
Definition APInt.cpp:2530

llvm::APInt::APINT_BITS_PER_WORD
static constexpr unsigned APINT_BITS_PER_WORD
Bits in a word.
Definition APInt.h:86

llvm::APInt::tcSubtract
static LLVM_ABI WordType tcSubtract(WordType *, const WordType *, WordType carry, unsigned)
DST -= RHS + CARRY where CARRY is zero or one. Returns the carry flag.
Definition APInt.cpp:2477

llvm::APInt::tcNegate
static LLVM_ABI void tcNegate(WordType *, unsigned)
Negate a bignum in-place.
Definition APInt.cpp:2516

llvm::APInt::doubleToBits
static APInt doubleToBits(double V)
Converts a double to APInt bits.
Definition APInt.h:1745

llvm::APInt::tcIncrement
static WordType tcIncrement(WordType *dst, unsigned parts)
Increment a bignum in-place. Return the carry flag.
Definition APInt.h:1914

llvm::APInt::bitsToDouble
double bitsToDouble() const
Converts APInt bits to a double.
Definition APInt.h:1723

llvm::APInt::getRawData
const uint64_t * getRawData() const
This function returns a pointer to the internal storage of the APInt.
Definition APInt.h:570

llvm::APInt::getZero
static APInt getZero(unsigned numBits)
Get the '0' value for the specified bit-width.
Definition APInt.h:201

llvm::APInt::lshrInPlace
void lshrInPlace(unsigned ShiftAmt)
Logical right-shift this APInt by ShiftAmt in place.
Definition APInt.h:859

llvm::APSInt
An arbitrary precision integer that knows its signedness.
Definition APSInt.h:24

llvm::APSInt::isSigned
bool isSigned() const
Definition APSInt.h:78

llvm::ArrayRef
ArrayRef - Represent a constant reference to an array (0 or more elements consecutively in memory),...
Definition ArrayRef.h:40

llvm::ArrayRef::size
size_t size() const
size - Get the array size.
Definition ArrayRef.h:142

llvm::Error
Lightweight error class with error context and mandatory checking.
Definition Error.h:159

llvm::Error::success
static ErrorSuccess success()
Create a success value.
Definition Error.h:336

llvm::Expected
Tagged union holding either a T or an Error.
Definition Error.h:485

llvm::FoldingSetNodeID
FoldingSetNodeID - This class is used to gather all the unique data bits of a node.
Definition FoldingSet.h:330

llvm::FoldingSetNodeID::Add
void Add(const T &x)
Definition FoldingSet.h:370

llvm::MutableArrayRef
MutableArrayRef - Represent a mutable reference to an array (0 or more elements consecutively in memo...
Definition ArrayRef.h:298

llvm::MutableArrayRef::data
T * data() const
Definition ArrayRef.h:340

llvm::SmallVectorImpl
This class consists of common code factored out of the SmallVector class to reduce code duplication b...
Definition SmallVector.h:574

llvm::SmallVectorImpl::erase
iterator erase(const_iterator CI)
Definition SmallVector.h:744

llvm::SmallVectorImpl::append
void append(ItTy in_start, ItTy in_end)
Add the specified range to the end of the SmallVector.
Definition SmallVector.h:684

llvm::SmallVectorImpl::clear
void clear()
Definition SmallVector.h:611

llvm::SmallVectorTemplateBase::push_back
void push_back(const T &Elt)
Definition SmallVector.h:417

llvm::SmallVectorTemplateCommon::size
size_t size() const
Definition SmallVector.h:80

llvm::SmallVectorTemplateCommon::empty
bool empty() const
Definition SmallVector.h:83

llvm::SmallVector
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
Definition SmallVector.h:1203

llvm::StringRef
StringRef - Represent a constant reference to a string, i.e.
Definition StringRef.h:55

llvm::StringRef::getAsInteger
bool getAsInteger(unsigned Radix, T &Result) const
Parse the current string as an integer of the specified radix.
Definition StringRef.h:472

llvm::StringRef::iterator
const char * iterator
Definition StringRef.h:59

llvm::StringRef::empty
constexpr bool empty() const
empty - Check if the string is empty.
Definition StringRef.h:143

llvm::StringRef::drop_front
StringRef drop_front(size_t N=1) const
Return a StringRef equal to 'this' but with the first N elements dropped.
Definition StringRef.h:611

llvm::StringRef::begin
iterator begin() const
Definition StringRef.h:112

llvm::StringRef::back
char back() const
back - Get the last character in the string.
Definition StringRef.h:155

llvm::StringRef::slice
StringRef slice(size_t Start, size_t End) const
Return a reference to the substring from [Start, End).
Definition StringRef.h:686

llvm::StringRef::size
constexpr size_t size() const
size - Get the string size.
Definition StringRef.h:146

llvm::StringRef::front
char front() const
front - Get the first character in the string.
Definition StringRef.h:149

llvm::StringRef::consume_front
bool consume_front(StringRef Prefix)
Returns true if this StringRef has the given prefix and removes that prefix.
Definition StringRef.h:637

llvm::StringRef::end
iterator end() const
Definition StringRef.h:114

llvm::StringRef::consume_front_insensitive
bool consume_front_insensitive(StringRef Prefix)
Returns true if this StringRef has the given prefix, ignoring case, and removes that prefix.
Definition StringRef.h:647

llvm::Twine
Twine - A lightweight data structure for efficiently representing the concatenation of temporary valu...
Definition Twine.h:82

llvm::detail::DoubleAPFloat
Definition APFloat.h:828

llvm::detail::DoubleAPFloat::makeSmallestNormalized
LLVM_ABI void makeSmallestNormalized(bool Neg)
Definition APFloat.cpp:5310

llvm::detail::DoubleAPFloat::operator=
LLVM_ABI DoubleAPFloat & operator=(const DoubleAPFloat &RHS)
Definition APFloat.cpp:4840

llvm::detail::DoubleAPFloat::changeSign
LLVM_ABI void changeSign()
Definition APFloat.cpp:5217

llvm::detail::DoubleAPFloat::getFirst
APFloat & getFirst()
Definition APFloat.h:1667

llvm::detail::DoubleAPFloat::isLargest
LLVM_ABI bool isLargest() const
Definition APFloat.cpp:5784

llvm::detail::DoubleAPFloat::remainder
LLVM_ABI opStatus remainder(const DoubleAPFloat &RHS)
Definition APFloat.cpp:5104

llvm::detail::DoubleAPFloat::multiply
LLVM_ABI opStatus multiply(const DoubleAPFloat &RHS, roundingMode RM)
Definition APFloat.cpp:5007

llvm::detail::DoubleAPFloat::getCategory
LLVM_ABI fltCategory getCategory() const
Definition APFloat.cpp:5276

llvm::detail::DoubleAPFloat::getSecond
APFloat & getSecond()
Definition APFloat.h:1669

llvm::detail::DoubleAPFloat::bitwiseIsEqual
LLVM_ABI bool bitwiseIsEqual(const DoubleAPFloat &RHS) const
Definition APFloat.cpp:5333

llvm::detail::DoubleAPFloat::getExactLog2Abs
LLVM_ABI LLVM_READONLY int getExactLog2Abs() const
Definition APFloat.cpp:5808

llvm::detail::DoubleAPFloat::convertFromAPInt
LLVM_ABI opStatus convertFromAPInt(const APInt &Input, bool IsSigned, roundingMode RM)
Definition APFloat.cpp:5735

llvm::detail::DoubleAPFloat::bitcastToAPInt
LLVM_ABI APInt bitcastToAPInt() const
Definition APFloat.cpp:5344

llvm::detail::DoubleAPFloat::convertFromString
LLVM_ABI Expected< opStatus > convertFromString(StringRef, roundingMode)
Definition APFloat.cpp:5354

llvm::detail::DoubleAPFloat::isSmallest
LLVM_ABI bool isSmallest() const
Definition APFloat.cpp:5767

llvm::detail::DoubleAPFloat::subtract
LLVM_ABI opStatus subtract(const DoubleAPFloat &RHS, roundingMode RM)
Definition APFloat.cpp:4999

llvm::detail::DoubleAPFloat::hash_value
LLVM_ABI friend hash_code hash_value(const DoubleAPFloat &Arg)
Definition APFloat.cpp:5338

llvm::detail::DoubleAPFloat::compareAbsoluteValue
LLVM_ABI cmpResult compareAbsoluteValue(const DoubleAPFloat &RHS) const
Definition APFloat.cpp:5223

llvm::detail::DoubleAPFloat::isDenormal
LLVM_ABI bool isDenormal() const
Definition APFloat.cpp:5760

llvm::detail::DoubleAPFloat::convertToInteger
LLVM_ABI opStatus convertToInteger(MutableArrayRef< integerPart > Input, unsigned int Width, bool IsSigned, roundingMode RM, bool *IsExact) const
Definition APFloat.cpp:5571

llvm::detail::DoubleAPFloat::makeSmallest
LLVM_ABI void makeSmallest(bool Neg)
Definition APFloat.cpp:5303

llvm::detail::DoubleAPFloat::ilogb
LLVM_ABI friend int ilogb(const DoubleAPFloat &X)
Definition APFloat.cpp:5817

llvm::detail::DoubleAPFloat::next
LLVM_ABI opStatus next(bool nextDown)
Definition APFloat.cpp:5370

llvm::detail::DoubleAPFloat::makeInf
LLVM_ABI void makeInf(bool Neg)
Definition APFloat.cpp:5282

llvm::detail::DoubleAPFloat::isInteger
LLVM_ABI bool isInteger() const
Definition APFloat.cpp:5792

llvm::detail::DoubleAPFloat::makeZero
LLVM_ABI void makeZero(bool Neg)
Definition APFloat.cpp:5287

llvm::detail::DoubleAPFloat::divide
LLVM_ABI opStatus divide(const DoubleAPFloat &RHS, roundingMode RM)
Definition APFloat.cpp:5093

llvm::detail::DoubleAPFloat::isSmallestNormalized
LLVM_ABI bool isSmallestNormalized() const
Definition APFloat.cpp:5775

llvm::detail::DoubleAPFloat::mod
LLVM_ABI opStatus mod(const DoubleAPFloat &RHS)
Definition APFloat.cpp:5114

llvm::detail::DoubleAPFloat::DoubleAPFloat
LLVM_ABI DoubleAPFloat(const fltSemantics &S)
Definition APFloat.cpp:4787

llvm::detail::DoubleAPFloat::toString
LLVM_ABI void toString(SmallVectorImpl< char > &Str, unsigned FormatPrecision, unsigned FormatMaxPadding, bool TruncateZero=true) const
Definition APFloat.cpp:5798

llvm::detail::DoubleAPFloat::makeLargest
LLVM_ABI void makeLargest(bool Neg)
Definition APFloat.cpp:5292

llvm::detail::DoubleAPFloat::compare
LLVM_ABI cmpResult compare(const DoubleAPFloat &RHS) const
Definition APFloat.cpp:5325

llvm::detail::DoubleAPFloat::scalbn
LLVM_ABI friend DoubleAPFloat scalbn(const DoubleAPFloat &X, int Exp, roundingMode)

llvm::detail::DoubleAPFloat::roundToIntegral
LLVM_ABI opStatus roundToIntegral(roundingMode RM)
Definition APFloat.cpp:5140

llvm::detail::DoubleAPFloat::fusedMultiplyAdd
LLVM_ABI opStatus fusedMultiplyAdd(const DoubleAPFloat &Multiplicand, const DoubleAPFloat &Addend, roundingMode RM)
Definition APFloat.cpp:5125

llvm::detail::DoubleAPFloat::convertToHexString
LLVM_ABI unsigned int convertToHexString(char *DST, unsigned int HexDigits, bool UpperCase, roundingMode RM) const
Definition APFloat.cpp:5750

llvm::detail::DoubleAPFloat::isNegative
LLVM_ABI bool isNegative() const
Definition APFloat.cpp:5280

llvm::detail::DoubleAPFloat::add
LLVM_ABI opStatus add(const DoubleAPFloat &RHS, roundingMode RM)
Definition APFloat.cpp:4994

llvm::detail::DoubleAPFloat::~DoubleAPFloat
~DoubleAPFloat()
Definition APFloat.h:1672

llvm::detail::DoubleAPFloat::makeNaN
LLVM_ABI void makeNaN(bool SNaN, bool Neg, const APInt *fill)
Definition APFloat.cpp:5320

llvm::detail::IEEEFloat
Definition APFloat.h:445

llvm::detail::IEEEFloat::convertToHexString
LLVM_ABI unsigned int convertToHexString(char *dst, unsigned int hexDigits, bool upperCase, roundingMode) const
Write out a hexadecimal representation of the floating point value to DST, which must be of sufficien...
Definition APFloat.cpp:3323

llvm::detail::IEEEFloat::compareAbsoluteValue
LLVM_ABI cmpResult compareAbsoluteValue(const IEEEFloat &) const
Definition APFloat.cpp:1541

llvm::detail::IEEEFloat::mod
LLVM_ABI opStatus mod(const IEEEFloat &)
C fmod, or llvm frem.
Definition APFloat.cpp:2312

llvm::detail::IEEEFloat::getCategory
fltCategory getCategory() const
Definition APFloat.h:573

llvm::detail::IEEEFloat::convertFromAPInt
LLVM_ABI opStatus convertFromAPInt(const APInt &, bool, roundingMode)
Definition APFloat.cpp:2881

llvm::detail::IEEEFloat::isFiniteNonZero
bool isFiniteNonZero() const
Definition APFloat.h:576

llvm::detail::IEEEFloat::needsCleanup
bool needsCleanup() const
Returns whether this instance allocated memory.
Definition APFloat.h:463

llvm::detail::IEEEFloat::makeLargest
LLVM_ABI void makeLargest(bool Neg=false)
Make this number the largest magnitude normal number in the given semantics.
Definition APFloat.cpp:4109

llvm::detail::IEEEFloat::getExactLog2Abs
LLVM_ABI LLVM_READONLY int getExactLog2Abs() const
Definition APFloat.cpp:4504

llvm::detail::IEEEFloat::bitcastToAPInt
LLVM_ABI APInt bitcastToAPInt() const
Definition APFloat.cpp:3733

llvm::detail::IEEEFloat::scalbn
LLVM_ABI friend IEEEFloat scalbn(IEEEFloat X, int Exp, roundingMode)
Definition APFloat.cpp:4747

llvm::detail::IEEEFloat::compare
LLVM_ABI cmpResult compare(const IEEEFloat &) const
IEEE comparison with another floating point number (NaNs compare unordered, 0==-0).
Definition APFloat.cpp:2483

llvm::detail::IEEEFloat::isNegative
bool isNegative() const
IEEE-754R isSignMinus: Returns true if and only if the current value is negative.
Definition APFloat.h:538

llvm::detail::IEEEFloat::divide
LLVM_ABI opStatus divide(const IEEEFloat &, roundingMode)
Definition APFloat.cpp:2182

llvm::detail::IEEEFloat::isNaN
bool isNaN() const
Returns true if and only if the float is a quiet or signaling NaN.
Definition APFloat.h:563

llvm::detail::IEEEFloat::remainder
LLVM_ABI opStatus remainder(const IEEEFloat &)
IEEE remainder.
Definition APFloat.cpp:2202

llvm::detail::IEEEFloat::convertToDouble
LLVM_ABI double convertToDouble() const
Definition APFloat.cpp:3803

llvm::detail::IEEEFloat::convertToFloat
LLVM_ABI float convertToFloat() const
Definition APFloat.cpp:3796

llvm::detail::IEEEFloat::subtract
LLVM_ABI opStatus subtract(const IEEEFloat &, roundingMode)
Definition APFloat.cpp:2156

llvm::detail::IEEEFloat::toString
LLVM_ABI void toString(SmallVectorImpl< char > &Str, unsigned FormatPrecision=0, unsigned FormatMaxPadding=3, bool TruncateZero=true) const
Converts this value into a decimal string.
Definition APFloat.cpp:4460

llvm::detail::IEEEFloat::~IEEEFloat
LLVM_ABI ~IEEEFloat()
Definition APFloat.cpp:1220

llvm::detail::IEEEFloat::makeSmallest
LLVM_ABI void makeSmallest(bool Neg=false)
Make this number the smallest magnitude denormal number in the given semantics.
Definition APFloat.cpp:4141

llvm::detail::IEEEFloat::makeInf
LLVM_ABI void makeInf(bool Neg=false)
Definition APFloat.cpp:4694

llvm::detail::IEEEFloat::isSmallestNormalized
LLVM_ABI bool isSmallestNormalized() const
Returns true if this is the smallest (by magnitude) normalized finite number in the given semantics.
Definition APFloat.cpp:1041

llvm::detail::IEEEFloat::makeQuiet
LLVM_ABI void makeQuiet()
Definition APFloat.cpp:4723

llvm::detail::IEEEFloat::isLargest
LLVM_ABI bool isLargest() const
Returns true if and only if the number has the largest possible finite magnitude in the current seman...
Definition APFloat.cpp:1143

llvm::detail::IEEEFloat::add
LLVM_ABI opStatus add(const IEEEFloat &, roundingMode)
Definition APFloat.cpp:2150

llvm::detail::IEEEFloat::isFinite
bool isFinite() const
Returns true if and only if the current value is zero, subnormal, or normal.
Definition APFloat.h:550

llvm::detail::IEEEFloat::convertFromString
LLVM_ABI Expected< opStatus > convertFromString(StringRef, roundingMode)
Definition APFloat.cpp:3266

llvm::detail::IEEEFloat::makeNaN
LLVM_ABI void makeNaN(bool SNaN=false, bool Neg=false, const APInt *fill=nullptr)
Definition APFloat.cpp:930

llvm::detail::IEEEFloat::multiply
LLVM_ABI opStatus multiply(const IEEEFloat &, roundingMode)
Definition APFloat.cpp:2162

llvm::detail::IEEEFloat::roundToIntegral
LLVM_ABI opStatus roundToIntegral(roundingMode)
Definition APFloat.cpp:2396

llvm::detail::IEEEFloat::operator=
LLVM_ABI IEEEFloat & operator=(const IEEEFloat &)
Definition APFloat.cpp:1002

llvm::detail::IEEEFloat::bitwiseIsEqual
LLVM_ABI bool bitwiseIsEqual(const IEEEFloat &) const
Bitwise comparison for equality (QNaNs compare equal, 0!=-0).
Definition APFloat.cpp:1168

llvm::detail::IEEEFloat::makeSmallestNormalized
LLVM_ABI void makeSmallestNormalized(bool Negative=false)
Make this number the smallest (by magnitude) normalized finite number in the given semantics.
Definition APFloat.cpp:4155

llvm::detail::IEEEFloat::isInteger
LLVM_ABI bool isInteger() const
Returns true if and only if the number is an exact integer.
Definition APFloat.cpp:1160

llvm::detail::IEEEFloat::IEEEFloat
LLVM_ABI IEEEFloat(const fltSemantics &)
Definition APFloat.cpp:1195

llvm::detail::IEEEFloat::fusedMultiplyAdd
LLVM_ABI opStatus fusedMultiplyAdd(const IEEEFloat &, const IEEEFloat &, roundingMode)
Definition APFloat.cpp:2350

llvm::detail::IEEEFloat::ilogb
LLVM_ABI friend int ilogb(const IEEEFloat &Arg)
Definition APFloat.cpp:4729

llvm::detail::IEEEFloat::next
LLVM_ABI opStatus next(bool nextDown)
IEEE-754R 5.3.1: nextUp/nextDown.
Definition APFloat.cpp:4549

llvm::detail::IEEEFloat::isInfinity
bool isInfinity() const
IEEE-754R isInfinite(): Returns true if and only if the float is infinity.
Definition APFloat.h:560

llvm::detail::IEEEFloat::getSemantics
const fltSemantics & getSemantics() const
Definition APFloat.h:574

llvm::detail::IEEEFloat::isZero
bool isZero() const
Returns true if and only if the float is plus or minus zero.
Definition APFloat.h:553

llvm::detail::IEEEFloat::isSignaling
LLVM_ABI bool isSignaling() const
Returns true if and only if the float is a signaling NaN.
Definition APFloat.cpp:4533

llvm::detail::IEEEFloat::makeZero
LLVM_ABI void makeZero(bool Neg=false)
Definition APFloat.cpp:4709

llvm::detail::IEEEFloat::convert
LLVM_ABI opStatus convert(const fltSemantics &, roundingMode, bool *)
IEEEFloat::convert - convert a value of one floating point type to another.
Definition APFloat.cpp:2560

llvm::detail::IEEEFloat::changeSign
LLVM_ABI void changeSign()
Definition APFloat.cpp:2106

llvm::detail::IEEEFloat::isDenormal
LLVM_ABI bool isDenormal() const
IEEE-754R isSubnormal(): Returns true if and only if the float is a denormal.
Definition APFloat.cpp:1027

llvm::detail::IEEEFloat::convertToInteger
LLVM_ABI opStatus convertToInteger(MutableArrayRef< integerPart >, unsigned int, bool, roundingMode, bool *) const
Definition APFloat.cpp:2821

llvm::detail::IEEEFloat::isSmallest
LLVM_ABI bool isSmallest() const
Returns true if and only if the number has the smallest possible non-zero magnitude in the current se...
Definition APFloat.cpp:1033

llvm::hash_code
An opaque object representing a hash code.
Definition Hashing.h:76

llvm::raw_ostream
This class implements an extremely fast bulk output stream that can only output to a stream.
Definition raw_ostream.h:53

uint64_t

uint8_t

llvm_unreachable
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
Definition ErrorHandling.h:164

Error.h

detail
Definition ClauseT.h:111

llvm::AArch64::RM
@ RM
Definition AArch64ISelLowering.h:34

llvm::ARCCC::Z
@ Z
Definition ARCInfo.h:41

llvm::CallingConv::C
@ C
The default llvm calling convention, compatible with C.
Definition CallingConv.h:34

llvm::M68k::MemAddrModeKind::q
@ q
Definition M68kBaseInfo.h:66

llvm::M68k::MemAddrModeKind::u
@ u
Definition M68kBaseInfo.h:60

llvm::M68k::MemAddrModeKind::p
@ p
Definition M68kBaseInfo.h:55

llvm::M68k::MemAddrModeKind::v
@ v
Definition M68kBaseInfo.h:62

llvm::detail::opInexact
static constexpr opStatus opInexact
Definition APFloat.h:439

llvm::detail::abs
LLVM_ABI SlowDynamicAPInt abs(const SlowDynamicAPInt &X)
Redeclarations of friend declarations above to make it discoverable by lookups.
Definition SlowDynamicAPInt.cpp:190

llvm::detail::fcNaN
static constexpr fltCategory fcNaN
Definition APFloat.h:441

llvm::detail::opDivByZero
static constexpr opStatus opDivByZero
Definition APFloat.h:436

llvm::detail::opOverflow
static constexpr opStatus opOverflow
Definition APFloat.h:437

llvm::detail::cmpLessThan
static constexpr cmpResult cmpLessThan
Definition APFloat.h:431

llvm::detail::value
const char unit< Period >::value[]
Definition Chrono.h:104

llvm::detail::tcSetLeastSignificantBits
static void tcSetLeastSignificantBits(APInt::WordType *dst, unsigned parts, unsigned bits)
Definition APFloat.cpp:1566

llvm::detail::rmTowardPositive
static constexpr roundingMode rmTowardPositive
Definition APFloat.h:427

llvm::detail::uninitialized
static constexpr uninitializedTag uninitialized
Definition APFloat.h:421

llvm::detail::fcZero
static constexpr fltCategory fcZero
Definition APFloat.h:443

llvm::detail::opOK
static constexpr opStatus opOK
Definition APFloat.h:434

llvm::detail::cmpGreaterThan
static constexpr cmpResult cmpGreaterThan
Definition APFloat.h:432

llvm::detail::integerPartWidth
static constexpr unsigned integerPartWidth
Definition APFloat.h:429

llvm::detail::hash_value
LLVM_ABI hash_code hash_value(const IEEEFloat &Arg)
Definition APFloat.cpp:3471

llvm::detail::ExponentType
APFloatBase::ExponentType ExponentType
Definition APFloat.h:420

llvm::detail::fcNormal
static constexpr fltCategory fcNormal
Definition APFloat.h:442

llvm::detail::opInvalidOp
static constexpr opStatus opInvalidOp
Definition APFloat.h:435

llvm::detail::opStatus
APFloatBase::opStatus opStatus
Definition APFloat.h:417

llvm::detail::frexp
LLVM_ABI IEEEFloat frexp(const IEEEFloat &Val, int &Exp, roundingMode RM)
Definition APFloat.cpp:4768

llvm::detail::uninitializedTag
APFloatBase::uninitializedTag uninitializedTag
Definition APFloat.h:415

llvm::detail::cmpUnordered
static constexpr cmpResult cmpUnordered
Definition APFloat.h:433

llvm::detail::rmTowardNegative
static constexpr roundingMode rmTowardNegative
Definition APFloat.h:426

llvm::detail::roundingMode
APFloatBase::roundingMode roundingMode
Definition APFloat.h:416

llvm::detail::cmpResult
APFloatBase::cmpResult cmpResult
Definition APFloat.h:418

llvm::detail::fcInfinity
static constexpr fltCategory fcInfinity
Definition APFloat.h:440

llvm::detail::rmNearestTiesToAway
static constexpr roundingMode rmNearestTiesToAway
Definition APFloat.h:424

llvm::detail::rmTowardZero
static constexpr roundingMode rmTowardZero
Definition APFloat.h:428

llvm::detail::opUnderflow
static constexpr opStatus opUnderflow
Definition APFloat.h:438

llvm::detail::rmNearestTiesToEven
static constexpr roundingMode rmNearestTiesToEven
Definition APFloat.h:422

llvm::detail::ilogb
LLVM_ABI int ilogb(const IEEEFloat &Arg)
Definition APFloat.cpp:4729

llvm::detail::cmpEqual
static constexpr cmpResult cmpEqual
Definition APFloat.h:430

llvm::detail::scalbn
LLVM_ABI IEEEFloat scalbn(IEEEFloat X, int Exp, roundingMode)
Definition APFloat.cpp:4747

llvm::detail::fastTwoSum
static std::pair< APFloat, APFloat > fastTwoSum(APFloat X, APFloat Y)
Definition APFloat.cpp:4857

llvm::detail::integerPart
APFloatBase::integerPart integerPart
Definition APFloat.h:414

llvm::lltok::APSInt
@ APSInt
Definition LLToken.h:520

llvm::lltok::APFloat
@ APFloat
Definition LLToken.h:519

llvm::pdb::Double
@ Double
Definition PDBTypes.h:402

llvm::sys::fs
Definition FileSystem.h:50

llvm::sys::fs::status
LLVM_ABI std::error_code status(const Twine &path, file_status &result, bool follow=true)
Get file status as if by POSIX stat().

llvm::tgtok::dot
@ dot
Definition TGLexer.h:50

llvm
This is an optimization pass for GlobalISel generic memory operations.
Definition AddressRanges.h:18

llvm::partAsHex
static unsigned int partAsHex(char *dst, APFloatBase::integerPart part, unsigned int count, const char *hexDigitChars)
Definition APFloat.cpp:821

llvm::fill
void fill(R &&Range, T &&Value)
Provide wrappers to std::fill which take ranges instead of having to pass begin/end explicitly.
Definition STLExtras.h:1745

llvm::infinityL
static const char infinityL[]
Definition APFloat.cpp:812

llvm::all_of
bool all_of(R &&range, UnaryPredicate P)
Provide wrappers to std::all_of which take ranges instead of having to pass begin/end explicitly.
Definition STLExtras.h:1725

llvm::ChangePrinter::Quiet
@ Quiet
Definition PrintPasses.h:21

llvm::partCountForBits
static constexpr unsigned int partCountForBits(unsigned int bits)
Definition APFloat.cpp:385

llvm::NaNU
static const char NaNU[]
Definition APFloat.cpp:815

llvm::HUerrBound
static unsigned int HUerrBound(bool inexactMultiply, unsigned int HUerr1, unsigned int HUerr2)
Definition APFloat.cpp:696

llvm::powerOf5
static unsigned int powerOf5(APFloatBase::integerPart *dst, unsigned int power)
Definition APFloat.cpp:755

llvm::hexDigitValue
unsigned hexDigitValue(char C)
Interpret the given character C as a hexadecimal digit and return its value.
Definition StringExtras.h:81

llvm::harrisonUlp
static APFloat harrisonUlp(const APFloat &X)
Definition APFloat.cpp:872

llvm::exponentZero
static constexpr APFloatBase::ExponentType exponentZero(const fltSemantics &semantics)
Definition APFloat.cpp:359

llvm::totalExponent
static Expected< int > totalExponent(StringRef::iterator p, StringRef::iterator end, int exponentAdjustment)
Definition APFloat.cpp:447

llvm::inconvertibleErrorCode
LLVM_ABI std::error_code inconvertibleErrorCode()
The value returned by this function can be returned from convertToErrorCode for Error values where no sensible translation to std::error_code exists.
Definition Error.cpp:98

llvm::maxPowerOfFiveExponent
const unsigned int maxPowerOfFiveExponent
Definition APFloat.cpp:285

llvm::ilogb
int ilogb(const APFloat &Arg)
Returns the exponent of the internal representation of the APFloat.
Definition APFloat.h:1516

llvm::writeUnsignedDecimal
static char * writeUnsignedDecimal(char *dst, unsigned int n)
Definition APFloat.cpp:839

llvm::popcount
constexpr int popcount(T Value) noexcept
Count the number of set bits in a value.
Definition bit.h:154

llvm::maxPrecision
const unsigned int maxPrecision
Definition APFloat.cpp:284

llvm::frexp
APFloat frexp(const APFloat &X, int &Exp, APFloat::roundingMode RM)
Equivalent of C standard library function.
Definition APFloat.h:1537

llvm::NaNL
static const char NaNL[]
Definition APFloat.cpp:814

llvm::countr_zero
int countr_zero(T Val)
Count number of 0's from the least significant bit to the most stopping at the first 1.
Definition bit.h:202

llvm::infinityU
static const char infinityU[]
Definition APFloat.cpp:813

llvm::lostFraction
lostFraction
Enum that represents what fraction of the LSB truncated bits of an fp number represent.
Definition APFloat.h:50

llvm::lfMoreThanHalf
@ lfMoreThanHalf
Definition APFloat.h:54

llvm::lfLessThanHalf
@ lfLessThanHalf
Definition APFloat.h:52

llvm::lfExactlyHalf
@ lfExactlyHalf
Definition APFloat.h:53

llvm::lfExactlyZero
@ lfExactlyZero
Definition APFloat.h:51

llvm::interpretDecimal
static Error interpretDecimal(StringRef::iterator begin, StringRef::iterator end, decimalInfo *D)
Definition APFloat.cpp:539

llvm::isFinite
LLVM_ABI bool isFinite(const Loop *L)
Return true if this loop can be assumed to run for a finite number of iterations.
Definition LoopInfo.cpp:1152

llvm::FPClassTest
FPClassTest
Floating-point class tests, supported by 'is_fpclass' intrinsic.
Definition FloatingPointMode.h:240

llvm::fcNegSubnormal
@ fcNegSubnormal
Definition FloatingPointMode.h:247

llvm::fcPosNormal
@ fcPosNormal
Definition FloatingPointMode.h:251

llvm::fcQNan
@ fcQNan
Definition FloatingPointMode.h:244

llvm::fcNegZero
@ fcNegZero
Definition FloatingPointMode.h:248

llvm::fcNegInf
@ fcNegInf
Definition FloatingPointMode.h:245

llvm::fcPosZero
@ fcPosZero
Definition FloatingPointMode.h:249

llvm::fcSNan
@ fcSNan
Definition FloatingPointMode.h:243

llvm::fcNegNormal
@ fcNegNormal
Definition FloatingPointMode.h:246

llvm::fcZero
@ fcZero
Definition FloatingPointMode.h:258

llvm::fcPosSubnormal
@ fcPosSubnormal
Definition FloatingPointMode.h:250

llvm::fcPosInf
@ fcPosInf
Definition FloatingPointMode.h:252

llvm::maxPowerOfFiveParts
const unsigned int maxPowerOfFiveParts
Definition APFloat.cpp:286

llvm::scalbn
APFloat scalbn(APFloat X, int Exp, APFloat::roundingMode RM)
Returns: X * 2^Exp for integral exponents.
Definition APFloat.h:1525

llvm::dbgs
LLVM_ABI raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
Definition Debug.cpp:207

llvm::exponentNaN
static constexpr APFloatBase::ExponentType exponentNaN(const fltSemantics &semantics)
Definition APFloat.cpp:369

llvm::createError
static Error createError(const Twine &Err)
Definition APFloat.cpp:381

llvm::shiftRight
static lostFraction shiftRight(APFloatBase::integerPart *dst, unsigned int parts, unsigned int bits)
Definition APFloat.cpp:662

llvm::make_error
Error make_error(ArgTs &&... Args)
Make an Error instance representing failure using the given error info type.
Definition Error.h:340

llvm::PackElem::Hi
@ Hi
Definition VECustomDAG.h:132

llvm::PackElem::Lo
@ Lo
Definition VECustomDAG.h:131

llvm::IRMemLocation::First
@ First
Helpers to iterate all locations in the MemoryEffectsBase class.
Definition ModRef.h:74

llvm::hexDigitsUpper
static const char hexDigitsUpper[]
Definition APFloat.cpp:811

llvm::Data
FunctionAddr VTableAddr uintptr_t uintptr_t Data
Definition InstrProf.h:189

llvm::instrprof_error::truncated
@ truncated
Definition InstrProf.h:407

llvm::maxExponent
const unsigned int maxExponent
Definition APFloat.cpp:283

llvm::decDigitValue
static unsigned int decDigitValue(unsigned int c)
Definition APFloat.cpp:392

llvm::fltNonfiniteBehavior
fltNonfiniteBehavior
Definition APFloat.cpp:57

llvm::fltNonfiniteBehavior::IEEE754
@ IEEE754
Definition APFloat.cpp:61

llvm::fltNonfiniteBehavior::NanOnly
@ NanOnly
Definition APFloat.cpp:70

llvm::fltNonfiniteBehavior::FiniteOnly
@ FiniteOnly
Definition APFloat.cpp:74

llvm::count
auto count(R &&Range, const E &Element)
Wrapper function around std::count to count the number of times an element Element occurs in the given range Range.
Definition STLExtras.h:1954

llvm::combineLostFractions
static lostFraction combineLostFractions(lostFraction moreSignificant, lostFraction lessSignificant)
Definition APFloat.cpp:675

llvm::skipLeadingZeroesAndAnyDot
static Expected< StringRef::iterator > skipLeadingZeroesAndAnyDot(StringRef::iterator begin, StringRef::iterator end, StringRef::iterator *dot)
Definition APFloat.cpp:499

llvm::RoundingMode
RoundingMode
Rounding mode.
Definition FloatingPointMode.h:38

llvm::ArrayRef
ArrayRef(const T &OneElt) -> ArrayRef< T >

llvm::exponentInf
static constexpr APFloatBase::ExponentType exponentInf(const fltSemantics &semantics)
Definition APFloat.cpp:364

llvm::HighlightColor::Error
@ Error
Definition WithColor.h:34

llvm::lostFractionThroughTruncation
static lostFraction lostFractionThroughTruncation(const APFloatBase::integerPart *parts, unsigned int partCount, unsigned int bits)
Definition APFloat.cpp:640

llvm::neg
APFloat neg(APFloat X)
Returns the negated value of the argument.
Definition APFloat.h:1551

llvm::ulpsFromBoundary
static APFloatBase::integerPart ulpsFromBoundary(const APFloatBase::integerPart *parts, unsigned int bits, bool isNearest)
Definition APFloat.cpp:710

llvm::writeSignedDecimal
static char * writeSignedDecimal(char *dst, int value)
Definition APFloat.cpp:857

llvm::hash_combine
hash_code hash_combine(const Ts &...args)
Combine values into a single hash_code.
Definition Hashing.h:592

llvm::trailingHexadecimalFraction
static Expected< lostFraction > trailingHexadecimalFraction(StringRef::iterator p, StringRef::iterator end, unsigned int digitValue)
Definition APFloat.cpp:609

llvm::consumeError
void consumeError(Error Err)
Consume an Error without doing anything.
Definition Error.h:1083

llvm::fltNanEncoding
fltNanEncoding
Definition APFloat.cpp:81

llvm::fltNanEncoding::NegativeZero
@ NegativeZero
Definition APFloat.cpp:99

llvm::fltNanEncoding::AllOnes
@ AllOnes
Definition APFloat.cpp:92

llvm::fltNanEncoding::IEEE
@ IEEE
Definition APFloat.cpp:84

llvm::readExponent
static Expected< int > readExponent(StringRef::iterator begin, StringRef::iterator end)
Definition APFloat.cpp:402

llvm::hash_combine_range
hash_code hash_combine_range(InputIteratorT first, InputIteratorT last)
Compute a hash_code for a sequence of values.
Definition Hashing.h:466

llvm::NextPowerOf2
constexpr uint64_t NextPowerOf2(uint64_t A)
Returns the next power of two (in 64-bits) that is strictly greater than A.
Definition MathExtras.h:373

llvm::hexDigitsLower
static const char hexDigitsLower[]
Definition APFloat.cpp:810

raw_ostream.h

N
#define N

Status
Definition SIModeRegister.cpp:29

llvm::decimalInfo
Definition APFloat.cpp:532

llvm::decimalInfo::normalizedExponent
int normalizedExponent
Definition APFloat.cpp:536

llvm::decimalInfo::exponent
int exponent
Definition APFloat.cpp:535

llvm::decimalInfo::lastSigDigit
const char * lastSigDigit
Definition APFloat.cpp:534

llvm::decimalInfo::firstSigDigit
const char * firstSigDigit
Definition APFloat.cpp:533

llvm::fltSemantics
Definition APFloat.cpp:103

llvm::fltSemantics::hasSignBitInMSB
bool hasSignBitInMSB
Definition APFloat.cpp:130

llvm::fltSemantics::maxExponent
APFloatBase::ExponentType maxExponent
Definition APFloat.cpp:106

llvm::fltSemantics::nonFiniteBehavior
fltNonfiniteBehavior nonFiniteBehavior
Definition APFloat.cpp:119

llvm::fltSemantics::minExponent
APFloatBase::ExponentType minExponent
Definition APFloat.cpp:110

llvm::fltSemantics::hasSignedRepr
bool hasSignedRepr
Definition APFloat.cpp:127

llvm::fltSemantics::sizeInBits
unsigned int sizeInBits
Definition APFloat.cpp:117

llvm::fltSemantics::precision
unsigned int precision
Definition APFloat.cpp:114

llvm::fltSemantics::hasZero
bool hasZero
Definition APFloat.cpp:124

llvm::fltSemantics::nanEncoding
fltNanEncoding nanEncoding
Definition APFloat.cpp:121