doxygen/ScaledNumber_8cpp_source.html

//==- lib/Support/ScaledNumber.cpp - Support for scaled numbers -*- C++ -*-===//

//

// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

// See https://llvm.org/LICENSE.txt for license information.

// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

//

//===----------------------------------------------------------------------===//

//

// Implementation of some scaled number algorithms.

//

//===----------------------------------------------------------------------===//


#include "llvm/Support/ScaledNumber.h"

#include "llvm/ADT/APFloat.h"

#include "llvm/ADT/ArrayRef.h"

#include "llvm/Support/Debug.h"

#include "llvm/Support/raw_ostream.h"


using namespace llvm;

using namespace llvm::ScaledNumbers;


/// Multiply two 64-bit integers, returning the product as 64 bits of digits
/// plus a scale.
///
/// The full 128-bit product is assembled from 32-bit halves.  When it fits in
/// 64 bits it is returned exactly with a scale of 0; otherwise the most
/// significant 64 bits are kept, the scale records how many low bits were
/// dropped, and the highest dropped bit decides whether getRounded() rounds up.
std::pair<uint64_t, int16_t> ScaledNumbers::multiply64(uint64_t LHS,
                                                       uint64_t RHS) {
  // View each operand as a pair of 32-bit digits (high, low).
  const uint64_t HiL = LHS >> 32;
  const uint64_t LoL = LHS & UINT32_MAX;
  const uint64_t HiR = RHS >> 32;
  const uint64_t LoR = RHS & UINT32_MAX;

  // The 128-bit product lives in two 64-bit digits, High:Low.  The high*high
  // and low*low partial products land in them directly.
  uint64_t High = HiL * HiR;
  uint64_t Low = LoL * LoR;

  // Each mixed partial product straddles the two digits: its low half goes to
  // the top of Low (carrying into High on wrap-around), its high half to High.
  const uint64_t CrossTerms[] = {HiL * LoR, LoL * HiR};
  for (const uint64_t Term : CrossTerms) {
    const uint64_t Sum = Low + ((Term & UINT32_MAX) << 32);
    High += (Term >> 32) + (Sum < Low);
    Low = Sum;
  }

  // Nothing in the upper digit: the product is exact in 64 bits.
  if (High == 0)
    return std::make_pair(Low, 0);

  // Normalize so the top bit of High is set, dropping as few bits as possible.
  const unsigned LeadingZeros = llvm::countl_zero(High);
  const int Shift = 64 - LeadingZeros;
  if (LeadingZeros != 0)
    High = (High << LeadingZeros) | (Low >> Shift);

  // Round on the most significant bit that was shifted out of Low.
  const bool RoundUp = Shift && (Low & (UINT64_C(1) << (Shift - 1)));
  return getRounded(High, Shift, RoundUp);
}


/// Return half of \p N, rounded up (N / 2 for even N, N / 2 + 1 for odd N).
static uint64_t getHalf(uint64_t N) {
  const uint64_t Floor = N / 2;
  const uint64_t Odd = N % 2;
  return Floor + Odd;
}


/// Divide two non-zero 32-bit integers, returning the quotient as 32 bits of
/// digits plus a scale.
///
/// The dividend is widened to 64 bits and shifted fully to the left before
/// dividing; the (negative) scale records that shift.
std::pair<uint32_t, int16_t> ScaledNumbers::divide32(uint32_t Dividend,
                                                     uint32_t Divisor) {
  assert(Dividend && "expected non-zero dividend");
  assert(Divisor && "expected non-zero divisor");

  // Widen and left-justify the dividend so the 64-bit divide yields as many
  // quotient bits as possible.  A shift of zero would be a no-op, so no guard
  // is needed.
  uint64_t Wide = Dividend;
  const int Zeros = llvm::countl_zero(Wide);
  Wide <<= Zeros;
  const int Scale = -Zeros;

  const uint64_t Quot = Wide / Divisor;

  // A quotient wider than 32 bits has to be shifted down; getAdjusted() takes
  // care of the rounding in that case.
  if (Quot > UINT32_MAX)
    return getAdjusted<uint32_t>(Quot, Scale);

  // Otherwise round up when the remainder is at least half the divisor.
  const uint64_t Rem = Wide % Divisor;
  return getRounded<uint32_t>(Quot, Scale, Rem >= getHalf(Divisor));
}


/// Divide two non-zero 64-bit integers, returning the quotient as 64 bits of
/// digits plus a scale.
///
/// Trailing zero bits are stripped from the divisor and the dividend is
/// left-justified (both adjustments are folded into the scale).  After one
/// hardware divide, further quotient bits are produced by binary long division
/// until the quotient's top bit is set or the remainder reaches zero.
std::pair<uint64_t, int16_t> ScaledNumbers::divide64(uint64_t Dividend,
                                                     uint64_t Divisor) {
  assert(Dividend && "expected non-zero dividend");
  assert(Divisor && "expected non-zero divisor");

  // Make the divisor as small as possible by dropping its trailing zeros.
  const int TrailingZeros = llvm::countr_zero(Divisor);
  Divisor >>= TrailingZeros;
  int Scale = -TrailingZeros;

  // The divisor was a power of two: the digits are just the dividend.
  if (Divisor == 1)
    return std::make_pair(Dividend, Scale);

  // Make the dividend as large as possible by left-justifying it.
  const int LeadingZeros = llvm::countl_zero(Dividend);
  Dividend <<= LeadingZeros;
  Scale -= LeadingZeros;

  // Seed the result with a single full-width divide.
  uint64_t Quotient = Dividend / Divisor;
  uint64_t Remainder = Dividend % Divisor;

  // Long division: produce one more quotient bit per iteration.
  while (Remainder != 0 && (Quotient >> 63) == 0) {
    // Doubling the remainder may carry out of 64 bits; remember that, since
    // the true (65-bit) value is then certainly >= Divisor.
    const bool Overflowed = (Remainder >> 63) != 0;
    Remainder <<= 1;
    Quotient <<= 1;
    --Scale;

    if (Overflowed || Remainder >= Divisor) {
      // Unsigned wrap-around makes this subtraction correct in the overflow
      // case as well.
      Remainder -= Divisor;
      Quotient |= 1;
    }
  }

  // Round up when the final remainder is at least half the divisor.
  return getRounded(Quotient, Scale, Remainder >= getHalf(Divisor));
}


/// Three-way compare of \p L against \p R * 2^ScaleDiff without overflowing.
///
/// \p ScaleDiff must be in [0, 64).  Returns -1, 0 or 1 when L is respectively
/// less than, equal to, or greater than R * 2^ScaleDiff.
int ScaledNumbers::compareImpl(uint64_t L, uint64_t R, int ScaleDiff) {
  assert(ScaleDiff >= 0 && "wrong argument order");
  assert(ScaleDiff < 64 && "numbers too far apart");

  // Bring L down to R's scale and compare the aligned digits first.
  const uint64_t Shifted = L >> ScaleDiff;
  if (Shifted != R)
    return Shifted < R ? -1 : 1;

  // The aligned digits match, so L is larger exactly when the right shift
  // discarded some non-zero low bits.
  const uint64_t Restored = Shifted << ScaleDiff;
  return L > Restored ? 1 : 0;
}


/// Append the decimal digit \p D (which must be in [0, 9]) to \p Str as an
/// ASCII character.
static void appendDigit(std::string &Str, unsigned D) {
  assert(D < 10);
  const char Glyph = static_cast<char>('0' + D % 10);
  Str.push_back(Glyph);
}


/// Append the decimal digits of \p N to \p Str, least significant digit
/// first.  Nothing is appended when \p N is zero.
static void appendNumber(std::string &Str, uint64_t N) {
  for (; N != 0; N /= 10)
    appendDigit(Str, N % 10);
}


/// Return true if \p Digit is one of the characters '5' through '9', i.e. a
/// decimal digit that rounds the preceding digit up.
static bool doesRoundUp(char Digit) {
  return '5' <= Digit && Digit <= '9';
}


static std::string toStringAPFloat(uint64_t D, int E, unsigned Precision) {

  assert(E >= ScaledNumbers::MinScale);

  assert(E <= ScaledNumbers::MaxScale);


  // Find a new E, but don't let it increase past MaxScale.

  int LeadingZeros = ScaledNumberBase::countLeadingZeros64(D);

  int NewE = std::min(ScaledNumbers::MaxScale, E + 63 - LeadingZeros);

  int Shift = 63 - (NewE - E);

  assert(Shift <= LeadingZeros);

  assert(Shift == LeadingZeros || NewE == ScaledNumbers::MaxScale);

  assert(Shift >= 0 && Shift < 64 && "undefined behavior");

  D <<= Shift;

  E = NewE;


  // Check for a denormal.

  unsigned AdjustedE = E + 16383;

  if (!(D >> 63)) {

    assert(E == ScaledNumbers::MaxScale);

    AdjustedE = 0;

  }


  // Build the float and print it.

  uint64_t RawBits[2] = {D, AdjustedE};

  APFloat Float(APFloat::x87DoubleExtended(), APInt(80, RawBits));

  SmallVector<char, 24> Chars;

  Float.toString(Chars, Precision, 0);

  return std::string(Chars.begin(), Chars.end());

}


/// Return \p Float with its trailing '0' characters removed, keeping one
/// character after a '.' so that e.g. "1.000" becomes "1.0" rather than "1.".
///
/// \p Float must contain at least one character other than '0'.
static std::string stripTrailingZeros(const std::string &Float) {
  const size_t Last = Float.find_last_not_of('0');
  assert(Last != std::string::npos && "no . in floating point string");

  // Keep everything up to the last non-zero character; when that character
  // is the decimal point, keep one more so a digit follows it.
  const size_t Keep = Last + (Float[Last] == '.' ? 2 : 1);
  return std::string(Float, 0, Keep);
}


/// Render the scaled number D * 2^E as a decimal string.
///
/// \param D         The digits.  A value of zero yields "0.0".
/// \param E         The binary exponent (scale) applied to \p D.
/// \param Width     Only used to derive the initial error bound,
///                  1 << (64 - Width), that stops digit generation once the
///                  remaining fraction is below half of it.
///                  NOTE(review): presumably the bit width of the digits type
///                  (e.g. 32 or 64) -- confirm against callers; 0 would shift
///                  by 64.
/// \param Precision Maximum number of significant digits to emit; 0 means no
///                  limit.  Also forwarded to toStringAPFloat().
/// \returns The formatted number.  Values whose integer and fractional parts
///          cannot both be extracted into 64-bit words here are formatted by
///          toStringAPFloat() instead.
std::string ScaledNumberBase::toString(uint64_t D, int16_t E, int Width,

                                       unsigned Precision) {

  if (!D)

    return "0.0";


  // Canonicalize exponent and digits.

  // Above0 holds the integer part.  Below0 holds the first 64 fractional bits
  // (most significant fractional bit at bit 63).  Extra holds fractional bits
  // beyond those, and ExtraShift is how far Below0 was shifted right to make
  // room for leading zero bits when E < -64.
  uint64_t Above0 = 0;

  uint64_t Below0 = 0;

  uint64_t Extra = 0;

  int ExtraShift = 0;

  if (E == 0) {

    Above0 = D;

  } else if (E > 0) {

    // Try to absorb the exponent by shifting D left into its leading zeros.
    // If E cannot be brought down to zero, Above0 stays 0 and the APFloat
    // fallback below is taken.
    if (int Shift = std::min(int16_t(countLeadingZeros64(D)), E)) {

      D <<= Shift;

      E -= Shift;


      if (!E)

        Above0 = D;

    }

  } else if (E > -64) {

    // -64 < E < 0: split D at the binary point.
    Above0 = D >> -E;

    Below0 = D << (64 + E);

  } else if (E == -64) {

    // Special case: shift by 64 bits is undefined behavior.

    Below0 = D;

  } else if (E > -120) {

    // -120 < E < -64: the value is purely fractional with leading zero bits;
    // the bits that fall off the bottom of Below0 are preserved in Extra.
    Below0 = D >> (-E - 64);

    Extra = D << (128 + E);

    ExtraShift = -64 - E;

  }

  // For E <= -120 none of the branches above fire, so both parts stay zero.


  // Fall back on APFloat for very small and very large numbers.

  if (!Above0 && !Below0)

    return toStringAPFloat(D, E, Precision);


  // Append the digits before the decimal.

  std::string Str;

  // Number of significant digits emitted so far.
  size_t DigitsOut = 0;

  if (Above0) {

    appendNumber(Str, Above0);

    DigitsOut = Str.size();

  } else

    appendDigit(Str, 0);

  // appendNumber() emits the least significant digit first; put the integer
  // part into reading order.
  std::reverse(Str.begin(), Str.end());


  // Return early if there's nothing after the decimal.

  if (!Below0)

    return Str + ".0";


  // Append the decimal and beyond.

  Str += '.';

  // Error bound on the fraction; it is scaled alongside the fraction in the
  // loop below.
  uint64_t Error = UINT64_C(1) << (64 - Width);


  // We need to shift Below0 to the right to make space for calculating

  // digits.  Save the precision we're losing in Extra.

  // After this, both Below0 and Extra use only their low 60 bits, leaving the
  // top 4 bits free to receive the next decimal digit / carry.
  Extra = (Below0 & 0xf) << 56 | (Extra >> 8);

  Below0 >>= 4;

  // Number of digits emitted after the decimal point.
  size_t SinceDot = 0;

  // Index of the first character after the decimal point.
  size_t AfterDot = Str.size();

  do {

    // While ExtraShift is non-zero the error bound is multiplied by 5 instead
    // of 10 and ExtraShift is decremented.
    if (ExtraShift) {

      --ExtraShift;

      Error *= 5;

    } else

      Error *= 10;


    // Multiply the 120-bit fraction (Below0:Extra) by 10: carry Extra's top 4
    // bits into Below0, then the top 4 bits of Below0 are the next digit.
    Below0 *= 10;

    Extra *= 10;

    Below0 += (Extra >> 60);

    Extra = Extra & (UINT64_MAX >> 4);

    appendDigit(Str, Below0 >> 60);

    Below0 = Below0 & (UINT64_MAX >> 4);

    // Leading zeros of a purely fractional number are not significant digits.
    if (DigitsOut || Str.back() != '0')

      ++DigitsOut;

    ++SinceDot;

    // Keep going while the error bound is non-zero, the remaining fraction is
    // at least half of it, and either no precision limit applies, the limit
    // has not been exceeded, or fewer than two digits follow the point.
  } while (Error && (Below0 << 4 | Extra >> 60) >= Error / 2 &&

           (!Precision || DigitsOut <= Precision || SinceDot < 2));


  // Return early for maximum precision.

  if (!Precision || DigitsOut <= Precision)

    return stripTrailingZeros(Str);


  // Find where to truncate.

  // Drop the excess significant digits, but always keep at least one digit
  // after the decimal point.
  size_t Truncate =

      std::max(Str.size() - (DigitsOut - Precision), AfterDot + 1);


  // Check if there's anything to truncate.

  if (Truncate >= Str.size())

    return stripTrailingZeros(Str);


  // The first dropped digit decides whether the kept digits round up.
  bool Carry = doesRoundUp(Str[Truncate]);

  if (!Carry)

    return stripTrailingZeros(Str.substr(0, Truncate));


  // Round with the first truncated digit.

  // Walk backwards from the last kept digit, turning 9s into 0s until a digit
  // can absorb the carry.  Note that the iterator E below shadows the
  // exponent parameter E.
  for (std::string::reverse_iterator I(Str.begin() + Truncate), E = Str.rend();

       I != E; ++I) {

    if (*I == '.')

      continue;

    if (*I == '9') {

      *I = '0';

      continue;

    }


    ++*I;

    Carry = false;

    break;

  }


  // Add "1" in front if we still need to carry.

  return stripTrailingZeros(std::string(Carry, '1') + Str.substr(0, Truncate));

}


/// Write the decimal representation produced by toString(D, E, Width,
/// Precision) to \p OS and return the resulting stream reference.
raw_ostream &ScaledNumberBase::print(raw_ostream &OS, uint64_t D, int16_t E,
                                     int Width, unsigned Precision) {
  const std::string Text = toString(D, E, Width, Precision);
  return OS << Text;
}


void ScaledNumberBase::dump(uint64_t D, int16_t E, int Width) {

  print(dbgs(), D, E, Width, 0) << "[" << Width << ":" << D << "*2^" << E

                                << "]";

}

APFloat.h
This file declares a class to represent arbitrary precision floating point values and provide a varie...

ArrayRef.h

D
static GCRegistry::Add< StatepointGC > D("statepoint-example", "an example strategy for statepoint")

Debug.h

I
#define I(x, y, z)
Definition: MD5.cpp:58

assert
assert(ImpDefSCC.getReg()==AMDGPU::SCC &&ImpDefSCC.isDef())

OS
raw_pwrite_stream & OS
Definition: SampleProfWriter.cpp:53

getHalf
static uint64_t getHalf(uint64_t N)
Definition: ScaledNumber.cpp:55

doesRoundUp
static bool doesRoundUp(char Digit)
Definition: ScaledNumber.cpp:149

toStringAPFloat
static std::string toStringAPFloat(uint64_t D, int E, unsigned Precision)
Definition: ScaledNumber.cpp:162

appendDigit
static void appendDigit(std::string &Str, unsigned D)
Definition: ScaledNumber.cpp:137

stripTrailingZeros
static std::string stripTrailingZeros(const std::string &Float)
Definition: ScaledNumber.cpp:191

appendNumber
static void appendNumber(std::string &Str, uint64_t N)
Definition: ScaledNumber.cpp:142

ScaledNumber.h

RHS
Value * RHS
Definition: X86PartialReduction.cpp:76

LHS
Value * LHS
Definition: X86PartialReduction.cpp:75

llvm::APFloat
Definition: APFloat.h:780

llvm::APInt
Class for arbitrary precision integers.
Definition: APInt.h:76

llvm::Error
Lightweight error class with error context and mandatory checking.
Definition: Error.h:160

llvm::ScaledNumberBase::countLeadingZeros64
static int countLeadingZeros64(uint64_t N)
Definition: ScaledNumber.h:430

llvm::ScaledNumberBase::print
static raw_ostream & print(raw_ostream &OS, uint64_t D, int16_t E, int Width, unsigned Precision)
Definition: ScaledNumber.cpp:315

llvm::ScaledNumberBase::toString
static std::string toString(uint64_t D, int16_t E, int Width, unsigned Precision)
Definition: ScaledNumber.cpp:201

llvm::ScaledNumberBase::dump
static void dump(uint64_t D, int16_t E, int Width)
Definition: ScaledNumber.cpp:320

llvm::SmallVectorTemplateCommon::end
iterator end()
Definition: SmallVector.h:282

llvm::SmallVectorTemplateCommon::begin
iterator begin()
Definition: SmallVector.h:280

llvm::SmallVector
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
Definition: SmallVector.h:1209

llvm::raw_ostream
This class implements an extremely fast bulk output stream that can only output to a stream.
Definition: raw_ostream.h:52

uint32_t

uint64_t

UINT64_MAX
#define UINT64_MAX
Definition: DataTypes.h:77

llvm::ScaledNumbers
Definition: ScaledNumber.h:33

llvm::ScaledNumbers::divide64
std::pair< uint64_t, int16_t > divide64(uint64_t Dividend, uint64_t Divisor)
Divide two 64-bit integers to create a 64-bit scaled number.
Definition: ScaledNumber.cpp:80

llvm::ScaledNumbers::multiply64
std::pair< uint64_t, int16_t > multiply64(uint64_t LHS, uint64_t RHS)
Multiply two 64-bit integers to create a 64-bit scaled number.
Definition: ScaledNumber.cpp:22

llvm::ScaledNumbers::MinScale
const int32_t MinScale
Minimum scale; same as APFloat for easy debug printing.
Definition: ScaledNumber.h:39

llvm::ScaledNumbers::getRounded
std::pair< DigitsT, int16_t > getRounded(DigitsT Digits, int16_t Scale, bool ShouldRound)
Conditionally round up a scaled number.
Definition: ScaledNumber.h:52

llvm::ScaledNumbers::divide32
std::pair< uint32_t, int16_t > divide32(uint32_t Dividend, uint32_t Divisor)
Divide two 32-bit integers to create a 32-bit scaled number.
Definition: ScaledNumber.cpp:57

llvm::ScaledNumbers::MaxScale
const int32_t MaxScale
Maximum scale; same as APFloat for easy debug printing.
Definition: ScaledNumber.h:36

llvm::ScaledNumbers::compareImpl
int compareImpl(uint64_t L, uint64_t R, int ScaleDiff)
Implementation for comparing scaled numbers.
Definition: ScaledNumber.cpp:124

llvm
This is an optimization pass for GlobalISel generic memory operations.
Definition: AddressRanges.h:18

llvm::countr_zero
int countr_zero(T Val)
Count number of 0's from the least significant bit to the most stopping at the first 1.
Definition: bit.h:215

llvm::countl_zero
int countl_zero(T Val)
Count number of 0's from the most significant bit to the least stopping at the first 1.
Definition: bit.h:281

llvm::HexPrintStyle::Upper
@ Upper

llvm::HexPrintStyle::Lower
@ Lower

llvm::dbgs
raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
Definition: Debug.cpp:163

raw_ostream.h

N
#define N