lib/Support/APInt.cpp

f22ef01cSRoman Divacky//===-- APInt.cpp - Implement APInt class ---------------------------------===//
f22ef01cSRoman Divacky//
f22ef01cSRoman Divacky//                     The LLVM Compiler Infrastructure
f22ef01cSRoman Divacky//
f22ef01cSRoman Divacky// This file is distributed under the University of Illinois Open Source
f22ef01cSRoman Divacky// License. See LICENSE.TXT for details.
f22ef01cSRoman Divacky//
f22ef01cSRoman Divacky//===----------------------------------------------------------------------===//
f22ef01cSRoman Divacky//
f22ef01cSRoman Divacky// This file implements a class to represent arbitrary precision integer
f22ef01cSRoman Divacky// constant values and provide a variety of arithmetic operations on them.
f22ef01cSRoman Divacky//
f22ef01cSRoman Divacky//===----------------------------------------------------------------------===//
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky#include "llvm/ADT/APInt.h"
3ca95b02SDimitry Andric#include "llvm/ADT/ArrayRef.h"
f22ef01cSRoman Divacky#include "llvm/ADT/FoldingSet.h"
dff0c46cSDimitry Andric#include "llvm/ADT/Hashing.h"
*b5893f02SDimitry Andric#include "llvm/ADT/Optional.h"
f22ef01cSRoman Divacky#include "llvm/ADT/SmallString.h"
dff0c46cSDimitry Andric#include "llvm/ADT/StringRef.h"
*b5893f02SDimitry Andric#include "llvm/ADT/bit.h"
4ba319b5SDimitry Andric#include "llvm/Config/llvm-config.h"
f22ef01cSRoman Divacky#include "llvm/Support/Debug.h"
f22ef01cSRoman Divacky#include "llvm/Support/ErrorHandling.h"
f22ef01cSRoman Divacky#include "llvm/Support/MathExtras.h"
f22ef01cSRoman Divacky#include "llvm/Support/raw_ostream.h"
d88c1a5aSDimitry Andric#include <climits>
f22ef01cSRoman Divacky#include <cmath>
f22ef01cSRoman Divacky#include <cstdlib>
139f7f9bSDimitry Andric#include <cstring>
f22ef01cSRoman Divackyusing namespace llvm;
f22ef01cSRoman Divacky
91bc56edSDimitry Andric#define DEBUG_TYPE "apint"
91bc56edSDimitry Andric
/// Allocate an array of \p numWords 64-bit words in which every word is zero.
/// The array comes from new[], so the caller releases it with delete[].
inline static uint64_t* getClearedMemory(unsigned numWords) {
  // The trailing "()" value-initializes the array, i.e. zeroes each word.
  return new uint64_t[numWords]();
}
f22ef01cSRoman Divacky
/// Allocate an array of \p numWords 64-bit words. The contents are left
/// uninitialized; the caller releases the array with delete[].
inline static uint64_t* getMemory(unsigned numWords) {
  uint64_t *words = new uint64_t[numWords];
  return words;
}
f22ef01cSRoman Divacky
/// Convert the character \p cdigit to its numeric value in base \p radix.
///
/// For radix 16 and 36 both upper- and lower-case letters are accepted
/// ('A'/'a' == 10, and so on up to radix - 1). For every other radix only
/// the characters '0' .. ('0' + radix - 1) are accepted.
///
/// \returns the digit value, or -1U if \p cdigit is not a digit in \p radix.
inline static unsigned getDigit(char cdigit, uint8_t radix) {
  // Unsigned wrap-around turns characters below '0' into huge values, so a
  // single upper-bound comparison is enough for each range check below.
  const unsigned decimal = cdigit - '0';

  if (radix != 16 && radix != 36)
    return decimal < radix ? decimal : -1U;

  if (decimal <= 9)
    return decimal;

  // Highest letter offset allowed: 5 ('F') for hex, 25 ('Z') for base 36.
  const unsigned maxLetter = radix - 11U;

  const unsigned upper = cdigit - 'A';
  if (upper <= maxLetter)
    return upper + 10;

  const unsigned lower = cdigit - 'a';
  if (lower <= maxLetter)
    return lower + 10;

  // Neither a decimal digit nor an accepted letter.
  return -1U;
}
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky
3ca95b02SDimitry Andricvoid APInt::initSlowCase(uint64_t val, bool isSigned) {
f37b6182SDimitry Andric  U.pVal = getClearedMemory(getNumWords());
f37b6182SDimitry Andric  U.pVal[0] = val;
f22ef01cSRoman Divacky  if (isSigned && int64_t(val) < 0)
f22ef01cSRoman Divacky    for (unsigned i = 1; i < getNumWords(); ++i)
*b5893f02SDimitry Andric      U.pVal[i] = WORDTYPE_MAX;
7a7e6055SDimitry Andric  clearUnusedBits();
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
f22ef01cSRoman Divackyvoid APInt::initSlowCase(const APInt& that) {
f37b6182SDimitry Andric  U.pVal = getMemory(getNumWords());
f37b6182SDimitry Andric  memcpy(U.pVal, that.U.pVal, getNumWords() * APINT_WORD_SIZE);
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
6122f3e6SDimitry Andricvoid APInt::initFromArray(ArrayRef<uint64_t> bigVal) {
f22ef01cSRoman Divacky  assert(BitWidth && "Bitwidth too small");
6122f3e6SDimitry Andric  assert(bigVal.data() && "Null pointer detected!");
f22ef01cSRoman Divacky  if (isSingleWord())
f37b6182SDimitry Andric    U.VAL = bigVal[0];
f22ef01cSRoman Divacky  else {
f22ef01cSRoman Divacky    // Get memory, cleared to 0
f37b6182SDimitry Andric    U.pVal = getClearedMemory(getNumWords());
f22ef01cSRoman Divacky    // Calculate the number of words to copy
6122f3e6SDimitry Andric    unsigned words = std::min<unsigned>(bigVal.size(), getNumWords());
f22ef01cSRoman Divacky    // Copy the words from bigVal to pVal
f37b6182SDimitry Andric    memcpy(U.pVal, bigVal.data(), words * APINT_WORD_SIZE);
f22ef01cSRoman Divacky  }
f22ef01cSRoman Divacky  // Make sure unused high bits are cleared
f22ef01cSRoman Divacky  clearUnusedBits();
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
6122f3e6SDimitry AndricAPInt::APInt(unsigned numBits, ArrayRef<uint64_t> bigVal)
7a7e6055SDimitry Andric  : BitWidth(numBits) {
6122f3e6SDimitry Andric  initFromArray(bigVal);
6122f3e6SDimitry Andric}
6122f3e6SDimitry Andric
6122f3e6SDimitry AndricAPInt::APInt(unsigned numBits, unsigned numWords, const uint64_t bigVal[])
7a7e6055SDimitry Andric  : BitWidth(numBits) {
6122f3e6SDimitry Andric  initFromArray(makeArrayRef(bigVal, numWords));
6122f3e6SDimitry Andric}
6122f3e6SDimitry Andric
ffd1746dSEd SchoutenAPInt::APInt(unsigned numbits, StringRef Str, uint8_t radix)
f37b6182SDimitry Andric  : BitWidth(numbits) {
f22ef01cSRoman Divacky  assert(BitWidth && "Bitwidth too small");
f22ef01cSRoman Divacky  fromString(numbits, Str, radix);
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
5517e702SDimitry Andricvoid APInt::reallocate(unsigned NewBitWidth) {
5517e702SDimitry Andric  // If the number of words is the same we can just change the width and stop.
5517e702SDimitry Andric  if (getNumWords() == getNumWords(NewBitWidth)) {
5517e702SDimitry Andric    BitWidth = NewBitWidth;
5517e702SDimitry Andric    return;
5517e702SDimitry Andric  }
5517e702SDimitry Andric
5517e702SDimitry Andric  // If we have an allocation, delete it.
5517e702SDimitry Andric  if (!isSingleWord())
5517e702SDimitry Andric    delete [] U.pVal;
5517e702SDimitry Andric
5517e702SDimitry Andric  // Update BitWidth.
5517e702SDimitry Andric  BitWidth = NewBitWidth;
5517e702SDimitry Andric
5517e702SDimitry Andric  // If we are supposed to have an allocation, create it.
5517e702SDimitry Andric  if (!isSingleWord())
5517e702SDimitry Andric    U.pVal = getMemory(getNumWords());
5517e702SDimitry Andric}
5517e702SDimitry Andric
6bc11b14SDimitry Andricvoid APInt::AssignSlowCase(const APInt& RHS) {
f22ef01cSRoman Divacky  // Don't do anything for X = X
f22ef01cSRoman Divacky  if (this == &RHS)
6bc11b14SDimitry Andric    return;
f22ef01cSRoman Divacky
5517e702SDimitry Andric  // Adjust the bit width and handle allocations as necessary.
5517e702SDimitry Andric  reallocate(RHS.getBitWidth());
f22ef01cSRoman Divacky
5517e702SDimitry Andric  // Copy the data.
5517e702SDimitry Andric  if (isSingleWord())
f37b6182SDimitry Andric    U.VAL = RHS.U.VAL;
5517e702SDimitry Andric  else
5517e702SDimitry Andric    memcpy(U.pVal, RHS.U.pVal, getNumWords() * APINT_WORD_SIZE);
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
ff0cc061SDimitry Andric/// This method 'profiles' an APInt for use with FoldingSet.
f22ef01cSRoman Divackyvoid APInt::Profile(FoldingSetNodeID& ID) const {
f22ef01cSRoman Divacky  ID.AddInteger(BitWidth);
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  if (isSingleWord()) {
f37b6182SDimitry Andric    ID.AddInteger(U.VAL);
f22ef01cSRoman Divacky    return;
f22ef01cSRoman Divacky  }
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  unsigned NumWords = getNumWords();
f22ef01cSRoman Divacky  for (unsigned i = 0; i < NumWords; ++i)
f37b6182SDimitry Andric    ID.AddInteger(U.pVal[i]);
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
4ba319b5SDimitry Andric/// Prefix increment operator. Increments the APInt by one.
f22ef01cSRoman DivackyAPInt& APInt::operator++() {
f22ef01cSRoman Divacky  if (isSingleWord())
f37b6182SDimitry Andric    ++U.VAL;
f22ef01cSRoman Divacky  else
f37b6182SDimitry Andric    tcIncrement(U.pVal, getNumWords());
f22ef01cSRoman Divacky  return clearUnusedBits();
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
4ba319b5SDimitry Andric/// Prefix decrement operator. Decrements the APInt by one.
f22ef01cSRoman DivackyAPInt& APInt::operator--() {
f22ef01cSRoman Divacky  if (isSingleWord())
f37b6182SDimitry Andric    --U.VAL;
f22ef01cSRoman Divacky  else
f37b6182SDimitry Andric    tcDecrement(U.pVal, getNumWords());
f22ef01cSRoman Divacky  return clearUnusedBits();
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky/// Adds the RHS APint to this APInt.
f22ef01cSRoman Divacky/// @returns this, after addition of RHS.
4ba319b5SDimitry Andric/// Addition assignment operator.
f22ef01cSRoman DivackyAPInt& APInt::operator+=(const APInt& RHS) {
f22ef01cSRoman Divacky  assert(BitWidth == RHS.BitWidth && "Bit widths must be the same");
f22ef01cSRoman Divacky  if (isSingleWord())
f37b6182SDimitry Andric    U.VAL += RHS.U.VAL;
7a7e6055SDimitry Andric  else
f37b6182SDimitry Andric    tcAdd(U.pVal, RHS.U.pVal, 0, getNumWords());
f22ef01cSRoman Divacky  return clearUnusedBits();
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
d88c1a5aSDimitry AndricAPInt& APInt::operator+=(uint64_t RHS) {
d88c1a5aSDimitry Andric  if (isSingleWord())
f37b6182SDimitry Andric    U.VAL += RHS;
d88c1a5aSDimitry Andric  else
f37b6182SDimitry Andric    tcAddPart(U.pVal, RHS, getNumWords());
d88c1a5aSDimitry Andric  return clearUnusedBits();
d88c1a5aSDimitry Andric}
d88c1a5aSDimitry Andric
f22ef01cSRoman Divacky/// Subtracts the RHS APInt from this APInt
f22ef01cSRoman Divacky/// @returns this, after subtraction
4ba319b5SDimitry Andric/// Subtraction assignment operator.
f22ef01cSRoman DivackyAPInt& APInt::operator-=(const APInt& RHS) {
f22ef01cSRoman Divacky  assert(BitWidth == RHS.BitWidth && "Bit widths must be the same");
f22ef01cSRoman Divacky  if (isSingleWord())
f37b6182SDimitry Andric    U.VAL -= RHS.U.VAL;
f22ef01cSRoman Divacky  else
f37b6182SDimitry Andric    tcSubtract(U.pVal, RHS.U.pVal, 0, getNumWords());
f22ef01cSRoman Divacky  return clearUnusedBits();
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
d88c1a5aSDimitry AndricAPInt& APInt::operator-=(uint64_t RHS) {
d88c1a5aSDimitry Andric  if (isSingleWord())
f37b6182SDimitry Andric    U.VAL -= RHS;
d88c1a5aSDimitry Andric  else
f37b6182SDimitry Andric    tcSubtractPart(U.pVal, RHS, getNumWords());
d88c1a5aSDimitry Andric  return clearUnusedBits();
d88c1a5aSDimitry Andric}
d88c1a5aSDimitry Andric
0f5676f4SDimitry AndricAPInt APInt::operator*(const APInt& RHS) const {
f22ef01cSRoman Divacky  assert(BitWidth == RHS.BitWidth && "Bit widths must be the same");
0f5676f4SDimitry Andric  if (isSingleWord())
0f5676f4SDimitry Andric    return APInt(BitWidth, U.VAL * RHS.U.VAL);
f22ef01cSRoman Divacky
0f5676f4SDimitry Andric  APInt Result(getMemory(getNumWords()), getBitWidth());
f22ef01cSRoman Divacky
0f5676f4SDimitry Andric  tcMultiply(Result.U.pVal, U.pVal, RHS.U.pVal, getNumWords());
f22ef01cSRoman Divacky
0f5676f4SDimitry Andric  Result.clearUnusedBits();
0f5676f4SDimitry Andric  return Result;
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
6bc11b14SDimitry Andricvoid APInt::AndAssignSlowCase(const APInt& RHS) {
f37b6182SDimitry Andric  tcAnd(U.pVal, RHS.U.pVal, getNumWords());
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
6bc11b14SDimitry Andricvoid APInt::OrAssignSlowCase(const APInt& RHS) {
f37b6182SDimitry Andric  tcOr(U.pVal, RHS.U.pVal, getNumWords());
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
6bc11b14SDimitry Andricvoid APInt::XorAssignSlowCase(const APInt& RHS) {
f37b6182SDimitry Andric  tcXor(U.pVal, RHS.U.pVal, getNumWords());
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
0f5676f4SDimitry AndricAPInt& APInt::operator*=(const APInt& RHS) {
f22ef01cSRoman Divacky  assert(BitWidth == RHS.BitWidth && "Bit widths must be the same");
0f5676f4SDimitry Andric  *this = *this * RHS;
0f5676f4SDimitry Andric  return *this;
0f5676f4SDimitry Andric}
0f5676f4SDimitry Andric
0f5676f4SDimitry AndricAPInt& APInt::operator*=(uint64_t RHS) {
0f5676f4SDimitry Andric  if (isSingleWord()) {
0f5676f4SDimitry Andric    U.VAL *= RHS;
0f5676f4SDimitry Andric  } else {
0f5676f4SDimitry Andric    unsigned NumWords = getNumWords();
0f5676f4SDimitry Andric    tcMultiplyPart(U.pVal, U.pVal, RHS, 0, NumWords, NumWords, false);
0f5676f4SDimitry Andric  }
0f5676f4SDimitry Andric  return clearUnusedBits();
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
f22ef01cSRoman Divackybool APInt::EqualSlowCase(const APInt& RHS) const {
f37b6182SDimitry Andric  return std::equal(U.pVal, U.pVal + getNumWords(), RHS.U.pVal);
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
51690af2SDimitry Andricint APInt::compare(const APInt& RHS) const {
f22ef01cSRoman Divacky  assert(BitWidth == RHS.BitWidth && "Bit widths must be same for comparison");
f22ef01cSRoman Divacky  if (isSingleWord())
f37b6182SDimitry Andric    return U.VAL < RHS.U.VAL ? -1 : U.VAL > RHS.U.VAL;
f22ef01cSRoman Divacky
f37b6182SDimitry Andric  return tcCompare(U.pVal, RHS.U.pVal, getNumWords());
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
51690af2SDimitry Andricint APInt::compareSigned(const APInt& RHS) const {
f22ef01cSRoman Divacky  assert(BitWidth == RHS.BitWidth && "Bit widths must be same for comparison");
f22ef01cSRoman Divacky  if (isSingleWord()) {
f37b6182SDimitry Andric    int64_t lhsSext = SignExtend64(U.VAL, BitWidth);
f37b6182SDimitry Andric    int64_t rhsSext = SignExtend64(RHS.U.VAL, BitWidth);
51690af2SDimitry Andric    return lhsSext < rhsSext ? -1 : lhsSext > rhsSext;
f22ef01cSRoman Divacky  }
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  bool lhsNeg = isNegative();
3ca95b02SDimitry Andric  bool rhsNeg = RHS.isNegative();
f22ef01cSRoman Divacky
3ca95b02SDimitry Andric  // If the sign bits don't match, then (LHS < RHS) if LHS is negative
3ca95b02SDimitry Andric  if (lhsNeg != rhsNeg)
51690af2SDimitry Andric    return lhsNeg ? -1 : 1;
3ca95b02SDimitry Andric
7a7e6055SDimitry Andric  // Otherwise we can just use an unsigned comparison, because even negative
3ca95b02SDimitry Andric  // numbers compare correctly this way if both have the same signed-ness.
f37b6182SDimitry Andric  return tcCompare(U.pVal, RHS.U.pVal, getNumWords());
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
7a7e6055SDimitry Andricvoid APInt::setBitsSlowCase(unsigned loBit, unsigned hiBit) {
7a7e6055SDimitry Andric  unsigned loWord = whichWord(loBit);
7a7e6055SDimitry Andric  unsigned hiWord = whichWord(hiBit);
7a7e6055SDimitry Andric
7a7e6055SDimitry Andric  // Create an initial mask for the low word with zeros below loBit.
*b5893f02SDimitry Andric  uint64_t loMask = WORDTYPE_MAX << whichBit(loBit);
7a7e6055SDimitry Andric
7a7e6055SDimitry Andric  // If hiBit is not aligned, we need a high mask.
7a7e6055SDimitry Andric  unsigned hiShiftAmt = whichBit(hiBit);
7a7e6055SDimitry Andric  if (hiShiftAmt != 0) {
7a7e6055SDimitry Andric    // Create a high mask with zeros above hiBit.
*b5893f02SDimitry Andric    uint64_t hiMask = WORDTYPE_MAX >> (APINT_BITS_PER_WORD - hiShiftAmt);
7a7e6055SDimitry Andric    // If loWord and hiWord are equal, then we combine the masks. Otherwise,
7a7e6055SDimitry Andric    // set the bits in hiWord.
7a7e6055SDimitry Andric    if (hiWord == loWord)
7a7e6055SDimitry Andric      loMask &= hiMask;
7a7e6055SDimitry Andric    else
f37b6182SDimitry Andric      U.pVal[hiWord] |= hiMask;
7a7e6055SDimitry Andric  }
7a7e6055SDimitry Andric  // Apply the mask to the low word.
f37b6182SDimitry Andric  U.pVal[loWord] |= loMask;
7a7e6055SDimitry Andric
7a7e6055SDimitry Andric  // Fill any words between loWord and hiWord with all ones.
7a7e6055SDimitry Andric  for (unsigned word = loWord + 1; word < hiWord; ++word)
*b5893f02SDimitry Andric    U.pVal[word] = WORDTYPE_MAX;
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
4ba319b5SDimitry Andric/// Toggle every bit to its opposite value.
7a7e6055SDimitry Andricvoid APInt::flipAllBitsSlowCase() {
f37b6182SDimitry Andric  tcComplement(U.pVal, getNumWords());
7a7e6055SDimitry Andric  clearUnusedBits();
7a7e6055SDimitry Andric}
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky/// Toggle a given bit to its opposite value whose position is given
f22ef01cSRoman Divacky/// as "bitPosition".
4ba319b5SDimitry Andric/// Toggles a given bit to its opposite value.
2754fe60SDimitry Andricvoid APInt::flipBit(unsigned bitPosition) {
f22ef01cSRoman Divacky  assert(bitPosition < BitWidth && "Out of the bit-width range!");
2754fe60SDimitry Andric  if ((*this)[bitPosition]) clearBit(bitPosition);
2754fe60SDimitry Andric  else setBit(bitPosition);
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
7a7e6055SDimitry Andricvoid APInt::insertBits(const APInt &subBits, unsigned bitPosition) {
7a7e6055SDimitry Andric  unsigned subBitWidth = subBits.getBitWidth();
7a7e6055SDimitry Andric  assert(0 < subBitWidth && (subBitWidth + bitPosition) <= BitWidth &&
7a7e6055SDimitry Andric         "Illegal bit insertion");
7a7e6055SDimitry Andric
7a7e6055SDimitry Andric  // Insertion is a direct copy.
7a7e6055SDimitry Andric  if (subBitWidth == BitWidth) {
7a7e6055SDimitry Andric    *this = subBits;
7a7e6055SDimitry Andric    return;
7a7e6055SDimitry Andric  }
7a7e6055SDimitry Andric
7a7e6055SDimitry Andric  // Single word result can be done as a direct bitmask.
7a7e6055SDimitry Andric  if (isSingleWord()) {
*b5893f02SDimitry Andric    uint64_t mask = WORDTYPE_MAX >> (APINT_BITS_PER_WORD - subBitWidth);
f37b6182SDimitry Andric    U.VAL &= ~(mask << bitPosition);
f37b6182SDimitry Andric    U.VAL |= (subBits.U.VAL << bitPosition);
7a7e6055SDimitry Andric    return;
7a7e6055SDimitry Andric  }
7a7e6055SDimitry Andric
7a7e6055SDimitry Andric  unsigned loBit = whichBit(bitPosition);
7a7e6055SDimitry Andric  unsigned loWord = whichWord(bitPosition);
7a7e6055SDimitry Andric  unsigned hi1Word = whichWord(bitPosition + subBitWidth - 1);
7a7e6055SDimitry Andric
7a7e6055SDimitry Andric  // Insertion within a single word can be done as a direct bitmask.
7a7e6055SDimitry Andric  if (loWord == hi1Word) {
*b5893f02SDimitry Andric    uint64_t mask = WORDTYPE_MAX >> (APINT_BITS_PER_WORD - subBitWidth);
f37b6182SDimitry Andric    U.pVal[loWord] &= ~(mask << loBit);
f37b6182SDimitry Andric    U.pVal[loWord] |= (subBits.U.VAL << loBit);
7a7e6055SDimitry Andric    return;
7a7e6055SDimitry Andric  }
7a7e6055SDimitry Andric
7a7e6055SDimitry Andric  // Insert on word boundaries.
7a7e6055SDimitry Andric  if (loBit == 0) {
7a7e6055SDimitry Andric    // Direct copy whole words.
7a7e6055SDimitry Andric    unsigned numWholeSubWords = subBitWidth / APINT_BITS_PER_WORD;
f37b6182SDimitry Andric    memcpy(U.pVal + loWord, subBits.getRawData(),
7a7e6055SDimitry Andric           numWholeSubWords * APINT_WORD_SIZE);
7a7e6055SDimitry Andric
7a7e6055SDimitry Andric    // Mask+insert remaining bits.
7a7e6055SDimitry Andric    unsigned remainingBits = subBitWidth % APINT_BITS_PER_WORD;
7a7e6055SDimitry Andric    if (remainingBits != 0) {
*b5893f02SDimitry Andric      uint64_t mask = WORDTYPE_MAX >> (APINT_BITS_PER_WORD - remainingBits);
f37b6182SDimitry Andric      U.pVal[hi1Word] &= ~mask;
f37b6182SDimitry Andric      U.pVal[hi1Word] |= subBits.getWord(subBitWidth - 1);
7a7e6055SDimitry Andric    }
7a7e6055SDimitry Andric    return;
7a7e6055SDimitry Andric  }
7a7e6055SDimitry Andric
7a7e6055SDimitry Andric  // General case - set/clear individual bits in dst based on src.
7a7e6055SDimitry Andric  // TODO - there is scope for optimization here, but at the moment this code
7a7e6055SDimitry Andric  // path is barely used so prefer readability over performance.
7a7e6055SDimitry Andric  for (unsigned i = 0; i != subBitWidth; ++i) {
7a7e6055SDimitry Andric    if (subBits[i])
7a7e6055SDimitry Andric      setBit(bitPosition + i);
7a7e6055SDimitry Andric    else
7a7e6055SDimitry Andric      clearBit(bitPosition + i);
7a7e6055SDimitry Andric  }
7a7e6055SDimitry Andric}
7a7e6055SDimitry Andric
7a7e6055SDimitry AndricAPInt APInt::extractBits(unsigned numBits, unsigned bitPosition) const {
7a7e6055SDimitry Andric  assert(numBits > 0 && "Can't extract zero bits");
7a7e6055SDimitry Andric  assert(bitPosition < BitWidth && (numBits + bitPosition) <= BitWidth &&
7a7e6055SDimitry Andric         "Illegal bit extraction");
7a7e6055SDimitry Andric
7a7e6055SDimitry Andric  if (isSingleWord())
f37b6182SDimitry Andric    return APInt(numBits, U.VAL >> bitPosition);
7a7e6055SDimitry Andric
7a7e6055SDimitry Andric  unsigned loBit = whichBit(bitPosition);
7a7e6055SDimitry Andric  unsigned loWord = whichWord(bitPosition);
7a7e6055SDimitry Andric  unsigned hiWord = whichWord(bitPosition + numBits - 1);
7a7e6055SDimitry Andric
7a7e6055SDimitry Andric  // Single word result extracting bits from a single word source.
7a7e6055SDimitry Andric  if (loWord == hiWord)
f37b6182SDimitry Andric    return APInt(numBits, U.pVal[loWord] >> loBit);
7a7e6055SDimitry Andric
7a7e6055SDimitry Andric  // Extracting bits that start on a source word boundary can be done
7a7e6055SDimitry Andric  // as a fast memory copy.
7a7e6055SDimitry Andric  if (loBit == 0)
f37b6182SDimitry Andric    return APInt(numBits, makeArrayRef(U.pVal + loWord, 1 + hiWord - loWord));
7a7e6055SDimitry Andric
7a7e6055SDimitry Andric  // General case - shift + copy source words directly into place.
7a7e6055SDimitry Andric  APInt Result(numBits, 0);
7a7e6055SDimitry Andric  unsigned NumSrcWords = getNumWords();
7a7e6055SDimitry Andric  unsigned NumDstWords = Result.getNumWords();
7a7e6055SDimitry Andric
4ba319b5SDimitry Andric  uint64_t *DestPtr = Result.isSingleWord() ? &Result.U.VAL : Result.U.pVal;
7a7e6055SDimitry Andric  for (unsigned word = 0; word < NumDstWords; ++word) {
f37b6182SDimitry Andric    uint64_t w0 = U.pVal[loWord + word];
7a7e6055SDimitry Andric    uint64_t w1 =
f37b6182SDimitry Andric        (loWord + word + 1) < NumSrcWords ? U.pVal[loWord + word + 1] : 0;
4ba319b5SDimitry Andric    DestPtr[word] = (w0 >> loBit) | (w1 << (APINT_BITS_PER_WORD - loBit));
7a7e6055SDimitry Andric  }
7a7e6055SDimitry Andric
7a7e6055SDimitry Andric  return Result.clearUnusedBits();
7a7e6055SDimitry Andric}
7a7e6055SDimitry Andric
ffd1746dSEd Schoutenunsigned APInt::getBitsNeeded(StringRef str, uint8_t radix) {
f22ef01cSRoman Divacky  assert(!str.empty() && "Invalid string length");
6122f3e6SDimitry Andric  assert((radix == 10 || radix == 8 || radix == 16 || radix == 2 ||
6122f3e6SDimitry Andric          radix == 36) &&
6122f3e6SDimitry Andric         "Radix should be 2, 8, 10, 16, or 36!");
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  size_t slen = str.size();
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  // Each computation below needs to know if it's negative.
f22ef01cSRoman Divacky  StringRef::iterator p = str.begin();
f22ef01cSRoman Divacky  unsigned isNegative = *p == '-';
f22ef01cSRoman Divacky  if (*p == '-' || *p == '+') {
f22ef01cSRoman Divacky    p++;
f22ef01cSRoman Divacky    slen--;
f22ef01cSRoman Divacky    assert(slen && "String is only a sign, needs a value.");
f22ef01cSRoman Divacky  }
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  // For radixes of power-of-two values, the bits required is accurately and
f22ef01cSRoman Divacky  // easily computed
f22ef01cSRoman Divacky  if (radix == 2)
f22ef01cSRoman Divacky    return slen + isNegative;
f22ef01cSRoman Divacky  if (radix == 8)
f22ef01cSRoman Divacky    return slen * 3 + isNegative;
f22ef01cSRoman Divacky  if (radix == 16)
f22ef01cSRoman Divacky    return slen * 4 + isNegative;
f22ef01cSRoman Divacky
6122f3e6SDimitry Andric  // FIXME: base 36
6122f3e6SDimitry Andric
f22ef01cSRoman Divacky  // This is grossly inefficient but accurate. We could probably do something
f22ef01cSRoman Divacky  // with a computation of roughly slen*64/20 and then adjust by the value of
f22ef01cSRoman Divacky  // the first few digits. But, I'm not sure how accurate that could be.
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  // Compute a sufficient number of bits that is always large enough but might
f22ef01cSRoman Divacky  // be too large. This avoids the assertion in the constructor. This
f22ef01cSRoman Divacky  // calculation doesn't work appropriately for the numbers 0-9, so just use 4
f22ef01cSRoman Divacky  // bits in that case.
6122f3e6SDimitry Andric  unsigned sufficient
6122f3e6SDimitry Andric    = radix == 10? (slen == 1 ? 4 : slen * 64/18)
6122f3e6SDimitry Andric                 : (slen == 1 ? 7 : slen * 16/3);
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  // Convert to the actual binary value.
f22ef01cSRoman Divacky  APInt tmp(sufficient, StringRef(p, slen), radix);
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  // Compute how many bits are required. If the log is infinite, assume we need
f22ef01cSRoman Divacky  // just bit.
f22ef01cSRoman Divacky  unsigned log = tmp.logBase2();
f22ef01cSRoman Divacky  if (log == (unsigned)-1) {
f22ef01cSRoman Divacky    return isNegative + 1;
f22ef01cSRoman Divacky  } else {
f22ef01cSRoman Divacky    return isNegative + log + 1;
f22ef01cSRoman Divacky  }
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
dff0c46cSDimitry Andrichash_code llvm::hash_value(const APInt &Arg) {
dff0c46cSDimitry Andric  if (Arg.isSingleWord())
f37b6182SDimitry Andric    return hash_combine(Arg.U.VAL);
f22ef01cSRoman Divacky
f37b6182SDimitry Andric  return hash_combine_range(Arg.U.pVal, Arg.U.pVal + Arg.getNumWords());
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
ff0cc061SDimitry Andricbool APInt::isSplat(unsigned SplatSizeInBits) const {
ff0cc061SDimitry Andric  assert(getBitWidth() % SplatSizeInBits == 0 &&
ff0cc061SDimitry Andric         "SplatSizeInBits must divide width!");
ff0cc061SDimitry Andric  // We can check that all parts of an integer are equal by making use of a
ff0cc061SDimitry Andric  // little trick: rotate and check if it's still the same value.
ff0cc061SDimitry Andric  return *this == rotl(SplatSizeInBits);
ff0cc061SDimitry Andric}
ff0cc061SDimitry Andric
ff0cc061SDimitry Andric/// This function returns the high "numBits" bits of this APInt.
f22ef01cSRoman DivackyAPInt APInt::getHiBits(unsigned numBits) const {
7a7e6055SDimitry Andric  return this->lshr(BitWidth - numBits);
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
ff0cc061SDimitry Andric/// This function returns the low "numBits" bits of this APInt.
f22ef01cSRoman DivackyAPInt APInt::getLoBits(unsigned numBits) const {
7a7e6055SDimitry Andric  APInt Result(getLowBitsSet(BitWidth, numBits));
7a7e6055SDimitry Andric  Result &= *this;
7a7e6055SDimitry Andric  return Result;
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
f37b6182SDimitry Andric/// Return a value containing V broadcasted over NewLen bits.
f37b6182SDimitry AndricAPInt APInt::getSplat(unsigned NewLen, const APInt &V) {
f37b6182SDimitry Andric  assert(NewLen >= V.getBitWidth() && "Can't splat to smaller bit width!");
f37b6182SDimitry Andric
f37b6182SDimitry Andric  APInt Val = V.zextOrSelf(NewLen);
f37b6182SDimitry Andric  for (unsigned I = V.getBitWidth(); I < NewLen; I <<= 1)
f37b6182SDimitry Andric    Val |= Val << I;
f37b6182SDimitry Andric
f37b6182SDimitry Andric  return Val;
f37b6182SDimitry Andric}
f37b6182SDimitry Andric
f22ef01cSRoman Divackyunsigned APInt::countLeadingZerosSlowCase() const {
3ca95b02SDimitry Andric  unsigned Count = 0;
3ca95b02SDimitry Andric  for (int i = getNumWords()-1; i >= 0; --i) {
f37b6182SDimitry Andric    uint64_t V = U.pVal[i];
3ca95b02SDimitry Andric    if (V == 0)
f22ef01cSRoman Divacky      Count += APINT_BITS_PER_WORD;
f22ef01cSRoman Divacky    else {
3ca95b02SDimitry Andric      Count += llvm::countLeadingZeros(V);
f22ef01cSRoman Divacky      break;
f22ef01cSRoman Divacky    }
f22ef01cSRoman Divacky  }
3ca95b02SDimitry Andric  // Adjust for unused bits in the most significant word (they are zero).
3ca95b02SDimitry Andric  unsigned Mod = BitWidth % APINT_BITS_PER_WORD;
3ca95b02SDimitry Andric  Count -= Mod > 0 ? APINT_BITS_PER_WORD - Mod : 0;
f22ef01cSRoman Divacky  return Count;
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
edd7eaddSDimitry Andricunsigned APInt::countLeadingOnesSlowCase() const {
f22ef01cSRoman Divacky  unsigned highWordBits = BitWidth % APINT_BITS_PER_WORD;
f22ef01cSRoman Divacky  unsigned shift;
f22ef01cSRoman Divacky  if (!highWordBits) {
f22ef01cSRoman Divacky    highWordBits = APINT_BITS_PER_WORD;
f22ef01cSRoman Divacky    shift = 0;
f22ef01cSRoman Divacky  } else {
f22ef01cSRoman Divacky    shift = APINT_BITS_PER_WORD - highWordBits;
f22ef01cSRoman Divacky  }
f22ef01cSRoman Divacky  int i = getNumWords() - 1;
f37b6182SDimitry Andric  unsigned Count = llvm::countLeadingOnes(U.pVal[i] << shift);
f22ef01cSRoman Divacky  if (Count == highWordBits) {
f22ef01cSRoman Divacky    for (i--; i >= 0; --i) {
*b5893f02SDimitry Andric      if (U.pVal[i] == WORDTYPE_MAX)
f22ef01cSRoman Divacky        Count += APINT_BITS_PER_WORD;
f22ef01cSRoman Divacky      else {
f37b6182SDimitry Andric        Count += llvm::countLeadingOnes(U.pVal[i]);
f22ef01cSRoman Divacky        break;
f22ef01cSRoman Divacky      }
f22ef01cSRoman Divacky    }
f22ef01cSRoman Divacky  }
f22ef01cSRoman Divacky  return Count;
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
edd7eaddSDimitry Andricunsigned APInt::countTrailingZerosSlowCase() const {
f22ef01cSRoman Divacky  unsigned Count = 0;
f22ef01cSRoman Divacky  unsigned i = 0;
f37b6182SDimitry Andric  for (; i < getNumWords() && U.pVal[i] == 0; ++i)
f22ef01cSRoman Divacky    Count += APINT_BITS_PER_WORD;
f22ef01cSRoman Divacky  if (i < getNumWords())
f37b6182SDimitry Andric    Count += llvm::countTrailingZeros(U.pVal[i]);
f22ef01cSRoman Divacky  return std::min(Count, BitWidth);
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
f22ef01cSRoman Divackyunsigned APInt::countTrailingOnesSlowCase() const {
f22ef01cSRoman Divacky  unsigned Count = 0;
f22ef01cSRoman Divacky  unsigned i = 0;
*b5893f02SDimitry Andric  for (; i < getNumWords() && U.pVal[i] == WORDTYPE_MAX; ++i)
f22ef01cSRoman Divacky    Count += APINT_BITS_PER_WORD;
f22ef01cSRoman Divacky  if (i < getNumWords())
f37b6182SDimitry Andric    Count += llvm::countTrailingOnes(U.pVal[i]);
51690af2SDimitry Andric  assert(Count <= BitWidth);
51690af2SDimitry Andric  return Count;
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
f22ef01cSRoman Divackyunsigned APInt::countPopulationSlowCase() const {
f22ef01cSRoman Divacky  unsigned Count = 0;
f22ef01cSRoman Divacky  for (unsigned i = 0; i < getNumWords(); ++i)
f37b6182SDimitry Andric    Count += llvm::countPopulation(U.pVal[i]);
f22ef01cSRoman Divacky  return Count;
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
6bc11b14SDimitry Andricbool APInt::intersectsSlowCase(const APInt &RHS) const {
6bc11b14SDimitry Andric  for (unsigned i = 0, e = getNumWords(); i != e; ++i)
f37b6182SDimitry Andric    if ((U.pVal[i] & RHS.U.pVal[i]) != 0)
6bc11b14SDimitry Andric      return true;
6bc11b14SDimitry Andric
6bc11b14SDimitry Andric  return false;
6bc11b14SDimitry Andric}
6bc11b14SDimitry Andric
6bc11b14SDimitry Andricbool APInt::isSubsetOfSlowCase(const APInt &RHS) const {
6bc11b14SDimitry Andric  for (unsigned i = 0, e = getNumWords(); i != e; ++i)
f37b6182SDimitry Andric    if ((U.pVal[i] & ~RHS.U.pVal[i]) != 0)
6bc11b14SDimitry Andric      return false;
6bc11b14SDimitry Andric
6bc11b14SDimitry Andric  return true;
6bc11b14SDimitry Andric}
6bc11b14SDimitry Andric
f22ef01cSRoman DivackyAPInt APInt::byteSwap() const {
f22ef01cSRoman Divacky  assert(BitWidth >= 16 && BitWidth % 16 == 0 && "Cannot byteswap!");
f22ef01cSRoman Divacky  if (BitWidth == 16)
f37b6182SDimitry Andric    return APInt(BitWidth, ByteSwap_16(uint16_t(U.VAL)));
dff0c46cSDimitry Andric  if (BitWidth == 32)
f37b6182SDimitry Andric    return APInt(BitWidth, ByteSwap_32(unsigned(U.VAL)));
dff0c46cSDimitry Andric  if (BitWidth == 48) {
f37b6182SDimitry Andric    unsigned Tmp1 = unsigned(U.VAL >> 16);
f22ef01cSRoman Divacky    Tmp1 = ByteSwap_32(Tmp1);
f37b6182SDimitry Andric    uint16_t Tmp2 = uint16_t(U.VAL);
f22ef01cSRoman Divacky    Tmp2 = ByteSwap_16(Tmp2);
f22ef01cSRoman Divacky    return APInt(BitWidth, (uint64_t(Tmp2) << 32) | Tmp1);
dff0c46cSDimitry Andric  }
dff0c46cSDimitry Andric  if (BitWidth == 64)
f37b6182SDimitry Andric    return APInt(BitWidth, ByteSwap_64(U.VAL));
dff0c46cSDimitry Andric
dff0c46cSDimitry Andric  APInt Result(getNumWords() * APINT_BITS_PER_WORD, 0);
dff0c46cSDimitry Andric  for (unsigned I = 0, N = getNumWords(); I != N; ++I)
f37b6182SDimitry Andric    Result.U.pVal[I] = ByteSwap_64(U.pVal[N - I - 1]);
dff0c46cSDimitry Andric  if (Result.BitWidth != BitWidth) {
7a7e6055SDimitry Andric    Result.lshrInPlace(Result.BitWidth - BitWidth);
dff0c46cSDimitry Andric    Result.BitWidth = BitWidth;
f22ef01cSRoman Divacky  }
f22ef01cSRoman Divacky  return Result;
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
3ca95b02SDimitry AndricAPInt APInt::reverseBits() const {
3ca95b02SDimitry Andric  switch (BitWidth) {
3ca95b02SDimitry Andric  case 64:
f37b6182SDimitry Andric    return APInt(BitWidth, llvm::reverseBits<uint64_t>(U.VAL));
3ca95b02SDimitry Andric  case 32:
f37b6182SDimitry Andric    return APInt(BitWidth, llvm::reverseBits<uint32_t>(U.VAL));
3ca95b02SDimitry Andric  case 16:
f37b6182SDimitry Andric    return APInt(BitWidth, llvm::reverseBits<uint16_t>(U.VAL));
3ca95b02SDimitry Andric  case 8:
f37b6182SDimitry Andric    return APInt(BitWidth, llvm::reverseBits<uint8_t>(U.VAL));
3ca95b02SDimitry Andric  default:
3ca95b02SDimitry Andric    break;
3ca95b02SDimitry Andric  }
3ca95b02SDimitry Andric
3ca95b02SDimitry Andric  APInt Val(*this);
6bc11b14SDimitry Andric  APInt Reversed(BitWidth, 0);
6bc11b14SDimitry Andric  unsigned S = BitWidth;
3ca95b02SDimitry Andric
6bc11b14SDimitry Andric  for (; Val != 0; Val.lshrInPlace(1)) {
3ca95b02SDimitry Andric    Reversed <<= 1;
6bc11b14SDimitry Andric    Reversed |= Val[0];
3ca95b02SDimitry Andric    --S;
3ca95b02SDimitry Andric  }
3ca95b02SDimitry Andric
3ca95b02SDimitry Andric  Reversed <<= S;
3ca95b02SDimitry Andric  return Reversed;
3ca95b02SDimitry Andric}
3ca95b02SDimitry Andric
7a7e6055SDimitry AndricAPInt llvm::APIntOps::GreatestCommonDivisor(APInt A, APInt B) {
7a7e6055SDimitry Andric  // Fast-path a common case.
7a7e6055SDimitry Andric  if (A == B) return A;
7a7e6055SDimitry Andric
7a7e6055SDimitry Andric  // Corner cases: if either operand is zero, the other is the gcd.
7a7e6055SDimitry Andric  if (!A) return B;
7a7e6055SDimitry Andric  if (!B) return A;
7a7e6055SDimitry Andric
7a7e6055SDimitry Andric  // Count common powers of 2 and remove all other powers of 2.
7a7e6055SDimitry Andric  unsigned Pow2;
7a7e6055SDimitry Andric  {
7a7e6055SDimitry Andric    unsigned Pow2_A = A.countTrailingZeros();
7a7e6055SDimitry Andric    unsigned Pow2_B = B.countTrailingZeros();
7a7e6055SDimitry Andric    if (Pow2_A > Pow2_B) {
7a7e6055SDimitry Andric      A.lshrInPlace(Pow2_A - Pow2_B);
7a7e6055SDimitry Andric      Pow2 = Pow2_B;
7a7e6055SDimitry Andric    } else if (Pow2_B > Pow2_A) {
7a7e6055SDimitry Andric      B.lshrInPlace(Pow2_B - Pow2_A);
7a7e6055SDimitry Andric      Pow2 = Pow2_A;
7a7e6055SDimitry Andric    } else {
7a7e6055SDimitry Andric      Pow2 = Pow2_A;
f22ef01cSRoman Divacky    }
7a7e6055SDimitry Andric  }
7a7e6055SDimitry Andric
7a7e6055SDimitry Andric  // Both operands are odd multiples of 2^Pow_2:
7a7e6055SDimitry Andric  //
7a7e6055SDimitry Andric  //   gcd(a, b) = gcd(|a - b| / 2^i, min(a, b))
7a7e6055SDimitry Andric  //
7a7e6055SDimitry Andric  // This is a modified version of Stein's algorithm, taking advantage of
7a7e6055SDimitry Andric  // efficient countTrailingZeros().
7a7e6055SDimitry Andric  while (A != B) {
7a7e6055SDimitry Andric    if (A.ugt(B)) {
7a7e6055SDimitry Andric      A -= B;
7a7e6055SDimitry Andric      A.lshrInPlace(A.countTrailingZeros() - Pow2);
7a7e6055SDimitry Andric    } else {
7a7e6055SDimitry Andric      B -= A;
7a7e6055SDimitry Andric      B.lshrInPlace(B.countTrailingZeros() - Pow2);
7a7e6055SDimitry Andric    }
7a7e6055SDimitry Andric  }
7a7e6055SDimitry Andric
f22ef01cSRoman Divacky  return A;
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
f22ef01cSRoman DivackyAPInt llvm::APIntOps::RoundDoubleToAPInt(double Double, unsigned width) {
*b5893f02SDimitry Andric  uint64_t I = bit_cast<uint64_t>(Double);
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  // Get the sign bit from the highest order bit
*b5893f02SDimitry Andric  bool isNeg = I >> 63;
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  // Get the 11-bit exponent and adjust for the 1023 bit bias
*b5893f02SDimitry Andric  int64_t exp = ((I >> 52) & 0x7ff) - 1023;
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  // If the exponent is negative, the value is < 0 so just return 0.
f22ef01cSRoman Divacky  if (exp < 0)
f22ef01cSRoman Divacky    return APInt(width, 0u);
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  // Extract the mantissa by clearing the top 12 bits (sign + exponent).
*b5893f02SDimitry Andric  uint64_t mantissa = (I & (~0ULL >> 12)) | 1ULL << 52;
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  // If the exponent doesn't shift all bits out of the mantissa
f22ef01cSRoman Divacky  if (exp < 52)
f22ef01cSRoman Divacky    return isNeg ? -APInt(width, mantissa >> (52 - exp)) :
f22ef01cSRoman Divacky                    APInt(width, mantissa >> (52 - exp));
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  // If the client didn't provide enough bits for us to shift the mantissa into
f22ef01cSRoman Divacky  // then the result is undefined, just return 0
f22ef01cSRoman Divacky  if (width <= exp - 52)
f22ef01cSRoman Divacky    return APInt(width, 0);
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  // Otherwise, we have to shift the mantissa bits up to the right location
f22ef01cSRoman Divacky  APInt Tmp(width, mantissa);
f37b6182SDimitry Andric  Tmp <<= (unsigned)exp - 52;
f22ef01cSRoman Divacky  return isNeg ? -Tmp : Tmp;
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
ff0cc061SDimitry Andric/// This function converts this APInt to a double.
f22ef01cSRoman Divacky/// The layout for double is as following (IEEE Standard 754):
f22ef01cSRoman Divacky///  --------------------------------------
f22ef01cSRoman Divacky/// |  Sign    Exponent    Fraction    Bias |
f22ef01cSRoman Divacky/// |-------------------------------------- |
f22ef01cSRoman Divacky/// |  1[63]   11[62-52]   52[51-00]   1023 |
f22ef01cSRoman Divacky///  --------------------------------------
f22ef01cSRoman Divackydouble APInt::roundToDouble(bool isSigned) const {
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  // Handle the simple case where the value is contained in one uint64_t.
f22ef01cSRoman Divacky  // It is wrong to optimize getWord(0) to VAL; there might be more than one word.
f22ef01cSRoman Divacky  if (isSingleWord() || getActiveBits() <= APINT_BITS_PER_WORD) {
f22ef01cSRoman Divacky    if (isSigned) {
3ca95b02SDimitry Andric      int64_t sext = SignExtend64(getWord(0), BitWidth);
f22ef01cSRoman Divacky      return double(sext);
f22ef01cSRoman Divacky    } else
f22ef01cSRoman Divacky      return double(getWord(0));
f22ef01cSRoman Divacky  }
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  // Determine if the value is negative.
f22ef01cSRoman Divacky  bool isNeg = isSigned ? (*this)[BitWidth-1] : false;
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  // Construct the absolute value if we're negative.
f22ef01cSRoman Divacky  APInt Tmp(isNeg ? -(*this) : (*this));
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  // Figure out how many bits we're using.
f22ef01cSRoman Divacky  unsigned n = Tmp.getActiveBits();
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  // The exponent (without bias normalization) is just the number of bits
f22ef01cSRoman Divacky  // we are using. Note that the sign bit is gone since we constructed the
f22ef01cSRoman Divacky  // absolute value.
f22ef01cSRoman Divacky  uint64_t exp = n;
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  // Return infinity for exponent overflow
f22ef01cSRoman Divacky  if (exp > 1023) {
f22ef01cSRoman Divacky    if (!isSigned || !isNeg)
f22ef01cSRoman Divacky      return std::numeric_limits<double>::infinity();
f22ef01cSRoman Divacky    else
f22ef01cSRoman Divacky      return -std::numeric_limits<double>::infinity();
f22ef01cSRoman Divacky  }
f22ef01cSRoman Divacky  exp += 1023; // Increment for 1023 bias
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  // Number of bits in mantissa is 52. To obtain the mantissa value, we must
f22ef01cSRoman Divacky  // extract the high 52 bits from the correct words in pVal.
f22ef01cSRoman Divacky  uint64_t mantissa;
f22ef01cSRoman Divacky  unsigned hiWord = whichWord(n-1);
f22ef01cSRoman Divacky  if (hiWord == 0) {
f37b6182SDimitry Andric    mantissa = Tmp.U.pVal[0];
f22ef01cSRoman Divacky    if (n > 52)
f22ef01cSRoman Divacky      mantissa >>= n - 52; // shift down, we want the top 52 bits.
f22ef01cSRoman Divacky  } else {
f22ef01cSRoman Divacky    assert(hiWord > 0 && "huh?");
f37b6182SDimitry Andric    uint64_t hibits = Tmp.U.pVal[hiWord] << (52 - n % APINT_BITS_PER_WORD);
f37b6182SDimitry Andric    uint64_t lobits = Tmp.U.pVal[hiWord-1] >> (11 + n % APINT_BITS_PER_WORD);
f22ef01cSRoman Divacky    mantissa = hibits | lobits;
f22ef01cSRoman Divacky  }
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  // The leading bit of mantissa is implicit, so get rid of it.
f22ef01cSRoman Divacky  uint64_t sign = isNeg ? (1ULL << (APINT_BITS_PER_WORD - 1)) : 0;
*b5893f02SDimitry Andric  uint64_t I = sign | (exp << 52) | mantissa;
*b5893f02SDimitry Andric  return bit_cast<double>(I);
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky// Truncate to new width.
2754fe60SDimitry AndricAPInt APInt::trunc(unsigned width) const {
f22ef01cSRoman Divacky  assert(width < BitWidth && "Invalid APInt Truncate request");
f22ef01cSRoman Divacky  assert(width && "Can't truncate to 0 bits");
2754fe60SDimitry Andric
2754fe60SDimitry Andric  if (width <= APINT_BITS_PER_WORD)
2754fe60SDimitry Andric    return APInt(width, getRawData()[0]);
2754fe60SDimitry Andric
2754fe60SDimitry Andric  APInt Result(getMemory(getNumWords(width)), width);
2754fe60SDimitry Andric
2754fe60SDimitry Andric  // Copy full words.
2754fe60SDimitry Andric  unsigned i;
2754fe60SDimitry Andric  for (i = 0; i != width / APINT_BITS_PER_WORD; i++)
f37b6182SDimitry Andric    Result.U.pVal[i] = U.pVal[i];
2754fe60SDimitry Andric
2754fe60SDimitry Andric  // Truncate and copy any partial word.
2754fe60SDimitry Andric  unsigned bits = (0 - width) % APINT_BITS_PER_WORD;
2754fe60SDimitry Andric  if (bits != 0)
f37b6182SDimitry Andric    Result.U.pVal[i] = U.pVal[i] << bits >> bits;
2754fe60SDimitry Andric
2754fe60SDimitry Andric  return Result;
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky// Sign extend to a new width.
51690af2SDimitry AndricAPInt APInt::sext(unsigned Width) const {
51690af2SDimitry Andric  assert(Width > BitWidth && "Invalid APInt SignExtend request");
2754fe60SDimitry Andric
51690af2SDimitry Andric  if (Width <= APINT_BITS_PER_WORD)
f37b6182SDimitry Andric    return APInt(Width, SignExtend64(U.VAL, BitWidth));
f22ef01cSRoman Divacky
51690af2SDimitry Andric  APInt Result(getMemory(getNumWords(Width)), Width);
f22ef01cSRoman Divacky
51690af2SDimitry Andric  // Copy words.
f37b6182SDimitry Andric  std::memcpy(Result.U.pVal, getRawData(), getNumWords() * APINT_WORD_SIZE);
2754fe60SDimitry Andric
51690af2SDimitry Andric  // Sign extend the last word since there may be unused bits in the input.
f37b6182SDimitry Andric  Result.U.pVal[getNumWords() - 1] =
f37b6182SDimitry Andric      SignExtend64(Result.U.pVal[getNumWords() - 1],
51690af2SDimitry Andric                   ((BitWidth - 1) % APINT_BITS_PER_WORD) + 1);
2754fe60SDimitry Andric
51690af2SDimitry Andric  // Fill with sign bits.
f37b6182SDimitry Andric  std::memset(Result.U.pVal + getNumWords(), isNegative() ? -1 : 0,
51690af2SDimitry Andric              (Result.getNumWords() - getNumWords()) * APINT_WORD_SIZE);
51690af2SDimitry Andric  Result.clearUnusedBits();
2754fe60SDimitry Andric  return Result;
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky//  Zero extend to a new width.
2754fe60SDimitry AndricAPInt APInt::zext(unsigned width) const {
f22ef01cSRoman Divacky  assert(width > BitWidth && "Invalid APInt ZeroExtend request");
2754fe60SDimitry Andric
2754fe60SDimitry Andric  if (width <= APINT_BITS_PER_WORD)
f37b6182SDimitry Andric    return APInt(width, U.VAL);
2754fe60SDimitry Andric
2754fe60SDimitry Andric  APInt Result(getMemory(getNumWords(width)), width);
2754fe60SDimitry Andric
2754fe60SDimitry Andric  // Copy words.
f37b6182SDimitry Andric  std::memcpy(Result.U.pVal, getRawData(), getNumWords() * APINT_WORD_SIZE);
2754fe60SDimitry Andric
2754fe60SDimitry Andric  // Zero remaining words.
f37b6182SDimitry Andric  std::memset(Result.U.pVal + getNumWords(), 0,
51690af2SDimitry Andric              (Result.getNumWords() - getNumWords()) * APINT_WORD_SIZE);
2754fe60SDimitry Andric
2754fe60SDimitry Andric  return Result;
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
2754fe60SDimitry AndricAPInt APInt::zextOrTrunc(unsigned width) const {
f22ef01cSRoman Divacky  if (BitWidth < width)
f22ef01cSRoman Divacky    return zext(width);
f22ef01cSRoman Divacky  if (BitWidth > width)
f22ef01cSRoman Divacky    return trunc(width);
f22ef01cSRoman Divacky  return *this;
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
2754fe60SDimitry AndricAPInt APInt::sextOrTrunc(unsigned width) const {
f22ef01cSRoman Divacky  if (BitWidth < width)
f22ef01cSRoman Divacky    return sext(width);
f22ef01cSRoman Divacky  if (BitWidth > width)
f22ef01cSRoman Divacky    return trunc(width);
f22ef01cSRoman Divacky  return *this;
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
dff0c46cSDimitry AndricAPInt APInt::zextOrSelf(unsigned width) const {
dff0c46cSDimitry Andric  if (BitWidth < width)
dff0c46cSDimitry Andric    return zext(width);
dff0c46cSDimitry Andric  return *this;
dff0c46cSDimitry Andric}
dff0c46cSDimitry Andric
dff0c46cSDimitry AndricAPInt APInt::sextOrSelf(unsigned width) const {
dff0c46cSDimitry Andric  if (BitWidth < width)
dff0c46cSDimitry Andric    return sext(width);
dff0c46cSDimitry Andric  return *this;
dff0c46cSDimitry Andric}
dff0c46cSDimitry Andric
f22ef01cSRoman Divacky/// Arithmetic right-shift this APInt by shiftAmt.
4ba319b5SDimitry Andric/// Arithmetic right-shift function.
51690af2SDimitry Andricvoid APInt::ashrInPlace(const APInt &shiftAmt) {
51690af2SDimitry Andric  ashrInPlace((unsigned)shiftAmt.getLimitedValue(BitWidth));
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky/// Arithmetic right-shift this APInt by shiftAmt.
4ba319b5SDimitry Andric/// Arithmetic right-shift function.
51690af2SDimitry Andricvoid APInt::ashrSlowCase(unsigned ShiftAmt) {
51690af2SDimitry Andric  // Don't bother performing a no-op shift.
51690af2SDimitry Andric  if (!ShiftAmt)
51690af2SDimitry Andric    return;
f22ef01cSRoman Divacky
51690af2SDimitry Andric  // Save the original sign bit for later.
51690af2SDimitry Andric  bool Negative = isNegative();
f22ef01cSRoman Divacky
4ba319b5SDimitry Andric  // WordShift is the inter-part shift; BitShift is intra-part shift.
51690af2SDimitry Andric  unsigned WordShift = ShiftAmt / APINT_BITS_PER_WORD;
51690af2SDimitry Andric  unsigned BitShift = ShiftAmt % APINT_BITS_PER_WORD;
f22ef01cSRoman Divacky
51690af2SDimitry Andric  unsigned WordsToMove = getNumWords() - WordShift;
51690af2SDimitry Andric  if (WordsToMove != 0) {
51690af2SDimitry Andric    // Sign extend the last word to fill in the unused bits.
f37b6182SDimitry Andric    U.pVal[getNumWords() - 1] = SignExtend64(
f37b6182SDimitry Andric        U.pVal[getNumWords() - 1], ((BitWidth - 1) % APINT_BITS_PER_WORD) + 1);
f22ef01cSRoman Divacky
51690af2SDimitry Andric    // Fastpath for moving by whole words.
51690af2SDimitry Andric    if (BitShift == 0) {
f37b6182SDimitry Andric      std::memmove(U.pVal, U.pVal + WordShift, WordsToMove * APINT_WORD_SIZE);
f22ef01cSRoman Divacky    } else {
51690af2SDimitry Andric      // Move the words containing significant bits.
51690af2SDimitry Andric      for (unsigned i = 0; i != WordsToMove - 1; ++i)
f37b6182SDimitry Andric        U.pVal[i] = (U.pVal[i + WordShift] >> BitShift) |
f37b6182SDimitry Andric                    (U.pVal[i + WordShift + 1] << (APINT_BITS_PER_WORD - BitShift));
f22ef01cSRoman Divacky
51690af2SDimitry Andric      // Handle the last word which has no high bits to copy.
f37b6182SDimitry Andric      U.pVal[WordsToMove - 1] = U.pVal[WordShift + WordsToMove - 1] >> BitShift;
51690af2SDimitry Andric      // Sign extend one more time.
f37b6182SDimitry Andric      U.pVal[WordsToMove - 1] =
f37b6182SDimitry Andric          SignExtend64(U.pVal[WordsToMove - 1], APINT_BITS_PER_WORD - BitShift);
f22ef01cSRoman Divacky    }
f22ef01cSRoman Divacky  }
f22ef01cSRoman Divacky
51690af2SDimitry Andric  // Fill in the remainder based on the original sign.
f37b6182SDimitry Andric  std::memset(U.pVal + WordsToMove, Negative ? -1 : 0,
51690af2SDimitry Andric              WordShift * APINT_WORD_SIZE);
51690af2SDimitry Andric  clearUnusedBits();
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky/// Logical right-shift this APInt by shiftAmt.
4ba319b5SDimitry Andric/// Logical right-shift function.
6bc11b14SDimitry Andricvoid APInt::lshrInPlace(const APInt &shiftAmt) {
6bc11b14SDimitry Andric  lshrInPlace((unsigned)shiftAmt.getLimitedValue(BitWidth));
7a7e6055SDimitry Andric}
7a7e6055SDimitry Andric
f22ef01cSRoman Divacky/// Logical right-shift this APInt by shiftAmt.
4ba319b5SDimitry Andric/// Logical right-shift function.
6bc11b14SDimitry Andricvoid APInt::lshrSlowCase(unsigned ShiftAmt) {
f37b6182SDimitry Andric  tcShiftRight(U.pVal, getNumWords(), ShiftAmt);
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky/// Left-shift this APInt by shiftAmt.
4ba319b5SDimitry Andric/// Left-shift function.
f37b6182SDimitry AndricAPInt &APInt::operator<<=(const APInt &shiftAmt) {
f22ef01cSRoman Divacky  // It's undefined behavior in C to shift by BitWidth or greater.
f37b6182SDimitry Andric  *this <<= (unsigned)shiftAmt.getLimitedValue(BitWidth);
f37b6182SDimitry Andric  return *this;
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
6bc11b14SDimitry Andricvoid APInt::shlSlowCase(unsigned ShiftAmt) {
f37b6182SDimitry Andric  tcShiftLeft(U.pVal, getNumWords(), ShiftAmt);
6bc11b14SDimitry Andric  clearUnusedBits();
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
7a7e6055SDimitry Andric// Calculate the rotate amount modulo the bit width.
7a7e6055SDimitry Andricstatic unsigned rotateModulo(unsigned BitWidth, const APInt &rotateAmt) {
7a7e6055SDimitry Andric  unsigned rotBitWidth = rotateAmt.getBitWidth();
7a7e6055SDimitry Andric  APInt rot = rotateAmt;
7a7e6055SDimitry Andric  if (rotBitWidth < BitWidth) {
7a7e6055SDimitry Andric    // Extend the rotate APInt, so that the urem doesn't divide by 0.
7a7e6055SDimitry Andric    // e.g. APInt(1, 32) would give APInt(1, 0).
7a7e6055SDimitry Andric    rot = rotateAmt.zext(BitWidth);
7a7e6055SDimitry Andric  }
7a7e6055SDimitry Andric  rot = rot.urem(APInt(rot.getBitWidth(), BitWidth));
7a7e6055SDimitry Andric  return rot.getLimitedValue(BitWidth);
7a7e6055SDimitry Andric}
7a7e6055SDimitry Andric
f22ef01cSRoman DivackyAPInt APInt::rotl(const APInt &rotateAmt) const {
7a7e6055SDimitry Andric  return rotl(rotateModulo(BitWidth, rotateAmt));
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
f22ef01cSRoman DivackyAPInt APInt::rotl(unsigned rotateAmt) const {
dff0c46cSDimitry Andric  rotateAmt %= BitWidth;
f22ef01cSRoman Divacky  if (rotateAmt == 0)
f22ef01cSRoman Divacky    return *this;
dff0c46cSDimitry Andric  return shl(rotateAmt) | lshr(BitWidth - rotateAmt);
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
f22ef01cSRoman DivackyAPInt APInt::rotr(const APInt &rotateAmt) const {
7a7e6055SDimitry Andric  return rotr(rotateModulo(BitWidth, rotateAmt));
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
f22ef01cSRoman DivackyAPInt APInt::rotr(unsigned rotateAmt) const {
dff0c46cSDimitry Andric  rotateAmt %= BitWidth;
f22ef01cSRoman Divacky  if (rotateAmt == 0)
f22ef01cSRoman Divacky    return *this;
dff0c46cSDimitry Andric  return lshr(rotateAmt) | shl(BitWidth - rotateAmt);
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky// Square Root - this method computes and returns the square root of "this".
f22ef01cSRoman Divacky// Three mechanisms are used for computation. For small values (<= 5 bits),
f22ef01cSRoman Divacky// a table lookup is done. This gets some performance for common cases. For
f22ef01cSRoman Divacky// values using less than 52 bits, the value is converted to double and then
f22ef01cSRoman Divacky// the libc sqrt function is called. The result is rounded and then converted
f22ef01cSRoman Divacky// back to a uint64_t which is then used to construct the result. Finally,
f22ef01cSRoman Divacky// the Babylonian method for computing square roots is used.
f22ef01cSRoman DivackyAPInt APInt::sqrt() const {
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  // Determine the magnitude of the value.
f22ef01cSRoman Divacky  unsigned magnitude = getActiveBits();
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  // Use a fast table for some small values. This also gets rid of some
f22ef01cSRoman Divacky  // rounding errors in libc sqrt for small values.
f22ef01cSRoman Divacky  if (magnitude <= 5) {
f22ef01cSRoman Divacky    static const uint8_t results[32] = {
f22ef01cSRoman Divacky      /*     0 */ 0,
f22ef01cSRoman Divacky      /*  1- 2 */ 1, 1,
f22ef01cSRoman Divacky      /*  3- 6 */ 2, 2, 2, 2,
f22ef01cSRoman Divacky      /*  7-12 */ 3, 3, 3, 3, 3, 3,
f22ef01cSRoman Divacky      /* 13-20 */ 4, 4, 4, 4, 4, 4, 4, 4,
f22ef01cSRoman Divacky      /* 21-30 */ 5, 5, 5, 5, 5, 5, 5, 5, 5, 5,
f22ef01cSRoman Divacky      /*    31 */ 6
f22ef01cSRoman Divacky    };
f37b6182SDimitry Andric    return APInt(BitWidth, results[ (isSingleWord() ? U.VAL : U.pVal[0]) ]);
f22ef01cSRoman Divacky  }
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  // If the magnitude of the value fits in less than 52 bits (the precision of
f22ef01cSRoman Divacky  // an IEEE double precision floating point value), then we can use the
f22ef01cSRoman Divacky  // libc sqrt function which will probably use a hardware sqrt computation.
f22ef01cSRoman Divacky  // This should be faster than the algorithm below.
f22ef01cSRoman Divacky  if (magnitude < 52) {
f22ef01cSRoman Divacky    return APInt(BitWidth,
f37b6182SDimitry Andric                 uint64_t(::round(::sqrt(double(isSingleWord() ? U.VAL
f37b6182SDimitry Andric                                                               : U.pVal[0])))));
f22ef01cSRoman Divacky  }
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  // Okay, all the short cuts are exhausted. We must compute it. The following
f22ef01cSRoman Divacky  // is a classical Babylonian method for computing the square root. This code
39d628a0SDimitry Andric  // was adapted to APInt from a wikipedia article on such computations.
f22ef01cSRoman Divacky  // See http://www.wikipedia.org/ and go to the page named
f22ef01cSRoman Divacky  // Calculate_an_integer_square_root.
f22ef01cSRoman Divacky  unsigned nbits = BitWidth, i = 4;
f22ef01cSRoman Divacky  APInt testy(BitWidth, 16);
f22ef01cSRoman Divacky  APInt x_old(BitWidth, 1);
f22ef01cSRoman Divacky  APInt x_new(BitWidth, 0);
f22ef01cSRoman Divacky  APInt two(BitWidth, 2);
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  // Select a good starting value using binary logarithms.
f22ef01cSRoman Divacky  for (;; i += 2, testy = testy.shl(2))
f22ef01cSRoman Divacky    if (i >= nbits || this->ule(testy)) {
f22ef01cSRoman Divacky      x_old = x_old.shl(i / 2);
f22ef01cSRoman Divacky      break;
f22ef01cSRoman Divacky    }
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  // Use the Babylonian method to arrive at the integer square root:
f22ef01cSRoman Divacky  for (;;) {
f22ef01cSRoman Divacky    x_new = (this->udiv(x_old) + x_old).udiv(two);
f22ef01cSRoman Divacky    if (x_old.ule(x_new))
f22ef01cSRoman Divacky      break;
f22ef01cSRoman Divacky    x_old = x_new;
f22ef01cSRoman Divacky  }
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  // Make sure we return the closest approximation
f22ef01cSRoman Divacky  // NOTE: The rounding calculation below is correct. It will produce an
f22ef01cSRoman Divacky  // off-by-one discrepancy with results from pari/gp. That discrepancy has been
f22ef01cSRoman Divacky  // determined to be a rounding issue with pari/gp as it begins to use a
f22ef01cSRoman Divacky  // floating point representation after 192 bits. There are no discrepancies
f22ef01cSRoman Divacky  // between this algorithm and pari/gp for bit widths < 192 bits.
f22ef01cSRoman Divacky  APInt square(x_old * x_old);
f22ef01cSRoman Divacky  APInt nextSquare((x_old + 1) * (x_old +1));
f22ef01cSRoman Divacky  if (this->ult(square))
f22ef01cSRoman Divacky    return x_old;
dff0c46cSDimitry Andric  assert(this->ule(nextSquare) && "Error in APInt::sqrt computation");
f22ef01cSRoman Divacky  APInt midpoint((nextSquare - square).udiv(two));
f22ef01cSRoman Divacky  APInt offset(*this - square);
f22ef01cSRoman Divacky  if (offset.ult(midpoint))
f22ef01cSRoman Divacky    return x_old;
f22ef01cSRoman Divacky  return x_old + 1;
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky/// Computes the multiplicative inverse of this APInt for a given modulo. The
f22ef01cSRoman Divacky/// iterative extended Euclidean algorithm is used to solve for this value,
f22ef01cSRoman Divacky/// however we simplify it to speed up calculating only the inverse, and take
f22ef01cSRoman Divacky/// advantage of div+rem calculations. We also use some tricks to avoid copying
f22ef01cSRoman Divacky/// (potentially large) APInts around.
f22ef01cSRoman DivackyAPInt APInt::multiplicativeInverse(const APInt& modulo) const {
f22ef01cSRoman Divacky  assert(ult(modulo) && "This APInt must be smaller than the modulo");
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  // Using the properties listed at the following web page (accessed 06/21/08):
f22ef01cSRoman Divacky  //   http://www.numbertheory.org/php/euclid.html
f22ef01cSRoman Divacky  // (especially the properties numbered 3, 4 and 9) it can be proved that
f22ef01cSRoman Divacky  // BitWidth bits suffice for all the computations in the algorithm implemented
f22ef01cSRoman Divacky  // below. More precisely, this number of bits suffice if the multiplicative
f22ef01cSRoman Divacky  // inverse exists, but may not suffice for the general extended Euclidean
f22ef01cSRoman Divacky  // algorithm.
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  APInt r[2] = { modulo, *this };
f22ef01cSRoman Divacky  APInt t[2] = { APInt(BitWidth, 0), APInt(BitWidth, 1) };
f22ef01cSRoman Divacky  APInt q(BitWidth, 0);
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  unsigned i;
f22ef01cSRoman Divacky  for (i = 0; r[i^1] != 0; i ^= 1) {
f22ef01cSRoman Divacky    // An overview of the math without the confusing bit-flipping:
f22ef01cSRoman Divacky    // q = r[i-2] / r[i-1]
f22ef01cSRoman Divacky    // r[i] = r[i-2] % r[i-1]
f22ef01cSRoman Divacky    // t[i] = t[i-2] - t[i-1] * q
f22ef01cSRoman Divacky    udivrem(r[i], r[i^1], q, r[i]);
f22ef01cSRoman Divacky    t[i] -= t[i^1] * q;
f22ef01cSRoman Divacky  }
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  // If this APInt and the modulo are not coprime, there is no multiplicative
f22ef01cSRoman Divacky  // inverse, so return 0. We check this by looking at the next-to-last
f22ef01cSRoman Divacky  // remainder, which is the gcd(*this,modulo) as calculated by the Euclidean
f22ef01cSRoman Divacky  // algorithm.
f22ef01cSRoman Divacky  if (r[i] != 1)
f22ef01cSRoman Divacky    return APInt(BitWidth, 0);
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  // The next-to-last t is the multiplicative inverse.  However, we are
5517e702SDimitry Andric  // interested in a positive inverse. Calculate a positive one from a negative
f22ef01cSRoman Divacky  // one if necessary. A simple addition of the modulo suffices because
f22ef01cSRoman Divacky  // abs(t[i]) is known to be less than *this/2 (see the link above).
5517e702SDimitry Andric  if (t[i].isNegative())
5517e702SDimitry Andric    t[i] += modulo;
5517e702SDimitry Andric
5517e702SDimitry Andric  return std::move(t[i]);
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky/// Calculate the magic numbers required to implement a signed integer division
f22ef01cSRoman Divacky/// by a constant as a sequence of multiplies, adds and shifts.  Requires that
f22ef01cSRoman Divacky/// the divisor not be 0, 1, or -1.  Taken from "Hacker's Delight", Henry S.
f22ef01cSRoman Divacky/// Warren, Jr., chapter 10.
f22ef01cSRoman DivackyAPInt::ms APInt::magic() const {
f22ef01cSRoman Divacky  const APInt& d = *this;
f22ef01cSRoman Divacky  unsigned p;
f22ef01cSRoman Divacky  APInt ad, anc, delta, q1, r1, q2, r2, t;
f22ef01cSRoman Divacky  APInt signedMin = APInt::getSignedMinValue(d.getBitWidth());
f22ef01cSRoman Divacky  struct ms mag;
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  ad = d.abs();
f22ef01cSRoman Divacky  t = signedMin + (d.lshr(d.getBitWidth() - 1));
f22ef01cSRoman Divacky  anc = t - 1 - t.urem(ad);   // absolute value of nc
f22ef01cSRoman Divacky  p = d.getBitWidth() - 1;    // initialize p
f22ef01cSRoman Divacky  q1 = signedMin.udiv(anc);   // initialize q1 = 2p/abs(nc)
f22ef01cSRoman Divacky  r1 = signedMin - q1*anc;    // initialize r1 = rem(2p,abs(nc))
f22ef01cSRoman Divacky  q2 = signedMin.udiv(ad);    // initialize q2 = 2p/abs(d)
f22ef01cSRoman Divacky  r2 = signedMin - q2*ad;     // initialize r2 = rem(2p,abs(d))
f22ef01cSRoman Divacky  do {
f22ef01cSRoman Divacky    p = p + 1;
f22ef01cSRoman Divacky    q1 = q1<<1;          // update q1 = 2p/abs(nc)
f22ef01cSRoman Divacky    r1 = r1<<1;          // update r1 = rem(2p/abs(nc))
f22ef01cSRoman Divacky    if (r1.uge(anc)) {  // must be unsigned comparison
f22ef01cSRoman Divacky      q1 = q1 + 1;
f22ef01cSRoman Divacky      r1 = r1 - anc;
f22ef01cSRoman Divacky    }
f22ef01cSRoman Divacky    q2 = q2<<1;          // update q2 = 2p/abs(d)
f22ef01cSRoman Divacky    r2 = r2<<1;          // update r2 = rem(2p/abs(d))
f22ef01cSRoman Divacky    if (r2.uge(ad)) {   // must be unsigned comparison
f22ef01cSRoman Divacky      q2 = q2 + 1;
f22ef01cSRoman Divacky      r2 = r2 - ad;
f22ef01cSRoman Divacky    }
f22ef01cSRoman Divacky    delta = ad - r2;
dd6029ffSDimitry Andric  } while (q1.ult(delta) || (q1 == delta && r1 == 0));
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  mag.m = q2 + 1;
f22ef01cSRoman Divacky  if (d.isNegative()) mag.m = -mag.m;   // resulting magic number
f22ef01cSRoman Divacky  mag.s = p - d.getBitWidth();          // resulting shift
f22ef01cSRoman Divacky  return mag;
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky/// Calculate the magic numbers required to implement an unsigned integer
f22ef01cSRoman Divacky/// division by a constant as a sequence of multiplies, adds and shifts.
f22ef01cSRoman Divacky/// Requires that the divisor not be 0.  Taken from "Hacker's Delight", Henry
f22ef01cSRoman Divacky/// S. Warren, Jr., chapter 10.
3b0f4066SDimitry Andric/// LeadingZeros can be used to simplify the calculation if the upper bits
3b0f4066SDimitry Andric/// of the divided value are known zero.
3b0f4066SDimitry AndricAPInt::mu APInt::magicu(unsigned LeadingZeros) const {
f22ef01cSRoman Divacky  const APInt& d = *this;
f22ef01cSRoman Divacky  unsigned p;
f22ef01cSRoman Divacky  APInt nc, delta, q1, r1, q2, r2;
f22ef01cSRoman Divacky  struct mu magu;
f22ef01cSRoman Divacky  magu.a = 0;               // initialize "add" indicator
3b0f4066SDimitry Andric  APInt allOnes = APInt::getAllOnesValue(d.getBitWidth()).lshr(LeadingZeros);
f22ef01cSRoman Divacky  APInt signedMin = APInt::getSignedMinValue(d.getBitWidth());
f22ef01cSRoman Divacky  APInt signedMax = APInt::getSignedMaxValue(d.getBitWidth());
f22ef01cSRoman Divacky
7ae0e2c9SDimitry Andric  nc = allOnes - (allOnes - d).urem(d);
f22ef01cSRoman Divacky  p = d.getBitWidth() - 1;  // initialize p
f22ef01cSRoman Divacky  q1 = signedMin.udiv(nc);  // initialize q1 = 2p/nc
f22ef01cSRoman Divacky  r1 = signedMin - q1*nc;   // initialize r1 = rem(2p,nc)
f22ef01cSRoman Divacky  q2 = signedMax.udiv(d);   // initialize q2 = (2p-1)/d
f22ef01cSRoman Divacky  r2 = signedMax - q2*d;    // initialize r2 = rem((2p-1),d)
f22ef01cSRoman Divacky  do {
f22ef01cSRoman Divacky    p = p + 1;
f22ef01cSRoman Divacky    if (r1.uge(nc - r1)) {
f22ef01cSRoman Divacky      q1 = q1 + q1 + 1;  // update q1
f22ef01cSRoman Divacky      r1 = r1 + r1 - nc; // update r1
f22ef01cSRoman Divacky    }
f22ef01cSRoman Divacky    else {
f22ef01cSRoman Divacky      q1 = q1+q1; // update q1
f22ef01cSRoman Divacky      r1 = r1+r1; // update r1
f22ef01cSRoman Divacky    }
f22ef01cSRoman Divacky    if ((r2 + 1).uge(d - r2)) {
f22ef01cSRoman Divacky      if (q2.uge(signedMax)) magu.a = 1;
f22ef01cSRoman Divacky      q2 = q2+q2 + 1;     // update q2
f22ef01cSRoman Divacky      r2 = r2+r2 + 1 - d; // update r2
f22ef01cSRoman Divacky    }
f22ef01cSRoman Divacky    else {
f22ef01cSRoman Divacky      if (q2.uge(signedMin)) magu.a = 1;
f22ef01cSRoman Divacky      q2 = q2+q2;     // update q2
f22ef01cSRoman Divacky      r2 = r2+r2 + 1; // update r2
f22ef01cSRoman Divacky    }
f22ef01cSRoman Divacky    delta = d - 1 - r2;
f22ef01cSRoman Divacky  } while (p < d.getBitWidth()*2 &&
f22ef01cSRoman Divacky           (q1.ult(delta) || (q1 == delta && r1 == 0)));
f22ef01cSRoman Divacky  magu.m = q2 + 1; // resulting magic number
f22ef01cSRoman Divacky  magu.s = p - d.getBitWidth();  // resulting shift
f22ef01cSRoman Divacky  return magu;
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky/// Implementation of Knuth's Algorithm D (Division of nonnegative integers)
f22ef01cSRoman Divacky/// from "Art of Computer Programming, Volume 2", section 4.3.1, p. 272. The
f22ef01cSRoman Divacky/// variables here have the same names as in the algorithm. Comments explain
f22ef01cSRoman Divacky/// the algorithm and any deviation from it.
5517e702SDimitry Andricstatic void KnuthDiv(uint32_t *u, uint32_t *v, uint32_t *q, uint32_t* r,
f22ef01cSRoman Divacky                     unsigned m, unsigned n) {
f22ef01cSRoman Divacky  assert(u && "Must provide dividend");
f22ef01cSRoman Divacky  assert(v && "Must provide divisor");
f22ef01cSRoman Divacky  assert(q && "Must provide quotient");
ff0cc061SDimitry Andric  assert(u != v && u != q && v != q && "Must use different memory");
f22ef01cSRoman Divacky  assert(n>1 && "n must be > 1");
f22ef01cSRoman Divacky
ff0cc061SDimitry Andric  // b denotes the base of the number system. In our case b is 2^32.
d88c1a5aSDimitry Andric  const uint64_t b = uint64_t(1) << 32;
f22ef01cSRoman Divacky
2cab237bSDimitry Andric// The DEBUG macros here tend to be spam in the debug output if you're not
2cab237bSDimitry Andric// debugging this code. Disable them unless KNUTH_DEBUG is defined.
*b5893f02SDimitry Andric#ifdef KNUTH_DEBUG
*b5893f02SDimitry Andric#define DEBUG_KNUTH(X) LLVM_DEBUG(X)
*b5893f02SDimitry Andric#else
*b5893f02SDimitry Andric#define DEBUG_KNUTH(X) do {} while(false)
2cab237bSDimitry Andric#endif
2cab237bSDimitry Andric
*b5893f02SDimitry Andric  DEBUG_KNUTH(dbgs() << "KnuthDiv: m=" << m << " n=" << n << '\n');
*b5893f02SDimitry Andric  DEBUG_KNUTH(dbgs() << "KnuthDiv: original:");
*b5893f02SDimitry Andric  DEBUG_KNUTH(for (int i = m + n; i >= 0; i--) dbgs() << " " << u[i]);
*b5893f02SDimitry Andric  DEBUG_KNUTH(dbgs() << " by");
*b5893f02SDimitry Andric  DEBUG_KNUTH(for (int i = n; i > 0; i--) dbgs() << " " << v[i - 1]);
*b5893f02SDimitry Andric  DEBUG_KNUTH(dbgs() << '\n');
f22ef01cSRoman Divacky  // D1. [Normalize.] Set d = b / (v[n-1] + 1) and multiply all the digits of
f22ef01cSRoman Divacky  // u and v by d. Note that we have taken Knuth's advice here to use a power
f22ef01cSRoman Divacky  // of 2 value for d such that d * v[n-1] >= b/2 (b is the base). A power of
f22ef01cSRoman Divacky  // 2 allows us to shift instead of multiply and it is easy to determine the
f22ef01cSRoman Divacky  // shift amount from the leading zeros.  We are basically normalizing the u
f22ef01cSRoman Divacky  // and v so that its high bits are shifted to the top of v's range without
f22ef01cSRoman Divacky  // overflow. Note that this can require an extra word in u so that u must
f22ef01cSRoman Divacky  // be of length m+n+1.
f785676fSDimitry Andric  unsigned shift = countLeadingZeros(v[n-1]);
5517e702SDimitry Andric  uint32_t v_carry = 0;
5517e702SDimitry Andric  uint32_t u_carry = 0;
f22ef01cSRoman Divacky  if (shift) {
f22ef01cSRoman Divacky    for (unsigned i = 0; i < m+n; ++i) {
5517e702SDimitry Andric      uint32_t u_tmp = u[i] >> (32 - shift);
f22ef01cSRoman Divacky      u[i] = (u[i] << shift) | u_carry;
f22ef01cSRoman Divacky      u_carry = u_tmp;
f22ef01cSRoman Divacky    }
f22ef01cSRoman Divacky    for (unsigned i = 0; i < n; ++i) {
5517e702SDimitry Andric      uint32_t v_tmp = v[i] >> (32 - shift);
f22ef01cSRoman Divacky      v[i] = (v[i] << shift) | v_carry;
f22ef01cSRoman Divacky      v_carry = v_tmp;
f22ef01cSRoman Divacky    }
f22ef01cSRoman Divacky  }
f22ef01cSRoman Divacky  u[m+n] = u_carry;
ff0cc061SDimitry Andric
*b5893f02SDimitry Andric  DEBUG_KNUTH(dbgs() << "KnuthDiv:   normal:");
*b5893f02SDimitry Andric  DEBUG_KNUTH(for (int i = m + n; i >= 0; i--) dbgs() << " " << u[i]);
*b5893f02SDimitry Andric  DEBUG_KNUTH(dbgs() << " by");
*b5893f02SDimitry Andric  DEBUG_KNUTH(for (int i = n; i > 0; i--) dbgs() << " " << v[i - 1]);
*b5893f02SDimitry Andric  DEBUG_KNUTH(dbgs() << '\n');
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  // D2. [Initialize j.]  Set j to m. This is the loop counter over the places.
f22ef01cSRoman Divacky  int j = m;
f22ef01cSRoman Divacky  do {
*b5893f02SDimitry Andric    DEBUG_KNUTH(dbgs() << "KnuthDiv: quotient digit #" << j << '\n');
f22ef01cSRoman Divacky    // D3. [Calculate q'.].
f22ef01cSRoman Divacky    //     Set qp = (u[j+n]*b + u[j+n-1]) / v[n-1]. (qp=qprime=q')
f22ef01cSRoman Divacky    //     Set rp = (u[j+n]*b + u[j+n-1]) % v[n-1]. (rp=rprime=r')
f22ef01cSRoman Divacky    // Now test if qp == b or qp*v[n-2] > b*rp + u[j+n-2]; if so, decrease
5517e702SDimitry Andric    // qp by 1, increase rp by v[n-1], and repeat this test if rp < b. The test
f22ef01cSRoman Divacky    // on v[n-2] determines at high speed most of the cases in which the trial
f22ef01cSRoman Divacky    // value qp is one too large, and it eliminates all cases where qp is two
f22ef01cSRoman Divacky    // too large.
5517e702SDimitry Andric    uint64_t dividend = Make_64(u[j+n], u[j+n-1]);
*b5893f02SDimitry Andric    DEBUG_KNUTH(dbgs() << "KnuthDiv: dividend == " << dividend << '\n');
f22ef01cSRoman Divacky    uint64_t qp = dividend / v[n-1];
f22ef01cSRoman Divacky    uint64_t rp = dividend % v[n-1];
f22ef01cSRoman Divacky    if (qp == b || qp*v[n-2] > b*rp + u[j+n-2]) {
f22ef01cSRoman Divacky      qp--;
f22ef01cSRoman Divacky      rp += v[n-1];
f22ef01cSRoman Divacky      if (rp < b && (qp == b || qp*v[n-2] > b*rp + u[j+n-2]))
f22ef01cSRoman Divacky        qp--;
f22ef01cSRoman Divacky    }
*b5893f02SDimitry Andric    DEBUG_KNUTH(dbgs() << "KnuthDiv: qp == " << qp << ", rp == " << rp << '\n');
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky    // D4. [Multiply and subtract.] Replace (u[j+n]u[j+n-1]...u[j]) with
f22ef01cSRoman Divacky    // (u[j+n]u[j+n-1]..u[j]) - qp * (v[n-1]...v[1]v[0]). This computation
f22ef01cSRoman Divacky    // consists of a simple multiplication by a one-place number, combined with
f22ef01cSRoman Divacky    // a subtraction.
f22ef01cSRoman Divacky    // The digits (u[j+n]...u[j]) should be kept positive; if the result of
f22ef01cSRoman Divacky    // this step is actually negative, (u[j+n]...u[j]) should be left as the
f22ef01cSRoman Divacky    // true value plus b**(n+1), namely as the b's complement of
f22ef01cSRoman Divacky    // the true value, and a "borrow" to the left should be remembered.
ff0cc061SDimitry Andric    int64_t borrow = 0;
ff0cc061SDimitry Andric    for (unsigned i = 0; i < n; ++i) {
ff0cc061SDimitry Andric      uint64_t p = uint64_t(qp) * uint64_t(v[i]);
5517e702SDimitry Andric      int64_t subres = int64_t(u[j+i]) - borrow - Lo_32(p);
5517e702SDimitry Andric      u[j+i] = Lo_32(subres);
5517e702SDimitry Andric      borrow = Hi_32(p) - Hi_32(subres);
*b5893f02SDimitry Andric      DEBUG_KNUTH(dbgs() << "KnuthDiv: u[j+i] = " << u[j + i]
ff0cc061SDimitry Andric                        << ", borrow = " << borrow << '\n');
f22ef01cSRoman Divacky    }
ff0cc061SDimitry Andric    bool isNeg = u[j+n] < borrow;
5517e702SDimitry Andric    u[j+n] -= Lo_32(borrow);
ff0cc061SDimitry Andric
*b5893f02SDimitry Andric    DEBUG_KNUTH(dbgs() << "KnuthDiv: after subtraction:");
*b5893f02SDimitry Andric    DEBUG_KNUTH(for (int i = m + n; i >= 0; i--) dbgs() << " " << u[i]);
*b5893f02SDimitry Andric    DEBUG_KNUTH(dbgs() << '\n');
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky    // D5. [Test remainder.] Set q[j] = qp. If the result of step D4 was
f22ef01cSRoman Divacky    // negative, go to step D6; otherwise go on to step D7.
5517e702SDimitry Andric    q[j] = Lo_32(qp);
f22ef01cSRoman Divacky    if (isNeg) {
f22ef01cSRoman Divacky      // D6. [Add back]. The probability that this step is necessary is very
f22ef01cSRoman Divacky      // small, on the order of only 2/b. Make sure that test data accounts for
f22ef01cSRoman Divacky      // this possibility. Decrease q[j] by 1
f22ef01cSRoman Divacky      q[j]--;
f22ef01cSRoman Divacky      // and add (0v[n-1]...v[1]v[0]) to (u[j+n]u[j+n-1]...u[j+1]u[j]).
f22ef01cSRoman Divacky      // A carry will occur to the left of u[j+n], and it should be ignored
f22ef01cSRoman Divacky      // since it cancels with the borrow that occurred in D4.
f22ef01cSRoman Divacky      bool carry = false;
f22ef01cSRoman Divacky      for (unsigned i = 0; i < n; i++) {
5517e702SDimitry Andric        uint32_t limit = std::min(u[j+i],v[i]);
f22ef01cSRoman Divacky        u[j+i] += v[i] + carry;
f22ef01cSRoman Divacky        carry = u[j+i] < limit || (carry && u[j+i] == limit);
f22ef01cSRoman Divacky      }
f22ef01cSRoman Divacky      u[j+n] += carry;
f22ef01cSRoman Divacky    }
*b5893f02SDimitry Andric    DEBUG_KNUTH(dbgs() << "KnuthDiv: after correction:");
*b5893f02SDimitry Andric    DEBUG_KNUTH(for (int i = m + n; i >= 0; i--) dbgs() << " " << u[i]);
*b5893f02SDimitry Andric    DEBUG_KNUTH(dbgs() << "\nKnuthDiv: digit result = " << q[j] << '\n');
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky    // D7. [Loop on j.]  Decrease j by one. Now if j >= 0, go back to D3.
f22ef01cSRoman Divacky  } while (--j >= 0);
f22ef01cSRoman Divacky
*b5893f02SDimitry Andric  DEBUG_KNUTH(dbgs() << "KnuthDiv: quotient:");
*b5893f02SDimitry Andric  DEBUG_KNUTH(for (int i = m; i >= 0; i--) dbgs() << " " << q[i]);
*b5893f02SDimitry Andric  DEBUG_KNUTH(dbgs() << '\n');
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  // D8. [Unnormalize]. Now q[...] is the desired quotient, and the desired
f22ef01cSRoman Divacky  // remainder may be obtained by dividing u[...] by d. If r is non-null we
f22ef01cSRoman Divacky  // compute the remainder (urem uses this).
f22ef01cSRoman Divacky  if (r) {
f22ef01cSRoman Divacky    // The value d is expressed by the "shift" value above since we avoided
f22ef01cSRoman Divacky    // multiplication by d by using a shift left. So, all we have to do is
7a7e6055SDimitry Andric    // shift right here.
f22ef01cSRoman Divacky    if (shift) {
5517e702SDimitry Andric      uint32_t carry = 0;
*b5893f02SDimitry Andric      DEBUG_KNUTH(dbgs() << "KnuthDiv: remainder:");
f22ef01cSRoman Divacky      for (int i = n-1; i >= 0; i--) {
f22ef01cSRoman Divacky        r[i] = (u[i] >> shift) | carry;
f22ef01cSRoman Divacky        carry = u[i] << (32 - shift);
*b5893f02SDimitry Andric        DEBUG_KNUTH(dbgs() << " " << r[i]);
f22ef01cSRoman Divacky      }
f22ef01cSRoman Divacky    } else {
f22ef01cSRoman Divacky      for (int i = n-1; i >= 0; i--) {
f22ef01cSRoman Divacky        r[i] = u[i];
*b5893f02SDimitry Andric        DEBUG_KNUTH(dbgs() << " " << r[i]);
f22ef01cSRoman Divacky      }
f22ef01cSRoman Divacky    }
*b5893f02SDimitry Andric    DEBUG_KNUTH(dbgs() << '\n');
f22ef01cSRoman Divacky  }
*b5893f02SDimitry Andric  DEBUG_KNUTH(dbgs() << '\n');
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
d8866befSDimitry Andricvoid APInt::divide(const WordType *LHS, unsigned lhsWords, const WordType *RHS,
d8866befSDimitry Andric                   unsigned rhsWords, WordType *Quotient, WordType *Remainder) {
f22ef01cSRoman Divacky  assert(lhsWords >= rhsWords && "Fractional result");
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  // First, compose the values into an array of 32-bit words instead of
f22ef01cSRoman Divacky  // 64-bit words. This is a necessity of both the "short division" algorithm
f22ef01cSRoman Divacky  // and the Knuth "classical algorithm" which requires there to be native
f22ef01cSRoman Divacky  // operations for +, -, and * on an m bit value with an m*2 bit result. We
f22ef01cSRoman Divacky  // can't use 64-bit operands here because we don't have native results of
f22ef01cSRoman Divacky  // 128-bits. Furthermore, casting the 64-bit values to 32-bit values won't
f22ef01cSRoman Divacky  // work on large-endian machines.
f22ef01cSRoman Divacky  unsigned n = rhsWords * 2;
f22ef01cSRoman Divacky  unsigned m = (lhsWords * 2) - n;
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  // Allocate space for the temporary values we need either on the stack, if
f22ef01cSRoman Divacky  // it will fit, or on the heap if it won't.
5517e702SDimitry Andric  uint32_t SPACE[128];
5517e702SDimitry Andric  uint32_t *U = nullptr;
5517e702SDimitry Andric  uint32_t *V = nullptr;
5517e702SDimitry Andric  uint32_t *Q = nullptr;
5517e702SDimitry Andric  uint32_t *R = nullptr;
f22ef01cSRoman Divacky  if ((Remainder?4:3)*n+2*m+1 <= 128) {
f22ef01cSRoman Divacky    U = &SPACE[0];
f22ef01cSRoman Divacky    V = &SPACE[m+n+1];
f22ef01cSRoman Divacky    Q = &SPACE[(m+n+1) + n];
f22ef01cSRoman Divacky    if (Remainder)
f22ef01cSRoman Divacky      R = &SPACE[(m+n+1) + n + (m+n)];
f22ef01cSRoman Divacky  } else {
5517e702SDimitry Andric    U = new uint32_t[m + n + 1];
5517e702SDimitry Andric    V = new uint32_t[n];
5517e702SDimitry Andric    Q = new uint32_t[m+n];
f22ef01cSRoman Divacky    if (Remainder)
5517e702SDimitry Andric      R = new uint32_t[n];
f22ef01cSRoman Divacky  }
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  // Initialize the dividend
5517e702SDimitry Andric  memset(U, 0, (m+n+1)*sizeof(uint32_t));
f22ef01cSRoman Divacky  for (unsigned i = 0; i < lhsWords; ++i) {
d8866befSDimitry Andric    uint64_t tmp = LHS[i];
5517e702SDimitry Andric    U[i * 2] = Lo_32(tmp);
5517e702SDimitry Andric    U[i * 2 + 1] = Hi_32(tmp);
f22ef01cSRoman Divacky  }
f22ef01cSRoman Divacky  U[m+n] = 0; // this extra word is for "spill" in the Knuth algorithm.
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  // Initialize the divisor
5517e702SDimitry Andric  memset(V, 0, (n)*sizeof(uint32_t));
f22ef01cSRoman Divacky  for (unsigned i = 0; i < rhsWords; ++i) {
d8866befSDimitry Andric    uint64_t tmp = RHS[i];
5517e702SDimitry Andric    V[i * 2] = Lo_32(tmp);
5517e702SDimitry Andric    V[i * 2 + 1] = Hi_32(tmp);
f22ef01cSRoman Divacky  }
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  // initialize the quotient and remainder
5517e702SDimitry Andric  memset(Q, 0, (m+n) * sizeof(uint32_t));
f22ef01cSRoman Divacky  if (Remainder)
5517e702SDimitry Andric    memset(R, 0, n * sizeof(uint32_t));
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  // Now, adjust m and n for the Knuth division. n is the number of words in
f22ef01cSRoman Divacky  // the divisor. m is the number of words by which the dividend exceeds the
f22ef01cSRoman Divacky  // divisor (i.e. m+n is the length of the dividend). These sizes must not
f22ef01cSRoman Divacky  // contain any zero words or the Knuth algorithm fails.
f22ef01cSRoman Divacky  for (unsigned i = n; i > 0 && V[i-1] == 0; i--) {
f22ef01cSRoman Divacky    n--;
f22ef01cSRoman Divacky    m++;
f22ef01cSRoman Divacky  }
f22ef01cSRoman Divacky  for (unsigned i = m+n; i > 0 && U[i-1] == 0; i--)
f22ef01cSRoman Divacky    m--;
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  // If we're left with only a single word for the divisor, Knuth doesn't work
f22ef01cSRoman Divacky  // so we implement the short division algorithm here. This is much simpler
f22ef01cSRoman Divacky  // and faster because we are certain that we can divide a 64-bit quantity
f22ef01cSRoman Divacky  // by a 32-bit quantity at hardware speed and short division is simply a
f22ef01cSRoman Divacky  // series of such operations. This is just like doing short division but we
f22ef01cSRoman Divacky  // are using base 2^32 instead of base 10.
f22ef01cSRoman Divacky  assert(n != 0 && "Divide by zero?");
f22ef01cSRoman Divacky  if (n == 1) {
5517e702SDimitry Andric    uint32_t divisor = V[0];
5517e702SDimitry Andric    uint32_t remainder = 0;
5517e702SDimitry Andric    for (int i = m; i >= 0; i--) {
5517e702SDimitry Andric      uint64_t partial_dividend = Make_64(remainder, U[i]);
f22ef01cSRoman Divacky      if (partial_dividend == 0) {
f22ef01cSRoman Divacky        Q[i] = 0;
f22ef01cSRoman Divacky        remainder = 0;
f22ef01cSRoman Divacky      } else if (partial_dividend < divisor) {
f22ef01cSRoman Divacky        Q[i] = 0;
5517e702SDimitry Andric        remainder = Lo_32(partial_dividend);
f22ef01cSRoman Divacky      } else if (partial_dividend == divisor) {
f22ef01cSRoman Divacky        Q[i] = 1;
f22ef01cSRoman Divacky        remainder = 0;
f22ef01cSRoman Divacky      } else {
5517e702SDimitry Andric        Q[i] = Lo_32(partial_dividend / divisor);
5517e702SDimitry Andric        remainder = Lo_32(partial_dividend - (Q[i] * divisor));
f22ef01cSRoman Divacky      }
f22ef01cSRoman Divacky    }
f22ef01cSRoman Divacky    if (R)
f22ef01cSRoman Divacky      R[0] = remainder;
f22ef01cSRoman Divacky  } else {
f22ef01cSRoman Divacky    // Now we're ready to invoke the Knuth classical divide algorithm. In this
f22ef01cSRoman Divacky    // case n > 1.
f22ef01cSRoman Divacky    KnuthDiv(U, V, Q, R, m, n);
f22ef01cSRoman Divacky  }
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  // If the caller wants the quotient
f22ef01cSRoman Divacky  if (Quotient) {
f22ef01cSRoman Divacky    for (unsigned i = 0; i < lhsWords; ++i)
d8866befSDimitry Andric      Quotient[i] = Make_64(Q[i*2+1], Q[i*2]);
f22ef01cSRoman Divacky  }
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  // If the caller wants the remainder
f22ef01cSRoman Divacky  if (Remainder) {
f22ef01cSRoman Divacky    for (unsigned i = 0; i < rhsWords; ++i)
d8866befSDimitry Andric      Remainder[i] = Make_64(R[i*2+1], R[i*2]);
f22ef01cSRoman Divacky  }
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  // Clean up the memory we allocated.
f22ef01cSRoman Divacky  if (U != &SPACE[0]) {
f22ef01cSRoman Divacky    delete [] U;
f22ef01cSRoman Divacky    delete [] V;
f22ef01cSRoman Divacky    delete [] Q;
f22ef01cSRoman Divacky    delete [] R;
f22ef01cSRoman Divacky  }
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
f22ef01cSRoman DivackyAPInt APInt::udiv(const APInt &RHS) const {
f22ef01cSRoman Divacky  assert(BitWidth == RHS.BitWidth && "Bit widths must be the same");
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  // First, deal with the easy case
f22ef01cSRoman Divacky  if (isSingleWord()) {
f37b6182SDimitry Andric    assert(RHS.U.VAL != 0 && "Divide by zero?");
f37b6182SDimitry Andric    return APInt(BitWidth, U.VAL / RHS.U.VAL);
f22ef01cSRoman Divacky  }
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  // Get some facts about the LHS and RHS number of bits and words
5517e702SDimitry Andric  unsigned lhsWords = getNumWords(getActiveBits());
f22ef01cSRoman Divacky  unsigned rhsBits  = RHS.getActiveBits();
5517e702SDimitry Andric  unsigned rhsWords = getNumWords(rhsBits);
f22ef01cSRoman Divacky  assert(rhsWords && "Divided by zero???");
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  // Deal with some degenerate cases
f22ef01cSRoman Divacky  if (!lhsWords)
f22ef01cSRoman Divacky    // 0 / X ===> 0
f22ef01cSRoman Divacky    return APInt(BitWidth, 0);
5517e702SDimitry Andric  if (rhsBits == 1)
5517e702SDimitry Andric    // X / 1 ===> X
5517e702SDimitry Andric    return *this;
5517e702SDimitry Andric  if (lhsWords < rhsWords || this->ult(RHS))
f22ef01cSRoman Divacky    // X / Y ===> 0, iff X < Y
f22ef01cSRoman Divacky    return APInt(BitWidth, 0);
5517e702SDimitry Andric  if (*this == RHS)
f22ef01cSRoman Divacky    // X / X ===> 1
f22ef01cSRoman Divacky    return APInt(BitWidth, 1);
5517e702SDimitry Andric  if (lhsWords == 1) // rhsWords is 1 if lhsWords is 1.
f22ef01cSRoman Divacky    // All high words are zero, just use native divide
f37b6182SDimitry Andric    return APInt(BitWidth, this->U.pVal[0] / RHS.U.pVal[0]);
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  // We have to compute it the hard way. Invoke the Knuth divide algorithm.
d8866befSDimitry Andric  APInt Quotient(BitWidth, 0); // to hold result.
d8866befSDimitry Andric  divide(U.pVal, lhsWords, RHS.U.pVal, rhsWords, Quotient.U.pVal, nullptr);
d8866befSDimitry Andric  return Quotient;
d8866befSDimitry Andric}
d8866befSDimitry Andric
d8866befSDimitry AndricAPInt APInt::udiv(uint64_t RHS) const {
d8866befSDimitry Andric  assert(RHS != 0 && "Divide by zero?");
d8866befSDimitry Andric
d8866befSDimitry Andric  // First, deal with the easy case
d8866befSDimitry Andric  if (isSingleWord())
d8866befSDimitry Andric    return APInt(BitWidth, U.VAL / RHS);
d8866befSDimitry Andric
d8866befSDimitry Andric  // Get some facts about the LHS words.
d8866befSDimitry Andric  unsigned lhsWords = getNumWords(getActiveBits());
d8866befSDimitry Andric
d8866befSDimitry Andric  // Deal with some degenerate cases
d8866befSDimitry Andric  if (!lhsWords)
d8866befSDimitry Andric    // 0 / X ===> 0
d8866befSDimitry Andric    return APInt(BitWidth, 0);
d8866befSDimitry Andric  if (RHS == 1)
d8866befSDimitry Andric    // X / 1 ===> X
d8866befSDimitry Andric    return *this;
d8866befSDimitry Andric  if (this->ult(RHS))
d8866befSDimitry Andric    // X / Y ===> 0, iff X < Y
d8866befSDimitry Andric    return APInt(BitWidth, 0);
d8866befSDimitry Andric  if (*this == RHS)
d8866befSDimitry Andric    // X / X ===> 1
d8866befSDimitry Andric    return APInt(BitWidth, 1);
d8866befSDimitry Andric  if (lhsWords == 1) // rhsWords is 1 if lhsWords is 1.
d8866befSDimitry Andric    // All high words are zero, just use native divide
d8866befSDimitry Andric    return APInt(BitWidth, this->U.pVal[0] / RHS);
d8866befSDimitry Andric
d8866befSDimitry Andric  // We have to compute it the hard way. Invoke the Knuth divide algorithm.
d8866befSDimitry Andric  APInt Quotient(BitWidth, 0); // to hold result.
d8866befSDimitry Andric  divide(U.pVal, lhsWords, &RHS, 1, Quotient.U.pVal, nullptr);
f22ef01cSRoman Divacky  return Quotient;
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
139f7f9bSDimitry AndricAPInt APInt::sdiv(const APInt &RHS) const {
139f7f9bSDimitry Andric  if (isNegative()) {
139f7f9bSDimitry Andric    if (RHS.isNegative())
139f7f9bSDimitry Andric      return (-(*this)).udiv(-RHS);
139f7f9bSDimitry Andric    return -((-(*this)).udiv(RHS));
139f7f9bSDimitry Andric  }
139f7f9bSDimitry Andric  if (RHS.isNegative())
139f7f9bSDimitry Andric    return -(this->udiv(-RHS));
139f7f9bSDimitry Andric  return this->udiv(RHS);
139f7f9bSDimitry Andric}
139f7f9bSDimitry Andric
d8866befSDimitry AndricAPInt APInt::sdiv(int64_t RHS) const {
d8866befSDimitry Andric  if (isNegative()) {
d8866befSDimitry Andric    if (RHS < 0)
d8866befSDimitry Andric      return (-(*this)).udiv(-RHS);
d8866befSDimitry Andric    return -((-(*this)).udiv(RHS));
d8866befSDimitry Andric  }
d8866befSDimitry Andric  if (RHS < 0)
d8866befSDimitry Andric    return -(this->udiv(-RHS));
d8866befSDimitry Andric  return this->udiv(RHS);
d8866befSDimitry Andric}
d8866befSDimitry Andric
f22ef01cSRoman DivackyAPInt APInt::urem(const APInt &RHS) const {
f22ef01cSRoman Divacky  assert(BitWidth == RHS.BitWidth && "Bit widths must be the same");
f22ef01cSRoman Divacky  if (isSingleWord()) {
f37b6182SDimitry Andric    assert(RHS.U.VAL != 0 && "Remainder by zero?");
f37b6182SDimitry Andric    return APInt(BitWidth, U.VAL % RHS.U.VAL);
f22ef01cSRoman Divacky  }
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  // Get some facts about the LHS
5517e702SDimitry Andric  unsigned lhsWords = getNumWords(getActiveBits());
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  // Get some facts about the RHS
f22ef01cSRoman Divacky  unsigned rhsBits = RHS.getActiveBits();
5517e702SDimitry Andric  unsigned rhsWords = getNumWords(rhsBits);
f22ef01cSRoman Divacky  assert(rhsWords && "Performing remainder operation by zero ???");
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  // Check the degenerate cases
5517e702SDimitry Andric  if (lhsWords == 0)
f22ef01cSRoman Divacky    // 0 % Y ===> 0
f22ef01cSRoman Divacky    return APInt(BitWidth, 0);
5517e702SDimitry Andric  if (rhsBits == 1)
5517e702SDimitry Andric    // X % 1 ===> 0
5517e702SDimitry Andric    return APInt(BitWidth, 0);
5517e702SDimitry Andric  if (lhsWords < rhsWords || this->ult(RHS))
f22ef01cSRoman Divacky    // X % Y ===> X, iff X < Y
f22ef01cSRoman Divacky    return *this;
5517e702SDimitry Andric  if (*this == RHS)
f22ef01cSRoman Divacky    // X % X == 0;
f22ef01cSRoman Divacky    return APInt(BitWidth, 0);
5517e702SDimitry Andric  if (lhsWords == 1)
f22ef01cSRoman Divacky    // All high words are zero, just use native remainder
f37b6182SDimitry Andric    return APInt(BitWidth, U.pVal[0] % RHS.U.pVal[0]);
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  // We have to compute it the hard way. Invoke the Knuth divide algorithm.
d8866befSDimitry Andric  APInt Remainder(BitWidth, 0);
d8866befSDimitry Andric  divide(U.pVal, lhsWords, RHS.U.pVal, rhsWords, nullptr, Remainder.U.pVal);
d8866befSDimitry Andric  return Remainder;
d8866befSDimitry Andric}
d8866befSDimitry Andric
d8866befSDimitry Andricuint64_t APInt::urem(uint64_t RHS) const {
d8866befSDimitry Andric  assert(RHS != 0 && "Remainder by zero?");
d8866befSDimitry Andric
d8866befSDimitry Andric  if (isSingleWord())
d8866befSDimitry Andric    return U.VAL % RHS;
d8866befSDimitry Andric
d8866befSDimitry Andric  // Get some facts about the LHS
d8866befSDimitry Andric  unsigned lhsWords = getNumWords(getActiveBits());
d8866befSDimitry Andric
d8866befSDimitry Andric  // Check the degenerate cases
d8866befSDimitry Andric  if (lhsWords == 0)
d8866befSDimitry Andric    // 0 % Y ===> 0
d8866befSDimitry Andric    return 0;
d8866befSDimitry Andric  if (RHS == 1)
d8866befSDimitry Andric    // X % 1 ===> 0
d8866befSDimitry Andric    return 0;
d8866befSDimitry Andric  if (this->ult(RHS))
d8866befSDimitry Andric    // X % Y ===> X, iff X < Y
d8866befSDimitry Andric    return getZExtValue();
d8866befSDimitry Andric  if (*this == RHS)
d8866befSDimitry Andric    // X % X == 0;
d8866befSDimitry Andric    return 0;
d8866befSDimitry Andric  if (lhsWords == 1)
d8866befSDimitry Andric    // All high words are zero, just use native remainder
d8866befSDimitry Andric    return U.pVal[0] % RHS;
d8866befSDimitry Andric
d8866befSDimitry Andric  // We have to compute it the hard way. Invoke the Knuth divide algorithm.
d8866befSDimitry Andric  uint64_t Remainder;
d8866befSDimitry Andric  divide(U.pVal, lhsWords, &RHS, 1, nullptr, &Remainder);
f22ef01cSRoman Divacky  return Remainder;
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
139f7f9bSDimitry AndricAPInt APInt::srem(const APInt &RHS) const {
139f7f9bSDimitry Andric  if (isNegative()) {
139f7f9bSDimitry Andric    if (RHS.isNegative())
139f7f9bSDimitry Andric      return -((-(*this)).urem(-RHS));
139f7f9bSDimitry Andric    return -((-(*this)).urem(RHS));
139f7f9bSDimitry Andric  }
139f7f9bSDimitry Andric  if (RHS.isNegative())
139f7f9bSDimitry Andric    return this->urem(-RHS);
139f7f9bSDimitry Andric  return this->urem(RHS);
139f7f9bSDimitry Andric}
139f7f9bSDimitry Andric
d8866befSDimitry Andricint64_t APInt::srem(int64_t RHS) const {
d8866befSDimitry Andric  if (isNegative()) {
d8866befSDimitry Andric    if (RHS < 0)
d8866befSDimitry Andric      return -((-(*this)).urem(-RHS));
d8866befSDimitry Andric    return -((-(*this)).urem(RHS));
d8866befSDimitry Andric  }
d8866befSDimitry Andric  if (RHS < 0)
d8866befSDimitry Andric    return this->urem(-RHS);
d8866befSDimitry Andric  return this->urem(RHS);
d8866befSDimitry Andric}
d8866befSDimitry Andric
f22ef01cSRoman Divackyvoid APInt::udivrem(const APInt &LHS, const APInt &RHS,
f22ef01cSRoman Divacky                    APInt &Quotient, APInt &Remainder) {
39d628a0SDimitry Andric  assert(LHS.BitWidth == RHS.BitWidth && "Bit widths must be the same");
5517e702SDimitry Andric  unsigned BitWidth = LHS.BitWidth;
39d628a0SDimitry Andric
39d628a0SDimitry Andric  // First, deal with the easy case
39d628a0SDimitry Andric  if (LHS.isSingleWord()) {
f37b6182SDimitry Andric    assert(RHS.U.VAL != 0 && "Divide by zero?");
f37b6182SDimitry Andric    uint64_t QuotVal = LHS.U.VAL / RHS.U.VAL;
f37b6182SDimitry Andric    uint64_t RemVal = LHS.U.VAL % RHS.U.VAL;
5517e702SDimitry Andric    Quotient = APInt(BitWidth, QuotVal);
5517e702SDimitry Andric    Remainder = APInt(BitWidth, RemVal);
39d628a0SDimitry Andric    return;
39d628a0SDimitry Andric  }
39d628a0SDimitry Andric
f22ef01cSRoman Divacky  // Get some size facts about the dividend and divisor
5517e702SDimitry Andric  unsigned lhsWords = getNumWords(LHS.getActiveBits());
f22ef01cSRoman Divacky  unsigned rhsBits  = RHS.getActiveBits();
5517e702SDimitry Andric  unsigned rhsWords = getNumWords(rhsBits);
5517e702SDimitry Andric  assert(rhsWords && "Performing divrem operation by zero ???");
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  // Check the degenerate cases
f22ef01cSRoman Divacky  if (lhsWords == 0) {
4ba319b5SDimitry Andric    Quotient = APInt(BitWidth, 0);    // 0 / Y ===> 0
4ba319b5SDimitry Andric    Remainder = APInt(BitWidth, 0);   // 0 % Y ===> 0
f22ef01cSRoman Divacky    return;
f22ef01cSRoman Divacky  }
f22ef01cSRoman Divacky
5517e702SDimitry Andric  if (rhsBits == 1) {
5517e702SDimitry Andric    Quotient = LHS;                   // X / 1 ===> X
4ba319b5SDimitry Andric    Remainder = APInt(BitWidth, 0);   // X % 1 ===> 0
5517e702SDimitry Andric  }
5517e702SDimitry Andric
f22ef01cSRoman Divacky  if (lhsWords < rhsWords || LHS.ult(RHS)) {
f22ef01cSRoman Divacky    Remainder = LHS;                  // X % Y ===> X, iff X < Y
4ba319b5SDimitry Andric    Quotient = APInt(BitWidth, 0);    // X / Y ===> 0, iff X < Y
f22ef01cSRoman Divacky    return;
f22ef01cSRoman Divacky  }
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  if (LHS == RHS) {
4ba319b5SDimitry Andric    Quotient  = APInt(BitWidth, 1);   // X / X ===> 1
4ba319b5SDimitry Andric    Remainder = APInt(BitWidth, 0);   // X % X ===> 0;
f22ef01cSRoman Divacky    return;
f22ef01cSRoman Divacky  }
f22ef01cSRoman Divacky
d8866befSDimitry Andric  // Make sure there is enough space to hold the results.
d8866befSDimitry Andric  // NOTE: This assumes that reallocate won't affect any bits if it doesn't
d8866befSDimitry Andric  // change the size. This is necessary if Quotient or Remainder is aliased
d8866befSDimitry Andric  // with LHS or RHS.
d8866befSDimitry Andric  Quotient.reallocate(BitWidth);
d8866befSDimitry Andric  Remainder.reallocate(BitWidth);
d8866befSDimitry Andric
5517e702SDimitry Andric  if (lhsWords == 1) { // rhsWords is 1 if lhsWords is 1.
f22ef01cSRoman Divacky    // There is only one word to consider so use the native versions.
5517e702SDimitry Andric    uint64_t lhsValue = LHS.U.pVal[0];
5517e702SDimitry Andric    uint64_t rhsValue = RHS.U.pVal[0];
5517e702SDimitry Andric    Quotient = lhsValue / rhsValue;
5517e702SDimitry Andric    Remainder = lhsValue % rhsValue;
f22ef01cSRoman Divacky    return;
f22ef01cSRoman Divacky  }
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  // Okay, lets do it the long way
d8866befSDimitry Andric  divide(LHS.U.pVal, lhsWords, RHS.U.pVal, rhsWords, Quotient.U.pVal,
d8866befSDimitry Andric         Remainder.U.pVal);
d8866befSDimitry Andric  // Clear the rest of the Quotient and Remainder.
d8866befSDimitry Andric  std::memset(Quotient.U.pVal + lhsWords, 0,
d8866befSDimitry Andric              (getNumWords(BitWidth) - lhsWords) * APINT_WORD_SIZE);
d8866befSDimitry Andric  std::memset(Remainder.U.pVal + rhsWords, 0,
d8866befSDimitry Andric              (getNumWords(BitWidth) - rhsWords) * APINT_WORD_SIZE);
d8866befSDimitry Andric}
d8866befSDimitry Andric
d8866befSDimitry Andricvoid APInt::udivrem(const APInt &LHS, uint64_t RHS, APInt &Quotient,
d8866befSDimitry Andric                    uint64_t &Remainder) {
d8866befSDimitry Andric  assert(RHS != 0 && "Divide by zero?");
d8866befSDimitry Andric  unsigned BitWidth = LHS.BitWidth;
d8866befSDimitry Andric
d8866befSDimitry Andric  // First, deal with the easy case
d8866befSDimitry Andric  if (LHS.isSingleWord()) {
d8866befSDimitry Andric    uint64_t QuotVal = LHS.U.VAL / RHS;
d8866befSDimitry Andric    Remainder = LHS.U.VAL % RHS;
d8866befSDimitry Andric    Quotient = APInt(BitWidth, QuotVal);
d8866befSDimitry Andric    return;
d8866befSDimitry Andric  }
d8866befSDimitry Andric
d8866befSDimitry Andric  // Get some size facts about the dividend and divisor
d8866befSDimitry Andric  unsigned lhsWords = getNumWords(LHS.getActiveBits());
d8866befSDimitry Andric
d8866befSDimitry Andric  // Check the degenerate cases
d8866befSDimitry Andric  if (lhsWords == 0) {
4ba319b5SDimitry Andric    Quotient = APInt(BitWidth, 0);    // 0 / Y ===> 0
d8866befSDimitry Andric    Remainder = 0;                    // 0 % Y ===> 0
d8866befSDimitry Andric    return;
d8866befSDimitry Andric  }
d8866befSDimitry Andric
d8866befSDimitry Andric  if (RHS == 1) {
d8866befSDimitry Andric    Quotient = LHS;                   // X / 1 ===> X
d8866befSDimitry Andric    Remainder = 0;                    // X % 1 ===> 0
4ba319b5SDimitry Andric    return;
d8866befSDimitry Andric  }
d8866befSDimitry Andric
d8866befSDimitry Andric  if (LHS.ult(RHS)) {
d8866befSDimitry Andric    Remainder = LHS.getZExtValue();   // X % Y ===> X, iff X < Y
4ba319b5SDimitry Andric    Quotient = APInt(BitWidth, 0);    // X / Y ===> 0, iff X < Y
d8866befSDimitry Andric    return;
d8866befSDimitry Andric  }
d8866befSDimitry Andric
d8866befSDimitry Andric  if (LHS == RHS) {
4ba319b5SDimitry Andric    Quotient  = APInt(BitWidth, 1);   // X / X ===> 1
d8866befSDimitry Andric    Remainder = 0;                    // X % X ===> 0;
d8866befSDimitry Andric    return;
d8866befSDimitry Andric  }
d8866befSDimitry Andric
d8866befSDimitry Andric  // Make sure there is enough space to hold the results.
d8866befSDimitry Andric  // NOTE: This assumes that reallocate won't affect any bits if it doesn't
d8866befSDimitry Andric  // change the size. This is necessary if Quotient is aliased with LHS.
d8866befSDimitry Andric  Quotient.reallocate(BitWidth);
d8866befSDimitry Andric
d8866befSDimitry Andric  if (lhsWords == 1) { // rhsWords is 1 if lhsWords is 1.
d8866befSDimitry Andric    // There is only one word to consider so use the native versions.
d8866befSDimitry Andric    uint64_t lhsValue = LHS.U.pVal[0];
d8866befSDimitry Andric    Quotient = lhsValue / RHS;
d8866befSDimitry Andric    Remainder = lhsValue % RHS;
d8866befSDimitry Andric    return;
d8866befSDimitry Andric  }
d8866befSDimitry Andric
d8866befSDimitry Andric  // Okay, lets do it the long way
d8866befSDimitry Andric  divide(LHS.U.pVal, lhsWords, &RHS, 1, Quotient.U.pVal, &Remainder);
d8866befSDimitry Andric  // Clear the rest of the Quotient.
d8866befSDimitry Andric  std::memset(Quotient.U.pVal + lhsWords, 0,
d8866befSDimitry Andric              (getNumWords(BitWidth) - lhsWords) * APINT_WORD_SIZE);
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
139f7f9bSDimitry Andricvoid APInt::sdivrem(const APInt &LHS, const APInt &RHS,
139f7f9bSDimitry Andric                    APInt &Quotient, APInt &Remainder) {
139f7f9bSDimitry Andric  if (LHS.isNegative()) {
139f7f9bSDimitry Andric    if (RHS.isNegative())
139f7f9bSDimitry Andric      APInt::udivrem(-LHS, -RHS, Quotient, Remainder);
139f7f9bSDimitry Andric    else {
139f7f9bSDimitry Andric      APInt::udivrem(-LHS, RHS, Quotient, Remainder);
5517e702SDimitry Andric      Quotient.negate();
139f7f9bSDimitry Andric    }
5517e702SDimitry Andric    Remainder.negate();
139f7f9bSDimitry Andric  } else if (RHS.isNegative()) {
139f7f9bSDimitry Andric    APInt::udivrem(LHS, -RHS, Quotient, Remainder);
5517e702SDimitry Andric    Quotient.negate();
139f7f9bSDimitry Andric  } else {
139f7f9bSDimitry Andric    APInt::udivrem(LHS, RHS, Quotient, Remainder);
139f7f9bSDimitry Andric  }
139f7f9bSDimitry Andric}
139f7f9bSDimitry Andric
d8866befSDimitry Andricvoid APInt::sdivrem(const APInt &LHS, int64_t RHS,
d8866befSDimitry Andric                    APInt &Quotient, int64_t &Remainder) {
d8866befSDimitry Andric  uint64_t R = Remainder;
d8866befSDimitry Andric  if (LHS.isNegative()) {
d8866befSDimitry Andric    if (RHS < 0)
d8866befSDimitry Andric      APInt::udivrem(-LHS, -RHS, Quotient, R);
d8866befSDimitry Andric    else {
d8866befSDimitry Andric      APInt::udivrem(-LHS, RHS, Quotient, R);
d8866befSDimitry Andric      Quotient.negate();
d8866befSDimitry Andric    }
d8866befSDimitry Andric    R = -R;
d8866befSDimitry Andric  } else if (RHS < 0) {
d8866befSDimitry Andric    APInt::udivrem(LHS, -RHS, Quotient, R);
d8866befSDimitry Andric    Quotient.negate();
d8866befSDimitry Andric  } else {
d8866befSDimitry Andric    APInt::udivrem(LHS, RHS, Quotient, R);
d8866befSDimitry Andric  }
d8866befSDimitry Andric  Remainder = R;
d8866befSDimitry Andric}
d8866befSDimitry Andric
2754fe60SDimitry AndricAPInt APInt::sadd_ov(const APInt &RHS, bool &Overflow) const {
2754fe60SDimitry Andric  APInt Res = *this+RHS;
2754fe60SDimitry Andric  Overflow = isNonNegative() == RHS.isNonNegative() &&
2754fe60SDimitry Andric             Res.isNonNegative() != isNonNegative();
2754fe60SDimitry Andric  return Res;
2754fe60SDimitry Andric}
2754fe60SDimitry Andric
2754fe60SDimitry AndricAPInt APInt::uadd_ov(const APInt &RHS, bool &Overflow) const {
2754fe60SDimitry Andric  APInt Res = *this+RHS;
2754fe60SDimitry Andric  Overflow = Res.ult(RHS);
2754fe60SDimitry Andric  return Res;
2754fe60SDimitry Andric}
2754fe60SDimitry Andric
2754fe60SDimitry AndricAPInt APInt::ssub_ov(const APInt &RHS, bool &Overflow) const {
2754fe60SDimitry Andric  APInt Res = *this - RHS;
2754fe60SDimitry Andric  Overflow = isNonNegative() != RHS.isNonNegative() &&
2754fe60SDimitry Andric             Res.isNonNegative() != isNonNegative();
2754fe60SDimitry Andric  return Res;
2754fe60SDimitry Andric}
2754fe60SDimitry Andric
2754fe60SDimitry AndricAPInt APInt::usub_ov(const APInt &RHS, bool &Overflow) const {
2754fe60SDimitry Andric  APInt Res = *this-RHS;
2754fe60SDimitry Andric  Overflow = Res.ugt(*this);
2754fe60SDimitry Andric  return Res;
2754fe60SDimitry Andric}
2754fe60SDimitry Andric
2754fe60SDimitry AndricAPInt APInt::sdiv_ov(const APInt &RHS, bool &Overflow) const {
2754fe60SDimitry Andric  // MININT/-1  -->  overflow.
2754fe60SDimitry Andric  Overflow = isMinSignedValue() && RHS.isAllOnesValue();
2754fe60SDimitry Andric  return sdiv(RHS);
2754fe60SDimitry Andric}
2754fe60SDimitry Andric
2754fe60SDimitry AndricAPInt APInt::smul_ov(const APInt &RHS, bool &Overflow) const {
2754fe60SDimitry Andric  APInt Res = *this * RHS;
2754fe60SDimitry Andric
2754fe60SDimitry Andric  if (*this != 0 && RHS != 0)
2754fe60SDimitry Andric    Overflow = Res.sdiv(RHS) != *this || Res.sdiv(*this) != RHS;
2754fe60SDimitry Andric  else
2754fe60SDimitry Andric    Overflow = false;
2754fe60SDimitry Andric  return Res;
2754fe60SDimitry Andric}
2754fe60SDimitry Andric
3b0f4066SDimitry AndricAPInt APInt::umul_ov(const APInt &RHS, bool &Overflow) const {
3b0f4066SDimitry Andric  APInt Res = *this * RHS;
3b0f4066SDimitry Andric
3b0f4066SDimitry Andric  if (*this != 0 && RHS != 0)
3b0f4066SDimitry Andric    Overflow = Res.udiv(RHS) != *this || Res.udiv(*this) != RHS;
3b0f4066SDimitry Andric  else
3b0f4066SDimitry Andric    Overflow = false;
3b0f4066SDimitry Andric  return Res;
3b0f4066SDimitry Andric}
3b0f4066SDimitry Andric
39d628a0SDimitry AndricAPInt APInt::sshl_ov(const APInt &ShAmt, bool &Overflow) const {
39d628a0SDimitry Andric  Overflow = ShAmt.uge(getBitWidth());
2754fe60SDimitry Andric  if (Overflow)
39d628a0SDimitry Andric    return APInt(BitWidth, 0);
2754fe60SDimitry Andric
2754fe60SDimitry Andric  if (isNonNegative()) // Don't allow sign change.
39d628a0SDimitry Andric    Overflow = ShAmt.uge(countLeadingZeros());
2754fe60SDimitry Andric  else
39d628a0SDimitry Andric    Overflow = ShAmt.uge(countLeadingOnes());
39d628a0SDimitry Andric
39d628a0SDimitry Andric  return *this << ShAmt;
39d628a0SDimitry Andric}
39d628a0SDimitry Andric
39d628a0SDimitry AndricAPInt APInt::ushl_ov(const APInt &ShAmt, bool &Overflow) const {
39d628a0SDimitry Andric  Overflow = ShAmt.uge(getBitWidth());
39d628a0SDimitry Andric  if (Overflow)
39d628a0SDimitry Andric    return APInt(BitWidth, 0);
39d628a0SDimitry Andric
39d628a0SDimitry Andric  Overflow = ShAmt.ugt(countLeadingZeros());
2754fe60SDimitry Andric
2754fe60SDimitry Andric  return *this << ShAmt;
2754fe60SDimitry Andric}
2754fe60SDimitry Andric
*b5893f02SDimitry AndricAPInt APInt::sadd_sat(const APInt &RHS) const {
*b5893f02SDimitry Andric  bool Overflow;
*b5893f02SDimitry Andric  APInt Res = sadd_ov(RHS, Overflow);
*b5893f02SDimitry Andric  if (!Overflow)
*b5893f02SDimitry Andric    return Res;
2754fe60SDimitry Andric
*b5893f02SDimitry Andric  return isNegative() ? APInt::getSignedMinValue(BitWidth)
*b5893f02SDimitry Andric                      : APInt::getSignedMaxValue(BitWidth);
*b5893f02SDimitry Andric}
*b5893f02SDimitry Andric
*b5893f02SDimitry AndricAPInt APInt::uadd_sat(const APInt &RHS) const {
*b5893f02SDimitry Andric  bool Overflow;
*b5893f02SDimitry Andric  APInt Res = uadd_ov(RHS, Overflow);
*b5893f02SDimitry Andric  if (!Overflow)
*b5893f02SDimitry Andric    return Res;
*b5893f02SDimitry Andric
*b5893f02SDimitry Andric  return APInt::getMaxValue(BitWidth);
*b5893f02SDimitry Andric}
*b5893f02SDimitry Andric
*b5893f02SDimitry AndricAPInt APInt::ssub_sat(const APInt &RHS) const {
*b5893f02SDimitry Andric  bool Overflow;
*b5893f02SDimitry Andric  APInt Res = ssub_ov(RHS, Overflow);
*b5893f02SDimitry Andric  if (!Overflow)
*b5893f02SDimitry Andric    return Res;
*b5893f02SDimitry Andric
*b5893f02SDimitry Andric  return isNegative() ? APInt::getSignedMinValue(BitWidth)
*b5893f02SDimitry Andric                      : APInt::getSignedMaxValue(BitWidth);
*b5893f02SDimitry Andric}
*b5893f02SDimitry Andric
*b5893f02SDimitry AndricAPInt APInt::usub_sat(const APInt &RHS) const {
*b5893f02SDimitry Andric  bool Overflow;
*b5893f02SDimitry Andric  APInt Res = usub_ov(RHS, Overflow);
*b5893f02SDimitry Andric  if (!Overflow)
*b5893f02SDimitry Andric    return Res;
*b5893f02SDimitry Andric
*b5893f02SDimitry Andric  return APInt(BitWidth, 0);
*b5893f02SDimitry Andric}
2754fe60SDimitry Andric
2754fe60SDimitry Andric
ffd1746dSEd Schoutenvoid APInt::fromString(unsigned numbits, StringRef str, uint8_t radix) {
f22ef01cSRoman Divacky  // Check our assumptions here
f22ef01cSRoman Divacky  assert(!str.empty() && "Invalid string length");
6122f3e6SDimitry Andric  assert((radix == 10 || radix == 8 || radix == 16 || radix == 2 ||
6122f3e6SDimitry Andric          radix == 36) &&
6122f3e6SDimitry Andric         "Radix should be 2, 8, 10, 16, or 36!");
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  StringRef::iterator p = str.begin();
f22ef01cSRoman Divacky  size_t slen = str.size();
f22ef01cSRoman Divacky  bool isNeg = *p == '-';
f22ef01cSRoman Divacky  if (*p == '-' || *p == '+') {
f22ef01cSRoman Divacky    p++;
f22ef01cSRoman Divacky    slen--;
f22ef01cSRoman Divacky    assert(slen && "String is only a sign, needs a value.");
f22ef01cSRoman Divacky  }
f22ef01cSRoman Divacky  assert((slen <= numbits || radix != 2) && "Insufficient bit width");
f22ef01cSRoman Divacky  assert(((slen-1)*3 <= numbits || radix != 8) && "Insufficient bit width");
f22ef01cSRoman Divacky  assert(((slen-1)*4 <= numbits || radix != 16) && "Insufficient bit width");
f22ef01cSRoman Divacky  assert((((slen-1)*64)/22 <= numbits || radix != 10) &&
f22ef01cSRoman Divacky         "Insufficient bit width");
f22ef01cSRoman Divacky
f37b6182SDimitry Andric  // Allocate memory if needed
f37b6182SDimitry Andric  if (isSingleWord())
f37b6182SDimitry Andric    U.VAL = 0;
f37b6182SDimitry Andric  else
f37b6182SDimitry Andric    U.pVal = getClearedMemory(getNumWords());
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  // Figure out if we can shift instead of multiply
f22ef01cSRoman Divacky  unsigned shift = (radix == 16 ? 4 : radix == 8 ? 3 : radix == 2 ? 1 : 0);
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  // Enter digit traversal loop
f22ef01cSRoman Divacky  for (StringRef::iterator e = str.end(); p != e; ++p) {
f22ef01cSRoman Divacky    unsigned digit = getDigit(*p, radix);
f22ef01cSRoman Divacky    assert(digit < radix && "Invalid character in digit string");
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky    // Shift or multiply the value by the radix
f22ef01cSRoman Divacky    if (slen > 1) {
f22ef01cSRoman Divacky      if (shift)
f22ef01cSRoman Divacky        *this <<= shift;
f22ef01cSRoman Divacky      else
0f5676f4SDimitry Andric        *this *= radix;
f22ef01cSRoman Divacky    }
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky    // Add in the digit we just interpreted
7a7e6055SDimitry Andric    *this += digit;
f22ef01cSRoman Divacky  }
f22ef01cSRoman Divacky  // If its negative, put it in two's complement form
5517e702SDimitry Andric  if (isNeg)
5517e702SDimitry Andric    this->negate();
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
f22ef01cSRoman Divackyvoid APInt::toString(SmallVectorImpl<char> &Str, unsigned Radix,
17a519f9SDimitry Andric                     bool Signed, bool formatAsCLiteral) const {
6122f3e6SDimitry Andric  assert((Radix == 10 || Radix == 8 || Radix == 16 || Radix == 2 ||
6122f3e6SDimitry Andric          Radix == 36) &&
dff0c46cSDimitry Andric         "Radix should be 2, 8, 10, 16, or 36!");
f22ef01cSRoman Divacky
17a519f9SDimitry Andric  const char *Prefix = "";
17a519f9SDimitry Andric  if (formatAsCLiteral) {
17a519f9SDimitry Andric    switch (Radix) {
17a519f9SDimitry Andric      case 2:
17a519f9SDimitry Andric        // Binary literals are a non-standard extension added in gcc 4.3:
17a519f9SDimitry Andric        // http://gcc.gnu.org/onlinedocs/gcc-4.3.0/gcc/Binary-constants.html
17a519f9SDimitry Andric        Prefix = "0b";
17a519f9SDimitry Andric        break;
17a519f9SDimitry Andric      case 8:
17a519f9SDimitry Andric        Prefix = "0";
17a519f9SDimitry Andric        break;
dff0c46cSDimitry Andric      case 10:
dff0c46cSDimitry Andric        break; // No prefix
17a519f9SDimitry Andric      case 16:
17a519f9SDimitry Andric        Prefix = "0x";
17a519f9SDimitry Andric        break;
dff0c46cSDimitry Andric      default:
dff0c46cSDimitry Andric        llvm_unreachable("Invalid radix!");
17a519f9SDimitry Andric    }
17a519f9SDimitry Andric  }
17a519f9SDimitry Andric
f22ef01cSRoman Divacky  // First, check for a zero value and just short circuit the logic below.
f22ef01cSRoman Divacky  if (*this == 0) {
17a519f9SDimitry Andric    while (*Prefix) {
17a519f9SDimitry Andric      Str.push_back(*Prefix);
17a519f9SDimitry Andric      ++Prefix;
17a519f9SDimitry Andric    };
f22ef01cSRoman Divacky    Str.push_back('0');
f22ef01cSRoman Divacky    return;
f22ef01cSRoman Divacky  }
f22ef01cSRoman Divacky
6122f3e6SDimitry Andric  static const char Digits[] = "0123456789ABCDEFGHIJKLMNOPQRSTUVWXYZ";
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  if (isSingleWord()) {
f22ef01cSRoman Divacky    char Buffer[65];
302affcbSDimitry Andric    char *BufPtr = std::end(Buffer);
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky    uint64_t N;
e580952dSDimitry Andric    if (!Signed) {
e580952dSDimitry Andric      N = getZExtValue();
e580952dSDimitry Andric    } else {
f22ef01cSRoman Divacky      int64_t I = getSExtValue();
e580952dSDimitry Andric      if (I >= 0) {
f22ef01cSRoman Divacky        N = I;
f22ef01cSRoman Divacky      } else {
e580952dSDimitry Andric        Str.push_back('-');
e580952dSDimitry Andric        N = -(uint64_t)I;
e580952dSDimitry Andric      }
f22ef01cSRoman Divacky    }
f22ef01cSRoman Divacky
17a519f9SDimitry Andric    while (*Prefix) {
17a519f9SDimitry Andric      Str.push_back(*Prefix);
17a519f9SDimitry Andric      ++Prefix;
17a519f9SDimitry Andric    };
17a519f9SDimitry Andric
f22ef01cSRoman Divacky    while (N) {
f22ef01cSRoman Divacky      *--BufPtr = Digits[N % Radix];
f22ef01cSRoman Divacky      N /= Radix;
f22ef01cSRoman Divacky    }
302affcbSDimitry Andric    Str.append(BufPtr, std::end(Buffer));
f22ef01cSRoman Divacky    return;
f22ef01cSRoman Divacky  }
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  APInt Tmp(*this);
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  if (Signed && isNegative()) {
f22ef01cSRoman Divacky    // They want to print the signed version and it is a negative value
f22ef01cSRoman Divacky    // Flip the bits and add one to turn it into the equivalent positive
f22ef01cSRoman Divacky    // value and put a '-' in the result.
5517e702SDimitry Andric    Tmp.negate();
f22ef01cSRoman Divacky    Str.push_back('-');
f22ef01cSRoman Divacky  }
f22ef01cSRoman Divacky
17a519f9SDimitry Andric  while (*Prefix) {
17a519f9SDimitry Andric    Str.push_back(*Prefix);
17a519f9SDimitry Andric    ++Prefix;
17a519f9SDimitry Andric  };
17a519f9SDimitry Andric
f22ef01cSRoman Divacky  // We insert the digits backward, then reverse them to get the right order.
f22ef01cSRoman Divacky  unsigned StartDig = Str.size();
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  // For the 2, 8 and 16 bit cases, we can just shift instead of divide
f22ef01cSRoman Divacky  // because the number of bits per digit (1, 3 and 4 respectively) divides
7a7e6055SDimitry Andric  // equally.  We just shift until the value is zero.
6122f3e6SDimitry Andric  if (Radix == 2 || Radix == 8 || Radix == 16) {
f22ef01cSRoman Divacky    // Just shift tmp right for each digit width until it becomes zero
f22ef01cSRoman Divacky    unsigned ShiftAmt = (Radix == 16 ? 4 : (Radix == 8 ? 3 : 1));
f22ef01cSRoman Divacky    unsigned MaskAmt = Radix - 1;
f22ef01cSRoman Divacky
5517e702SDimitry Andric    while (Tmp.getBoolValue()) {
f22ef01cSRoman Divacky      unsigned Digit = unsigned(Tmp.getRawData()[0]) & MaskAmt;
f22ef01cSRoman Divacky      Str.push_back(Digits[Digit]);
6bc11b14SDimitry Andric      Tmp.lshrInPlace(ShiftAmt);
f22ef01cSRoman Divacky    }
f22ef01cSRoman Divacky  } else {
5517e702SDimitry Andric    while (Tmp.getBoolValue()) {
d8866befSDimitry Andric      uint64_t Digit;
d8866befSDimitry Andric      udivrem(Tmp, Radix, Tmp, Digit);
f22ef01cSRoman Divacky      assert(Digit < Radix && "divide failed");
f22ef01cSRoman Divacky      Str.push_back(Digits[Digit]);
f22ef01cSRoman Divacky    }
f22ef01cSRoman Divacky  }
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  // Reverse the digits before returning.
f22ef01cSRoman Divacky  std::reverse(Str.begin()+StartDig, Str.end());
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
ff0cc061SDimitry Andric/// Returns the APInt as a std::string. Note that this is an inefficient method.
ff0cc061SDimitry Andric/// It is better to pass in a SmallVector/SmallString to the methods above.
f22ef01cSRoman Divackystd::string APInt::toString(unsigned Radix = 10, bool Signed = true) const {
f22ef01cSRoman Divacky  SmallString<40> S;
17a519f9SDimitry Andric  toString(S, Radix, Signed, /* formatAsCLiteral = */false);
f22ef01cSRoman Divacky  return S.str();
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
7a7e6055SDimitry Andric#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
3ca95b02SDimitry AndricLLVM_DUMP_METHOD void APInt::dump() const {
f22ef01cSRoman Divacky  SmallString<40> S, U;
f22ef01cSRoman Divacky  this->toStringUnsigned(U);
f22ef01cSRoman Divacky  this->toStringSigned(S);
f22ef01cSRoman Divacky  dbgs() << "APInt(" << BitWidth << "b, "
7a7e6055SDimitry Andric         << U << "u " << S << "s)\n";
f22ef01cSRoman Divacky}
7a7e6055SDimitry Andric#endif
f22ef01cSRoman Divacky
f22ef01cSRoman Divackyvoid APInt::print(raw_ostream &OS, bool isSigned) const {
f22ef01cSRoman Divacky  SmallString<40> S;
17a519f9SDimitry Andric  this->toString(S, 10, isSigned, /* formatAsCLiteral = */false);
ff0cc061SDimitry Andric  OS << S;
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky// This implements a variety of operations on a representation of
f22ef01cSRoman Divacky// arbitrary precision, two's-complement, bignum integer values.
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky// Assumed by lowHalf, highHalf, partMSB and partLSB.  A fairly safe
f22ef01cSRoman Divacky// and unrestricting assumption.
7a7e6055SDimitry Andricstatic_assert(APInt::APINT_BITS_PER_WORD % 2 == 0,
7a7e6055SDimitry Andric              "Part width must be divisible by 2!");
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky/* Some handy functions local to this file.  */
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky/* Returns the integer part with the least significant BITS set.
f22ef01cSRoman Divacky   BITS cannot be zero.  */
7a7e6055SDimitry Andricstatic inline APInt::WordType lowBitMask(unsigned bits) {
7a7e6055SDimitry Andric  assert(bits != 0 && bits <= APInt::APINT_BITS_PER_WORD);
f22ef01cSRoman Divacky
7a7e6055SDimitry Andric  return ~(APInt::WordType) 0 >> (APInt::APINT_BITS_PER_WORD - bits);
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky/* Returns the value of the lower half of PART.  */
7a7e6055SDimitry Andricstatic inline APInt::WordType lowHalf(APInt::WordType part) {
7a7e6055SDimitry Andric  return part & lowBitMask(APInt::APINT_BITS_PER_WORD / 2);
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky/* Returns the value of the upper half of PART.  */
7a7e6055SDimitry Andricstatic inline APInt::WordType highHalf(APInt::WordType part) {
7a7e6055SDimitry Andric  return part >> (APInt::APINT_BITS_PER_WORD / 2);
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky/* Returns the bit number of the most significant set bit of a part.
f22ef01cSRoman Divacky   If the input number has no bits set -1U is returned.  */
7a7e6055SDimitry Andricstatic unsigned partMSB(APInt::WordType value) {
f785676fSDimitry Andric  return findLastSet(value, ZB_Max);
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky/* Returns the bit number of the least significant set bit of a
f22ef01cSRoman Divacky   part.  If the input number has no bits set -1U is returned.  */
7a7e6055SDimitry Andricstatic unsigned partLSB(APInt::WordType value) {
f785676fSDimitry Andric  return findFirstSet(value, ZB_Max);
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky/* Sets the least significant part of a bignum to the input value, and
f22ef01cSRoman Divacky   zeroes out higher parts.  */
7a7e6055SDimitry Andricvoid APInt::tcSet(WordType *dst, WordType part, unsigned parts) {
f22ef01cSRoman Divacky  assert(parts > 0);
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  dst[0] = part;
7a7e6055SDimitry Andric  for (unsigned i = 1; i < parts; i++)
f22ef01cSRoman Divacky    dst[i] = 0;
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky/* Assign one bignum to another.  */
7a7e6055SDimitry Andricvoid APInt::tcAssign(WordType *dst, const WordType *src, unsigned parts) {
7a7e6055SDimitry Andric  for (unsigned i = 0; i < parts; i++)
f22ef01cSRoman Divacky    dst[i] = src[i];
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky/* Returns true if a bignum is zero, false otherwise.  */
7a7e6055SDimitry Andricbool APInt::tcIsZero(const WordType *src, unsigned parts) {
7a7e6055SDimitry Andric  for (unsigned i = 0; i < parts; i++)
f22ef01cSRoman Divacky    if (src[i])
f22ef01cSRoman Divacky      return false;
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  return true;
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky/* Extract the given bit of a bignum; returns 0 or 1.  */
7a7e6055SDimitry Andricint APInt::tcExtractBit(const WordType *parts, unsigned bit) {
7a7e6055SDimitry Andric  return (parts[whichWord(bit)] & maskBit(bit)) != 0;
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky/* Set the given bit of a bignum. */
7a7e6055SDimitry Andricvoid APInt::tcSetBit(WordType *parts, unsigned bit) {
7a7e6055SDimitry Andric  parts[whichWord(bit)] |= maskBit(bit);
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky/* Clears the given bit of a bignum. */
7a7e6055SDimitry Andricvoid APInt::tcClearBit(WordType *parts, unsigned bit) {
7a7e6055SDimitry Andric  parts[whichWord(bit)] &= ~maskBit(bit);
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky/* Returns the bit number of the least significant set bit of a
f22ef01cSRoman Divacky   number.  If the input number has no bits set -1U is returned.  */
7a7e6055SDimitry Andricunsigned APInt::tcLSB(const WordType *parts, unsigned n) {
7a7e6055SDimitry Andric  for (unsigned i = 0; i < n; i++) {
f22ef01cSRoman Divacky    if (parts[i] != 0) {
7a7e6055SDimitry Andric      unsigned lsb = partLSB(parts[i]);
f22ef01cSRoman Divacky
7a7e6055SDimitry Andric      return lsb + i * APINT_BITS_PER_WORD;
f22ef01cSRoman Divacky    }
f22ef01cSRoman Divacky  }
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  return -1U;
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky/* Returns the bit number of the most significant set bit of a number.
f22ef01cSRoman Divacky   If the input number has no bits set -1U is returned.  */
7a7e6055SDimitry Andricunsigned APInt::tcMSB(const WordType *parts, unsigned n) {
f22ef01cSRoman Divacky  do {
f22ef01cSRoman Divacky    --n;
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky    if (parts[n] != 0) {
7a7e6055SDimitry Andric      unsigned msb = partMSB(parts[n]);
f22ef01cSRoman Divacky
7a7e6055SDimitry Andric      return msb + n * APINT_BITS_PER_WORD;
f22ef01cSRoman Divacky    }
f22ef01cSRoman Divacky  } while (n);
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  return -1U;
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky/* Copy the bit vector of width srcBITS from SRC, starting at bit
f22ef01cSRoman Divacky   srcLSB, to DST, of dstCOUNT parts, such that the bit srcLSB becomes
f22ef01cSRoman Divacky   the least significant bit of DST.  All high bits above srcBITS in
f22ef01cSRoman Divacky   DST are zero-filled.  */
f22ef01cSRoman Divackyvoid
7a7e6055SDimitry AndricAPInt::tcExtract(WordType *dst, unsigned dstCount, const WordType *src,
7a7e6055SDimitry Andric                 unsigned srcBits, unsigned srcLSB) {
7a7e6055SDimitry Andric  unsigned dstParts = (srcBits + APINT_BITS_PER_WORD - 1) / APINT_BITS_PER_WORD;
f22ef01cSRoman Divacky  assert(dstParts <= dstCount);
f22ef01cSRoman Divacky
7a7e6055SDimitry Andric  unsigned firstSrcPart = srcLSB / APINT_BITS_PER_WORD;
f22ef01cSRoman Divacky  tcAssign (dst, src + firstSrcPart, dstParts);
f22ef01cSRoman Divacky
7a7e6055SDimitry Andric  unsigned shift = srcLSB % APINT_BITS_PER_WORD;
f22ef01cSRoman Divacky  tcShiftRight (dst, dstParts, shift);
f22ef01cSRoman Divacky
7a7e6055SDimitry Andric  /* We now have (dstParts * APINT_BITS_PER_WORD - shift) bits from SRC
f22ef01cSRoman Divacky     in DST.  If this is less that srcBits, append the rest, else
f22ef01cSRoman Divacky     clear the high bits.  */
7a7e6055SDimitry Andric  unsigned n = dstParts * APINT_BITS_PER_WORD - shift;
f22ef01cSRoman Divacky  if (n < srcBits) {
7a7e6055SDimitry Andric    WordType mask = lowBitMask (srcBits - n);
f22ef01cSRoman Divacky    dst[dstParts - 1] |= ((src[firstSrcPart + dstParts] & mask)
7a7e6055SDimitry Andric                          << n % APINT_BITS_PER_WORD);
f22ef01cSRoman Divacky  } else if (n > srcBits) {
7a7e6055SDimitry Andric    if (srcBits % APINT_BITS_PER_WORD)
7a7e6055SDimitry Andric      dst[dstParts - 1] &= lowBitMask (srcBits % APINT_BITS_PER_WORD);
f22ef01cSRoman Divacky  }
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  /* Clear high parts.  */
f22ef01cSRoman Divacky  while (dstParts < dstCount)
f22ef01cSRoman Divacky    dst[dstParts++] = 0;
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky/* DST += RHS + C where C is zero or one.  Returns the carry flag.  */
7a7e6055SDimitry AndricAPInt::WordType APInt::tcAdd(WordType *dst, const WordType *rhs,
7a7e6055SDimitry Andric                             WordType c, unsigned parts) {
f22ef01cSRoman Divacky  assert(c <= 1);
f22ef01cSRoman Divacky
7a7e6055SDimitry Andric  for (unsigned i = 0; i < parts; i++) {
7a7e6055SDimitry Andric    WordType l = dst[i];
f22ef01cSRoman Divacky    if (c) {
f22ef01cSRoman Divacky      dst[i] += rhs[i] + 1;
f22ef01cSRoman Divacky      c = (dst[i] <= l);
f22ef01cSRoman Divacky    } else {
f22ef01cSRoman Divacky      dst[i] += rhs[i];
f22ef01cSRoman Divacky      c = (dst[i] < l);
f22ef01cSRoman Divacky    }
f22ef01cSRoman Divacky  }
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  return c;
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
7a7e6055SDimitry Andric/// This function adds a single "word" integer, src, to the multiple
7a7e6055SDimitry Andric/// "word" integer array, dst[]. dst[] is modified to reflect the addition and
7a7e6055SDimitry Andric/// 1 is returned if there is a carry out, otherwise 0 is returned.
7a7e6055SDimitry Andric/// @returns the carry of the addition.
7a7e6055SDimitry AndricAPInt::WordType APInt::tcAddPart(WordType *dst, WordType src,
7a7e6055SDimitry Andric                                 unsigned parts) {
7a7e6055SDimitry Andric  for (unsigned i = 0; i < parts; ++i) {
7a7e6055SDimitry Andric    dst[i] += src;
7a7e6055SDimitry Andric    if (dst[i] >= src)
7a7e6055SDimitry Andric      return 0; // No need to carry so exit early.
7a7e6055SDimitry Andric    src = 1; // Carry one to next digit.
7a7e6055SDimitry Andric  }
f22ef01cSRoman Divacky
7a7e6055SDimitry Andric  return 1;
7a7e6055SDimitry Andric}
7a7e6055SDimitry Andric
7a7e6055SDimitry Andric/* DST -= RHS + C where C is zero or one.  Returns the carry flag.  */
7a7e6055SDimitry AndricAPInt::WordType APInt::tcSubtract(WordType *dst, const WordType *rhs,
7a7e6055SDimitry Andric                                  WordType c, unsigned parts) {
f22ef01cSRoman Divacky  assert(c <= 1);
f22ef01cSRoman Divacky
7a7e6055SDimitry Andric  for (unsigned i = 0; i < parts; i++) {
7a7e6055SDimitry Andric    WordType l = dst[i];
f22ef01cSRoman Divacky    if (c) {
f22ef01cSRoman Divacky      dst[i] -= rhs[i] + 1;
f22ef01cSRoman Divacky      c = (dst[i] >= l);
f22ef01cSRoman Divacky    } else {
f22ef01cSRoman Divacky      dst[i] -= rhs[i];
f22ef01cSRoman Divacky      c = (dst[i] > l);
f22ef01cSRoman Divacky    }
f22ef01cSRoman Divacky  }
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  return c;
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
7a7e6055SDimitry Andric/// This function subtracts a single "word" (64-bit word), src, from
7a7e6055SDimitry Andric/// the multi-word integer array, dst[], propagating the borrowed 1 value until
7a7e6055SDimitry Andric/// no further borrowing is needed or it runs out of "words" in dst.  The result
7a7e6055SDimitry Andric/// is 1 if "borrowing" exhausted the digits in dst, or 0 if dst was not
7a7e6055SDimitry Andric/// exhausted. In other words, if src > dst then this function returns 1,
7a7e6055SDimitry Andric/// otherwise 0.
7a7e6055SDimitry Andric/// @returns the borrow out of the subtraction
7a7e6055SDimitry AndricAPInt::WordType APInt::tcSubtractPart(WordType *dst, WordType src,
7a7e6055SDimitry Andric                                      unsigned parts) {
7a7e6055SDimitry Andric  for (unsigned i = 0; i < parts; ++i) {
7a7e6055SDimitry Andric    WordType Dst = dst[i];
7a7e6055SDimitry Andric    dst[i] -= src;
7a7e6055SDimitry Andric    if (src <= Dst)
7a7e6055SDimitry Andric      return 0; // No need to borrow so exit early.
7a7e6055SDimitry Andric    src = 1; // We have to "borrow 1" from next "word"
7a7e6055SDimitry Andric  }
7a7e6055SDimitry Andric
7a7e6055SDimitry Andric  return 1;
7a7e6055SDimitry Andric}
7a7e6055SDimitry Andric
f22ef01cSRoman Divacky/* Negate a bignum in-place.  */
7a7e6055SDimitry Andricvoid APInt::tcNegate(WordType *dst, unsigned parts) {
f22ef01cSRoman Divacky  tcComplement(dst, parts);
f22ef01cSRoman Divacky  tcIncrement(dst, parts);
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky/*  DST += SRC * MULTIPLIER + CARRY   if add is true
f22ef01cSRoman Divacky    DST  = SRC * MULTIPLIER + CARRY   if add is false
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky    Requires 0 <= DSTPARTS <= SRCPARTS + 1.  If DST overlaps SRC
f22ef01cSRoman Divacky    they must start at the same point, i.e. DST == SRC.
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky    If DSTPARTS == SRCPARTS + 1 no overflow occurs and zero is
f22ef01cSRoman Divacky    returned.  Otherwise DST is filled with the least significant
f22ef01cSRoman Divacky    DSTPARTS parts of the result, and if all of the omitted higher
f22ef01cSRoman Divacky    parts were zero return zero, otherwise overflow occurred and
f22ef01cSRoman Divacky    return one.  */
7a7e6055SDimitry Andricint APInt::tcMultiplyPart(WordType *dst, const WordType *src,
7a7e6055SDimitry Andric                          WordType multiplier, WordType carry,
7a7e6055SDimitry Andric                          unsigned srcParts, unsigned dstParts,
7a7e6055SDimitry Andric                          bool add) {
f22ef01cSRoman Divacky  /* Otherwise our writes of DST kill our later reads of SRC.  */
f22ef01cSRoman Divacky  assert(dst <= src || dst >= src + srcParts);
f22ef01cSRoman Divacky  assert(dstParts <= srcParts + 1);
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  /* N loops; minimum of dstParts and srcParts.  */
0f5676f4SDimitry Andric  unsigned n = std::min(dstParts, srcParts);
f22ef01cSRoman Divacky
0f5676f4SDimitry Andric  for (unsigned i = 0; i < n; i++) {
7a7e6055SDimitry Andric    WordType low, mid, high, srcPart;
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky      /* [ LOW, HIGH ] = MULTIPLIER * SRC[i] + DST[i] + CARRY.
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky         This cannot overflow, because
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky         (n - 1) * (n - 1) + 2 (n - 1) = (n - 1) * (n + 1)
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky         which is less than n^2.  */
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky    srcPart = src[i];
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky    if (multiplier == 0 || srcPart == 0) {
f22ef01cSRoman Divacky      low = carry;
f22ef01cSRoman Divacky      high = 0;
f22ef01cSRoman Divacky    } else {
f22ef01cSRoman Divacky      low = lowHalf(srcPart) * lowHalf(multiplier);
f22ef01cSRoman Divacky      high = highHalf(srcPart) * highHalf(multiplier);
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky      mid = lowHalf(srcPart) * highHalf(multiplier);
f22ef01cSRoman Divacky      high += highHalf(mid);
7a7e6055SDimitry Andric      mid <<= APINT_BITS_PER_WORD / 2;
f22ef01cSRoman Divacky      if (low + mid < low)
f22ef01cSRoman Divacky        high++;
f22ef01cSRoman Divacky      low += mid;
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky      mid = highHalf(srcPart) * lowHalf(multiplier);
f22ef01cSRoman Divacky      high += highHalf(mid);
7a7e6055SDimitry Andric      mid <<= APINT_BITS_PER_WORD / 2;
f22ef01cSRoman Divacky      if (low + mid < low)
f22ef01cSRoman Divacky        high++;
f22ef01cSRoman Divacky      low += mid;
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky      /* Now add carry.  */
f22ef01cSRoman Divacky      if (low + carry < low)
f22ef01cSRoman Divacky        high++;
f22ef01cSRoman Divacky      low += carry;
f22ef01cSRoman Divacky    }
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky    if (add) {
f22ef01cSRoman Divacky      /* And now DST[i], and store the new low part there.  */
f22ef01cSRoman Divacky      if (low + dst[i] < low)
f22ef01cSRoman Divacky        high++;
f22ef01cSRoman Divacky      dst[i] += low;
f22ef01cSRoman Divacky    } else
f22ef01cSRoman Divacky      dst[i] = low;
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky    carry = high;
f22ef01cSRoman Divacky  }
f22ef01cSRoman Divacky
0f5676f4SDimitry Andric  if (srcParts < dstParts) {
f22ef01cSRoman Divacky    /* Full multiplication, there is no overflow.  */
0f5676f4SDimitry Andric    assert(srcParts + 1 == dstParts);
0f5676f4SDimitry Andric    dst[srcParts] = carry;
f22ef01cSRoman Divacky    return 0;
0f5676f4SDimitry Andric  }
0f5676f4SDimitry Andric
f22ef01cSRoman Divacky  /* We overflowed if there is carry.  */
f22ef01cSRoman Divacky  if (carry)
f22ef01cSRoman Divacky    return 1;
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  /* We would overflow if any significant unwritten parts would be
f22ef01cSRoman Divacky     non-zero.  This is true if any remaining src parts are non-zero
f22ef01cSRoman Divacky     and the multiplier is non-zero.  */
f22ef01cSRoman Divacky  if (multiplier)
0f5676f4SDimitry Andric    for (unsigned i = dstParts; i < srcParts; i++)
f22ef01cSRoman Divacky      if (src[i])
f22ef01cSRoman Divacky        return 1;
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  /* We fitted in the narrow destination.  */
f22ef01cSRoman Divacky  return 0;
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky/* DST = LHS * RHS, where DST has the same width as the operands and
f22ef01cSRoman Divacky   is filled with the least significant parts of the result.  Returns
f22ef01cSRoman Divacky   one if overflow occurred, otherwise zero.  DST must be disjoint
f22ef01cSRoman Divacky   from both operands.  */
7a7e6055SDimitry Andricint APInt::tcMultiply(WordType *dst, const WordType *lhs,
7a7e6055SDimitry Andric                      const WordType *rhs, unsigned parts) {
f22ef01cSRoman Divacky  assert(dst != lhs && dst != rhs);
f22ef01cSRoman Divacky
7a7e6055SDimitry Andric  int overflow = 0;
f22ef01cSRoman Divacky  tcSet(dst, 0, parts);
f22ef01cSRoman Divacky
7a7e6055SDimitry Andric  for (unsigned i = 0; i < parts; i++)
f22ef01cSRoman Divacky    overflow |= tcMultiplyPart(&dst[i], lhs, rhs[i], 0, parts,
f22ef01cSRoman Divacky                               parts - i, true);
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  return overflow;
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
5517e702SDimitry Andric/// DST = LHS * RHS, where DST has width the sum of the widths of the
5517e702SDimitry Andric/// operands. No overflow occurs. DST must be disjoint from both operands.
5517e702SDimitry Andricvoid APInt::tcFullMultiply(WordType *dst, const WordType *lhs,
7a7e6055SDimitry Andric                           const WordType *rhs, unsigned lhsParts,
7a7e6055SDimitry Andric                           unsigned rhsParts) {
f22ef01cSRoman Divacky  /* Put the narrower number on the LHS for less loops below.  */
0f5676f4SDimitry Andric  if (lhsParts > rhsParts)
f22ef01cSRoman Divacky    return tcFullMultiply (dst, rhs, lhs, rhsParts, lhsParts);
0f5676f4SDimitry Andric
f22ef01cSRoman Divacky  assert(dst != lhs && dst != rhs);
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  tcSet(dst, 0, rhsParts);
f22ef01cSRoman Divacky
7a7e6055SDimitry Andric  for (unsigned i = 0; i < lhsParts; i++)
7a7e6055SDimitry Andric    tcMultiplyPart(&dst[i], rhs, lhs[i], 0, rhsParts, rhsParts + 1, true);
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky/* If RHS is zero LHS and REMAINDER are left unchanged, return one.
f22ef01cSRoman Divacky   Otherwise set LHS to LHS / RHS with the fractional part discarded,
f22ef01cSRoman Divacky   set REMAINDER to the remainder, return zero.  i.e.
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky   OLD_LHS = RHS * LHS + REMAINDER
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky   SCRATCH is a bignum of the same size as the operands and result for
f22ef01cSRoman Divacky   use by the routine; its contents need not be initialized and are
f22ef01cSRoman Divacky   destroyed.  LHS, REMAINDER and SCRATCH must be distinct.
f22ef01cSRoman Divacky*/
7a7e6055SDimitry Andricint APInt::tcDivide(WordType *lhs, const WordType *rhs,
7a7e6055SDimitry Andric                    WordType *remainder, WordType *srhs,
7a7e6055SDimitry Andric                    unsigned parts) {
f22ef01cSRoman Divacky  assert(lhs != remainder && lhs != srhs && remainder != srhs);
f22ef01cSRoman Divacky
7a7e6055SDimitry Andric  unsigned shiftCount = tcMSB(rhs, parts) + 1;
f22ef01cSRoman Divacky  if (shiftCount == 0)
f22ef01cSRoman Divacky    return true;
f22ef01cSRoman Divacky
7a7e6055SDimitry Andric  shiftCount = parts * APINT_BITS_PER_WORD - shiftCount;
7a7e6055SDimitry Andric  unsigned n = shiftCount / APINT_BITS_PER_WORD;
7a7e6055SDimitry Andric  WordType mask = (WordType) 1 << (shiftCount % APINT_BITS_PER_WORD);
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  tcAssign(srhs, rhs, parts);
f22ef01cSRoman Divacky  tcShiftLeft(srhs, parts, shiftCount);
f22ef01cSRoman Divacky  tcAssign(remainder, lhs, parts);
f22ef01cSRoman Divacky  tcSet(lhs, 0, parts);
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  /* Loop, subtracting SRHS if REMAINDER is greater and adding that to
f22ef01cSRoman Divacky     the total.  */
f22ef01cSRoman Divacky  for (;;) {
5517e702SDimitry Andric    int compare = tcCompare(remainder, srhs, parts);
f22ef01cSRoman Divacky    if (compare >= 0) {
f22ef01cSRoman Divacky      tcSubtract(remainder, srhs, 0, parts);
f22ef01cSRoman Divacky      lhs[n] |= mask;
f22ef01cSRoman Divacky    }
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky    if (shiftCount == 0)
f22ef01cSRoman Divacky      break;
f22ef01cSRoman Divacky    shiftCount--;
f22ef01cSRoman Divacky    tcShiftRight(srhs, parts, 1);
3ca95b02SDimitry Andric    if ((mask >>= 1) == 0) {
7a7e6055SDimitry Andric      mask = (WordType) 1 << (APINT_BITS_PER_WORD - 1);
3ca95b02SDimitry Andric      n--;
3ca95b02SDimitry Andric    }
f22ef01cSRoman Divacky  }
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  return false;
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
6bc11b14SDimitry Andric/// Shift a bignum left Cound bits in-place. Shifted in bits are zero. There are
6bc11b14SDimitry Andric/// no restrictions on Count.
6bc11b14SDimitry Andricvoid APInt::tcShiftLeft(WordType *Dst, unsigned Words, unsigned Count) {
6bc11b14SDimitry Andric  // Don't bother performing a no-op shift.
6bc11b14SDimitry Andric  if (!Count)
6bc11b14SDimitry Andric    return;
f22ef01cSRoman Divacky
51690af2SDimitry Andric  // WordShift is the inter-part shift; BitShift is the intra-part shift.
6bc11b14SDimitry Andric  unsigned WordShift = std::min(Count / APINT_BITS_PER_WORD, Words);
6bc11b14SDimitry Andric  unsigned BitShift = Count % APINT_BITS_PER_WORD;
f22ef01cSRoman Divacky
6bc11b14SDimitry Andric  // Fastpath for moving by whole words.
6bc11b14SDimitry Andric  if (BitShift == 0) {
6bc11b14SDimitry Andric    std::memmove(Dst + WordShift, Dst, (Words - WordShift) * APINT_WORD_SIZE);
f22ef01cSRoman Divacky  } else {
6bc11b14SDimitry Andric    while (Words-- > WordShift) {
6bc11b14SDimitry Andric      Dst[Words] = Dst[Words - WordShift] << BitShift;
6bc11b14SDimitry Andric      if (Words > WordShift)
6bc11b14SDimitry Andric        Dst[Words] |=
6bc11b14SDimitry Andric          Dst[Words - WordShift - 1] >> (APINT_BITS_PER_WORD - BitShift);
f22ef01cSRoman Divacky    }
f22ef01cSRoman Divacky  }
f22ef01cSRoman Divacky
6bc11b14SDimitry Andric  // Fill in the remainder with 0s.
6bc11b14SDimitry Andric  std::memset(Dst, 0, WordShift * APINT_WORD_SIZE);
6bc11b14SDimitry Andric}
6bc11b14SDimitry Andric
6bc11b14SDimitry Andric/// Shift a bignum right Count bits in-place. Shifted in bits are zero. There
6bc11b14SDimitry Andric/// are no restrictions on Count.
6bc11b14SDimitry Andricvoid APInt::tcShiftRight(WordType *Dst, unsigned Words, unsigned Count) {
6bc11b14SDimitry Andric  // Don't bother performing a no-op shift.
6bc11b14SDimitry Andric  if (!Count)
6bc11b14SDimitry Andric    return;
6bc11b14SDimitry Andric
51690af2SDimitry Andric  // WordShift is the inter-part shift; BitShift is the intra-part shift.
6bc11b14SDimitry Andric  unsigned WordShift = std::min(Count / APINT_BITS_PER_WORD, Words);
6bc11b14SDimitry Andric  unsigned BitShift = Count % APINT_BITS_PER_WORD;
6bc11b14SDimitry Andric
6bc11b14SDimitry Andric  unsigned WordsToMove = Words - WordShift;
6bc11b14SDimitry Andric  // Fastpath for moving by whole words.
6bc11b14SDimitry Andric  if (BitShift == 0) {
6bc11b14SDimitry Andric    std::memmove(Dst, Dst + WordShift, WordsToMove * APINT_WORD_SIZE);
6bc11b14SDimitry Andric  } else {
6bc11b14SDimitry Andric    for (unsigned i = 0; i != WordsToMove; ++i) {
6bc11b14SDimitry Andric      Dst[i] = Dst[i + WordShift] >> BitShift;
6bc11b14SDimitry Andric      if (i + 1 != WordsToMove)
6bc11b14SDimitry Andric        Dst[i] |= Dst[i + WordShift + 1] << (APINT_BITS_PER_WORD - BitShift);
f22ef01cSRoman Divacky    }
f22ef01cSRoman Divacky  }
6bc11b14SDimitry Andric
6bc11b14SDimitry Andric  // Fill in the remainder with 0s.
6bc11b14SDimitry Andric  std::memset(Dst + WordsToMove, 0, WordShift * APINT_WORD_SIZE);
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky/* Bitwise and of two bignums.  */
7a7e6055SDimitry Andricvoid APInt::tcAnd(WordType *dst, const WordType *rhs, unsigned parts) {
7a7e6055SDimitry Andric  for (unsigned i = 0; i < parts; i++)
f22ef01cSRoman Divacky    dst[i] &= rhs[i];
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky/* Bitwise inclusive or of two bignums.  */
7a7e6055SDimitry Andricvoid APInt::tcOr(WordType *dst, const WordType *rhs, unsigned parts) {
7a7e6055SDimitry Andric  for (unsigned i = 0; i < parts; i++)
f22ef01cSRoman Divacky    dst[i] |= rhs[i];
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky/* Bitwise exclusive or of two bignums.  */
7a7e6055SDimitry Andricvoid APInt::tcXor(WordType *dst, const WordType *rhs, unsigned parts) {
7a7e6055SDimitry Andric  for (unsigned i = 0; i < parts; i++)
f22ef01cSRoman Divacky    dst[i] ^= rhs[i];
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky/* Complement a bignum in-place.  */
7a7e6055SDimitry Andricvoid APInt::tcComplement(WordType *dst, unsigned parts) {
7a7e6055SDimitry Andric  for (unsigned i = 0; i < parts; i++)
f22ef01cSRoman Divacky    dst[i] = ~dst[i];
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky/* Comparison (unsigned) of two bignums.  */
7a7e6055SDimitry Andricint APInt::tcCompare(const WordType *lhs, const WordType *rhs,
7a7e6055SDimitry Andric                     unsigned parts) {
f22ef01cSRoman Divacky  while (parts) {
f22ef01cSRoman Divacky    parts--;
51690af2SDimitry Andric    if (lhs[parts] != rhs[parts])
7a7e6055SDimitry Andric      return (lhs[parts] > rhs[parts]) ? 1 : -1;
f22ef01cSRoman Divacky  }
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  return 0;
f22ef01cSRoman Divacky}
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky/* Set the least significant BITS bits of a bignum, clear the
f22ef01cSRoman Divacky   rest.  */
7a7e6055SDimitry Andricvoid APInt::tcSetLeastSignificantBits(WordType *dst, unsigned parts,
7a7e6055SDimitry Andric                                      unsigned bits) {
7a7e6055SDimitry Andric  unsigned i = 0;
7a7e6055SDimitry Andric  while (bits > APINT_BITS_PER_WORD) {
7a7e6055SDimitry Andric    dst[i++] = ~(WordType) 0;
7a7e6055SDimitry Andric    bits -= APINT_BITS_PER_WORD;
f22ef01cSRoman Divacky  }
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  if (bits)
7a7e6055SDimitry Andric    dst[i++] = ~(WordType) 0 >> (APINT_BITS_PER_WORD - bits);
f22ef01cSRoman Divacky
f22ef01cSRoman Divacky  while (i < parts)
f22ef01cSRoman Divacky    dst[i++] = 0;
f22ef01cSRoman Divacky}
4ba319b5SDimitry Andric
4ba319b5SDimitry AndricAPInt llvm::APIntOps::RoundingUDiv(const APInt &A, const APInt &B,
4ba319b5SDimitry Andric                                   APInt::Rounding RM) {
4ba319b5SDimitry Andric  // Currently udivrem always rounds down.
4ba319b5SDimitry Andric  switch (RM) {
4ba319b5SDimitry Andric  case APInt::Rounding::DOWN:
4ba319b5SDimitry Andric  case APInt::Rounding::TOWARD_ZERO:
4ba319b5SDimitry Andric    return A.udiv(B);
4ba319b5SDimitry Andric  case APInt::Rounding::UP: {
4ba319b5SDimitry Andric    APInt Quo, Rem;
4ba319b5SDimitry Andric    APInt::udivrem(A, B, Quo, Rem);
4ba319b5SDimitry Andric    if (Rem == 0)
4ba319b5SDimitry Andric      return Quo;
4ba319b5SDimitry Andric    return Quo + 1;
4ba319b5SDimitry Andric  }
4ba319b5SDimitry Andric  }
4ba319b5SDimitry Andric  llvm_unreachable("Unknown APInt::Rounding enum");
4ba319b5SDimitry Andric}
4ba319b5SDimitry Andric
4ba319b5SDimitry AndricAPInt llvm::APIntOps::RoundingSDiv(const APInt &A, const APInt &B,
4ba319b5SDimitry Andric                                   APInt::Rounding RM) {
4ba319b5SDimitry Andric  switch (RM) {
4ba319b5SDimitry Andric  case APInt::Rounding::DOWN:
4ba319b5SDimitry Andric  case APInt::Rounding::UP: {
4ba319b5SDimitry Andric    APInt Quo, Rem;
4ba319b5SDimitry Andric    APInt::sdivrem(A, B, Quo, Rem);
4ba319b5SDimitry Andric    if (Rem == 0)
4ba319b5SDimitry Andric      return Quo;
4ba319b5SDimitry Andric    // This algorithm deals with arbitrary rounding mode used by sdivrem.
4ba319b5SDimitry Andric    // We want to check whether the non-integer part of the mathematical value
4ba319b5SDimitry Andric    // is negative or not. If the non-integer part is negative, we need to round
4ba319b5SDimitry Andric    // down from Quo; otherwise, if it's positive or 0, we return Quo, as it's
4ba319b5SDimitry Andric    // already rounded down.
4ba319b5SDimitry Andric    if (RM == APInt::Rounding::DOWN) {
4ba319b5SDimitry Andric      if (Rem.isNegative() != B.isNegative())
4ba319b5SDimitry Andric        return Quo - 1;
4ba319b5SDimitry Andric      return Quo;
4ba319b5SDimitry Andric    }
4ba319b5SDimitry Andric    if (Rem.isNegative() != B.isNegative())
4ba319b5SDimitry Andric      return Quo;
4ba319b5SDimitry Andric    return Quo + 1;
4ba319b5SDimitry Andric  }
4ba319b5SDimitry Andric  // Currently sdiv rounds twards zero.
4ba319b5SDimitry Andric  case APInt::Rounding::TOWARD_ZERO:
4ba319b5SDimitry Andric    return A.sdiv(B);
4ba319b5SDimitry Andric  }
4ba319b5SDimitry Andric  llvm_unreachable("Unknown APInt::Rounding enum");
4ba319b5SDimitry Andric}
*b5893f02SDimitry Andric
*b5893f02SDimitry AndricOptional<APInt>
*b5893f02SDimitry Andricllvm::APIntOps::SolveQuadraticEquationWrap(APInt A, APInt B, APInt C,
*b5893f02SDimitry Andric                                           unsigned RangeWidth) {
*b5893f02SDimitry Andric  unsigned CoeffWidth = A.getBitWidth();
*b5893f02SDimitry Andric  assert(CoeffWidth == B.getBitWidth() && CoeffWidth == C.getBitWidth());
*b5893f02SDimitry Andric  assert(RangeWidth <= CoeffWidth &&
*b5893f02SDimitry Andric         "Value range width should be less than coefficient width");
*b5893f02SDimitry Andric  assert(RangeWidth > 1 && "Value range bit width should be > 1");
*b5893f02SDimitry Andric
*b5893f02SDimitry Andric  LLVM_DEBUG(dbgs() << __func__ << ": solving " << A << "x^2 + " << B
*b5893f02SDimitry Andric                    << "x + " << C << ", rw:" << RangeWidth << '\n');
*b5893f02SDimitry Andric
*b5893f02SDimitry Andric  // Identify 0 as a (non)solution immediately.
*b5893f02SDimitry Andric  if (C.sextOrTrunc(RangeWidth).isNullValue() ) {
*b5893f02SDimitry Andric    LLVM_DEBUG(dbgs() << __func__ << ": zero solution\n");
*b5893f02SDimitry Andric    return APInt(CoeffWidth, 0);
*b5893f02SDimitry Andric  }
*b5893f02SDimitry Andric
*b5893f02SDimitry Andric  // The result of APInt arithmetic has the same bit width as the operands,
*b5893f02SDimitry Andric  // so it can actually lose high bits. A product of two n-bit integers needs
*b5893f02SDimitry Andric  // 2n-1 bits to represent the full value.
*b5893f02SDimitry Andric  // The operation done below (on quadratic coefficients) that can produce
*b5893f02SDimitry Andric  // the largest value is the evaluation of the equation during bisection,
*b5893f02SDimitry Andric  // which needs 3 times the bitwidth of the coefficient, so the total number
*b5893f02SDimitry Andric  // of required bits is 3n.
*b5893f02SDimitry Andric  //
*b5893f02SDimitry Andric  // The purpose of this extension is to simulate the set Z of all integers,
*b5893f02SDimitry Andric  // where n+1 > n for all n in Z. In Z it makes sense to talk about positive
*b5893f02SDimitry Andric  // and negative numbers (not so much in a modulo arithmetic). The method
*b5893f02SDimitry Andric  // used to solve the equation is based on the standard formula for real
*b5893f02SDimitry Andric  // numbers, and uses the concepts of "positive" and "negative" with their
*b5893f02SDimitry Andric  // usual meanings.
*b5893f02SDimitry Andric  CoeffWidth *= 3;
*b5893f02SDimitry Andric  A = A.sext(CoeffWidth);
*b5893f02SDimitry Andric  B = B.sext(CoeffWidth);
*b5893f02SDimitry Andric  C = C.sext(CoeffWidth);
*b5893f02SDimitry Andric
*b5893f02SDimitry Andric  // Make A > 0 for simplicity. Negate cannot overflow at this point because
*b5893f02SDimitry Andric  // the bit width has increased.
*b5893f02SDimitry Andric  if (A.isNegative()) {
*b5893f02SDimitry Andric    A.negate();
*b5893f02SDimitry Andric    B.negate();
*b5893f02SDimitry Andric    C.negate();
*b5893f02SDimitry Andric  }
*b5893f02SDimitry Andric
*b5893f02SDimitry Andric  // Solving an equation q(x) = 0 with coefficients in modular arithmetic
*b5893f02SDimitry Andric  // is really solving a set of equations q(x) = kR for k = 0, 1, 2, ...,
*b5893f02SDimitry Andric  // and R = 2^BitWidth.
*b5893f02SDimitry Andric  // Since we're trying not only to find exact solutions, but also values
*b5893f02SDimitry Andric  // that "wrap around", such a set will always have a solution, i.e. an x
*b5893f02SDimitry Andric  // that satisfies at least one of the equations, or such that |q(x)|
*b5893f02SDimitry Andric  // exceeds kR, while |q(x-1)| for the same k does not.
*b5893f02SDimitry Andric  //
*b5893f02SDimitry Andric  // We need to find a value k, such that Ax^2 + Bx + C = kR will have a
*b5893f02SDimitry Andric  // positive solution n (in the above sense), and also such that the n
*b5893f02SDimitry Andric  // will be the least among all solutions corresponding to k = 0, 1, ...
*b5893f02SDimitry Andric  // (more precisely, the least element in the set
*b5893f02SDimitry Andric  //   { n(k) | k is such that a solution n(k) exists }).
*b5893f02SDimitry Andric  //
*b5893f02SDimitry Andric  // Consider the parabola (over real numbers) that corresponds to the
*b5893f02SDimitry Andric  // quadratic equation. Since A > 0, the arms of the parabola will point
*b5893f02SDimitry Andric  // up. Picking different values of k will shift it up and down by R.
*b5893f02SDimitry Andric  //
*b5893f02SDimitry Andric  // We want to shift the parabola in such a way as to reduce the problem
*b5893f02SDimitry Andric  // of solving q(x) = kR to solving shifted_q(x) = 0.
*b5893f02SDimitry Andric  // (The interesting solutions are the ceilings of the real number
*b5893f02SDimitry Andric  // solutions.)
*b5893f02SDimitry Andric  APInt R = APInt::getOneBitSet(CoeffWidth, RangeWidth);
*b5893f02SDimitry Andric  APInt TwoA = 2 * A;
*b5893f02SDimitry Andric  APInt SqrB = B * B;
*b5893f02SDimitry Andric  bool PickLow;
*b5893f02SDimitry Andric
*b5893f02SDimitry Andric  auto RoundUp = [] (const APInt &V, const APInt &A) -> APInt {
*b5893f02SDimitry Andric    assert(A.isStrictlyPositive());
*b5893f02SDimitry Andric    APInt T = V.abs().urem(A);
*b5893f02SDimitry Andric    if (T.isNullValue())
*b5893f02SDimitry Andric      return V;
*b5893f02SDimitry Andric    return V.isNegative() ? V+T : V+(A-T);
*b5893f02SDimitry Andric  };
*b5893f02SDimitry Andric
*b5893f02SDimitry Andric  // The vertex of the parabola is at -B/2A, but since A > 0, it's negative
*b5893f02SDimitry Andric  // iff B is positive.
*b5893f02SDimitry Andric  if (B.isNonNegative()) {
*b5893f02SDimitry Andric    // If B >= 0, the vertex it at a negative location (or at 0), so in
*b5893f02SDimitry Andric    // order to have a non-negative solution we need to pick k that makes
*b5893f02SDimitry Andric    // C-kR negative. To satisfy all the requirements for the solution
*b5893f02SDimitry Andric    // that we are looking for, it needs to be closest to 0 of all k.
*b5893f02SDimitry Andric    C = C.srem(R);
*b5893f02SDimitry Andric    if (C.isStrictlyPositive())
*b5893f02SDimitry Andric      C -= R;
*b5893f02SDimitry Andric    // Pick the greater solution.
*b5893f02SDimitry Andric    PickLow = false;
*b5893f02SDimitry Andric  } else {
*b5893f02SDimitry Andric    // If B < 0, the vertex is at a positive location. For any solution
*b5893f02SDimitry Andric    // to exist, the discriminant must be non-negative. This means that
*b5893f02SDimitry Andric    // C-kR <= B^2/4A is a necessary condition for k, i.e. there is a
*b5893f02SDimitry Andric    // lower bound on values of k: kR >= C - B^2/4A.
*b5893f02SDimitry Andric    APInt LowkR = C - SqrB.udiv(2*TwoA); // udiv because all values > 0.
*b5893f02SDimitry Andric    // Round LowkR up (towards +inf) to the nearest kR.
*b5893f02SDimitry Andric    LowkR = RoundUp(LowkR, R);
*b5893f02SDimitry Andric
*b5893f02SDimitry Andric    // If there exists k meeting the condition above, and such that
*b5893f02SDimitry Andric    // C-kR > 0, there will be two positive real number solutions of
*b5893f02SDimitry Andric    // q(x) = kR. Out of all such values of k, pick the one that makes
*b5893f02SDimitry Andric    // C-kR closest to 0, (i.e. pick maximum k such that C-kR > 0).
*b5893f02SDimitry Andric    // In other words, find maximum k such that LowkR <= kR < C.
*b5893f02SDimitry Andric    if (C.sgt(LowkR)) {
*b5893f02SDimitry Andric      // If LowkR < C, then such a k is guaranteed to exist because
*b5893f02SDimitry Andric      // LowkR itself is a multiple of R.
*b5893f02SDimitry Andric      C -= -RoundUp(-C, R);      // C = C - RoundDown(C, R)
*b5893f02SDimitry Andric      // Pick the smaller solution.
*b5893f02SDimitry Andric      PickLow = true;
*b5893f02SDimitry Andric    } else {
*b5893f02SDimitry Andric      // If C-kR < 0 for all potential k's, it means that one solution
*b5893f02SDimitry Andric      // will be negative, while the other will be positive. The positive
*b5893f02SDimitry Andric      // solution will shift towards 0 if the parabola is moved up.
*b5893f02SDimitry Andric      // Pick the kR closest to the lower bound (i.e. make C-kR closest
*b5893f02SDimitry Andric      // to 0, or in other words, out of all parabolas that have solutions,
*b5893f02SDimitry Andric      // pick the one that is the farthest "up").
*b5893f02SDimitry Andric      // Since LowkR is itself a multiple of R, simply take C-LowkR.
*b5893f02SDimitry Andric      C -= LowkR;
*b5893f02SDimitry Andric      // Pick the greater solution.
*b5893f02SDimitry Andric      PickLow = false;
*b5893f02SDimitry Andric    }
*b5893f02SDimitry Andric  }
*b5893f02SDimitry Andric
*b5893f02SDimitry Andric  LLVM_DEBUG(dbgs() << __func__ << ": updated coefficients " << A << "x^2 + "
*b5893f02SDimitry Andric                    << B << "x + " << C << ", rw:" << RangeWidth << '\n');
*b5893f02SDimitry Andric
*b5893f02SDimitry Andric  APInt D = SqrB - 4*A*C;
*b5893f02SDimitry Andric  assert(D.isNonNegative() && "Negative discriminant");
*b5893f02SDimitry Andric  APInt SQ = D.sqrt();
*b5893f02SDimitry Andric
*b5893f02SDimitry Andric  APInt Q = SQ * SQ;
*b5893f02SDimitry Andric  bool InexactSQ = Q != D;
*b5893f02SDimitry Andric  // The calculated SQ may actually be greater than the exact (non-integer)
*b5893f02SDimitry Andric  // value. If that's the case, decremement SQ to get a value that is lower.
*b5893f02SDimitry Andric  if (Q.sgt(D))
*b5893f02SDimitry Andric    SQ -= 1;
*b5893f02SDimitry Andric
*b5893f02SDimitry Andric  APInt X;
*b5893f02SDimitry Andric  APInt Rem;
*b5893f02SDimitry Andric
*b5893f02SDimitry Andric  // SQ is rounded down (i.e SQ * SQ <= D), so the roots may be inexact.
*b5893f02SDimitry Andric  // When using the quadratic formula directly, the calculated low root
*b5893f02SDimitry Andric  // may be greater than the exact one, since we would be subtracting SQ.
*b5893f02SDimitry Andric  // To make sure that the calculated root is not greater than the exact
*b5893f02SDimitry Andric  // one, subtract SQ+1 when calculating the low root (for inexact value
*b5893f02SDimitry Andric  // of SQ).
*b5893f02SDimitry Andric  if (PickLow)
*b5893f02SDimitry Andric    APInt::sdivrem(-B - (SQ+InexactSQ), TwoA, X, Rem);
*b5893f02SDimitry Andric  else
*b5893f02SDimitry Andric    APInt::sdivrem(-B + SQ, TwoA, X, Rem);
*b5893f02SDimitry Andric
*b5893f02SDimitry Andric  // The updated coefficients should be such that the (exact) solution is
*b5893f02SDimitry Andric  // positive. Since APInt division rounds towards 0, the calculated one
*b5893f02SDimitry Andric  // can be 0, but cannot be negative.
*b5893f02SDimitry Andric  assert(X.isNonNegative() && "Solution should be non-negative");
*b5893f02SDimitry Andric
*b5893f02SDimitry Andric  if (!InexactSQ && Rem.isNullValue()) {
*b5893f02SDimitry Andric    LLVM_DEBUG(dbgs() << __func__ << ": solution (root): " << X << '\n');
*b5893f02SDimitry Andric    return X;
*b5893f02SDimitry Andric  }
*b5893f02SDimitry Andric
*b5893f02SDimitry Andric  assert((SQ*SQ).sle(D) && "SQ = |_sqrt(D)_|, so SQ*SQ <= D");
*b5893f02SDimitry Andric  // The exact value of the square root of D should be between SQ and SQ+1.
*b5893f02SDimitry Andric  // This implies that the solution should be between that corresponding to
*b5893f02SDimitry Andric  // SQ (i.e. X) and that corresponding to SQ+1.
*b5893f02SDimitry Andric  //
*b5893f02SDimitry Andric  // The calculated X cannot be greater than the exact (real) solution.
*b5893f02SDimitry Andric  // Actually it must be strictly less than the exact solution, while
*b5893f02SDimitry Andric  // X+1 will be greater than or equal to it.
*b5893f02SDimitry Andric
*b5893f02SDimitry Andric  APInt VX = (A*X + B)*X + C;
*b5893f02SDimitry Andric  APInt VY = VX + TwoA*X + A + B;
*b5893f02SDimitry Andric  bool SignChange = VX.isNegative() != VY.isNegative() ||
*b5893f02SDimitry Andric                    VX.isNullValue() != VY.isNullValue();
*b5893f02SDimitry Andric  // If the sign did not change between X and X+1, X is not a valid solution.
*b5893f02SDimitry Andric  // This could happen when the actual (exact) roots don't have an integer
*b5893f02SDimitry Andric  // between them, so they would both be contained between X and X+1.
*b5893f02SDimitry Andric  if (!SignChange) {
*b5893f02SDimitry Andric    LLVM_DEBUG(dbgs() << __func__ << ": no valid solution\n");
*b5893f02SDimitry Andric    return None;
*b5893f02SDimitry Andric  }
*b5893f02SDimitry Andric
*b5893f02SDimitry Andric  X += 1;
*b5893f02SDimitry Andric  LLVM_DEBUG(dbgs() << __func__ << ": solution (wrap): " << X << '\n');
*b5893f02SDimitry Andric  return X;
*b5893f02SDimitry Andric}