lib/Support/APInt.cpp

193323Sed//===-- APInt.cpp - Implement APInt class ---------------------------------===//
193323Sed//
193323Sed//                     The LLVM Compiler Infrastructure
193323Sed//
193323Sed// This file is distributed under the University of Illinois Open Source
193323Sed// License. See LICENSE.TXT for details.
193323Sed//
193323Sed//===----------------------------------------------------------------------===//
193323Sed//
193323Sed// This file implements a class to represent arbitrary precision integer
193323Sed// constant values and provide a variety of arithmetic operations on them.
193323Sed//
193323Sed//===----------------------------------------------------------------------===//
193323Sed
193323Sed#define DEBUG_TYPE "apint"
193323Sed#include "llvm/ADT/APInt.h"
193323Sed#include "llvm/ADT/FoldingSet.h"
234353Sdim#include "llvm/ADT/Hashing.h"
193323Sed#include "llvm/ADT/SmallString.h"
234353Sdim#include "llvm/ADT/StringRef.h"
193323Sed#include "llvm/Support/Debug.h"
198090Srdivacky#include "llvm/Support/ErrorHandling.h"
193323Sed#include "llvm/Support/MathExtras.h"
193323Sed#include "llvm/Support/raw_ostream.h"
193323Sed#include <cmath>
249423Sdim#include <cstdlib>
249423Sdim#include <cstring>
193323Sed#include <limits>
193323Sedusing namespace llvm;
193323Sed
/// Allocate an array of \p numWords 64-bit words and set every word to zero.
/// The array comes from new[], so whoever ends up holding it must release it
/// with delete[].
/// @returns pointer to the first word of the zero-filled array.
inline static uint64_t* getClearedMemory(unsigned numWords) {
  uint64_t *const words = new uint64_t[numWords];
  assert(words && "APInt memory allocation fails!");
  // Zero the storage word by word.
  for (unsigned idx = 0; idx != numWords; ++idx)
    words[idx] = 0;
  return words;
}
193323Sed
/// Allocate an array of \p numWords 64-bit words without initializing the
/// contents.  The array comes from new[] and must be released with delete[].
/// @returns pointer to the first word of the (uninitialized) array.
inline static uint64_t* getMemory(unsigned numWords) {
  uint64_t *const words = new uint64_t[numWords];
  assert(words && "APInt memory allocation fails!");
  return words;
}
193323Sed
/// Convert the character \p cdigit to its numeric value in base \p radix.
/// For radix 16 and 36 both upper- and lower-case letters are accepted
/// ('A'/'a' is 10, and so on up to the last letter valid in that radix).
/// @returns the digit value, or -1U if \p cdigit is not a digit in \p radix.
inline static unsigned getDigit(char cdigit, uint8_t radix) {
  // Unsigned wrap-around turns anything below '0' into a huge value, so a
  // single "<" / "<=" comparison is a complete range check.
  const unsigned decimal = cdigit - '0';

  if (radix == 16 || radix == 36) {
    if (decimal <= 9)
      return decimal;

    // Highest zero-based letter index allowed: 5 for hex, 25 for base 36.
    const unsigned lastLetter = radix - 11U;

    const unsigned upper = cdigit - 'A';
    if (upper <= lastLetter)
      return upper + 10;

    const unsigned lower = cdigit - 'a';
    if (lower <= lastLetter)
      return lower + 10;

    // Neither a decimal digit nor a letter valid in this radix.
    return -1U;
  }

  return decimal < radix ? decimal : -1U;
}
198090Srdivacky
198090Srdivacky
193323Sedvoid APInt::initSlowCase(unsigned numBits, uint64_t val, bool isSigned) {
193323Sed  pVal = getClearedMemory(getNumWords());
193323Sed  pVal[0] = val;
198090Srdivacky  if (isSigned && int64_t(val) < 0)
193323Sed    for (unsigned i = 1; i < getNumWords(); ++i)
193323Sed      pVal[i] = -1ULL;
193323Sed}
193323Sed
193323Sedvoid APInt::initSlowCase(const APInt& that) {
193323Sed  pVal = getMemory(getNumWords());
193323Sed  memcpy(pVal, that.pVal, getNumWords() * APINT_WORD_SIZE);
193323Sed}
193323Sed
226633Sdimvoid APInt::initFromArray(ArrayRef<uint64_t> bigVal) {
198090Srdivacky  assert(BitWidth && "Bitwidth too small");
226633Sdim  assert(bigVal.data() && "Null pointer detected!");
193323Sed  if (isSingleWord())
193323Sed    VAL = bigVal[0];
193323Sed  else {
193323Sed    // Get memory, cleared to 0
193323Sed    pVal = getClearedMemory(getNumWords());
193323Sed    // Calculate the number of words to copy
226633Sdim    unsigned words = std::min<unsigned>(bigVal.size(), getNumWords());
193323Sed    // Copy the words from bigVal to pVal
226633Sdim    memcpy(pVal, bigVal.data(), words * APINT_WORD_SIZE);
193323Sed  }
193323Sed  // Make sure unused high bits are cleared
193323Sed  clearUnusedBits();
193323Sed}
193323Sed
226633SdimAPInt::APInt(unsigned numBits, ArrayRef<uint64_t> bigVal)
226633Sdim  : BitWidth(numBits), VAL(0) {
226633Sdim  initFromArray(bigVal);
226633Sdim}
226633Sdim
226633SdimAPInt::APInt(unsigned numBits, unsigned numWords, const uint64_t bigVal[])
226633Sdim  : BitWidth(numBits), VAL(0) {
226633Sdim  initFromArray(makeArrayRef(bigVal, numWords));
226633Sdim}
226633Sdim
210299SedAPInt::APInt(unsigned numbits, StringRef Str, uint8_t radix)
193323Sed  : BitWidth(numbits), VAL(0) {
198090Srdivacky  assert(BitWidth && "Bitwidth too small");
198090Srdivacky  fromString(numbits, Str, radix);
193323Sed}
193323Sed
193323SedAPInt& APInt::AssignSlowCase(const APInt& RHS) {
193323Sed  // Don't do anything for X = X
193323Sed  if (this == &RHS)
193323Sed    return *this;
193323Sed
193323Sed  if (BitWidth == RHS.getBitWidth()) {
193323Sed    // assume same bit-width single-word case is already handled
193323Sed    assert(!isSingleWord());
193323Sed    memcpy(pVal, RHS.pVal, getNumWords() * APINT_WORD_SIZE);
193323Sed    return *this;
193323Sed  }
193323Sed
193323Sed  if (isSingleWord()) {
193323Sed    // assume case where both are single words is already handled
193323Sed    assert(!RHS.isSingleWord());
193323Sed    VAL = 0;
193323Sed    pVal = getMemory(RHS.getNumWords());
193323Sed    memcpy(pVal, RHS.pVal, RHS.getNumWords() * APINT_WORD_SIZE);
198090Srdivacky  } else if (getNumWords() == RHS.getNumWords())
193323Sed    memcpy(pVal, RHS.pVal, RHS.getNumWords() * APINT_WORD_SIZE);
193323Sed  else if (RHS.isSingleWord()) {
193323Sed    delete [] pVal;
193323Sed    VAL = RHS.VAL;
193323Sed  } else {
193323Sed    delete [] pVal;
193323Sed    pVal = getMemory(RHS.getNumWords());
193323Sed    memcpy(pVal, RHS.pVal, RHS.getNumWords() * APINT_WORD_SIZE);
193323Sed  }
193323Sed  BitWidth = RHS.BitWidth;
193323Sed  return clearUnusedBits();
193323Sed}
193323Sed
193323SedAPInt& APInt::operator=(uint64_t RHS) {
198090Srdivacky  if (isSingleWord())
193323Sed    VAL = RHS;
193323Sed  else {
193323Sed    pVal[0] = RHS;
193323Sed    memset(pVal+1, 0, (getNumWords() - 1) * APINT_WORD_SIZE);
193323Sed  }
193323Sed  return clearUnusedBits();
193323Sed}
193323Sed
193323Sed/// Profile - This method 'profiles' an APInt for use with FoldingSet.
193323Sedvoid APInt::Profile(FoldingSetNodeID& ID) const {
193323Sed  ID.AddInteger(BitWidth);
198090Srdivacky
193323Sed  if (isSingleWord()) {
193323Sed    ID.AddInteger(VAL);
193323Sed    return;
193323Sed  }
193323Sed
193323Sed  unsigned NumWords = getNumWords();
193323Sed  for (unsigned i = 0; i < NumWords; ++i)
193323Sed    ID.AddInteger(pVal[i]);
193323Sed}
193323Sed
/// add_1 - Add the single "digit" (64-bit word) \p y to the multi-digit
/// integer x[0..len) and store the sum in dest[0..len).  \p dest may be the
/// same array as \p x (in-place addition) or a separate array; x[] itself is
/// only modified when it is also the destination.
///
/// Carry propagation stops at the first digit that does not overflow.  The
/// digits above that point are unchanged by the addition, so they are copied
/// verbatim when \p dest and \p x are different arrays (previously they were
/// left unwritten in that case).
/// @returns the carry out of the most significant digit.
static bool add_1(uint64_t dest[], uint64_t x[], unsigned len, uint64_t y) {
  unsigned i = 0;
  for (; i < len; ++i) {
    dest[i] = y + x[i];
    if (dest[i] < y)
      y = 1; // Wrapped around: carry one into the next digit.
    else {
      y = 0; // No carry, so the remaining digits keep their value.
      ++i;
      break;
    }
  }

  // When writing to a separate array, bring over the digits the carry never
  // reached.  For in-place use they are already where they belong.
  if (dest != x)
    for (; i < len; ++i)
      dest[i] = x[i];

  return y;
}
193323Sed
193323Sed/// @brief Prefix increment operator. Increments the APInt by one.
193323SedAPInt& APInt::operator++() {
198090Srdivacky  if (isSingleWord())
193323Sed    ++VAL;
193323Sed  else
193323Sed    add_1(pVal, pVal, getNumWords(), 1);
193323Sed  return clearUnusedBits();
193323Sed}
193323Sed
/// sub_1 - Subtract the single "digit" (64-bit word) \p y from the multi-digit
/// integer x[0..len) in place.  A borrow of 1 is propagated into successive
/// digits until a digit can absorb it or the digits run out.
/// @returns true if the borrow ran off the most significant digit (that is,
/// y was larger than the whole of x), false otherwise.
static bool sub_1(uint64_t x[], unsigned len, uint64_t y) {
  for (unsigned i = 0; i < len; ++i) {
    const uint64_t before = x[i];
    x[i] = before - y;
    // This digit was large enough: higher digits are untouched, no borrow out.
    if (y <= before)
      return false;
    y = 1; // We have to "borrow 1" from the next digit.
  }
  return bool(y);
}
193323Sed
193323Sed/// @brief Prefix decrement operator. Decrements the APInt by one.
193323SedAPInt& APInt::operator--() {
198090Srdivacky  if (isSingleWord())
193323Sed    --VAL;
193323Sed  else
193323Sed    sub_1(pVal, getNumWords(), 1);
193323Sed  return clearUnusedBits();
193323Sed}
193323Sed
/// add - Word-wise addition of the \p len digit integers \p x and \p y, with
/// the sum written to \p dest.  Both operands of a digit are read before the
/// result digit is stored, so \p dest may be the same array as \p x or \p y.
/// @returns the carry out of the most significant digit.
/// @brief General addition of 64-bit integer arrays
static bool add(uint64_t *dest, const uint64_t *x, const uint64_t *y,
                unsigned len) {
  bool carry = false;
  for (unsigned i = 0; i != len; ++i) {
    const uint64_t lhs = x[i];
    const uint64_t rhs = y[i];
    const uint64_t smaller = rhs < lhs ? rhs : lhs;
    const uint64_t sum = lhs + rhs + carry;
    dest[i] = sum;
    // The addition wrapped iff the sum fell below the smaller operand, or it
    // equals that operand while a carry was added in.
    carry = sum < smaller || (carry && sum == smaller);
  }
  return carry;
}
193323Sed
193323Sed/// Adds the RHS APint to this APInt.
193323Sed/// @returns this, after addition of RHS.
198090Srdivacky/// @brief Addition assignment operator.
193323SedAPInt& APInt::operator+=(const APInt& RHS) {
193323Sed  assert(BitWidth == RHS.BitWidth && "Bit widths must be the same");
198090Srdivacky  if (isSingleWord())
193323Sed    VAL += RHS.VAL;
193323Sed  else {
193323Sed    add(pVal, pVal, RHS.pVal, getNumWords());
193323Sed  }
193323Sed  return clearUnusedBits();
193323Sed}
193323Sed
/// sub - Word-wise subtraction x - y of two \p len digit integers, with the
/// difference written to \p dest.  Both operands of a digit are read before
/// the result digit is stored, so \p dest may be the same array as \p x or
/// \p y.
/// @returns the borrow out of the most significant digit.
/// @brief Generalized subtraction of 64-bit integer arrays.
static bool sub(uint64_t *dest, const uint64_t *x, const uint64_t *y,
                unsigned len) {
  bool borrow = false;
  for (unsigned i = 0; i != len; ++i) {
    const uint64_t minuend = x[i];
    const uint64_t subtrahend = y[i];
    // Apply the incoming borrow first (this may wrap when the digit is 0).
    const uint64_t adjusted = borrow ? minuend - 1 : minuend;
    // Borrow again if y's digit exceeds what is left, or if applying the
    // incoming borrow already wrapped a zero digit.
    borrow = subtrahend > adjusted || (borrow && minuend == 0);
    dest[i] = adjusted - subtrahend;
  }
  return borrow;
}
193323Sed
193323Sed/// Subtracts the RHS APInt from this APInt
193323Sed/// @returns this, after subtraction
198090Srdivacky/// @brief Subtraction assignment operator.
193323SedAPInt& APInt::operator-=(const APInt& RHS) {
193323Sed  assert(BitWidth == RHS.BitWidth && "Bit widths must be the same");
198090Srdivacky  if (isSingleWord())
193323Sed    VAL -= RHS.VAL;
193323Sed  else
193323Sed    sub(pVal, pVal, RHS.pVal, getNumWords());
193323Sed  return clearUnusedBits();
193323Sed}
193323Sed
/// Multiplies the \p len digit integer \p x by the single 64-bit digit \p y
/// and stores the low \p len digits of the product in \p dest.  Each 64x64
/// product is assembled from four 32x32 partial products so every
/// intermediate fits in 64 bits; the order of operations below matters for
/// the overflow bookkeeping.
/// @returns the carry out of the multiplication (the digit above dest[len-1]).
/// @brief Multiply a multi-digit APInt by a single digit (64-bit) integer.
static uint64_t mul_1(uint64_t dest[], uint64_t x[], unsigned len, uint64_t y) {
  const uint64_t Mask32 = 0xffffffffULL;
  const uint64_t Bit32 = 1ULL << 32;

  // Split y into its low and high 32-bit halves.
  const uint64_t yLo = y & Mask32, yHi = y >> 32;
  uint64_t carry = 0;

  for (unsigned i = 0; i < len; ++i) {
    // Split the current digit of x the same way.
    const uint64_t xLo = x[i] & Mask32;
    const uint64_t xHi = x[i] >> 32;
    const uint64_t cross = xLo * yHi;

    // Low partial product plus the carry coming in from the previous digit.
    const uint64_t low = carry + xLo * yLo;
    const bool lowWrapped = low < carry;

    // Middle column.  Its upper limit is (2^32 - 1)(2^32 - 1) + (2^32 - 1) +
    // 2^32 = 2^64, i.e. it can wrap to exactly zero.
    carry = xHi * yLo + (low >> 32) + (lowWrapped ? Bit32 : 0);

    // midState == 0: middle column is non-zero
    // midState == 1: middle column is zero and the low add wrapped
    // midState == 2: middle column is zero and the low add did not wrap
    uint8_t midState;
    if (carry != 0)
      midState = 0;
    else
      midState = lowWrapped ? 1 : 2;

    carry += cross & Mask32;
    dest[i] = (carry << 32) | (low & Mask32);

    // A middle column that reads zero although it should not be zero stands
    // for a lost 2^64, which is worth 2^32 in the outgoing carry.
    const bool lostWrap = (carry == 0 && midState != 2) || midState == 1;
    carry = (lostWrap ? Bit32 : 0) +
            (carry >> 32) + (cross >> 32) + xHi * yHi;
  }
  return carry;
}
193323Sed
198090Srdivacky/// Multiplies integer array x by integer array y and stores the result into
193323Sed/// the integer array dest. Note that dest's size must be >= xlen + ylen.
193323Sed/// @brief Generalized multiplicate of integer arrays.
193323Sedstatic void mul(uint64_t dest[], uint64_t x[], unsigned xlen, uint64_t y[],
193323Sed                unsigned ylen) {
193323Sed  dest[xlen] = mul_1(dest, x, xlen, y[0]);
193323Sed  for (unsigned i = 1; i < ylen; ++i) {
193323Sed    uint64_t ly = y[i] & 0xffffffffULL, hy = y[i] >> 32;
193323Sed    uint64_t carry = 0, lx = 0, hx = 0;
193323Sed    for (unsigned j = 0; j < xlen; ++j) {
193323Sed      lx = x[j] & 0xffffffffULL;
193323Sed      hx = x[j] >> 32;
193323Sed      // hasCarry - A flag to indicate if has carry.
193323Sed      // hasCarry == 0, no carry
193323Sed      // hasCarry == 1, has carry
193323Sed      // hasCarry == 2, no carry and the calculation result == 0.
193323Sed      uint8_t hasCarry = 0;
193323Sed      uint64_t resul = carry + lx * ly;
193323Sed      hasCarry = (resul < carry) ? 1 : 0;
193323Sed      carry = (hasCarry ? (1ULL << 32) : 0) + hx * ly + (resul >> 32);
193323Sed      hasCarry = (!carry && hasCarry) ? 1 : (!carry ? 2 : 0);
193323Sed
193323Sed      carry += (lx * hy) & 0xffffffffULL;
193323Sed      resul = (carry << 32) | (resul & 0xffffffffULL);
193323Sed      dest[i+j] += resul;
193323Sed      carry = (((!carry && hasCarry != 2) || hasCarry == 1) ? (1ULL << 32) : 0)+
198090Srdivacky              (carry >> 32) + (dest[i+j] < resul ? 1 : 0) +
193323Sed              ((lx * hy) >> 32) + hx * hy;
193323Sed    }
193323Sed    dest[i+xlen] = carry;
193323Sed  }
193323Sed}
193323Sed
193323SedAPInt& APInt::operator*=(const APInt& RHS) {
193323Sed  assert(BitWidth == RHS.BitWidth && "Bit widths must be the same");
193323Sed  if (isSingleWord()) {
193323Sed    VAL *= RHS.VAL;
193323Sed    clearUnusedBits();
193323Sed    return *this;
193323Sed  }
193323Sed
193323Sed  // Get some bit facts about LHS and check for zero
193323Sed  unsigned lhsBits = getActiveBits();
193323Sed  unsigned lhsWords = !lhsBits ? 0 : whichWord(lhsBits - 1) + 1;
198090Srdivacky  if (!lhsWords)
193323Sed    // 0 * X ===> 0
193323Sed    return *this;
193323Sed
193323Sed  // Get some bit facts about RHS and check for zero
193323Sed  unsigned rhsBits = RHS.getActiveBits();
193323Sed  unsigned rhsWords = !rhsBits ? 0 : whichWord(rhsBits - 1) + 1;
193323Sed  if (!rhsWords) {
193323Sed    // X * 0 ===> 0
218893Sdim    clearAllBits();
193323Sed    return *this;
193323Sed  }
193323Sed
193323Sed  // Allocate space for the result
193323Sed  unsigned destWords = rhsWords + lhsWords;
193323Sed  uint64_t *dest = getMemory(destWords);
193323Sed
193323Sed  // Perform the long multiply
193323Sed  mul(dest, pVal, lhsWords, RHS.pVal, rhsWords);
193323Sed
193323Sed  // Copy result back into *this
218893Sdim  clearAllBits();
193323Sed  unsigned wordsToCopy = destWords >= getNumWords() ? getNumWords() : destWords;
193323Sed  memcpy(pVal, dest, wordsToCopy * APINT_WORD_SIZE);
226633Sdim  clearUnusedBits();
193323Sed
193323Sed  // delete dest array and return
193323Sed  delete[] dest;
193323Sed  return *this;
193323Sed}
193323Sed
193323SedAPInt& APInt::operator&=(const APInt& RHS) {
193323Sed  assert(BitWidth == RHS.BitWidth && "Bit widths must be the same");
193323Sed  if (isSingleWord()) {
193323Sed    VAL &= RHS.VAL;
193323Sed    return *this;
193323Sed  }
193323Sed  unsigned numWords = getNumWords();
193323Sed  for (unsigned i = 0; i < numWords; ++i)
193323Sed    pVal[i] &= RHS.pVal[i];
193323Sed  return *this;
193323Sed}
193323Sed
193323SedAPInt& APInt::operator|=(const APInt& RHS) {
193323Sed  assert(BitWidth == RHS.BitWidth && "Bit widths must be the same");
193323Sed  if (isSingleWord()) {
193323Sed    VAL |= RHS.VAL;
193323Sed    return *this;
193323Sed  }
193323Sed  unsigned numWords = getNumWords();
193323Sed  for (unsigned i = 0; i < numWords; ++i)
193323Sed    pVal[i] |= RHS.pVal[i];
193323Sed  return *this;
193323Sed}
193323Sed
193323SedAPInt& APInt::operator^=(const APInt& RHS) {
193323Sed  assert(BitWidth == RHS.BitWidth && "Bit widths must be the same");
193323Sed  if (isSingleWord()) {
193323Sed    VAL ^= RHS.VAL;
193323Sed    this->clearUnusedBits();
193323Sed    return *this;
198090Srdivacky  }
193323Sed  unsigned numWords = getNumWords();
193323Sed  for (unsigned i = 0; i < numWords; ++i)
193323Sed    pVal[i] ^= RHS.pVal[i];
193323Sed  return clearUnusedBits();
193323Sed}
193323Sed
193323SedAPInt APInt::AndSlowCase(const APInt& RHS) const {
193323Sed  unsigned numWords = getNumWords();
193323Sed  uint64_t* val = getMemory(numWords);
193323Sed  for (unsigned i = 0; i < numWords; ++i)
193323Sed    val[i] = pVal[i] & RHS.pVal[i];
193323Sed  return APInt(val, getBitWidth());
193323Sed}
193323Sed
193323SedAPInt APInt::OrSlowCase(const APInt& RHS) const {
193323Sed  unsigned numWords = getNumWords();
193323Sed  uint64_t *val = getMemory(numWords);
193323Sed  for (unsigned i = 0; i < numWords; ++i)
193323Sed    val[i] = pVal[i] | RHS.pVal[i];
193323Sed  return APInt(val, getBitWidth());
193323Sed}
193323Sed
193323SedAPInt APInt::XorSlowCase(const APInt& RHS) const {
193323Sed  unsigned numWords = getNumWords();
193323Sed  uint64_t *val = getMemory(numWords);
193323Sed  for (unsigned i = 0; i < numWords; ++i)
193323Sed    val[i] = pVal[i] ^ RHS.pVal[i];
193323Sed
193323Sed  // 0^0==1 so clear the high bits in case they got set.
193323Sed  return APInt(val, getBitWidth()).clearUnusedBits();
193323Sed}
193323Sed
193323SedAPInt APInt::operator*(const APInt& RHS) const {
193323Sed  assert(BitWidth == RHS.BitWidth && "Bit widths must be the same");
193323Sed  if (isSingleWord())
193323Sed    return APInt(BitWidth, VAL * RHS.VAL);
193323Sed  APInt Result(*this);
193323Sed  Result *= RHS;
226633Sdim  return Result;
193323Sed}
193323Sed
193323SedAPInt APInt::operator+(const APInt& RHS) const {
193323Sed  assert(BitWidth == RHS.BitWidth && "Bit widths must be the same");
193323Sed  if (isSingleWord())
193323Sed    return APInt(BitWidth, VAL + RHS.VAL);
193323Sed  APInt Result(BitWidth, 0);
193323Sed  add(Result.pVal, this->pVal, RHS.pVal, getNumWords());
193323Sed  return Result.clearUnusedBits();
193323Sed}
193323Sed
193323SedAPInt APInt::operator-(const APInt& RHS) const {
193323Sed  assert(BitWidth == RHS.BitWidth && "Bit widths must be the same");
193323Sed  if (isSingleWord())
193323Sed    return APInt(BitWidth, VAL - RHS.VAL);
193323Sed  APInt Result(BitWidth, 0);
193323Sed  sub(Result.pVal, this->pVal, RHS.pVal, getNumWords());
193323Sed  return Result.clearUnusedBits();
193323Sed}
193323Sed
193323Sedbool APInt::EqualSlowCase(const APInt& RHS) const {
193323Sed  // Get some facts about the number of bits used in the two operands.
193323Sed  unsigned n1 = getActiveBits();
193323Sed  unsigned n2 = RHS.getActiveBits();
193323Sed
193323Sed  // If the number of bits isn't the same, they aren't equal
198090Srdivacky  if (n1 != n2)
193323Sed    return false;
193323Sed
193323Sed  // If the number of bits fits in a word, we only need to compare the low word.
193323Sed  if (n1 <= APINT_BITS_PER_WORD)
193323Sed    return pVal[0] == RHS.pVal[0];
193323Sed
193323Sed  // Otherwise, compare everything
193323Sed  for (int i = whichWord(n1 - 1); i >= 0; --i)
198090Srdivacky    if (pVal[i] != RHS.pVal[i])
193323Sed      return false;
193323Sed  return true;
193323Sed}
193323Sed
193323Sedbool APInt::EqualSlowCase(uint64_t Val) const {
193323Sed  unsigned n = getActiveBits();
193323Sed  if (n <= APINT_BITS_PER_WORD)
193323Sed    return pVal[0] == Val;
193323Sed  else
193323Sed    return false;
193323Sed}
193323Sed
193323Sedbool APInt::ult(const APInt& RHS) const {
193323Sed  assert(BitWidth == RHS.BitWidth && "Bit widths must be same for comparison");
193323Sed  if (isSingleWord())
193323Sed    return VAL < RHS.VAL;
193323Sed
193323Sed  // Get active bit length of both operands
193323Sed  unsigned n1 = getActiveBits();
193323Sed  unsigned n2 = RHS.getActiveBits();
193323Sed
193323Sed  // If magnitude of LHS is less than RHS, return true.
193323Sed  if (n1 < n2)
193323Sed    return true;
193323Sed
193323Sed  // If magnitude of RHS is greather than LHS, return false.
193323Sed  if (n2 < n1)
193323Sed    return false;
193323Sed
193323Sed  // If they bot fit in a word, just compare the low order word
193323Sed  if (n1 <= APINT_BITS_PER_WORD && n2 <= APINT_BITS_PER_WORD)
193323Sed    return pVal[0] < RHS.pVal[0];
193323Sed
193323Sed  // Otherwise, compare all words
193323Sed  unsigned topWord = whichWord(std::max(n1,n2)-1);
193323Sed  for (int i = topWord; i >= 0; --i) {
198090Srdivacky    if (pVal[i] > RHS.pVal[i])
193323Sed      return false;
198090Srdivacky    if (pVal[i] < RHS.pVal[i])
193323Sed      return true;
193323Sed  }
193323Sed  return false;
193323Sed}
193323Sed
193323Sedbool APInt::slt(const APInt& RHS) const {
193323Sed  assert(BitWidth == RHS.BitWidth && "Bit widths must be same for comparison");
193323Sed  if (isSingleWord()) {
193323Sed    int64_t lhsSext = (int64_t(VAL) << (64-BitWidth)) >> (64-BitWidth);
193323Sed    int64_t rhsSext = (int64_t(RHS.VAL) << (64-BitWidth)) >> (64-BitWidth);
193323Sed    return lhsSext < rhsSext;
193323Sed  }
193323Sed
193323Sed  APInt lhs(*this);
193323Sed  APInt rhs(RHS);
193323Sed  bool lhsNeg = isNegative();
193323Sed  bool rhsNeg = rhs.isNegative();
193323Sed  if (lhsNeg) {
193323Sed    // Sign bit is set so perform two's complement to make it positive
218893Sdim    lhs.flipAllBits();
249423Sdim    ++lhs;
193323Sed  }
193323Sed  if (rhsNeg) {
193323Sed    // Sign bit is set so perform two's complement to make it positive
218893Sdim    rhs.flipAllBits();
249423Sdim    ++rhs;
193323Sed  }
193323Sed
193323Sed  // Now we have unsigned values to compare so do the comparison if necessary
193323Sed  // based on the negativeness of the values.
193323Sed  if (lhsNeg)
193323Sed    if (rhsNeg)
193323Sed      return lhs.ugt(rhs);
193323Sed    else
193323Sed      return true;
193323Sed  else if (rhsNeg)
193323Sed    return false;
198090Srdivacky  else
193323Sed    return lhs.ult(rhs);
193323Sed}
193323Sed
218893Sdimvoid APInt::setBit(unsigned bitPosition) {
198090Srdivacky  if (isSingleWord())
193323Sed    VAL |= maskBit(bitPosition);
198090Srdivacky  else
193323Sed    pVal[whichWord(bitPosition)] |= maskBit(bitPosition);
193323Sed}
193323Sed
193323Sed/// Set the given bit to 0 whose position is given as "bitPosition".
193323Sed/// @brief Set a given bit to 0.
218893Sdimvoid APInt::clearBit(unsigned bitPosition) {
198090Srdivacky  if (isSingleWord())
193323Sed    VAL &= ~maskBit(bitPosition);
198090Srdivacky  else
193323Sed    pVal[whichWord(bitPosition)] &= ~maskBit(bitPosition);
193323Sed}
193323Sed
193323Sed/// @brief Toggle every bit to its opposite value.
193323Sed
198090Srdivacky/// Toggle a given bit to its opposite value whose position is given
193323Sed/// as "bitPosition".
193323Sed/// @brief Toggles a given bit to its opposite value.
218893Sdimvoid APInt::flipBit(unsigned bitPosition) {
193323Sed  assert(bitPosition < BitWidth && "Out of the bit-width range!");
218893Sdim  if ((*this)[bitPosition]) clearBit(bitPosition);
218893Sdim  else setBit(bitPosition);
193323Sed}
193323Sed
210299Sedunsigned APInt::getBitsNeeded(StringRef str, uint8_t radix) {
198090Srdivacky  assert(!str.empty() && "Invalid string length");
226633Sdim  assert((radix == 10 || radix == 8 || radix == 16 || radix == 2 ||
226633Sdim          radix == 36) &&
226633Sdim         "Radix should be 2, 8, 10, 16, or 36!");
193323Sed
198090Srdivacky  size_t slen = str.size();
198090Srdivacky
198090Srdivacky  // Each computation below needs to know if it's negative.
198090Srdivacky  StringRef::iterator p = str.begin();
198090Srdivacky  unsigned isNegative = *p == '-';
198090Srdivacky  if (*p == '-' || *p == '+') {
198090Srdivacky    p++;
193323Sed    slen--;
198090Srdivacky    assert(slen && "String is only a sign, needs a value.");
193323Sed  }
198090Srdivacky
193323Sed  // For radixes of power-of-two values, the bits required is accurately and
193323Sed  // easily computed
193323Sed  if (radix == 2)
193323Sed    return slen + isNegative;
193323Sed  if (radix == 8)
193323Sed    return slen * 3 + isNegative;
193323Sed  if (radix == 16)
193323Sed    return slen * 4 + isNegative;
193323Sed
226633Sdim  // FIXME: base 36
226633Sdim
193323Sed  // This is grossly inefficient but accurate. We could probably do something
193323Sed  // with a computation of roughly slen*64/20 and then adjust by the value of
193323Sed  // the first few digits. But, I'm not sure how accurate that could be.
193323Sed
193323Sed  // Compute a sufficient number of bits that is always large enough but might
198090Srdivacky  // be too large. This avoids the assertion in the constructor. This
198090Srdivacky  // calculation doesn't work appropriately for the numbers 0-9, so just use 4
198090Srdivacky  // bits in that case.
226633Sdim  unsigned sufficient
226633Sdim    = radix == 10? (slen == 1 ? 4 : slen * 64/18)
226633Sdim                 : (slen == 1 ? 7 : slen * 16/3);
193323Sed
193323Sed  // Convert to the actual binary value.
198090Srdivacky  APInt tmp(sufficient, StringRef(p, slen), radix);
193323Sed
198090Srdivacky  // Compute how many bits are required. If the log is infinite, assume we need
198090Srdivacky  // just bit.
198090Srdivacky  unsigned log = tmp.logBase2();
198090Srdivacky  if (log == (unsigned)-1) {
198090Srdivacky    return isNegative + 1;
198090Srdivacky  } else {
198090Srdivacky    return isNegative + log + 1;
198090Srdivacky  }
193323Sed}
193323Sed
234353Sdimhash_code llvm::hash_value(const APInt &Arg) {
234353Sdim  if (Arg.isSingleWord())
234353Sdim    return hash_combine(Arg.VAL);
193323Sed
234353Sdim  return hash_combine_range(Arg.pVal, Arg.pVal + Arg.getNumWords());
193323Sed}
193323Sed
193323Sed/// HiBits - This function returns the high "numBits" bits of this APInt.
193323SedAPInt APInt::getHiBits(unsigned numBits) const {
193323Sed  return APIntOps::lshr(*this, BitWidth - numBits);
193323Sed}
193323Sed
193323Sed/// LoBits - This function returns the low "numBits" bits of this APInt.
193323SedAPInt APInt::getLoBits(unsigned numBits) const {
198090Srdivacky  return APIntOps::lshr(APIntOps::shl(*this, BitWidth - numBits),
193323Sed                        BitWidth - numBits);
193323Sed}
193323Sed
193323Sedunsigned APInt::countLeadingZerosSlowCase() const {
203954Srdivacky  // Treat the most significand word differently because it might have
203954Srdivacky  // meaningless bits set beyond the precision.
203954Srdivacky  unsigned BitsInMSW = BitWidth % APINT_BITS_PER_WORD;
203954Srdivacky  integerPart MSWMask;
203954Srdivacky  if (BitsInMSW) MSWMask = (integerPart(1) << BitsInMSW) - 1;
203954Srdivacky  else {
203954Srdivacky    MSWMask = ~integerPart(0);
203954Srdivacky    BitsInMSW = APINT_BITS_PER_WORD;
203954Srdivacky  }
203954Srdivacky
203954Srdivacky  unsigned i = getNumWords();
203954Srdivacky  integerPart MSW = pVal[i-1] & MSWMask;
203954Srdivacky  if (MSW)
263508Sdim    return llvm::countLeadingZeros(MSW) - (APINT_BITS_PER_WORD - BitsInMSW);
203954Srdivacky
203954Srdivacky  unsigned Count = BitsInMSW;
203954Srdivacky  for (--i; i > 0u; --i) {
193323Sed    if (pVal[i-1] == 0)
193323Sed      Count += APINT_BITS_PER_WORD;
193323Sed    else {
263508Sdim      Count += llvm::countLeadingZeros(pVal[i-1]);
193323Sed      break;
193323Sed    }
193323Sed  }
203954Srdivacky  return Count;
193323Sed}
193323Sed
193323Sedunsigned APInt::countLeadingOnes() const {
193323Sed  if (isSingleWord())
234353Sdim    return CountLeadingOnes_64(VAL << (APINT_BITS_PER_WORD - BitWidth));
193323Sed
193323Sed  unsigned highWordBits = BitWidth % APINT_BITS_PER_WORD;
193323Sed  unsigned shift;
193323Sed  if (!highWordBits) {
193323Sed    highWordBits = APINT_BITS_PER_WORD;
193323Sed    shift = 0;
193323Sed  } else {
193323Sed    shift = APINT_BITS_PER_WORD - highWordBits;
193323Sed  }
193323Sed  int i = getNumWords() - 1;
234353Sdim  unsigned Count = CountLeadingOnes_64(pVal[i] << shift);
193323Sed  if (Count == highWordBits) {
193323Sed    for (i--; i >= 0; --i) {
193323Sed      if (pVal[i] == -1ULL)
193323Sed        Count += APINT_BITS_PER_WORD;
193323Sed      else {
234353Sdim        Count += CountLeadingOnes_64(pVal[i]);
193323Sed        break;
193323Sed      }
193323Sed    }
193323Sed  }
193323Sed  return Count;
193323Sed}
193323Sed
193323Sedunsigned APInt::countTrailingZeros() const {
193323Sed  if (isSingleWord())
263508Sdim    return std::min(unsigned(llvm::countTrailingZeros(VAL)), BitWidth);
193323Sed  unsigned Count = 0;
193323Sed  unsigned i = 0;
193323Sed  for (; i < getNumWords() && pVal[i] == 0; ++i)
193323Sed    Count += APINT_BITS_PER_WORD;
193323Sed  if (i < getNumWords())
263508Sdim    Count += llvm::countTrailingZeros(pVal[i]);
193323Sed  return std::min(Count, BitWidth);
193323Sed}
193323Sed
193323Sedunsigned APInt::countTrailingOnesSlowCase() const {
193323Sed  unsigned Count = 0;
193323Sed  unsigned i = 0;
193323Sed  for (; i < getNumWords() && pVal[i] == -1ULL; ++i)
193323Sed    Count += APINT_BITS_PER_WORD;
193323Sed  if (i < getNumWords())
193323Sed    Count += CountTrailingOnes_64(pVal[i]);
193323Sed  return std::min(Count, BitWidth);
193323Sed}
193323Sed
193323Sedunsigned APInt::countPopulationSlowCase() const {
193323Sed  unsigned Count = 0;
193323Sed  for (unsigned i = 0; i < getNumWords(); ++i)
193323Sed    Count += CountPopulation_64(pVal[i]);
193323Sed  return Count;
193323Sed}
193323Sed
/// Perform a logical right-shift of the \p Words word integer in \p Src by
/// \p Shift bits and store the result in \p Dst.  \p Src and \p Dst must be
/// either the same array or non-overlapping.  \p Shift must be less than 64.
///
/// A shift of zero is handled explicitly as a plain copy: the general path
/// would evaluate "Tmp << 64", which is undefined behaviour for a 64-bit
/// operand and in practice smears each word into the one below it.
static void lshrNear(uint64_t *Dst, uint64_t *Src, unsigned Words,
                     unsigned Shift) {
  assert(Shift < 64 && "Shift must be less than the word size");

  if (Shift == 0) {
    if (Dst != Src)
      for (unsigned I = 0; I != Words; ++I)
        Dst[I] = Src[I];
    return;
  }

  // Walk from the most significant word down, carrying the bits that fall
  // off the bottom of each word into the top of the next lower one.
  uint64_t Carry = 0;
  for (unsigned I = Words; I-- > 0; ) {
    const uint64_t Tmp = Src[I];
    Dst[I] = (Tmp >> Shift) | Carry;
    Carry = Tmp << (64 - Shift);
  }
}
234353Sdim
193323SedAPInt APInt::byteSwap() const {
193323Sed  assert(BitWidth >= 16 && BitWidth % 16 == 0 && "Cannot byteswap!");
193323Sed  if (BitWidth == 16)
193323Sed    return APInt(BitWidth, ByteSwap_16(uint16_t(VAL)));
234353Sdim  if (BitWidth == 32)
193323Sed    return APInt(BitWidth, ByteSwap_32(unsigned(VAL)));
234353Sdim  if (BitWidth == 48) {
193323Sed    unsigned Tmp1 = unsigned(VAL >> 16);
193323Sed    Tmp1 = ByteSwap_32(Tmp1);
193323Sed    uint16_t Tmp2 = uint16_t(VAL);
193323Sed    Tmp2 = ByteSwap_16(Tmp2);
193323Sed    return APInt(BitWidth, (uint64_t(Tmp2) << 32) | Tmp1);
234353Sdim  }
234353Sdim  if (BitWidth == 64)
193323Sed    return APInt(BitWidth, ByteSwap_64(VAL));
234353Sdim
234353Sdim  APInt Result(getNumWords() * APINT_BITS_PER_WORD, 0);
234353Sdim  for (unsigned I = 0, N = getNumWords(); I != N; ++I)
234353Sdim    Result.pVal[I] = ByteSwap_64(pVal[N - I - 1]);
234353Sdim  if (Result.BitWidth != BitWidth) {
234353Sdim    lshrNear(Result.pVal, Result.pVal, getNumWords(),
234353Sdim             Result.BitWidth - BitWidth);
234353Sdim    Result.BitWidth = BitWidth;
193323Sed  }
234353Sdim  return Result;
193323Sed}
193323Sed
198090SrdivackyAPInt llvm::APIntOps::GreatestCommonDivisor(const APInt& API1,
193323Sed                                            const APInt& API2) {
193323Sed  APInt A = API1, B = API2;
193323Sed  while (!!B) {
193323Sed    APInt T = B;
193323Sed    B = APIntOps::urem(A, B);
193323Sed    A = T;
193323Sed  }
193323Sed  return A;
193323Sed}
193323Sed
193323SedAPInt llvm::APIntOps::RoundDoubleToAPInt(double Double, unsigned width) {
193323Sed  union {
193323Sed    double D;
193323Sed    uint64_t I;
193323Sed  } T;
193323Sed  T.D = Double;
193323Sed
193323Sed  // Get the sign bit from the highest order bit
193323Sed  bool isNeg = T.I >> 63;
193323Sed
193323Sed  // Get the 11-bit exponent and adjust for the 1023 bit bias
193323Sed  int64_t exp = ((T.I >> 52) & 0x7ff) - 1023;
193323Sed
193323Sed  // If the exponent is negative, the value is < 0 so just return 0.
193323Sed  if (exp < 0)
193323Sed    return APInt(width, 0u);
193323Sed
193323Sed  // Extract the mantissa by clearing the top 12 bits (sign + exponent).
193323Sed  uint64_t mantissa = (T.I & (~0ULL >> 12)) | 1ULL << 52;
193323Sed
193323Sed  // If the exponent doesn't shift all bits out of the mantissa
193323Sed  if (exp < 52)
198090Srdivacky    return isNeg ? -APInt(width, mantissa >> (52 - exp)) :
193323Sed                    APInt(width, mantissa >> (52 - exp));
193323Sed
193323Sed  // If the client didn't provide enough bits for us to shift the mantissa into
193323Sed  // then the result is undefined, just return 0
193323Sed  if (width <= exp - 52)
193323Sed    return APInt(width, 0);
193323Sed
193323Sed  // Otherwise, we have to shift the mantissa bits up to the right location
193323Sed  APInt Tmp(width, mantissa);
193323Sed  Tmp = Tmp.shl((unsigned)exp - 52);
193323Sed  return isNeg ? -Tmp : Tmp;
193323Sed}
193323Sed
198090Srdivacky/// RoundToDouble - This function converts this APInt to a double.
193323Sed/// The layout for double is as following (IEEE Standard 754):
193323Sed///  --------------------------------------
193323Sed/// |  Sign    Exponent    Fraction    Bias |
193323Sed/// |-------------------------------------- |
193323Sed/// |  1[63]   11[62-52]   52[51-00]   1023 |
198090Srdivacky///  --------------------------------------
193323Seddouble APInt::roundToDouble(bool isSigned) const {
193323Sed
193323Sed  // Handle the simple case where the value is contained in one uint64_t.
198090Srdivacky  // It is wrong to optimize getWord(0) to VAL; there might be more than one word.
193323Sed  if (isSingleWord() || getActiveBits() <= APINT_BITS_PER_WORD) {
193323Sed    if (isSigned) {
198090Srdivacky      int64_t sext = (int64_t(getWord(0)) << (64-BitWidth)) >> (64-BitWidth);
193323Sed      return double(sext);
193323Sed    } else
198090Srdivacky      return double(getWord(0));
193323Sed  }
193323Sed
193323Sed  // Determine if the value is negative.
193323Sed  bool isNeg = isSigned ? (*this)[BitWidth-1] : false;
193323Sed
193323Sed  // Construct the absolute value if we're negative.
193323Sed  APInt Tmp(isNeg ? -(*this) : (*this));
193323Sed
193323Sed  // Figure out how many bits we're using.
193323Sed  unsigned n = Tmp.getActiveBits();
193323Sed
193323Sed  // The exponent (without bias normalization) is just the number of bits
193323Sed  // we are using. Note that the sign bit is gone since we constructed the
193323Sed  // absolute value.
193323Sed  uint64_t exp = n;
193323Sed
193323Sed  // Return infinity for exponent overflow
193323Sed  if (exp > 1023) {
193323Sed    if (!isSigned || !isNeg)
193323Sed      return std::numeric_limits<double>::infinity();
198090Srdivacky    else
193323Sed      return -std::numeric_limits<double>::infinity();
193323Sed  }
193323Sed  exp += 1023; // Increment for 1023 bias
193323Sed
193323Sed  // Number of bits in mantissa is 52. To obtain the mantissa value, we must
193323Sed  // extract the high 52 bits from the correct words in pVal.
193323Sed  uint64_t mantissa;
193323Sed  unsigned hiWord = whichWord(n-1);
193323Sed  if (hiWord == 0) {
193323Sed    mantissa = Tmp.pVal[0];
193323Sed    if (n > 52)
193323Sed      mantissa >>= n - 52; // shift down, we want the top 52 bits.
193323Sed  } else {
193323Sed    assert(hiWord > 0 && "huh?");
193323Sed    uint64_t hibits = Tmp.pVal[hiWord] << (52 - n % APINT_BITS_PER_WORD);
193323Sed    uint64_t lobits = Tmp.pVal[hiWord-1] >> (11 + n % APINT_BITS_PER_WORD);
193323Sed    mantissa = hibits | lobits;
193323Sed  }
193323Sed
193323Sed  // The leading bit of mantissa is implicit, so get rid of it.
193323Sed  uint64_t sign = isNeg ? (1ULL << (APINT_BITS_PER_WORD - 1)) : 0;
193323Sed  union {
193323Sed    double D;
193323Sed    uint64_t I;
193323Sed  } T;
193323Sed  T.I = sign | (exp << 52) | mantissa;
193323Sed  return T.D;
193323Sed}
193323Sed
193323Sed// Truncate to new width.
218893SdimAPInt APInt::trunc(unsigned width) const {
193323Sed  assert(width < BitWidth && "Invalid APInt Truncate request");
193323Sed  assert(width && "Can't truncate to 0 bits");
218893Sdim
218893Sdim  if (width <= APINT_BITS_PER_WORD)
218893Sdim    return APInt(width, getRawData()[0]);
218893Sdim
218893Sdim  APInt Result(getMemory(getNumWords(width)), width);
218893Sdim
218893Sdim  // Copy full words.
218893Sdim  unsigned i;
218893Sdim  for (i = 0; i != width / APINT_BITS_PER_WORD; i++)
218893Sdim    Result.pVal[i] = pVal[i];
218893Sdim
218893Sdim  // Truncate and copy any partial word.
218893Sdim  unsigned bits = (0 - width) % APINT_BITS_PER_WORD;
218893Sdim  if (bits != 0)
218893Sdim    Result.pVal[i] = pVal[i] << bits >> bits;
218893Sdim
218893Sdim  return Result;
193323Sed}
193323Sed
193323Sed// Sign extend to a new width.
218893SdimAPInt APInt::sext(unsigned width) const {
193323Sed  assert(width > BitWidth && "Invalid APInt SignExtend request");
218893Sdim
218893Sdim  if (width <= APINT_BITS_PER_WORD) {
218893Sdim    uint64_t val = VAL << (APINT_BITS_PER_WORD - BitWidth);
218893Sdim    val = (int64_t)val >> (width - BitWidth);
218893Sdim    return APInt(width, val >> (APINT_BITS_PER_WORD - width));
193323Sed  }
193323Sed
218893Sdim  APInt Result(getMemory(getNumWords(width)), width);
193323Sed
218893Sdim  // Copy full words.
218893Sdim  unsigned i;
218893Sdim  uint64_t word = 0;
218893Sdim  for (i = 0; i != BitWidth / APINT_BITS_PER_WORD; i++) {
218893Sdim    word = getRawData()[i];
218893Sdim    Result.pVal[i] = word;
193323Sed  }
193323Sed
218893Sdim  // Read and sign-extend any partial word.
218893Sdim  unsigned bits = (0 - BitWidth) % APINT_BITS_PER_WORD;
218893Sdim  if (bits != 0)
218893Sdim    word = (int64_t)getRawData()[i] << bits >> bits;
218893Sdim  else
218893Sdim    word = (int64_t)word >> (APINT_BITS_PER_WORD - 1);
218893Sdim
218893Sdim  // Write remaining full words.
218893Sdim  for (; i != width / APINT_BITS_PER_WORD; i++) {
218893Sdim    Result.pVal[i] = word;
218893Sdim    word = (int64_t)word >> (APINT_BITS_PER_WORD - 1);
193323Sed  }
218893Sdim
218893Sdim  // Write any partial word.
218893Sdim  bits = (0 - width) % APINT_BITS_PER_WORD;
218893Sdim  if (bits != 0)
218893Sdim    Result.pVal[i] = word << bits >> bits;
218893Sdim
218893Sdim  return Result;
193323Sed}
193323Sed
193323Sed//  Zero extend to a new width.
218893SdimAPInt APInt::zext(unsigned width) const {
193323Sed  assert(width > BitWidth && "Invalid APInt ZeroExtend request");
218893Sdim
218893Sdim  if (width <= APINT_BITS_PER_WORD)
218893Sdim    return APInt(width, VAL);
218893Sdim
218893Sdim  APInt Result(getMemory(getNumWords(width)), width);
218893Sdim
218893Sdim  // Copy words.
218893Sdim  unsigned i;
218893Sdim  for (i = 0; i != getNumWords(); i++)
218893Sdim    Result.pVal[i] = getRawData()[i];
218893Sdim
218893Sdim  // Zero remaining words.
218893Sdim  memset(&Result.pVal[i], 0, (Result.getNumWords() - i) * APINT_WORD_SIZE);
218893Sdim
218893Sdim  return Result;
193323Sed}
193323Sed
218893SdimAPInt APInt::zextOrTrunc(unsigned width) const {
193323Sed  if (BitWidth < width)
193323Sed    return zext(width);
193323Sed  if (BitWidth > width)
193323Sed    return trunc(width);
193323Sed  return *this;
193323Sed}
193323Sed
218893SdimAPInt APInt::sextOrTrunc(unsigned width) const {
193323Sed  if (BitWidth < width)
193323Sed    return sext(width);
193323Sed  if (BitWidth > width)
193323Sed    return trunc(width);
193323Sed  return *this;
193323Sed}
193323Sed
234353SdimAPInt APInt::zextOrSelf(unsigned width) const {
234353Sdim  if (BitWidth < width)
234353Sdim    return zext(width);
234353Sdim  return *this;
234353Sdim}
234353Sdim
234353SdimAPInt APInt::sextOrSelf(unsigned width) const {
234353Sdim  if (BitWidth < width)
234353Sdim    return sext(width);
234353Sdim  return *this;
234353Sdim}
234353Sdim
193323Sed/// Arithmetic right-shift this APInt by shiftAmt.
193323Sed/// @brief Arithmetic right-shift function.
193323SedAPInt APInt::ashr(const APInt &shiftAmt) const {
193323Sed  return ashr((unsigned)shiftAmt.getLimitedValue(BitWidth));
193323Sed}
193323Sed
193323Sed/// Arithmetic right-shift this APInt by shiftAmt.
193323Sed/// @brief Arithmetic right-shift function.
193323SedAPInt APInt::ashr(unsigned shiftAmt) const {
193323Sed  assert(shiftAmt <= BitWidth && "Invalid shift amount");
193323Sed  // Handle a degenerate case
193323Sed  if (shiftAmt == 0)
193323Sed    return *this;
193323Sed
193323Sed  // Handle single word shifts with built-in ashr
193323Sed  if (isSingleWord()) {
193323Sed    if (shiftAmt == BitWidth)
193323Sed      return APInt(BitWidth, 0); // undefined
193323Sed    else {
193323Sed      unsigned SignBit = APINT_BITS_PER_WORD - BitWidth;
198090Srdivacky      return APInt(BitWidth,
193323Sed        (((int64_t(VAL) << SignBit) >> SignBit) >> shiftAmt));
193323Sed    }
193323Sed  }
193323Sed
193323Sed  // If all the bits were shifted out, the result is, technically, undefined.
193323Sed  // We return -1 if it was negative, 0 otherwise. We check this early to avoid
193323Sed  // issues in the algorithm below.
193323Sed  if (shiftAmt == BitWidth) {
193323Sed    if (isNegative())
193323Sed      return APInt(BitWidth, -1ULL, true);
193323Sed    else
193323Sed      return APInt(BitWidth, 0);
193323Sed  }
193323Sed
193323Sed  // Create some space for the result.
193323Sed  uint64_t * val = new uint64_t[getNumWords()];
193323Sed
193323Sed  // Compute some values needed by the following shift algorithms
193323Sed  unsigned wordShift = shiftAmt % APINT_BITS_PER_WORD; // bits to shift per word
193323Sed  unsigned offset = shiftAmt / APINT_BITS_PER_WORD; // word offset for shift
193323Sed  unsigned breakWord = getNumWords() - 1 - offset; // last word affected
193323Sed  unsigned bitsInWord = whichBit(BitWidth); // how many bits in last word?
193323Sed  if (bitsInWord == 0)
193323Sed    bitsInWord = APINT_BITS_PER_WORD;
193323Sed
193323Sed  // If we are shifting whole words, just move whole words
193323Sed  if (wordShift == 0) {
193323Sed    // Move the words containing significant bits
193323Sed    for (unsigned i = 0; i <= breakWord; ++i)
193323Sed      val[i] = pVal[i+offset]; // move whole word
193323Sed
193323Sed    // Adjust the top significant word for sign bit fill, if negative
193323Sed    if (isNegative())
193323Sed      if (bitsInWord < APINT_BITS_PER_WORD)
193323Sed        val[breakWord] |= ~0ULL << bitsInWord; // set high bits
193323Sed  } else {
198090Srdivacky    // Shift the low order words
193323Sed    for (unsigned i = 0; i < breakWord; ++i) {
193323Sed      // This combines the shifted corresponding word with the low bits from
193323Sed      // the next word (shifted into this word's high bits).
198090Srdivacky      val[i] = (pVal[i+offset] >> wordShift) |
193323Sed               (pVal[i+offset+1] << (APINT_BITS_PER_WORD - wordShift));
193323Sed    }
193323Sed
193323Sed    // Shift the break word. In this case there are no bits from the next word
193323Sed    // to include in this word.
193323Sed    val[breakWord] = pVal[breakWord+offset] >> wordShift;
193323Sed
193323Sed    // Deal with sign extenstion in the break word, and possibly the word before
193323Sed    // it.
193323Sed    if (isNegative()) {
193323Sed      if (wordShift > bitsInWord) {
193323Sed        if (breakWord > 0)
198090Srdivacky          val[breakWord-1] |=
193323Sed            ~0ULL << (APINT_BITS_PER_WORD - (wordShift - bitsInWord));
193323Sed        val[breakWord] |= ~0ULL;
198090Srdivacky      } else
193323Sed        val[breakWord] |= (~0ULL << (bitsInWord - wordShift));
193323Sed    }
193323Sed  }
193323Sed
193323Sed  // Remaining words are 0 or -1, just assign them.
193323Sed  uint64_t fillValue = (isNegative() ? -1ULL : 0);
193323Sed  for (unsigned i = breakWord+1; i < getNumWords(); ++i)
193323Sed    val[i] = fillValue;
193323Sed  return APInt(val, BitWidth).clearUnusedBits();
193323Sed}
193323Sed
193323Sed/// Logical right-shift this APInt by shiftAmt.
193323Sed/// @brief Logical right-shift function.
193323SedAPInt APInt::lshr(const APInt &shiftAmt) const {
193323Sed  return lshr((unsigned)shiftAmt.getLimitedValue(BitWidth));
193323Sed}
193323Sed
193323Sed/// Logical right-shift this APInt by shiftAmt.
193323Sed/// @brief Logical right-shift function.
193323SedAPInt APInt::lshr(unsigned shiftAmt) const {
193323Sed  if (isSingleWord()) {
234353Sdim    if (shiftAmt >= BitWidth)
193323Sed      return APInt(BitWidth, 0);
198090Srdivacky    else
193323Sed      return APInt(BitWidth, this->VAL >> shiftAmt);
193323Sed  }
193323Sed
193323Sed  // If all the bits were shifted out, the result is 0. This avoids issues
193323Sed  // with shifting by the size of the integer type, which produces undefined
193323Sed  // results. We define these "undefined results" to always be 0.
239462Sdim  if (shiftAmt >= BitWidth)
193323Sed    return APInt(BitWidth, 0);
193323Sed
193323Sed  // If none of the bits are shifted out, the result is *this. This avoids
198090Srdivacky  // issues with shifting by the size of the integer type, which produces
193323Sed  // undefined results in the code below. This is also an optimization.
193323Sed  if (shiftAmt == 0)
193323Sed    return *this;
193323Sed
193323Sed  // Create some space for the result.
193323Sed  uint64_t * val = new uint64_t[getNumWords()];
193323Sed
193323Sed  // If we are shifting less than a word, compute the shift with a simple carry
193323Sed  if (shiftAmt < APINT_BITS_PER_WORD) {
234353Sdim    lshrNear(val, pVal, getNumWords(), shiftAmt);
193323Sed    return APInt(val, BitWidth).clearUnusedBits();
193323Sed  }
193323Sed
193323Sed  // Compute some values needed by the remaining shift algorithms
193323Sed  unsigned wordShift = shiftAmt % APINT_BITS_PER_WORD;
193323Sed  unsigned offset = shiftAmt / APINT_BITS_PER_WORD;
193323Sed
193323Sed  // If we are shifting whole words, just move whole words
193323Sed  if (wordShift == 0) {
193323Sed    for (unsigned i = 0; i < getNumWords() - offset; ++i)
193323Sed      val[i] = pVal[i+offset];
193323Sed    for (unsigned i = getNumWords()-offset; i < getNumWords(); i++)
193323Sed      val[i] = 0;
193323Sed    return APInt(val,BitWidth).clearUnusedBits();
193323Sed  }
193323Sed
198090Srdivacky  // Shift the low order words
193323Sed  unsigned breakWord = getNumWords() - offset -1;
193323Sed  for (unsigned i = 0; i < breakWord; ++i)
193323Sed    val[i] = (pVal[i+offset] >> wordShift) |
193323Sed             (pVal[i+offset+1] << (APINT_BITS_PER_WORD - wordShift));
193323Sed  // Shift the break word.
193323Sed  val[breakWord] = pVal[breakWord+offset] >> wordShift;
193323Sed
193323Sed  // Remaining words are 0
193323Sed  for (unsigned i = breakWord+1; i < getNumWords(); ++i)
193323Sed    val[i] = 0;
193323Sed  return APInt(val, BitWidth).clearUnusedBits();
193323Sed}
193323Sed
193323Sed/// Left-shift this APInt by shiftAmt.
193323Sed/// @brief Left-shift function.
193323SedAPInt APInt::shl(const APInt &shiftAmt) const {
193323Sed  // It's undefined behavior in C to shift by BitWidth or greater.
193323Sed  return shl((unsigned)shiftAmt.getLimitedValue(BitWidth));
193323Sed}
193323Sed
193323SedAPInt APInt::shlSlowCase(unsigned shiftAmt) const {
193323Sed  // If all the bits were shifted out, the result is 0. This avoids issues
193323Sed  // with shifting by the size of the integer type, which produces undefined
193323Sed  // results. We define these "undefined results" to always be 0.
193323Sed  if (shiftAmt == BitWidth)
193323Sed    return APInt(BitWidth, 0);
193323Sed
193323Sed  // If none of the bits are shifted out, the result is *this. This avoids a
193323Sed  // lshr by the words size in the loop below which can produce incorrect
193323Sed  // results. It also avoids the expensive computation below for a common case.
193323Sed  if (shiftAmt == 0)
193323Sed    return *this;
193323Sed
193323Sed  // Create some space for the result.
193323Sed  uint64_t * val = new uint64_t[getNumWords()];
193323Sed
193323Sed  // If we are shifting less than a word, do it the easy way
193323Sed  if (shiftAmt < APINT_BITS_PER_WORD) {
193323Sed    uint64_t carry = 0;
193323Sed    for (unsigned i = 0; i < getNumWords(); i++) {
193323Sed      val[i] = pVal[i] << shiftAmt | carry;
193323Sed      carry = pVal[i] >> (APINT_BITS_PER_WORD - shiftAmt);
193323Sed    }
193323Sed    return APInt(val, BitWidth).clearUnusedBits();
193323Sed  }
193323Sed
193323Sed  // Compute some values needed by the remaining shift algorithms
193323Sed  unsigned wordShift = shiftAmt % APINT_BITS_PER_WORD;
193323Sed  unsigned offset = shiftAmt / APINT_BITS_PER_WORD;
193323Sed
193323Sed  // If we are shifting whole words, just move whole words
193323Sed  if (wordShift == 0) {
193323Sed    for (unsigned i = 0; i < offset; i++)
193323Sed      val[i] = 0;
193323Sed    for (unsigned i = offset; i < getNumWords(); i++)
193323Sed      val[i] = pVal[i-offset];
193323Sed    return APInt(val,BitWidth).clearUnusedBits();
193323Sed  }
193323Sed
193323Sed  // Copy whole words from this to Result.
193323Sed  unsigned i = getNumWords() - 1;
193323Sed  for (; i > offset; --i)
193323Sed    val[i] = pVal[i-offset] << wordShift |
193323Sed             pVal[i-offset-1] >> (APINT_BITS_PER_WORD - wordShift);
193323Sed  val[offset] = pVal[0] << wordShift;
193323Sed  for (i = 0; i < offset; ++i)
193323Sed    val[i] = 0;
193323Sed  return APInt(val, BitWidth).clearUnusedBits();
193323Sed}
193323Sed
193323SedAPInt APInt::rotl(const APInt &rotateAmt) const {
193323Sed  return rotl((unsigned)rotateAmt.getLimitedValue(BitWidth));
193323Sed}
193323Sed
193323SedAPInt APInt::rotl(unsigned rotateAmt) const {
234353Sdim  rotateAmt %= BitWidth;
193323Sed  if (rotateAmt == 0)
193323Sed    return *this;
234353Sdim  return shl(rotateAmt) | lshr(BitWidth - rotateAmt);
193323Sed}
193323Sed
193323SedAPInt APInt::rotr(const APInt &rotateAmt) const {
193323Sed  return rotr((unsigned)rotateAmt.getLimitedValue(BitWidth));
193323Sed}
193323Sed
193323SedAPInt APInt::rotr(unsigned rotateAmt) const {
234353Sdim  rotateAmt %= BitWidth;
193323Sed  if (rotateAmt == 0)
193323Sed    return *this;
234353Sdim  return lshr(rotateAmt) | shl(BitWidth - rotateAmt);
193323Sed}
193323Sed
193323Sed// Square Root - this method computes and returns the square root of "this".
193323Sed// Three mechanisms are used for computation. For small values (<= 5 bits),
193323Sed// a table lookup is done. This gets some performance for common cases. For
193323Sed// values using less than 52 bits, the value is converted to double and then
193323Sed// the libc sqrt function is called. The result is rounded and then converted
193323Sed// back to a uint64_t which is then used to construct the result. Finally,
198090Srdivacky// the Babylonian method for computing square roots is used.
193323SedAPInt APInt::sqrt() const {
193323Sed
193323Sed  // Determine the magnitude of the value.
193323Sed  unsigned magnitude = getActiveBits();
193323Sed
193323Sed  // Use a fast table for some small values. This also gets rid of some
193323Sed  // rounding errors in libc sqrt for small values.
193323Sed  if (magnitude <= 5) {
193323Sed    static const uint8_t results[32] = {
193323Sed      /*     0 */ 0,
193323Sed      /*  1- 2 */ 1, 1,
198090Srdivacky      /*  3- 6 */ 2, 2, 2, 2,
193323Sed      /*  7-12 */ 3, 3, 3, 3, 3, 3,
193323Sed      /* 13-20 */ 4, 4, 4, 4, 4, 4, 4, 4,
193323Sed      /* 21-30 */ 5, 5, 5, 5, 5, 5, 5, 5, 5, 5,
193323Sed      /*    31 */ 6
193323Sed    };
193323Sed    return APInt(BitWidth, results[ (isSingleWord() ? VAL : pVal[0]) ]);
193323Sed  }
193323Sed
193323Sed  // If the magnitude of the value fits in less than 52 bits (the precision of
193323Sed  // an IEEE double precision floating point value), then we can use the
193323Sed  // libc sqrt function which will probably use a hardware sqrt computation.
193323Sed  // This should be faster than the algorithm below.
193323Sed  if (magnitude < 52) {
208599Srdivacky#if HAVE_ROUND
198090Srdivacky    return APInt(BitWidth,
208599Srdivacky                 uint64_t(::round(::sqrt(double(isSingleWord()?VAL:pVal[0])))));
193323Sed#else
198090Srdivacky    return APInt(BitWidth,
223017Sdim                 uint64_t(::sqrt(double(isSingleWord()?VAL:pVal[0])) + 0.5));
193323Sed#endif
193323Sed  }
193323Sed
193323Sed  // Okay, all the short cuts are exhausted. We must compute it. The following
193323Sed  // is a classical Babylonian method for computing the square root. This code
193323Sed  // was adapted to APINt from a wikipedia article on such computations.
193323Sed  // See http://www.wikipedia.org/ and go to the page named
198090Srdivacky  // Calculate_an_integer_square_root.
193323Sed  unsigned nbits = BitWidth, i = 4;
193323Sed  APInt testy(BitWidth, 16);
193323Sed  APInt x_old(BitWidth, 1);
193323Sed  APInt x_new(BitWidth, 0);
193323Sed  APInt two(BitWidth, 2);
193323Sed
193323Sed  // Select a good starting value using binary logarithms.
198090Srdivacky  for (;; i += 2, testy = testy.shl(2))
193323Sed    if (i >= nbits || this->ule(testy)) {
193323Sed      x_old = x_old.shl(i / 2);
193323Sed      break;
193323Sed    }
193323Sed
198090Srdivacky  // Use the Babylonian method to arrive at the integer square root:
193323Sed  for (;;) {
193323Sed    x_new = (this->udiv(x_old) + x_old).udiv(two);
193323Sed    if (x_old.ule(x_new))
193323Sed      break;
193323Sed    x_old = x_new;
193323Sed  }
193323Sed
193323Sed  // Make sure we return the closest approximation
198090Srdivacky  // NOTE: The rounding calculation below is correct. It will produce an
193323Sed  // off-by-one discrepancy with results from pari/gp. That discrepancy has been
198090Srdivacky  // determined to be a rounding issue with pari/gp as it begins to use a
193323Sed  // floating point representation after 192 bits. There are no discrepancies
193323Sed  // between this algorithm and pari/gp for bit widths < 192 bits.
193323Sed  APInt square(x_old * x_old);
193323Sed  APInt nextSquare((x_old + 1) * (x_old +1));
193323Sed  if (this->ult(square))
193323Sed    return x_old;
234353Sdim  assert(this->ule(nextSquare) && "Error in APInt::sqrt computation");
234353Sdim  APInt midpoint((nextSquare - square).udiv(two));
234353Sdim  APInt offset(*this - square);
234353Sdim  if (offset.ult(midpoint))
234353Sdim    return x_old;
193323Sed  return x_old + 1;
193323Sed}
193323Sed
193323Sed/// Computes the multiplicative inverse of this APInt for a given modulo. The
193323Sed/// iterative extended Euclidean algorithm is used to solve for this value,
193323Sed/// however we simplify it to speed up calculating only the inverse, and take
193323Sed/// advantage of div+rem calculations. We also use some tricks to avoid copying
193323Sed/// (potentially large) APInts around.
193323SedAPInt APInt::multiplicativeInverse(const APInt& modulo) const {
193323Sed  assert(ult(modulo) && "This APInt must be smaller than the modulo");
193323Sed
193323Sed  // Using the properties listed at the following web page (accessed 06/21/08):
193323Sed  //   http://www.numbertheory.org/php/euclid.html
193323Sed  // (especially the properties numbered 3, 4 and 9) it can be proved that
193323Sed  // BitWidth bits suffice for all the computations in the algorithm implemented
193323Sed  // below. More precisely, this number of bits suffice if the multiplicative
193323Sed  // inverse exists, but may not suffice for the general extended Euclidean
193323Sed  // algorithm.
193323Sed
193323Sed  APInt r[2] = { modulo, *this };
193323Sed  APInt t[2] = { APInt(BitWidth, 0), APInt(BitWidth, 1) };
193323Sed  APInt q(BitWidth, 0);
198090Srdivacky
193323Sed  unsigned i;
193323Sed  for (i = 0; r[i^1] != 0; i ^= 1) {
193323Sed    // An overview of the math without the confusing bit-flipping:
193323Sed    // q = r[i-2] / r[i-1]
193323Sed    // r[i] = r[i-2] % r[i-1]
193323Sed    // t[i] = t[i-2] - t[i-1] * q
193323Sed    udivrem(r[i], r[i^1], q, r[i]);
193323Sed    t[i] -= t[i^1] * q;
193323Sed  }
193323Sed
193323Sed  // If this APInt and the modulo are not coprime, there is no multiplicative
193323Sed  // inverse, so return 0. We check this by looking at the next-to-last
193323Sed  // remainder, which is the gcd(*this,modulo) as calculated by the Euclidean
193323Sed  // algorithm.
193323Sed  if (r[i] != 1)
193323Sed    return APInt(BitWidth, 0);
193323Sed
193323Sed  // The next-to-last t is the multiplicative inverse.  However, we are
193323Sed  // interested in a positive inverse. Calcuate a positive one from a negative
193323Sed  // one if necessary. A simple addition of the modulo suffices because
193323Sed  // abs(t[i]) is known to be less than *this/2 (see the link above).
193323Sed  return t[i].isNegative() ? t[i] + modulo : t[i];
193323Sed}
193323Sed
193323Sed/// Calculate the magic numbers required to implement a signed integer division
193323Sed/// by a constant as a sequence of multiplies, adds and shifts.  Requires that
193323Sed/// the divisor not be 0, 1, or -1.  Taken from "Hacker's Delight", Henry S.
193323Sed/// Warren, Jr., chapter 10.
193323SedAPInt::ms APInt::magic() const {
193323Sed  const APInt& d = *this;
193323Sed  unsigned p;
193323Sed  APInt ad, anc, delta, q1, r1, q2, r2, t;
193323Sed  APInt signedMin = APInt::getSignedMinValue(d.getBitWidth());
193323Sed  struct ms mag;
198090Srdivacky
193323Sed  ad = d.abs();
193323Sed  t = signedMin + (d.lshr(d.getBitWidth() - 1));
193323Sed  anc = t - 1 - t.urem(ad);   // absolute value of nc
193323Sed  p = d.getBitWidth() - 1;    // initialize p
193323Sed  q1 = signedMin.udiv(anc);   // initialize q1 = 2p/abs(nc)
193323Sed  r1 = signedMin - q1*anc;    // initialize r1 = rem(2p,abs(nc))
193323Sed  q2 = signedMin.udiv(ad);    // initialize q2 = 2p/abs(d)
193323Sed  r2 = signedMin - q2*ad;     // initialize r2 = rem(2p,abs(d))
193323Sed  do {
193323Sed    p = p + 1;
193323Sed    q1 = q1<<1;          // update q1 = 2p/abs(nc)
193323Sed    r1 = r1<<1;          // update r1 = rem(2p/abs(nc))
193323Sed    if (r1.uge(anc)) {  // must be unsigned comparison
193323Sed      q1 = q1 + 1;
193323Sed      r1 = r1 - anc;
193323Sed    }
193323Sed    q2 = q2<<1;          // update q2 = 2p/abs(d)
193323Sed    r2 = r2<<1;          // update r2 = rem(2p/abs(d))
193323Sed    if (r2.uge(ad)) {   // must be unsigned comparison
193323Sed      q2 = q2 + 1;
193323Sed      r2 = r2 - ad;
193323Sed    }
193323Sed    delta = ad - r2;
219077Sdim  } while (q1.ult(delta) || (q1 == delta && r1 == 0));
198090Srdivacky
193323Sed  mag.m = q2 + 1;
193323Sed  if (d.isNegative()) mag.m = -mag.m;   // resulting magic number
193323Sed  mag.s = p - d.getBitWidth();          // resulting shift
193323Sed  return mag;
193323Sed}
193323Sed
193323Sed/// Calculate the magic numbers required to implement an unsigned integer
193323Sed/// division by a constant as a sequence of multiplies, adds and shifts.
193323Sed/// Requires that the divisor not be 0.  Taken from "Hacker's Delight", Henry
193323Sed/// S. Warren, Jr., chapter 10.
221345Sdim/// LeadingZeros can be used to simplify the calculation if the upper bits
221345Sdim/// of the divided value are known zero.
221345SdimAPInt::mu APInt::magicu(unsigned LeadingZeros) const {
193323Sed  const APInt& d = *this;
193323Sed  unsigned p;
193323Sed  APInt nc, delta, q1, r1, q2, r2;
193323Sed  struct mu magu;
193323Sed  magu.a = 0;               // initialize "add" indicator
221345Sdim  APInt allOnes = APInt::getAllOnesValue(d.getBitWidth()).lshr(LeadingZeros);
193323Sed  APInt signedMin = APInt::getSignedMinValue(d.getBitWidth());
193323Sed  APInt signedMax = APInt::getSignedMaxValue(d.getBitWidth());
193323Sed
239462Sdim  nc = allOnes - (allOnes - d).urem(d);
193323Sed  p = d.getBitWidth() - 1;  // initialize p
193323Sed  q1 = signedMin.udiv(nc);  // initialize q1 = 2p/nc
193323Sed  r1 = signedMin - q1*nc;   // initialize r1 = rem(2p,nc)
193323Sed  q2 = signedMax.udiv(d);   // initialize q2 = (2p-1)/d
193323Sed  r2 = signedMax - q2*d;    // initialize r2 = rem((2p-1),d)
193323Sed  do {
193323Sed    p = p + 1;
193323Sed    if (r1.uge(nc - r1)) {
193323Sed      q1 = q1 + q1 + 1;  // update q1
193323Sed      r1 = r1 + r1 - nc; // update r1
193323Sed    }
193323Sed    else {
193323Sed      q1 = q1+q1; // update q1
193323Sed      r1 = r1+r1; // update r1
193323Sed    }
193323Sed    if ((r2 + 1).uge(d - r2)) {
193323Sed      if (q2.uge(signedMax)) magu.a = 1;
193323Sed      q2 = q2+q2 + 1;     // update q2
193323Sed      r2 = r2+r2 + 1 - d; // update r2
193323Sed    }
193323Sed    else {
193323Sed      if (q2.uge(signedMin)) magu.a = 1;
193323Sed      q2 = q2+q2;     // update q2
193323Sed      r2 = r2+r2 + 1; // update r2
193323Sed    }
193323Sed    delta = d - 1 - r2;
193323Sed  } while (p < d.getBitWidth()*2 &&
193323Sed           (q1.ult(delta) || (q1 == delta && r1 == 0)));
193323Sed  magu.m = q2 + 1; // resulting magic number
193323Sed  magu.s = p - d.getBitWidth();  // resulting shift
193323Sed  return magu;
193323Sed}
193323Sed
193323Sed/// Implementation of Knuth's Algorithm D (Division of nonnegative integers)
193323Sed/// from "Art of Computer Programming, Volume 2", section 4.3.1, p. 272. The
193323Sed/// variables here have the same names as in the algorithm. Comments explain
193323Sed/// the algorithm and any deviation from it.
193323Sedstatic void KnuthDiv(unsigned *u, unsigned *v, unsigned *q, unsigned* r,
193323Sed                     unsigned m, unsigned n) {
193323Sed  assert(u && "Must provide dividend");
193323Sed  assert(v && "Must provide divisor");
193323Sed  assert(q && "Must provide quotient");
193323Sed  assert(u != v && u != q && v != q && "Must us different memory");
193323Sed  assert(n>1 && "n must be > 1");
193323Sed
  // Knuth uses the value b as the base of the number system. In our case the
  // digits are 32-bit words, so b is 2^32.
193323Sed  uint64_t b = uint64_t(1) << 32;
193323Sed
193323Sed#if 0
202375Srdivacky  DEBUG(dbgs() << "KnuthDiv: m=" << m << " n=" << n << '\n');
202375Srdivacky  DEBUG(dbgs() << "KnuthDiv: original:");
202375Srdivacky  DEBUG(for (int i = m+n; i >=0; i--) dbgs() << " " << u[i]);
202375Srdivacky  DEBUG(dbgs() << " by");
202375Srdivacky  DEBUG(for (int i = n; i >0; i--) dbgs() << " " << v[i-1]);
202375Srdivacky  DEBUG(dbgs() << '\n');
193323Sed#endif
198090Srdivacky  // D1. [Normalize.] Set d = b / (v[n-1] + 1) and multiply all the digits of
198090Srdivacky  // u and v by d. Note that we have taken Knuth's advice here to use a power
198090Srdivacky  // of 2 value for d such that d * v[n-1] >= b/2 (b is the base). A power of
198090Srdivacky  // 2 allows us to shift instead of multiply and it is easy to determine the
193323Sed  // shift amount from the leading zeros.  We are basically normalizing the u
193323Sed  // and v so that its high bits are shifted to the top of v's range without
193323Sed  // overflow. Note that this can require an extra word in u so that u must
193323Sed  // be of length m+n+1.
263508Sdim  unsigned shift = countLeadingZeros(v[n-1]);
193323Sed  unsigned v_carry = 0;
193323Sed  unsigned u_carry = 0;
193323Sed  if (shift) {
193323Sed    for (unsigned i = 0; i < m+n; ++i) {
193323Sed      unsigned u_tmp = u[i] >> (32 - shift);
193323Sed      u[i] = (u[i] << shift) | u_carry;
193323Sed      u_carry = u_tmp;
193323Sed    }
193323Sed    for (unsigned i = 0; i < n; ++i) {
193323Sed      unsigned v_tmp = v[i] >> (32 - shift);
193323Sed      v[i] = (v[i] << shift) | v_carry;
193323Sed      v_carry = v_tmp;
193323Sed    }
193323Sed  }
193323Sed  u[m+n] = u_carry;
193323Sed#if 0
202375Srdivacky  DEBUG(dbgs() << "KnuthDiv:   normal:");
202375Srdivacky  DEBUG(for (int i = m+n; i >=0; i--) dbgs() << " " << u[i]);
202375Srdivacky  DEBUG(dbgs() << " by");
202375Srdivacky  DEBUG(for (int i = n; i >0; i--) dbgs() << " " << v[i-1]);
202375Srdivacky  DEBUG(dbgs() << '\n');
193323Sed#endif
193323Sed
193323Sed  // D2. [Initialize j.]  Set j to m. This is the loop counter over the places.
193323Sed  int j = m;
193323Sed  do {
202375Srdivacky    DEBUG(dbgs() << "KnuthDiv: quotient digit #" << j << '\n');
198090Srdivacky    // D3. [Calculate q'.].
193323Sed    //     Set qp = (u[j+n]*b + u[j+n-1]) / v[n-1]. (qp=qprime=q')
193323Sed    //     Set rp = (u[j+n]*b + u[j+n-1]) % v[n-1]. (rp=rprime=r')
193323Sed    // Now test if qp == b or qp*v[n-2] > b*rp + u[j+n-2]; if so, decrease
193323Sed    // qp by 1, inrease rp by v[n-1], and repeat this test if rp < b. The test
193323Sed    // on v[n-2] determines at high speed most of the cases in which the trial
198090Srdivacky    // value qp is one too large, and it eliminates all cases where qp is two
198090Srdivacky    // too large.
193323Sed    uint64_t dividend = ((uint64_t(u[j+n]) << 32) + u[j+n-1]);
202375Srdivacky    DEBUG(dbgs() << "KnuthDiv: dividend == " << dividend << '\n');
193323Sed    uint64_t qp = dividend / v[n-1];
193323Sed    uint64_t rp = dividend % v[n-1];
193323Sed    if (qp == b || qp*v[n-2] > b*rp + u[j+n-2]) {
193323Sed      qp--;
193323Sed      rp += v[n-1];
193323Sed      if (rp < b && (qp == b || qp*v[n-2] > b*rp + u[j+n-2]))
193323Sed        qp--;
193323Sed    }
202375Srdivacky    DEBUG(dbgs() << "KnuthDiv: qp == " << qp << ", rp == " << rp << '\n');
193323Sed
193323Sed    // D4. [Multiply and subtract.] Replace (u[j+n]u[j+n-1]...u[j]) with
193323Sed    // (u[j+n]u[j+n-1]..u[j]) - qp * (v[n-1]...v[1]v[0]). This computation
193323Sed    // consists of a simple multiplication by a one-place number, combined with
198090Srdivacky    // a subtraction.
193323Sed    bool isNeg = false;
193323Sed    for (unsigned i = 0; i < n; ++i) {
193323Sed      uint64_t u_tmp = uint64_t(u[j+i]) | (uint64_t(u[j+i+1]) << 32);
193323Sed      uint64_t subtrahend = uint64_t(qp) * uint64_t(v[i]);
193323Sed      bool borrow = subtrahend > u_tmp;
202375Srdivacky      DEBUG(dbgs() << "KnuthDiv: u_tmp == " << u_tmp
198090Srdivacky                   << ", subtrahend == " << subtrahend
198090Srdivacky                   << ", borrow = " << borrow << '\n');
193323Sed
193323Sed      uint64_t result = u_tmp - subtrahend;
193323Sed      unsigned k = j + i;
193323Sed      u[k++] = (unsigned)(result & (b-1)); // subtract low word
193323Sed      u[k++] = (unsigned)(result >> 32);   // subtract high word
193323Sed      while (borrow && k <= m+n) { // deal with borrow to the left
193323Sed        borrow = u[k] == 0;
193323Sed        u[k]--;
193323Sed        k++;
193323Sed      }
193323Sed      isNeg |= borrow;
202375Srdivacky      DEBUG(dbgs() << "KnuthDiv: u[j+i] == " << u[j+i] << ",  u[j+i+1] == " <<
198090Srdivacky                    u[j+i+1] << '\n');
193323Sed    }
202375Srdivacky    DEBUG(dbgs() << "KnuthDiv: after subtraction:");
202375Srdivacky    DEBUG(for (int i = m+n; i >=0; i--) dbgs() << " " << u[i]);
202375Srdivacky    DEBUG(dbgs() << '\n');
198090Srdivacky    // The digits (u[j+n]...u[j]) should be kept positive; if the result of
198090Srdivacky    // this step is actually negative, (u[j+n]...u[j]) should be left as the
193323Sed    // true value plus b**(n+1), namely as the b's complement of
193323Sed    // the true value, and a "borrow" to the left should be remembered.
193323Sed    //
193323Sed    if (isNeg) {
193323Sed      bool carry = true;  // true because b's complement is "complement + 1"
193323Sed      for (unsigned i = 0; i <= m+n; ++i) {
193323Sed        u[i] = ~u[i] + carry; // b's complement
193323Sed        carry = carry && u[i] == 0;
193323Sed      }
193323Sed    }
202375Srdivacky    DEBUG(dbgs() << "KnuthDiv: after complement:");
202375Srdivacky    DEBUG(for (int i = m+n; i >=0; i--) dbgs() << " " << u[i]);
202375Srdivacky    DEBUG(dbgs() << '\n');
193323Sed
198090Srdivacky    // D5. [Test remainder.] Set q[j] = qp. If the result of step D4 was
193323Sed    // negative, go to step D6; otherwise go on to step D7.
193323Sed    q[j] = (unsigned)qp;
193323Sed    if (isNeg) {
198090Srdivacky      // D6. [Add back]. The probability that this step is necessary is very
193323Sed      // small, on the order of only 2/b. Make sure that test data accounts for
198090Srdivacky      // this possibility. Decrease q[j] by 1
193323Sed      q[j]--;
198090Srdivacky      // and add (0v[n-1]...v[1]v[0]) to (u[j+n]u[j+n-1]...u[j+1]u[j]).
198090Srdivacky      // A carry will occur to the left of u[j+n], and it should be ignored
193323Sed      // since it cancels with the borrow that occurred in D4.
193323Sed      bool carry = false;
193323Sed      for (unsigned i = 0; i < n; i++) {
193323Sed        unsigned limit = std::min(u[j+i],v[i]);
193323Sed        u[j+i] += v[i] + carry;
193323Sed        carry = u[j+i] < limit || (carry && u[j+i] == limit);
193323Sed      }
193323Sed      u[j+n] += carry;
193323Sed    }
202375Srdivacky    DEBUG(dbgs() << "KnuthDiv: after correction:");
202375Srdivacky    DEBUG(for (int i = m+n; i >=0; i--) dbgs() <<" " << u[i]);
202375Srdivacky    DEBUG(dbgs() << "\nKnuthDiv: digit result = " << q[j] << '\n');
193323Sed
193323Sed  // D7. [Loop on j.]  Decrease j by one. Now if j >= 0, go back to D3.
193323Sed  } while (--j >= 0);
193323Sed
202375Srdivacky  DEBUG(dbgs() << "KnuthDiv: quotient:");
202375Srdivacky  DEBUG(for (int i = m; i >=0; i--) dbgs() <<" " << q[i]);
202375Srdivacky  DEBUG(dbgs() << '\n');
193323Sed
193323Sed  // D8. [Unnormalize]. Now q[...] is the desired quotient, and the desired
193323Sed  // remainder may be obtained by dividing u[...] by d. If r is non-null we
193323Sed  // compute the remainder (urem uses this).
193323Sed  if (r) {
193323Sed    // The value d is expressed by the "shift" value above since we avoided
193323Sed    // multiplication by d by using a shift left. So, all we have to do is
193323Sed    // shift right here. In order to mak
193323Sed    if (shift) {
193323Sed      unsigned carry = 0;
202375Srdivacky      DEBUG(dbgs() << "KnuthDiv: remainder:");
193323Sed      for (int i = n-1; i >= 0; i--) {
193323Sed        r[i] = (u[i] >> shift) | carry;
193323Sed        carry = u[i] << (32 - shift);
202375Srdivacky        DEBUG(dbgs() << " " << r[i]);
193323Sed      }
193323Sed    } else {
193323Sed      for (int i = n-1; i >= 0; i--) {
193323Sed        r[i] = u[i];
202375Srdivacky        DEBUG(dbgs() << " " << r[i]);
193323Sed      }
193323Sed    }
202375Srdivacky    DEBUG(dbgs() << '\n');
193323Sed  }
193323Sed#if 0
202375Srdivacky  DEBUG(dbgs() << '\n');
193323Sed#endif
193323Sed}
193323Sed
/// Unsigned long division of LHS by RHS, shared by udiv, urem, udivrem and
/// toString.
///
/// \param LHS       dividend (taken by value).
/// \param lhsWords  number of 64-bit words of LHS to divide; must be at least
///                  rhsWords.
/// \param RHS       divisor; must not be zero.
/// \param rhsWords  number of 64-bit words of RHS to use.
/// \param Quotient  if non-null, receives the quotient; it is resized to
///                  LHS's bit width.
/// \param Remainder if non-null, receives the remainder; it is resized to
///                  RHS's bit width.
193323Sedvoid APInt::divide(const APInt LHS, unsigned lhsWords,
193323Sed                   const APInt &RHS, unsigned rhsWords,
193323Sed                   APInt *Quotient, APInt *Remainder)
193323Sed{
193323Sed  assert(lhsWords >= rhsWords && "Fractional result");
193323Sed
198090Srdivacky  // First, compose the values into an array of 32-bit words instead of
193323Sed  // 64-bit words. This is a necessity of both the "short division" algorithm
203954Srdivacky  // and the Knuth "classical algorithm" which requires there to be native
198090Srdivacky  // operations for +, -, and * on an m bit value with an m*2 bit result. We
198090Srdivacky  // can't use 64-bit operands here because we don't have native results of
198090Srdivacky  // 128-bits. Furthermore, casting the 64-bit values to 32-bit values won't
193323Sed  // work on big-endian machines.
193323Sed  uint64_t mask = ~0ull >> (sizeof(unsigned)*CHAR_BIT);
  // n is the divisor length and m+n the dividend length, both counted in
  // 32-bit digits.
193323Sed  unsigned n = rhsWords * 2;
193323Sed  unsigned m = (lhsWords * 2) - n;
193323Sed
193323Sed  // Allocate space for the temporary values we need either on the stack, if
193323Sed  // it will fit, or on the heap if it won't.
  // Digits needed: U takes m+n+1, V takes n, Q takes m+n and, only when a
  // remainder is requested, R takes n.
193323Sed  unsigned SPACE[128];
193323Sed  unsigned *U = 0;
193323Sed  unsigned *V = 0;
193323Sed  unsigned *Q = 0;
193323Sed  unsigned *R = 0;
193323Sed  if ((Remainder?4:3)*n+2*m+1 <= 128) {
    // Carve the four arrays out of SPACE back to back: U, V, Q, then R.
193323Sed    U = &SPACE[0];
193323Sed    V = &SPACE[m+n+1];
193323Sed    Q = &SPACE[(m+n+1) + n];
193323Sed    if (Remainder)
193323Sed      R = &SPACE[(m+n+1) + n + (m+n)];
193323Sed  } else {
193323Sed    U = new unsigned[m + n + 1];
193323Sed    V = new unsigned[n];
193323Sed    Q = new unsigned[m+n];
193323Sed    if (Remainder)
193323Sed      R = new unsigned[n];
193323Sed  }
193323Sed
193323Sed  // Initialize the dividend
193323Sed  memset(U, 0, (m+n+1)*sizeof(unsigned));
193323Sed  for (unsigned i = 0; i < lhsWords; ++i) {
    // Each 64-bit word becomes two 32-bit digits, low half first.
193323Sed    uint64_t tmp = (LHS.getNumWords() == 1 ? LHS.VAL : LHS.pVal[i]);
193323Sed    U[i * 2] = (unsigned)(tmp & mask);
193323Sed    U[i * 2 + 1] = (unsigned)(tmp >> (sizeof(unsigned)*CHAR_BIT));
193323Sed  }
193323Sed  U[m+n] = 0; // this extra word is for "spill" in the Knuth algorithm.
193323Sed
193323Sed  // Initialize the divisor
193323Sed  memset(V, 0, (n)*sizeof(unsigned));
193323Sed  for (unsigned i = 0; i < rhsWords; ++i) {
193323Sed    uint64_t tmp = (RHS.getNumWords() == 1 ? RHS.VAL : RHS.pVal[i]);
193323Sed    V[i * 2] = (unsigned)(tmp & mask);
193323Sed    V[i * 2 + 1] = (unsigned)(tmp >> (sizeof(unsigned)*CHAR_BIT));
193323Sed  }
193323Sed
193323Sed  // initialize the quotient and remainder
193323Sed  memset(Q, 0, (m+n) * sizeof(unsigned));
193323Sed  if (Remainder)
193323Sed    memset(R, 0, n * sizeof(unsigned));
193323Sed
198090Srdivacky  // Now, adjust m and n for the Knuth division. n is the number of words in
193323Sed  // the divisor. m is the number of words by which the dividend exceeds the
198090Srdivacky  // divisor (i.e. m+n is the length of the dividend). These sizes must not
193323Sed  // contain any zero words or the Knuth algorithm fails.
  // Dropping a leading zero digit of V keeps m+n (the dividend length) fixed,
  // so m grows by one for each digit n loses.
193323Sed  for (unsigned i = n; i > 0 && V[i-1] == 0; i--) {
193323Sed    n--;
193323Sed    m++;
193323Sed  }
  // Then drop the leading zero digits of the dividend itself.
193323Sed  for (unsigned i = m+n; i > 0 && U[i-1] == 0; i--)
193323Sed    m--;
193323Sed
193323Sed  // If we're left with only a single word for the divisor, Knuth doesn't work
193323Sed  // so we implement the short division algorithm here. This is much simpler
193323Sed  // and faster because we are certain that we can divide a 64-bit quantity
193323Sed  // by a 32-bit quantity at hardware speed and short division is simply a
193323Sed  // series of such operations. This is just like doing short division but we
193323Sed  // are using base 2^32 instead of base 10.
193323Sed  assert(n != 0 && "Divide by zero?");
193323Sed  if (n == 1) {
193323Sed    unsigned divisor = V[0];
193323Sed    unsigned remainder = 0;
    // Walk from the most significant digit down, carrying the running
    // remainder into the high half of the next partial dividend.
193323Sed    for (int i = m+n-1; i >= 0; i--) {
193323Sed      uint64_t partial_dividend = uint64_t(remainder) << 32 | U[i];
193323Sed      if (partial_dividend == 0) {
193323Sed        Q[i] = 0;
193323Sed        remainder = 0;
193323Sed      } else if (partial_dividend < divisor) {
193323Sed        Q[i] = 0;
193323Sed        remainder = (unsigned)partial_dividend;
193323Sed      } else if (partial_dividend == divisor) {
193323Sed        Q[i] = 1;
193323Sed        remainder = 0;
193323Sed      } else {
193323Sed        Q[i] = (unsigned)(partial_dividend / divisor);
        // Q[i] * divisor is a 32-bit product that may wrap; only the low 32
        // bits of the difference are kept, which is all the remainder needs.
193323Sed        remainder = (unsigned)(partial_dividend - (Q[i] * divisor));
193323Sed      }
193323Sed    }
193323Sed    if (R)
193323Sed      R[0] = remainder;
193323Sed  } else {
193323Sed    // Now we're ready to invoke the Knuth classical divide algorithm. In this
193323Sed    // case n > 1.
193323Sed    KnuthDiv(U, V, Q, R, m, n);
193323Sed  }
193323Sed
193323Sed  // If the caller wants the quotient
193323Sed  if (Quotient) {
193323Sed    // Set up the Quotient value's memory.
193323Sed    if (Quotient->BitWidth != LHS.BitWidth) {
      // Release the old storage first: isSingleWord() depends on BitWidth, so
      // it has to be queried before BitWidth changes and again afterwards.
193323Sed      if (Quotient->isSingleWord())
193323Sed        Quotient->VAL = 0;
193323Sed      else
193323Sed        delete [] Quotient->pVal;
193323Sed      Quotient->BitWidth = LHS.BitWidth;
193323Sed      if (!Quotient->isSingleWord())
193323Sed        Quotient->pVal = getClearedMemory(Quotient->getNumWords());
193323Sed    } else
218893Sdim      Quotient->clearAllBits();
193323Sed
198090Srdivacky    // The quotient is in Q. Reconstitute the quotient into Quotient's low
193323Sed    // order words.
193323Sed    if (lhsWords == 1) {
198090Srdivacky      uint64_t tmp =
193323Sed        uint64_t(Q[0]) | (uint64_t(Q[1]) << (APINT_BITS_PER_WORD / 2));
193323Sed      if (Quotient->isSingleWord())
193323Sed        Quotient->VAL = tmp;
193323Sed      else
193323Sed        Quotient->pVal[0] = tmp;
193323Sed    } else {
193323Sed      assert(!Quotient->isSingleWord() && "Quotient APInt not large enough");
193323Sed      for (unsigned i = 0; i < lhsWords; ++i)
198090Srdivacky        Quotient->pVal[i] =
193323Sed          uint64_t(Q[i*2]) | (uint64_t(Q[i*2+1]) << (APINT_BITS_PER_WORD / 2));
193323Sed    }
193323Sed  }
193323Sed
193323Sed  // If the caller wants the remainder
193323Sed  if (Remainder) {
193323Sed    // Set up the Remainder value's memory.
193323Sed    if (Remainder->BitWidth != RHS.BitWidth) {
193323Sed      if (Remainder->isSingleWord())
193323Sed        Remainder->VAL = 0;
193323Sed      else
193323Sed        delete [] Remainder->pVal;
193323Sed      Remainder->BitWidth = RHS.BitWidth;
193323Sed      if (!Remainder->isSingleWord())
193323Sed        Remainder->pVal = getClearedMemory(Remainder->getNumWords());
193323Sed    } else
218893Sdim      Remainder->clearAllBits();
193323Sed
193323Sed    // The remainder is in R. Reconstitute the remainder into Remainder's low
193323Sed    // order words.
193323Sed    if (rhsWords == 1) {
198090Srdivacky      uint64_t tmp =
193323Sed        uint64_t(R[0]) | (uint64_t(R[1]) << (APINT_BITS_PER_WORD / 2));
193323Sed      if (Remainder->isSingleWord())
193323Sed        Remainder->VAL = tmp;
193323Sed      else
193323Sed        Remainder->pVal[0] = tmp;
193323Sed    } else {
193323Sed      assert(!Remainder->isSingleWord() && "Remainder APInt not large enough");
193323Sed      for (unsigned i = 0; i < rhsWords; ++i)
198090Srdivacky        Remainder->pVal[i] =
193323Sed          uint64_t(R[i*2]) | (uint64_t(R[i*2+1]) << (APINT_BITS_PER_WORD / 2));
193323Sed    }
193323Sed  }
193323Sed
193323Sed  // Clean up the memory we allocated.
  // U points at SPACE exactly when the stack buffer was used, in which case
  // none of the four arrays came from the heap.
193323Sed  if (U != &SPACE[0]) {
193323Sed    delete [] U;
193323Sed    delete [] V;
193323Sed    delete [] Q;
193323Sed    delete [] R;
193323Sed  }
193323Sed}
193323Sed
193323SedAPInt APInt::udiv(const APInt& RHS) const {
193323Sed  assert(BitWidth == RHS.BitWidth && "Bit widths must be the same");
193323Sed
193323Sed  // First, deal with the easy case
193323Sed  if (isSingleWord()) {
193323Sed    assert(RHS.VAL != 0 && "Divide by zero?");
193323Sed    return APInt(BitWidth, VAL / RHS.VAL);
193323Sed  }
193323Sed
193323Sed  // Get some facts about the LHS and RHS number of bits and words
193323Sed  unsigned rhsBits = RHS.getActiveBits();
193323Sed  unsigned rhsWords = !rhsBits ? 0 : (APInt::whichWord(rhsBits - 1) + 1);
193323Sed  assert(rhsWords && "Divided by zero???");
193323Sed  unsigned lhsBits = this->getActiveBits();
193323Sed  unsigned lhsWords = !lhsBits ? 0 : (APInt::whichWord(lhsBits - 1) + 1);
193323Sed
193323Sed  // Deal with some degenerate cases
198090Srdivacky  if (!lhsWords)
193323Sed    // 0 / X ===> 0
198090Srdivacky    return APInt(BitWidth, 0);
193323Sed  else if (lhsWords < rhsWords || this->ult(RHS)) {
193323Sed    // X / Y ===> 0, iff X < Y
193323Sed    return APInt(BitWidth, 0);
193323Sed  } else if (*this == RHS) {
193323Sed    // X / X ===> 1
193323Sed    return APInt(BitWidth, 1);
193323Sed  } else if (lhsWords == 1 && rhsWords == 1) {
193323Sed    // All high words are zero, just use native divide
193323Sed    return APInt(BitWidth, this->pVal[0] / RHS.pVal[0]);
193323Sed  }
193323Sed
193323Sed  // We have to compute it the hard way. Invoke the Knuth divide algorithm.
193323Sed  APInt Quotient(1,0); // to hold result.
193323Sed  divide(*this, lhsWords, RHS, rhsWords, &Quotient, 0);
193323Sed  return Quotient;
193323Sed}
193323Sed
249423SdimAPInt APInt::sdiv(const APInt &RHS) const {
249423Sdim  if (isNegative()) {
249423Sdim    if (RHS.isNegative())
249423Sdim      return (-(*this)).udiv(-RHS);
249423Sdim    return -((-(*this)).udiv(RHS));
249423Sdim  }
249423Sdim  if (RHS.isNegative())
249423Sdim    return -(this->udiv(-RHS));
249423Sdim  return this->udiv(RHS);
249423Sdim}
249423Sdim
193323SedAPInt APInt::urem(const APInt& RHS) const {
193323Sed  assert(BitWidth == RHS.BitWidth && "Bit widths must be the same");
193323Sed  if (isSingleWord()) {
193323Sed    assert(RHS.VAL != 0 && "Remainder by zero?");
193323Sed    return APInt(BitWidth, VAL % RHS.VAL);
193323Sed  }
193323Sed
193323Sed  // Get some facts about the LHS
193323Sed  unsigned lhsBits = getActiveBits();
193323Sed  unsigned lhsWords = !lhsBits ? 0 : (whichWord(lhsBits - 1) + 1);
193323Sed
193323Sed  // Get some facts about the RHS
193323Sed  unsigned rhsBits = RHS.getActiveBits();
193323Sed  unsigned rhsWords = !rhsBits ? 0 : (APInt::whichWord(rhsBits - 1) + 1);
193323Sed  assert(rhsWords && "Performing remainder operation by zero ???");
193323Sed
193323Sed  // Check the degenerate cases
193323Sed  if (lhsWords == 0) {
193323Sed    // 0 % Y ===> 0
193323Sed    return APInt(BitWidth, 0);
193323Sed  } else if (lhsWords < rhsWords || this->ult(RHS)) {
193323Sed    // X % Y ===> X, iff X < Y
193323Sed    return *this;
193323Sed  } else if (*this == RHS) {
193323Sed    // X % X == 0;
193323Sed    return APInt(BitWidth, 0);
193323Sed  } else if (lhsWords == 1) {
193323Sed    // All high words are zero, just use native remainder
193323Sed    return APInt(BitWidth, pVal[0] % RHS.pVal[0]);
193323Sed  }
193323Sed
193323Sed  // We have to compute it the hard way. Invoke the Knuth divide algorithm.
193323Sed  APInt Remainder(1,0);
193323Sed  divide(*this, lhsWords, RHS, rhsWords, 0, &Remainder);
193323Sed  return Remainder;
193323Sed}
193323Sed
249423SdimAPInt APInt::srem(const APInt &RHS) const {
249423Sdim  if (isNegative()) {
249423Sdim    if (RHS.isNegative())
249423Sdim      return -((-(*this)).urem(-RHS));
249423Sdim    return -((-(*this)).urem(RHS));
249423Sdim  }
249423Sdim  if (RHS.isNegative())
249423Sdim    return this->urem(-RHS);
249423Sdim  return this->urem(RHS);
249423Sdim}
249423Sdim
198090Srdivackyvoid APInt::udivrem(const APInt &LHS, const APInt &RHS,
193323Sed                    APInt &Quotient, APInt &Remainder) {
193323Sed  // Get some size facts about the dividend and divisor
193323Sed  unsigned lhsBits  = LHS.getActiveBits();
193323Sed  unsigned lhsWords = !lhsBits ? 0 : (APInt::whichWord(lhsBits - 1) + 1);
193323Sed  unsigned rhsBits  = RHS.getActiveBits();
193323Sed  unsigned rhsWords = !rhsBits ? 0 : (APInt::whichWord(rhsBits - 1) + 1);
193323Sed
193323Sed  // Check the degenerate cases
198090Srdivacky  if (lhsWords == 0) {
193323Sed    Quotient = 0;                // 0 / Y ===> 0
193323Sed    Remainder = 0;               // 0 % Y ===> 0
193323Sed    return;
198090Srdivacky  }
198090Srdivacky
198090Srdivacky  if (lhsWords < rhsWords || LHS.ult(RHS)) {
201360Srdivacky    Remainder = LHS;            // X % Y ===> X, iff X < Y
193323Sed    Quotient = 0;               // X / Y ===> 0, iff X < Y
193323Sed    return;
198090Srdivacky  }
198090Srdivacky
193323Sed  if (LHS == RHS) {
193323Sed    Quotient  = 1;              // X / X ===> 1
193323Sed    Remainder = 0;              // X % X ===> 0;
193323Sed    return;
198090Srdivacky  }
198090Srdivacky
193323Sed  if (lhsWords == 1 && rhsWords == 1) {
193323Sed    // There is only one word to consider so use the native versions.
193323Sed    uint64_t lhsValue = LHS.isSingleWord() ? LHS.VAL : LHS.pVal[0];
193323Sed    uint64_t rhsValue = RHS.isSingleWord() ? RHS.VAL : RHS.pVal[0];
193323Sed    Quotient = APInt(LHS.getBitWidth(), lhsValue / rhsValue);
193323Sed    Remainder = APInt(LHS.getBitWidth(), lhsValue % rhsValue);
193323Sed    return;
193323Sed  }
193323Sed
193323Sed  // Okay, lets do it the long way
193323Sed  divide(LHS, lhsWords, RHS, rhsWords, &Quotient, &Remainder);
193323Sed}
193323Sed
249423Sdimvoid APInt::sdivrem(const APInt &LHS, const APInt &RHS,
249423Sdim                    APInt &Quotient, APInt &Remainder) {
249423Sdim  if (LHS.isNegative()) {
249423Sdim    if (RHS.isNegative())
249423Sdim      APInt::udivrem(-LHS, -RHS, Quotient, Remainder);
249423Sdim    else {
249423Sdim      APInt::udivrem(-LHS, RHS, Quotient, Remainder);
249423Sdim      Quotient = -Quotient;
249423Sdim    }
249423Sdim    Remainder = -Remainder;
249423Sdim  } else if (RHS.isNegative()) {
249423Sdim    APInt::udivrem(LHS, -RHS, Quotient, Remainder);
249423Sdim    Quotient = -Quotient;
249423Sdim  } else {
249423Sdim    APInt::udivrem(LHS, RHS, Quotient, Remainder);
249423Sdim  }
249423Sdim}
249423Sdim
218893SdimAPInt APInt::sadd_ov(const APInt &RHS, bool &Overflow) const {
218893Sdim  APInt Res = *this+RHS;
218893Sdim  Overflow = isNonNegative() == RHS.isNonNegative() &&
218893Sdim             Res.isNonNegative() != isNonNegative();
218893Sdim  return Res;
218893Sdim}
218893Sdim
218893SdimAPInt APInt::uadd_ov(const APInt &RHS, bool &Overflow) const {
218893Sdim  APInt Res = *this+RHS;
218893Sdim  Overflow = Res.ult(RHS);
218893Sdim  return Res;
218893Sdim}
218893Sdim
218893SdimAPInt APInt::ssub_ov(const APInt &RHS, bool &Overflow) const {
218893Sdim  APInt Res = *this - RHS;
218893Sdim  Overflow = isNonNegative() != RHS.isNonNegative() &&
218893Sdim             Res.isNonNegative() != isNonNegative();
218893Sdim  return Res;
218893Sdim}
218893Sdim
218893SdimAPInt APInt::usub_ov(const APInt &RHS, bool &Overflow) const {
218893Sdim  APInt Res = *this-RHS;
218893Sdim  Overflow = Res.ugt(*this);
218893Sdim  return Res;
218893Sdim}
218893Sdim
218893SdimAPInt APInt::sdiv_ov(const APInt &RHS, bool &Overflow) const {
218893Sdim  // MININT/-1  -->  overflow.
218893Sdim  Overflow = isMinSignedValue() && RHS.isAllOnesValue();
218893Sdim  return sdiv(RHS);
218893Sdim}
218893Sdim
218893SdimAPInt APInt::smul_ov(const APInt &RHS, bool &Overflow) const {
218893Sdim  APInt Res = *this * RHS;
218893Sdim
218893Sdim  if (*this != 0 && RHS != 0)
218893Sdim    Overflow = Res.sdiv(RHS) != *this || Res.sdiv(*this) != RHS;
218893Sdim  else
218893Sdim    Overflow = false;
218893Sdim  return Res;
218893Sdim}
218893Sdim
221345SdimAPInt APInt::umul_ov(const APInt &RHS, bool &Overflow) const {
221345Sdim  APInt Res = *this * RHS;
221345Sdim
221345Sdim  if (*this != 0 && RHS != 0)
221345Sdim    Overflow = Res.udiv(RHS) != *this || Res.udiv(*this) != RHS;
221345Sdim  else
221345Sdim    Overflow = false;
221345Sdim  return Res;
221345Sdim}
221345Sdim
218893SdimAPInt APInt::sshl_ov(unsigned ShAmt, bool &Overflow) const {
218893Sdim  Overflow = ShAmt >= getBitWidth();
218893Sdim  if (Overflow)
218893Sdim    ShAmt = getBitWidth()-1;
218893Sdim
218893Sdim  if (isNonNegative()) // Don't allow sign change.
218893Sdim    Overflow = ShAmt >= countLeadingZeros();
218893Sdim  else
218893Sdim    Overflow = ShAmt >= countLeadingOnes();
218893Sdim
218893Sdim  return *this << ShAmt;
218893Sdim}
218893Sdim
218893Sdim
218893Sdim
218893Sdim
210299Sedvoid APInt::fromString(unsigned numbits, StringRef str, uint8_t radix) {
193323Sed  // Check our assumptions here
198090Srdivacky  assert(!str.empty() && "Invalid string length");
226633Sdim  assert((radix == 10 || radix == 8 || radix == 16 || radix == 2 ||
226633Sdim          radix == 36) &&
226633Sdim         "Radix should be 2, 8, 10, 16, or 36!");
198090Srdivacky
198090Srdivacky  StringRef::iterator p = str.begin();
198090Srdivacky  size_t slen = str.size();
198090Srdivacky  bool isNeg = *p == '-';
198090Srdivacky  if (*p == '-' || *p == '+') {
198090Srdivacky    p++;
198090Srdivacky    slen--;
198090Srdivacky    assert(slen && "String is only a sign, needs a value.");
198090Srdivacky  }
193323Sed  assert((slen <= numbits || radix != 2) && "Insufficient bit width");
193323Sed  assert(((slen-1)*3 <= numbits || radix != 8) && "Insufficient bit width");
193323Sed  assert(((slen-1)*4 <= numbits || radix != 16) && "Insufficient bit width");
206083Srdivacky  assert((((slen-1)*64)/22 <= numbits || radix != 10) &&
206083Srdivacky         "Insufficient bit width");
193323Sed
193323Sed  // Allocate memory
193323Sed  if (!isSingleWord())
193323Sed    pVal = getClearedMemory(getNumWords());
193323Sed
193323Sed  // Figure out if we can shift instead of multiply
193323Sed  unsigned shift = (radix == 16 ? 4 : radix == 8 ? 3 : radix == 2 ? 1 : 0);
193323Sed
193323Sed  // Set up an APInt for the digit to add outside the loop so we don't
193323Sed  // constantly construct/destruct it.
193323Sed  APInt apdigit(getBitWidth(), 0);
193323Sed  APInt apradix(getBitWidth(), radix);
193323Sed
193323Sed  // Enter digit traversal loop
198090Srdivacky  for (StringRef::iterator e = str.end(); p != e; ++p) {
198090Srdivacky    unsigned digit = getDigit(*p, radix);
198090Srdivacky    assert(digit < radix && "Invalid character in digit string");
193323Sed
193323Sed    // Shift or multiply the value by the radix
193323Sed    if (slen > 1) {
193323Sed      if (shift)
193323Sed        *this <<= shift;
193323Sed      else
193323Sed        *this *= apradix;
193323Sed    }
193323Sed
193323Sed    // Add in the digit we just interpreted
193323Sed    if (apdigit.isSingleWord())
193323Sed      apdigit.VAL = digit;
193323Sed    else
193323Sed      apdigit.pVal[0] = digit;
193323Sed    *this += apdigit;
193323Sed  }
193323Sed  // If its negative, put it in two's complement form
193323Sed  if (isNeg) {
249423Sdim    --(*this);
218893Sdim    this->flipAllBits();
193323Sed  }
193323Sed}
193323Sed
193323Sedvoid APInt::toString(SmallVectorImpl<char> &Str, unsigned Radix,
224145Sdim                     bool Signed, bool formatAsCLiteral) const {
226633Sdim  assert((Radix == 10 || Radix == 8 || Radix == 16 || Radix == 2 ||
226633Sdim          Radix == 36) &&
234353Sdim         "Radix should be 2, 8, 10, 16, or 36!");
198090Srdivacky
224145Sdim  const char *Prefix = "";
224145Sdim  if (formatAsCLiteral) {
224145Sdim    switch (Radix) {
224145Sdim      case 2:
224145Sdim        // Binary literals are a non-standard extension added in gcc 4.3:
224145Sdim        // http://gcc.gnu.org/onlinedocs/gcc-4.3.0/gcc/Binary-constants.html
224145Sdim        Prefix = "0b";
224145Sdim        break;
224145Sdim      case 8:
224145Sdim        Prefix = "0";
224145Sdim        break;
234353Sdim      case 10:
234353Sdim        break; // No prefix
224145Sdim      case 16:
224145Sdim        Prefix = "0x";
224145Sdim        break;
234353Sdim      default:
234353Sdim        llvm_unreachable("Invalid radix!");
224145Sdim    }
224145Sdim  }
224145Sdim
193323Sed  // First, check for a zero value and just short circuit the logic below.
193323Sed  if (*this == 0) {
224145Sdim    while (*Prefix) {
224145Sdim      Str.push_back(*Prefix);
224145Sdim      ++Prefix;
224145Sdim    };
193323Sed    Str.push_back('0');
193323Sed    return;
193323Sed  }
198090Srdivacky
226633Sdim  static const char Digits[] = "0123456789ABCDEFGHIJKLMNOPQRSTUVWXYZ";
198090Srdivacky
193323Sed  if (isSingleWord()) {
193323Sed    char Buffer[65];
193323Sed    char *BufPtr = Buffer+65;
198090Srdivacky
193323Sed    uint64_t N;
212904Sdim    if (!Signed) {
212904Sdim      N = getZExtValue();
212904Sdim    } else {
193323Sed      int64_t I = getSExtValue();
212904Sdim      if (I >= 0) {
212904Sdim        N = I;
212904Sdim      } else {
193323Sed        Str.push_back('-');
212904Sdim        N = -(uint64_t)I;
193323Sed      }
193323Sed    }
198090Srdivacky
224145Sdim    while (*Prefix) {
224145Sdim      Str.push_back(*Prefix);
224145Sdim      ++Prefix;
224145Sdim    };
224145Sdim
193323Sed    while (N) {
193323Sed      *--BufPtr = Digits[N % Radix];
193323Sed      N /= Radix;
193323Sed    }
193323Sed    Str.append(BufPtr, Buffer+65);
193323Sed    return;
193323Sed  }
193323Sed
193323Sed  APInt Tmp(*this);
198090Srdivacky
193323Sed  if (Signed && isNegative()) {
193323Sed    // They want to print the signed version and it is a negative value
193323Sed    // Flip the bits and add one to turn it into the equivalent positive
193323Sed    // value and put a '-' in the result.
218893Sdim    Tmp.flipAllBits();
249423Sdim    ++Tmp;
193323Sed    Str.push_back('-');
193323Sed  }
198090Srdivacky
224145Sdim  while (*Prefix) {
224145Sdim    Str.push_back(*Prefix);
224145Sdim    ++Prefix;
224145Sdim  };
224145Sdim
193323Sed  // We insert the digits backward, then reverse them to get the right order.
193323Sed  unsigned StartDig = Str.size();
198090Srdivacky
198090Srdivacky  // For the 2, 8 and 16 bit cases, we can just shift instead of divide
198090Srdivacky  // because the number of bits per digit (1, 3 and 4 respectively) divides
193323Sed  // equaly.  We just shift until the value is zero.
226633Sdim  if (Radix == 2 || Radix == 8 || Radix == 16) {
193323Sed    // Just shift tmp right for each digit width until it becomes zero
193323Sed    unsigned ShiftAmt = (Radix == 16 ? 4 : (Radix == 8 ? 3 : 1));
193323Sed    unsigned MaskAmt = Radix - 1;
198090Srdivacky
193323Sed    while (Tmp != 0) {
193323Sed      unsigned Digit = unsigned(Tmp.getRawData()[0]) & MaskAmt;
193323Sed      Str.push_back(Digits[Digit]);
193323Sed      Tmp = Tmp.lshr(ShiftAmt);
193323Sed    }
193323Sed  } else {
226633Sdim    APInt divisor(Radix == 10? 4 : 8, Radix);
193323Sed    while (Tmp != 0) {
193323Sed      APInt APdigit(1, 0);
193323Sed      APInt tmp2(Tmp.getBitWidth(), 0);
198090Srdivacky      divide(Tmp, Tmp.getNumWords(), divisor, divisor.getNumWords(), &tmp2,
193323Sed             &APdigit);
193323Sed      unsigned Digit = (unsigned)APdigit.getZExtValue();
193323Sed      assert(Digit < Radix && "divide failed");
193323Sed      Str.push_back(Digits[Digit]);
193323Sed      Tmp = tmp2;
193323Sed    }
193323Sed  }
198090Srdivacky
193323Sed  // Reverse the digits before returning.
193323Sed  std::reverse(Str.begin()+StartDig, Str.end());
193323Sed}
193323Sed
193323Sed/// toString - This returns the APInt as a std::string.  Note that this is an
193323Sed/// inefficient method.  It is better to pass in a SmallVector/SmallString
193323Sed/// to the methods above.
193323Sedstd::string APInt::toString(unsigned Radix = 10, bool Signed = true) const {
193323Sed  SmallString<40> S;
224145Sdim  toString(S, Radix, Signed, /* formatAsCLiteral = */false);
198090Srdivacky  return S.str();
193323Sed}
193323Sed
193323Sed
193323Sedvoid APInt::dump() const {
193323Sed  SmallString<40> S, U;
193323Sed  this->toStringUnsigned(U);
193323Sed  this->toStringSigned(S);
202375Srdivacky  dbgs() << "APInt(" << BitWidth << "b, "
198090Srdivacky         << U.str() << "u " << S.str() << "s)";
193323Sed}
193323Sed
193323Sedvoid APInt::print(raw_ostream &OS, bool isSigned) const {
193323Sed  SmallString<40> S;
224145Sdim  this->toString(S, 10, isSigned, /* formatAsCLiteral = */false);
198090Srdivacky  OS << S.str();
193323Sed}
193323Sed
193323Sed// This implements a variety of operations on a representation of
193323Sed// arbitrary precision, two's-complement, bignum integer values.
193323Sed
198090Srdivacky// Assumed by lowHalf, highHalf, partMSB and partLSB.  A fairly safe
198090Srdivacky// and unrestrictive assumption.
// COMPILE_TIME_ASSERT(cond) declares an extern array whose size is 1 when
// cond holds and -1 otherwise; a negative array size is ill-formed, so a false
// condition stops compilation.
193323Sed#define COMPILE_TIME_ASSERT(cond) extern int CTAssert[(cond) ? 1 : -1]
// The half-part helpers split an integerPart into two equal halves, so its
// width must be even.
193323SedCOMPILE_TIME_ASSERT(integerPartWidth % 2 == 0);
193323Sed
193323Sed/* Some handy functions local to this file.  */
193323Sednamespace {
193323Sed
193323Sed  /* Returns the integer part with the least significant BITS set.
193323Sed     BITS cannot be zero.  */
193323Sed  static inline integerPart
193323Sed  lowBitMask(unsigned int bits)
193323Sed  {
206083Srdivacky    assert(bits != 0 && bits <= integerPartWidth);
193323Sed
193323Sed    return ~(integerPart) 0 >> (integerPartWidth - bits);
193323Sed  }
193323Sed
193323Sed  /* Returns the value of the lower half of PART.  */
193323Sed  static inline integerPart
193323Sed  lowHalf(integerPart part)
193323Sed  {
193323Sed    return part & lowBitMask(integerPartWidth / 2);
193323Sed  }
193323Sed
193323Sed  /* Returns the value of the upper half of PART.  */
193323Sed  static inline integerPart
193323Sed  highHalf(integerPart part)
193323Sed  {
193323Sed    return part >> (integerPartWidth / 2);
193323Sed  }
193323Sed
193323Sed  /* Returns the bit number of the most significant set bit of a part.
193323Sed     If the input number has no bits set -1U is returned.  */
193323Sed  static unsigned int
193323Sed  partMSB(integerPart value)
193323Sed  {
263508Sdim    return findLastSet(value, ZB_Max);
193323Sed  }
193323Sed
193323Sed  /* Returns the bit number of the least significant set bit of a
193323Sed     part.  If the input number has no bits set -1U is returned.  */
193323Sed  static unsigned int
193323Sed  partLSB(integerPart value)
193323Sed  {
263508Sdim    return findFirstSet(value, ZB_Max);
193323Sed  }
193323Sed}
193323Sed
193323Sed/* Sets the least significant part of a bignum to the input value, and
193323Sed   zeroes out higher parts.  */
193323Sedvoid
193323SedAPInt::tcSet(integerPart *dst, integerPart part, unsigned int parts)
193323Sed{
193323Sed  unsigned int i;
193323Sed
206083Srdivacky  assert(parts > 0);
193323Sed
193323Sed  dst[0] = part;
206083Srdivacky  for (i = 1; i < parts; i++)
193323Sed    dst[i] = 0;
193323Sed}
193323Sed
193323Sed/* Assign one bignum to another.  */
193323Sedvoid
193323SedAPInt::tcAssign(integerPart *dst, const integerPart *src, unsigned int parts)
193323Sed{
193323Sed  unsigned int i;
193323Sed
206083Srdivacky  for (i = 0; i < parts; i++)
193323Sed    dst[i] = src[i];
193323Sed}
193323Sed
193323Sed/* Returns true if a bignum is zero, false otherwise.  */
193323Sedbool
193323SedAPInt::tcIsZero(const integerPart *src, unsigned int parts)
193323Sed{
193323Sed  unsigned int i;
193323Sed
206083Srdivacky  for (i = 0; i < parts; i++)
193323Sed    if (src[i])
193323Sed      return false;
193323Sed
193323Sed  return true;
193323Sed}
193323Sed
193323Sed/* Extract the given bit of a bignum; returns 0 or 1.  */
193323Sedint
193323SedAPInt::tcExtractBit(const integerPart *parts, unsigned int bit)
193323Sed{
206083Srdivacky  return (parts[bit / integerPartWidth] &
206083Srdivacky          ((integerPart) 1 << bit % integerPartWidth)) != 0;
193323Sed}
193323Sed
204642Srdivacky/* Set the given bit of a bignum. */
193323Sedvoid
193323SedAPInt::tcSetBit(integerPart *parts, unsigned int bit)
193323Sed{
193323Sed  parts[bit / integerPartWidth] |= (integerPart) 1 << (bit % integerPartWidth);
193323Sed}
193323Sed
204642Srdivacky/* Clears the given bit of a bignum. */
204642Srdivackyvoid
204642SrdivackyAPInt::tcClearBit(integerPart *parts, unsigned int bit)
204642Srdivacky{
204642Srdivacky  parts[bit / integerPartWidth] &=
204642Srdivacky    ~((integerPart) 1 << (bit % integerPartWidth));
204642Srdivacky}
204642Srdivacky
193323Sed/* Returns the bit number of the least significant set bit of a
193323Sed   number.  If the input number has no bits set -1U is returned.  */
193323Sedunsigned int
193323SedAPInt::tcLSB(const integerPart *parts, unsigned int n)
193323Sed{
193323Sed  unsigned int i, lsb;
193323Sed
206083Srdivacky  for (i = 0; i < n; i++) {
193323Sed      if (parts[i] != 0) {
193323Sed          lsb = partLSB(parts[i]);
193323Sed
193323Sed          return lsb + i * integerPartWidth;
193323Sed      }
193323Sed  }
193323Sed
193323Sed  return -1U;
193323Sed}
193323Sed
193323Sed/* Returns the bit number of the most significant set bit of a number.
193323Sed   If the input number has no bits set -1U is returned.  */
193323Sedunsigned int
193323SedAPInt::tcMSB(const integerPart *parts, unsigned int n)
193323Sed{
193323Sed  unsigned int msb;
193323Sed
193323Sed  do {
206083Srdivacky    --n;
193323Sed
206083Srdivacky    if (parts[n] != 0) {
206083Srdivacky      msb = partMSB(parts[n]);
193323Sed
206083Srdivacky      return msb + n * integerPartWidth;
206083Srdivacky    }
193323Sed  } while (n);
193323Sed
193323Sed  return -1U;
193323Sed}
193323Sed
193323Sed/* Copy the bit vector of width srcBITS from SRC, starting at bit
193323Sed   srcLSB, to DST, of dstCOUNT parts, such that the bit srcLSB becomes
193323Sed   the least significant bit of DST.  All high bits above srcBITS in
193323Sed   DST are zero-filled.  */
193323Sedvoid
193323SedAPInt::tcExtract(integerPart *dst, unsigned int dstCount,const integerPart *src,
193323Sed                 unsigned int srcBits, unsigned int srcLSB)
193323Sed{
193323Sed  unsigned int firstSrcPart, dstParts, shift, n;
193323Sed
193323Sed  dstParts = (srcBits + integerPartWidth - 1) / integerPartWidth;
206083Srdivacky  assert(dstParts <= dstCount);
193323Sed
193323Sed  firstSrcPart = srcLSB / integerPartWidth;
193323Sed  tcAssign (dst, src + firstSrcPart, dstParts);
193323Sed
193323Sed  shift = srcLSB % integerPartWidth;
193323Sed  tcShiftRight (dst, dstParts, shift);
193323Sed
193323Sed  /* We now have (dstParts * integerPartWidth - shift) bits from SRC
193323Sed     in DST.  If this is less that srcBits, append the rest, else
193323Sed     clear the high bits.  */
193323Sed  n = dstParts * integerPartWidth - shift;
193323Sed  if (n < srcBits) {
193323Sed    integerPart mask = lowBitMask (srcBits - n);
193323Sed    dst[dstParts - 1] |= ((src[firstSrcPart + dstParts] & mask)
193323Sed                          << n % integerPartWidth);
193323Sed  } else if (n > srcBits) {
193323Sed    if (srcBits % integerPartWidth)
193323Sed      dst[dstParts - 1] &= lowBitMask (srcBits % integerPartWidth);
193323Sed  }
193323Sed
193323Sed  /* Clear high parts.  */
193323Sed  while (dstParts < dstCount)
193323Sed    dst[dstParts++] = 0;
193323Sed}
193323Sed
193323Sed/* DST += RHS + C where C is zero or one.  Returns the carry flag.  */
193323SedintegerPart
193323SedAPInt::tcAdd(integerPart *dst, const integerPart *rhs,
193323Sed             integerPart c, unsigned int parts)
193323Sed{
193323Sed  unsigned int i;
193323Sed
193323Sed  assert(c <= 1);
193323Sed
206083Srdivacky  for (i = 0; i < parts; i++) {
193323Sed    integerPart l;
193323Sed
193323Sed    l = dst[i];
193323Sed    if (c) {
193323Sed      dst[i] += rhs[i] + 1;
193323Sed      c = (dst[i] <= l);
193323Sed    } else {
193323Sed      dst[i] += rhs[i];
193323Sed      c = (dst[i] < l);
193323Sed    }
193323Sed  }
193323Sed
193323Sed  return c;
193323Sed}
193323Sed
193323Sed/* DST -= RHS + C where C is zero or one.  Returns the carry flag.  */
193323SedintegerPart
193323SedAPInt::tcSubtract(integerPart *dst, const integerPart *rhs,
193323Sed                  integerPart c, unsigned int parts)
193323Sed{
193323Sed  unsigned int i;
193323Sed
193323Sed  assert(c <= 1);
193323Sed
206083Srdivacky  for (i = 0; i < parts; i++) {
193323Sed    integerPart l;
193323Sed
193323Sed    l = dst[i];
193323Sed    if (c) {
193323Sed      dst[i] -= rhs[i] + 1;
193323Sed      c = (dst[i] >= l);
193323Sed    } else {
193323Sed      dst[i] -= rhs[i];
193323Sed      c = (dst[i] > l);
193323Sed    }
193323Sed  }
193323Sed
193323Sed  return c;
193323Sed}
193323Sed
193323Sed/* Negate a bignum in-place.  */
193323Sedvoid
193323SedAPInt::tcNegate(integerPart *dst, unsigned int parts)
193323Sed{
193323Sed  tcComplement(dst, parts);
193323Sed  tcIncrement(dst, parts);
193323Sed}
193323Sed
/*  Multiply the SRCPARTS-word number SRC by the single word MULTIPLIER,
    add the single word CARRY, and combine the result with DST:

    DST += SRC * MULTIPLIER + CARRY   if add is true
    DST  = SRC * MULTIPLIER + CARRY   if add is false

    Requires 0 <= DSTPARTS <= SRCPARTS + 1.  If DST overlaps SRC
    they must start at the same point, i.e. DST == SRC.  (The
    assertion below accepts any DST that is at or below SRC, or at or
    beyond the end of SRC.)

    If DSTPARTS == SRCPARTS + 1 no overflow occurs and zero is
    returned.  Otherwise DST is filled with the least significant
    DSTPARTS parts of the result, and if all of the omitted higher
    parts were zero return zero, otherwise overflow occurred and
    return one.  */
int
APInt::tcMultiplyPart(integerPart *dst, const integerPart *src,
                      integerPart multiplier, integerPart carry,
                      unsigned int srcParts, unsigned int dstParts,
                      bool add)
{
  unsigned int i, n;

  /* Otherwise our writes of DST kill our later reads of SRC.  */
  assert(dst <= src || dst >= src + srcParts);
  assert(dstParts <= srcParts + 1);

  /* N loops; minimum of dstParts and srcParts.  */
  n = dstParts < srcParts ? dstParts: srcParts;

  for (i = 0; i < n; i++) {
    integerPart low, mid, high, srcPart;

      /* [ LOW, HIGH ] = MULTIPLIER * SRC[i] + DST[i] + CARRY.

         This cannot overflow, because

         (n - 1) * (n - 1) + 2 (n - 1) = (n - 1) * (n + 1)

         which is less than n^2.  */

    srcPart = src[i];

    /* A zero factor makes the product zero, so only the carry is left.  */
    if (multiplier == 0 || srcPart == 0)        {
      low = carry;
      high = 0;
    } else {
      /* Form the double-width product from four half-width products:
         low*low and high*high go straight into LOW and HIGH.  */
      low = lowHalf(srcPart) * lowHalf(multiplier);
      high = highHalf(srcPart) * highHalf(multiplier);

      /* First cross product: its upper half belongs to HIGH, its lower
         half is shifted up into LOW, bumping HIGH if LOW wraps.  */
      mid = lowHalf(srcPart) * highHalf(multiplier);
      high += highHalf(mid);
      mid <<= integerPartWidth / 2;
      if (low + mid < low)
        high++;
      low += mid;

      /* Second cross product, folded in the same way.  */
      mid = highHalf(srcPart) * lowHalf(multiplier);
      high += highHalf(mid);
      mid <<= integerPartWidth / 2;
      if (low + mid < low)
        high++;
      low += mid;

      /* Now add carry.  */
      if (low + carry < low)
        high++;
      low += carry;
    }

    if (add) {
      /* And now DST[i], and store the new low part there.  */
      if (low + dst[i] < low)
        high++;
      dst[i] += low;
    } else
      dst[i] = low;

    /* The high word becomes the carry into the next destination word.  */
    carry = high;
  }

  if (i < dstParts) {
    /* Full multiplication, there is no overflow.  */
    assert(i + 1 == dstParts);
    dst[i] = carry;
    return 0;
  } else {
    /* We overflowed if there is carry.  */
    if (carry)
      return 1;

    /* We would overflow if any significant unwritten parts would be
       non-zero.  This is true if any remaining src parts are non-zero
       and the multiplier is non-zero.  */
    if (multiplier)
      for (; i < srcParts; i++)
        if (src[i])
          return 1;

    /* We fitted in the narrow destination.  */
    return 0;
  }
}
193323Sed
193323Sed/* DST = LHS * RHS, where DST has the same width as the operands and
193323Sed   is filled with the least significant parts of the result.  Returns
193323Sed   one if overflow occurred, otherwise zero.  DST must be disjoint
193323Sed   from both operands.  */
193323Sedint
193323SedAPInt::tcMultiply(integerPart *dst, const integerPart *lhs,
193323Sed                  const integerPart *rhs, unsigned int parts)
193323Sed{
193323Sed  unsigned int i;
193323Sed  int overflow;
193323Sed
193323Sed  assert(dst != lhs && dst != rhs);
193323Sed
193323Sed  overflow = 0;
193323Sed  tcSet(dst, 0, parts);
193323Sed
206083Srdivacky  for (i = 0; i < parts; i++)
193323Sed    overflow |= tcMultiplyPart(&dst[i], lhs, rhs[i], 0, parts,
193323Sed                               parts - i, true);
193323Sed
193323Sed  return overflow;
193323Sed}
193323Sed
193323Sed/* DST = LHS * RHS, where DST has width the sum of the widths of the
193323Sed   operands.  No overflow occurs.  DST must be disjoint from both
193323Sed   operands.  Returns the number of parts required to hold the
193323Sed   result.  */
193323Sedunsigned int
193323SedAPInt::tcFullMultiply(integerPart *dst, const integerPart *lhs,
193323Sed                      const integerPart *rhs, unsigned int lhsParts,
193323Sed                      unsigned int rhsParts)
193323Sed{
193323Sed  /* Put the narrower number on the LHS for less loops below.  */
193323Sed  if (lhsParts > rhsParts) {
193323Sed    return tcFullMultiply (dst, rhs, lhs, rhsParts, lhsParts);
193323Sed  } else {
193323Sed    unsigned int n;
193323Sed
193323Sed    assert(dst != lhs && dst != rhs);
193323Sed
193323Sed    tcSet(dst, 0, rhsParts);
193323Sed
206083Srdivacky    for (n = 0; n < lhsParts; n++)
193323Sed      tcMultiplyPart(&dst[n], rhs, lhs[n], 0, rhsParts, rhsParts + 1, true);
193323Sed
193323Sed    n = lhsParts + rhsParts;
193323Sed
193323Sed    return n - (dst[n - 1] == 0);
193323Sed  }
193323Sed}
193323Sed
193323Sed/* If RHS is zero LHS and REMAINDER are left unchanged, return one.
193323Sed   Otherwise set LHS to LHS / RHS with the fractional part discarded,
193323Sed   set REMAINDER to the remainder, return zero.  i.e.
193323Sed
193323Sed   OLD_LHS = RHS * LHS + REMAINDER
193323Sed
193323Sed   SCRATCH is a bignum of the same size as the operands and result for
193323Sed   use by the routine; its contents need not be initialized and are
193323Sed   destroyed.  LHS, REMAINDER and SCRATCH must be distinct.
193323Sed*/
193323Sedint
193323SedAPInt::tcDivide(integerPart *lhs, const integerPart *rhs,
193323Sed                integerPart *remainder, integerPart *srhs,
193323Sed                unsigned int parts)
193323Sed{
193323Sed  unsigned int n, shiftCount;
193323Sed  integerPart mask;
193323Sed
193323Sed  assert(lhs != remainder && lhs != srhs && remainder != srhs);
193323Sed
193323Sed  shiftCount = tcMSB(rhs, parts) + 1;
193323Sed  if (shiftCount == 0)
193323Sed    return true;
193323Sed
193323Sed  shiftCount = parts * integerPartWidth - shiftCount;
193323Sed  n = shiftCount / integerPartWidth;
193323Sed  mask = (integerPart) 1 << (shiftCount % integerPartWidth);
193323Sed
193323Sed  tcAssign(srhs, rhs, parts);
193323Sed  tcShiftLeft(srhs, parts, shiftCount);
193323Sed  tcAssign(remainder, lhs, parts);
193323Sed  tcSet(lhs, 0, parts);
193323Sed
193323Sed  /* Loop, subtracting SRHS if REMAINDER is greater and adding that to
193323Sed     the total.  */
206083Srdivacky  for (;;) {
193323Sed      int compare;
193323Sed
193323Sed      compare = tcCompare(remainder, srhs, parts);
193323Sed      if (compare >= 0) {
193323Sed        tcSubtract(remainder, srhs, 0, parts);
193323Sed        lhs[n] |= mask;
193323Sed      }
193323Sed
193323Sed      if (shiftCount == 0)
193323Sed        break;
193323Sed      shiftCount--;
193323Sed      tcShiftRight(srhs, parts, 1);
193323Sed      if ((mask >>= 1) == 0)
193323Sed        mask = (integerPart) 1 << (integerPartWidth - 1), n--;
193323Sed  }
193323Sed
193323Sed  return false;
193323Sed}
193323Sed
193323Sed/* Shift a bignum left COUNT bits in-place.  Shifted in bits are zero.
193323Sed   There are no restrictions on COUNT.  */
193323Sedvoid
193323SedAPInt::tcShiftLeft(integerPart *dst, unsigned int parts, unsigned int count)
193323Sed{
193323Sed  if (count) {
193323Sed    unsigned int jump, shift;
193323Sed
193323Sed    /* Jump is the inter-part jump; shift is is intra-part shift.  */
193323Sed    jump = count / integerPartWidth;
193323Sed    shift = count % integerPartWidth;
193323Sed
193323Sed    while (parts > jump) {
193323Sed      integerPart part;
193323Sed
193323Sed      parts--;
193323Sed
193323Sed      /* dst[i] comes from the two parts src[i - jump] and, if we have
193323Sed         an intra-part shift, src[i - jump - 1].  */
193323Sed      part = dst[parts - jump];
193323Sed      if (shift) {
193323Sed        part <<= shift;
193323Sed        if (parts >= jump + 1)
193323Sed          part |= dst[parts - jump - 1] >> (integerPartWidth - shift);
193323Sed      }
193323Sed
193323Sed      dst[parts] = part;
193323Sed    }
193323Sed
193323Sed    while (parts > 0)
193323Sed      dst[--parts] = 0;
193323Sed  }
193323Sed}
193323Sed
193323Sed/* Shift a bignum right COUNT bits in-place.  Shifted in bits are
193323Sed   zero.  There are no restrictions on COUNT.  */
193323Sedvoid
193323SedAPInt::tcShiftRight(integerPart *dst, unsigned int parts, unsigned int count)
193323Sed{
193323Sed  if (count) {
193323Sed    unsigned int i, jump, shift;
193323Sed
193323Sed    /* Jump is the inter-part jump; shift is is intra-part shift.  */
193323Sed    jump = count / integerPartWidth;
193323Sed    shift = count % integerPartWidth;
193323Sed
193323Sed    /* Perform the shift.  This leaves the most significant COUNT bits
193323Sed       of the result at zero.  */
206083Srdivacky    for (i = 0; i < parts; i++) {
193323Sed      integerPart part;
193323Sed
193323Sed      if (i + jump >= parts) {
193323Sed        part = 0;
193323Sed      } else {
193323Sed        part = dst[i + jump];
193323Sed        if (shift) {
193323Sed          part >>= shift;
193323Sed          if (i + jump + 1 < parts)
193323Sed            part |= dst[i + jump + 1] << (integerPartWidth - shift);
193323Sed        }
193323Sed      }
193323Sed
193323Sed      dst[i] = part;
193323Sed    }
193323Sed  }
193323Sed}
193323Sed
193323Sed/* Bitwise and of two bignums.  */
193323Sedvoid
193323SedAPInt::tcAnd(integerPart *dst, const integerPart *rhs, unsigned int parts)
193323Sed{
193323Sed  unsigned int i;
193323Sed
206083Srdivacky  for (i = 0; i < parts; i++)
193323Sed    dst[i] &= rhs[i];
193323Sed}
193323Sed
193323Sed/* Bitwise inclusive or of two bignums.  */
193323Sedvoid
193323SedAPInt::tcOr(integerPart *dst, const integerPart *rhs, unsigned int parts)
193323Sed{
193323Sed  unsigned int i;
193323Sed
206083Srdivacky  for (i = 0; i < parts; i++)
193323Sed    dst[i] |= rhs[i];
193323Sed}
193323Sed
193323Sed/* Bitwise exclusive or of two bignums.  */
193323Sedvoid
193323SedAPInt::tcXor(integerPart *dst, const integerPart *rhs, unsigned int parts)
193323Sed{
193323Sed  unsigned int i;
193323Sed
206083Srdivacky  for (i = 0; i < parts; i++)
193323Sed    dst[i] ^= rhs[i];
193323Sed}
193323Sed
193323Sed/* Complement a bignum in-place.  */
193323Sedvoid
193323SedAPInt::tcComplement(integerPart *dst, unsigned int parts)
193323Sed{
193323Sed  unsigned int i;
193323Sed
206083Srdivacky  for (i = 0; i < parts; i++)
193323Sed    dst[i] = ~dst[i];
193323Sed}
193323Sed
193323Sed/* Comparison (unsigned) of two bignums.  */
193323Sedint
193323SedAPInt::tcCompare(const integerPart *lhs, const integerPart *rhs,
193323Sed                 unsigned int parts)
193323Sed{
193323Sed  while (parts) {
193323Sed      parts--;
193323Sed      if (lhs[parts] == rhs[parts])
193323Sed        continue;
193323Sed
193323Sed      if (lhs[parts] > rhs[parts])
193323Sed        return 1;
193323Sed      else
193323Sed        return -1;
193323Sed    }
193323Sed
193323Sed  return 0;
193323Sed}
193323Sed
193323Sed/* Increment a bignum in-place, return the carry flag.  */
193323SedintegerPart
193323SedAPInt::tcIncrement(integerPart *dst, unsigned int parts)
193323Sed{
193323Sed  unsigned int i;
193323Sed
206083Srdivacky  for (i = 0; i < parts; i++)
193323Sed    if (++dst[i] != 0)
193323Sed      break;
193323Sed
193323Sed  return i == parts;
193323Sed}
193323Sed
263508Sdim/* Decrement a bignum in-place, return the borrow flag.  */
263508SdimintegerPart
263508SdimAPInt::tcDecrement(integerPart *dst, unsigned int parts) {
263508Sdim  for (unsigned int i = 0; i < parts; i++) {
263508Sdim    // If the current word is non-zero, then the decrement has no effect on the
263508Sdim    // higher-order words of the integer and no borrow can occur. Exit early.
263508Sdim    if (dst[i]--)
263508Sdim      return 0;
263508Sdim  }
263508Sdim  // If every word was zero, then there is a borrow.
263508Sdim  return 1;
263508Sdim}
263508Sdim
263508Sdim
193323Sed/* Set the least significant BITS bits of a bignum, clear the
193323Sed   rest.  */
193323Sedvoid
193323SedAPInt::tcSetLeastSignificantBits(integerPart *dst, unsigned int parts,
193323Sed                                 unsigned int bits)
193323Sed{
193323Sed  unsigned int i;
193323Sed
193323Sed  i = 0;
193323Sed  while (bits > integerPartWidth) {
193323Sed    dst[i++] = ~(integerPart) 0;
193323Sed    bits -= integerPartWidth;
193323Sed  }
193323Sed
193323Sed  if (bits)
193323Sed    dst[i++] = ~(integerPart) 0 >> (integerPartWidth - bits);
193323Sed
193323Sed  while (i < parts)
193323Sed    dst[i++] = 0;
193323Sed}