lib/Support/APInt.cpp

130803Smarcel//===-- APInt.cpp - Implement APInt class ---------------------------------===//
130803Smarcel//
130803Smarcel//                     The LLVM Compiler Infrastructure
130803Smarcel//
130803Smarcel// This file is distributed under the University of Illinois Open Source
130803Smarcel// License. See LICENSE.TXT for details.
130803Smarcel//
130803Smarcel//===----------------------------------------------------------------------===//
130803Smarcel//
130803Smarcel// This file implements a class to represent arbitrary precision integer
130803Smarcel// constant values and provide a variety of arithmetic operations on them.
130803Smarcel//
130803Smarcel//===----------------------------------------------------------------------===//
130803Smarcel
130803Smarcel#define DEBUG_TYPE "apint"
130803Smarcel#include "llvm/ADT/APInt.h"
130803Smarcel#include "llvm/ADT/StringRef.h"
130803Smarcel#include "llvm/ADT/FoldingSet.h"
130803Smarcel#include "llvm/ADT/SmallString.h"
130803Smarcel#include "llvm/Support/Debug.h"
130803Smarcel#include "llvm/Support/ErrorHandling.h"
130803Smarcel#include "llvm/Support/MathExtras.h"
130803Smarcel#include "llvm/Support/raw_ostream.h"
130803Smarcel#include <cmath>
130803Smarcel#include <limits>
130803Smarcel#include <cstring>
130803Smarcel#include <cstdlib>
130803Smarcelusing namespace llvm;
130803Smarcel
/// Allocate an array of \p numWords 64-bit words in which every word is zero.
/// The array comes from new[]; the caller is responsible for delete[]-ing it.
inline static uint64_t* getClearedMemory(unsigned numWords) {
  // The trailing "()" value-initializes the array, i.e. zeroes every word.
  uint64_t *words = new uint64_t[numWords]();
  assert(words && "APInt memory allocation fails!");
  return words;
}
130803Smarcel
/// Allocate an array of \p numWords 64-bit words with new[]. The words are
/// left uninitialized; the caller is responsible for delete[]-ing the array.
inline static uint64_t* getMemory(unsigned numWords) {
  uint64_t *const words = new uint64_t[numWords];
  assert(words && "APInt memory allocation fails!");
  return words;
}
130803Smarcel
/// Convert the character \p cdigit to its numeric value in base \p radix.
/// For radix 16 and 36 both upper- and lower-case letters are accepted.
/// @returns the digit value, or -1U if \p cdigit is not a digit in that radix.
inline static unsigned getDigit(char cdigit, uint8_t radix) {
  // Characters below '0' wrap around to a huge unsigned value and are thereby
  // rejected by the range checks below.
  const unsigned decimal = cdigit - '0';

  if (radix == 16 || radix == 36) {
    if (decimal <= 9)
      return decimal;

    // Highest zero-based letter index that is valid: 5 ('F') for radix 16,
    // 25 ('Z') for radix 36.
    const unsigned lastLetter = radix - 11U;

    const unsigned upper = cdigit - 'A';
    if (upper <= lastLetter)
      return upper + 10;

    const unsigned lower = cdigit - 'a';
    if (lower <= lastLetter)
      return lower + 10;

    // Neither a decimal digit nor an acceptable letter.
    return -1U;
  }

  return decimal < radix ? decimal : -1U;
}
130803Smarcel
130803Smarcel
130803Smarcelvoid APInt::initSlowCase(unsigned numBits, uint64_t val, bool isSigned) {
130803Smarcel  pVal = getClearedMemory(getNumWords());
130803Smarcel  pVal[0] = val;
130803Smarcel  if (isSigned && int64_t(val) < 0)
130803Smarcel    for (unsigned i = 1; i < getNumWords(); ++i)
130803Smarcel      pVal[i] = -1ULL;
130803Smarcel}
130803Smarcel
130803Smarcelvoid APInt::initSlowCase(const APInt& that) {
130803Smarcel  pVal = getMemory(getNumWords());
130803Smarcel  memcpy(pVal, that.pVal, getNumWords() * APINT_WORD_SIZE);
130803Smarcel}
130803Smarcel
130803Smarcelvoid APInt::initFromArray(ArrayRef<uint64_t> bigVal) {
130803Smarcel  assert(BitWidth && "Bitwidth too small");
130803Smarcel  assert(bigVal.data() && "Null pointer detected!");
130803Smarcel  if (isSingleWord())
130803Smarcel    VAL = bigVal[0];
130803Smarcel  else {
130803Smarcel    // Get memory, cleared to 0
130803Smarcel    pVal = getClearedMemory(getNumWords());
130803Smarcel    // Calculate the number of words to copy
130803Smarcel    unsigned words = std::min<unsigned>(bigVal.size(), getNumWords());
130803Smarcel    // Copy the words from bigVal to pVal
130803Smarcel    memcpy(pVal, bigVal.data(), words * APINT_WORD_SIZE);
130803Smarcel  }
130803Smarcel  // Make sure unused high bits are cleared
130803Smarcel  clearUnusedBits();
130803Smarcel}
130803Smarcel
130803SmarcelAPInt::APInt(unsigned numBits, ArrayRef<uint64_t> bigVal)
130803Smarcel  : BitWidth(numBits), VAL(0) {
130803Smarcel  initFromArray(bigVal);
130803Smarcel}
130803Smarcel
130803SmarcelAPInt::APInt(unsigned numBits, unsigned numWords, const uint64_t bigVal[])
130803Smarcel  : BitWidth(numBits), VAL(0) {
130803Smarcel  initFromArray(makeArrayRef(bigVal, numWords));
130803Smarcel}
130803Smarcel
130803SmarcelAPInt::APInt(unsigned numbits, StringRef Str, uint8_t radix)
130803Smarcel  : BitWidth(numbits), VAL(0) {
130803Smarcel  assert(BitWidth && "Bitwidth too small");
130803Smarcel  fromString(numbits, Str, radix);
130803Smarcel}
130803Smarcel
130803SmarcelAPInt& APInt::AssignSlowCase(const APInt& RHS) {
130803Smarcel  // Don't do anything for X = X
130803Smarcel  if (this == &RHS)
130803Smarcel    return *this;
130803Smarcel
130803Smarcel  if (BitWidth == RHS.getBitWidth()) {
130803Smarcel    // assume same bit-width single-word case is already handled
130803Smarcel    assert(!isSingleWord());
130803Smarcel    memcpy(pVal, RHS.pVal, getNumWords() * APINT_WORD_SIZE);
130803Smarcel    return *this;
130803Smarcel  }
130803Smarcel
130803Smarcel  if (isSingleWord()) {
130803Smarcel    // assume case where both are single words is already handled
130803Smarcel    assert(!RHS.isSingleWord());
130803Smarcel    VAL = 0;
130803Smarcel    pVal = getMemory(RHS.getNumWords());
130803Smarcel    memcpy(pVal, RHS.pVal, RHS.getNumWords() * APINT_WORD_SIZE);
130803Smarcel  } else if (getNumWords() == RHS.getNumWords())
130803Smarcel    memcpy(pVal, RHS.pVal, RHS.getNumWords() * APINT_WORD_SIZE);
130803Smarcel  else if (RHS.isSingleWord()) {
130803Smarcel    delete [] pVal;
130803Smarcel    VAL = RHS.VAL;
130803Smarcel  } else {
130803Smarcel    delete [] pVal;
130803Smarcel    pVal = getMemory(RHS.getNumWords());
130803Smarcel    memcpy(pVal, RHS.pVal, RHS.getNumWords() * APINT_WORD_SIZE);
130803Smarcel  }
130803Smarcel  BitWidth = RHS.BitWidth;
130803Smarcel  return clearUnusedBits();
130803Smarcel}
130803Smarcel
130803SmarcelAPInt& APInt::operator=(uint64_t RHS) {
130803Smarcel  if (isSingleWord())
130803Smarcel    VAL = RHS;
130803Smarcel  else {
130803Smarcel    pVal[0] = RHS;
130803Smarcel    memset(pVal+1, 0, (getNumWords() - 1) * APINT_WORD_SIZE);
130803Smarcel  }
130803Smarcel  return clearUnusedBits();
130803Smarcel}
130803Smarcel
130803Smarcel/// Profile - This method 'profiles' an APInt for use with FoldingSet.
130803Smarcelvoid APInt::Profile(FoldingSetNodeID& ID) const {
130803Smarcel  ID.AddInteger(BitWidth);
130803Smarcel
130803Smarcel  if (isSingleWord()) {
130803Smarcel    ID.AddInteger(VAL);
130803Smarcel    return;
130803Smarcel  }
130803Smarcel
130803Smarcel  unsigned NumWords = getNumWords();
130803Smarcel  for (unsigned i = 0; i < NumWords; ++i)
130803Smarcel    ID.AddInteger(pVal[i]);
130803Smarcel}
130803Smarcel
/// add_1 - This function adds a single "digit" integer, y, to the multiple
/// "digit" integer array x[] (lowest digit first) and stores the \p len digit
/// result in dest[]. dest may be the same array as x (in-place addition) or a
/// distinct array of at least \p len digits.
/// @returns the carry out of the addition: true if the sum did not fit in
/// \p len digits, false otherwise.
static bool add_1(uint64_t dest[], uint64_t x[], unsigned len, uint64_t y) {
  for (unsigned i = 0; i < len; ++i) {
    dest[i] = y + x[i];
    if (dest[i] < y) {
      y = 1; // Carry one to next digit.
      continue;
    }

    // No carry left: the remaining digits of the sum equal those of x. When
    // adding in place they are already there; otherwise they still have to be
    // copied so that dest holds the complete result.
    y = 0;
    if (dest != x)
      for (unsigned j = i + 1; j < len; ++j)
        dest[j] = x[j];
    break;
  }
  return y;
}
130803Smarcel
130803Smarcel/// @brief Prefix increment operator. Increments the APInt by one.
130803SmarcelAPInt& APInt::operator++() {
130803Smarcel  if (isSingleWord())
130803Smarcel    ++VAL;
130803Smarcel  else
130803Smarcel    add_1(pVal, pVal, getNumWords(), 1);
130803Smarcel  return clearUnusedBits();
130803Smarcel}
130803Smarcel
/// sub_1 - Subtract the single 64-bit "digit" y from the multi-digit integer
/// x[] (lowest digit first, \p len digits) in place. A borrow is propagated
/// upwards until a digit can absorb it or the digits run out.
/// @returns the borrow out of the subtraction: true if the borrow ran past
/// the last digit of x (i.e. y was greater than x), false otherwise.
static bool sub_1(uint64_t x[], unsigned len, uint64_t y) {
  unsigned idx = 0;
  while (idx < len) {
    const uint64_t before = x[idx];
    x[idx] = before - y;
    if (y <= before)
      return false;  // No borrow needed; higher digits stay unchanged.
    y = 1;           // Borrow one from the next digit.
    ++idx;
  }
  return bool(y);
}
130803Smarcel
130803Smarcel/// @brief Prefix decrement operator. Decrements the APInt by one.
130803SmarcelAPInt& APInt::operator--() {
130803Smarcel  if (isSingleWord())
130803Smarcel    --VAL;
130803Smarcel  else
130803Smarcel    sub_1(pVal, getNumWords(), 1);
130803Smarcel  return clearUnusedBits();
130803Smarcel}
130803Smarcel
/// add - Adds the \p len digit integer arrays x and y (lowest digit first)
/// and stores the \p len digit sum in dest. dest may alias x or y.
/// @returns the carry out from the addition
/// @brief General addition of 64-bit integer arrays
static bool add(uint64_t *dest, const uint64_t *x, const uint64_t *y,
                unsigned len) {
  bool carry = false;
  for (unsigned i = 0; i != len; ++i) {
    // Read both operands before writing, since dest may alias either one.
    const uint64_t a = x[i];
    const uint64_t b = y[i];
    const uint64_t smaller = b < a ? b : a;
    const uint64_t sum = a + b + (carry ? 1 : 0);
    dest[i] = sum;
    // The digit overflowed if the wrapped sum dropped below the smaller
    // operand, or merely reached it while a carry was being added in.
    carry = carry ? sum <= smaller : sum < smaller;
  }
  return carry;
}
130803Smarcel
130803Smarcel/// Adds the RHS APint to this APInt.
130803Smarcel/// @returns this, after addition of RHS.
130803Smarcel/// @brief Addition assignment operator.
130803SmarcelAPInt& APInt::operator+=(const APInt& RHS) {
130803Smarcel  assert(BitWidth == RHS.BitWidth && "Bit widths must be the same");
130803Smarcel  if (isSingleWord())
130803Smarcel    VAL += RHS.VAL;
130803Smarcel  else {
130803Smarcel    add(pVal, pVal, RHS.pVal, getNumWords());
130803Smarcel  }
130803Smarcel  return clearUnusedBits();
130803Smarcel}
130803Smarcel
/// Subtracts the \p len digit integer array y from the integer array x
/// (lowest digit first) and stores the \p len digit difference in dest.
/// dest may alias x or y.
/// @returns returns the borrow out.
/// @brief Generalized subtraction of 64-bit integer arrays.
static bool sub(uint64_t *dest, const uint64_t *x, const uint64_t *y,
                unsigned len) {
  bool borrow = false;
  for (unsigned i = 0; i != len; ++i) {
    // Read both operands before writing, since dest may alias either one.
    const uint64_t minuend = x[i];
    const uint64_t subtrahend = y[i];
    // Apply the incoming borrow first (this may wrap 0 to all ones).
    const uint64_t adjusted = minuend - (borrow ? 1 : 0);
    borrow = subtrahend > adjusted || (borrow && minuend == 0);
    dest[i] = adjusted - subtrahend;
  }
  return borrow;
}
130803Smarcel
130803Smarcel/// Subtracts the RHS APInt from this APInt
130803Smarcel/// @returns this, after subtraction
130803Smarcel/// @brief Subtraction assignment operator.
130803SmarcelAPInt& APInt::operator-=(const APInt& RHS) {
130803Smarcel  assert(BitWidth == RHS.BitWidth && "Bit widths must be the same");
130803Smarcel  if (isSingleWord())
130803Smarcel    VAL -= RHS.VAL;
130803Smarcel  else
130803Smarcel    sub(pVal, pVal, RHS.pVal, getNumWords());
130803Smarcel  return clearUnusedBits();
130803Smarcel}
130803Smarcel
/// Computes the full 128-bit product of the 64-bit values \p a and \p b from
/// four 32x32->64 partial products.
/// @returns the low 64 bits of the product; the high 64 bits are stored in
/// \p hi.
static uint64_t mulFullWord(uint64_t a, uint64_t b, uint64_t &hi) {
  const uint64_t mask = 0xffffffffULL;
  const uint64_t la = a & mask, ha = a >> 32;
  const uint64_t lb = b & mask, hb = b >> 32;

  const uint64_t ll = la * lb;
  const uint64_t lh = la * hb;
  const uint64_t hl = ha * lb;
  const uint64_t hh = ha * hb;

  // Everything that lands in bits [32, 64) of the product. Each of the three
  // terms is below 2^32, so the sum is below 2^34 and cannot overflow; its
  // upper part is the carry into the high word.
  const uint64_t mid = (ll >> 32) + (lh & mask) + (hl & mask);

  // The high word of a 64x64 product is at most 2^64 - 2, so this sum does
  // not overflow either.
  hi = hh + (lh >> 32) + (hl >> 32) + (mid >> 32);
  return (mid << 32) | (ll & mask);
}

/// Multiplies an integer array, x, by a uint64_t integer and places the result
/// into dest. x holds \p len digits, lowest digit first; dest receives the low
/// \p len digits of the product and may be the same array as x.
/// @returns the carry out of the multiplication.
/// @brief Multiply a multi-digit APInt by a single digit (64-bit) integer.
static uint64_t mul_1(uint64_t dest[], uint64_t x[], unsigned len, uint64_t y) {
  uint64_t carry = 0;

  // For each digit of x.
  for (unsigned i = 0; i < len; ++i) {
    uint64_t high;
    uint64_t low = mulFullWord(x[i], y, high);

    // Add the carry from the previous digit. high <= 2^64 - 2 here, so the
    // increment cannot wrap.
    low += carry;
    if (low < carry)
      ++high;

    dest[i] = low;
    carry = high;
  }
  return carry;
}

/// Multiplies integer array x by integer array y and stores the result into
/// the integer array dest. Note that dest's size must be >= xlen + ylen, that
/// ylen must be at least 1 (y[0] is always read) and that dest must not
/// overlap x or y, because dest is written while x and y are still being read.
/// @brief Generalized multiplicate of integer arrays.
static void mul(uint64_t dest[], uint64_t x[], unsigned xlen, uint64_t y[],
                unsigned ylen) {
  // The first row initializes dest[0..xlen].
  dest[xlen] = mul_1(dest, x, xlen, y[0]);

  // Every further row is a multiply-accumulate into the already written
  // digits, shifted up by i digits.
  for (unsigned i = 1; i < ylen; ++i) {
    uint64_t carry = 0;
    for (unsigned j = 0; j < xlen; ++j) {
      uint64_t high;
      uint64_t low = mulFullWord(x[j], y[i], high);

      // x*y + carry + dest[i+j] <= (2^64-1)^2 + 2*(2^64-1) = 2^128 - 1, so
      // neither increment of high below can wrap.
      low += carry;
      if (low < carry)
        ++high;

      dest[i+j] += low;
      if (dest[i+j] < low)
        ++high;

      carry = high;
    }
    dest[i+xlen] = carry;
  }
}
130803Smarcel
130803SmarcelAPInt& APInt::operator*=(const APInt& RHS) {
130803Smarcel  assert(BitWidth == RHS.BitWidth && "Bit widths must be the same");
130803Smarcel  if (isSingleWord()) {
130803Smarcel    VAL *= RHS.VAL;
130803Smarcel    clearUnusedBits();
130803Smarcel    return *this;
130803Smarcel  }
130803Smarcel
130803Smarcel  // Get some bit facts about LHS and check for zero
130803Smarcel  unsigned lhsBits = getActiveBits();
130803Smarcel  unsigned lhsWords = !lhsBits ? 0 : whichWord(lhsBits - 1) + 1;
130803Smarcel  if (!lhsWords)
130803Smarcel    // 0 * X ===> 0
130803Smarcel    return *this;
130803Smarcel
130803Smarcel  // Get some bit facts about RHS and check for zero
130803Smarcel  unsigned rhsBits = RHS.getActiveBits();
130803Smarcel  unsigned rhsWords = !rhsBits ? 0 : whichWord(rhsBits - 1) + 1;
130803Smarcel  if (!rhsWords) {
130803Smarcel    // X * 0 ===> 0
130803Smarcel    clearAllBits();
130803Smarcel    return *this;
130803Smarcel  }
130803Smarcel
130803Smarcel  // Allocate space for the result
130803Smarcel  unsigned destWords = rhsWords + lhsWords;
130803Smarcel  uint64_t *dest = getMemory(destWords);
130803Smarcel
130803Smarcel  // Perform the long multiply
130803Smarcel  mul(dest, pVal, lhsWords, RHS.pVal, rhsWords);
130803Smarcel
130803Smarcel  // Copy result back into *this
130803Smarcel  clearAllBits();
130803Smarcel  unsigned wordsToCopy = destWords >= getNumWords() ? getNumWords() : destWords;
130803Smarcel  memcpy(pVal, dest, wordsToCopy * APINT_WORD_SIZE);
130803Smarcel  clearUnusedBits();
130803Smarcel
130803Smarcel  // delete dest array and return
130803Smarcel  delete[] dest;
130803Smarcel  return *this;
130803Smarcel}
130803Smarcel
130803SmarcelAPInt& APInt::operator&=(const APInt& RHS) {
130803Smarcel  assert(BitWidth == RHS.BitWidth && "Bit widths must be the same");
130803Smarcel  if (isSingleWord()) {
130803Smarcel    VAL &= RHS.VAL;
130803Smarcel    return *this;
130803Smarcel  }
130803Smarcel  unsigned numWords = getNumWords();
130803Smarcel  for (unsigned i = 0; i < numWords; ++i)
130803Smarcel    pVal[i] &= RHS.pVal[i];
130803Smarcel  return *this;
130803Smarcel}
130803Smarcel
130803SmarcelAPInt& APInt::operator|=(const APInt& RHS) {
130803Smarcel  assert(BitWidth == RHS.BitWidth && "Bit widths must be the same");
130803Smarcel  if (isSingleWord()) {
130803Smarcel    VAL |= RHS.VAL;
130803Smarcel    return *this;
130803Smarcel  }
130803Smarcel  unsigned numWords = getNumWords();
130803Smarcel  for (unsigned i = 0; i < numWords; ++i)
130803Smarcel    pVal[i] |= RHS.pVal[i];
130803Smarcel  return *this;
130803Smarcel}
130803Smarcel
130803SmarcelAPInt& APInt::operator^=(const APInt& RHS) {
130803Smarcel  assert(BitWidth == RHS.BitWidth && "Bit widths must be the same");
130803Smarcel  if (isSingleWord()) {
130803Smarcel    VAL ^= RHS.VAL;
130803Smarcel    this->clearUnusedBits();
130803Smarcel    return *this;
130803Smarcel  }
130803Smarcel  unsigned numWords = getNumWords();
130803Smarcel  for (unsigned i = 0; i < numWords; ++i)
130803Smarcel    pVal[i] ^= RHS.pVal[i];
130803Smarcel  return clearUnusedBits();
130803Smarcel}
130803Smarcel
130803SmarcelAPInt APInt::AndSlowCase(const APInt& RHS) const {
130803Smarcel  unsigned numWords = getNumWords();
130803Smarcel  uint64_t* val = getMemory(numWords);
130803Smarcel  for (unsigned i = 0; i < numWords; ++i)
130803Smarcel    val[i] = pVal[i] & RHS.pVal[i];
130803Smarcel  return APInt(val, getBitWidth());
130803Smarcel}
130803Smarcel
130803SmarcelAPInt APInt::OrSlowCase(const APInt& RHS) const {
130803Smarcel  unsigned numWords = getNumWords();
130803Smarcel  uint64_t *val = getMemory(numWords);
130803Smarcel  for (unsigned i = 0; i < numWords; ++i)
130803Smarcel    val[i] = pVal[i] | RHS.pVal[i];
130803Smarcel  return APInt(val, getBitWidth());
130803Smarcel}
130803Smarcel
130803SmarcelAPInt APInt::XorSlowCase(const APInt& RHS) const {
130803Smarcel  unsigned numWords = getNumWords();
130803Smarcel  uint64_t *val = getMemory(numWords);
130803Smarcel  for (unsigned i = 0; i < numWords; ++i)
130803Smarcel    val[i] = pVal[i] ^ RHS.pVal[i];
130803Smarcel
130803Smarcel  // 0^0==1 so clear the high bits in case they got set.
130803Smarcel  return APInt(val, getBitWidth()).clearUnusedBits();
130803Smarcel}
130803Smarcel
130803Smarcelbool APInt::operator !() const {
130803Smarcel  if (isSingleWord())
130803Smarcel    return !VAL;
130803Smarcel
130803Smarcel  for (unsigned i = 0; i < getNumWords(); ++i)
130803Smarcel    if (pVal[i])
130803Smarcel      return false;
130803Smarcel  return true;
130803Smarcel}
130803Smarcel
130803SmarcelAPInt APInt::operator*(const APInt& RHS) const {
130803Smarcel  assert(BitWidth == RHS.BitWidth && "Bit widths must be the same");
130803Smarcel  if (isSingleWord())
130803Smarcel    return APInt(BitWidth, VAL * RHS.VAL);
130803Smarcel  APInt Result(*this);
130803Smarcel  Result *= RHS;
130803Smarcel  return Result;
130803Smarcel}
130803Smarcel
130803SmarcelAPInt APInt::operator+(const APInt& RHS) const {
130803Smarcel  assert(BitWidth == RHS.BitWidth && "Bit widths must be the same");
130803Smarcel  if (isSingleWord())
130803Smarcel    return APInt(BitWidth, VAL + RHS.VAL);
130803Smarcel  APInt Result(BitWidth, 0);
130803Smarcel  add(Result.pVal, this->pVal, RHS.pVal, getNumWords());
130803Smarcel  return Result.clearUnusedBits();
130803Smarcel}
130803Smarcel
130803SmarcelAPInt APInt::operator-(const APInt& RHS) const {
130803Smarcel  assert(BitWidth == RHS.BitWidth && "Bit widths must be the same");
130803Smarcel  if (isSingleWord())
130803Smarcel    return APInt(BitWidth, VAL - RHS.VAL);
130803Smarcel  APInt Result(BitWidth, 0);
130803Smarcel  sub(Result.pVal, this->pVal, RHS.pVal, getNumWords());
130803Smarcel  return Result.clearUnusedBits();
130803Smarcel}
130803Smarcel
130803Smarcelbool APInt::operator[](unsigned bitPosition) const {
130803Smarcel  assert(bitPosition < getBitWidth() && "Bit position out of bounds!");
130803Smarcel  return (maskBit(bitPosition) &
130803Smarcel          (isSingleWord() ?  VAL : pVal[whichWord(bitPosition)])) != 0;
130803Smarcel}
130803Smarcel
130803Smarcelbool APInt::EqualSlowCase(const APInt& RHS) const {
130803Smarcel  // Get some facts about the number of bits used in the two operands.
130803Smarcel  unsigned n1 = getActiveBits();
130803Smarcel  unsigned n2 = RHS.getActiveBits();
130803Smarcel
130803Smarcel  // If the number of bits isn't the same, they aren't equal
130803Smarcel  if (n1 != n2)
130803Smarcel    return false;
130803Smarcel
130803Smarcel  // If the number of bits fits in a word, we only need to compare the low word.
130803Smarcel  if (n1 <= APINT_BITS_PER_WORD)
130803Smarcel    return pVal[0] == RHS.pVal[0];
130803Smarcel
130803Smarcel  // Otherwise, compare everything
130803Smarcel  for (int i = whichWord(n1 - 1); i >= 0; --i)
130803Smarcel    if (pVal[i] != RHS.pVal[i])
130803Smarcel      return false;
130803Smarcel  return true;
130803Smarcel}
130803Smarcel
130803Smarcelbool APInt::EqualSlowCase(uint64_t Val) const {
130803Smarcel  unsigned n = getActiveBits();
130803Smarcel  if (n <= APINT_BITS_PER_WORD)
130803Smarcel    return pVal[0] == Val;
130803Smarcel  else
130803Smarcel    return false;
130803Smarcel}
130803Smarcel
130803Smarcelbool APInt::ult(const APInt& RHS) const {
130803Smarcel  assert(BitWidth == RHS.BitWidth && "Bit widths must be same for comparison");
130803Smarcel  if (isSingleWord())
130803Smarcel    return VAL < RHS.VAL;
130803Smarcel
130803Smarcel  // Get active bit length of both operands
130803Smarcel  unsigned n1 = getActiveBits();
130803Smarcel  unsigned n2 = RHS.getActiveBits();
130803Smarcel
130803Smarcel  // If magnitude of LHS is less than RHS, return true.
130803Smarcel  if (n1 < n2)
130803Smarcel    return true;
130803Smarcel
130803Smarcel  // If magnitude of RHS is greather than LHS, return false.
130803Smarcel  if (n2 < n1)
130803Smarcel    return false;
130803Smarcel
130803Smarcel  // If they bot fit in a word, just compare the low order word
130803Smarcel  if (n1 <= APINT_BITS_PER_WORD && n2 <= APINT_BITS_PER_WORD)
130803Smarcel    return pVal[0] < RHS.pVal[0];
130803Smarcel
130803Smarcel  // Otherwise, compare all words
130803Smarcel  unsigned topWord = whichWord(std::max(n1,n2)-1);
130803Smarcel  for (int i = topWord; i >= 0; --i) {
130803Smarcel    if (pVal[i] > RHS.pVal[i])
130803Smarcel      return false;
130803Smarcel    if (pVal[i] < RHS.pVal[i])
130803Smarcel      return true;
130803Smarcel  }
130803Smarcel  return false;
130803Smarcel}
130803Smarcel
130803Smarcelbool APInt::slt(const APInt& RHS) const {
130803Smarcel  assert(BitWidth == RHS.BitWidth && "Bit widths must be same for comparison");
130803Smarcel  if (isSingleWord()) {
130803Smarcel    int64_t lhsSext = (int64_t(VAL) << (64-BitWidth)) >> (64-BitWidth);
130803Smarcel    int64_t rhsSext = (int64_t(RHS.VAL) << (64-BitWidth)) >> (64-BitWidth);
130803Smarcel    return lhsSext < rhsSext;
130803Smarcel  }
130803Smarcel
130803Smarcel  APInt lhs(*this);
130803Smarcel  APInt rhs(RHS);
130803Smarcel  bool lhsNeg = isNegative();
130803Smarcel  bool rhsNeg = rhs.isNegative();
130803Smarcel  if (lhsNeg) {
130803Smarcel    // Sign bit is set so perform two's complement to make it positive
130803Smarcel    lhs.flipAllBits();
130803Smarcel    lhs++;
130803Smarcel  }
130803Smarcel  if (rhsNeg) {
130803Smarcel    // Sign bit is set so perform two's complement to make it positive
130803Smarcel    rhs.flipAllBits();
130803Smarcel    rhs++;
130803Smarcel  }
130803Smarcel
130803Smarcel  // Now we have unsigned values to compare so do the comparison if necessary
130803Smarcel  // based on the negativeness of the values.
130803Smarcel  if (lhsNeg)
130803Smarcel    if (rhsNeg)
130803Smarcel      return lhs.ugt(rhs);
130803Smarcel    else
130803Smarcel      return true;
130803Smarcel  else if (rhsNeg)
130803Smarcel    return false;
130803Smarcel  else
130803Smarcel    return lhs.ult(rhs);
130803Smarcel}
130803Smarcel
130803Smarcelvoid APInt::setBit(unsigned bitPosition) {
130803Smarcel  if (isSingleWord())
130803Smarcel    VAL |= maskBit(bitPosition);
130803Smarcel  else
130803Smarcel    pVal[whichWord(bitPosition)] |= maskBit(bitPosition);
130803Smarcel}
130803Smarcel
130803Smarcel/// Set the given bit to 0 whose position is given as "bitPosition".
130803Smarcel/// @brief Set a given bit to 0.
130803Smarcelvoid APInt::clearBit(unsigned bitPosition) {
130803Smarcel  if (isSingleWord())
130803Smarcel    VAL &= ~maskBit(bitPosition);
130803Smarcel  else
130803Smarcel    pVal[whichWord(bitPosition)] &= ~maskBit(bitPosition);
130803Smarcel}
130803Smarcel
130803Smarcel/// @brief Toggle every bit to its opposite value.
130803Smarcel
130803Smarcel/// Toggle a given bit to its opposite value whose position is given
130803Smarcel/// as "bitPosition".
130803Smarcel/// @brief Toggles a given bit to its opposite value.
130803Smarcelvoid APInt::flipBit(unsigned bitPosition) {
130803Smarcel  assert(bitPosition < BitWidth && "Out of the bit-width range!");
130803Smarcel  if ((*this)[bitPosition]) clearBit(bitPosition);
130803Smarcel  else setBit(bitPosition);
130803Smarcel}
130803Smarcel
130803Smarcelunsigned APInt::getBitsNeeded(StringRef str, uint8_t radix) {
130803Smarcel  assert(!str.empty() && "Invalid string length");
130803Smarcel  assert((radix == 10 || radix == 8 || radix == 16 || radix == 2 ||
130803Smarcel          radix == 36) &&
130803Smarcel         "Radix should be 2, 8, 10, 16, or 36!");
130803Smarcel
130803Smarcel  size_t slen = str.size();
130803Smarcel
130803Smarcel  // Each computation below needs to know if it's negative.
130803Smarcel  StringRef::iterator p = str.begin();
130803Smarcel  unsigned isNegative = *p == '-';
130803Smarcel  if (*p == '-' || *p == '+') {
130803Smarcel    p++;
130803Smarcel    slen--;
130803Smarcel    assert(slen && "String is only a sign, needs a value.");
130803Smarcel  }
130803Smarcel
130803Smarcel  // For radixes of power-of-two values, the bits required is accurately and
130803Smarcel  // easily computed
130803Smarcel  if (radix == 2)
130803Smarcel    return slen + isNegative;
130803Smarcel  if (radix == 8)
130803Smarcel    return slen * 3 + isNegative;
130803Smarcel  if (radix == 16)
130803Smarcel    return slen * 4 + isNegative;
130803Smarcel
130803Smarcel  // FIXME: base 36
130803Smarcel
130803Smarcel  // This is grossly inefficient but accurate. We could probably do something
130803Smarcel  // with a computation of roughly slen*64/20 and then adjust by the value of
130803Smarcel  // the first few digits. But, I'm not sure how accurate that could be.
130803Smarcel
130803Smarcel  // Compute a sufficient number of bits that is always large enough but might
130803Smarcel  // be too large. This avoids the assertion in the constructor. This
130803Smarcel  // calculation doesn't work appropriately for the numbers 0-9, so just use 4
130803Smarcel  // bits in that case.
130803Smarcel  unsigned sufficient
130803Smarcel    = radix == 10? (slen == 1 ? 4 : slen * 64/18)
130803Smarcel                 : (slen == 1 ? 7 : slen * 16/3);
130803Smarcel
130803Smarcel  // Convert to the actual binary value.
130803Smarcel  APInt tmp(sufficient, StringRef(p, slen), radix);
130803Smarcel
130803Smarcel  // Compute how many bits are required. If the log is infinite, assume we need
130803Smarcel  // just bit.
130803Smarcel  unsigned log = tmp.logBase2();
130803Smarcel  if (log == (unsigned)-1) {
130803Smarcel    return isNegative + 1;
130803Smarcel  } else {
130803Smarcel    return isNegative + log + 1;
130803Smarcel  }
130803Smarcel}
130803Smarcel
// The hashing helpers below were adapted from code by Bob Jenkins,
// http://www.burtleburtle.net.

/// Rotate the 32-bit value \p x left by \p k bits. Callers only pass
/// rotation counts strictly between 0 and 32.
static inline uint32_t hashRot(uint32_t x, unsigned k) {
  return (x << k) | (x >> (32 - k));
}

/// Mixing step applied to the three state words after each group of three
/// 32-bit input chunks.
static inline void hashMix(uint32_t &a, uint32_t &b, uint32_t &c) {
  a -= c;  a ^= hashRot(c, 4);  c += b;
  b -= a;  b ^= hashRot(a, 6);  a += c;
  c -= b;  c ^= hashRot(b, 8);  b += a;
  a -= c;  a ^= hashRot(c,16);  c += b;
  b -= a;  b ^= hashRot(a,19);  a += c;
  c -= b;  c ^= hashRot(b, 4);  b += a;
}

/// Final mixing step applied to the three state words; the hash is read
/// from \p c afterwards.
static inline void hashFinal(uint32_t &a, uint32_t &b, uint32_t &c) {
  c ^= b; c -= hashRot(b,14);
  a ^= c; a -= hashRot(c,11);
  b ^= a; b -= hashRot(a,25);
  c ^= b; c -= hashRot(b,16);
  a ^= c; a -= hashRot(c,4);
  b ^= a; b -= hashRot(a,14);
  c ^= b; c -= hashRot(b,24);
}

// hashword() was adapted from http://www.burtleburtle.net, by Bob
// Jenkins.  k64 points to the key, which is read as an array of uint32_t
// values; length is the length of the key, in 32-bit chunks.  This version
// only handles keys that are a multiple of 32 bits in size.
static inline uint32_t hashword(const uint64_t *k64, size_t length)
{
  const uint32_t *chunk = reinterpret_cast<const uint32_t *>(k64);
  uint32_t a, b, c;

  /* Set up the internal state */
  a = b = c = 0xdeadbeef + (((uint32_t)length)<<2);

  /* Consume the key three chunks at a time while more than three remain */
  for (; length > 3; length -= 3, chunk += 3) {
    a += chunk[0];
    b += chunk[1];
    c += chunk[2];
    hashMix(a, b, c);
  }

  /* Nothing left to add: the state is reported without a final mix */
  if (length == 0)
    return c;

  /* Fold in the last one to three chunks, then do the final mix */
  if (length >= 3)
    c += chunk[2];
  if (length >= 2)
    b += chunk[1];
  a += chunk[0];
  hashFinal(a, b, c);

  return c;
}

// hashword8() was adapted from http://www.burtleburtle.net, by Bob
// Jenkins.  This computes a 32-bit hash from one 64-bit word: the high half
// is added into b, the low half into a, followed by the final mix.
static inline uint32_t hashword8(const uint64_t k64)
{
  uint32_t a, b, c;
  a = b = c = 0xdeadbeef + 4;
  b += k64 >> 32;
  a += k64 & 0xffffffff;
  hashFinal(a, b, c);
  return c;
}
130803Smarcel
130803Smarceluint64_t APInt::getHashValue() const {
130803Smarcel  uint64_t hash;
130803Smarcel  if (isSingleWord())
130803Smarcel    hash = hashword8(VAL);
130803Smarcel  else
130803Smarcel    hash = hashword(pVal, getNumWords()*2);
130803Smarcel  return hash;
130803Smarcel}
130803Smarcel
130803Smarcel/// HiBits - This function returns the high "numBits" bits of this APInt.
130803SmarcelAPInt APInt::getHiBits(unsigned numBits) const {
130803Smarcel  return APIntOps::lshr(*this, BitWidth - numBits);
130803Smarcel}
130803Smarcel
130803Smarcel/// LoBits - This function returns the low "numBits" bits of this APInt.
130803SmarcelAPInt APInt::getLoBits(unsigned numBits) const {
130803Smarcel  return APIntOps::lshr(APIntOps::shl(*this, BitWidth - numBits),
130803Smarcel                        BitWidth - numBits);
130803Smarcel}
130803Smarcel
130803Smarcelunsigned APInt::countLeadingZerosSlowCase() const {
130803Smarcel  // Treat the most significand word differently because it might have
130803Smarcel  // meaningless bits set beyond the precision.
130803Smarcel  unsigned BitsInMSW = BitWidth % APINT_BITS_PER_WORD;
130803Smarcel  integerPart MSWMask;
130803Smarcel  if (BitsInMSW) MSWMask = (integerPart(1) << BitsInMSW) - 1;
130803Smarcel  else {
130803Smarcel    MSWMask = ~integerPart(0);
130803Smarcel    BitsInMSW = APINT_BITS_PER_WORD;
130803Smarcel  }
130803Smarcel
130803Smarcel  unsigned i = getNumWords();
130803Smarcel  integerPart MSW = pVal[i-1] & MSWMask;
130803Smarcel  if (MSW)
130803Smarcel    return CountLeadingZeros_64(MSW) - (APINT_BITS_PER_WORD - BitsInMSW);
130803Smarcel
130803Smarcel  unsigned Count = BitsInMSW;
130803Smarcel  for (--i; i > 0u; --i) {
130803Smarcel    if (pVal[i-1] == 0)
130803Smarcel      Count += APINT_BITS_PER_WORD;
130803Smarcel    else {
130803Smarcel      Count += CountLeadingZeros_64(pVal[i-1]);
130803Smarcel      break;
130803Smarcel    }
130803Smarcel  }
130803Smarcel  return Count;
130803Smarcel}
130803Smarcel
/// Count the consecutive one bits at the top of V after first discarding the
/// "skip" most significant bits (V is shifted left by skip before counting).
static unsigned countLeadingOnes_64(uint64_t V, unsigned skip) {
  const uint64_t topBit = 1ULL << 63;

  // Move the first bit of interest into the top position.
  V <<= skip;

  unsigned ones = 0;
  for (; V & topBit; V <<= 1)
    ++ones;
  return ones;
}
130803Smarcel
130803Smarcelunsigned APInt::countLeadingOnes() const {
130803Smarcel  if (isSingleWord())
130803Smarcel    return countLeadingOnes_64(VAL, APINT_BITS_PER_WORD - BitWidth);
130803Smarcel
130803Smarcel  unsigned highWordBits = BitWidth % APINT_BITS_PER_WORD;
130803Smarcel  unsigned shift;
130803Smarcel  if (!highWordBits) {
130803Smarcel    highWordBits = APINT_BITS_PER_WORD;
130803Smarcel    shift = 0;
130803Smarcel  } else {
130803Smarcel    shift = APINT_BITS_PER_WORD - highWordBits;
130803Smarcel  }
130803Smarcel  int i = getNumWords() - 1;
130803Smarcel  unsigned Count = countLeadingOnes_64(pVal[i], shift);
130803Smarcel  if (Count == highWordBits) {
130803Smarcel    for (i--; i >= 0; --i) {
130803Smarcel      if (pVal[i] == -1ULL)
130803Smarcel        Count += APINT_BITS_PER_WORD;
130803Smarcel      else {
130803Smarcel        Count += countLeadingOnes_64(pVal[i], 0);
130803Smarcel        break;
130803Smarcel      }
130803Smarcel    }
130803Smarcel  }
130803Smarcel  return Count;
130803Smarcel}
130803Smarcel
130803Smarcelunsigned APInt::countTrailingZeros() const {
130803Smarcel  if (isSingleWord())
130803Smarcel    return std::min(unsigned(CountTrailingZeros_64(VAL)), BitWidth);
130803Smarcel  unsigned Count = 0;
130803Smarcel  unsigned i = 0;
130803Smarcel  for (; i < getNumWords() && pVal[i] == 0; ++i)
130803Smarcel    Count += APINT_BITS_PER_WORD;
130803Smarcel  if (i < getNumWords())
130803Smarcel    Count += CountTrailingZeros_64(pVal[i]);
130803Smarcel  return std::min(Count, BitWidth);
130803Smarcel}
130803Smarcel
130803Smarcelunsigned APInt::countTrailingOnesSlowCase() const {
130803Smarcel  unsigned Count = 0;
130803Smarcel  unsigned i = 0;
130803Smarcel  for (; i < getNumWords() && pVal[i] == -1ULL; ++i)
130803Smarcel    Count += APINT_BITS_PER_WORD;
130803Smarcel  if (i < getNumWords())
130803Smarcel    Count += CountTrailingOnes_64(pVal[i]);
130803Smarcel  return std::min(Count, BitWidth);
130803Smarcel}
130803Smarcel
130803Smarcelunsigned APInt::countPopulationSlowCase() const {
130803Smarcel  unsigned Count = 0;
130803Smarcel  for (unsigned i = 0; i < getNumWords(); ++i)
130803Smarcel    Count += CountPopulation_64(pVal[i]);
130803Smarcel  return Count;
130803Smarcel}
130803Smarcel
130803SmarcelAPInt APInt::byteSwap() const {
130803Smarcel  assert(BitWidth >= 16 && BitWidth % 16 == 0 && "Cannot byteswap!");
130803Smarcel  if (BitWidth == 16)
130803Smarcel    return APInt(BitWidth, ByteSwap_16(uint16_t(VAL)));
130803Smarcel  else if (BitWidth == 32)
130803Smarcel    return APInt(BitWidth, ByteSwap_32(unsigned(VAL)));
130803Smarcel  else if (BitWidth == 48) {
130803Smarcel    unsigned Tmp1 = unsigned(VAL >> 16);
130803Smarcel    Tmp1 = ByteSwap_32(Tmp1);
130803Smarcel    uint16_t Tmp2 = uint16_t(VAL);
130803Smarcel    Tmp2 = ByteSwap_16(Tmp2);
130803Smarcel    return APInt(BitWidth, (uint64_t(Tmp2) << 32) | Tmp1);
130803Smarcel  } else if (BitWidth == 64)
130803Smarcel    return APInt(BitWidth, ByteSwap_64(VAL));
130803Smarcel  else {
130803Smarcel    APInt Result(BitWidth, 0);
130803Smarcel    char *pByte = (char*)Result.pVal;
130803Smarcel    for (unsigned i = 0; i < BitWidth / APINT_WORD_SIZE / 2; ++i) {
130803Smarcel      char Tmp = pByte[i];
130803Smarcel      pByte[i] = pByte[BitWidth / APINT_WORD_SIZE - 1 - i];
130803Smarcel      pByte[BitWidth / APINT_WORD_SIZE - i - 1] = Tmp;
130803Smarcel    }
130803Smarcel    return Result;
130803Smarcel  }
130803Smarcel}
130803Smarcel
130803SmarcelAPInt llvm::APIntOps::GreatestCommonDivisor(const APInt& API1,
130803Smarcel                                            const APInt& API2) {
130803Smarcel  APInt A = API1, B = API2;
130803Smarcel  while (!!B) {
130803Smarcel    APInt T = B;
130803Smarcel    B = APIntOps::urem(A, B);
130803Smarcel    A = T;
130803Smarcel  }
130803Smarcel  return A;
130803Smarcel}
130803Smarcel
130803SmarcelAPInt llvm::APIntOps::RoundDoubleToAPInt(double Double, unsigned width) {
130803Smarcel  union {
130803Smarcel    double D;
130803Smarcel    uint64_t I;
130803Smarcel  } T;
130803Smarcel  T.D = Double;
130803Smarcel
130803Smarcel  // Get the sign bit from the highest order bit
130803Smarcel  bool isNeg = T.I >> 63;
130803Smarcel
130803Smarcel  // Get the 11-bit exponent and adjust for the 1023 bit bias
130803Smarcel  int64_t exp = ((T.I >> 52) & 0x7ff) - 1023;
130803Smarcel
130803Smarcel  // If the exponent is negative, the value is < 0 so just return 0.
130803Smarcel  if (exp < 0)
130803Smarcel    return APInt(width, 0u);
130803Smarcel
130803Smarcel  // Extract the mantissa by clearing the top 12 bits (sign + exponent).
130803Smarcel  uint64_t mantissa = (T.I & (~0ULL >> 12)) | 1ULL << 52;
130803Smarcel
130803Smarcel  // If the exponent doesn't shift all bits out of the mantissa
130803Smarcel  if (exp < 52)
130803Smarcel    return isNeg ? -APInt(width, mantissa >> (52 - exp)) :
130803Smarcel                    APInt(width, mantissa >> (52 - exp));
130803Smarcel
130803Smarcel  // If the client didn't provide enough bits for us to shift the mantissa into
130803Smarcel  // then the result is undefined, just return 0
130803Smarcel  if (width <= exp - 52)
130803Smarcel    return APInt(width, 0);
130803Smarcel
130803Smarcel  // Otherwise, we have to shift the mantissa bits up to the right location
130803Smarcel  APInt Tmp(width, mantissa);
130803Smarcel  Tmp = Tmp.shl((unsigned)exp - 52);
130803Smarcel  return isNeg ? -Tmp : Tmp;
130803Smarcel}
130803Smarcel
130803Smarcel/// RoundToDouble - This function converts this APInt to a double.
130803Smarcel/// The layout for double is as following (IEEE Standard 754):
130803Smarcel///  --------------------------------------
130803Smarcel/// |  Sign    Exponent    Fraction    Bias |
130803Smarcel/// |-------------------------------------- |
130803Smarcel/// |  1[63]   11[62-52]   52[51-00]   1023 |
130803Smarcel///  --------------------------------------
130803Smarceldouble APInt::roundToDouble(bool isSigned) const {
130803Smarcel
130803Smarcel  // Handle the simple case where the value is contained in one uint64_t.
130803Smarcel  // It is wrong to optimize getWord(0) to VAL; there might be more than one word.
130803Smarcel  if (isSingleWord() || getActiveBits() <= APINT_BITS_PER_WORD) {
130803Smarcel    if (isSigned) {
130803Smarcel      int64_t sext = (int64_t(getWord(0)) << (64-BitWidth)) >> (64-BitWidth);
130803Smarcel      return double(sext);
130803Smarcel    } else
130803Smarcel      return double(getWord(0));
130803Smarcel  }
130803Smarcel
130803Smarcel  // Determine if the value is negative.
130803Smarcel  bool isNeg = isSigned ? (*this)[BitWidth-1] : false;
130803Smarcel
130803Smarcel  // Construct the absolute value if we're negative.
130803Smarcel  APInt Tmp(isNeg ? -(*this) : (*this));
130803Smarcel
130803Smarcel  // Figure out how many bits we're using.
130803Smarcel  unsigned n = Tmp.getActiveBits();
130803Smarcel
130803Smarcel  // The exponent (without bias normalization) is just the number of bits
130803Smarcel  // we are using. Note that the sign bit is gone since we constructed the
130803Smarcel  // absolute value.
130803Smarcel  uint64_t exp = n;
130803Smarcel
130803Smarcel  // Return infinity for exponent overflow
130803Smarcel  if (exp > 1023) {
130803Smarcel    if (!isSigned || !isNeg)
130803Smarcel      return std::numeric_limits<double>::infinity();
130803Smarcel    else
130803Smarcel      return -std::numeric_limits<double>::infinity();
130803Smarcel  }
130803Smarcel  exp += 1023; // Increment for 1023 bias
130803Smarcel
130803Smarcel  // Number of bits in mantissa is 52. To obtain the mantissa value, we must
130803Smarcel  // extract the high 52 bits from the correct words in pVal.
130803Smarcel  uint64_t mantissa;
130803Smarcel  unsigned hiWord = whichWord(n-1);
130803Smarcel  if (hiWord == 0) {
130803Smarcel    mantissa = Tmp.pVal[0];
130803Smarcel    if (n > 52)
130803Smarcel      mantissa >>= n - 52; // shift down, we want the top 52 bits.
130803Smarcel  } else {
130803Smarcel    assert(hiWord > 0 && "huh?");
130803Smarcel    uint64_t hibits = Tmp.pVal[hiWord] << (52 - n % APINT_BITS_PER_WORD);
130803Smarcel    uint64_t lobits = Tmp.pVal[hiWord-1] >> (11 + n % APINT_BITS_PER_WORD);
130803Smarcel    mantissa = hibits | lobits;
130803Smarcel  }
130803Smarcel
130803Smarcel  // The leading bit of mantissa is implicit, so get rid of it.
130803Smarcel  uint64_t sign = isNeg ? (1ULL << (APINT_BITS_PER_WORD - 1)) : 0;
130803Smarcel  union {
130803Smarcel    double D;
130803Smarcel    uint64_t I;
130803Smarcel  } T;
130803Smarcel  T.I = sign | (exp << 52) | mantissa;
130803Smarcel  return T.D;
130803Smarcel}
130803Smarcel
130803Smarcel// Truncate to new width.
130803SmarcelAPInt APInt::trunc(unsigned width) const {
130803Smarcel  assert(width < BitWidth && "Invalid APInt Truncate request");
130803Smarcel  assert(width && "Can't truncate to 0 bits");
130803Smarcel
130803Smarcel  if (width <= APINT_BITS_PER_WORD)
130803Smarcel    return APInt(width, getRawData()[0]);
130803Smarcel
130803Smarcel  APInt Result(getMemory(getNumWords(width)), width);
130803Smarcel
130803Smarcel  // Copy full words.
130803Smarcel  unsigned i;
130803Smarcel  for (i = 0; i != width / APINT_BITS_PER_WORD; i++)
130803Smarcel    Result.pVal[i] = pVal[i];
130803Smarcel
130803Smarcel  // Truncate and copy any partial word.
130803Smarcel  unsigned bits = (0 - width) % APINT_BITS_PER_WORD;
130803Smarcel  if (bits != 0)
130803Smarcel    Result.pVal[i] = pVal[i] << bits >> bits;
130803Smarcel
130803Smarcel  return Result;
130803Smarcel}
130803Smarcel
130803Smarcel// Sign extend to a new width.
130803SmarcelAPInt APInt::sext(unsigned width) const {
130803Smarcel  assert(width > BitWidth && "Invalid APInt SignExtend request");
130803Smarcel
130803Smarcel  if (width <= APINT_BITS_PER_WORD) {
130803Smarcel    uint64_t val = VAL << (APINT_BITS_PER_WORD - BitWidth);
130803Smarcel    val = (int64_t)val >> (width - BitWidth);
130803Smarcel    return APInt(width, val >> (APINT_BITS_PER_WORD - width));
130803Smarcel  }
130803Smarcel
130803Smarcel  APInt Result(getMemory(getNumWords(width)), width);
130803Smarcel
130803Smarcel  // Copy full words.
130803Smarcel  unsigned i;
130803Smarcel  uint64_t word = 0;
130803Smarcel  for (i = 0; i != BitWidth / APINT_BITS_PER_WORD; i++) {
130803Smarcel    word = getRawData()[i];
130803Smarcel    Result.pVal[i] = word;
130803Smarcel  }
130803Smarcel
130803Smarcel  // Read and sign-extend any partial word.
130803Smarcel  unsigned bits = (0 - BitWidth) % APINT_BITS_PER_WORD;
130803Smarcel  if (bits != 0)
130803Smarcel    word = (int64_t)getRawData()[i] << bits >> bits;
130803Smarcel  else
130803Smarcel    word = (int64_t)word >> (APINT_BITS_PER_WORD - 1);
130803Smarcel
130803Smarcel  // Write remaining full words.
130803Smarcel  for (; i != width / APINT_BITS_PER_WORD; i++) {
130803Smarcel    Result.pVal[i] = word;
130803Smarcel    word = (int64_t)word >> (APINT_BITS_PER_WORD - 1);
130803Smarcel  }
130803Smarcel
130803Smarcel  // Write any partial word.
130803Smarcel  bits = (0 - width) % APINT_BITS_PER_WORD;
130803Smarcel  if (bits != 0)
130803Smarcel    Result.pVal[i] = word << bits >> bits;
130803Smarcel
130803Smarcel  return Result;
130803Smarcel}
130803Smarcel
130803Smarcel//  Zero extend to a new width.
130803SmarcelAPInt APInt::zext(unsigned width) const {
130803Smarcel  assert(width > BitWidth && "Invalid APInt ZeroExtend request");
130803Smarcel
130803Smarcel  if (width <= APINT_BITS_PER_WORD)
130803Smarcel    return APInt(width, VAL);
130803Smarcel
130803Smarcel  APInt Result(getMemory(getNumWords(width)), width);
130803Smarcel
130803Smarcel  // Copy words.
130803Smarcel  unsigned i;
130803Smarcel  for (i = 0; i != getNumWords(); i++)
130803Smarcel    Result.pVal[i] = getRawData()[i];
130803Smarcel
130803Smarcel  // Zero remaining words.
130803Smarcel  memset(&Result.pVal[i], 0, (Result.getNumWords() - i) * APINT_WORD_SIZE);
130803Smarcel
130803Smarcel  return Result;
130803Smarcel}
130803Smarcel
130803SmarcelAPInt APInt::zextOrTrunc(unsigned width) const {
130803Smarcel  if (BitWidth < width)
130803Smarcel    return zext(width);
130803Smarcel  if (BitWidth > width)
130803Smarcel    return trunc(width);
130803Smarcel  return *this;
130803Smarcel}
130803Smarcel
130803SmarcelAPInt APInt::sextOrTrunc(unsigned width) const {
130803Smarcel  if (BitWidth < width)
130803Smarcel    return sext(width);
130803Smarcel  if (BitWidth > width)
130803Smarcel    return trunc(width);
130803Smarcel  return *this;
130803Smarcel}
130803Smarcel
130803Smarcel/// Arithmetic right-shift this APInt by shiftAmt.
130803Smarcel/// @brief Arithmetic right-shift function.
130803SmarcelAPInt APInt::ashr(const APInt &shiftAmt) const {
130803Smarcel  return ashr((unsigned)shiftAmt.getLimitedValue(BitWidth));
130803Smarcel}
130803Smarcel
/// Arithmetic right-shift this APInt by shiftAmt, which must not exceed
/// BitWidth.  The vacated high bits are filled with copies of the sign bit.
///
/// Shifting by exactly BitWidth is treated as undefined: the single-word path
/// returns 0, while the multi-word path returns -1 for negative values and 0
/// otherwise.
/// @brief Arithmetic right-shift function.
APInt APInt::ashr(unsigned shiftAmt) const {
  assert(shiftAmt <= BitWidth && "Invalid shift amount");
  // Handle a degenerate case
  if (shiftAmt == 0)
    return *this;

  // Handle single word shifts with built-in ashr
  if (isSingleWord()) {
    if (shiftAmt == BitWidth)
      return APInt(BitWidth, 0); // undefined
    else {
      // Number of unused bits above the value; shifting left and back right
      // by this amount sign extends the value to 64 bits.
      unsigned SignBit = APINT_BITS_PER_WORD - BitWidth;
      return APInt(BitWidth,
        (((int64_t(VAL) << SignBit) >> SignBit) >> shiftAmt));
    }
  }

  // If all the bits were shifted out, the result is, technically, undefined.
  // We return -1 if it was negative, 0 otherwise. We check this early to avoid
  // issues in the algorithm below.
  if (shiftAmt == BitWidth) {
    if (isNegative())
      return APInt(BitWidth, -1ULL, true);
    else
      return APInt(BitWidth, 0);
  }

  // Create some space for the result.
  uint64_t * val = new uint64_t[getNumWords()];

  // Compute some values needed by the following shift algorithms
  unsigned wordShift = shiftAmt % APINT_BITS_PER_WORD; // bits to shift per word
  unsigned offset = shiftAmt / APINT_BITS_PER_WORD; // word offset for shift
  unsigned breakWord = getNumWords() - 1 - offset; // last word affected
  unsigned bitsInWord = whichBit(BitWidth); // how many bits in last word?
  if (bitsInWord == 0)
    bitsInWord = APINT_BITS_PER_WORD;

  // If we are shifting whole words, just move whole words
  if (wordShift == 0) {
    // Move the words containing significant bits
    for (unsigned i = 0; i <= breakWord; ++i)
      val[i] = pVal[i+offset]; // move whole word

    // Adjust the top significant word for sign bit fill, if negative
    if (isNegative())
      if (bitsInWord < APINT_BITS_PER_WORD)
        val[breakWord] |= ~0ULL << bitsInWord; // set high bits
  } else {
    // Shift the low order words
    for (unsigned i = 0; i < breakWord; ++i) {
      // This combines the shifted corresponding word with the low bits from
      // the next word (shifted into this word's high bits).
      val[i] = (pVal[i+offset] >> wordShift) |
               (pVal[i+offset+1] << (APINT_BITS_PER_WORD - wordShift));
    }

    // Shift the break word. In this case there are no bits from the next word
    // to include in this word.
    val[breakWord] = pVal[breakWord+offset] >> wordShift;

    // Deal with sign extension in the break word, and possibly the word before
    // it.
    if (isNegative()) {
      if (wordShift > bitsInWord) {
        // The shift moved every bit of the top source word out of the break
        // word, so the sign fill also starts inside the word below it.
        if (breakWord > 0)
          val[breakWord-1] |=
            ~0ULL << (APINT_BITS_PER_WORD - (wordShift - bitsInWord));
        val[breakWord] |= ~0ULL;
      } else
        val[breakWord] |= (~0ULL << (bitsInWord - wordShift));
    }
  }

  // Remaining words are 0 or -1, just assign them.
  uint64_t fillValue = (isNegative() ? -1ULL : 0);
  for (unsigned i = breakWord+1; i < getNumWords(); ++i)
    val[i] = fillValue;
  // The sign fill may have set bits beyond BitWidth in the top word; clear
  // them before returning.
  return APInt(val, BitWidth).clearUnusedBits();
}
130803Smarcel
130803Smarcel/// Logical right-shift this APInt by shiftAmt.
130803Smarcel/// @brief Logical right-shift function.
130803SmarcelAPInt APInt::lshr(const APInt &shiftAmt) const {
130803Smarcel  return lshr((unsigned)shiftAmt.getLimitedValue(BitWidth));
130803Smarcel}
130803Smarcel
130803Smarcel/// Logical right-shift this APInt by shiftAmt.
130803Smarcel/// @brief Logical right-shift function.
130803SmarcelAPInt APInt::lshr(unsigned shiftAmt) const {
130803Smarcel  if (isSingleWord()) {
130803Smarcel    if (shiftAmt == BitWidth)
130803Smarcel      return APInt(BitWidth, 0);
130803Smarcel    else
130803Smarcel      return APInt(BitWidth, this->VAL >> shiftAmt);
130803Smarcel  }
130803Smarcel
130803Smarcel  // If all the bits were shifted out, the result is 0. This avoids issues
130803Smarcel  // with shifting by the size of the integer type, which produces undefined
130803Smarcel  // results. We define these "undefined results" to always be 0.
130803Smarcel  if (shiftAmt == BitWidth)
130803Smarcel    return APInt(BitWidth, 0);
130803Smarcel
130803Smarcel  // If none of the bits are shifted out, the result is *this. This avoids
130803Smarcel  // issues with shifting by the size of the integer type, which produces
130803Smarcel  // undefined results in the code below. This is also an optimization.
130803Smarcel  if (shiftAmt == 0)
130803Smarcel    return *this;
130803Smarcel
130803Smarcel  // Create some space for the result.
130803Smarcel  uint64_t * val = new uint64_t[getNumWords()];
130803Smarcel
130803Smarcel  // If we are shifting less than a word, compute the shift with a simple carry
130803Smarcel  if (shiftAmt < APINT_BITS_PER_WORD) {
130803Smarcel    uint64_t carry = 0;
130803Smarcel    for (int i = getNumWords()-1; i >= 0; --i) {
130803Smarcel      val[i] = (pVal[i] >> shiftAmt) | carry;
130803Smarcel      carry = pVal[i] << (APINT_BITS_PER_WORD - shiftAmt);
130803Smarcel    }
130803Smarcel    return APInt(val, BitWidth).clearUnusedBits();
130803Smarcel  }
130803Smarcel
130803Smarcel  // Compute some values needed by the remaining shift algorithms
130803Smarcel  unsigned wordShift = shiftAmt % APINT_BITS_PER_WORD;
130803Smarcel  unsigned offset = shiftAmt / APINT_BITS_PER_WORD;
130803Smarcel
130803Smarcel  // If we are shifting whole words, just move whole words
130803Smarcel  if (wordShift == 0) {
130803Smarcel    for (unsigned i = 0; i < getNumWords() - offset; ++i)
130803Smarcel      val[i] = pVal[i+offset];
130803Smarcel    for (unsigned i = getNumWords()-offset; i < getNumWords(); i++)
130803Smarcel      val[i] = 0;
130803Smarcel    return APInt(val,BitWidth).clearUnusedBits();
130803Smarcel  }
130803Smarcel
130803Smarcel  // Shift the low order words
130803Smarcel  unsigned breakWord = getNumWords() - offset -1;
130803Smarcel  for (unsigned i = 0; i < breakWord; ++i)
130803Smarcel    val[i] = (pVal[i+offset] >> wordShift) |
130803Smarcel             (pVal[i+offset+1] << (APINT_BITS_PER_WORD - wordShift));
130803Smarcel  // Shift the break word.
130803Smarcel  val[breakWord] = pVal[breakWord+offset] >> wordShift;
130803Smarcel
130803Smarcel  // Remaining words are 0
130803Smarcel  for (unsigned i = breakWord+1; i < getNumWords(); ++i)
130803Smarcel    val[i] = 0;
130803Smarcel  return APInt(val, BitWidth).clearUnusedBits();
130803Smarcel}
130803Smarcel
130803Smarcel/// Left-shift this APInt by shiftAmt.
130803Smarcel/// @brief Left-shift function.
130803SmarcelAPInt APInt::shl(const APInt &shiftAmt) const {
130803Smarcel  // It's undefined behavior in C to shift by BitWidth or greater.
130803Smarcel  return shl((unsigned)shiftAmt.getLimitedValue(BitWidth));
130803Smarcel}
130803Smarcel
130803SmarcelAPInt APInt::shlSlowCase(unsigned shiftAmt) const {
130803Smarcel  // If all the bits were shifted out, the result is 0. This avoids issues
130803Smarcel  // with shifting by the size of the integer type, which produces undefined
130803Smarcel  // results. We define these "undefined results" to always be 0.
130803Smarcel  if (shiftAmt == BitWidth)
130803Smarcel    return APInt(BitWidth, 0);
130803Smarcel
130803Smarcel  // If none of the bits are shifted out, the result is *this. This avoids a
130803Smarcel  // lshr by the words size in the loop below which can produce incorrect
130803Smarcel  // results. It also avoids the expensive computation below for a common case.
130803Smarcel  if (shiftAmt == 0)
130803Smarcel    return *this;
130803Smarcel
130803Smarcel  // Create some space for the result.
130803Smarcel  uint64_t * val = new uint64_t[getNumWords()];
130803Smarcel
130803Smarcel  // If we are shifting less than a word, do it the easy way
130803Smarcel  if (shiftAmt < APINT_BITS_PER_WORD) {
130803Smarcel    uint64_t carry = 0;
130803Smarcel    for (unsigned i = 0; i < getNumWords(); i++) {
130803Smarcel      val[i] = pVal[i] << shiftAmt | carry;
130803Smarcel      carry = pVal[i] >> (APINT_BITS_PER_WORD - shiftAmt);
130803Smarcel    }
130803Smarcel    return APInt(val, BitWidth).clearUnusedBits();
130803Smarcel  }
130803Smarcel
130803Smarcel  // Compute some values needed by the remaining shift algorithms
130803Smarcel  unsigned wordShift = shiftAmt % APINT_BITS_PER_WORD;
130803Smarcel  unsigned offset = shiftAmt / APINT_BITS_PER_WORD;
130803Smarcel
130803Smarcel  // If we are shifting whole words, just move whole words
130803Smarcel  if (wordShift == 0) {
130803Smarcel    for (unsigned i = 0; i < offset; i++)
130803Smarcel      val[i] = 0;
130803Smarcel    for (unsigned i = offset; i < getNumWords(); i++)
130803Smarcel      val[i] = pVal[i-offset];
130803Smarcel    return APInt(val,BitWidth).clearUnusedBits();
130803Smarcel  }
130803Smarcel
130803Smarcel  // Copy whole words from this to Result.
130803Smarcel  unsigned i = getNumWords() - 1;
130803Smarcel  for (; i > offset; --i)
130803Smarcel    val[i] = pVal[i-offset] << wordShift |
130803Smarcel             pVal[i-offset-1] >> (APINT_BITS_PER_WORD - wordShift);
130803Smarcel  val[offset] = pVal[0] << wordShift;
130803Smarcel  for (i = 0; i < offset; ++i)
130803Smarcel    val[i] = 0;
130803Smarcel  return APInt(val, BitWidth).clearUnusedBits();
130803Smarcel}
130803Smarcel
130803SmarcelAPInt APInt::rotl(const APInt &rotateAmt) const {
130803Smarcel  return rotl((unsigned)rotateAmt.getLimitedValue(BitWidth));
130803Smarcel}
130803Smarcel
130803SmarcelAPInt APInt::rotl(unsigned rotateAmt) const {
130803Smarcel  if (rotateAmt == 0)
130803Smarcel    return *this;
130803Smarcel  // Don't get too fancy, just use existing shift/or facilities
130803Smarcel  APInt hi(*this);
130803Smarcel  APInt lo(*this);
130803Smarcel  hi.shl(rotateAmt);
130803Smarcel  lo.lshr(BitWidth - rotateAmt);
130803Smarcel  return hi | lo;
130803Smarcel}
130803Smarcel
130803SmarcelAPInt APInt::rotr(const APInt &rotateAmt) const {
130803Smarcel  return rotr((unsigned)rotateAmt.getLimitedValue(BitWidth));
130803Smarcel}
130803Smarcel
130803SmarcelAPInt APInt::rotr(unsigned rotateAmt) const {
130803Smarcel  if (rotateAmt == 0)
130803Smarcel    return *this;
130803Smarcel  // Don't get too fancy, just use existing shift/or facilities
130803Smarcel  APInt hi(*this);
130803Smarcel  APInt lo(*this);
130803Smarcel  lo.lshr(rotateAmt);
130803Smarcel  hi.shl(BitWidth - rotateAmt);
130803Smarcel  return hi | lo;
130803Smarcel}
130803Smarcel
// Square Root - this method computes and returns the square root of "this",
// treating the value as unsigned. The result has the same bit width.
// Three mechanisms are used for computation. For small values (<= 5 bits),
// a table lookup is done. This gets some performance for common cases. For
// values using less than 52 bits, the value is converted to double and then
// the libc sqrt function is called. The result is rounded and then converted
// back to a uint64_t which is then used to construct the result. Finally,
// the Babylonian method for computing square roots is used.
APInt APInt::sqrt() const {

  // Determine the magnitude of the value.
  unsigned magnitude = getActiveBits();

  // Use a fast table for some small values. This also gets rid of some
  // rounding errors in libc sqrt for small values.
  if (magnitude <= 5) {
    // Indexed by the value itself (0..31); each entry is the square root
    // rounded to the nearest integer.
    static const uint8_t results[32] = {
      /*     0 */ 0,
      /*  1- 2 */ 1, 1,
      /*  3- 6 */ 2, 2, 2, 2,
      /*  7-12 */ 3, 3, 3, 3, 3, 3,
      /* 13-20 */ 4, 4, 4, 4, 4, 4, 4, 4,
      /* 21-30 */ 5, 5, 5, 5, 5, 5, 5, 5, 5, 5,
      /*    31 */ 6
    };
    return APInt(BitWidth, results[ (isSingleWord() ? VAL : pVal[0]) ]);
  }

  // If the magnitude of the value fits in less than 52 bits (the precision of
  // an IEEE double precision floating point value), then we can use the
  // libc sqrt function which will probably use a hardware sqrt computation.
  // This should be faster than the algorithm below.
  if (magnitude < 52) {
#if HAVE_ROUND
    return APInt(BitWidth,
                 uint64_t(::round(::sqrt(double(isSingleWord()?VAL:pVal[0])))));
#else
    // No round() available: add 0.5 and truncate instead.
    return APInt(BitWidth,
                 uint64_t(::sqrt(double(isSingleWord()?VAL:pVal[0])) + 0.5));
#endif
  }

  // Okay, all the short cuts are exhausted. We must compute it. The following
  // is a classical Babylonian method for computing the square root. This code
  // was adapted to APInt from a wikipedia article on such computations.
  // See http://www.wikipedia.org/ and go to the page named
  // Calculate_an_integer_square_root.
  unsigned nbits = BitWidth, i = 4;
  APInt testy(BitWidth, 16);
  APInt x_old(BitWidth, 1);
  APInt x_new(BitWidth, 0);
  APInt two(BitWidth, 2);

  // Select a good starting value using binary logarithms: find an even power
  // of two 2^i that is not below the value (or run out of bits) and start
  // from 2^(i/2).
  for (;; i += 2, testy = testy.shl(2))
    if (i >= nbits || this->ule(testy)) {
      x_old = x_old.shl(i / 2);
      break;
    }

  // Use the Babylonian method to arrive at the integer square root: iterate
  // x_new = (this / x_old + x_old) / 2 until the estimate stops decreasing.
  for (;;) {
    x_new = (this->udiv(x_old) + x_old).udiv(two);
    if (x_old.ule(x_new))
      break;
    x_old = x_new;
  }

  // Make sure we return the closest approximation
  // NOTE: The rounding calculation below is correct. It will produce an
  // off-by-one discrepancy with results from pari/gp. That discrepancy has been
  // determined to be a rounding issue with pari/gp as it begins to use a
  // floating point representation after 192 bits. There are no discrepancies
  // between this algorithm and pari/gp for bit widths < 192 bits.
  // NOTE(review): when *this == x_old*x_old + x_old the code below returns
  // x_old + 1, whereas the lookup table above rounds the same shape of value
  // (e.g. 6 and 12) down -- confirm which tie behavior is intended.
  APInt square(x_old * x_old);
  APInt nextSquare((x_old + 1) * (x_old +1));
  if (this->ult(square))
    return x_old;
  else if (this->ule(nextSquare)) {
    // The value lies between the two squares; pick whichever root is closer.
    APInt midpoint((nextSquare - square).udiv(two));
    APInt offset(*this - square);
    if (offset.ult(midpoint))
      return x_old;
    else
      return x_old + 1;
  } else
    llvm_unreachable("Error in APInt::sqrt computation");
  // Not reached: every branch above returns or is marked unreachable.
  return x_old + 1;
}
130803Smarcel
130803Smarcel/// Computes the multiplicative inverse of this APInt for a given modulo. The
130803Smarcel/// iterative extended Euclidean algorithm is used to solve for this value,
130803Smarcel/// however we simplify it to speed up calculating only the inverse, and take
130803Smarcel/// advantage of div+rem calculations. We also use some tricks to avoid copying
130803Smarcel/// (potentially large) APInts around.
130803SmarcelAPInt APInt::multiplicativeInverse(const APInt& modulo) const {
130803Smarcel  assert(ult(modulo) && "This APInt must be smaller than the modulo");
130803Smarcel
130803Smarcel  // Using the properties listed at the following web page (accessed 06/21/08):
130803Smarcel  //   http://www.numbertheory.org/php/euclid.html
130803Smarcel  // (especially the properties numbered 3, 4 and 9) it can be proved that
130803Smarcel  // BitWidth bits suffice for all the computations in the algorithm implemented
130803Smarcel  // below. More precisely, this number of bits suffice if the multiplicative
130803Smarcel  // inverse exists, but may not suffice for the general extended Euclidean
130803Smarcel  // algorithm.
130803Smarcel
130803Smarcel  APInt r[2] = { modulo, *this };
130803Smarcel  APInt t[2] = { APInt(BitWidth, 0), APInt(BitWidth, 1) };
130803Smarcel  APInt q(BitWidth, 0);
130803Smarcel
130803Smarcel  unsigned i;
130803Smarcel  for (i = 0; r[i^1] != 0; i ^= 1) {
130803Smarcel    // An overview of the math without the confusing bit-flipping:
130803Smarcel    // q = r[i-2] / r[i-1]
130803Smarcel    // r[i] = r[i-2] % r[i-1]
130803Smarcel    // t[i] = t[i-2] - t[i-1] * q
130803Smarcel    udivrem(r[i], r[i^1], q, r[i]);
130803Smarcel    t[i] -= t[i^1] * q;
130803Smarcel  }
130803Smarcel
130803Smarcel  // If this APInt and the modulo are not coprime, there is no multiplicative
130803Smarcel  // inverse, so return 0. We check this by looking at the next-to-last
130803Smarcel  // remainder, which is the gcd(*this,modulo) as calculated by the Euclidean
130803Smarcel  // algorithm.
130803Smarcel  if (r[i] != 1)
130803Smarcel    return APInt(BitWidth, 0);
130803Smarcel
130803Smarcel  // The next-to-last t is the multiplicative inverse.  However, we are
130803Smarcel  // interested in a positive inverse. Calcuate a positive one from a negative
130803Smarcel  // one if necessary. A simple addition of the modulo suffices because
130803Smarcel  // abs(t[i]) is known to be less than *this/2 (see the link above).
130803Smarcel  return t[i].isNegative() ? t[i] + modulo : t[i];
130803Smarcel}
130803Smarcel
130803Smarcel/// Calculate the magic numbers required to implement a signed integer division
130803Smarcel/// by a constant as a sequence of multiplies, adds and shifts.  Requires that
130803Smarcel/// the divisor not be 0, 1, or -1.  Taken from "Hacker's Delight", Henry S.
130803Smarcel/// Warren, Jr., chapter 10.
130803SmarcelAPInt::ms APInt::magic() const {
130803Smarcel  const APInt& d = *this;
130803Smarcel  unsigned p;
130803Smarcel  APInt ad, anc, delta, q1, r1, q2, r2, t;
130803Smarcel  APInt signedMin = APInt::getSignedMinValue(d.getBitWidth());
130803Smarcel  struct ms mag;
130803Smarcel
130803Smarcel  ad = d.abs();
130803Smarcel  t = signedMin + (d.lshr(d.getBitWidth() - 1));
130803Smarcel  anc = t - 1 - t.urem(ad);   // absolute value of nc
130803Smarcel  p = d.getBitWidth() - 1;    // initialize p
130803Smarcel  q1 = signedMin.udiv(anc);   // initialize q1 = 2p/abs(nc)
130803Smarcel  r1 = signedMin - q1*anc;    // initialize r1 = rem(2p,abs(nc))
130803Smarcel  q2 = signedMin.udiv(ad);    // initialize q2 = 2p/abs(d)
130803Smarcel  r2 = signedMin - q2*ad;     // initialize r2 = rem(2p,abs(d))
130803Smarcel  do {
130803Smarcel    p = p + 1;
130803Smarcel    q1 = q1<<1;          // update q1 = 2p/abs(nc)
130803Smarcel    r1 = r1<<1;          // update r1 = rem(2p/abs(nc))
130803Smarcel    if (r1.uge(anc)) {  // must be unsigned comparison
130803Smarcel      q1 = q1 + 1;
130803Smarcel      r1 = r1 - anc;
130803Smarcel    }
130803Smarcel    q2 = q2<<1;          // update q2 = 2p/abs(d)
130803Smarcel    r2 = r2<<1;          // update r2 = rem(2p/abs(d))
130803Smarcel    if (r2.uge(ad)) {   // must be unsigned comparison
130803Smarcel      q2 = q2 + 1;
130803Smarcel      r2 = r2 - ad;
130803Smarcel    }
130803Smarcel    delta = ad - r2;
130803Smarcel  } while (q1.ult(delta) || (q1 == delta && r1 == 0));
130803Smarcel
130803Smarcel  mag.m = q2 + 1;
130803Smarcel  if (d.isNegative()) mag.m = -mag.m;   // resulting magic number
130803Smarcel  mag.s = p - d.getBitWidth();          // resulting shift
130803Smarcel  return mag;
130803Smarcel}
130803Smarcel
130803Smarcel/// Calculate the magic numbers required to implement an unsigned integer
130803Smarcel/// division by a constant as a sequence of multiplies, adds and shifts.
130803Smarcel/// Requires that the divisor not be 0.  Taken from "Hacker's Delight", Henry
130803Smarcel/// S. Warren, Jr., chapter 10.
130803Smarcel/// LeadingZeros can be used to simplify the calculation if the upper bits
130803Smarcel/// of the divided value are known zero.
130803SmarcelAPInt::mu APInt::magicu(unsigned LeadingZeros) const {
130803Smarcel  const APInt& d = *this;
130803Smarcel  unsigned p;
130803Smarcel  APInt nc, delta, q1, r1, q2, r2;
130803Smarcel  struct mu magu;
130803Smarcel  magu.a = 0;               // initialize "add" indicator
130803Smarcel  APInt allOnes = APInt::getAllOnesValue(d.getBitWidth()).lshr(LeadingZeros);
130803Smarcel  APInt signedMin = APInt::getSignedMinValue(d.getBitWidth());
130803Smarcel  APInt signedMax = APInt::getSignedMaxValue(d.getBitWidth());
130803Smarcel
130803Smarcel  nc = allOnes - (-d).urem(d);
130803Smarcel  p = d.getBitWidth() - 1;  // initialize p
130803Smarcel  q1 = signedMin.udiv(nc);  // initialize q1 = 2p/nc
130803Smarcel  r1 = signedMin - q1*nc;   // initialize r1 = rem(2p,nc)
130803Smarcel  q2 = signedMax.udiv(d);   // initialize q2 = (2p-1)/d
130803Smarcel  r2 = signedMax - q2*d;    // initialize r2 = rem((2p-1),d)
130803Smarcel  do {
130803Smarcel    p = p + 1;
130803Smarcel    if (r1.uge(nc - r1)) {
130803Smarcel      q1 = q1 + q1 + 1;  // update q1
130803Smarcel      r1 = r1 + r1 - nc; // update r1
130803Smarcel    }
130803Smarcel    else {
130803Smarcel      q1 = q1+q1; // update q1
130803Smarcel      r1 = r1+r1; // update r1
130803Smarcel    }
130803Smarcel    if ((r2 + 1).uge(d - r2)) {
130803Smarcel      if (q2.uge(signedMax)) magu.a = 1;
130803Smarcel      q2 = q2+q2 + 1;     // update q2
130803Smarcel      r2 = r2+r2 + 1 - d; // update r2
130803Smarcel    }
130803Smarcel    else {
130803Smarcel      if (q2.uge(signedMin)) magu.a = 1;
130803Smarcel      q2 = q2+q2;     // update q2
130803Smarcel      r2 = r2+r2 + 1; // update r2
130803Smarcel    }
130803Smarcel    delta = d - 1 - r2;
130803Smarcel  } while (p < d.getBitWidth()*2 &&
130803Smarcel           (q1.ult(delta) || (q1 == delta && r1 == 0)));
130803Smarcel  magu.m = q2 + 1; // resulting magic number
130803Smarcel  magu.s = p - d.getBitWidth();  // resulting shift
130803Smarcel  return magu;
130803Smarcel}
130803Smarcel
130803Smarcel/// Implementation of Knuth's Algorithm D (Division of nonnegative integers)
130803Smarcel/// from "Art of Computer Programming, Volume 2", section 4.3.1, p. 272. The
130803Smarcel/// variables here have the same names as in the algorithm. Comments explain
130803Smarcel/// the algorithm and any deviation from it.
130803Smarcelstatic void KnuthDiv(unsigned *u, unsigned *v, unsigned *q, unsigned* r,
130803Smarcel                     unsigned m, unsigned n) {
130803Smarcel  assert(u && "Must provide dividend");
130803Smarcel  assert(v && "Must provide divisor");
130803Smarcel  assert(q && "Must provide quotient");
130803Smarcel  assert(u != v && u != q && v != q && "Must us different memory");
130803Smarcel  assert(n>1 && "n must be > 1");
130803Smarcel
130803Smarcel  // Knuth uses the value b as the base of the number system. In our case b
130803Smarcel  // is 2^31 so we just set it to -1u.
130803Smarcel  uint64_t b = uint64_t(1) << 32;
130803Smarcel
130803Smarcel#if 0
130803Smarcel  DEBUG(dbgs() << "KnuthDiv: m=" << m << " n=" << n << '\n');
130803Smarcel  DEBUG(dbgs() << "KnuthDiv: original:");
130803Smarcel  DEBUG(for (int i = m+n; i >=0; i--) dbgs() << " " << u[i]);
130803Smarcel  DEBUG(dbgs() << " by");
130803Smarcel  DEBUG(for (int i = n; i >0; i--) dbgs() << " " << v[i-1]);
130803Smarcel  DEBUG(dbgs() << '\n');
130803Smarcel#endif
130803Smarcel  // D1. [Normalize.] Set d = b / (v[n-1] + 1) and multiply all the digits of
130803Smarcel  // u and v by d. Note that we have taken Knuth's advice here to use a power
130803Smarcel  // of 2 value for d such that d * v[n-1] >= b/2 (b is the base). A power of
130803Smarcel  // 2 allows us to shift instead of multiply and it is easy to determine the
130803Smarcel  // shift amount from the leading zeros.  We are basically normalizing the u
130803Smarcel  // and v so that its high bits are shifted to the top of v's range without
130803Smarcel  // overflow. Note that this can require an extra word in u so that u must
130803Smarcel  // be of length m+n+1.
130803Smarcel  unsigned shift = CountLeadingZeros_32(v[n-1]);
130803Smarcel  unsigned v_carry = 0;
130803Smarcel  unsigned u_carry = 0;
130803Smarcel  if (shift) {
130803Smarcel    for (unsigned i = 0; i < m+n; ++i) {
130803Smarcel      unsigned u_tmp = u[i] >> (32 - shift);
130803Smarcel      u[i] = (u[i] << shift) | u_carry;
130803Smarcel      u_carry = u_tmp;
130803Smarcel    }
130803Smarcel    for (unsigned i = 0; i < n; ++i) {
130803Smarcel      unsigned v_tmp = v[i] >> (32 - shift);
130803Smarcel      v[i] = (v[i] << shift) | v_carry;
130803Smarcel      v_carry = v_tmp;
130803Smarcel    }
130803Smarcel  }
130803Smarcel  u[m+n] = u_carry;
130803Smarcel#if 0
130803Smarcel  DEBUG(dbgs() << "KnuthDiv:   normal:");
130803Smarcel  DEBUG(for (int i = m+n; i >=0; i--) dbgs() << " " << u[i]);
130803Smarcel  DEBUG(dbgs() << " by");
130803Smarcel  DEBUG(for (int i = n; i >0; i--) dbgs() << " " << v[i-1]);
130803Smarcel  DEBUG(dbgs() << '\n');
130803Smarcel#endif
130803Smarcel
130803Smarcel  // D2. [Initialize j.]  Set j to m. This is the loop counter over the places.
130803Smarcel  int j = m;
130803Smarcel  do {
130803Smarcel    DEBUG(dbgs() << "KnuthDiv: quotient digit #" << j << '\n');
130803Smarcel    // D3. [Calculate q'.].
130803Smarcel    //     Set qp = (u[j+n]*b + u[j+n-1]) / v[n-1]. (qp=qprime=q')
130803Smarcel    //     Set rp = (u[j+n]*b + u[j+n-1]) % v[n-1]. (rp=rprime=r')
130803Smarcel    // Now test if qp == b or qp*v[n-2] > b*rp + u[j+n-2]; if so, decrease
130803Smarcel    // qp by 1, inrease rp by v[n-1], and repeat this test if rp < b. The test
130803Smarcel    // on v[n-2] determines at high speed most of the cases in which the trial
130803Smarcel    // value qp is one too large, and it eliminates all cases where qp is two
130803Smarcel    // too large.
130803Smarcel    uint64_t dividend = ((uint64_t(u[j+n]) << 32) + u[j+n-1]);
130803Smarcel    DEBUG(dbgs() << "KnuthDiv: dividend == " << dividend << '\n');
130803Smarcel    uint64_t qp = dividend / v[n-1];
130803Smarcel    uint64_t rp = dividend % v[n-1];
130803Smarcel    if (qp == b || qp*v[n-2] > b*rp + u[j+n-2]) {
130803Smarcel      qp--;
130803Smarcel      rp += v[n-1];
130803Smarcel      if (rp < b && (qp == b || qp*v[n-2] > b*rp + u[j+n-2]))
130803Smarcel        qp--;
130803Smarcel    }
130803Smarcel    DEBUG(dbgs() << "KnuthDiv: qp == " << qp << ", rp == " << rp << '\n');
130803Smarcel
130803Smarcel    // D4. [Multiply and subtract.] Replace (u[j+n]u[j+n-1]...u[j]) with
130803Smarcel    // (u[j+n]u[j+n-1]..u[j]) - qp * (v[n-1]...v[1]v[0]). This computation
130803Smarcel    // consists of a simple multiplication by a one-place number, combined with
130803Smarcel    // a subtraction.
130803Smarcel    bool isNeg = false;
130803Smarcel    for (unsigned i = 0; i < n; ++i) {
130803Smarcel      uint64_t u_tmp = uint64_t(u[j+i]) | (uint64_t(u[j+i+1]) << 32);
130803Smarcel      uint64_t subtrahend = uint64_t(qp) * uint64_t(v[i]);
130803Smarcel      bool borrow = subtrahend > u_tmp;
130803Smarcel      DEBUG(dbgs() << "KnuthDiv: u_tmp == " << u_tmp
130803Smarcel                   << ", subtrahend == " << subtrahend
130803Smarcel                   << ", borrow = " << borrow << '\n');
130803Smarcel
130803Smarcel      uint64_t result = u_tmp - subtrahend;
130803Smarcel      unsigned k = j + i;
130803Smarcel      u[k++] = (unsigned)(result & (b-1)); // subtract low word
130803Smarcel      u[k++] = (unsigned)(result >> 32);   // subtract high word
130803Smarcel      while (borrow && k <= m+n) { // deal with borrow to the left
130803Smarcel        borrow = u[k] == 0;
130803Smarcel        u[k]--;
130803Smarcel        k++;
130803Smarcel      }
130803Smarcel      isNeg |= borrow;
130803Smarcel      DEBUG(dbgs() << "KnuthDiv: u[j+i] == " << u[j+i] << ",  u[j+i+1] == " <<
130803Smarcel                    u[j+i+1] << '\n');
130803Smarcel    }
130803Smarcel    DEBUG(dbgs() << "KnuthDiv: after subtraction:");
130803Smarcel    DEBUG(for (int i = m+n; i >=0; i--) dbgs() << " " << u[i]);
130803Smarcel    DEBUG(dbgs() << '\n');
130803Smarcel    // The digits (u[j+n]...u[j]) should be kept positive; if the result of
130803Smarcel    // this step is actually negative, (u[j+n]...u[j]) should be left as the
130803Smarcel    // true value plus b**(n+1), namely as the b's complement of
130803Smarcel    // the true value, and a "borrow" to the left should be remembered.
130803Smarcel    //
130803Smarcel    if (isNeg) {
130803Smarcel      bool carry = true;  // true because b's complement is "complement + 1"
130803Smarcel      for (unsigned i = 0; i <= m+n; ++i) {
130803Smarcel        u[i] = ~u[i] + carry; // b's complement
130803Smarcel        carry = carry && u[i] == 0;
130803Smarcel      }
130803Smarcel    }
130803Smarcel    DEBUG(dbgs() << "KnuthDiv: after complement:");
130803Smarcel    DEBUG(for (int i = m+n; i >=0; i--) dbgs() << " " << u[i]);
130803Smarcel    DEBUG(dbgs() << '\n');
130803Smarcel
130803Smarcel    // D5. [Test remainder.] Set q[j] = qp. If the result of step D4 was
130803Smarcel    // negative, go to step D6; otherwise go on to step D7.
130803Smarcel    q[j] = (unsigned)qp;
130803Smarcel    if (isNeg) {
130803Smarcel      // D6. [Add back]. The probability that this step is necessary is very
130803Smarcel      // small, on the order of only 2/b. Make sure that test data accounts for
130803Smarcel      // this possibility. Decrease q[j] by 1
130803Smarcel      q[j]--;
130803Smarcel      // and add (0v[n-1]...v[1]v[0]) to (u[j+n]u[j+n-1]...u[j+1]u[j]).
130803Smarcel      // A carry will occur to the left of u[j+n], and it should be ignored
130803Smarcel      // since it cancels with the borrow that occurred in D4.
130803Smarcel      bool carry = false;
130803Smarcel      for (unsigned i = 0; i < n; i++) {
130803Smarcel        unsigned limit = std::min(u[j+i],v[i]);
130803Smarcel        u[j+i] += v[i] + carry;
130803Smarcel        carry = u[j+i] < limit || (carry && u[j+i] == limit);
130803Smarcel      }
130803Smarcel      u[j+n] += carry;
130803Smarcel    }
130803Smarcel    DEBUG(dbgs() << "KnuthDiv: after correction:");
130803Smarcel    DEBUG(for (int i = m+n; i >=0; i--) dbgs() <<" " << u[i]);
130803Smarcel    DEBUG(dbgs() << "\nKnuthDiv: digit result = " << q[j] << '\n');
130803Smarcel
130803Smarcel  // D7. [Loop on j.]  Decrease j by one. Now if j >= 0, go back to D3.
130803Smarcel  } while (--j >= 0);
130803Smarcel
130803Smarcel  DEBUG(dbgs() << "KnuthDiv: quotient:");
130803Smarcel  DEBUG(for (int i = m; i >=0; i--) dbgs() <<" " << q[i]);
130803Smarcel  DEBUG(dbgs() << '\n');
130803Smarcel
130803Smarcel  // D8. [Unnormalize]. Now q[...] is the desired quotient, and the desired
130803Smarcel  // remainder may be obtained by dividing u[...] by d. If r is non-null we
130803Smarcel  // compute the remainder (urem uses this).
130803Smarcel  if (r) {
130803Smarcel    // The value d is expressed by the "shift" value above since we avoided
130803Smarcel    // multiplication by d by using a shift left. So, all we have to do is
130803Smarcel    // shift right here. In order to mak
130803Smarcel    if (shift) {
130803Smarcel      unsigned carry = 0;
130803Smarcel      DEBUG(dbgs() << "KnuthDiv: remainder:");
130803Smarcel      for (int i = n-1; i >= 0; i--) {
130803Smarcel        r[i] = (u[i] >> shift) | carry;
130803Smarcel        carry = u[i] << (32 - shift);
130803Smarcel        DEBUG(dbgs() << " " << r[i]);
130803Smarcel      }
130803Smarcel    } else {
130803Smarcel      for (int i = n-1; i >= 0; i--) {
130803Smarcel        r[i] = u[i];
130803Smarcel        DEBUG(dbgs() << " " << r[i]);
130803Smarcel      }
130803Smarcel    }
130803Smarcel    DEBUG(dbgs() << '\n');
130803Smarcel  }
130803Smarcel#if 0
130803Smarcel  DEBUG(dbgs() << '\n');
130803Smarcel#endif
130803Smarcel}
130803Smarcel
130803Smarcelvoid APInt::divide(const APInt LHS, unsigned lhsWords,
130803Smarcel                   const APInt &RHS, unsigned rhsWords,
130803Smarcel                   APInt *Quotient, APInt *Remainder)
130803Smarcel{
130803Smarcel  assert(lhsWords >= rhsWords && "Fractional result");
130803Smarcel
130803Smarcel  // First, compose the values into an array of 32-bit words instead of
130803Smarcel  // 64-bit words. This is a necessity of both the "short division" algorithm
130803Smarcel  // and the Knuth "classical algorithm" which requires there to be native
130803Smarcel  // operations for +, -, and * on an m bit value with an m*2 bit result. We
130803Smarcel  // can't use 64-bit operands here because we don't have native results of
130803Smarcel  // 128-bits. Furthermore, casting the 64-bit values to 32-bit values won't
130803Smarcel  // work on large-endian machines.
130803Smarcel  uint64_t mask = ~0ull >> (sizeof(unsigned)*CHAR_BIT);
130803Smarcel  unsigned n = rhsWords * 2;
130803Smarcel  unsigned m = (lhsWords * 2) - n;
130803Smarcel
130803Smarcel  // Allocate space for the temporary values we need either on the stack, if
130803Smarcel  // it will fit, or on the heap if it won't.
130803Smarcel  unsigned SPACE[128];
130803Smarcel  unsigned *U = 0;
130803Smarcel  unsigned *V = 0;
130803Smarcel  unsigned *Q = 0;
130803Smarcel  unsigned *R = 0;
130803Smarcel  if ((Remainder?4:3)*n+2*m+1 <= 128) {
130803Smarcel    U = &SPACE[0];
130803Smarcel    V = &SPACE[m+n+1];
130803Smarcel    Q = &SPACE[(m+n+1) + n];
130803Smarcel    if (Remainder)
130803Smarcel      R = &SPACE[(m+n+1) + n + (m+n)];
130803Smarcel  } else {
130803Smarcel    U = new unsigned[m + n + 1];
130803Smarcel    V = new unsigned[n];
130803Smarcel    Q = new unsigned[m+n];
130803Smarcel    if (Remainder)
130803Smarcel      R = new unsigned[n];
130803Smarcel  }
130803Smarcel
130803Smarcel  // Initialize the dividend
130803Smarcel  memset(U, 0, (m+n+1)*sizeof(unsigned));
130803Smarcel  for (unsigned i = 0; i < lhsWords; ++i) {
130803Smarcel    uint64_t tmp = (LHS.getNumWords() == 1 ? LHS.VAL : LHS.pVal[i]);
130803Smarcel    U[i * 2] = (unsigned)(tmp & mask);
130803Smarcel    U[i * 2 + 1] = (unsigned)(tmp >> (sizeof(unsigned)*CHAR_BIT));
130803Smarcel  }
130803Smarcel  U[m+n] = 0; // this extra word is for "spill" in the Knuth algorithm.
130803Smarcel
130803Smarcel  // Initialize the divisor
130803Smarcel  memset(V, 0, (n)*sizeof(unsigned));
130803Smarcel  for (unsigned i = 0; i < rhsWords; ++i) {
130803Smarcel    uint64_t tmp = (RHS.getNumWords() == 1 ? RHS.VAL : RHS.pVal[i]);
130803Smarcel    V[i * 2] = (unsigned)(tmp & mask);
130803Smarcel    V[i * 2 + 1] = (unsigned)(tmp >> (sizeof(unsigned)*CHAR_BIT));
130803Smarcel  }
130803Smarcel
130803Smarcel  // initialize the quotient and remainder
130803Smarcel  memset(Q, 0, (m+n) * sizeof(unsigned));
130803Smarcel  if (Remainder)
130803Smarcel    memset(R, 0, n * sizeof(unsigned));
130803Smarcel
130803Smarcel  // Now, adjust m and n for the Knuth division. n is the number of words in
130803Smarcel  // the divisor. m is the number of words by which the dividend exceeds the
130803Smarcel  // divisor (i.e. m+n is the length of the dividend). These sizes must not
130803Smarcel  // contain any zero words or the Knuth algorithm fails.
130803Smarcel  for (unsigned i = n; i > 0 && V[i-1] == 0; i--) {
130803Smarcel    n--;
130803Smarcel    m++;
130803Smarcel  }
130803Smarcel  for (unsigned i = m+n; i > 0 && U[i-1] == 0; i--)
130803Smarcel    m--;
130803Smarcel
130803Smarcel  // If we're left with only a single word for the divisor, Knuth doesn't work
130803Smarcel  // so we implement the short division algorithm here. This is much simpler
130803Smarcel  // and faster because we are certain that we can divide a 64-bit quantity
130803Smarcel  // by a 32-bit quantity at hardware speed and short division is simply a
130803Smarcel  // series of such operations. This is just like doing short division but we
130803Smarcel  // are using base 2^32 instead of base 10.
130803Smarcel  assert(n != 0 && "Divide by zero?");
130803Smarcel  if (n == 1) {
130803Smarcel    unsigned divisor = V[0];
130803Smarcel    unsigned remainder = 0;
130803Smarcel    for (int i = m+n-1; i >= 0; i--) {
130803Smarcel      uint64_t partial_dividend = uint64_t(remainder) << 32 | U[i];
130803Smarcel      if (partial_dividend == 0) {
130803Smarcel        Q[i] = 0;
130803Smarcel        remainder = 0;
130803Smarcel      } else if (partial_dividend < divisor) {
130803Smarcel        Q[i] = 0;
130803Smarcel        remainder = (unsigned)partial_dividend;
130803Smarcel      } else if (partial_dividend == divisor) {
130803Smarcel        Q[i] = 1;
130803Smarcel        remainder = 0;
130803Smarcel      } else {
130803Smarcel        Q[i] = (unsigned)(partial_dividend / divisor);
130803Smarcel        remainder = (unsigned)(partial_dividend - (Q[i] * divisor));
130803Smarcel      }
130803Smarcel    }
130803Smarcel    if (R)
130803Smarcel      R[0] = remainder;
130803Smarcel  } else {
130803Smarcel    // Now we're ready to invoke the Knuth classical divide algorithm. In this
130803Smarcel    // case n > 1.
130803Smarcel    KnuthDiv(U, V, Q, R, m, n);
130803Smarcel  }
130803Smarcel
130803Smarcel  // If the caller wants the quotient
130803Smarcel  if (Quotient) {
130803Smarcel    // Set up the Quotient value's memory.
130803Smarcel    if (Quotient->BitWidth != LHS.BitWidth) {
130803Smarcel      if (Quotient->isSingleWord())
130803Smarcel        Quotient->VAL = 0;
130803Smarcel      else
130803Smarcel        delete [] Quotient->pVal;
130803Smarcel      Quotient->BitWidth = LHS.BitWidth;
130803Smarcel      if (!Quotient->isSingleWord())
130803Smarcel        Quotient->pVal = getClearedMemory(Quotient->getNumWords());
130803Smarcel    } else
130803Smarcel      Quotient->clearAllBits();
130803Smarcel
130803Smarcel    // The quotient is in Q. Reconstitute the quotient into Quotient's low
130803Smarcel    // order words.
130803Smarcel    if (lhsWords == 1) {
130803Smarcel      uint64_t tmp =
130803Smarcel        uint64_t(Q[0]) | (uint64_t(Q[1]) << (APINT_BITS_PER_WORD / 2));
130803Smarcel      if (Quotient->isSingleWord())
130803Smarcel        Quotient->VAL = tmp;
130803Smarcel      else
130803Smarcel        Quotient->pVal[0] = tmp;
130803Smarcel    } else {
130803Smarcel      assert(!Quotient->isSingleWord() && "Quotient APInt not large enough");
130803Smarcel      for (unsigned i = 0; i < lhsWords; ++i)
130803Smarcel        Quotient->pVal[i] =
130803Smarcel          uint64_t(Q[i*2]) | (uint64_t(Q[i*2+1]) << (APINT_BITS_PER_WORD / 2));
130803Smarcel    }
130803Smarcel  }
130803Smarcel
130803Smarcel  // If the caller wants the remainder
130803Smarcel  if (Remainder) {
130803Smarcel    // Set up the Remainder value's memory.
130803Smarcel    if (Remainder->BitWidth != RHS.BitWidth) {
130803Smarcel      if (Remainder->isSingleWord())
130803Smarcel        Remainder->VAL = 0;
130803Smarcel      else
130803Smarcel        delete [] Remainder->pVal;
130803Smarcel      Remainder->BitWidth = RHS.BitWidth;
130803Smarcel      if (!Remainder->isSingleWord())
130803Smarcel        Remainder->pVal = getClearedMemory(Remainder->getNumWords());
130803Smarcel    } else
130803Smarcel      Remainder->clearAllBits();
130803Smarcel
130803Smarcel    // The remainder is in R. Reconstitute the remainder into Remainder's low
130803Smarcel    // order words.
130803Smarcel    if (rhsWords == 1) {
130803Smarcel      uint64_t tmp =
130803Smarcel        uint64_t(R[0]) | (uint64_t(R[1]) << (APINT_BITS_PER_WORD / 2));
130803Smarcel      if (Remainder->isSingleWord())
130803Smarcel        Remainder->VAL = tmp;
130803Smarcel      else
130803Smarcel        Remainder->pVal[0] = tmp;
130803Smarcel    } else {
130803Smarcel      assert(!Remainder->isSingleWord() && "Remainder APInt not large enough");
130803Smarcel      for (unsigned i = 0; i < rhsWords; ++i)
130803Smarcel        Remainder->pVal[i] =
130803Smarcel          uint64_t(R[i*2]) | (uint64_t(R[i*2+1]) << (APINT_BITS_PER_WORD / 2));
130803Smarcel    }
130803Smarcel  }
130803Smarcel
130803Smarcel  // Clean up the memory we allocated.
130803Smarcel  if (U != &SPACE[0]) {
130803Smarcel    delete [] U;
130803Smarcel    delete [] V;
130803Smarcel    delete [] Q;
130803Smarcel    delete [] R;
130803Smarcel  }
130803Smarcel}
130803Smarcel
130803SmarcelAPInt APInt::udiv(const APInt& RHS) const {
130803Smarcel  assert(BitWidth == RHS.BitWidth && "Bit widths must be the same");
130803Smarcel
130803Smarcel  // First, deal with the easy case
130803Smarcel  if (isSingleWord()) {
130803Smarcel    assert(RHS.VAL != 0 && "Divide by zero?");
130803Smarcel    return APInt(BitWidth, VAL / RHS.VAL);
130803Smarcel  }
130803Smarcel
130803Smarcel  // Get some facts about the LHS and RHS number of bits and words
130803Smarcel  unsigned rhsBits = RHS.getActiveBits();
130803Smarcel  unsigned rhsWords = !rhsBits ? 0 : (APInt::whichWord(rhsBits - 1) + 1);
130803Smarcel  assert(rhsWords && "Divided by zero???");
130803Smarcel  unsigned lhsBits = this->getActiveBits();
130803Smarcel  unsigned lhsWords = !lhsBits ? 0 : (APInt::whichWord(lhsBits - 1) + 1);
130803Smarcel
130803Smarcel  // Deal with some degenerate cases
130803Smarcel  if (!lhsWords)
130803Smarcel    // 0 / X ===> 0
130803Smarcel    return APInt(BitWidth, 0);
130803Smarcel  else if (lhsWords < rhsWords || this->ult(RHS)) {
130803Smarcel    // X / Y ===> 0, iff X < Y
130803Smarcel    return APInt(BitWidth, 0);
130803Smarcel  } else if (*this == RHS) {
130803Smarcel    // X / X ===> 1
130803Smarcel    return APInt(BitWidth, 1);
130803Smarcel  } else if (lhsWords == 1 && rhsWords == 1) {
130803Smarcel    // All high words are zero, just use native divide
130803Smarcel    return APInt(BitWidth, this->pVal[0] / RHS.pVal[0]);
130803Smarcel  }
130803Smarcel
130803Smarcel  // We have to compute it the hard way. Invoke the Knuth divide algorithm.
130803Smarcel  APInt Quotient(1,0); // to hold result.
130803Smarcel  divide(*this, lhsWords, RHS, rhsWords, &Quotient, 0);
130803Smarcel  return Quotient;
130803Smarcel}
130803Smarcel
130803SmarcelAPInt APInt::urem(const APInt& RHS) const {
130803Smarcel  assert(BitWidth == RHS.BitWidth && "Bit widths must be the same");
130803Smarcel  if (isSingleWord()) {
130803Smarcel    assert(RHS.VAL != 0 && "Remainder by zero?");
130803Smarcel    return APInt(BitWidth, VAL % RHS.VAL);
130803Smarcel  }
130803Smarcel
130803Smarcel  // Get some facts about the LHS
130803Smarcel  unsigned lhsBits = getActiveBits();
130803Smarcel  unsigned lhsWords = !lhsBits ? 0 : (whichWord(lhsBits - 1) + 1);
130803Smarcel
130803Smarcel  // Get some facts about the RHS
130803Smarcel  unsigned rhsBits = RHS.getActiveBits();
130803Smarcel  unsigned rhsWords = !rhsBits ? 0 : (APInt::whichWord(rhsBits - 1) + 1);
130803Smarcel  assert(rhsWords && "Performing remainder operation by zero ???");
130803Smarcel
130803Smarcel  // Check the degenerate cases
130803Smarcel  if (lhsWords == 0) {
130803Smarcel    // 0 % Y ===> 0
130803Smarcel    return APInt(BitWidth, 0);
130803Smarcel  } else if (lhsWords < rhsWords || this->ult(RHS)) {
130803Smarcel    // X % Y ===> X, iff X < Y
130803Smarcel    return *this;
130803Smarcel  } else if (*this == RHS) {
130803Smarcel    // X % X == 0;
130803Smarcel    return APInt(BitWidth, 0);
130803Smarcel  } else if (lhsWords == 1) {
130803Smarcel    // All high words are zero, just use native remainder
130803Smarcel    return APInt(BitWidth, pVal[0] % RHS.pVal[0]);
130803Smarcel  }
130803Smarcel
130803Smarcel  // We have to compute it the hard way. Invoke the Knuth divide algorithm.
130803Smarcel  APInt Remainder(1,0);
130803Smarcel  divide(*this, lhsWords, RHS, rhsWords, 0, &Remainder);
130803Smarcel  return Remainder;
130803Smarcel}
130803Smarcel
130803Smarcelvoid APInt::udivrem(const APInt &LHS, const APInt &RHS,
130803Smarcel                    APInt &Quotient, APInt &Remainder) {
130803Smarcel  // Get some size facts about the dividend and divisor
130803Smarcel  unsigned lhsBits  = LHS.getActiveBits();
130803Smarcel  unsigned lhsWords = !lhsBits ? 0 : (APInt::whichWord(lhsBits - 1) + 1);
130803Smarcel  unsigned rhsBits  = RHS.getActiveBits();
130803Smarcel  unsigned rhsWords = !rhsBits ? 0 : (APInt::whichWord(rhsBits - 1) + 1);
130803Smarcel
130803Smarcel  // Check the degenerate cases
130803Smarcel  if (lhsWords == 0) {
130803Smarcel    Quotient = 0;                // 0 / Y ===> 0
130803Smarcel    Remainder = 0;               // 0 % Y ===> 0
130803Smarcel    return;
130803Smarcel  }
130803Smarcel
130803Smarcel  if (lhsWords < rhsWords || LHS.ult(RHS)) {
130803Smarcel    Remainder = LHS;            // X % Y ===> X, iff X < Y
130803Smarcel    Quotient = 0;               // X / Y ===> 0, iff X < Y
130803Smarcel    return;
130803Smarcel  }
130803Smarcel
130803Smarcel  if (LHS == RHS) {
130803Smarcel    Quotient  = 1;              // X / X ===> 1
130803Smarcel    Remainder = 0;              // X % X ===> 0;
130803Smarcel    return;
130803Smarcel  }
130803Smarcel
130803Smarcel  if (lhsWords == 1 && rhsWords == 1) {
130803Smarcel    // There is only one word to consider so use the native versions.
130803Smarcel    uint64_t lhsValue = LHS.isSingleWord() ? LHS.VAL : LHS.pVal[0];
130803Smarcel    uint64_t rhsValue = RHS.isSingleWord() ? RHS.VAL : RHS.pVal[0];
130803Smarcel    Quotient = APInt(LHS.getBitWidth(), lhsValue / rhsValue);
130803Smarcel    Remainder = APInt(LHS.getBitWidth(), lhsValue % rhsValue);
130803Smarcel    return;
130803Smarcel  }
130803Smarcel
130803Smarcel  // Okay, lets do it the long way
130803Smarcel  divide(LHS, lhsWords, RHS, rhsWords, &Quotient, &Remainder);
130803Smarcel}
130803Smarcel
130803SmarcelAPInt APInt::sadd_ov(const APInt &RHS, bool &Overflow) const {
130803Smarcel  APInt Res = *this+RHS;
130803Smarcel  Overflow = isNonNegative() == RHS.isNonNegative() &&
130803Smarcel             Res.isNonNegative() != isNonNegative();
130803Smarcel  return Res;
130803Smarcel}
130803Smarcel
130803SmarcelAPInt APInt::uadd_ov(const APInt &RHS, bool &Overflow) const {
130803Smarcel  APInt Res = *this+RHS;
130803Smarcel  Overflow = Res.ult(RHS);
130803Smarcel  return Res;
130803Smarcel}
130803Smarcel
130803SmarcelAPInt APInt::ssub_ov(const APInt &RHS, bool &Overflow) const {
130803Smarcel  APInt Res = *this - RHS;
130803Smarcel  Overflow = isNonNegative() != RHS.isNonNegative() &&
130803Smarcel             Res.isNonNegative() != isNonNegative();
130803Smarcel  return Res;
130803Smarcel}
130803Smarcel
130803SmarcelAPInt APInt::usub_ov(const APInt &RHS, bool &Overflow) const {
130803Smarcel  APInt Res = *this-RHS;
130803Smarcel  Overflow = Res.ugt(*this);
130803Smarcel  return Res;
130803Smarcel}
130803Smarcel
130803SmarcelAPInt APInt::sdiv_ov(const APInt &RHS, bool &Overflow) const {
130803Smarcel  // MININT/-1  -->  overflow.
130803Smarcel  Overflow = isMinSignedValue() && RHS.isAllOnesValue();
130803Smarcel  return sdiv(RHS);
130803Smarcel}
130803Smarcel
130803SmarcelAPInt APInt::smul_ov(const APInt &RHS, bool &Overflow) const {
130803Smarcel  APInt Res = *this * RHS;
130803Smarcel
130803Smarcel  if (*this != 0 && RHS != 0)
130803Smarcel    Overflow = Res.sdiv(RHS) != *this || Res.sdiv(*this) != RHS;
130803Smarcel  else
130803Smarcel    Overflow = false;
130803Smarcel  return Res;
130803Smarcel}
130803Smarcel
130803SmarcelAPInt APInt::umul_ov(const APInt &RHS, bool &Overflow) const {
130803Smarcel  APInt Res = *this * RHS;
130803Smarcel
130803Smarcel  if (*this != 0 && RHS != 0)
130803Smarcel    Overflow = Res.udiv(RHS) != *this || Res.udiv(*this) != RHS;
130803Smarcel  else
130803Smarcel    Overflow = false;
130803Smarcel  return Res;
130803Smarcel}
130803Smarcel
130803SmarcelAPInt APInt::sshl_ov(unsigned ShAmt, bool &Overflow) const {
130803Smarcel  Overflow = ShAmt >= getBitWidth();
130803Smarcel  if (Overflow)
130803Smarcel    ShAmt = getBitWidth()-1;
130803Smarcel
130803Smarcel  if (isNonNegative()) // Don't allow sign change.
130803Smarcel    Overflow = ShAmt >= countLeadingZeros();
130803Smarcel  else
130803Smarcel    Overflow = ShAmt >= countLeadingOnes();
130803Smarcel
130803Smarcel  return *this << ShAmt;
130803Smarcel}
130803Smarcel
130803Smarcel
130803Smarcel
130803Smarcel
130803Smarcelvoid APInt::fromString(unsigned numbits, StringRef str, uint8_t radix) {
130803Smarcel  // Check our assumptions here
130803Smarcel  assert(!str.empty() && "Invalid string length");
130803Smarcel  assert((radix == 10 || radix == 8 || radix == 16 || radix == 2 ||
130803Smarcel          radix == 36) &&
130803Smarcel         "Radix should be 2, 8, 10, 16, or 36!");
130803Smarcel
130803Smarcel  StringRef::iterator p = str.begin();
130803Smarcel  size_t slen = str.size();
130803Smarcel  bool isNeg = *p == '-';
130803Smarcel  if (*p == '-' || *p == '+') {
130803Smarcel    p++;
130803Smarcel    slen--;
130803Smarcel    assert(slen && "String is only a sign, needs a value.");
130803Smarcel  }
130803Smarcel  assert((slen <= numbits || radix != 2) && "Insufficient bit width");
130803Smarcel  assert(((slen-1)*3 <= numbits || radix != 8) && "Insufficient bit width");
130803Smarcel  assert(((slen-1)*4 <= numbits || radix != 16) && "Insufficient bit width");
130803Smarcel  assert((((slen-1)*64)/22 <= numbits || radix != 10) &&
130803Smarcel         "Insufficient bit width");
130803Smarcel
130803Smarcel  // Allocate memory
130803Smarcel  if (!isSingleWord())
130803Smarcel    pVal = getClearedMemory(getNumWords());
130803Smarcel
130803Smarcel  // Figure out if we can shift instead of multiply
130803Smarcel  unsigned shift = (radix == 16 ? 4 : radix == 8 ? 3 : radix == 2 ? 1 : 0);
130803Smarcel
130803Smarcel  // Set up an APInt for the digit to add outside the loop so we don't
130803Smarcel  // constantly construct/destruct it.
130803Smarcel  APInt apdigit(getBitWidth(), 0);
130803Smarcel  APInt apradix(getBitWidth(), radix);
130803Smarcel
130803Smarcel  // Enter digit traversal loop
130803Smarcel  for (StringRef::iterator e = str.end(); p != e; ++p) {
130803Smarcel    unsigned digit = getDigit(*p, radix);
130803Smarcel    assert(digit < radix && "Invalid character in digit string");
130803Smarcel
130803Smarcel    // Shift or multiply the value by the radix
130803Smarcel    if (slen > 1) {
130803Smarcel      if (shift)
130803Smarcel        *this <<= shift;
130803Smarcel      else
130803Smarcel        *this *= apradix;
130803Smarcel    }
130803Smarcel
130803Smarcel    // Add in the digit we just interpreted
130803Smarcel    if (apdigit.isSingleWord())
130803Smarcel      apdigit.VAL = digit;
130803Smarcel    else
130803Smarcel      apdigit.pVal[0] = digit;
130803Smarcel    *this += apdigit;
130803Smarcel  }
130803Smarcel  // If its negative, put it in two's complement form
130803Smarcel  if (isNeg) {
130803Smarcel    (*this)--;
130803Smarcel    this->flipAllBits();
130803Smarcel  }
130803Smarcel}
130803Smarcel
130803Smarcelvoid APInt::toString(SmallVectorImpl<char> &Str, unsigned Radix,
130803Smarcel                     bool Signed, bool formatAsCLiteral) const {
130803Smarcel  assert((Radix == 10 || Radix == 8 || Radix == 16 || Radix == 2 ||
130803Smarcel          Radix == 36) &&
130803Smarcel         "Radix should be 2, 8, 10, or 16!");
130803Smarcel
130803Smarcel  const char *Prefix = "";
130803Smarcel  if (formatAsCLiteral) {
130803Smarcel    switch (Radix) {
130803Smarcel      case 2:
130803Smarcel        // Binary literals are a non-standard extension added in gcc 4.3:
130803Smarcel        // http://gcc.gnu.org/onlinedocs/gcc-4.3.0/gcc/Binary-constants.html
130803Smarcel        Prefix = "0b";
130803Smarcel        break;
130803Smarcel      case 8:
130803Smarcel        Prefix = "0";
130803Smarcel        break;
130803Smarcel      case 16:
130803Smarcel        Prefix = "0x";
130803Smarcel        break;
130803Smarcel    }
130803Smarcel  }
130803Smarcel
130803Smarcel  // First, check for a zero value and just short circuit the logic below.
130803Smarcel  if (*this == 0) {
130803Smarcel    while (*Prefix) {
130803Smarcel      Str.push_back(*Prefix);
130803Smarcel      ++Prefix;
130803Smarcel    };
130803Smarcel    Str.push_back('0');
130803Smarcel    return;
130803Smarcel  }
130803Smarcel
130803Smarcel  static const char Digits[] = "0123456789ABCDEFGHIJKLMNOPQRSTUVWXYZ";
130803Smarcel
130803Smarcel  if (isSingleWord()) {
130803Smarcel    char Buffer[65];
130803Smarcel    char *BufPtr = Buffer+65;
130803Smarcel
130803Smarcel    uint64_t N;
130803Smarcel    if (!Signed) {
130803Smarcel      N = getZExtValue();
130803Smarcel    } else {
130803Smarcel      int64_t I = getSExtValue();
130803Smarcel      if (I >= 0) {
130803Smarcel        N = I;
130803Smarcel      } else {
130803Smarcel        Str.push_back('-');
130803Smarcel        N = -(uint64_t)I;
130803Smarcel      }
130803Smarcel    }
130803Smarcel
130803Smarcel    while (*Prefix) {
130803Smarcel      Str.push_back(*Prefix);
130803Smarcel      ++Prefix;
130803Smarcel    };
130803Smarcel
130803Smarcel    while (N) {
130803Smarcel      *--BufPtr = Digits[N % Radix];
130803Smarcel      N /= Radix;
130803Smarcel    }
130803Smarcel    Str.append(BufPtr, Buffer+65);
130803Smarcel    return;
130803Smarcel  }
130803Smarcel
130803Smarcel  APInt Tmp(*this);
130803Smarcel
130803Smarcel  if (Signed && isNegative()) {
130803Smarcel    // They want to print the signed version and it is a negative value
130803Smarcel    // Flip the bits and add one to turn it into the equivalent positive
130803Smarcel    // value and put a '-' in the result.
130803Smarcel    Tmp.flipAllBits();
130803Smarcel    Tmp++;
130803Smarcel    Str.push_back('-');
130803Smarcel  }
130803Smarcel
130803Smarcel  while (*Prefix) {
130803Smarcel    Str.push_back(*Prefix);
130803Smarcel    ++Prefix;
130803Smarcel  };
130803Smarcel
130803Smarcel  // We insert the digits backward, then reverse them to get the right order.
130803Smarcel  unsigned StartDig = Str.size();
130803Smarcel
130803Smarcel  // For the 2, 8 and 16 bit cases, we can just shift instead of divide
130803Smarcel  // because the number of bits per digit (1, 3 and 4 respectively) divides
130803Smarcel  // equaly.  We just shift until the value is zero.
130803Smarcel  if (Radix == 2 || Radix == 8 || Radix == 16) {
130803Smarcel    // Just shift tmp right for each digit width until it becomes zero
130803Smarcel    unsigned ShiftAmt = (Radix == 16 ? 4 : (Radix == 8 ? 3 : 1));
130803Smarcel    unsigned MaskAmt = Radix - 1;
130803Smarcel
130803Smarcel    while (Tmp != 0) {
130803Smarcel      unsigned Digit = unsigned(Tmp.getRawData()[0]) & MaskAmt;
130803Smarcel      Str.push_back(Digits[Digit]);
130803Smarcel      Tmp = Tmp.lshr(ShiftAmt);
130803Smarcel    }
130803Smarcel  } else {
130803Smarcel    APInt divisor(Radix == 10? 4 : 8, Radix);
130803Smarcel    while (Tmp != 0) {
130803Smarcel      APInt APdigit(1, 0);
130803Smarcel      APInt tmp2(Tmp.getBitWidth(), 0);
130803Smarcel      divide(Tmp, Tmp.getNumWords(), divisor, divisor.getNumWords(), &tmp2,
130803Smarcel             &APdigit);
130803Smarcel      unsigned Digit = (unsigned)APdigit.getZExtValue();
130803Smarcel      assert(Digit < Radix && "divide failed");
130803Smarcel      Str.push_back(Digits[Digit]);
130803Smarcel      Tmp = tmp2;
130803Smarcel    }
130803Smarcel  }
130803Smarcel
130803Smarcel  // Reverse the digits before returning.
130803Smarcel  std::reverse(Str.begin()+StartDig, Str.end());
130803Smarcel}
130803Smarcel
130803Smarcel/// toString - This returns the APInt as a std::string.  Note that this is an
130803Smarcel/// inefficient method.  It is better to pass in a SmallVector/SmallString
130803Smarcel/// to the methods above.
130803Smarcelstd::string APInt::toString(unsigned Radix = 10, bool Signed = true) const {
130803Smarcel  SmallString<40> S;
130803Smarcel  toString(S, Radix, Signed, /* formatAsCLiteral = */false);
130803Smarcel  return S.str();
130803Smarcel}
130803Smarcel
130803Smarcel
130803Smarcelvoid APInt::dump() const {
130803Smarcel  SmallString<40> S, U;
130803Smarcel  this->toStringUnsigned(U);
130803Smarcel  this->toStringSigned(S);
130803Smarcel  dbgs() << "APInt(" << BitWidth << "b, "
130803Smarcel         << U.str() << "u " << S.str() << "s)";
130803Smarcel}
130803Smarcel
130803Smarcelvoid APInt::print(raw_ostream &OS, bool isSigned) const {
130803Smarcel  SmallString<40> S;
130803Smarcel  this->toString(S, 10, isSigned, /* formatAsCLiteral = */false);
130803Smarcel  OS << S.str();
130803Smarcel}
130803Smarcel
130803Smarcel// This implements a variety of operations on a representation of
130803Smarcel// arbitrary precision, two's-complement, bignum integer values.
130803Smarcel
130803Smarcel// Assumed by lowHalf, highHalf, partMSB and partLSB.  A fairly safe
130803Smarcel// and unrestricting assumption.
130803Smarcel#define COMPILE_TIME_ASSERT(cond) extern int CTAssert[(cond) ? 1 : -1]
130803SmarcelCOMPILE_TIME_ASSERT(integerPartWidth % 2 == 0);
130803Smarcel
130803Smarcel/* Some handy functions local to this file.  */
130803Smarcelnamespace {
130803Smarcel
130803Smarcel  /* Returns the integer part with the least significant BITS set.
130803Smarcel     BITS cannot be zero.  */
130803Smarcel  static inline integerPart
130803Smarcel  lowBitMask(unsigned int bits)
130803Smarcel  {
130803Smarcel    assert(bits != 0 && bits <= integerPartWidth);
130803Smarcel
130803Smarcel    return ~(integerPart) 0 >> (integerPartWidth - bits);
130803Smarcel  }
130803Smarcel
130803Smarcel  /* Returns the value of the lower half of PART.  */
130803Smarcel  static inline integerPart
130803Smarcel  lowHalf(integerPart part)
130803Smarcel  {
130803Smarcel    return part & lowBitMask(integerPartWidth / 2);
130803Smarcel  }
130803Smarcel
130803Smarcel  /* Returns the value of the upper half of PART.  */
130803Smarcel  static inline integerPart
130803Smarcel  highHalf(integerPart part)
130803Smarcel  {
130803Smarcel    return part >> (integerPartWidth / 2);
130803Smarcel  }
130803Smarcel
130803Smarcel  /* Returns the bit number of the most significant set bit of a part.
130803Smarcel     If the input number has no bits set -1U is returned.  */
130803Smarcel  static unsigned int
130803Smarcel  partMSB(integerPart value)
130803Smarcel  {
130803Smarcel    unsigned int n, msb;
130803Smarcel
130803Smarcel    if (value == 0)
130803Smarcel      return -1U;
130803Smarcel
130803Smarcel    n = integerPartWidth / 2;
130803Smarcel
130803Smarcel    msb = 0;
130803Smarcel    do {
130803Smarcel      if (value >> n) {
130803Smarcel        value >>= n;
130803Smarcel        msb += n;
130803Smarcel      }
130803Smarcel
130803Smarcel      n >>= 1;
130803Smarcel    } while (n);
130803Smarcel
130803Smarcel    return msb;
130803Smarcel  }
130803Smarcel
130803Smarcel  /* Returns the bit number of the least significant set bit of a
130803Smarcel     part.  If the input number has no bits set -1U is returned.  */
130803Smarcel  static unsigned int
130803Smarcel  partLSB(integerPart value)
130803Smarcel  {
130803Smarcel    unsigned int n, lsb;
130803Smarcel
130803Smarcel    if (value == 0)
130803Smarcel      return -1U;
130803Smarcel
130803Smarcel    lsb = integerPartWidth - 1;
130803Smarcel    n = integerPartWidth / 2;
130803Smarcel
130803Smarcel    do {
130803Smarcel      if (value << n) {
130803Smarcel        value <<= n;
130803Smarcel        lsb -= n;
130803Smarcel      }
130803Smarcel
130803Smarcel      n >>= 1;
130803Smarcel    } while (n);
130803Smarcel
130803Smarcel    return lsb;
130803Smarcel  }
130803Smarcel}
130803Smarcel
130803Smarcel/* Sets the least significant part of a bignum to the input value, and
130803Smarcel   zeroes out higher parts.  */
130803Smarcelvoid
130803SmarcelAPInt::tcSet(integerPart *dst, integerPart part, unsigned int parts)
130803Smarcel{
130803Smarcel  unsigned int i;
130803Smarcel
130803Smarcel  assert(parts > 0);
130803Smarcel
130803Smarcel  dst[0] = part;
130803Smarcel  for (i = 1; i < parts; i++)
130803Smarcel    dst[i] = 0;
130803Smarcel}
130803Smarcel
130803Smarcel/* Assign one bignum to another.  */
130803Smarcelvoid
130803SmarcelAPInt::tcAssign(integerPart *dst, const integerPart *src, unsigned int parts)
130803Smarcel{
130803Smarcel  unsigned int i;
130803Smarcel
130803Smarcel  for (i = 0; i < parts; i++)
130803Smarcel    dst[i] = src[i];
130803Smarcel}
130803Smarcel
130803Smarcel/* Returns true if a bignum is zero, false otherwise.  */
130803Smarcelbool
130803SmarcelAPInt::tcIsZero(const integerPart *src, unsigned int parts)
130803Smarcel{
130803Smarcel  unsigned int i;
130803Smarcel
130803Smarcel  for (i = 0; i < parts; i++)
130803Smarcel    if (src[i])
130803Smarcel      return false;
130803Smarcel
130803Smarcel  return true;
130803Smarcel}
130803Smarcel
130803Smarcel/* Extract the given bit of a bignum; returns 0 or 1.  */
130803Smarcelint
130803SmarcelAPInt::tcExtractBit(const integerPart *parts, unsigned int bit)
130803Smarcel{
130803Smarcel  return (parts[bit / integerPartWidth] &
130803Smarcel          ((integerPart) 1 << bit % integerPartWidth)) != 0;
130803Smarcel}
130803Smarcel
130803Smarcel/* Set the given bit of a bignum. */
130803Smarcelvoid
130803SmarcelAPInt::tcSetBit(integerPart *parts, unsigned int bit)
130803Smarcel{
130803Smarcel  parts[bit / integerPartWidth] |= (integerPart) 1 << (bit % integerPartWidth);
130803Smarcel}
130803Smarcel
130803Smarcel/* Clears the given bit of a bignum. */
130803Smarcelvoid
130803SmarcelAPInt::tcClearBit(integerPart *parts, unsigned int bit)
130803Smarcel{
130803Smarcel  parts[bit / integerPartWidth] &=
130803Smarcel    ~((integerPart) 1 << (bit % integerPartWidth));
130803Smarcel}
130803Smarcel
130803Smarcel/* Returns the bit number of the least significant set bit of a
130803Smarcel   number.  If the input number has no bits set -1U is returned.  */
130803Smarcelunsigned int
130803SmarcelAPInt::tcLSB(const integerPart *parts, unsigned int n)
130803Smarcel{
130803Smarcel  unsigned int i, lsb;
130803Smarcel
130803Smarcel  for (i = 0; i < n; i++) {
130803Smarcel      if (parts[i] != 0) {
130803Smarcel          lsb = partLSB(parts[i]);
130803Smarcel
130803Smarcel          return lsb + i * integerPartWidth;
130803Smarcel      }
130803Smarcel  }
130803Smarcel
130803Smarcel  return -1U;
130803Smarcel}
130803Smarcel
130803Smarcel/* Returns the bit number of the most significant set bit of a number.
130803Smarcel   If the input number has no bits set -1U is returned.  */
130803Smarcelunsigned int
130803SmarcelAPInt::tcMSB(const integerPart *parts, unsigned int n)
130803Smarcel{
130803Smarcel  unsigned int msb;
130803Smarcel
130803Smarcel  do {
130803Smarcel    --n;
130803Smarcel
130803Smarcel    if (parts[n] != 0) {
130803Smarcel      msb = partMSB(parts[n]);
130803Smarcel
130803Smarcel      return msb + n * integerPartWidth;
130803Smarcel    }
130803Smarcel  } while (n);
130803Smarcel
130803Smarcel  return -1U;
130803Smarcel}
130803Smarcel
130803Smarcel/* Copy the bit vector of width srcBITS from SRC, starting at bit
130803Smarcel   srcLSB, to DST, of dstCOUNT parts, such that the bit srcLSB becomes
130803Smarcel   the least significant bit of DST.  All high bits above srcBITS in
130803Smarcel   DST are zero-filled.  */
130803Smarcelvoid
130803SmarcelAPInt::tcExtract(integerPart *dst, unsigned int dstCount,const integerPart *src,
130803Smarcel                 unsigned int srcBits, unsigned int srcLSB)
130803Smarcel{
130803Smarcel  unsigned int firstSrcPart, dstParts, shift, n;
130803Smarcel
130803Smarcel  dstParts = (srcBits + integerPartWidth - 1) / integerPartWidth;
130803Smarcel  assert(dstParts <= dstCount);
130803Smarcel
130803Smarcel  firstSrcPart = srcLSB / integerPartWidth;
130803Smarcel  tcAssign (dst, src + firstSrcPart, dstParts);
130803Smarcel
130803Smarcel  shift = srcLSB % integerPartWidth;
130803Smarcel  tcShiftRight (dst, dstParts, shift);
130803Smarcel
130803Smarcel  /* We now have (dstParts * integerPartWidth - shift) bits from SRC
130803Smarcel     in DST.  If this is less that srcBits, append the rest, else
130803Smarcel     clear the high bits.  */
130803Smarcel  n = dstParts * integerPartWidth - shift;
130803Smarcel  if (n < srcBits) {
130803Smarcel    integerPart mask = lowBitMask (srcBits - n);
130803Smarcel    dst[dstParts - 1] |= ((src[firstSrcPart + dstParts] & mask)
130803Smarcel                          << n % integerPartWidth);
130803Smarcel  } else if (n > srcBits) {
130803Smarcel    if (srcBits % integerPartWidth)
130803Smarcel      dst[dstParts - 1] &= lowBitMask (srcBits % integerPartWidth);
130803Smarcel  }
130803Smarcel
130803Smarcel  /* Clear high parts.  */
130803Smarcel  while (dstParts < dstCount)
130803Smarcel    dst[dstParts++] = 0;
130803Smarcel}
130803Smarcel
130803Smarcel/* DST += RHS + C where C is zero or one.  Returns the carry flag.  */
130803SmarcelintegerPart
130803SmarcelAPInt::tcAdd(integerPart *dst, const integerPart *rhs,
130803Smarcel             integerPart c, unsigned int parts)
130803Smarcel{
130803Smarcel  unsigned int i;
130803Smarcel
130803Smarcel  assert(c <= 1);
130803Smarcel
130803Smarcel  for (i = 0; i < parts; i++) {
130803Smarcel    integerPart l;
130803Smarcel
130803Smarcel    l = dst[i];
130803Smarcel    if (c) {
130803Smarcel      dst[i] += rhs[i] + 1;
130803Smarcel      c = (dst[i] <= l);
130803Smarcel    } else {
130803Smarcel      dst[i] += rhs[i];
130803Smarcel      c = (dst[i] < l);
130803Smarcel    }
130803Smarcel  }
130803Smarcel
130803Smarcel  return c;
130803Smarcel}
130803Smarcel
130803Smarcel/* DST -= RHS + C where C is zero or one.  Returns the carry flag.  */
130803SmarcelintegerPart
130803SmarcelAPInt::tcSubtract(integerPart *dst, const integerPart *rhs,
130803Smarcel                  integerPart c, unsigned int parts)
130803Smarcel{
130803Smarcel  unsigned int i;
130803Smarcel
130803Smarcel  assert(c <= 1);
130803Smarcel
130803Smarcel  for (i = 0; i < parts; i++) {
130803Smarcel    integerPart l;
130803Smarcel
130803Smarcel    l = dst[i];
130803Smarcel    if (c) {
130803Smarcel      dst[i] -= rhs[i] + 1;
130803Smarcel      c = (dst[i] >= l);
130803Smarcel    } else {
130803Smarcel      dst[i] -= rhs[i];
130803Smarcel      c = (dst[i] > l);
130803Smarcel    }
130803Smarcel  }
130803Smarcel
130803Smarcel  return c;
130803Smarcel}
130803Smarcel
130803Smarcel/* Negate a bignum in-place.  */
130803Smarcelvoid
130803SmarcelAPInt::tcNegate(integerPart *dst, unsigned int parts)
130803Smarcel{
130803Smarcel  tcComplement(dst, parts);
130803Smarcel  tcIncrement(dst, parts);
130803Smarcel}
130803Smarcel
130803Smarcel/*  DST += SRC * MULTIPLIER + CARRY   if add is true
130803Smarcel    DST  = SRC * MULTIPLIER + CARRY   if add is false
130803Smarcel
130803Smarcel    Requires 0 <= DSTPARTS <= SRCPARTS + 1.  If DST overlaps SRC
130803Smarcel    they must start at the same point, i.e. DST == SRC.
130803Smarcel
130803Smarcel    If DSTPARTS == SRCPARTS + 1 no overflow occurs and zero is
130803Smarcel    returned.  Otherwise DST is filled with the least significant
130803Smarcel    DSTPARTS parts of the result, and if all of the omitted higher
130803Smarcel    parts were zero return zero, otherwise overflow occurred and
130803Smarcel    return one.  */
130803Smarcelint
130803SmarcelAPInt::tcMultiplyPart(integerPart *dst, const integerPart *src,
130803Smarcel                      integerPart multiplier, integerPart carry,
130803Smarcel                      unsigned int srcParts, unsigned int dstParts,
130803Smarcel                      bool add)
130803Smarcel{
130803Smarcel  unsigned int i, n;
130803Smarcel
130803Smarcel  /* Otherwise our writes of DST kill our later reads of SRC.  */
130803Smarcel  assert(dst <= src || dst >= src + srcParts);
130803Smarcel  assert(dstParts <= srcParts + 1);
130803Smarcel
130803Smarcel  /* N loops; minimum of dstParts and srcParts.  */
130803Smarcel  n = dstParts < srcParts ? dstParts: srcParts;
130803Smarcel
130803Smarcel  for (i = 0; i < n; i++) {
130803Smarcel    integerPart low, mid, high, srcPart;
130803Smarcel
130803Smarcel      /* [ LOW, HIGH ] = MULTIPLIER * SRC[i] + DST[i] + CARRY.
130803Smarcel
130803Smarcel         This cannot overflow, because
130803Smarcel
130803Smarcel         (n - 1) * (n - 1) + 2 (n - 1) = (n - 1) * (n + 1)
130803Smarcel
130803Smarcel         which is less than n^2.  */
130803Smarcel
130803Smarcel    srcPart = src[i];
130803Smarcel
130803Smarcel    if (multiplier == 0 || srcPart == 0)        {
130803Smarcel      low = carry;
130803Smarcel      high = 0;
130803Smarcel    } else {
130803Smarcel      low = lowHalf(srcPart) * lowHalf(multiplier);
130803Smarcel      high = highHalf(srcPart) * highHalf(multiplier);
130803Smarcel
130803Smarcel      mid = lowHalf(srcPart) * highHalf(multiplier);
130803Smarcel      high += highHalf(mid);
130803Smarcel      mid <<= integerPartWidth / 2;
130803Smarcel      if (low + mid < low)
130803Smarcel        high++;
130803Smarcel      low += mid;
130803Smarcel
130803Smarcel      mid = highHalf(srcPart) * lowHalf(multiplier);
130803Smarcel      high += highHalf(mid);
130803Smarcel      mid <<= integerPartWidth / 2;
130803Smarcel      if (low + mid < low)
130803Smarcel        high++;
130803Smarcel      low += mid;
130803Smarcel
130803Smarcel      /* Now add carry.  */
130803Smarcel      if (low + carry < low)
130803Smarcel        high++;
130803Smarcel      low += carry;
130803Smarcel    }
130803Smarcel
130803Smarcel    if (add) {
130803Smarcel      /* And now DST[i], and store the new low part there.  */
130803Smarcel      if (low + dst[i] < low)
130803Smarcel        high++;
130803Smarcel      dst[i] += low;
130803Smarcel    } else
130803Smarcel      dst[i] = low;
130803Smarcel
130803Smarcel    carry = high;
130803Smarcel  }
130803Smarcel
130803Smarcel  if (i < dstParts) {
130803Smarcel    /* Full multiplication, there is no overflow.  */
130803Smarcel    assert(i + 1 == dstParts);
130803Smarcel    dst[i] = carry;
130803Smarcel    return 0;
130803Smarcel  } else {
130803Smarcel    /* We overflowed if there is carry.  */
130803Smarcel    if (carry)
130803Smarcel      return 1;
130803Smarcel
130803Smarcel    /* We would overflow if any significant unwritten parts would be
130803Smarcel       non-zero.  This is true if any remaining src parts are non-zero
130803Smarcel       and the multiplier is non-zero.  */
130803Smarcel    if (multiplier)
130803Smarcel      for (; i < srcParts; i++)
130803Smarcel        if (src[i])
130803Smarcel          return 1;
130803Smarcel
130803Smarcel    /* We fitted in the narrow destination.  */
130803Smarcel    return 0;
130803Smarcel  }
130803Smarcel}
130803Smarcel
130803Smarcel/* DST = LHS * RHS, where DST has the same width as the operands and
130803Smarcel   is filled with the least significant parts of the result.  Returns
130803Smarcel   one if overflow occurred, otherwise zero.  DST must be disjoint
130803Smarcel   from both operands.  */
130803Smarcelint
130803SmarcelAPInt::tcMultiply(integerPart *dst, const integerPart *lhs,
130803Smarcel                  const integerPart *rhs, unsigned int parts)
130803Smarcel{
130803Smarcel  unsigned int i;
130803Smarcel  int overflow;
130803Smarcel
130803Smarcel  assert(dst != lhs && dst != rhs);
130803Smarcel
130803Smarcel  overflow = 0;
130803Smarcel  tcSet(dst, 0, parts);
130803Smarcel
130803Smarcel  for (i = 0; i < parts; i++)
130803Smarcel    overflow |= tcMultiplyPart(&dst[i], lhs, rhs[i], 0, parts,
130803Smarcel                               parts - i, true);
130803Smarcel
130803Smarcel  return overflow;
130803Smarcel}
130803Smarcel
130803Smarcel/* DST = LHS * RHS, where DST has width the sum of the widths of the
130803Smarcel   operands.  No overflow occurs.  DST must be disjoint from both
130803Smarcel   operands.  Returns the number of parts required to hold the
130803Smarcel   result.  */
130803Smarcelunsigned int
130803SmarcelAPInt::tcFullMultiply(integerPart *dst, const integerPart *lhs,
130803Smarcel                      const integerPart *rhs, unsigned int lhsParts,
130803Smarcel                      unsigned int rhsParts)
130803Smarcel{
130803Smarcel  /* Put the narrower number on the LHS for less loops below.  */
130803Smarcel  if (lhsParts > rhsParts) {
130803Smarcel    return tcFullMultiply (dst, rhs, lhs, rhsParts, lhsParts);
130803Smarcel  } else {
130803Smarcel    unsigned int n;
130803Smarcel
130803Smarcel    assert(dst != lhs && dst != rhs);
130803Smarcel
130803Smarcel    tcSet(dst, 0, rhsParts);
130803Smarcel
130803Smarcel    for (n = 0; n < lhsParts; n++)
130803Smarcel      tcMultiplyPart(&dst[n], rhs, lhs[n], 0, rhsParts, rhsParts + 1, true);
130803Smarcel
130803Smarcel    n = lhsParts + rhsParts;
130803Smarcel
130803Smarcel    return n - (dst[n - 1] == 0);
130803Smarcel  }
130803Smarcel}
130803Smarcel
130803Smarcel/* If RHS is zero LHS and REMAINDER are left unchanged, return one.
130803Smarcel   Otherwise set LHS to LHS / RHS with the fractional part discarded,
130803Smarcel   set REMAINDER to the remainder, return zero.  i.e.
130803Smarcel
130803Smarcel   OLD_LHS = RHS * LHS + REMAINDER
130803Smarcel
130803Smarcel   SCRATCH is a bignum of the same size as the operands and result for
130803Smarcel   use by the routine; its contents need not be initialized and are
130803Smarcel   destroyed.  LHS, REMAINDER and SCRATCH must be distinct.
130803Smarcel*/
130803Smarcelint
130803SmarcelAPInt::tcDivide(integerPart *lhs, const integerPart *rhs,
130803Smarcel                integerPart *remainder, integerPart *srhs,
130803Smarcel                unsigned int parts)
130803Smarcel{
130803Smarcel  unsigned int n, shiftCount;
130803Smarcel  integerPart mask;
130803Smarcel
130803Smarcel  assert(lhs != remainder && lhs != srhs && remainder != srhs);
130803Smarcel
130803Smarcel  shiftCount = tcMSB(rhs, parts) + 1;
130803Smarcel  if (shiftCount == 0)
130803Smarcel    return true;
130803Smarcel
130803Smarcel  shiftCount = parts * integerPartWidth - shiftCount;
130803Smarcel  n = shiftCount / integerPartWidth;
130803Smarcel  mask = (integerPart) 1 << (shiftCount % integerPartWidth);
130803Smarcel
130803Smarcel  tcAssign(srhs, rhs, parts);
130803Smarcel  tcShiftLeft(srhs, parts, shiftCount);
130803Smarcel  tcAssign(remainder, lhs, parts);
130803Smarcel  tcSet(lhs, 0, parts);
130803Smarcel
130803Smarcel  /* Loop, subtracting SRHS if REMAINDER is greater and adding that to
130803Smarcel     the total.  */
130803Smarcel  for (;;) {
130803Smarcel      int compare;
130803Smarcel
130803Smarcel      compare = tcCompare(remainder, srhs, parts);
130803Smarcel      if (compare >= 0) {
130803Smarcel        tcSubtract(remainder, srhs, 0, parts);
130803Smarcel        lhs[n] |= mask;
130803Smarcel      }
130803Smarcel
130803Smarcel      if (shiftCount == 0)
130803Smarcel        break;
130803Smarcel      shiftCount--;
130803Smarcel      tcShiftRight(srhs, parts, 1);
130803Smarcel      if ((mask >>= 1) == 0)
130803Smarcel        mask = (integerPart) 1 << (integerPartWidth - 1), n--;
130803Smarcel  }
130803Smarcel
130803Smarcel  return false;
130803Smarcel}
130803Smarcel
130803Smarcel/* Shift a bignum left COUNT bits in-place.  Shifted in bits are zero.
130803Smarcel   There are no restrictions on COUNT.  */
130803Smarcelvoid
130803SmarcelAPInt::tcShiftLeft(integerPart *dst, unsigned int parts, unsigned int count)
130803Smarcel{
130803Smarcel  if (count) {
130803Smarcel    unsigned int jump, shift;
130803Smarcel
130803Smarcel    /* Jump is the inter-part jump; shift is is intra-part shift.  */
130803Smarcel    jump = count / integerPartWidth;
130803Smarcel    shift = count % integerPartWidth;
130803Smarcel
130803Smarcel    while (parts > jump) {
130803Smarcel      integerPart part;
130803Smarcel
130803Smarcel      parts--;
130803Smarcel
130803Smarcel      /* dst[i] comes from the two parts src[i - jump] and, if we have
130803Smarcel         an intra-part shift, src[i - jump - 1].  */
130803Smarcel      part = dst[parts - jump];
130803Smarcel      if (shift) {
130803Smarcel        part <<= shift;
130803Smarcel        if (parts >= jump + 1)
130803Smarcel          part |= dst[parts - jump - 1] >> (integerPartWidth - shift);
130803Smarcel      }
130803Smarcel
130803Smarcel      dst[parts] = part;
130803Smarcel    }
130803Smarcel
130803Smarcel    while (parts > 0)
130803Smarcel      dst[--parts] = 0;
130803Smarcel  }
130803Smarcel}
130803Smarcel
130803Smarcel/* Shift a bignum right COUNT bits in-place.  Shifted in bits are
130803Smarcel   zero.  There are no restrictions on COUNT.  */
130803Smarcelvoid
130803SmarcelAPInt::tcShiftRight(integerPart *dst, unsigned int parts, unsigned int count)
130803Smarcel{
130803Smarcel  if (count) {
130803Smarcel    unsigned int i, jump, shift;
130803Smarcel
130803Smarcel    /* Jump is the inter-part jump; shift is is intra-part shift.  */
130803Smarcel    jump = count / integerPartWidth;
130803Smarcel    shift = count % integerPartWidth;
130803Smarcel
130803Smarcel    /* Perform the shift.  This leaves the most significant COUNT bits
130803Smarcel       of the result at zero.  */
130803Smarcel    for (i = 0; i < parts; i++) {
130803Smarcel      integerPart part;
130803Smarcel
130803Smarcel      if (i + jump >= parts) {
130803Smarcel        part = 0;
130803Smarcel      } else {
130803Smarcel        part = dst[i + jump];
130803Smarcel        if (shift) {
130803Smarcel          part >>= shift;
130803Smarcel          if (i + jump + 1 < parts)
130803Smarcel            part |= dst[i + jump + 1] << (integerPartWidth - shift);
130803Smarcel        }
130803Smarcel      }
130803Smarcel
130803Smarcel      dst[i] = part;
130803Smarcel    }
130803Smarcel  }
130803Smarcel}
130803Smarcel
130803Smarcel/* Bitwise and of two bignums.  */
130803Smarcelvoid
130803SmarcelAPInt::tcAnd(integerPart *dst, const integerPart *rhs, unsigned int parts)
130803Smarcel{
130803Smarcel  unsigned int i;
130803Smarcel
130803Smarcel  for (i = 0; i < parts; i++)
130803Smarcel    dst[i] &= rhs[i];
130803Smarcel}
130803Smarcel
130803Smarcel/* Bitwise inclusive or of two bignums.  */
130803Smarcelvoid
130803SmarcelAPInt::tcOr(integerPart *dst, const integerPart *rhs, unsigned int parts)
130803Smarcel{
130803Smarcel  unsigned int i;
130803Smarcel
130803Smarcel  for (i = 0; i < parts; i++)
130803Smarcel    dst[i] |= rhs[i];
130803Smarcel}
130803Smarcel
130803Smarcel/* Bitwise exclusive or of two bignums.  */
130803Smarcelvoid
130803SmarcelAPInt::tcXor(integerPart *dst, const integerPart *rhs, unsigned int parts)
130803Smarcel{
130803Smarcel  unsigned int i;
130803Smarcel
130803Smarcel  for (i = 0; i < parts; i++)
130803Smarcel    dst[i] ^= rhs[i];
130803Smarcel}
130803Smarcel
130803Smarcel/* Complement a bignum in-place.  */
130803Smarcelvoid
130803SmarcelAPInt::tcComplement(integerPart *dst, unsigned int parts)
130803Smarcel{
130803Smarcel  unsigned int i;
130803Smarcel
130803Smarcel  for (i = 0; i < parts; i++)
130803Smarcel    dst[i] = ~dst[i];
130803Smarcel}
130803Smarcel
130803Smarcel/* Comparison (unsigned) of two bignums.  */
130803Smarcelint
130803SmarcelAPInt::tcCompare(const integerPart *lhs, const integerPart *rhs,
130803Smarcel                 unsigned int parts)
130803Smarcel{
130803Smarcel  while (parts) {
130803Smarcel      parts--;
130803Smarcel      if (lhs[parts] == rhs[parts])
130803Smarcel        continue;
130803Smarcel
130803Smarcel      if (lhs[parts] > rhs[parts])
130803Smarcel        return 1;
130803Smarcel      else
130803Smarcel        return -1;
130803Smarcel    }
130803Smarcel
130803Smarcel  return 0;
130803Smarcel}
130803Smarcel
130803Smarcel/* Increment a bignum in-place, return the carry flag.  */
130803SmarcelintegerPart
130803SmarcelAPInt::tcIncrement(integerPart *dst, unsigned int parts)
130803Smarcel{
130803Smarcel  unsigned int i;
130803Smarcel
130803Smarcel  for (i = 0; i < parts; i++)
130803Smarcel    if (++dst[i] != 0)
130803Smarcel      break;
130803Smarcel
130803Smarcel  return i == parts;
130803Smarcel}
130803Smarcel
130803Smarcel/* Set the least significant BITS bits of a bignum, clear the
130803Smarcel   rest.  */
130803Smarcelvoid
130803SmarcelAPInt::tcSetLeastSignificantBits(integerPart *dst, unsigned int parts,
130803Smarcel                                 unsigned int bits)
130803Smarcel{
130803Smarcel  unsigned int i;
130803Smarcel
130803Smarcel  i = 0;
130803Smarcel  while (bits > integerPartWidth) {
130803Smarcel    dst[i++] = ~(integerPart) 0;
130803Smarcel    bits -= integerPartWidth;
130803Smarcel  }
130803Smarcel
130803Smarcel  if (bits)
130803Smarcel    dst[i++] = ~(integerPart) 0 >> (integerPartWidth - bits);
130803Smarcel
130803Smarcel  while (i < parts)
130803Smarcel    dst[i++] = 0;
130803Smarcel}
130803Smarcel