lib/Support/APInt.cpp

   1 //===-- APInt.cpp - Implement APInt class ---------------------------------===//
   2 //
   3 //                     The LLVM Compiler Infrastructure
   4 //
   5 // This file is distributed under the University of Illinois Open Source
   6 // License. See LICENSE.TXT for details.
   7 //
   8 //===----------------------------------------------------------------------===//
   9 //
  10 // This file implements a class to represent arbitrary precision integer
  11 // constant values and provide a variety of arithmetic operations on them.
  12 //
  13 //===----------------------------------------------------------------------===//
  14
  15 #define DEBUG_TYPE "apint"
  16 #include "llvm/ADT/APInt.h"
  17 #include "llvm/ADT/FoldingSet.h"
  18 #include "llvm/ADT/SmallString.h"
  19 #include "llvm/Support/Debug.h"
  20 #include "llvm/Support/MathExtras.h"
  21 #include <cmath>
  22 #include <limits>
  23 #include <cstring>
  24 #include <cstdlib>
  25 using namespace llvm;
  26
  27 /// A utility function for allocating memory, checking for allocation failures,
  28 /// and ensuring the contents are zeroed.
  29 inline static uint64_t* getClearedMemory(uint32_t numWords) {
  30   uint64_t * result = new uint64_t[numWords];
  31   assert(result && "APInt memory allocation fails!");
  32   memset(result, 0, numWords * sizeof(uint64_t));
  33   return result;
  34 }
  35
  36 /// A utility function for allocating memory and checking for allocation
  37 /// failure.  The content is not zeroed.
  38 inline static uint64_t* getMemory(uint32_t numWords) {
  39   uint64_t * result = new uint64_t[numWords];
  40   assert(result && "APInt memory allocation fails!");
  41   return result;
  42 }
  43
  44 void APInt::initSlowCase(uint32_t numBits, uint64_t val, bool isSigned)
  45 {
  46   pVal = getClearedMemory(getNumWords());
  47   pVal[0] = val;
  48   if (isSigned && int64_t(val) < 0)
  49     for (unsigned i = 1; i < getNumWords(); ++i)
  50       pVal[i] = -1ULL;
  51 }
  52
  53 APInt::APInt(uint32_t numBits, uint32_t numWords, const uint64_t bigVal[])
  54   : BitWidth(numBits), VAL(0)  {
  55   assert(BitWidth && "bitwidth too small");
  56   assert(bigVal && "Null pointer detected!");
  57   if (isSingleWord())
  58     VAL = bigVal[0];
  59   else {
  60     // Get memory, cleared to 0
  61     pVal = getClearedMemory(getNumWords());
  62     // Calculate the number of words to copy
  63     uint32_t words = std::min<uint32_t>(numWords, getNumWords());
  64     // Copy the words from bigVal to pVal
  65     memcpy(pVal, bigVal, words * APINT_WORD_SIZE);
  66   }
  67   // Make sure unused high bits are cleared
  68   clearUnusedBits();
  69 }
  70
  71 APInt::APInt(uint32_t numbits, const char StrStart[], uint32_t slen,
  72              uint8_t radix)
  73   : BitWidth(numbits), VAL(0) {
  74   assert(BitWidth && "bitwidth too small");
  75   fromString(numbits, StrStart, slen, radix);
  76 }
  77
  78 void APInt::initSlowCase(const APInt& that)
  79 {
  80   pVal = getMemory(getNumWords());
  81   memcpy(pVal, that.pVal, getNumWords() * APINT_WORD_SIZE);
  82 }
  83
  84 APInt& APInt::AssignSlowCase(const APInt& RHS) {
  85   // Don't do anything for X = X
  86   if (this == &RHS)
  87     return *this;
  88
  89   if (BitWidth == RHS.getBitWidth()) {
  90     // assume same bit-width single-word case is already handled
  91     assert(!isSingleWord());
  92     memcpy(pVal, RHS.pVal, getNumWords() * APINT_WORD_SIZE);
  93     return *this;
  94   }
  95
  96   if (isSingleWord()) {
  97     // assume case where both are single words is already handled
  98     assert(!RHS.isSingleWord());
  99     VAL = 0;
 100     pVal = getMemory(RHS.getNumWords());
 101     memcpy(pVal, RHS.pVal, RHS.getNumWords() * APINT_WORD_SIZE);
 102   } else if (getNumWords() == RHS.getNumWords())
 103     memcpy(pVal, RHS.pVal, RHS.getNumWords() * APINT_WORD_SIZE);
 104   else if (RHS.isSingleWord()) {
 105     delete [] pVal;
 106     VAL = RHS.VAL;
 107   } else {
 108     delete [] pVal;
 109     pVal = getMemory(RHS.getNumWords());
 110     memcpy(pVal, RHS.pVal, RHS.getNumWords() * APINT_WORD_SIZE);
 111   }
 112   BitWidth = RHS.BitWidth;
 113   return clearUnusedBits();
 114 }
 115
 116 APInt& APInt::operator=(uint64_t RHS) {
 117   if (isSingleWord())
 118     VAL = RHS;
 119   else {
 120     pVal[0] = RHS;
 121     memset(pVal+1, 0, (getNumWords() - 1) * APINT_WORD_SIZE);
 122   }
 123   return clearUnusedBits();
 124 }
 125
 126 /// Profile - This method 'profiles' an APInt for use with FoldingSet.
 127 void APInt::Profile(FoldingSetNodeID& ID) const {
 128   ID.AddInteger(BitWidth);
 129
 130   if (isSingleWord()) {
 131     ID.AddInteger(VAL);
 132     return;
 133   }
 134
 135   uint32_t NumWords = getNumWords();
 136   for (unsigned i = 0; i < NumWords; ++i)
 137     ID.AddInteger(pVal[i]);
 138 }
 139
 140 /// add_1 - This function adds a single "digit" integer, y, to the multiple
 141 /// "digit" integer array,  x[]. x[] is modified to reflect the addition and
 142 /// 1 is returned if there is a carry out, otherwise 0 is returned.
 143 /// @returns the carry of the addition.
 144 static bool add_1(uint64_t dest[], uint64_t x[], uint32_t len, uint64_t y) {
 145   for (uint32_t i = 0; i < len; ++i) {
 146     dest[i] = y + x[i];
 147     if (dest[i] < y)
 148       y = 1; // Carry one to next digit.
 149     else {
 150       y = 0; // No need to carry so exit early
 151       break;
 152     }
 153   }
 154   return y;
 155 }
 156
 157 /// @brief Prefix increment operator. Increments the APInt by one.
 158 APInt& APInt::operator++() {
 159   if (isSingleWord())
 160     ++VAL;
 161   else
 162     add_1(pVal, pVal, getNumWords(), 1);
 163   return clearUnusedBits();
 164 }
 165
 166 /// sub_1 - This function subtracts a single "digit" (64-bit word), y, from
 167 /// the multi-digit integer array, x[], propagating the borrowed 1 value until
 168 /// no further borrowing is neeeded or it runs out of "digits" in x.  The result
 169 /// is 1 if "borrowing" exhausted the digits in x, or 0 if x was not exhausted.
 170 /// In other words, if y > x then this function returns 1, otherwise 0.
 171 /// @returns the borrow out of the subtraction
 172 static bool sub_1(uint64_t x[], uint32_t len, uint64_t y) {
 173   for (uint32_t i = 0; i < len; ++i) {
 174     uint64_t X = x[i];
 175     x[i] -= y;
 176     if (y > X)
 177       y = 1;  // We have to "borrow 1" from next "digit"
 178     else {
 179       y = 0;  // No need to borrow
 180       break;  // Remaining digits are unchanged so exit early
 181     }
 182   }
 183   return bool(y);
 184 }
 185
 186 /// @brief Prefix decrement operator. Decrements the APInt by one.
 187 APInt& APInt::operator--() {
 188   if (isSingleWord())
 189     --VAL;
 190   else
 191     sub_1(pVal, getNumWords(), 1);
 192   return clearUnusedBits();
 193 }
 194
 195 /// add - This function adds the integer array x to the integer array Y and
 196 /// places the result in dest.
 197 /// @returns the carry out from the addition
 198 /// @brief General addition of 64-bit integer arrays
 199 static bool add(uint64_t *dest, const uint64_t *x, const uint64_t *y,
 200                 uint32_t len) {
 201   bool carry = false;
 202   for (uint32_t i = 0; i< len; ++i) {
 203     uint64_t limit = std::min(x[i],y[i]); // must come first in case dest == x
 204     dest[i] = x[i] + y[i] + carry;
 205     carry = dest[i] < limit || (carry && dest[i] == limit);
 206   }
 207   return carry;
 208 }
 209
 210 /// Adds the RHS APint to this APInt.
 211 /// @returns this, after addition of RHS.
 212 /// @brief Addition assignment operator.
 213 APInt& APInt::operator+=(const APInt& RHS) {
 214   assert(BitWidth == RHS.BitWidth && "Bit widths must be the same");
 215   if (isSingleWord())
 216     VAL += RHS.VAL;
 217   else {
 218     add(pVal, pVal, RHS.pVal, getNumWords());
 219   }
 220   return clearUnusedBits();
 221 }
 222
 223 /// Subtracts the integer array y from the integer array x
 224 /// @returns returns the borrow out.
 225 /// @brief Generalized subtraction of 64-bit integer arrays.
 226 static bool sub(uint64_t *dest, const uint64_t *x, const uint64_t *y,
 227                 uint32_t len) {
 228   bool borrow = false;
 229   for (uint32_t i = 0; i < len; ++i) {
 230     uint64_t x_tmp = borrow ? x[i] - 1 : x[i];
 231     borrow = y[i] > x_tmp || (borrow && x[i] == 0);
 232     dest[i] = x_tmp - y[i];
 233   }
 234   return borrow;
 235 }
 236
 237 /// Subtracts the RHS APInt from this APInt
 238 /// @returns this, after subtraction
 239 /// @brief Subtraction assignment operator.
 240 APInt& APInt::operator-=(const APInt& RHS) {
 241   assert(BitWidth == RHS.BitWidth && "Bit widths must be the same");
 242   if (isSingleWord())
 243     VAL -= RHS.VAL;
 244   else
 245     sub(pVal, pVal, RHS.pVal, getNumWords());
 246   return clearUnusedBits();
 247 }
 248
 249 /// Multiplies an integer array, x by a a uint64_t integer and places the result
 250 /// into dest.
 251 /// @returns the carry out of the multiplication.
 252 /// @brief Multiply a multi-digit APInt by a single digit (64-bit) integer.
 253 static uint64_t mul_1(uint64_t dest[], uint64_t x[], uint32_t len, uint64_t y) {
 254   // Split y into high 32-bit part (hy)  and low 32-bit part (ly)
 255   uint64_t ly = y & 0xffffffffULL, hy = y >> 32;
 256   uint64_t carry = 0;
 257
 258   // For each digit of x.
 259   for (uint32_t i = 0; i < len; ++i) {
 260     // Split x into high and low words
 261     uint64_t lx = x[i] & 0xffffffffULL;
 262     uint64_t hx = x[i] >> 32;
 263     // hasCarry - A flag to indicate if there is a carry to the next digit.
 264     // hasCarry == 0, no carry
 265     // hasCarry == 1, has carry
 266     // hasCarry == 2, no carry and the calculation result == 0.
 267     uint8_t hasCarry = 0;
 268     dest[i] = carry + lx * ly;
 269     // Determine if the add above introduces carry.
 270     hasCarry = (dest[i] < carry) ? 1 : 0;
 271     carry = hx * ly + (dest[i] >> 32) + (hasCarry ? (1ULL << 32) : 0);
 272     // The upper limit of carry can be (2^32 - 1)(2^32 - 1) +
 273     // (2^32 - 1) + 2^32 = 2^64.
 274     hasCarry = (!carry && hasCarry) ? 1 : (!carry ? 2 : 0);
 275
 276     carry += (lx * hy) & 0xffffffffULL;
 277     dest[i] = (carry << 32) | (dest[i] & 0xffffffffULL);
 278     carry = (((!carry && hasCarry != 2) || hasCarry == 1) ? (1ULL << 32) : 0) +
 279             (carry >> 32) + ((lx * hy) >> 32) + hx * hy;
 280   }
 281   return carry;
 282 }
 283
 284 /// Multiplies integer array x by integer array y and stores the result into
 285 /// the integer array dest. Note that dest's size must be >= xlen + ylen.
 286 /// @brief Generalized multiplicate of integer arrays.
 287 static void mul(uint64_t dest[], uint64_t x[], uint32_t xlen, uint64_t y[],
 288                 uint32_t ylen) {
 289   dest[xlen] = mul_1(dest, x, xlen, y[0]);
 290   for (uint32_t i = 1; i < ylen; ++i) {
 291     uint64_t ly = y[i] & 0xffffffffULL, hy = y[i] >> 32;
 292     uint64_t carry = 0, lx = 0, hx = 0;
 293     for (uint32_t j = 0; j < xlen; ++j) {
 294       lx = x[j] & 0xffffffffULL;
 295       hx = x[j] >> 32;
 296       // hasCarry - A flag to indicate if has carry.
 297       // hasCarry == 0, no carry
 298       // hasCarry == 1, has carry
 299       // hasCarry == 2, no carry and the calculation result == 0.
 300       uint8_t hasCarry = 0;
 301       uint64_t resul = carry + lx * ly;
 302       hasCarry = (resul < carry) ? 1 : 0;
 303       carry = (hasCarry ? (1ULL << 32) : 0) + hx * ly + (resul >> 32);
 304       hasCarry = (!carry && hasCarry) ? 1 : (!carry ? 2 : 0);
 305
 306       carry += (lx * hy) & 0xffffffffULL;
 307       resul = (carry << 32) | (resul & 0xffffffffULL);
 308       dest[i+j] += resul;
 309       carry = (((!carry && hasCarry != 2) || hasCarry == 1) ? (1ULL << 32) : 0)+
 310               (carry >> 32) + (dest[i+j] < resul ? 1 : 0) +
 311               ((lx * hy) >> 32) + hx * hy;
 312     }
 313     dest[i+xlen] = carry;
 314   }
 315 }
 316
 317 APInt& APInt::operator*=(const APInt& RHS) {
 318   assert(BitWidth == RHS.BitWidth && "Bit widths must be the same");
 319   if (isSingleWord()) {
 320     VAL *= RHS.VAL;
 321     clearUnusedBits();
 322     return *this;
 323   }
 324
 325   // Get some bit facts about LHS and check for zero
 326   uint32_t lhsBits = getActiveBits();
 327   uint32_t lhsWords = !lhsBits ? 0 : whichWord(lhsBits - 1) + 1;
 328   if (!lhsWords)
 329     // 0 * X ===> 0
 330     return *this;
 331
 332   // Get some bit facts about RHS and check for zero
 333   uint32_t rhsBits = RHS.getActiveBits();
 334   uint32_t rhsWords = !rhsBits ? 0 : whichWord(rhsBits - 1) + 1;
 335   if (!rhsWords) {
 336     // X * 0 ===> 0
 337     clear();
 338     return *this;
 339   }
 340
 341   // Allocate space for the result
 342   uint32_t destWords = rhsWords + lhsWords;
 343   uint64_t *dest = getMemory(destWords);
 344
 345   // Perform the long multiply
 346   mul(dest, pVal, lhsWords, RHS.pVal, rhsWords);
 347
 348   // Copy result back into *this
 349   clear();
 350   uint32_t wordsToCopy = destWords >= getNumWords() ? getNumWords() : destWords;
 351   memcpy(pVal, dest, wordsToCopy * APINT_WORD_SIZE);
 352
 353   // delete dest array and return
 354   delete[] dest;
 355   return *this;
 356 }
 357
 358 APInt& APInt::operator&=(const APInt& RHS) {
 359   assert(BitWidth == RHS.BitWidth && "Bit widths must be the same");
 360   if (isSingleWord()) {
 361     VAL &= RHS.VAL;
 362     return *this;
 363   }
 364   uint32_t numWords = getNumWords();
 365   for (uint32_t i = 0; i < numWords; ++i)
 366     pVal[i] &= RHS.pVal[i];
 367   return *this;
 368 }
 369
 370 APInt& APInt::operator|=(const APInt& RHS) {
 371   assert(BitWidth == RHS.BitWidth && "Bit widths must be the same");
 372   if (isSingleWord()) {
 373     VAL |= RHS.VAL;
 374     return *this;
 375   }
 376   uint32_t numWords = getNumWords();
 377   for (uint32_t i = 0; i < numWords; ++i)
 378     pVal[i] |= RHS.pVal[i];
 379   return *this;
 380 }
 381
 382 APInt& APInt::operator^=(const APInt& RHS) {
 383   assert(BitWidth == RHS.BitWidth && "Bit widths must be the same");
 384   if (isSingleWord()) {
 385     VAL ^= RHS.VAL;
 386     this->clearUnusedBits();
 387     return *this;
 388   }
 389   uint32_t numWords = getNumWords();
 390   for (uint32_t i = 0; i < numWords; ++i)
 391     pVal[i] ^= RHS.pVal[i];
 392   return clearUnusedBits();
 393 }
 394
 395 APInt APInt::AndSlowCase(const APInt& RHS) const {
 396   uint32_t numWords = getNumWords();
 397   uint64_t* val = getMemory(numWords);
 398   for (uint32_t i = 0; i < numWords; ++i)
 399     val[i] = pVal[i] & RHS.pVal[i];
 400   return APInt(val, getBitWidth());
 401 }
 402
 403 APInt APInt::OrSlowCase(const APInt& RHS) const {
 404   uint32_t numWords = getNumWords();
 405   uint64_t *val = getMemory(numWords);
 406   for (uint32_t i = 0; i < numWords; ++i)
 407     val[i] = pVal[i] | RHS.pVal[i];
 408   return APInt(val, getBitWidth());
 409 }
 410
 411 APInt APInt::XorSlowCase(const APInt& RHS) const {
 412   uint32_t numWords = getNumWords();
 413   uint64_t *val = getMemory(numWords);
 414   for (uint32_t i = 0; i < numWords; ++i)
 415     val[i] = pVal[i] ^ RHS.pVal[i];
 416
 417   // 0^0==1 so clear the high bits in case they got set.
 418   return APInt(val, getBitWidth()).clearUnusedBits();
 419 }
 420
 421 bool APInt::operator !() const {
 422   if (isSingleWord())
 423     return !VAL;
 424
 425   for (uint32_t i = 0; i < getNumWords(); ++i)
 426     if (pVal[i])
 427       return false;
 428   return true;
 429 }
 430
 431 APInt APInt::operator*(const APInt& RHS) const {
 432   assert(BitWidth == RHS.BitWidth && "Bit widths must be the same");
 433   if (isSingleWord())
 434     return APInt(BitWidth, VAL * RHS.VAL);
 435   APInt Result(*this);
 436   Result *= RHS;
 437   return Result.clearUnusedBits();
 438 }
 439
 440 APInt APInt::operator+(const APInt& RHS) const {
 441   assert(BitWidth == RHS.BitWidth && "Bit widths must be the same");
 442   if (isSingleWord())
 443     return APInt(BitWidth, VAL + RHS.VAL);
 444   APInt Result(BitWidth, 0);
 445   add(Result.pVal, this->pVal, RHS.pVal, getNumWords());
 446   return Result.clearUnusedBits();
 447 }
 448
 449 APInt APInt::operator-(const APInt& RHS) const {
 450   assert(BitWidth == RHS.BitWidth && "Bit widths must be the same");
 451   if (isSingleWord())
 452     return APInt(BitWidth, VAL - RHS.VAL);
 453   APInt Result(BitWidth, 0);
 454   sub(Result.pVal, this->pVal, RHS.pVal, getNumWords());
 455   return Result.clearUnusedBits();
 456 }
 457
 458 bool APInt::operator[](uint32_t bitPosition) const {
 459   return (maskBit(bitPosition) &
 460           (isSingleWord() ?  VAL : pVal[whichWord(bitPosition)])) != 0;
 461 }
 462
 463 bool APInt::EqualSlowCase(const APInt& RHS) const {
 464   // Get some facts about the number of bits used in the two operands.
 465   uint32_t n1 = getActiveBits();
 466   uint32_t n2 = RHS.getActiveBits();
 467
 468   // If the number of bits isn't the same, they aren't equal
 469   if (n1 != n2)
 470     return false;
 471
 472   // If the number of bits fits in a word, we only need to compare the low word.
 473   if (n1 <= APINT_BITS_PER_WORD)
 474     return pVal[0] == RHS.pVal[0];
 475
 476   // Otherwise, compare everything
 477   for (int i = whichWord(n1 - 1); i >= 0; --i)
 478     if (pVal[i] != RHS.pVal[i])
 479       return false;
 480   return true;
 481 }
 482
 483 bool APInt::EqualSlowCase(uint64_t Val) const {
 484   uint32_t n = getActiveBits();
 485   if (n <= APINT_BITS_PER_WORD)
 486     return pVal[0] == Val;
 487   else
 488     return false;
 489 }
 490
 491 bool APInt::ult(const APInt& RHS) const {
 492   assert(BitWidth == RHS.BitWidth && "Bit widths must be same for comparison");
 493   if (isSingleWord())
 494     return VAL < RHS.VAL;
 495
 496   // Get active bit length of both operands
 497   uint32_t n1 = getActiveBits();
 498   uint32_t n2 = RHS.getActiveBits();
 499
 500   // If magnitude of LHS is less than RHS, return true.
 501   if (n1 < n2)
 502     return true;
 503
 504   // If magnitude of RHS is greather than LHS, return false.
 505   if (n2 < n1)
 506     return false;
 507
 508   // If they bot fit in a word, just compare the low order word
 509   if (n1 <= APINT_BITS_PER_WORD && n2 <= APINT_BITS_PER_WORD)
 510     return pVal[0] < RHS.pVal[0];
 511
 512   // Otherwise, compare all words
 513   uint32_t topWord = whichWord(std::max(n1,n2)-1);
 514   for (int i = topWord; i >= 0; --i) {
 515     if (pVal[i] > RHS.pVal[i])
 516       return false;
 517     if (pVal[i] < RHS.pVal[i])
 518       return true;
 519   }
 520   return false;
 521 }
 522
 523 bool APInt::slt(const APInt& RHS) const {
 524   assert(BitWidth == RHS.BitWidth && "Bit widths must be same for comparison");
 525   if (isSingleWord()) {
 526     int64_t lhsSext = (int64_t(VAL) << (64-BitWidth)) >> (64-BitWidth);
 527     int64_t rhsSext = (int64_t(RHS.VAL) << (64-BitWidth)) >> (64-BitWidth);
 528     return lhsSext < rhsSext;
 529   }
 530
 531   APInt lhs(*this);
 532   APInt rhs(RHS);
 533   bool lhsNeg = isNegative();
 534   bool rhsNeg = rhs.isNegative();
 535   if (lhsNeg) {
 536     // Sign bit is set so perform two's complement to make it positive
 537     lhs.flip();
 538     lhs++;
 539   }
 540   if (rhsNeg) {
 541     // Sign bit is set so perform two's complement to make it positive
 542     rhs.flip();
 543     rhs++;
 544   }
 545
 546   // Now we have unsigned values to compare so do the comparison if necessary
 547   // based on the negativeness of the values.
 548   if (lhsNeg)
 549     if (rhsNeg)
 550       return lhs.ugt(rhs);
 551     else
 552       return true;
 553   else if (rhsNeg)
 554     return false;
 555   else
 556     return lhs.ult(rhs);
 557 }
 558
 559 APInt& APInt::set(uint32_t bitPosition) {
 560   if (isSingleWord())
 561     VAL |= maskBit(bitPosition);
 562   else
 563     pVal[whichWord(bitPosition)] |= maskBit(bitPosition);
 564   return *this;
 565 }
 566
 567 /// Set the given bit to 0 whose position is given as "bitPosition".
 568 /// @brief Set a given bit to 0.
 569 APInt& APInt::clear(uint32_t bitPosition) {
 570   if (isSingleWord())
 571     VAL &= ~maskBit(bitPosition);
 572   else
 573     pVal[whichWord(bitPosition)] &= ~maskBit(bitPosition);
 574   return *this;
 575 }
 576
 577 /// @brief Toggle every bit to its opposite value.
 578
 579 /// Toggle a given bit to its opposite value whose position is given
 580 /// as "bitPosition".
 581 /// @brief Toggles a given bit to its opposite value.
 582 APInt& APInt::flip(uint32_t bitPosition) {
 583   assert(bitPosition < BitWidth && "Out of the bit-width range!");
 584   if ((*this)[bitPosition]) clear(bitPosition);
 585   else set(bitPosition);
 586   return *this;
 587 }
 588
 589 uint32_t APInt::getBitsNeeded(const char* str, uint32_t slen, uint8_t radix) {
 590   assert(str != 0 && "Invalid value string");
 591   assert(slen > 0 && "Invalid string length");
 592
 593   // Each computation below needs to know if its negative
 594   uint32_t isNegative = str[0] == '-';
 595   if (isNegative) {
 596     slen--;
 597     str++;
 598   }
 599   // For radixes of power-of-two values, the bits required is accurately and
 600   // easily computed
 601   if (radix == 2)
 602     return slen + isNegative;
 603   if (radix == 8)
 604     return slen * 3 + isNegative;
 605   if (radix == 16)
 606     return slen * 4 + isNegative;
 607
 608   // Otherwise it must be radix == 10, the hard case
 609   assert(radix == 10 && "Invalid radix");
 610
 611   // This is grossly inefficient but accurate. We could probably do something
 612   // with a computation of roughly slen*64/20 and then adjust by the value of
 613   // the first few digits. But, I'm not sure how accurate that could be.
 614
 615   // Compute a sufficient number of bits that is always large enough but might
 616   // be too large. This avoids the assertion in the constructor.
 617   uint32_t sufficient = slen*64/18;
 618
 619   // Convert to the actual binary value.
 620   APInt tmp(sufficient, str, slen, radix);
 621
 622   // Compute how many bits are required.
 623   return isNegative + tmp.logBase2() + 1;
 624 }
 625
 626 uint64_t APInt::getHashValue() const {
 627   // Put the bit width into the low order bits.
 628   uint64_t hash = BitWidth;
 629
 630   // Add the sum of the words to the hash.
 631   if (isSingleWord())
 632     hash += VAL << 6; // clear separation of up to 64 bits
 633   else
 634     for (uint32_t i = 0; i < getNumWords(); ++i)
 635       hash += pVal[i] << 6; // clear sepration of up to 64 bits
 636   return hash;
 637 }
 638
 639 /// HiBits - This function returns the high "numBits" bits of this APInt.
 640 APInt APInt::getHiBits(uint32_t numBits) const {
 641   return APIntOps::lshr(*this, BitWidth - numBits);
 642 }
 643
 644 /// LoBits - This function returns the low "numBits" bits of this APInt.
 645 APInt APInt::getLoBits(uint32_t numBits) const {
 646   return APIntOps::lshr(APIntOps::shl(*this, BitWidth - numBits),
 647                         BitWidth - numBits);
 648 }
 649
 650 bool APInt::isPowerOf2() const {
 651   return (!!*this) && !(*this & (*this - APInt(BitWidth,1)));
 652 }
 653
 654 uint32_t APInt::countLeadingZerosSlowCase() const {
 655   uint32_t Count = 0;
 656   for (uint32_t i = getNumWords(); i > 0u; --i) {
 657     if (pVal[i-1] == 0)
 658       Count += APINT_BITS_PER_WORD;
 659     else {
 660       Count += CountLeadingZeros_64(pVal[i-1]);
 661       break;
 662     }
 663   }
 664   uint32_t remainder = BitWidth % APINT_BITS_PER_WORD;
 665   if (remainder)
 666     Count -= APINT_BITS_PER_WORD - remainder;
 667   return std::min(Count, BitWidth);
 668 }
 669
 670 static uint32_t countLeadingOnes_64(uint64_t V, uint32_t skip) {
 671   uint32_t Count = 0;
 672   if (skip)
 673     V <<= skip;
 674   while (V && (V & (1ULL << 63))) {
 675     Count++;
 676     V <<= 1;
 677   }
 678   return Count;
 679 }
 680
 681 uint32_t APInt::countLeadingOnes() const {
 682   if (isSingleWord())
 683     return countLeadingOnes_64(VAL, APINT_BITS_PER_WORD - BitWidth);
 684
 685   uint32_t highWordBits = BitWidth % APINT_BITS_PER_WORD;
 686   uint32_t shift = (highWordBits == 0 ? 0 : APINT_BITS_PER_WORD - highWordBits);
 687   int i = getNumWords() - 1;
 688   uint32_t Count = countLeadingOnes_64(pVal[i], shift);
 689   if (Count == highWordBits) {
 690     for (i--; i >= 0; --i) {
 691       if (pVal[i] == -1ULL)
 692         Count += APINT_BITS_PER_WORD;
 693       else {
 694         Count += countLeadingOnes_64(pVal[i], 0);
 695         break;
 696       }
 697     }
 698   }
 699   return Count;
 700 }
 701
 702 uint32_t APInt::countTrailingZeros() const {
 703   if (isSingleWord())
 704     return std::min(uint32_t(CountTrailingZeros_64(VAL)), BitWidth);
 705   uint32_t Count = 0;
 706   uint32_t i = 0;
 707   for (; i < getNumWords() && pVal[i] == 0; ++i)
 708     Count += APINT_BITS_PER_WORD;
 709   if (i < getNumWords())
 710     Count += CountTrailingZeros_64(pVal[i]);
 711   return std::min(Count, BitWidth);
 712 }
 713
 714 uint32_t APInt::countTrailingOnesSlowCase() const {
 715   uint32_t Count = 0;
 716   uint32_t i = 0;
 717   for (; i < getNumWords() && pVal[i] == -1ULL; ++i)
 718     Count += APINT_BITS_PER_WORD;
 719   if (i < getNumWords())
 720     Count += CountTrailingOnes_64(pVal[i]);
 721   return std::min(Count, BitWidth);
 722 }
 723
 724 uint32_t APInt::countPopulationSlowCase() const {
 725   uint32_t Count = 0;
 726   for (uint32_t i = 0; i < getNumWords(); ++i)
 727     Count += CountPopulation_64(pVal[i]);
 728   return Count;
 729 }
 730
 731 APInt APInt::byteSwap() const {
 732   assert(BitWidth >= 16 && BitWidth % 16 == 0 && "Cannot byteswap!");
 733   if (BitWidth == 16)
 734     return APInt(BitWidth, ByteSwap_16(uint16_t(VAL)));
 735   else if (BitWidth == 32)
 736     return APInt(BitWidth, ByteSwap_32(uint32_t(VAL)));
 737   else if (BitWidth == 48) {
 738     uint32_t Tmp1 = uint32_t(VAL >> 16);
 739     Tmp1 = ByteSwap_32(Tmp1);
 740     uint16_t Tmp2 = uint16_t(VAL);
 741     Tmp2 = ByteSwap_16(Tmp2);
 742     return APInt(BitWidth, (uint64_t(Tmp2) << 32) | Tmp1);
 743   } else if (BitWidth == 64)
 744     return APInt(BitWidth, ByteSwap_64(VAL));
 745   else {
 746     APInt Result(BitWidth, 0);
 747     char *pByte = (char*)Result.pVal;
 748     for (uint32_t i = 0; i < BitWidth / APINT_WORD_SIZE / 2; ++i) {
 749       char Tmp = pByte[i];
 750       pByte[i] = pByte[BitWidth / APINT_WORD_SIZE - 1 - i];
 751       pByte[BitWidth / APINT_WORD_SIZE - i - 1] = Tmp;
 752     }
 753     return Result;
 754   }
 755 }
 756
 757 APInt llvm::APIntOps::GreatestCommonDivisor(const APInt& API1,
 758                                             const APInt& API2) {
 759   APInt A = API1, B = API2;
 760   while (!!B) {
 761     APInt T = B;
 762     B = APIntOps::urem(A, B);
 763     A = T;
 764   }
 765   return A;
 766 }
 767
 768 APInt llvm::APIntOps::RoundDoubleToAPInt(double Double, uint32_t width) {
 769   union {
 770     double D;
 771     uint64_t I;
 772   } T;
 773   T.D = Double;
 774
 775   // Get the sign bit from the highest order bit
 776   bool isNeg = T.I >> 63;
 777
 778   // Get the 11-bit exponent and adjust for the 1023 bit bias
 779   int64_t exp = ((T.I >> 52) & 0x7ff) - 1023;
 780
 781   // If the exponent is negative, the value is < 0 so just return 0.
 782   if (exp < 0)
 783     return APInt(width, 0u);
 784
 785   // Extract the mantissa by clearing the top 12 bits (sign + exponent).
 786   uint64_t mantissa = (T.I & (~0ULL >> 12)) | 1ULL << 52;
 787
 788   // If the exponent doesn't shift all bits out of the mantissa
 789   if (exp < 52)
 790     return isNeg ? -APInt(width, mantissa >> (52 - exp)) :
 791                     APInt(width, mantissa >> (52 - exp));
 792
 793   // If the client didn't provide enough bits for us to shift the mantissa into
 794   // then the result is undefined, just return 0
 795   if (width <= exp - 52)
 796     return APInt(width, 0);
 797
 798   // Otherwise, we have to shift the mantissa bits up to the right location
 799   APInt Tmp(width, mantissa);
 800   Tmp = Tmp.shl((uint32_t)exp - 52);
 801   return isNeg ? -Tmp : Tmp;
 802 }
 803
 804 /// RoundToDouble - This function convert this APInt to a double.
 805 /// The layout for double is as following (IEEE Standard 754):
 806 ///  --------------------------------------
 807 /// |  Sign    Exponent    Fraction    Bias |
 808 /// |-------------------------------------- |
 809 /// |  1[63]   11[62-52]   52[51-00]   1023 |
 810 ///  --------------------------------------
 811 double APInt::roundToDouble(bool isSigned) const {
 812
 813   // Handle the simple case where the value is contained in one uint64_t.
 814   if (isSingleWord() || getActiveBits() <= APINT_BITS_PER_WORD) {
 815     if (isSigned) {
 816       int64_t sext = (int64_t(VAL) << (64-BitWidth)) >> (64-BitWidth);
 817       return double(sext);
 818     } else
 819       return double(VAL);
 820   }
 821
 822   // Determine if the value is negative.
 823   bool isNeg = isSigned ? (*this)[BitWidth-1] : false;
 824
 825   // Construct the absolute value if we're negative.
 826   APInt Tmp(isNeg ? -(*this) : (*this));
 827
 828   // Figure out how many bits we're using.
 829   uint32_t n = Tmp.getActiveBits();
 830
 831   // The exponent (without bias normalization) is just the number of bits
 832   // we are using. Note that the sign bit is gone since we constructed the
 833   // absolute value.
 834   uint64_t exp = n;
 835
 836   // Return infinity for exponent overflow
 837   if (exp > 1023) {
 838     if (!isSigned || !isNeg)
 839       return std::numeric_limits<double>::infinity();
 840     else
 841       return -std::numeric_limits<double>::infinity();
 842   }
 843   exp += 1023; // Increment for 1023 bias
 844
 845   // Number of bits in mantissa is 52. To obtain the mantissa value, we must
 846   // extract the high 52 bits from the correct words in pVal.
 847   uint64_t mantissa;
 848   unsigned hiWord = whichWord(n-1);
 849   if (hiWord == 0) {
 850     mantissa = Tmp.pVal[0];
 851     if (n > 52)
 852       mantissa >>= n - 52; // shift down, we want the top 52 bits.
 853   } else {
 854     assert(hiWord > 0 && "huh?");
 855     uint64_t hibits = Tmp.pVal[hiWord] << (52 - n % APINT_BITS_PER_WORD);
 856     uint64_t lobits = Tmp.pVal[hiWord-1] >> (11 + n % APINT_BITS_PER_WORD);
 857     mantissa = hibits | lobits;
 858   }
 859
 860   // The leading bit of mantissa is implicit, so get rid of it.
 861   uint64_t sign = isNeg ? (1ULL << (APINT_BITS_PER_WORD - 1)) : 0;
 862   union {
 863     double D;
 864     uint64_t I;
 865   } T;
 866   T.I = sign | (exp << 52) | mantissa;
 867   return T.D;
 868 }
 869
 870 // Truncate to new width.
 871 APInt &APInt::trunc(uint32_t width) {
 872   assert(width < BitWidth && "Invalid APInt Truncate request");
 873   assert(width && "Can't truncate to 0 bits");
 874   uint32_t wordsBefore = getNumWords();
 875   BitWidth = width;
 876   uint32_t wordsAfter = getNumWords();
 877   if (wordsBefore != wordsAfter) {
 878     if (wordsAfter == 1) {
 879       uint64_t *tmp = pVal;
 880       VAL = pVal[0];
 881       delete [] tmp;
 882     } else {
 883       uint64_t *newVal = getClearedMemory(wordsAfter);
 884       for (uint32_t i = 0; i < wordsAfter; ++i)
 885         newVal[i] = pVal[i];
 886       delete [] pVal;
 887       pVal = newVal;
 888     }
 889   }
 890   return clearUnusedBits();
 891 }
 892
 893 // Sign extend to a new width.
 894 APInt &APInt::sext(uint32_t width) {
 895   assert(width > BitWidth && "Invalid APInt SignExtend request");
 896   // If the sign bit isn't set, this is the same as zext.
 897   if (!isNegative()) {
 898     zext(width);
 899     return *this;
 900   }
 901
 902   // The sign bit is set. First, get some facts
 903   uint32_t wordsBefore = getNumWords();
 904   uint32_t wordBits = BitWidth % APINT_BITS_PER_WORD;
 905   BitWidth = width;
 906   uint32_t wordsAfter = getNumWords();
 907
 908   // Mask the high order word appropriately
 909   if (wordsBefore == wordsAfter) {
 910     uint32_t newWordBits = width % APINT_BITS_PER_WORD;
 911     // The extension is contained to the wordsBefore-1th word.
 912     uint64_t mask = ~0ULL;
 913     if (newWordBits)
 914       mask >>= APINT_BITS_PER_WORD - newWordBits;
 915     mask <<= wordBits;
 916     if (wordsBefore == 1)
 917       VAL |= mask;
 918     else
 919       pVal[wordsBefore-1] |= mask;
 920     return clearUnusedBits();
 921   }
 922
 923   uint64_t mask = wordBits == 0 ? 0 : ~0ULL << wordBits;
 924   uint64_t *newVal = getMemory(wordsAfter);
 925   if (wordsBefore == 1)
 926     newVal[0] = VAL | mask;
 927   else {
 928     for (uint32_t i = 0; i < wordsBefore; ++i)
 929       newVal[i] = pVal[i];
 930     newVal[wordsBefore-1] |= mask;
 931   }
 932   for (uint32_t i = wordsBefore; i < wordsAfter; i++)
 933     newVal[i] = -1ULL;
 934   if (wordsBefore != 1)
 935     delete [] pVal;
 936   pVal = newVal;
 937   return clearUnusedBits();
 938 }
 939
 940 //  Zero extend to a new width.
 941 APInt &APInt::zext(uint32_t width) {
 942   assert(width > BitWidth && "Invalid APInt ZeroExtend request");
 943   uint32_t wordsBefore = getNumWords();
 944   BitWidth = width;
 945   uint32_t wordsAfter = getNumWords();
 946   if (wordsBefore != wordsAfter) {
 947     uint64_t *newVal = getClearedMemory(wordsAfter);
 948     if (wordsBefore == 1)
 949       newVal[0] = VAL;
 950     else
 951       for (uint32_t i = 0; i < wordsBefore; ++i)
 952         newVal[i] = pVal[i];
 953     if (wordsBefore != 1)
 954       delete [] pVal;
 955     pVal = newVal;
 956   }
 957   return *this;
 958 }
 959
 960 APInt &APInt::zextOrTrunc(uint32_t width) {
 961   if (BitWidth < width)
 962     return zext(width);
 963   if (BitWidth > width)
 964     return trunc(width);
 965   return *this;
 966 }
 967
 968 APInt &APInt::sextOrTrunc(uint32_t width) {
 969   if (BitWidth < width)
 970     return sext(width);
 971   if (BitWidth > width)
 972     return trunc(width);
 973   return *this;
 974 }
 975
 976 /// Arithmetic right-shift this APInt by shiftAmt.
 977 /// @brief Arithmetic right-shift function.
 978 APInt APInt::ashr(const APInt &shiftAmt) const {
 979   return ashr((uint32_t)shiftAmt.getLimitedValue(BitWidth));
 980 }
 981
 982 /// Arithmetic right-shift this APInt by shiftAmt.
 983 /// @brief Arithmetic right-shift function.
 984 APInt APInt::ashr(uint32_t shiftAmt) const {
 985   assert(shiftAmt <= BitWidth && "Invalid shift amount");
 986   // Handle a degenerate case
 987   if (shiftAmt == 0)
 988     return *this;
 989
 990   // Handle single word shifts with built-in ashr
 991   if (isSingleWord()) {
 992     if (shiftAmt == BitWidth)
 993       return APInt(BitWidth, 0); // undefined
 994     else {
 995       uint32_t SignBit = APINT_BITS_PER_WORD - BitWidth;
 996       return APInt(BitWidth,
 997         (((int64_t(VAL) << SignBit) >> SignBit) >> shiftAmt));
 998     }
 999   }
1000
1001   // If all the bits were shifted out, the result is, technically, undefined.
1002   // We return -1 if it was negative, 0 otherwise. We check this early to avoid
1003   // issues in the algorithm below.
1004   if (shiftAmt == BitWidth) {
1005     if (isNegative())
1006       return APInt(BitWidth, -1ULL, true);
1007     else
1008       return APInt(BitWidth, 0);
1009   }
1010
1011   // Create some space for the result.
1012   uint64_t * val = new uint64_t[getNumWords()];
1013
1014   // Compute some values needed by the following shift algorithms
1015   uint32_t wordShift = shiftAmt % APINT_BITS_PER_WORD; // bits to shift per word
1016   uint32_t offset = shiftAmt / APINT_BITS_PER_WORD; // word offset for shift
1017   uint32_t breakWord = getNumWords() - 1 - offset; // last word affected
1018   uint32_t bitsInWord = whichBit(BitWidth); // how many bits in last word?
1019   if (bitsInWord == 0)
1020     bitsInWord = APINT_BITS_PER_WORD;
1021
1022   // If we are shifting whole words, just move whole words
1023   if (wordShift == 0) {
1024     // Move the words containing significant bits
1025     for (uint32_t i = 0; i <= breakWord; ++i)
1026       val[i] = pVal[i+offset]; // move whole word
1027
1028     // Adjust the top significant word for sign bit fill, if negative
1029     if (isNegative())
1030       if (bitsInWord < APINT_BITS_PER_WORD)
1031         val[breakWord] |= ~0ULL << bitsInWord; // set high bits
1032   } else {
1033     // Shift the low order words
1034     for (uint32_t i = 0; i < breakWord; ++i) {
1035       // This combines the shifted corresponding word with the low bits from
1036       // the next word (shifted into this word's high bits).
1037       val[i] = (pVal[i+offset] >> wordShift) |
1038                (pVal[i+offset+1] << (APINT_BITS_PER_WORD - wordShift));
1039     }
1040
1041     // Shift the break word. In this case there are no bits from the next word
1042     // to include in this word.
1043     val[breakWord] = pVal[breakWord+offset] >> wordShift;
1044
1045     // Deal with sign extenstion in the break word, and possibly the word before
1046     // it.
1047     if (isNegative()) {
1048       if (wordShift > bitsInWord) {
1049         if (breakWord > 0)
1050           val[breakWord-1] |=
1051             ~0ULL << (APINT_BITS_PER_WORD - (wordShift - bitsInWord));
1052         val[breakWord] |= ~0ULL;
1053       } else
1054         val[breakWord] |= (~0ULL << (bitsInWord - wordShift));
1055     }
1056   }
1057
1058   // Remaining words are 0 or -1, just assign them.
1059   uint64_t fillValue = (isNegative() ? -1ULL : 0);
1060   for (uint32_t i = breakWord+1; i < getNumWords(); ++i)
1061     val[i] = fillValue;
1062   return APInt(val, BitWidth).clearUnusedBits();
1063 }
1064
1065 /// Logical right-shift this APInt by shiftAmt.
1066 /// @brief Logical right-shift function.
1067 APInt APInt::lshr(const APInt &shiftAmt) const {
1068   return lshr((uint32_t)shiftAmt.getLimitedValue(BitWidth));
1069 }
1070
1071 /// Logical right-shift this APInt by shiftAmt.
1072 /// @brief Logical right-shift function.
1073 APInt APInt::lshr(uint32_t shiftAmt) const {
1074   if (isSingleWord()) {
1075     if (shiftAmt == BitWidth)
1076       return APInt(BitWidth, 0);
1077     else
1078       return APInt(BitWidth, this->VAL >> shiftAmt);
1079   }
1080
1081   // If all the bits were shifted out, the result is 0. This avoids issues
1082   // with shifting by the size of the integer type, which produces undefined
1083   // results. We define these "undefined results" to always be 0.
1084   if (shiftAmt == BitWidth)
1085     return APInt(BitWidth, 0);
1086
1087   // If none of the bits are shifted out, the result is *this. This avoids
1088   // issues with shifting byt he size of the integer type, which produces
1089   // undefined results in the code below. This is also an optimization.
1090   if (shiftAmt == 0)
1091     return *this;
1092
1093   // Create some space for the result.
1094   uint64_t * val = new uint64_t[getNumWords()];
1095
1096   // If we are shifting less than a word, compute the shift with a simple carry
1097   if (shiftAmt < APINT_BITS_PER_WORD) {
1098     uint64_t carry = 0;
1099     for (int i = getNumWords()-1; i >= 0; --i) {
1100       val[i] = (pVal[i] >> shiftAmt) | carry;
1101       carry = pVal[i] << (APINT_BITS_PER_WORD - shiftAmt);
1102     }
1103     return APInt(val, BitWidth).clearUnusedBits();
1104   }
1105
1106   // Compute some values needed by the remaining shift algorithms
1107   uint32_t wordShift = shiftAmt % APINT_BITS_PER_WORD;
1108   uint32_t offset = shiftAmt / APINT_BITS_PER_WORD;
1109
1110   // If we are shifting whole words, just move whole words
1111   if (wordShift == 0) {
1112     for (uint32_t i = 0; i < getNumWords() - offset; ++i)
1113       val[i] = pVal[i+offset];
1114     for (uint32_t i = getNumWords()-offset; i < getNumWords(); i++)
1115       val[i] = 0;
1116     return APInt(val,BitWidth).clearUnusedBits();
1117   }
1118
1119   // Shift the low order words
1120   uint32_t breakWord = getNumWords() - offset -1;
1121   for (uint32_t i = 0; i < breakWord; ++i)
1122     val[i] = (pVal[i+offset] >> wordShift) |
1123              (pVal[i+offset+1] << (APINT_BITS_PER_WORD - wordShift));
1124   // Shift the break word.
1125   val[breakWord] = pVal[breakWord+offset] >> wordShift;
1126
1127   // Remaining words are 0
1128   for (uint32_t i = breakWord+1; i < getNumWords(); ++i)
1129     val[i] = 0;
1130   return APInt(val, BitWidth).clearUnusedBits();
1131 }
1132
1133 /// Left-shift this APInt by shiftAmt.
1134 /// @brief Left-shift function.
1135 APInt APInt::shl(const APInt &shiftAmt) const {
1136   // It's undefined behavior in C to shift by BitWidth or greater, but
1137   return shl((uint32_t)shiftAmt.getLimitedValue(BitWidth));
1138 }
1139
1140 APInt APInt::shlSlowCase(uint32_t shiftAmt) const {
1141   // If all the bits were shifted out, the result is 0. This avoids issues
1142   // with shifting by the size of the integer type, which produces undefined
1143   // results. We define these "undefined results" to always be 0.
1144   if (shiftAmt == BitWidth)
1145     return APInt(BitWidth, 0);
1146
1147   // If none of the bits are shifted out, the result is *this. This avoids a
1148   // lshr by the words size in the loop below which can produce incorrect
1149   // results. It also avoids the expensive computation below for a common case.
1150   if (shiftAmt == 0)
1151     return *this;
1152
1153   // Create some space for the result.
1154   uint64_t * val = new uint64_t[getNumWords()];
1155
1156   // If we are shifting less than a word, do it the easy way
1157   if (shiftAmt < APINT_BITS_PER_WORD) {
1158     uint64_t carry = 0;
1159     for (uint32_t i = 0; i < getNumWords(); i++) {
1160       val[i] = pVal[i] << shiftAmt | carry;
1161       carry = pVal[i] >> (APINT_BITS_PER_WORD - shiftAmt);
1162     }
1163     return APInt(val, BitWidth).clearUnusedBits();
1164   }
1165
1166   // Compute some values needed by the remaining shift algorithms
1167   uint32_t wordShift = shiftAmt % APINT_BITS_PER_WORD;
1168   uint32_t offset = shiftAmt / APINT_BITS_PER_WORD;
1169
1170   // If we are shifting whole words, just move whole words
1171   if (wordShift == 0) {
1172     for (uint32_t i = 0; i < offset; i++)
1173       val[i] = 0;
1174     for (uint32_t i = offset; i < getNumWords(); i++)
1175       val[i] = pVal[i-offset];
1176     return APInt(val,BitWidth).clearUnusedBits();
1177   }
1178
1179   // Copy whole words from this to Result.
1180   uint32_t i = getNumWords() - 1;
1181   for (; i > offset; --i)
1182     val[i] = pVal[i-offset] << wordShift |
1183              pVal[i-offset-1] >> (APINT_BITS_PER_WORD - wordShift);
1184   val[offset] = pVal[0] << wordShift;
1185   for (i = 0; i < offset; ++i)
1186     val[i] = 0;
1187   return APInt(val, BitWidth).clearUnusedBits();
1188 }
1189
1190 APInt APInt::rotl(const APInt &rotateAmt) const {
1191   return rotl((uint32_t)rotateAmt.getLimitedValue(BitWidth));
1192 }
1193
1194 APInt APInt::rotl(uint32_t rotateAmt) const {
1195   if (rotateAmt == 0)
1196     return *this;
1197   // Don't get too fancy, just use existing shift/or facilities
1198   APInt hi(*this);
1199   APInt lo(*this);
1200   hi.shl(rotateAmt);
1201   lo.lshr(BitWidth - rotateAmt);
1202   return hi | lo;
1203 }
1204
1205 APInt APInt::rotr(const APInt &rotateAmt) const {
1206   return rotr((uint32_t)rotateAmt.getLimitedValue(BitWidth));
1207 }
1208
1209 APInt APInt::rotr(uint32_t rotateAmt) const {
1210   if (rotateAmt == 0)
1211     return *this;
1212   // Don't get too fancy, just use existing shift/or facilities
1213   APInt hi(*this);
1214   APInt lo(*this);
1215   lo.lshr(rotateAmt);
1216   hi.shl(BitWidth - rotateAmt);
1217   return hi | lo;
1218 }
1219
1220 // Square Root - this method computes and returns the square root of "this".
1221 // Three mechanisms are used for computation. For small values (<= 5 bits),
1222 // a table lookup is done. This gets some performance for common cases. For
1223 // values using less than 52 bits, the value is converted to double and then
1224 // the libc sqrt function is called. The result is rounded and then converted
1225 // back to a uint64_t which is then used to construct the result. Finally,
1226 // the Babylonian method for computing square roots is used.
1227 APInt APInt::sqrt() const {
1228
1229   // Determine the magnitude of the value.
1230   uint32_t magnitude = getActiveBits();
1231
1232   // Use a fast table for some small values. This also gets rid of some
1233   // rounding errors in libc sqrt for small values.
1234   if (magnitude <= 5) {
1235     static const uint8_t results[32] = {
1236       /*     0 */ 0,
1237       /*  1- 2 */ 1, 1,
1238       /*  3- 6 */ 2, 2, 2, 2,
1239       /*  7-12 */ 3, 3, 3, 3, 3, 3,
1240       /* 13-20 */ 4, 4, 4, 4, 4, 4, 4, 4,
1241       /* 21-30 */ 5, 5, 5, 5, 5, 5, 5, 5, 5, 5,
1242       /*    31 */ 6
1243     };
1244     return APInt(BitWidth, results[ (isSingleWord() ? VAL : pVal[0]) ]);
1245   }
1246
1247   // If the magnitude of the value fits in less than 52 bits (the precision of
1248   // an IEEE double precision floating point value), then we can use the
1249   // libc sqrt function which will probably use a hardware sqrt computation.
1250   // This should be faster than the algorithm below.
1251   if (magnitude < 52) {
1252 #ifdef _MSC_VER
1253     // Amazingly, VC++ doesn't have round().
1254     return APInt(BitWidth,
1255                  uint64_t(::sqrt(double(isSingleWord()?VAL:pVal[0]))) + 0.5);
1256 #else
1257     return APInt(BitWidth,
1258                  uint64_t(::round(::sqrt(double(isSingleWord()?VAL:pVal[0])))));
1259 #endif
1260   }
1261
1262   // Okay, all the short cuts are exhausted. We must compute it. The following
1263   // is a classical Babylonian method for computing the square root. This code
1264   // was adapted to APINt from a wikipedia article on such computations.
1265   // See http://www.wikipedia.org/ and go to the page named
1266   // Calculate_an_integer_square_root.
1267   uint32_t nbits = BitWidth, i = 4;
1268   APInt testy(BitWidth, 16);
1269   APInt x_old(BitWidth, 1);
1270   APInt x_new(BitWidth, 0);
1271   APInt two(BitWidth, 2);
1272
1273   // Select a good starting value using binary logarithms.
1274   for (;; i += 2, testy = testy.shl(2))
1275     if (i >= nbits || this->ule(testy)) {
1276       x_old = x_old.shl(i / 2);
1277       break;
1278     }
1279
1280   // Use the Babylonian method to arrive at the integer square root:
1281   for (;;) {
1282     x_new = (this->udiv(x_old) + x_old).udiv(two);
1283     if (x_old.ule(x_new))
1284       break;
1285     x_old = x_new;
1286   }
1287
1288   // Make sure we return the closest approximation
1289   // NOTE: The rounding calculation below is correct. It will produce an
1290   // off-by-one discrepancy with results from pari/gp. That discrepancy has been
1291   // determined to be a rounding issue with pari/gp as it begins to use a
1292   // floating point representation after 192 bits. There are no discrepancies
1293   // between this algorithm and pari/gp for bit widths < 192 bits.
1294   APInt square(x_old * x_old);
1295   APInt nextSquare((x_old + 1) * (x_old +1));
1296   if (this->ult(square))
1297     return x_old;
1298   else if (this->ule(nextSquare)) {
1299     APInt midpoint((nextSquare - square).udiv(two));
1300     APInt offset(*this - square);
1301     if (offset.ult(midpoint))
1302       return x_old;
1303     else
1304       return x_old + 1;
1305   } else
1306     assert(0 && "Error in APInt::sqrt computation");
1307   return x_old + 1;
1308 }
1309
1310 /// Computes the multiplicative inverse of this APInt for a given modulo. The
1311 /// iterative extended Euclidean algorithm is used to solve for this value,
1312 /// however we simplify it to speed up calculating only the inverse, and take
1313 /// advantage of div+rem calculations. We also use some tricks to avoid copying
1314 /// (potentially large) APInts around.
1315 APInt APInt::multiplicativeInverse(const APInt& modulo) const {
1316   assert(ult(modulo) && "This APInt must be smaller than the modulo");
1317
1318   // Using the properties listed at the following web page (accessed 06/21/08):
1319   //   http://www.numbertheory.org/php/euclid.html
1320   // (especially the properties numbered 3, 4 and 9) it can be proved that
1321   // BitWidth bits suffice for all the computations in the algorithm implemented
1322   // below. More precisely, this number of bits suffice if the multiplicative
1323   // inverse exists, but may not suffice for the general extended Euclidean
1324   // algorithm.
1325
1326   APInt r[2] = { modulo, *this };
1327   APInt t[2] = { APInt(BitWidth, 0), APInt(BitWidth, 1) };
1328   APInt q(BitWidth, 0);
1329
1330   unsigned i;
1331   for (i = 0; r[i^1] != 0; i ^= 1) {
1332     // An overview of the math without the confusing bit-flipping:
1333     // q = r[i-2] / r[i-1]
1334     // r[i] = r[i-2] % r[i-1]
1335     // t[i] = t[i-2] - t[i-1] * q
1336     udivrem(r[i], r[i^1], q, r[i]);
1337     t[i] -= t[i^1] * q;
1338   }
1339
1340   // If this APInt and the modulo are not coprime, there is no multiplicative
1341   // inverse, so return 0. We check this by looking at the next-to-last
1342   // remainder, which is the gcd(*this,modulo) as calculated by the Euclidean
1343   // algorithm.
1344   if (r[i] != 1)
1345     return APInt(BitWidth, 0);
1346
1347   // The next-to-last t is the multiplicative inverse.  However, we are
1348   // interested in a positive inverse. Calcuate a positive one from a negative
1349   // one if necessary. A simple addition of the modulo suffices because
1350   // abs(t[i]) is known to be less than *this/2 (see the link above).
1351   return t[i].isNegative() ? t[i] + modulo : t[i];
1352 }
1353
1354 /// Implementation of Knuth's Algorithm D (Division of nonnegative integers)
1355 /// from "Art of Computer Programming, Volume 2", section 4.3.1, p. 272. The
1356 /// variables here have the same names as in the algorithm. Comments explain
1357 /// the algorithm and any deviation from it.
1358 static void KnuthDiv(uint32_t *u, uint32_t *v, uint32_t *q, uint32_t* r,
1359                      uint32_t m, uint32_t n) {
1360   assert(u && "Must provide dividend");
1361   assert(v && "Must provide divisor");
1362   assert(q && "Must provide quotient");
1363   assert(u != v && u != q && v != q && "Must us different memory");
1364   assert(n>1 && "n must be > 1");
1365
1366   // Knuth uses the value b as the base of the number system. In our case b
1367   // is 2^31 so we just set it to -1u.
1368   uint64_t b = uint64_t(1) << 32;
1369
1370 #if 0
1371   DEBUG(cerr << "KnuthDiv: m=" << m << " n=" << n << '\n');
1372   DEBUG(cerr << "KnuthDiv: original:");
1373   DEBUG(for (int i = m+n; i >=0; i--) cerr << " " << std::setbase(16) << u[i]);
1374   DEBUG(cerr << " by");
1375   DEBUG(for (int i = n; i >0; i--) cerr << " " << std::setbase(16) << v[i-1]);
1376   DEBUG(cerr << '\n');
1377 #endif
1378   // D1. [Normalize.] Set d = b / (v[n-1] + 1) and multiply all the digits of
1379   // u and v by d. Note that we have taken Knuth's advice here to use a power
1380   // of 2 value for d such that d * v[n-1] >= b/2 (b is the base). A power of
1381   // 2 allows us to shift instead of multiply and it is easy to determine the
1382   // shift amount from the leading zeros.  We are basically normalizing the u
1383   // and v so that its high bits are shifted to the top of v's range without
1384   // overflow. Note that this can require an extra word in u so that u must
1385   // be of length m+n+1.
1386   uint32_t shift = CountLeadingZeros_32(v[n-1]);
1387   uint32_t v_carry = 0;
1388   uint32_t u_carry = 0;
1389   if (shift) {
1390     for (uint32_t i = 0; i < m+n; ++i) {
1391       uint32_t u_tmp = u[i] >> (32 - shift);
1392       u[i] = (u[i] << shift) | u_carry;
1393       u_carry = u_tmp;
1394     }
1395     for (uint32_t i = 0; i < n; ++i) {
1396       uint32_t v_tmp = v[i] >> (32 - shift);
1397       v[i] = (v[i] << shift) | v_carry;
1398       v_carry = v_tmp;
1399     }
1400   }
1401   u[m+n] = u_carry;
1402 #if 0
1403   DEBUG(cerr << "KnuthDiv:   normal:");
1404   DEBUG(for (int i = m+n; i >=0; i--) cerr << " " << std::setbase(16) << u[i]);
1405   DEBUG(cerr << " by");
1406   DEBUG(for (int i = n; i >0; i--) cerr << " " << std::setbase(16) << v[i-1]);
1407   DEBUG(cerr << '\n');
1408 #endif
1409
1410   // D2. [Initialize j.]  Set j to m. This is the loop counter over the places.
1411   int j = m;
1412   do {
1413     DEBUG(cerr << "KnuthDiv: quotient digit #" << j << '\n');
1414     // D3. [Calculate q'.].
1415     //     Set qp = (u[j+n]*b + u[j+n-1]) / v[n-1]. (qp=qprime=q')
1416     //     Set rp = (u[j+n]*b + u[j+n-1]) % v[n-1]. (rp=rprime=r')
1417     // Now test if qp == b or qp*v[n-2] > b*rp + u[j+n-2]; if so, decrease
1418     // qp by 1, inrease rp by v[n-1], and repeat this test if rp < b. The test
1419     // on v[n-2] determines at high speed most of the cases in which the trial
1420     // value qp is one too large, and it eliminates all cases where qp is two
1421     // too large.
1422     uint64_t dividend = ((uint64_t(u[j+n]) << 32) + u[j+n-1]);
1423     DEBUG(cerr << "KnuthDiv: dividend == " << dividend << '\n');
1424     uint64_t qp = dividend / v[n-1];
1425     uint64_t rp = dividend % v[n-1];
1426     if (qp == b || qp*v[n-2] > b*rp + u[j+n-2]) {
1427       qp--;
1428       rp += v[n-1];
1429       if (rp < b && (qp == b || qp*v[n-2] > b*rp + u[j+n-2]))
1430         qp--;
1431     }
1432     DEBUG(cerr << "KnuthDiv: qp == " << qp << ", rp == " << rp << '\n');
1433
1434     // D4. [Multiply and subtract.] Replace (u[j+n]u[j+n-1]...u[j]) with
1435     // (u[j+n]u[j+n-1]..u[j]) - qp * (v[n-1]...v[1]v[0]). This computation
1436     // consists of a simple multiplication by a one-place number, combined with
1437     // a subtraction.
1438     bool isNeg = false;
1439     for (uint32_t i = 0; i < n; ++i) {
1440       uint64_t u_tmp = uint64_t(u[j+i]) | (uint64_t(u[j+i+1]) << 32);
1441       uint64_t subtrahend = uint64_t(qp) * uint64_t(v[i]);
1442       bool borrow = subtrahend > u_tmp;
1443       DEBUG(cerr << "KnuthDiv: u_tmp == " << u_tmp
1444                  << ", subtrahend == " << subtrahend
1445                  << ", borrow = " << borrow << '\n');
1446
1447       uint64_t result = u_tmp - subtrahend;
1448       uint32_t k = j + i;
1449       u[k++] = (uint32_t)(result & (b-1)); // subtract low word
1450       u[k++] = (uint32_t)(result >> 32);   // subtract high word
1451       while (borrow && k <= m+n) { // deal with borrow to the left
1452         borrow = u[k] == 0;
1453         u[k]--;
1454         k++;
1455       }
1456       isNeg |= borrow;
1457       DEBUG(cerr << "KnuthDiv: u[j+i] == " << u[j+i] << ",  u[j+i+1] == " <<
1458                     u[j+i+1] << '\n');
1459     }
1460     DEBUG(cerr << "KnuthDiv: after subtraction:");
1461     DEBUG(for (int i = m+n; i >=0; i--) cerr << " " << u[i]);
1462     DEBUG(cerr << '\n');
1463     // The digits (u[j+n]...u[j]) should be kept positive; if the result of
1464     // this step is actually negative, (u[j+n]...u[j]) should be left as the
1465     // true value plus b**(n+1), namely as the b's complement of
1466     // the true value, and a "borrow" to the left should be remembered.
1467     //
1468     if (isNeg) {
1469       bool carry = true;  // true because b's complement is "complement + 1"
1470       for (uint32_t i = 0; i <= m+n; ++i) {
1471         u[i] = ~u[i] + carry; // b's complement
1472         carry = carry && u[i] == 0;
1473       }
1474     }
1475     DEBUG(cerr << "KnuthDiv: after complement:");
1476     DEBUG(for (int i = m+n; i >=0; i--) cerr << " " << u[i]);
1477     DEBUG(cerr << '\n');
1478
1479     // D5. [Test remainder.] Set q[j] = qp. If the result of step D4 was
1480     // negative, go to step D6; otherwise go on to step D7.
1481     q[j] = (uint32_t)qp;
1482     if (isNeg) {
1483       // D6. [Add back]. The probability that this step is necessary is very
1484       // small, on the order of only 2/b. Make sure that test data accounts for
1485       // this possibility. Decrease q[j] by 1
1486       q[j]--;
1487       // and add (0v[n-1]...v[1]v[0]) to (u[j+n]u[j+n-1]...u[j+1]u[j]).
1488       // A carry will occur to the left of u[j+n], and it should be ignored
1489       // since it cancels with the borrow that occurred in D4.
1490       bool carry = false;
1491       for (uint32_t i = 0; i < n; i++) {
1492         uint32_t limit = std::min(u[j+i],v[i]);
1493         u[j+i] += v[i] + carry;
1494         carry = u[j+i] < limit || (carry && u[j+i] == limit);
1495       }
1496       u[j+n] += carry;
1497     }
1498     DEBUG(cerr << "KnuthDiv: after correction:");
1499     DEBUG(for (int i = m+n; i >=0; i--) cerr <<" " << u[i]);
1500     DEBUG(cerr << "\nKnuthDiv: digit result = " << q[j] << '\n');
1501
1502   // D7. [Loop on j.]  Decrease j by one. Now if j >= 0, go back to D3.
1503   } while (--j >= 0);
1504
1505   DEBUG(cerr << "KnuthDiv: quotient:");
1506   DEBUG(for (int i = m; i >=0; i--) cerr <<" " << q[i]);
1507   DEBUG(cerr << '\n');
1508
1509   // D8. [Unnormalize]. Now q[...] is the desired quotient, and the desired
1510   // remainder may be obtained by dividing u[...] by d. If r is non-null we
1511   // compute the remainder (urem uses this).
1512   if (r) {
1513     // The value d is expressed by the "shift" value above since we avoided
1514     // multiplication by d by using a shift left. So, all we have to do is
1515     // shift right here. In order to mak
1516     if (shift) {
1517       uint32_t carry = 0;
1518       DEBUG(cerr << "KnuthDiv: remainder:");
1519       for (int i = n-1; i >= 0; i--) {
1520         r[i] = (u[i] >> shift) | carry;
1521         carry = u[i] << (32 - shift);
1522         DEBUG(cerr << " " << r[i]);
1523       }
1524     } else {
1525       for (int i = n-1; i >= 0; i--) {
1526         r[i] = u[i];
1527         DEBUG(cerr << " " << r[i]);
1528       }
1529     }
1530     DEBUG(cerr << '\n');
1531   }
1532 #if 0
1533   DEBUG(cerr << std::setbase(10) << '\n');
1534 #endif
1535 }
1536
1537 void APInt::divide(const APInt LHS, uint32_t lhsWords,
1538                    const APInt &RHS, uint32_t rhsWords,
1539                    APInt *Quotient, APInt *Remainder)
1540 {
1541   assert(lhsWords >= rhsWords && "Fractional result");
1542
1543   // First, compose the values into an array of 32-bit words instead of
1544   // 64-bit words. This is a necessity of both the "short division" algorithm
1545   // and the the Knuth "classical algorithm" which requires there to be native
1546   // operations for +, -, and * on an m bit value with an m*2 bit result. We
1547   // can't use 64-bit operands here because we don't have native results of
1548   // 128-bits. Furthremore, casting the 64-bit values to 32-bit values won't
1549   // work on large-endian machines.
1550   uint64_t mask = ~0ull >> (sizeof(uint32_t)*8);
1551   uint32_t n = rhsWords * 2;
1552   uint32_t m = (lhsWords * 2) - n;
1553
1554   // Allocate space for the temporary values we need either on the stack, if
1555   // it will fit, or on the heap if it won't.
1556   uint32_t SPACE[128];
1557   uint32_t *U = 0;
1558   uint32_t *V = 0;
1559   uint32_t *Q = 0;
1560   uint32_t *R = 0;
1561   if ((Remainder?4:3)*n+2*m+1 <= 128) {
1562     U = &SPACE[0];
1563     V = &SPACE[m+n+1];
1564     Q = &SPACE[(m+n+1) + n];
1565     if (Remainder)
1566       R = &SPACE[(m+n+1) + n + (m+n)];
1567   } else {
1568     U = new uint32_t[m + n + 1];
1569     V = new uint32_t[n];
1570     Q = new uint32_t[m+n];
1571     if (Remainder)
1572       R = new uint32_t[n];
1573   }
1574
1575   // Initialize the dividend
1576   memset(U, 0, (m+n+1)*sizeof(uint32_t));
1577   for (unsigned i = 0; i < lhsWords; ++i) {
1578     uint64_t tmp = (LHS.getNumWords() == 1 ? LHS.VAL : LHS.pVal[i]);
1579     U[i * 2] = (uint32_t)(tmp & mask);
1580     U[i * 2 + 1] = (uint32_t)(tmp >> (sizeof(uint32_t)*8));
1581   }
1582   U[m+n] = 0; // this extra word is for "spill" in the Knuth algorithm.
1583
1584   // Initialize the divisor
1585   memset(V, 0, (n)*sizeof(uint32_t));
1586   for (unsigned i = 0; i < rhsWords; ++i) {
1587     uint64_t tmp = (RHS.getNumWords() == 1 ? RHS.VAL : RHS.pVal[i]);
1588     V[i * 2] = (uint32_t)(tmp & mask);
1589     V[i * 2 + 1] = (uint32_t)(tmp >> (sizeof(uint32_t)*8));
1590   }
1591
1592   // initialize the quotient and remainder
1593   memset(Q, 0, (m+n) * sizeof(uint32_t));
1594   if (Remainder)
1595     memset(R, 0, n * sizeof(uint32_t));
1596
1597   // Now, adjust m and n for the Knuth division. n is the number of words in
1598   // the divisor. m is the number of words by which the dividend exceeds the
1599   // divisor (i.e. m+n is the length of the dividend). These sizes must not
1600   // contain any zero words or the Knuth algorithm fails.
1601   for (unsigned i = n; i > 0 && V[i-1] == 0; i--) {
1602     n--;
1603     m++;
1604   }
1605   for (unsigned i = m+n; i > 0 && U[i-1] == 0; i--)
1606     m--;
1607
1608   // If we're left with only a single word for the divisor, Knuth doesn't work
1609   // so we implement the short division algorithm here. This is much simpler
1610   // and faster because we are certain that we can divide a 64-bit quantity
1611   // by a 32-bit quantity at hardware speed and short division is simply a
1612   // series of such operations. This is just like doing short division but we
1613   // are using base 2^32 instead of base 10.
1614   assert(n != 0 && "Divide by zero?");
1615   if (n == 1) {
1616     uint32_t divisor = V[0];
1617     uint32_t remainder = 0;
1618     for (int i = m+n-1; i >= 0; i--) {
1619       uint64_t partial_dividend = uint64_t(remainder) << 32 | U[i];
1620       if (partial_dividend == 0) {
1621         Q[i] = 0;
1622         remainder = 0;
1623       } else if (partial_dividend < divisor) {
1624         Q[i] = 0;
1625         remainder = (uint32_t)partial_dividend;
1626       } else if (partial_dividend == divisor) {
1627         Q[i] = 1;
1628         remainder = 0;
1629       } else {
1630         Q[i] = (uint32_t)(partial_dividend / divisor);
1631         remainder = (uint32_t)(partial_dividend - (Q[i] * divisor));
1632       }
1633     }
1634     if (R)
1635       R[0] = remainder;
1636   } else {
1637     // Now we're ready to invoke the Knuth classical divide algorithm. In this
1638     // case n > 1.
1639     KnuthDiv(U, V, Q, R, m, n);
1640   }
1641
1642   // If the caller wants the quotient
1643   if (Quotient) {
1644     // Set up the Quotient value's memory.
1645     if (Quotient->BitWidth != LHS.BitWidth) {
1646       if (Quotient->isSingleWord())
1647         Quotient->VAL = 0;
1648       else
1649         delete [] Quotient->pVal;
1650       Quotient->BitWidth = LHS.BitWidth;
1651       if (!Quotient->isSingleWord())
1652         Quotient->pVal = getClearedMemory(Quotient->getNumWords());
1653     } else
1654       Quotient->clear();
1655
1656     // The quotient is in Q. Reconstitute the quotient into Quotient's low
1657     // order words.
1658     if (lhsWords == 1) {
1659       uint64_t tmp =
1660         uint64_t(Q[0]) | (uint64_t(Q[1]) << (APINT_BITS_PER_WORD / 2));
1661       if (Quotient->isSingleWord())
1662         Quotient->VAL = tmp;
1663       else
1664         Quotient->pVal[0] = tmp;
1665     } else {
1666       assert(!Quotient->isSingleWord() && "Quotient APInt not large enough");
1667       for (unsigned i = 0; i < lhsWords; ++i)
1668         Quotient->pVal[i] =
1669           uint64_t(Q[i*2]) | (uint64_t(Q[i*2+1]) << (APINT_BITS_PER_WORD / 2));
1670     }
1671   }
1672
1673   // If the caller wants the remainder
1674   if (Remainder) {
1675     // Set up the Remainder value's memory.
1676     if (Remainder->BitWidth != RHS.BitWidth) {
1677       if (Remainder->isSingleWord())
1678         Remainder->VAL = 0;
1679       else
1680         delete [] Remainder->pVal;
1681       Remainder->BitWidth = RHS.BitWidth;
1682       if (!Remainder->isSingleWord())
1683         Remainder->pVal = getClearedMemory(Remainder->getNumWords());
1684     } else
1685       Remainder->clear();
1686
1687     // The remainder is in R. Reconstitute the remainder into Remainder's low
1688     // order words.
1689     if (rhsWords == 1) {
1690       uint64_t tmp =
1691         uint64_t(R[0]) | (uint64_t(R[1]) << (APINT_BITS_PER_WORD / 2));
1692       if (Remainder->isSingleWord())
1693         Remainder->VAL = tmp;
1694       else
1695         Remainder->pVal[0] = tmp;
1696     } else {
1697       assert(!Remainder->isSingleWord() && "Remainder APInt not large enough");
1698       for (unsigned i = 0; i < rhsWords; ++i)
1699         Remainder->pVal[i] =
1700           uint64_t(R[i*2]) | (uint64_t(R[i*2+1]) << (APINT_BITS_PER_WORD / 2));
1701     }
1702   }
1703
1704   // Clean up the memory we allocated.
1705   if (U != &SPACE[0]) {
1706     delete [] U;
1707     delete [] V;
1708     delete [] Q;
1709     delete [] R;
1710   }
1711 }
1712
1713 APInt APInt::udiv(const APInt& RHS) const {
1714   assert(BitWidth == RHS.BitWidth && "Bit widths must be the same");
1715
1716   // First, deal with the easy case
1717   if (isSingleWord()) {
1718     assert(RHS.VAL != 0 && "Divide by zero?");
1719     return APInt(BitWidth, VAL / RHS.VAL);
1720   }
1721
1722   // Get some facts about the LHS and RHS number of bits and words
1723   uint32_t rhsBits = RHS.getActiveBits();
1724   uint32_t rhsWords = !rhsBits ? 0 : (APInt::whichWord(rhsBits - 1) + 1);
1725   assert(rhsWords && "Divided by zero???");
1726   uint32_t lhsBits = this->getActiveBits();
1727   uint32_t lhsWords = !lhsBits ? 0 : (APInt::whichWord(lhsBits - 1) + 1);
1728
1729   // Deal with some degenerate cases
1730   if (!lhsWords)
1731     // 0 / X ===> 0
1732     return APInt(BitWidth, 0);
1733   else if (lhsWords < rhsWords || this->ult(RHS)) {
1734     // X / Y ===> 0, iff X < Y
1735     return APInt(BitWidth, 0);
1736   } else if (*this == RHS) {
1737     // X / X ===> 1
1738     return APInt(BitWidth, 1);
1739   } else if (lhsWords == 1 && rhsWords == 1) {
1740     // All high words are zero, just use native divide
1741     return APInt(BitWidth, this->pVal[0] / RHS.pVal[0]);
1742   }
1743
1744   // We have to compute it the hard way. Invoke the Knuth divide algorithm.
1745   APInt Quotient(1,0); // to hold result.
1746   divide(*this, lhsWords, RHS, rhsWords, &Quotient, 0);
1747   return Quotient;
1748 }
1749
1750 APInt APInt::urem(const APInt& RHS) const {
1751   assert(BitWidth == RHS.BitWidth && "Bit widths must be the same");
1752   if (isSingleWord()) {
1753     assert(RHS.VAL != 0 && "Remainder by zero?");
1754     return APInt(BitWidth, VAL % RHS.VAL);
1755   }
1756
1757   // Get some facts about the LHS
1758   uint32_t lhsBits = getActiveBits();
1759   uint32_t lhsWords = !lhsBits ? 0 : (whichWord(lhsBits - 1) + 1);
1760
1761   // Get some facts about the RHS
1762   uint32_t rhsBits = RHS.getActiveBits();
1763   uint32_t rhsWords = !rhsBits ? 0 : (APInt::whichWord(rhsBits - 1) + 1);
1764   assert(rhsWords && "Performing remainder operation by zero ???");
1765
1766   // Check the degenerate cases
1767   if (lhsWords == 0) {
1768     // 0 % Y ===> 0
1769     return APInt(BitWidth, 0);
1770   } else if (lhsWords < rhsWords || this->ult(RHS)) {
1771     // X % Y ===> X, iff X < Y
1772     return *this;
1773   } else if (*this == RHS) {
1774     // X % X == 0;
1775     return APInt(BitWidth, 0);
1776   } else if (lhsWords == 1) {
1777     // All high words are zero, just use native remainder
1778     return APInt(BitWidth, pVal[0] % RHS.pVal[0]);
1779   }
1780
1781   // We have to compute it the hard way. Invoke the Knuth divide algorithm.
1782   APInt Remainder(1,0);
1783   divide(*this, lhsWords, RHS, rhsWords, 0, &Remainder);
1784   return Remainder;
1785 }
1786
1787 void APInt::udivrem(const APInt &LHS, const APInt &RHS,
1788                     APInt &Quotient, APInt &Remainder) {
1789   // Get some size facts about the dividend and divisor
1790   uint32_t lhsBits  = LHS.getActiveBits();
1791   uint32_t lhsWords = !lhsBits ? 0 : (APInt::whichWord(lhsBits - 1) + 1);
1792   uint32_t rhsBits  = RHS.getActiveBits();
1793   uint32_t rhsWords = !rhsBits ? 0 : (APInt::whichWord(rhsBits - 1) + 1);
1794
1795   // Check the degenerate cases
1796   if (lhsWords == 0) {
1797     Quotient = 0;                // 0 / Y ===> 0
1798     Remainder = 0;               // 0 % Y ===> 0
1799     return;
1800   }
1801
1802   if (lhsWords < rhsWords || LHS.ult(RHS)) {
1803     Quotient = 0;               // X / Y ===> 0, iff X < Y
1804     Remainder = LHS;            // X % Y ===> X, iff X < Y
1805     return;
1806   }
1807
1808   if (LHS == RHS) {
1809     Quotient  = 1;              // X / X ===> 1
1810     Remainder = 0;              // X % X ===> 0;
1811     return;
1812   }
1813
1814   if (lhsWords == 1 && rhsWords == 1) {
1815     // There is only one word to consider so use the native versions.
1816     uint64_t lhsValue = LHS.isSingleWord() ? LHS.VAL : LHS.pVal[0];
1817     uint64_t rhsValue = RHS.isSingleWord() ? RHS.VAL : RHS.pVal[0];
1818     Quotient = APInt(LHS.getBitWidth(), lhsValue / rhsValue);
1819     Remainder = APInt(LHS.getBitWidth(), lhsValue % rhsValue);
1820     return;
1821   }
1822
1823   // Okay, lets do it the long way
1824   divide(LHS, lhsWords, RHS, rhsWords, &Quotient, &Remainder);
1825 }
1826
1827 void APInt::fromString(uint32_t numbits, const char *str, uint32_t slen,
1828                        uint8_t radix) {
1829   // Check our assumptions here
1830   assert((radix == 10 || radix == 8 || radix == 16 || radix == 2) &&
1831          "Radix should be 2, 8, 10, or 16!");
1832   assert(str && "String is null?");
1833   bool isNeg = str[0] == '-';
1834   if (isNeg)
1835     str++, slen--;
1836   assert((slen <= numbits || radix != 2) && "Insufficient bit width");
1837   assert((slen*3 <= numbits || radix != 8) && "Insufficient bit width");
1838   assert((slen*4 <= numbits || radix != 16) && "Insufficient bit width");
1839   assert(((slen*64)/22 <= numbits || radix != 10) && "Insufficient bit width");
1840
1841   // Allocate memory
1842   if (!isSingleWord())
1843     pVal = getClearedMemory(getNumWords());
1844
1845   // Figure out if we can shift instead of multiply
1846   uint32_t shift = (radix == 16 ? 4 : radix == 8 ? 3 : radix == 2 ? 1 : 0);
1847
1848   // Set up an APInt for the digit to add outside the loop so we don't
1849   // constantly construct/destruct it.
1850   APInt apdigit(getBitWidth(), 0);
1851   APInt apradix(getBitWidth(), radix);
1852
1853   // Enter digit traversal loop
1854   for (unsigned i = 0; i < slen; i++) {
1855     // Get a digit
1856     uint32_t digit = 0;
1857     char cdigit = str[i];
1858     if (radix == 16) {
1859       if (!isxdigit(cdigit))
1860         assert(0 && "Invalid hex digit in string");
1861       if (isdigit(cdigit))
1862         digit = cdigit - '0';
1863       else if (cdigit >= 'a')
1864         digit = cdigit - 'a' + 10;
1865       else if (cdigit >= 'A')
1866         digit = cdigit - 'A' + 10;
1867       else
1868         assert(0 && "huh? we shouldn't get here");
1869     } else if (isdigit(cdigit)) {
1870       digit = cdigit - '0';
1871       assert((radix == 10 ||
1872               (radix == 8 && digit != 8 && digit != 9) ||
1873               (radix == 2 && (digit == 0 || digit == 1))) &&
1874              "Invalid digit in string for given radix");
1875     } else {
1876       assert(0 && "Invalid character in digit string");
1877     }
1878
1879     // Shift or multiply the value by the radix
1880     if (shift)
1881       *this <<= shift;
1882     else
1883       *this *= apradix;
1884
1885     // Add in the digit we just interpreted
1886     if (apdigit.isSingleWord())
1887       apdigit.VAL = digit;
1888     else
1889       apdigit.pVal[0] = digit;
1890     *this += apdigit;
1891   }
1892   // If its negative, put it in two's complement form
1893   if (isNeg) {
1894     (*this)--;
1895     this->flip();
1896   }
1897 }
1898
1899 void APInt::toString(SmallVectorImpl<char> &Str, unsigned Radix,
1900                      bool Signed) const {
1901   assert((Radix == 10 || Radix == 8 || Radix == 16 || Radix == 2) &&
1902          "Radix should be 2, 8, 10, or 16!");
1903
1904   // First, check for a zero value and just short circuit the logic below.
1905   if (*this == 0) {
1906     Str.push_back('0');
1907     return;
1908   }
1909
1910   static const char Digits[] = "0123456789ABCDEF";
1911
1912   if (isSingleWord()) {
1913     char Buffer[65];
1914     char *BufPtr = Buffer+65;
1915
1916     uint64_t N;
1917     if (Signed) {
1918       int64_t I = getSExtValue();
1919       if (I < 0) {
1920         Str.push_back('-');
1921         I = -I;
1922       }
1923       N = I;
1924     } else {
1925       N = getZExtValue();
1926     }
1927
1928     while (N) {
1929       *--BufPtr = Digits[N % Radix];
1930       N /= Radix;
1931     }
1932     Str.append(BufPtr, Buffer+65);
1933     return;
1934   }
1935
1936   APInt Tmp(*this);
1937
1938   if (Signed && isNegative()) {
1939     // They want to print the signed version and it is a negative value
1940     // Flip the bits and add one to turn it into the equivalent positive
1941     // value and put a '-' in the result.
1942     Tmp.flip();
1943     Tmp++;
1944     Str.push_back('-');
1945   }
1946
1947   // We insert the digits backward, then reverse them to get the right order.
1948   unsigned StartDig = Str.size();
1949
1950   // For the 2, 8 and 16 bit cases, we can just shift instead of divide
1951   // because the number of bits per digit (1, 3 and 4 respectively) divides
1952   // equaly.  We just shift until the value is zero.
1953   if (Radix != 10) {
1954     // Just shift tmp right for each digit width until it becomes zero
1955     unsigned ShiftAmt = (Radix == 16 ? 4 : (Radix == 8 ? 3 : 1));
1956     unsigned MaskAmt = Radix - 1;
1957
1958     while (Tmp != 0) {
1959       unsigned Digit = unsigned(Tmp.getRawData()[0]) & MaskAmt;
1960       Str.push_back(Digits[Digit]);
1961       Tmp = Tmp.lshr(ShiftAmt);
1962     }
1963   } else {
1964     APInt divisor(4, 10);
1965     while (Tmp != 0) {
1966       APInt APdigit(1, 0);
1967       APInt tmp2(Tmp.getBitWidth(), 0);
1968       divide(Tmp, Tmp.getNumWords(), divisor, divisor.getNumWords(), &tmp2,
1969              &APdigit);
1970       uint32_t Digit = (uint32_t)APdigit.getZExtValue();
1971       assert(Digit < Radix && "divide failed");
1972       Str.push_back(Digits[Digit]);
1973       Tmp = tmp2;
1974     }
1975   }
1976
1977   // Reverse the digits before returning.
1978   std::reverse(Str.begin()+StartDig, Str.end());
1979 }
1980
1981 /// toString - This returns the APInt as a std::string.  Note that this is an
1982 /// inefficient method.  It is better to pass in a SmallVector/SmallString
1983 /// to the methods above.
1984 std::string APInt::toString(unsigned Radix = 10, bool Signed = true) const {
1985   SmallString<40> S;
1986   toString(S, Radix, Signed);
1987   return S.c_str();
1988 }
1989
1990
1991 void APInt::dump() const {
1992   SmallString<40> S, U;
1993   this->toStringUnsigned(U);
1994   this->toStringSigned(S);
1995   fprintf(stderr, "APInt(%db, %su %ss)", BitWidth, U.c_str(), S.c_str());
1996 }
1997
1998 void APInt::print(std::ostream &OS, bool isSigned) const {
1999   SmallString<40> S;
2000   this->toString(S, 10, isSigned);
2001   OS << S.c_str();
2002 }
2003
2004
2005 // This implements a variety of operations on a representation of
2006 // arbitrary precision, two's-complement, bignum integer values.
2007
2008 /* Assumed by lowHalf, highHalf, partMSB and partLSB.  A fairly safe
2009    and unrestricting assumption.  */
2010 #define COMPILE_TIME_ASSERT(cond) extern int CTAssert[(cond) ? 1 : -1]
2011 COMPILE_TIME_ASSERT(integerPartWidth % 2 == 0);
2012
2013 /* Some handy functions local to this file.  */
2014 namespace {
2015
2016   /* Returns the integer part with the least significant BITS set.
2017      BITS cannot be zero.  */
2018   static inline integerPart
2019   lowBitMask(unsigned int bits)
2020   {
2021     assert (bits != 0 && bits <= integerPartWidth);
2022
2023     return ~(integerPart) 0 >> (integerPartWidth - bits);
2024   }
2025
2026   /* Returns the value of the lower half of PART.  */
2027   static inline integerPart
2028   lowHalf(integerPart part)
2029   {
2030     return part & lowBitMask(integerPartWidth / 2);
2031   }
2032
2033   /* Returns the value of the upper half of PART.  */
2034   static inline integerPart
2035   highHalf(integerPart part)
2036   {
2037     return part >> (integerPartWidth / 2);
2038   }
2039
2040   /* Returns the bit number of the most significant set bit of a part.
2041      If the input number has no bits set -1U is returned.  */
2042   static unsigned int
2043   partMSB(integerPart value)
2044   {
2045     unsigned int n, msb;
2046
2047     if (value == 0)
2048       return -1U;
2049
2050     n = integerPartWidth / 2;
2051
2052     msb = 0;
2053     do {
2054       if (value >> n) {
2055         value >>= n;
2056         msb += n;
2057       }
2058
2059       n >>= 1;
2060     } while (n);
2061
2062     return msb;
2063   }
2064
2065   /* Returns the bit number of the least significant set bit of a
2066      part.  If the input number has no bits set -1U is returned.  */
2067   static unsigned int
2068   partLSB(integerPart value)
2069   {
2070     unsigned int n, lsb;
2071
2072     if (value == 0)
2073       return -1U;
2074
2075     lsb = integerPartWidth - 1;
2076     n = integerPartWidth / 2;
2077
2078     do {
2079       if (value << n) {
2080         value <<= n;
2081         lsb -= n;
2082       }
2083
2084       n >>= 1;
2085     } while (n);
2086
2087     return lsb;
2088   }
2089 }
2090
2091 /* Sets the least significant part of a bignum to the input value, and
2092    zeroes out higher parts.  */
2093 void
2094 APInt::tcSet(integerPart *dst, integerPart part, unsigned int parts)
2095 {
2096   unsigned int i;
2097
2098   assert (parts > 0);
2099
2100   dst[0] = part;
2101   for(i = 1; i < parts; i++)
2102     dst[i] = 0;
2103 }
2104
2105 /* Assign one bignum to another.  */
2106 void
2107 APInt::tcAssign(integerPart *dst, const integerPart *src, unsigned int parts)
2108 {
2109   unsigned int i;
2110
2111   for(i = 0; i < parts; i++)
2112     dst[i] = src[i];
2113 }
2114
2115 /* Returns true if a bignum is zero, false otherwise.  */
2116 bool
2117 APInt::tcIsZero(const integerPart *src, unsigned int parts)
2118 {
2119   unsigned int i;
2120
2121   for(i = 0; i < parts; i++)
2122     if (src[i])
2123       return false;
2124
2125   return true;
2126 }
2127
2128 /* Extract the given bit of a bignum; returns 0 or 1.  */
2129 int
2130 APInt::tcExtractBit(const integerPart *parts, unsigned int bit)
2131 {
2132   return(parts[bit / integerPartWidth]
2133          & ((integerPart) 1 << bit % integerPartWidth)) != 0;
2134 }
2135
2136 /* Set the given bit of a bignum.  */
2137 void
2138 APInt::tcSetBit(integerPart *parts, unsigned int bit)
2139 {
2140   parts[bit / integerPartWidth] |= (integerPart) 1 << (bit % integerPartWidth);
2141 }
2142
2143 /* Returns the bit number of the least significant set bit of a
2144    number.  If the input number has no bits set -1U is returned.  */
2145 unsigned int
2146 APInt::tcLSB(const integerPart *parts, unsigned int n)
2147 {
2148   unsigned int i, lsb;
2149
2150   for(i = 0; i < n; i++) {
2151       if (parts[i] != 0) {
2152           lsb = partLSB(parts[i]);
2153
2154           return lsb + i * integerPartWidth;
2155       }
2156   }
2157
2158   return -1U;
2159 }
2160
2161 /* Returns the bit number of the most significant set bit of a number.
2162    If the input number has no bits set -1U is returned.  */
2163 unsigned int
2164 APInt::tcMSB(const integerPart *parts, unsigned int n)
2165 {
2166   unsigned int msb;
2167
2168   do {
2169       --n;
2170
2171       if (parts[n] != 0) {
2172           msb = partMSB(parts[n]);
2173
2174           return msb + n * integerPartWidth;
2175       }
2176   } while (n);
2177
2178   return -1U;
2179 }
2180
2181 /* Copy the bit vector of width srcBITS from SRC, starting at bit
2182    srcLSB, to DST, of dstCOUNT parts, such that the bit srcLSB becomes
2183    the least significant bit of DST.  All high bits above srcBITS in
2184    DST are zero-filled.  */
2185 void
2186 APInt::tcExtract(integerPart *dst, unsigned int dstCount, const integerPart *src,
2187                  unsigned int srcBits, unsigned int srcLSB)
2188 {
2189   unsigned int firstSrcPart, dstParts, shift, n;
2190
2191   dstParts = (srcBits + integerPartWidth - 1) / integerPartWidth;
2192   assert (dstParts <= dstCount);
2193
2194   firstSrcPart = srcLSB / integerPartWidth;
2195   tcAssign (dst, src + firstSrcPart, dstParts);
2196
2197   shift = srcLSB % integerPartWidth;
2198   tcShiftRight (dst, dstParts, shift);
2199
2200   /* We now have (dstParts * integerPartWidth - shift) bits from SRC
2201      in DST.  If this is less that srcBits, append the rest, else
2202      clear the high bits.  */
2203   n = dstParts * integerPartWidth - shift;
2204   if (n < srcBits) {
2205     integerPart mask = lowBitMask (srcBits - n);
2206     dst[dstParts - 1] |= ((src[firstSrcPart + dstParts] & mask)
2207                           << n % integerPartWidth);
2208   } else if (n > srcBits) {
2209     if (srcBits % integerPartWidth)
2210       dst[dstParts - 1] &= lowBitMask (srcBits % integerPartWidth);
2211   }
2212
2213   /* Clear high parts.  */
2214   while (dstParts < dstCount)
2215     dst[dstParts++] = 0;
2216 }
2217
2218 /* DST += RHS + C where C is zero or one.  Returns the carry flag.  */
2219 integerPart
2220 APInt::tcAdd(integerPart *dst, const integerPart *rhs,
2221              integerPart c, unsigned int parts)
2222 {
2223   unsigned int i;
2224
2225   assert(c <= 1);
2226
2227   for(i = 0; i < parts; i++) {
2228     integerPart l;
2229
2230     l = dst[i];
2231     if (c) {
2232       dst[i] += rhs[i] + 1;
2233       c = (dst[i] <= l);
2234     } else {
2235       dst[i] += rhs[i];
2236       c = (dst[i] < l);
2237     }
2238   }
2239
2240   return c;
2241 }
2242
2243 /* DST -= RHS + C where C is zero or one.  Returns the carry flag.  */
2244 integerPart
2245 APInt::tcSubtract(integerPart *dst, const integerPart *rhs,
2246                   integerPart c, unsigned int parts)
2247 {
2248   unsigned int i;
2249
2250   assert(c <= 1);
2251
2252   for(i = 0; i < parts; i++) {
2253     integerPart l;
2254
2255     l = dst[i];
2256     if (c) {
2257       dst[i] -= rhs[i] + 1;
2258       c = (dst[i] >= l);
2259     } else {
2260       dst[i] -= rhs[i];
2261       c = (dst[i] > l);
2262     }
2263   }
2264
2265   return c;
2266 }
2267
2268 /* Negate a bignum in-place.  */
2269 void
2270 APInt::tcNegate(integerPart *dst, unsigned int parts)
2271 {
2272   tcComplement(dst, parts);
2273   tcIncrement(dst, parts);
2274 }
2275
2276 /*  DST += SRC * MULTIPLIER + CARRY   if add is true
2277     DST  = SRC * MULTIPLIER + CARRY   if add is false
2278
2279     Requires 0 <= DSTPARTS <= SRCPARTS + 1.  If DST overlaps SRC
2280     they must start at the same point, i.e. DST == SRC.
2281
2282     If DSTPARTS == SRCPARTS + 1 no overflow occurs and zero is
2283     returned.  Otherwise DST is filled with the least significant
2284     DSTPARTS parts of the result, and if all of the omitted higher
2285     parts were zero return zero, otherwise overflow occurred and
2286     return one.  */
2287 int
2288 APInt::tcMultiplyPart(integerPart *dst, const integerPart *src,
2289                       integerPart multiplier, integerPart carry,
2290                       unsigned int srcParts, unsigned int dstParts,
2291                       bool add)
2292 {
2293   unsigned int i, n;
2294
2295   /* Otherwise our writes of DST kill our later reads of SRC.  */
2296   assert(dst <= src || dst >= src + srcParts);
2297   assert(dstParts <= srcParts + 1);
2298
2299   /* N loops; minimum of dstParts and srcParts.  */
2300   n = dstParts < srcParts ? dstParts: srcParts;
2301
2302   for(i = 0; i < n; i++) {
2303     integerPart low, mid, high, srcPart;
2304
2305       /* [ LOW, HIGH ] = MULTIPLIER * SRC[i] + DST[i] + CARRY.
2306
2307          This cannot overflow, because
2308
2309          (n - 1) * (n - 1) + 2 (n - 1) = (n - 1) * (n + 1)
2310
2311          which is less than n^2.  */
2312
2313     srcPart = src[i];
2314
2315     if (multiplier == 0 || srcPart == 0)        {
2316       low = carry;
2317       high = 0;
2318     } else {
2319       low = lowHalf(srcPart) * lowHalf(multiplier);
2320       high = highHalf(srcPart) * highHalf(multiplier);
2321
2322       mid = lowHalf(srcPart) * highHalf(multiplier);
2323       high += highHalf(mid);
2324       mid <<= integerPartWidth / 2;
2325       if (low + mid < low)
2326         high++;
2327       low += mid;
2328
2329       mid = highHalf(srcPart) * lowHalf(multiplier);
2330       high += highHalf(mid);
2331       mid <<= integerPartWidth / 2;
2332       if (low + mid < low)
2333         high++;
2334       low += mid;
2335
2336       /* Now add carry.  */
2337       if (low + carry < low)
2338         high++;
2339       low += carry;
2340     }
2341
2342     if (add) {
2343       /* And now DST[i], and store the new low part there.  */
2344       if (low + dst[i] < low)
2345         high++;
2346       dst[i] += low;
2347     } else
2348       dst[i] = low;
2349
2350     carry = high;
2351   }
2352
2353   if (i < dstParts) {
2354     /* Full multiplication, there is no overflow.  */
2355     assert(i + 1 == dstParts);
2356     dst[i] = carry;
2357     return 0;
2358   } else {
2359     /* We overflowed if there is carry.  */
2360     if (carry)
2361       return 1;
2362
2363     /* We would overflow if any significant unwritten parts would be
2364        non-zero.  This is true if any remaining src parts are non-zero
2365        and the multiplier is non-zero.  */
2366     if (multiplier)
2367       for(; i < srcParts; i++)
2368         if (src[i])
2369           return 1;
2370
2371     /* We fitted in the narrow destination.  */
2372     return 0;
2373   }
2374 }
2375
2376 /* DST = LHS * RHS, where DST has the same width as the operands and
2377    is filled with the least significant parts of the result.  Returns
2378    one if overflow occurred, otherwise zero.  DST must be disjoint
2379    from both operands.  */
2380 int
2381 APInt::tcMultiply(integerPart *dst, const integerPart *lhs,
2382                   const integerPart *rhs, unsigned int parts)
2383 {
2384   unsigned int i;
2385   int overflow;
2386
2387   assert(dst != lhs && dst != rhs);
2388
2389   overflow = 0;
2390   tcSet(dst, 0, parts);
2391
2392   for(i = 0; i < parts; i++)
2393     overflow |= tcMultiplyPart(&dst[i], lhs, rhs[i], 0, parts,
2394                                parts - i, true);
2395
2396   return overflow;
2397 }
2398
2399 /* DST = LHS * RHS, where DST has width the sum of the widths of the
2400    operands.  No overflow occurs.  DST must be disjoint from both
2401    operands.  Returns the number of parts required to hold the
2402    result.  */
2403 unsigned int
2404 APInt::tcFullMultiply(integerPart *dst, const integerPart *lhs,
2405                       const integerPart *rhs, unsigned int lhsParts,
2406                       unsigned int rhsParts)
2407 {
2408   /* Put the narrower number on the LHS for less loops below.  */
2409   if (lhsParts > rhsParts) {
2410     return tcFullMultiply (dst, rhs, lhs, rhsParts, lhsParts);
2411   } else {
2412     unsigned int n;
2413
2414     assert(dst != lhs && dst != rhs);
2415
2416     tcSet(dst, 0, rhsParts);
2417
2418     for(n = 0; n < lhsParts; n++)
2419       tcMultiplyPart(&dst[n], rhs, lhs[n], 0, rhsParts, rhsParts + 1, true);
2420
2421     n = lhsParts + rhsParts;
2422
2423     return n - (dst[n - 1] == 0);
2424   }
2425 }
2426
2427 /* If RHS is zero LHS and REMAINDER are left unchanged, return one.
2428    Otherwise set LHS to LHS / RHS with the fractional part discarded,
2429    set REMAINDER to the remainder, return zero.  i.e.
2430
2431    OLD_LHS = RHS * LHS + REMAINDER
2432
2433    SCRATCH is a bignum of the same size as the operands and result for
2434    use by the routine; its contents need not be initialized and are
2435    destroyed.  LHS, REMAINDER and SCRATCH must be distinct.
2436 */
2437 int
2438 APInt::tcDivide(integerPart *lhs, const integerPart *rhs,
2439                 integerPart *remainder, integerPart *srhs,
2440                 unsigned int parts)
2441 {
2442   unsigned int n, shiftCount;
2443   integerPart mask;
2444
2445   assert(lhs != remainder && lhs != srhs && remainder != srhs);
2446
2447   shiftCount = tcMSB(rhs, parts) + 1;
2448   if (shiftCount == 0)
2449     return true;
2450
2451   shiftCount = parts * integerPartWidth - shiftCount;
2452   n = shiftCount / integerPartWidth;
2453   mask = (integerPart) 1 << (shiftCount % integerPartWidth);
2454
2455   tcAssign(srhs, rhs, parts);
2456   tcShiftLeft(srhs, parts, shiftCount);
2457   tcAssign(remainder, lhs, parts);
2458   tcSet(lhs, 0, parts);
2459
2460   /* Loop, subtracting SRHS if REMAINDER is greater and adding that to
2461      the total.  */
2462   for(;;) {
2463       int compare;
2464
2465       compare = tcCompare(remainder, srhs, parts);
2466       if (compare >= 0) {
2467         tcSubtract(remainder, srhs, 0, parts);
2468         lhs[n] |= mask;
2469       }
2470
2471       if (shiftCount == 0)
2472         break;
2473       shiftCount--;
2474       tcShiftRight(srhs, parts, 1);
2475       if ((mask >>= 1) == 0)
2476         mask = (integerPart) 1 << (integerPartWidth - 1), n--;
2477   }
2478
2479   return false;
2480 }
2481
2482 /* Shift a bignum left COUNT bits in-place.  Shifted in bits are zero.
2483    There are no restrictions on COUNT.  */
2484 void
2485 APInt::tcShiftLeft(integerPart *dst, unsigned int parts, unsigned int count)
2486 {
2487   if (count) {
2488     unsigned int jump, shift;
2489
2490     /* Jump is the inter-part jump; shift is is intra-part shift.  */
2491     jump = count / integerPartWidth;
2492     shift = count % integerPartWidth;
2493
2494     while (parts > jump) {
2495       integerPart part;
2496
2497       parts--;
2498
2499       /* dst[i] comes from the two parts src[i - jump] and, if we have
2500          an intra-part shift, src[i - jump - 1].  */
2501       part = dst[parts - jump];
2502       if (shift) {
2503         part <<= shift;
2504         if (parts >= jump + 1)
2505           part |= dst[parts - jump - 1] >> (integerPartWidth - shift);
2506       }
2507
2508       dst[parts] = part;
2509     }
2510
2511     while (parts > 0)
2512       dst[--parts] = 0;
2513   }
2514 }
2515
2516 /* Shift a bignum right COUNT bits in-place.  Shifted in bits are
2517    zero.  There are no restrictions on COUNT.  */
2518 void
2519 APInt::tcShiftRight(integerPart *dst, unsigned int parts, unsigned int count)
2520 {
2521   if (count) {
2522     unsigned int i, jump, shift;
2523
2524     /* Jump is the inter-part jump; shift is is intra-part shift.  */
2525     jump = count / integerPartWidth;
2526     shift = count % integerPartWidth;
2527
2528     /* Perform the shift.  This leaves the most significant COUNT bits
2529        of the result at zero.  */
2530     for(i = 0; i < parts; i++) {
2531       integerPart part;
2532
2533       if (i + jump >= parts) {
2534         part = 0;
2535       } else {
2536         part = dst[i + jump];
2537         if (shift) {
2538           part >>= shift;
2539           if (i + jump + 1 < parts)
2540             part |= dst[i + jump + 1] << (integerPartWidth - shift);
2541         }
2542       }
2543
2544       dst[i] = part;
2545     }
2546   }
2547 }
2548
2549 /* Bitwise and of two bignums.  */
2550 void
2551 APInt::tcAnd(integerPart *dst, const integerPart *rhs, unsigned int parts)
2552 {
2553   unsigned int i;
2554
2555   for(i = 0; i < parts; i++)
2556     dst[i] &= rhs[i];
2557 }
2558
2559 /* Bitwise inclusive or of two bignums.  */
2560 void
2561 APInt::tcOr(integerPart *dst, const integerPart *rhs, unsigned int parts)
2562 {
2563   unsigned int i;
2564
2565   for(i = 0; i < parts; i++)
2566     dst[i] |= rhs[i];
2567 }
2568
2569 /* Bitwise exclusive or of two bignums.  */
2570 void
2571 APInt::tcXor(integerPart *dst, const integerPart *rhs, unsigned int parts)
2572 {
2573   unsigned int i;
2574
2575   for(i = 0; i < parts; i++)
2576     dst[i] ^= rhs[i];
2577 }
2578
2579 /* Complement a bignum in-place.  */
2580 void
2581 APInt::tcComplement(integerPart *dst, unsigned int parts)
2582 {
2583   unsigned int i;
2584
2585   for(i = 0; i < parts; i++)
2586     dst[i] = ~dst[i];
2587 }
2588
2589 /* Comparison (unsigned) of two bignums.  */
2590 int
2591 APInt::tcCompare(const integerPart *lhs, const integerPart *rhs,
2592                  unsigned int parts)
2593 {
2594   while (parts) {
2595       parts--;
2596       if (lhs[parts] == rhs[parts])
2597         continue;
2598
2599       if (lhs[parts] > rhs[parts])
2600         return 1;
2601       else
2602         return -1;
2603     }
2604
2605   return 0;
2606 }
2607
2608 /* Increment a bignum in-place, return the carry flag.  */
2609 integerPart
2610 APInt::tcIncrement(integerPart *dst, unsigned int parts)
2611 {
2612   unsigned int i;
2613
2614   for(i = 0; i < parts; i++)
2615     if (++dst[i] != 0)
2616       break;
2617
2618   return i == parts;
2619 }
2620
2621 /* Set the least significant BITS bits of a bignum, clear the
2622    rest.  */
2623 void
2624 APInt::tcSetLeastSignificantBits(integerPart *dst, unsigned int parts,
2625                                  unsigned int bits)
2626 {
2627   unsigned int i;
2628
2629   i = 0;
2630   while (bits > integerPartWidth) {
2631     dst[i++] = ~(integerPart) 0;
2632     bits -= integerPartWidth;
2633   }
2634
2635   if (bits)
2636     dst[i++] = ~(integerPart) 0 >> (integerPartWidth - bits);
2637
2638   while (i < parts)
2639     dst[i++] = 0;
2640 }