blob: 43173311cd8029caf08fa54d7f9bb8e3c144e8ca [file] [log] [blame]
Zhou Shengdac63782007-02-06 03:00:16 +00001//===-- APInt.cpp - Implement APInt class ---------------------------------===//
2//
Chandler Carruth2946cd72019-01-19 08:50:56 +00003// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
Zhou Shengdac63782007-02-06 03:00:16 +00006//
7//===----------------------------------------------------------------------===//
8//
Reid Spencera41e93b2007-02-25 19:32:03 +00009// This file implements a class to represent arbitrary precision integer
10// constant values and provide a variety of arithmetic operations on them.
Zhou Shengdac63782007-02-06 03:00:16 +000011//
12//===----------------------------------------------------------------------===//
13
14#include "llvm/ADT/APInt.h"
Mehdi Amini47b292d2016-04-16 07:51:28 +000015#include "llvm/ADT/ArrayRef.h"
Ted Kremenek5c75d542008-01-19 04:23:33 +000016#include "llvm/ADT/FoldingSet.h"
Chandler Carruth71bd7d12012-03-04 12:02:57 +000017#include "llvm/ADT/Hashing.h"
Krzysztof Parzyszek90f32492018-08-02 19:13:35 +000018#include "llvm/ADT/Optional.h"
Chris Lattner17f71652008-08-17 07:19:36 +000019#include "llvm/ADT/SmallString.h"
Chandler Carruth71bd7d12012-03-04 12:02:57 +000020#include "llvm/ADT/StringRef.h"
JF Bastienc4986ce2018-09-08 03:55:25 +000021#include "llvm/ADT/bit.h"
Nico Weber432a3882018-04-30 14:59:11 +000022#include "llvm/Config/llvm-config.h"
Reid Spencera5e0d202007-02-24 03:58:46 +000023#include "llvm/Support/Debug.h"
Torok Edwin56d06592009-07-11 20:10:48 +000024#include "llvm/Support/ErrorHandling.h"
Zhou Shengdac63782007-02-06 03:00:16 +000025#include "llvm/Support/MathExtras.h"
Chris Lattner0c19df42008-08-23 22:23:09 +000026#include "llvm/Support/raw_ostream.h"
Vassil Vassilev2ec8b152016-09-14 08:55:18 +000027#include <climits>
Chris Lattner17f71652008-08-17 07:19:36 +000028#include <cmath>
Zhou Shengdac63782007-02-06 03:00:16 +000029#include <cstdlib>
Chandler Carruthed0881b2012-12-03 16:50:05 +000030#include <cstring>
Zhou Shengdac63782007-02-06 03:00:16 +000031using namespace llvm;
32
Chandler Carruth64648262014-04-22 03:07:47 +000033#define DEBUG_TYPE "apint"
34
Reid Spencera41e93b2007-02-25 19:32:03 +000035/// A utility function for allocating memory, checking for allocation failures,
36/// and ensuring the contents are zeroed.
Chris Lattner77527f52009-01-21 18:09:24 +000037inline static uint64_t* getClearedMemory(unsigned numWords) {
Fangrui Songc244a152018-03-23 17:26:12 +000038 uint64_t *result = new uint64_t[numWords];
Reid Spencera856b6e2007-02-18 18:38:44 +000039 memset(result, 0, numWords * sizeof(uint64_t));
40 return result;
Zhou Sheng94b623a2007-02-06 06:04:53 +000041}
42
Eric Christopher820256b2009-08-21 04:06:45 +000043/// A utility function for allocating memory and checking for allocation
Reid Spencera41e93b2007-02-25 19:32:03 +000044/// failure. The content is not zeroed.
Chris Lattner77527f52009-01-21 18:09:24 +000045inline static uint64_t* getMemory(unsigned numWords) {
Fangrui Songc244a152018-03-23 17:26:12 +000046 return new uint64_t[numWords];
Reid Spencera856b6e2007-02-18 18:38:44 +000047}
48
Erick Tryzelaardadb15712009-08-21 03:15:28 +000049/// A utility function that converts a character to a digit.
50inline static unsigned getDigit(char cdigit, uint8_t radix) {
Erick Tryzelaar60964092009-08-21 06:48:37 +000051 unsigned r;
52
Douglas Gregor663c0682011-09-14 15:54:46 +000053 if (radix == 16 || radix == 36) {
Erick Tryzelaar60964092009-08-21 06:48:37 +000054 r = cdigit - '0';
55 if (r <= 9)
56 return r;
57
58 r = cdigit - 'A';
Douglas Gregorc98ac852011-09-20 18:33:29 +000059 if (r <= radix - 11U)
Erick Tryzelaar60964092009-08-21 06:48:37 +000060 return r + 10;
61
62 r = cdigit - 'a';
Douglas Gregorc98ac852011-09-20 18:33:29 +000063 if (r <= radix - 11U)
Erick Tryzelaar60964092009-08-21 06:48:37 +000064 return r + 10;
Simon Pilgrim4c0ea9d2017-02-23 16:07:04 +000065
Douglas Gregore4e20f42011-09-20 18:11:52 +000066 radix = 10;
Erick Tryzelaardadb15712009-08-21 03:15:28 +000067 }
68
Erick Tryzelaar60964092009-08-21 06:48:37 +000069 r = cdigit - '0';
70 if (r < radix)
71 return r;
72
73 return -1U;
Erick Tryzelaardadb15712009-08-21 03:15:28 +000074}
75
76
Pawel Bylica68304012016-06-27 08:31:48 +000077void APInt::initSlowCase(uint64_t val, bool isSigned) {
Craig Topperb339c6d2017-05-03 15:46:24 +000078 U.pVal = getClearedMemory(getNumWords());
79 U.pVal[0] = val;
Eric Christopher820256b2009-08-21 04:06:45 +000080 if (isSigned && int64_t(val) < 0)
Chris Lattner1ac3e252008-08-20 17:02:31 +000081 for (unsigned i = 1; i < getNumWords(); ++i)
Simon Pilgrim8f465052018-08-16 11:08:23 +000082 U.pVal[i] = WORDTYPE_MAX;
Craig Topperf78a6f02017-03-01 21:06:18 +000083 clearUnusedBits();
Zhou Shengdac63782007-02-06 03:00:16 +000084}
85
Chris Lattnerd57b7602008-10-11 22:07:19 +000086void APInt::initSlowCase(const APInt& that) {
Craig Topperb339c6d2017-05-03 15:46:24 +000087 U.pVal = getMemory(getNumWords());
88 memcpy(U.pVal, that.U.pVal, getNumWords() * APINT_WORD_SIZE);
Chris Lattnerd57b7602008-10-11 22:07:19 +000089}
90
Jeffrey Yasskin7a162882011-07-18 21:45:40 +000091void APInt::initFromArray(ArrayRef<uint64_t> bigVal) {
Erick Tryzelaar1264bcb2009-08-21 03:15:14 +000092 assert(BitWidth && "Bitwidth too small");
Jeffrey Yasskin7a162882011-07-18 21:45:40 +000093 assert(bigVal.data() && "Null pointer detected!");
Zhou Shengdac63782007-02-06 03:00:16 +000094 if (isSingleWord())
Craig Topperb339c6d2017-05-03 15:46:24 +000095 U.VAL = bigVal[0];
Zhou Shengdac63782007-02-06 03:00:16 +000096 else {
Reid Spencerdf6cf5a2007-02-24 10:01:42 +000097 // Get memory, cleared to 0
Craig Topperb339c6d2017-05-03 15:46:24 +000098 U.pVal = getClearedMemory(getNumWords());
Reid Spencerdf6cf5a2007-02-24 10:01:42 +000099 // Calculate the number of words to copy
Jeffrey Yasskin7a162882011-07-18 21:45:40 +0000100 unsigned words = std::min<unsigned>(bigVal.size(), getNumWords());
Reid Spencerdf6cf5a2007-02-24 10:01:42 +0000101 // Copy the words from bigVal to pVal
Craig Topperb339c6d2017-05-03 15:46:24 +0000102 memcpy(U.pVal, bigVal.data(), words * APINT_WORD_SIZE);
Zhou Shengdac63782007-02-06 03:00:16 +0000103 }
Reid Spencerdf6cf5a2007-02-24 10:01:42 +0000104 // Make sure unused high bits are cleared
105 clearUnusedBits();
Zhou Shengdac63782007-02-06 03:00:16 +0000106}
107
Jeffrey Yasskin7a162882011-07-18 21:45:40 +0000108APInt::APInt(unsigned numBits, ArrayRef<uint64_t> bigVal)
Craig Topper0085ffb2017-03-20 01:29:52 +0000109 : BitWidth(numBits) {
Jeffrey Yasskin7a162882011-07-18 21:45:40 +0000110 initFromArray(bigVal);
111}
112
113APInt::APInt(unsigned numBits, unsigned numWords, const uint64_t bigVal[])
Craig Topper0085ffb2017-03-20 01:29:52 +0000114 : BitWidth(numBits) {
Jeffrey Yasskin7a162882011-07-18 21:45:40 +0000115 initFromArray(makeArrayRef(bigVal, numWords));
116}
117
Benjamin Kramer92d89982010-07-14 22:38:02 +0000118APInt::APInt(unsigned numbits, StringRef Str, uint8_t radix)
Craig Topperb339c6d2017-05-03 15:46:24 +0000119 : BitWidth(numbits) {
Erick Tryzelaar1264bcb2009-08-21 03:15:14 +0000120 assert(BitWidth && "Bitwidth too small");
Daniel Dunbar3a1efd112009-08-13 02:33:34 +0000121 fromString(numbits, Str, radix);
Zhou Sheng3e8022d2007-02-07 06:14:53 +0000122}
123
Craig Toppera92fd0b2017-05-12 01:46:01 +0000124void APInt::reallocate(unsigned NewBitWidth) {
125 // If the number of words is the same we can just change the width and stop.
126 if (getNumWords() == getNumWords(NewBitWidth)) {
127 BitWidth = NewBitWidth;
128 return;
129 }
130
131 // If we have an allocation, delete it.
132 if (!isSingleWord())
133 delete [] U.pVal;
134
135 // Update BitWidth.
136 BitWidth = NewBitWidth;
137
138 // If we are supposed to have an allocation, create it.
139 if (!isSingleWord())
140 U.pVal = getMemory(getNumWords());
141}
142
Craig Topperc67fe572017-04-19 17:01:58 +0000143void APInt::AssignSlowCase(const APInt& RHS) {
Reid Spencer7c16cd22007-02-26 23:38:21 +0000144 // Don't do anything for X = X
145 if (this == &RHS)
Craig Topperc67fe572017-04-19 17:01:58 +0000146 return;
Reid Spencer7c16cd22007-02-26 23:38:21 +0000147
Craig Toppera92fd0b2017-05-12 01:46:01 +0000148 // Adjust the bit width and handle allocations as necessary.
149 reallocate(RHS.getBitWidth());
Reid Spencer7c16cd22007-02-26 23:38:21 +0000150
Craig Toppera92fd0b2017-05-12 01:46:01 +0000151 // Copy the data.
152 if (isSingleWord())
Craig Topperb339c6d2017-05-03 15:46:24 +0000153 U.VAL = RHS.U.VAL;
Craig Toppera92fd0b2017-05-12 01:46:01 +0000154 else
155 memcpy(U.pVal, RHS.U.pVal, getNumWords() * APINT_WORD_SIZE);
Zhou Shengdac63782007-02-06 03:00:16 +0000156}
157
Pawel Bylica6eeeac72015-04-06 13:31:39 +0000158/// This method 'profiles' an APInt for use with FoldingSet.
Ted Kremenek5c75d542008-01-19 04:23:33 +0000159void APInt::Profile(FoldingSetNodeID& ID) const {
Ted Kremenek901540f2008-02-19 20:50:41 +0000160 ID.AddInteger(BitWidth);
Eric Christopher820256b2009-08-21 04:06:45 +0000161
Ted Kremenek5c75d542008-01-19 04:23:33 +0000162 if (isSingleWord()) {
Craig Topperb339c6d2017-05-03 15:46:24 +0000163 ID.AddInteger(U.VAL);
Ted Kremenek5c75d542008-01-19 04:23:33 +0000164 return;
165 }
166
Chris Lattner77527f52009-01-21 18:09:24 +0000167 unsigned NumWords = getNumWords();
Ted Kremenek5c75d542008-01-19 04:23:33 +0000168 for (unsigned i = 0; i < NumWords; ++i)
Craig Topperb339c6d2017-05-03 15:46:24 +0000169 ID.AddInteger(U.pVal[i]);
Ted Kremenek5c75d542008-01-19 04:23:33 +0000170}
171
Adrian Prantl4dfcc4a2018-05-01 16:10:38 +0000172/// Prefix increment operator. Increments the APInt by one.
Zhou Shengdac63782007-02-06 03:00:16 +0000173APInt& APInt::operator++() {
Eric Christopher820256b2009-08-21 04:06:45 +0000174 if (isSingleWord())
Craig Topperb339c6d2017-05-03 15:46:24 +0000175 ++U.VAL;
Zhou Shengdac63782007-02-06 03:00:16 +0000176 else
Craig Topperb339c6d2017-05-03 15:46:24 +0000177 tcIncrement(U.pVal, getNumWords());
Reid Spencera41e93b2007-02-25 19:32:03 +0000178 return clearUnusedBits();
Zhou Shengdac63782007-02-06 03:00:16 +0000179}
180
Adrian Prantl4dfcc4a2018-05-01 16:10:38 +0000181/// Prefix decrement operator. Decrements the APInt by one.
Zhou Shengdac63782007-02-06 03:00:16 +0000182APInt& APInt::operator--() {
Eric Christopher820256b2009-08-21 04:06:45 +0000183 if (isSingleWord())
Craig Topperb339c6d2017-05-03 15:46:24 +0000184 --U.VAL;
Zhou Shengdac63782007-02-06 03:00:16 +0000185 else
Craig Topperb339c6d2017-05-03 15:46:24 +0000186 tcDecrement(U.pVal, getNumWords());
Reid Spencera41e93b2007-02-25 19:32:03 +0000187 return clearUnusedBits();
Zhou Shengdac63782007-02-06 03:00:16 +0000188}
189
Reid Spencera41e93b2007-02-25 19:32:03 +0000190/// Adds the RHS APint to this APInt.
191/// @returns this, after addition of RHS.
Adrian Prantl4dfcc4a2018-05-01 16:10:38 +0000192/// Addition assignment operator.
Zhou Shengdac63782007-02-06 03:00:16 +0000193APInt& APInt::operator+=(const APInt& RHS) {
Reid Spencera32372d12007-02-17 00:18:01 +0000194 assert(BitWidth == RHS.BitWidth && "Bit widths must be the same");
Eric Christopher820256b2009-08-21 04:06:45 +0000195 if (isSingleWord())
Craig Topperb339c6d2017-05-03 15:46:24 +0000196 U.VAL += RHS.U.VAL;
Craig Topper15e484a2017-04-02 06:59:43 +0000197 else
Craig Topperb339c6d2017-05-03 15:46:24 +0000198 tcAdd(U.pVal, RHS.U.pVal, 0, getNumWords());
Reid Spencera41e93b2007-02-25 19:32:03 +0000199 return clearUnusedBits();
Zhou Shengdac63782007-02-06 03:00:16 +0000200}
201
Pete Cooperfea21392016-07-22 20:55:46 +0000202APInt& APInt::operator+=(uint64_t RHS) {
203 if (isSingleWord())
Craig Topperb339c6d2017-05-03 15:46:24 +0000204 U.VAL += RHS;
Pete Cooperfea21392016-07-22 20:55:46 +0000205 else
Craig Topperb339c6d2017-05-03 15:46:24 +0000206 tcAddPart(U.pVal, RHS, getNumWords());
Pete Cooperfea21392016-07-22 20:55:46 +0000207 return clearUnusedBits();
208}
209
Reid Spencera41e93b2007-02-25 19:32:03 +0000210/// Subtracts the RHS APInt from this APInt
211/// @returns this, after subtraction
Adrian Prantl4dfcc4a2018-05-01 16:10:38 +0000212/// Subtraction assignment operator.
Zhou Shengdac63782007-02-06 03:00:16 +0000213APInt& APInt::operator-=(const APInt& RHS) {
Reid Spencera32372d12007-02-17 00:18:01 +0000214 assert(BitWidth == RHS.BitWidth && "Bit widths must be the same");
Eric Christopher820256b2009-08-21 04:06:45 +0000215 if (isSingleWord())
Craig Topperb339c6d2017-05-03 15:46:24 +0000216 U.VAL -= RHS.U.VAL;
Reid Spencer7a6a8d52007-02-20 23:40:25 +0000217 else
Craig Topperb339c6d2017-05-03 15:46:24 +0000218 tcSubtract(U.pVal, RHS.U.pVal, 0, getNumWords());
Reid Spencera41e93b2007-02-25 19:32:03 +0000219 return clearUnusedBits();
Zhou Shengdac63782007-02-06 03:00:16 +0000220}
221
Pete Cooperfea21392016-07-22 20:55:46 +0000222APInt& APInt::operator-=(uint64_t RHS) {
223 if (isSingleWord())
Craig Topperb339c6d2017-05-03 15:46:24 +0000224 U.VAL -= RHS;
Pete Cooperfea21392016-07-22 20:55:46 +0000225 else
Craig Topperb339c6d2017-05-03 15:46:24 +0000226 tcSubtractPart(U.pVal, RHS, getNumWords());
Pete Cooperfea21392016-07-22 20:55:46 +0000227 return clearUnusedBits();
228}
229
Craig Topper93c68e12017-05-04 17:00:41 +0000230APInt APInt::operator*(const APInt& RHS) const {
Reid Spencera32372d12007-02-17 00:18:01 +0000231 assert(BitWidth == RHS.BitWidth && "Bit widths must be the same");
Craig Topper93c68e12017-05-04 17:00:41 +0000232 if (isSingleWord())
233 return APInt(BitWidth, U.VAL * RHS.U.VAL);
Reid Spencer58a6a432007-02-21 08:21:52 +0000234
Craig Topper93c68e12017-05-04 17:00:41 +0000235 APInt Result(getMemory(getNumWords()), getBitWidth());
Reid Spencer58a6a432007-02-21 08:21:52 +0000236
Craig Topper93c68e12017-05-04 17:00:41 +0000237 tcMultiply(Result.U.pVal, U.pVal, RHS.U.pVal, getNumWords());
Reid Spencer58a6a432007-02-21 08:21:52 +0000238
Craig Topper93c68e12017-05-04 17:00:41 +0000239 Result.clearUnusedBits();
240 return Result;
Zhou Shengdac63782007-02-06 03:00:16 +0000241}
242
Craig Topperc67fe572017-04-19 17:01:58 +0000243void APInt::AndAssignSlowCase(const APInt& RHS) {
Craig Topperb339c6d2017-05-03 15:46:24 +0000244 tcAnd(U.pVal, RHS.U.pVal, getNumWords());
Zhou Shengdac63782007-02-06 03:00:16 +0000245}
246
Craig Topperc67fe572017-04-19 17:01:58 +0000247void APInt::OrAssignSlowCase(const APInt& RHS) {
Craig Topperb339c6d2017-05-03 15:46:24 +0000248 tcOr(U.pVal, RHS.U.pVal, getNumWords());
Zhou Shengdac63782007-02-06 03:00:16 +0000249}
250
Craig Topperc67fe572017-04-19 17:01:58 +0000251void APInt::XorAssignSlowCase(const APInt& RHS) {
Craig Topperb339c6d2017-05-03 15:46:24 +0000252 tcXor(U.pVal, RHS.U.pVal, getNumWords());
Zhou Shengdac63782007-02-06 03:00:16 +0000253}
254
Craig Topper93c68e12017-05-04 17:00:41 +0000255APInt& APInt::operator*=(const APInt& RHS) {
Reid Spencera32372d12007-02-17 00:18:01 +0000256 assert(BitWidth == RHS.BitWidth && "Bit widths must be the same");
Craig Topper93c68e12017-05-04 17:00:41 +0000257 *this = *this * RHS;
258 return *this;
Zhou Shengdac63782007-02-06 03:00:16 +0000259}
260
Craig Toppera51941f2017-05-08 04:55:09 +0000261APInt& APInt::operator*=(uint64_t RHS) {
262 if (isSingleWord()) {
263 U.VAL *= RHS;
264 } else {
265 unsigned NumWords = getNumWords();
266 tcMultiplyPart(U.pVal, U.pVal, RHS, 0, NumWords, NumWords, false);
267 }
268 return clearUnusedBits();
269}
270
Chris Lattner1ac3e252008-08-20 17:02:31 +0000271bool APInt::EqualSlowCase(const APInt& RHS) const {
Craig Topperb339c6d2017-05-03 15:46:24 +0000272 return std::equal(U.pVal, U.pVal + getNumWords(), RHS.U.pVal);
Zhou Shengdac63782007-02-06 03:00:16 +0000273}
274
Craig Topper1dc8fc82017-04-21 16:13:15 +0000275int APInt::compare(const APInt& RHS) const {
Reid Spencer1d072122007-02-16 22:36:51 +0000276 assert(BitWidth == RHS.BitWidth && "Bit widths must be same for comparison");
277 if (isSingleWord())
Craig Topperb339c6d2017-05-03 15:46:24 +0000278 return U.VAL < RHS.U.VAL ? -1 : U.VAL > RHS.U.VAL;
Reid Spencera41e93b2007-02-25 19:32:03 +0000279
Craig Topperb339c6d2017-05-03 15:46:24 +0000280 return tcCompare(U.pVal, RHS.U.pVal, getNumWords());
Zhou Shengdac63782007-02-06 03:00:16 +0000281}
282
Craig Topper1dc8fc82017-04-21 16:13:15 +0000283int APInt::compareSigned(const APInt& RHS) const {
Reid Spencer1d072122007-02-16 22:36:51 +0000284 assert(BitWidth == RHS.BitWidth && "Bit widths must be same for comparison");
Reid Spencerbe4ddf62007-02-18 20:09:41 +0000285 if (isSingleWord()) {
Craig Topperb339c6d2017-05-03 15:46:24 +0000286 int64_t lhsSext = SignExtend64(U.VAL, BitWidth);
287 int64_t rhsSext = SignExtend64(RHS.U.VAL, BitWidth);
Craig Topper1dc8fc82017-04-21 16:13:15 +0000288 return lhsSext < rhsSext ? -1 : lhsSext > rhsSext;
Reid Spencer1d072122007-02-16 22:36:51 +0000289 }
Reid Spencerbe4ddf62007-02-18 20:09:41 +0000290
Reid Spencer54abdcf2007-02-27 18:23:40 +0000291 bool lhsNeg = isNegative();
Pete Cooperd6e6bf12016-05-26 17:40:07 +0000292 bool rhsNeg = RHS.isNegative();
Reid Spencera41e93b2007-02-25 19:32:03 +0000293
Pete Cooperd6e6bf12016-05-26 17:40:07 +0000294 // If the sign bits don't match, then (LHS < RHS) if LHS is negative
295 if (lhsNeg != rhsNeg)
Craig Topper1dc8fc82017-04-21 16:13:15 +0000296 return lhsNeg ? -1 : 1;
Pete Cooperd6e6bf12016-05-26 17:40:07 +0000297
Simon Pilgrim0099beb2017-03-09 13:57:04 +0000298 // Otherwise we can just use an unsigned comparison, because even negative
Pete Cooperd6e6bf12016-05-26 17:40:07 +0000299 // numbers compare correctly this way if both have the same signed-ness.
Craig Topperb339c6d2017-05-03 15:46:24 +0000300 return tcCompare(U.pVal, RHS.U.pVal, getNumWords());
Zhou Shengdac63782007-02-06 03:00:16 +0000301}
302
Craig Topperbafdd032017-03-07 01:56:01 +0000303void APInt::setBitsSlowCase(unsigned loBit, unsigned hiBit) {
304 unsigned loWord = whichWord(loBit);
305 unsigned hiWord = whichWord(hiBit);
Simon Pilgrimaed35222017-02-24 10:15:29 +0000306
Simon Pilgrim0099beb2017-03-09 13:57:04 +0000307 // Create an initial mask for the low word with zeros below loBit.
Simon Pilgrim8f465052018-08-16 11:08:23 +0000308 uint64_t loMask = WORDTYPE_MAX << whichBit(loBit);
Simon Pilgrimaed35222017-02-24 10:15:29 +0000309
Craig Topperbafdd032017-03-07 01:56:01 +0000310 // If hiBit is not aligned, we need a high mask.
311 unsigned hiShiftAmt = whichBit(hiBit);
312 if (hiShiftAmt != 0) {
313 // Create a high mask with zeros above hiBit.
Simon Pilgrim8f465052018-08-16 11:08:23 +0000314 uint64_t hiMask = WORDTYPE_MAX >> (APINT_BITS_PER_WORD - hiShiftAmt);
Craig Topperbafdd032017-03-07 01:56:01 +0000315 // If loWord and hiWord are equal, then we combine the masks. Otherwise,
316 // set the bits in hiWord.
317 if (hiWord == loWord)
318 loMask &= hiMask;
319 else
Craig Topperb339c6d2017-05-03 15:46:24 +0000320 U.pVal[hiWord] |= hiMask;
Simon Pilgrimaed35222017-02-24 10:15:29 +0000321 }
Craig Topperbafdd032017-03-07 01:56:01 +0000322 // Apply the mask to the low word.
Craig Topperb339c6d2017-05-03 15:46:24 +0000323 U.pVal[loWord] |= loMask;
Craig Topperbafdd032017-03-07 01:56:01 +0000324
325 // Fill any words between loWord and hiWord with all ones.
326 for (unsigned word = loWord + 1; word < hiWord; ++word)
Simon Pilgrim8f465052018-08-16 11:08:23 +0000327 U.pVal[word] = WORDTYPE_MAX;
Simon Pilgrimaed35222017-02-24 10:15:29 +0000328}
329
Adrian Prantl4dfcc4a2018-05-01 16:10:38 +0000330/// Toggle every bit to its opposite value.
Craig Topperafc9e352017-03-27 17:10:21 +0000331void APInt::flipAllBitsSlowCase() {
Craig Topperb339c6d2017-05-03 15:46:24 +0000332 tcComplement(U.pVal, getNumWords());
Craig Topperafc9e352017-03-27 17:10:21 +0000333 clearUnusedBits();
334}
Zhou Shengdac63782007-02-06 03:00:16 +0000335
Eric Christopher820256b2009-08-21 04:06:45 +0000336/// Toggle a given bit to its opposite value whose position is given
Zhou Shengdac63782007-02-06 03:00:16 +0000337/// as "bitPosition".
Adrian Prantl4dfcc4a2018-05-01 16:10:38 +0000338/// Toggles a given bit to its opposite value.
Jay Foad25a5e4c2010-12-01 08:53:58 +0000339void APInt::flipBit(unsigned bitPosition) {
Reid Spencer1d072122007-02-16 22:36:51 +0000340 assert(bitPosition < BitWidth && "Out of the bit-width range!");
Jay Foad25a5e4c2010-12-01 08:53:58 +0000341 if ((*this)[bitPosition]) clearBit(bitPosition);
342 else setBit(bitPosition);
Zhou Shengdac63782007-02-06 03:00:16 +0000343}
344
Simon Pilgrimb02667c2017-03-10 13:44:32 +0000345void APInt::insertBits(const APInt &subBits, unsigned bitPosition) {
346 unsigned subBitWidth = subBits.getBitWidth();
347 assert(0 < subBitWidth && (subBitWidth + bitPosition) <= BitWidth &&
348 "Illegal bit insertion");
349
350 // Insertion is a direct copy.
351 if (subBitWidth == BitWidth) {
352 *this = subBits;
353 return;
354 }
355
356 // Single word result can be done as a direct bitmask.
357 if (isSingleWord()) {
Simon Pilgrim8f465052018-08-16 11:08:23 +0000358 uint64_t mask = WORDTYPE_MAX >> (APINT_BITS_PER_WORD - subBitWidth);
Craig Topperb339c6d2017-05-03 15:46:24 +0000359 U.VAL &= ~(mask << bitPosition);
360 U.VAL |= (subBits.U.VAL << bitPosition);
Simon Pilgrimb02667c2017-03-10 13:44:32 +0000361 return;
362 }
363
364 unsigned loBit = whichBit(bitPosition);
365 unsigned loWord = whichWord(bitPosition);
366 unsigned hi1Word = whichWord(bitPosition + subBitWidth - 1);
367
368 // Insertion within a single word can be done as a direct bitmask.
369 if (loWord == hi1Word) {
Simon Pilgrim8f465052018-08-16 11:08:23 +0000370 uint64_t mask = WORDTYPE_MAX >> (APINT_BITS_PER_WORD - subBitWidth);
Craig Topperb339c6d2017-05-03 15:46:24 +0000371 U.pVal[loWord] &= ~(mask << loBit);
372 U.pVal[loWord] |= (subBits.U.VAL << loBit);
Simon Pilgrimb02667c2017-03-10 13:44:32 +0000373 return;
374 }
375
376 // Insert on word boundaries.
377 if (loBit == 0) {
378 // Direct copy whole words.
379 unsigned numWholeSubWords = subBitWidth / APINT_BITS_PER_WORD;
Craig Topperb339c6d2017-05-03 15:46:24 +0000380 memcpy(U.pVal + loWord, subBits.getRawData(),
Simon Pilgrimb02667c2017-03-10 13:44:32 +0000381 numWholeSubWords * APINT_WORD_SIZE);
382
383 // Mask+insert remaining bits.
384 unsigned remainingBits = subBitWidth % APINT_BITS_PER_WORD;
385 if (remainingBits != 0) {
Simon Pilgrim8f465052018-08-16 11:08:23 +0000386 uint64_t mask = WORDTYPE_MAX >> (APINT_BITS_PER_WORD - remainingBits);
Craig Topperb339c6d2017-05-03 15:46:24 +0000387 U.pVal[hi1Word] &= ~mask;
388 U.pVal[hi1Word] |= subBits.getWord(subBitWidth - 1);
Simon Pilgrimb02667c2017-03-10 13:44:32 +0000389 }
390 return;
391 }
392
393 // General case - set/clear individual bits in dst based on src.
394 // TODO - there is scope for optimization here, but at the moment this code
395 // path is barely used so prefer readability over performance.
396 for (unsigned i = 0; i != subBitWidth; ++i) {
397 if (subBits[i])
398 setBit(bitPosition + i);
399 else
400 clearBit(bitPosition + i);
401 }
402}
403
Simon Pilgrim0f5fb5f2017-02-25 20:01:58 +0000404APInt APInt::extractBits(unsigned numBits, unsigned bitPosition) const {
405 assert(numBits > 0 && "Can't extract zero bits");
406 assert(bitPosition < BitWidth && (numBits + bitPosition) <= BitWidth &&
407 "Illegal bit extraction");
408
409 if (isSingleWord())
Craig Topperb339c6d2017-05-03 15:46:24 +0000410 return APInt(numBits, U.VAL >> bitPosition);
Simon Pilgrim0f5fb5f2017-02-25 20:01:58 +0000411
412 unsigned loBit = whichBit(bitPosition);
413 unsigned loWord = whichWord(bitPosition);
414 unsigned hiWord = whichWord(bitPosition + numBits - 1);
415
416 // Single word result extracting bits from a single word source.
417 if (loWord == hiWord)
Craig Topperb339c6d2017-05-03 15:46:24 +0000418 return APInt(numBits, U.pVal[loWord] >> loBit);
Simon Pilgrim0f5fb5f2017-02-25 20:01:58 +0000419
420 // Extracting bits that start on a source word boundary can be done
421 // as a fast memory copy.
422 if (loBit == 0)
Craig Topperb339c6d2017-05-03 15:46:24 +0000423 return APInt(numBits, makeArrayRef(U.pVal + loWord, 1 + hiWord - loWord));
Simon Pilgrim0f5fb5f2017-02-25 20:01:58 +0000424
425 // General case - shift + copy source words directly into place.
426 APInt Result(numBits, 0);
427 unsigned NumSrcWords = getNumWords();
428 unsigned NumDstWords = Result.getNumWords();
429
Tim Shen89337752018-02-16 01:44:36 +0000430 uint64_t *DestPtr = Result.isSingleWord() ? &Result.U.VAL : Result.U.pVal;
Simon Pilgrim0f5fb5f2017-02-25 20:01:58 +0000431 for (unsigned word = 0; word < NumDstWords; ++word) {
Craig Topperb339c6d2017-05-03 15:46:24 +0000432 uint64_t w0 = U.pVal[loWord + word];
Simon Pilgrim0f5fb5f2017-02-25 20:01:58 +0000433 uint64_t w1 =
Craig Topperb339c6d2017-05-03 15:46:24 +0000434 (loWord + word + 1) < NumSrcWords ? U.pVal[loWord + word + 1] : 0;
Tim Shen89337752018-02-16 01:44:36 +0000435 DestPtr[word] = (w0 >> loBit) | (w1 << (APINT_BITS_PER_WORD - loBit));
Simon Pilgrim0f5fb5f2017-02-25 20:01:58 +0000436 }
437
438 return Result.clearUnusedBits();
439}
440
Benjamin Kramer92d89982010-07-14 22:38:02 +0000441unsigned APInt::getBitsNeeded(StringRef str, uint8_t radix) {
Daniel Dunbar3a1efd112009-08-13 02:33:34 +0000442 assert(!str.empty() && "Invalid string length");
Simon Pilgrim4c0ea9d2017-02-23 16:07:04 +0000443 assert((radix == 10 || radix == 8 || radix == 16 || radix == 2 ||
Douglas Gregor663c0682011-09-14 15:54:46 +0000444 radix == 36) &&
445 "Radix should be 2, 8, 10, 16, or 36!");
Daniel Dunbar3a1efd112009-08-13 02:33:34 +0000446
447 size_t slen = str.size();
Reid Spencer9329e7b2007-04-13 19:19:07 +0000448
Eric Christopher43a1dec2009-08-21 04:10:31 +0000449 // Each computation below needs to know if it's negative.
Erick Tryzelaar1264bcb2009-08-21 03:15:14 +0000450 StringRef::iterator p = str.begin();
Eric Christopher43a1dec2009-08-21 04:10:31 +0000451 unsigned isNegative = *p == '-';
Erick Tryzelaar1264bcb2009-08-21 03:15:14 +0000452 if (*p == '-' || *p == '+') {
453 p++;
Reid Spencer9329e7b2007-04-13 19:19:07 +0000454 slen--;
Eric Christopher43a1dec2009-08-21 04:10:31 +0000455 assert(slen && "String is only a sign, needs a value.");
Reid Spencer9329e7b2007-04-13 19:19:07 +0000456 }
Eric Christopher43a1dec2009-08-21 04:10:31 +0000457
Reid Spencer9329e7b2007-04-13 19:19:07 +0000458 // For radixes of power-of-two values, the bits required is accurately and
459 // easily computed
460 if (radix == 2)
461 return slen + isNegative;
462 if (radix == 8)
463 return slen * 3 + isNegative;
464 if (radix == 16)
465 return slen * 4 + isNegative;
466
Douglas Gregor663c0682011-09-14 15:54:46 +0000467 // FIXME: base 36
Simon Pilgrim4c0ea9d2017-02-23 16:07:04 +0000468
Reid Spencer9329e7b2007-04-13 19:19:07 +0000469 // This is grossly inefficient but accurate. We could probably do something
470 // with a computation of roughly slen*64/20 and then adjust by the value of
471 // the first few digits. But, I'm not sure how accurate that could be.
472
473 // Compute a sufficient number of bits that is always large enough but might
Erick Tryzelaardadb15712009-08-21 03:15:28 +0000474 // be too large. This avoids the assertion in the constructor. This
475 // calculation doesn't work appropriately for the numbers 0-9, so just use 4
476 // bits in that case.
Simon Pilgrim4c0ea9d2017-02-23 16:07:04 +0000477 unsigned sufficient
Douglas Gregor663c0682011-09-14 15:54:46 +0000478 = radix == 10? (slen == 1 ? 4 : slen * 64/18)
479 : (slen == 1 ? 7 : slen * 16/3);
Reid Spencer9329e7b2007-04-13 19:19:07 +0000480
481 // Convert to the actual binary value.
Erick Tryzelaar1264bcb2009-08-21 03:15:14 +0000482 APInt tmp(sufficient, StringRef(p, slen), radix);
Reid Spencer9329e7b2007-04-13 19:19:07 +0000483
Erick Tryzelaardadb15712009-08-21 03:15:28 +0000484 // Compute how many bits are required. If the log is infinite, assume we need
Dmitry Venikov9e9eb622019-06-29 11:38:12 +0000485 // just bit. If the log is exact and value is negative, then the value is
486 // MinSignedValue with (log + 1) bits.
Erick Tryzelaardadb15712009-08-21 03:15:28 +0000487 unsigned log = tmp.logBase2();
488 if (log == (unsigned)-1) {
489 return isNegative + 1;
Dmitry Venikov9e9eb622019-06-29 11:38:12 +0000490 } else if (isNegative && tmp.isPowerOf2()) {
491 return isNegative + log;
Erick Tryzelaardadb15712009-08-21 03:15:28 +0000492 } else {
493 return isNegative + log + 1;
494 }
Reid Spencer9329e7b2007-04-13 19:19:07 +0000495}
496
Chandler Carruth71bd7d12012-03-04 12:02:57 +0000497hash_code llvm::hash_value(const APInt &Arg) {
498 if (Arg.isSingleWord())
Craig Topperb339c6d2017-05-03 15:46:24 +0000499 return hash_combine(Arg.U.VAL);
Reid Spencerb2bc9852007-02-26 21:02:27 +0000500
Craig Topperb339c6d2017-05-03 15:46:24 +0000501 return hash_combine_range(Arg.U.pVal, Arg.U.pVal + Arg.getNumWords());
Reid Spencerb2bc9852007-02-26 21:02:27 +0000502}
503
Benjamin Kramerb4b51502015-03-25 16:49:59 +0000504bool APInt::isSplat(unsigned SplatSizeInBits) const {
505 assert(getBitWidth() % SplatSizeInBits == 0 &&
506 "SplatSizeInBits must divide width!");
507 // We can check that all parts of an integer are equal by making use of a
508 // little trick: rotate and check if it's still the same value.
509 return *this == rotl(SplatSizeInBits);
510}
511
Pawel Bylica6eeeac72015-04-06 13:31:39 +0000512/// This function returns the high "numBits" bits of this APInt.
Chris Lattner77527f52009-01-21 18:09:24 +0000513APInt APInt::getHiBits(unsigned numBits) const {
Craig Toppere7e35602017-03-31 18:48:14 +0000514 return this->lshr(BitWidth - numBits);
Zhou Shengdac63782007-02-06 03:00:16 +0000515}
516
Pawel Bylica6eeeac72015-04-06 13:31:39 +0000517/// This function returns the low "numBits" bits of this APInt.
Chris Lattner77527f52009-01-21 18:09:24 +0000518APInt APInt::getLoBits(unsigned numBits) const {
Craig Toppere7e35602017-03-31 18:48:14 +0000519 APInt Result(getLowBitsSet(BitWidth, numBits));
520 Result &= *this;
521 return Result;
Zhou Shengdac63782007-02-06 03:00:16 +0000522}
523
Craig Topper9881bd92017-05-02 06:32:27 +0000524/// Return a value containing V broadcasted over NewLen bits.
525APInt APInt::getSplat(unsigned NewLen, const APInt &V) {
526 assert(NewLen >= V.getBitWidth() && "Can't splat to smaller bit width!");
527
528 APInt Val = V.zextOrSelf(NewLen);
529 for (unsigned I = V.getBitWidth(); I < NewLen; I <<= 1)
530 Val |= Val << I;
531
532 return Val;
533}
534
Chris Lattner77527f52009-01-21 18:09:24 +0000535unsigned APInt::countLeadingZerosSlowCase() const {
Matthias Brauna6be4e82016-02-15 20:06:22 +0000536 unsigned Count = 0;
537 for (int i = getNumWords()-1; i >= 0; --i) {
Craig Topperb339c6d2017-05-03 15:46:24 +0000538 uint64_t V = U.pVal[i];
Matthias Brauna6be4e82016-02-15 20:06:22 +0000539 if (V == 0)
Chris Lattner1ac3e252008-08-20 17:02:31 +0000540 Count += APINT_BITS_PER_WORD;
541 else {
Matthias Brauna6be4e82016-02-15 20:06:22 +0000542 Count += llvm::countLeadingZeros(V);
Chris Lattner1ac3e252008-08-20 17:02:31 +0000543 break;
Reid Spencer74cf82e2007-02-21 00:29:48 +0000544 }
Zhou Shengdac63782007-02-06 03:00:16 +0000545 }
Matthias Brauna6be4e82016-02-15 20:06:22 +0000546 // Adjust for unused bits in the most significant word (they are zero).
547 unsigned Mod = BitWidth % APINT_BITS_PER_WORD;
548 Count -= Mod > 0 ? APINT_BITS_PER_WORD - Mod : 0;
John McCalldf951bd2010-02-03 03:42:44 +0000549 return Count;
Zhou Shengdac63782007-02-06 03:00:16 +0000550}
551
Craig Topper40516522017-06-23 20:28:45 +0000552unsigned APInt::countLeadingOnesSlowCase() const {
Chris Lattner77527f52009-01-21 18:09:24 +0000553 unsigned highWordBits = BitWidth % APINT_BITS_PER_WORD;
Torok Edwinec39eb82009-01-27 18:06:03 +0000554 unsigned shift;
555 if (!highWordBits) {
556 highWordBits = APINT_BITS_PER_WORD;
557 shift = 0;
558 } else {
559 shift = APINT_BITS_PER_WORD - highWordBits;
560 }
Reid Spencer31acef52007-02-27 21:59:26 +0000561 int i = getNumWords() - 1;
Craig Topperb339c6d2017-05-03 15:46:24 +0000562 unsigned Count = llvm::countLeadingOnes(U.pVal[i] << shift);
Reid Spencer31acef52007-02-27 21:59:26 +0000563 if (Count == highWordBits) {
564 for (i--; i >= 0; --i) {
Simon Pilgrim8f465052018-08-16 11:08:23 +0000565 if (U.pVal[i] == WORDTYPE_MAX)
Reid Spencer31acef52007-02-27 21:59:26 +0000566 Count += APINT_BITS_PER_WORD;
567 else {
Craig Topperb339c6d2017-05-03 15:46:24 +0000568 Count += llvm::countLeadingOnes(U.pVal[i]);
Reid Spencer31acef52007-02-27 21:59:26 +0000569 break;
570 }
571 }
572 }
573 return Count;
574}
575
Craig Topper40516522017-06-23 20:28:45 +0000576unsigned APInt::countTrailingZerosSlowCase() const {
Chris Lattner77527f52009-01-21 18:09:24 +0000577 unsigned Count = 0;
578 unsigned i = 0;
Craig Topperb339c6d2017-05-03 15:46:24 +0000579 for (; i < getNumWords() && U.pVal[i] == 0; ++i)
Reid Spenceraa8dcfe2007-02-26 07:44:38 +0000580 Count += APINT_BITS_PER_WORD;
581 if (i < getNumWords())
Craig Topperb339c6d2017-05-03 15:46:24 +0000582 Count += llvm::countTrailingZeros(U.pVal[i]);
Chris Lattnerc2c4c742007-11-23 22:36:25 +0000583 return std::min(Count, BitWidth);
Zhou Shengdac63782007-02-06 03:00:16 +0000584}
585
Chris Lattner77527f52009-01-21 18:09:24 +0000586unsigned APInt::countTrailingOnesSlowCase() const {
587 unsigned Count = 0;
588 unsigned i = 0;
Simon Pilgrim8f465052018-08-16 11:08:23 +0000589 for (; i < getNumWords() && U.pVal[i] == WORDTYPE_MAX; ++i)
Dan Gohman8b4fa9d2008-02-13 21:11:05 +0000590 Count += APINT_BITS_PER_WORD;
591 if (i < getNumWords())
Craig Topperb339c6d2017-05-03 15:46:24 +0000592 Count += llvm::countTrailingOnes(U.pVal[i]);
Craig Topper3a29e3b82017-04-22 19:59:11 +0000593 assert(Count <= BitWidth);
594 return Count;
Dan Gohman8b4fa9d2008-02-13 21:11:05 +0000595}
596
Chris Lattner77527f52009-01-21 18:09:24 +0000597unsigned APInt::countPopulationSlowCase() const {
598 unsigned Count = 0;
599 for (unsigned i = 0; i < getNumWords(); ++i)
Craig Topperb339c6d2017-05-03 15:46:24 +0000600 Count += llvm::countPopulation(U.pVal[i]);
Zhou Shengdac63782007-02-06 03:00:16 +0000601 return Count;
602}
603
Craig Topperbaa392e2017-04-20 02:11:27 +0000604bool APInt::intersectsSlowCase(const APInt &RHS) const {
605 for (unsigned i = 0, e = getNumWords(); i != e; ++i)
Craig Topperb339c6d2017-05-03 15:46:24 +0000606 if ((U.pVal[i] & RHS.U.pVal[i]) != 0)
Craig Topperbaa392e2017-04-20 02:11:27 +0000607 return true;
608
609 return false;
610}
611
Craig Toppera8129a12017-04-20 16:17:13 +0000612bool APInt::isSubsetOfSlowCase(const APInt &RHS) const {
613 for (unsigned i = 0, e = getNumWords(); i != e; ++i)
Craig Topperb339c6d2017-05-03 15:46:24 +0000614 if ((U.pVal[i] & ~RHS.U.pVal[i]) != 0)
Craig Toppera8129a12017-04-20 16:17:13 +0000615 return false;
616
617 return true;
618}
619
Reid Spencer1d072122007-02-16 22:36:51 +0000620APInt APInt::byteSwap() const {
621 assert(BitWidth >= 16 && BitWidth % 16 == 0 && "Cannot byteswap!");
622 if (BitWidth == 16)
Craig Topperb339c6d2017-05-03 15:46:24 +0000623 return APInt(BitWidth, ByteSwap_16(uint16_t(U.VAL)));
Richard Smith4f9a8082011-11-23 21:33:37 +0000624 if (BitWidth == 32)
Craig Topperb339c6d2017-05-03 15:46:24 +0000625 return APInt(BitWidth, ByteSwap_32(unsigned(U.VAL)));
Richard Smith4f9a8082011-11-23 21:33:37 +0000626 if (BitWidth == 48) {
Craig Topperb339c6d2017-05-03 15:46:24 +0000627 unsigned Tmp1 = unsigned(U.VAL >> 16);
Zhou Shengcfa2ac02007-02-15 06:36:31 +0000628 Tmp1 = ByteSwap_32(Tmp1);
Craig Topperb339c6d2017-05-03 15:46:24 +0000629 uint16_t Tmp2 = uint16_t(U.VAL);
Zhou Shengcfa2ac02007-02-15 06:36:31 +0000630 Tmp2 = ByteSwap_16(Tmp2);
Jeff Cohene06855e2007-03-20 20:42:36 +0000631 return APInt(BitWidth, (uint64_t(Tmp2) << 32) | Tmp1);
Zhou Shengcfa2ac02007-02-15 06:36:31 +0000632 }
Richard Smith4f9a8082011-11-23 21:33:37 +0000633 if (BitWidth == 64)
Craig Topperb339c6d2017-05-03 15:46:24 +0000634 return APInt(BitWidth, ByteSwap_64(U.VAL));
Richard Smith4f9a8082011-11-23 21:33:37 +0000635
636 APInt Result(getNumWords() * APINT_BITS_PER_WORD, 0);
637 for (unsigned I = 0, N = getNumWords(); I != N; ++I)
Craig Topperb339c6d2017-05-03 15:46:24 +0000638 Result.U.pVal[I] = ByteSwap_64(U.pVal[N - I - 1]);
Richard Smith4f9a8082011-11-23 21:33:37 +0000639 if (Result.BitWidth != BitWidth) {
Richard Smith55bd3752017-04-13 20:29:59 +0000640 Result.lshrInPlace(Result.BitWidth - BitWidth);
Richard Smith4f9a8082011-11-23 21:33:37 +0000641 Result.BitWidth = BitWidth;
642 }
643 return Result;
Zhou Shengdac63782007-02-06 03:00:16 +0000644}
645
Matt Arsenault155dda92016-03-21 15:00:35 +0000646APInt APInt::reverseBits() const {
647 switch (BitWidth) {
648 case 64:
Craig Topperb339c6d2017-05-03 15:46:24 +0000649 return APInt(BitWidth, llvm::reverseBits<uint64_t>(U.VAL));
Matt Arsenault155dda92016-03-21 15:00:35 +0000650 case 32:
Craig Topperb339c6d2017-05-03 15:46:24 +0000651 return APInt(BitWidth, llvm::reverseBits<uint32_t>(U.VAL));
Matt Arsenault155dda92016-03-21 15:00:35 +0000652 case 16:
Craig Topperb339c6d2017-05-03 15:46:24 +0000653 return APInt(BitWidth, llvm::reverseBits<uint16_t>(U.VAL));
Matt Arsenault155dda92016-03-21 15:00:35 +0000654 case 8:
Craig Topperb339c6d2017-05-03 15:46:24 +0000655 return APInt(BitWidth, llvm::reverseBits<uint8_t>(U.VAL));
Matt Arsenault155dda92016-03-21 15:00:35 +0000656 default:
657 break;
658 }
659
660 APInt Val(*this);
Craig Topper9eaef072017-04-18 05:02:21 +0000661 APInt Reversed(BitWidth, 0);
662 unsigned S = BitWidth;
Matt Arsenault155dda92016-03-21 15:00:35 +0000663
Craig Topper9eaef072017-04-18 05:02:21 +0000664 for (; Val != 0; Val.lshrInPlace(1)) {
Matt Arsenault155dda92016-03-21 15:00:35 +0000665 Reversed <<= 1;
Craig Topper9eaef072017-04-18 05:02:21 +0000666 Reversed |= Val[0];
Matt Arsenault155dda92016-03-21 15:00:35 +0000667 --S;
668 }
669
670 Reversed <<= S;
671 return Reversed;
672}
673
Craig Topper278ebd22017-04-01 20:30:57 +0000674APInt llvm::APIntOps::GreatestCommonDivisor(APInt A, APInt B) {
Richard Smith55bd3752017-04-13 20:29:59 +0000675 // Fast-path a common case.
676 if (A == B) return A;
677
678 // Corner cases: if either operand is zero, the other is the gcd.
679 if (!A) return B;
680 if (!B) return A;
681
682 // Count common powers of 2 and remove all other powers of 2.
683 unsigned Pow2;
684 {
685 unsigned Pow2_A = A.countTrailingZeros();
686 unsigned Pow2_B = B.countTrailingZeros();
687 if (Pow2_A > Pow2_B) {
688 A.lshrInPlace(Pow2_A - Pow2_B);
689 Pow2 = Pow2_B;
690 } else if (Pow2_B > Pow2_A) {
691 B.lshrInPlace(Pow2_B - Pow2_A);
692 Pow2 = Pow2_A;
693 } else {
694 Pow2 = Pow2_A;
695 }
Zhou Shengdac63782007-02-06 03:00:16 +0000696 }
Richard Smith55bd3752017-04-13 20:29:59 +0000697
698 // Both operands are odd multiples of 2^Pow_2:
699 //
700 // gcd(a, b) = gcd(|a - b| / 2^i, min(a, b))
701 //
702 // This is a modified version of Stein's algorithm, taking advantage of
703 // efficient countTrailingZeros().
704 while (A != B) {
705 if (A.ugt(B)) {
706 A -= B;
707 A.lshrInPlace(A.countTrailingZeros() - Pow2);
708 } else {
709 B -= A;
710 B.lshrInPlace(B.countTrailingZeros() - Pow2);
711 }
712 }
713
Zhou Shengdac63782007-02-06 03:00:16 +0000714 return A;
715}
Chris Lattner28cbd1d2007-02-06 05:38:37 +0000716
Chris Lattner77527f52009-01-21 18:09:24 +0000717APInt llvm::APIntOps::RoundDoubleToAPInt(double Double, unsigned width) {
JF Bastienc4986ce2018-09-08 03:55:25 +0000718 uint64_t I = bit_cast<uint64_t>(Double);
Reid Spencer974551a2007-02-27 01:28:10 +0000719
720 // Get the sign bit from the highest order bit
JF Bastienc4986ce2018-09-08 03:55:25 +0000721 bool isNeg = I >> 63;
Reid Spencer974551a2007-02-27 01:28:10 +0000722
723 // Get the 11-bit exponent and adjust for the 1023 bit bias
JF Bastienc4986ce2018-09-08 03:55:25 +0000724 int64_t exp = ((I >> 52) & 0x7ff) - 1023;
Reid Spencer974551a2007-02-27 01:28:10 +0000725
726 // If the exponent is negative, the value is < 0 so just return 0.
Zhou Shengd707d632007-02-12 20:02:55 +0000727 if (exp < 0)
Reid Spencer66d0d572007-02-28 01:30:08 +0000728 return APInt(width, 0u);
Reid Spencer974551a2007-02-27 01:28:10 +0000729
730 // Extract the mantissa by clearing the top 12 bits (sign + exponent).
JF Bastienc4986ce2018-09-08 03:55:25 +0000731 uint64_t mantissa = (I & (~0ULL >> 12)) | 1ULL << 52;
Reid Spencer974551a2007-02-27 01:28:10 +0000732
733 // If the exponent doesn't shift all bits out of the mantissa
Zhou Shengd707d632007-02-12 20:02:55 +0000734 if (exp < 52)
Eric Christopher820256b2009-08-21 04:06:45 +0000735 return isNeg ? -APInt(width, mantissa >> (52 - exp)) :
Reid Spencer54abdcf2007-02-27 18:23:40 +0000736 APInt(width, mantissa >> (52 - exp));
737
738 // If the client didn't provide enough bits for us to shift the mantissa into
739 // then the result is undefined, just return 0
740 if (width <= exp - 52)
741 return APInt(width, 0);
Reid Spencer974551a2007-02-27 01:28:10 +0000742
743 // Otherwise, we have to shift the mantissa bits up to the right location
Reid Spencer54abdcf2007-02-27 18:23:40 +0000744 APInt Tmp(width, mantissa);
Craig Topper24e71012017-04-28 03:36:24 +0000745 Tmp <<= (unsigned)exp - 52;
Zhou Shengd707d632007-02-12 20:02:55 +0000746 return isNeg ? -Tmp : Tmp;
747}
748
Pawel Bylica6eeeac72015-04-06 13:31:39 +0000749/// This function converts this APInt to a double.
Zhou Shengd707d632007-02-12 20:02:55 +0000750/// The layout for double is as following (IEEE Standard 754):
751/// --------------------------------------
752/// | Sign Exponent Fraction Bias |
753/// |-------------------------------------- |
754/// | 1[63] 11[62-52] 52[51-00] 1023 |
Eric Christopher820256b2009-08-21 04:06:45 +0000755/// --------------------------------------
Reid Spencer1d072122007-02-16 22:36:51 +0000756double APInt::roundToDouble(bool isSigned) const {
Reid Spencerfb77b2b2007-02-20 08:51:03 +0000757
758 // Handle the simple case where the value is contained in one uint64_t.
Dale Johannesen54be7852009-08-12 18:04:11 +0000759 // It is wrong to optimize getWord(0) to VAL; there might be more than one word.
Reid Spencerbe4ddf62007-02-18 20:09:41 +0000760 if (isSingleWord() || getActiveBits() <= APINT_BITS_PER_WORD) {
761 if (isSigned) {
David Majnemer03992262016-06-24 21:15:36 +0000762 int64_t sext = SignExtend64(getWord(0), BitWidth);
Reid Spencerbe4ddf62007-02-18 20:09:41 +0000763 return double(sext);
764 } else
Dale Johannesen34c08bb2009-08-12 17:42:34 +0000765 return double(getWord(0));
Reid Spencerbe4ddf62007-02-18 20:09:41 +0000766 }
767
Reid Spencerfb77b2b2007-02-20 08:51:03 +0000768 // Determine if the value is negative.
Reid Spencer1d072122007-02-16 22:36:51 +0000769 bool isNeg = isSigned ? (*this)[BitWidth-1] : false;
Reid Spencerfb77b2b2007-02-20 08:51:03 +0000770
771 // Construct the absolute value if we're negative.
Zhou Shengd707d632007-02-12 20:02:55 +0000772 APInt Tmp(isNeg ? -(*this) : (*this));
Reid Spencerfb77b2b2007-02-20 08:51:03 +0000773
774 // Figure out how many bits we're using.
Chris Lattner77527f52009-01-21 18:09:24 +0000775 unsigned n = Tmp.getActiveBits();
Zhou Shengd707d632007-02-12 20:02:55 +0000776
Reid Spencerfb77b2b2007-02-20 08:51:03 +0000777 // The exponent (without bias normalization) is just the number of bits
778 // we are using. Note that the sign bit is gone since we constructed the
779 // absolute value.
780 uint64_t exp = n;
Zhou Shengd707d632007-02-12 20:02:55 +0000781
Reid Spencerfb77b2b2007-02-20 08:51:03 +0000782 // Return infinity for exponent overflow
783 if (exp > 1023) {
784 if (!isSigned || !isNeg)
Jeff Cohene06855e2007-03-20 20:42:36 +0000785 return std::numeric_limits<double>::infinity();
Eric Christopher820256b2009-08-21 04:06:45 +0000786 else
Jeff Cohene06855e2007-03-20 20:42:36 +0000787 return -std::numeric_limits<double>::infinity();
Reid Spencerfb77b2b2007-02-20 08:51:03 +0000788 }
789 exp += 1023; // Increment for 1023 bias
790
791 // Number of bits in mantissa is 52. To obtain the mantissa value, we must
792 // extract the high 52 bits from the correct words in pVal.
Zhou Shengd707d632007-02-12 20:02:55 +0000793 uint64_t mantissa;
Reid Spencerfb77b2b2007-02-20 08:51:03 +0000794 unsigned hiWord = whichWord(n-1);
795 if (hiWord == 0) {
Craig Topperb339c6d2017-05-03 15:46:24 +0000796 mantissa = Tmp.U.pVal[0];
Reid Spencerfb77b2b2007-02-20 08:51:03 +0000797 if (n > 52)
798 mantissa >>= n - 52; // shift down, we want the top 52 bits.
799 } else {
800 assert(hiWord > 0 && "huh?");
Craig Topperb339c6d2017-05-03 15:46:24 +0000801 uint64_t hibits = Tmp.U.pVal[hiWord] << (52 - n % APINT_BITS_PER_WORD);
802 uint64_t lobits = Tmp.U.pVal[hiWord-1] >> (11 + n % APINT_BITS_PER_WORD);
Reid Spencerfb77b2b2007-02-20 08:51:03 +0000803 mantissa = hibits | lobits;
804 }
805
Zhou Shengd707d632007-02-12 20:02:55 +0000806 // The leading bit of mantissa is implicit, so get rid of it.
Reid Spencerfbd48a52007-02-18 00:44:22 +0000807 uint64_t sign = isNeg ? (1ULL << (APINT_BITS_PER_WORD - 1)) : 0;
JF Bastienc4986ce2018-09-08 03:55:25 +0000808 uint64_t I = sign | (exp << 52) | mantissa;
809 return bit_cast<double>(I);
Zhou Shengd707d632007-02-12 20:02:55 +0000810}
811
Reid Spencer1d072122007-02-16 22:36:51 +0000812// Truncate to new width.
Jay Foad583abbc2010-12-07 08:25:19 +0000813APInt APInt::trunc(unsigned width) const {
Reid Spencer1d072122007-02-16 22:36:51 +0000814 assert(width < BitWidth && "Invalid APInt Truncate request");
Chris Lattner1ac3e252008-08-20 17:02:31 +0000815 assert(width && "Can't truncate to 0 bits");
Jay Foad583abbc2010-12-07 08:25:19 +0000816
817 if (width <= APINT_BITS_PER_WORD)
818 return APInt(width, getRawData()[0]);
819
820 APInt Result(getMemory(getNumWords(width)), width);
821
822 // Copy full words.
823 unsigned i;
824 for (i = 0; i != width / APINT_BITS_PER_WORD; i++)
Craig Topperb339c6d2017-05-03 15:46:24 +0000825 Result.U.pVal[i] = U.pVal[i];
Jay Foad583abbc2010-12-07 08:25:19 +0000826
827 // Truncate and copy any partial word.
828 unsigned bits = (0 - width) % APINT_BITS_PER_WORD;
829 if (bits != 0)
Craig Topperb339c6d2017-05-03 15:46:24 +0000830 Result.U.pVal[i] = U.pVal[i] << bits >> bits;
Jay Foad583abbc2010-12-07 08:25:19 +0000831
832 return Result;
Reid Spencer1d072122007-02-16 22:36:51 +0000833}
834
835// Sign extend to a new width.
Craig Topper1dec2812017-04-24 17:37:10 +0000836APInt APInt::sext(unsigned Width) const {
837 assert(Width > BitWidth && "Invalid APInt SignExtend request");
Jay Foad583abbc2010-12-07 08:25:19 +0000838
Craig Topper1dec2812017-04-24 17:37:10 +0000839 if (Width <= APINT_BITS_PER_WORD)
Craig Topperb339c6d2017-05-03 15:46:24 +0000840 return APInt(Width, SignExtend64(U.VAL, BitWidth));
Reid Spencerb6b5cc32007-02-25 23:44:53 +0000841
Craig Topper1dec2812017-04-24 17:37:10 +0000842 APInt Result(getMemory(getNumWords(Width)), Width);
Reid Spencerb6b5cc32007-02-25 23:44:53 +0000843
Craig Topper1dec2812017-04-24 17:37:10 +0000844 // Copy words.
Craig Topperb339c6d2017-05-03 15:46:24 +0000845 std::memcpy(Result.U.pVal, getRawData(), getNumWords() * APINT_WORD_SIZE);
Reid Spencerb6b5cc32007-02-25 23:44:53 +0000846
Craig Topper1dec2812017-04-24 17:37:10 +0000847 // Sign extend the last word since there may be unused bits in the input.
Craig Topperb339c6d2017-05-03 15:46:24 +0000848 Result.U.pVal[getNumWords() - 1] =
849 SignExtend64(Result.U.pVal[getNumWords() - 1],
Craig Topper1dec2812017-04-24 17:37:10 +0000850 ((BitWidth - 1) % APINT_BITS_PER_WORD) + 1);
Jay Foad583abbc2010-12-07 08:25:19 +0000851
Craig Topper1dec2812017-04-24 17:37:10 +0000852 // Fill with sign bits.
Craig Topperb339c6d2017-05-03 15:46:24 +0000853 std::memset(Result.U.pVal + getNumWords(), isNegative() ? -1 : 0,
Craig Topper1dec2812017-04-24 17:37:10 +0000854 (Result.getNumWords() - getNumWords()) * APINT_WORD_SIZE);
855 Result.clearUnusedBits();
Jay Foad583abbc2010-12-07 08:25:19 +0000856 return Result;
Reid Spencer1d072122007-02-16 22:36:51 +0000857}
858
859// Zero extend to a new width.
Jay Foad583abbc2010-12-07 08:25:19 +0000860APInt APInt::zext(unsigned width) const {
Reid Spencer1d072122007-02-16 22:36:51 +0000861 assert(width > BitWidth && "Invalid APInt ZeroExtend request");
Jay Foad583abbc2010-12-07 08:25:19 +0000862
863 if (width <= APINT_BITS_PER_WORD)
Craig Topperb339c6d2017-05-03 15:46:24 +0000864 return APInt(width, U.VAL);
Jay Foad583abbc2010-12-07 08:25:19 +0000865
866 APInt Result(getMemory(getNumWords(width)), width);
867
868 // Copy words.
Craig Topperb339c6d2017-05-03 15:46:24 +0000869 std::memcpy(Result.U.pVal, getRawData(), getNumWords() * APINT_WORD_SIZE);
Jay Foad583abbc2010-12-07 08:25:19 +0000870
871 // Zero remaining words.
Craig Topperb339c6d2017-05-03 15:46:24 +0000872 std::memset(Result.U.pVal + getNumWords(), 0,
Craig Topper1dec2812017-04-24 17:37:10 +0000873 (Result.getNumWords() - getNumWords()) * APINT_WORD_SIZE);
Jay Foad583abbc2010-12-07 08:25:19 +0000874
875 return Result;
Reid Spencer1d072122007-02-16 22:36:51 +0000876}
877
Jay Foad583abbc2010-12-07 08:25:19 +0000878APInt APInt::zextOrTrunc(unsigned width) const {
Reid Spencer742d1702007-03-01 17:15:32 +0000879 if (BitWidth < width)
880 return zext(width);
881 if (BitWidth > width)
882 return trunc(width);
883 return *this;
884}
885
Jay Foad583abbc2010-12-07 08:25:19 +0000886APInt APInt::sextOrTrunc(unsigned width) const {
Reid Spencer742d1702007-03-01 17:15:32 +0000887 if (BitWidth < width)
888 return sext(width);
889 if (BitWidth > width)
890 return trunc(width);
891 return *this;
892}
893
Rafael Espindolabb893fe2012-01-27 23:33:07 +0000894APInt APInt::zextOrSelf(unsigned width) const {
895 if (BitWidth < width)
896 return zext(width);
897 return *this;
898}
899
900APInt APInt::sextOrSelf(unsigned width) const {
901 if (BitWidth < width)
902 return sext(width);
903 return *this;
904}
905
Zhou Shenge93db8f2007-02-09 07:48:24 +0000906/// Arithmetic right-shift this APInt by shiftAmt.
Adrian Prantl4dfcc4a2018-05-01 16:10:38 +0000907/// Arithmetic right-shift function.
Craig Topper8b373262017-04-24 17:18:47 +0000908void APInt::ashrInPlace(const APInt &shiftAmt) {
909 ashrInPlace((unsigned)shiftAmt.getLimitedValue(BitWidth));
Dan Gohman105c1d42008-02-29 01:40:47 +0000910}
911
912/// Arithmetic right-shift this APInt by shiftAmt.
Adrian Prantl4dfcc4a2018-05-01 16:10:38 +0000913/// Arithmetic right-shift function.
Craig Topper8b373262017-04-24 17:18:47 +0000914void APInt::ashrSlowCase(unsigned ShiftAmt) {
915 // Don't bother performing a no-op shift.
916 if (!ShiftAmt)
917 return;
Reid Spencer1825dd02007-03-02 22:39:11 +0000918
Craig Topper8b373262017-04-24 17:18:47 +0000919 // Save the original sign bit for later.
920 bool Negative = isNegative();
Reid Spencer522ca7c2007-02-25 01:56:07 +0000921
Hiroshi Inoue9ff23802018-04-09 04:37:53 +0000922 // WordShift is the inter-part shift; BitShift is intra-part shift.
Craig Topper8b373262017-04-24 17:18:47 +0000923 unsigned WordShift = ShiftAmt / APINT_BITS_PER_WORD;
924 unsigned BitShift = ShiftAmt % APINT_BITS_PER_WORD;
Reid Spenceraa8dcfe2007-02-26 07:44:38 +0000925
Craig Topper8b373262017-04-24 17:18:47 +0000926 unsigned WordsToMove = getNumWords() - WordShift;
927 if (WordsToMove != 0) {
928 // Sign extend the last word to fill in the unused bits.
Craig Topperb339c6d2017-05-03 15:46:24 +0000929 U.pVal[getNumWords() - 1] = SignExtend64(
930 U.pVal[getNumWords() - 1], ((BitWidth - 1) % APINT_BITS_PER_WORD) + 1);
Renato Golincc4a9122017-04-23 12:02:07 +0000931
Craig Topper8b373262017-04-24 17:18:47 +0000932 // Fastpath for moving by whole words.
933 if (BitShift == 0) {
Craig Topperb339c6d2017-05-03 15:46:24 +0000934 std::memmove(U.pVal, U.pVal + WordShift, WordsToMove * APINT_WORD_SIZE);
Craig Topper8b373262017-04-24 17:18:47 +0000935 } else {
936 // Move the words containing significant bits.
937 for (unsigned i = 0; i != WordsToMove - 1; ++i)
Craig Topperb339c6d2017-05-03 15:46:24 +0000938 U.pVal[i] = (U.pVal[i + WordShift] >> BitShift) |
939 (U.pVal[i + WordShift + 1] << (APINT_BITS_PER_WORD - BitShift));
Renato Golincc4a9122017-04-23 12:02:07 +0000940
Craig Topper8b373262017-04-24 17:18:47 +0000941 // Handle the last word which has no high bits to copy.
Craig Topperb339c6d2017-05-03 15:46:24 +0000942 U.pVal[WordsToMove - 1] = U.pVal[WordShift + WordsToMove - 1] >> BitShift;
Craig Topper8b373262017-04-24 17:18:47 +0000943 // Sign extend one more time.
Craig Topperb339c6d2017-05-03 15:46:24 +0000944 U.pVal[WordsToMove - 1] =
945 SignExtend64(U.pVal[WordsToMove - 1], APINT_BITS_PER_WORD - BitShift);
Chris Lattnerdad2d092007-05-03 18:15:36 +0000946 }
Reid Spenceraa8dcfe2007-02-26 07:44:38 +0000947 }
948
Craig Topper8b373262017-04-24 17:18:47 +0000949 // Fill in the remainder based on the original sign.
Craig Topperb339c6d2017-05-03 15:46:24 +0000950 std::memset(U.pVal + WordsToMove, Negative ? -1 : 0,
Craig Topper8b373262017-04-24 17:18:47 +0000951 WordShift * APINT_WORD_SIZE);
952 clearUnusedBits();
Zhou Shengfbf61ea2007-02-08 14:35:19 +0000953}
954
Zhou Shenge93db8f2007-02-09 07:48:24 +0000955/// Logical right-shift this APInt by shiftAmt.
Adrian Prantl4dfcc4a2018-05-01 16:10:38 +0000956/// Logical right-shift function.
Craig Topperfc947bc2017-04-18 17:14:21 +0000957void APInt::lshrInPlace(const APInt &shiftAmt) {
958 lshrInPlace((unsigned)shiftAmt.getLimitedValue(BitWidth));
Dan Gohman105c1d42008-02-29 01:40:47 +0000959}
960
961/// Logical right-shift this APInt by shiftAmt.
Adrian Prantl4dfcc4a2018-05-01 16:10:38 +0000962/// Logical right-shift function.
Craig Topperae8bd672017-04-18 19:13:27 +0000963void APInt::lshrSlowCase(unsigned ShiftAmt) {
Craig Topperb339c6d2017-05-03 15:46:24 +0000964 tcShiftRight(U.pVal, getNumWords(), ShiftAmt);
Zhou Shengfbf61ea2007-02-08 14:35:19 +0000965}
966
Zhou Shenge93db8f2007-02-09 07:48:24 +0000967/// Left-shift this APInt by shiftAmt.
Adrian Prantl4dfcc4a2018-05-01 16:10:38 +0000968/// Left-shift function.
Craig Topper24e71012017-04-28 03:36:24 +0000969APInt &APInt::operator<<=(const APInt &shiftAmt) {
Nick Lewycky030c4502009-01-19 17:42:33 +0000970 // It's undefined behavior in C to shift by BitWidth or greater.
Craig Topper24e71012017-04-28 03:36:24 +0000971 *this <<= (unsigned)shiftAmt.getLimitedValue(BitWidth);
972 return *this;
Dan Gohman105c1d42008-02-29 01:40:47 +0000973}
974
Craig Toppera8a4f0d2017-04-18 04:39:48 +0000975void APInt::shlSlowCase(unsigned ShiftAmt) {
Craig Topperb339c6d2017-05-03 15:46:24 +0000976 tcShiftLeft(U.pVal, getNumWords(), ShiftAmt);
Craig Toppera8a4f0d2017-04-18 04:39:48 +0000977 clearUnusedBits();
Zhou Shengfbf61ea2007-02-08 14:35:19 +0000978}
979
Joey Gouly51c0ae52017-02-07 11:58:22 +0000980// Calculate the rotate amount modulo the bit width.
981static unsigned rotateModulo(unsigned BitWidth, const APInt &rotateAmt) {
982 unsigned rotBitWidth = rotateAmt.getBitWidth();
983 APInt rot = rotateAmt;
984 if (rotBitWidth < BitWidth) {
985 // Extend the rotate APInt, so that the urem doesn't divide by 0.
986 // e.g. APInt(1, 32) would give APInt(1, 0).
987 rot = rotateAmt.zext(BitWidth);
988 }
989 rot = rot.urem(APInt(rot.getBitWidth(), BitWidth));
990 return rot.getLimitedValue(BitWidth);
991}
992
Dan Gohman105c1d42008-02-29 01:40:47 +0000993APInt APInt::rotl(const APInt &rotateAmt) const {
Joey Gouly51c0ae52017-02-07 11:58:22 +0000994 return rotl(rotateModulo(BitWidth, rotateAmt));
Dan Gohman105c1d42008-02-29 01:40:47 +0000995}
996
Chris Lattner77527f52009-01-21 18:09:24 +0000997APInt APInt::rotl(unsigned rotateAmt) const {
Eli Friedman2aae94f2011-12-22 03:15:35 +0000998 rotateAmt %= BitWidth;
Reid Spencer98ed7db2007-05-14 00:15:28 +0000999 if (rotateAmt == 0)
1000 return *this;
Eli Friedman2aae94f2011-12-22 03:15:35 +00001001 return shl(rotateAmt) | lshr(BitWidth - rotateAmt);
Reid Spencer4c50b522007-05-13 23:44:59 +00001002}
1003
Dan Gohman105c1d42008-02-29 01:40:47 +00001004APInt APInt::rotr(const APInt &rotateAmt) const {
Joey Gouly51c0ae52017-02-07 11:58:22 +00001005 return rotr(rotateModulo(BitWidth, rotateAmt));
Dan Gohman105c1d42008-02-29 01:40:47 +00001006}
1007
Chris Lattner77527f52009-01-21 18:09:24 +00001008APInt APInt::rotr(unsigned rotateAmt) const {
Eli Friedman2aae94f2011-12-22 03:15:35 +00001009 rotateAmt %= BitWidth;
Reid Spencer98ed7db2007-05-14 00:15:28 +00001010 if (rotateAmt == 0)
1011 return *this;
Eli Friedman2aae94f2011-12-22 03:15:35 +00001012 return lshr(rotateAmt) | shl(BitWidth - rotateAmt);
Reid Spencer4c50b522007-05-13 23:44:59 +00001013}
Reid Spencerd99feaf2007-03-01 05:39:56 +00001014
1015// Square Root - this method computes and returns the square root of "this".
1016// Three mechanisms are used for computation. For small values (<= 5 bits),
1017// a table lookup is done. This gets some performance for common cases. For
1018// values using less than 52 bits, the value is converted to double and then
1019// the libc sqrt function is called. The result is rounded and then converted
1020// back to a uint64_t which is then used to construct the result. Finally,
Eric Christopher820256b2009-08-21 04:06:45 +00001021// the Babylonian method for computing square roots is used.
Reid Spencerd99feaf2007-03-01 05:39:56 +00001022APInt APInt::sqrt() const {
1023
1024 // Determine the magnitude of the value.
Chris Lattner77527f52009-01-21 18:09:24 +00001025 unsigned magnitude = getActiveBits();
Reid Spencerd99feaf2007-03-01 05:39:56 +00001026
1027 // Use a fast table for some small values. This also gets rid of some
1028 // rounding errors in libc sqrt for small values.
1029 if (magnitude <= 5) {
Reid Spencer2f6ad4d2007-03-01 17:47:31 +00001030 static const uint8_t results[32] = {
Reid Spencerc8841d22007-03-01 06:23:32 +00001031 /* 0 */ 0,
1032 /* 1- 2 */ 1, 1,
Eric Christopher820256b2009-08-21 04:06:45 +00001033 /* 3- 6 */ 2, 2, 2, 2,
Reid Spencerc8841d22007-03-01 06:23:32 +00001034 /* 7-12 */ 3, 3, 3, 3, 3, 3,
1035 /* 13-20 */ 4, 4, 4, 4, 4, 4, 4, 4,
1036 /* 21-30 */ 5, 5, 5, 5, 5, 5, 5, 5, 5, 5,
1037 /* 31 */ 6
1038 };
Craig Topperb339c6d2017-05-03 15:46:24 +00001039 return APInt(BitWidth, results[ (isSingleWord() ? U.VAL : U.pVal[0]) ]);
Reid Spencerd99feaf2007-03-01 05:39:56 +00001040 }
1041
1042 // If the magnitude of the value fits in less than 52 bits (the precision of
1043 // an IEEE double precision floating point value), then we can use the
1044 // libc sqrt function which will probably use a hardware sqrt computation.
1045 // This should be faster than the algorithm below.
Jeff Cohenb622c112007-03-05 00:00:42 +00001046 if (magnitude < 52) {
Eric Christopher820256b2009-08-21 04:06:45 +00001047 return APInt(BitWidth,
Craig Topperb339c6d2017-05-03 15:46:24 +00001048 uint64_t(::round(::sqrt(double(isSingleWord() ? U.VAL
1049 : U.pVal[0])))));
Jeff Cohenb622c112007-03-05 00:00:42 +00001050 }
Reid Spencerd99feaf2007-03-01 05:39:56 +00001051
1052 // Okay, all the short cuts are exhausted. We must compute it. The following
1053 // is a classical Babylonian method for computing the square root. This code
Sanjay Patel4cb54e02014-09-11 15:41:01 +00001054 // was adapted to APInt from a wikipedia article on such computations.
Reid Spencerd99feaf2007-03-01 05:39:56 +00001055 // See http://www.wikipedia.org/ and go to the page named
Eric Christopher820256b2009-08-21 04:06:45 +00001056 // Calculate_an_integer_square_root.
Chris Lattner77527f52009-01-21 18:09:24 +00001057 unsigned nbits = BitWidth, i = 4;
Reid Spencerd99feaf2007-03-01 05:39:56 +00001058 APInt testy(BitWidth, 16);
1059 APInt x_old(BitWidth, 1);
1060 APInt x_new(BitWidth, 0);
1061 APInt two(BitWidth, 2);
1062
1063 // Select a good starting value using binary logarithms.
Eric Christopher820256b2009-08-21 04:06:45 +00001064 for (;; i += 2, testy = testy.shl(2))
Reid Spencerd99feaf2007-03-01 05:39:56 +00001065 if (i >= nbits || this->ule(testy)) {
1066 x_old = x_old.shl(i / 2);
1067 break;
1068 }
1069
Eric Christopher820256b2009-08-21 04:06:45 +00001070 // Use the Babylonian method to arrive at the integer square root:
Reid Spencerd99feaf2007-03-01 05:39:56 +00001071 for (;;) {
1072 x_new = (this->udiv(x_old) + x_old).udiv(two);
1073 if (x_old.ule(x_new))
1074 break;
1075 x_old = x_new;
1076 }
1077
1078 // Make sure we return the closest approximation
Eric Christopher820256b2009-08-21 04:06:45 +00001079 // NOTE: The rounding calculation below is correct. It will produce an
Reid Spencercf817562007-03-02 04:21:55 +00001080 // off-by-one discrepancy with results from pari/gp. That discrepancy has been
Eric Christopher820256b2009-08-21 04:06:45 +00001081 // determined to be a rounding issue with pari/gp as it begins to use a
Reid Spencercf817562007-03-02 04:21:55 +00001082 // floating point representation after 192 bits. There are no discrepancies
1083 // between this algorithm and pari/gp for bit widths < 192 bits.
Reid Spencerd99feaf2007-03-01 05:39:56 +00001084 APInt square(x_old * x_old);
1085 APInt nextSquare((x_old + 1) * (x_old +1));
1086 if (this->ult(square))
1087 return x_old;
David Blaikie54c94622011-12-01 20:58:30 +00001088 assert(this->ule(nextSquare) && "Error in APInt::sqrt computation");
1089 APInt midpoint((nextSquare - square).udiv(two));
1090 APInt offset(*this - square);
1091 if (offset.ult(midpoint))
1092 return x_old;
Reid Spencerd99feaf2007-03-01 05:39:56 +00001093 return x_old + 1;
1094}
1095
Wojciech Matyjewicz41b744d2008-06-23 19:39:50 +00001096/// Computes the multiplicative inverse of this APInt for a given modulo. The
1097/// iterative extended Euclidean algorithm is used to solve for this value,
1098/// however we simplify it to speed up calculating only the inverse, and take
1099/// advantage of div+rem calculations. We also use some tricks to avoid copying
1100/// (potentially large) APInts around.
Roman Lebedev29d05c02019-06-27 21:52:10 +00001101/// WARNING: a value of '0' may be returned,
1102/// signifying that no multiplicative inverse exists!
Wojciech Matyjewicz41b744d2008-06-23 19:39:50 +00001103APInt APInt::multiplicativeInverse(const APInt& modulo) const {
1104 assert(ult(modulo) && "This APInt must be smaller than the modulo");
1105
1106 // Using the properties listed at the following web page (accessed 06/21/08):
1107 // http://www.numbertheory.org/php/euclid.html
1108 // (especially the properties numbered 3, 4 and 9) it can be proved that
1109 // BitWidth bits suffice for all the computations in the algorithm implemented
1110 // below. More precisely, this number of bits suffice if the multiplicative
1111 // inverse exists, but may not suffice for the general extended Euclidean
1112 // algorithm.
1113
1114 APInt r[2] = { modulo, *this };
1115 APInt t[2] = { APInt(BitWidth, 0), APInt(BitWidth, 1) };
1116 APInt q(BitWidth, 0);
Eric Christopher820256b2009-08-21 04:06:45 +00001117
Wojciech Matyjewicz41b744d2008-06-23 19:39:50 +00001118 unsigned i;
1119 for (i = 0; r[i^1] != 0; i ^= 1) {
1120 // An overview of the math without the confusing bit-flipping:
1121 // q = r[i-2] / r[i-1]
1122 // r[i] = r[i-2] % r[i-1]
1123 // t[i] = t[i-2] - t[i-1] * q
1124 udivrem(r[i], r[i^1], q, r[i]);
1125 t[i] -= t[i^1] * q;
1126 }
1127
1128 // If this APInt and the modulo are not coprime, there is no multiplicative
1129 // inverse, so return 0. We check this by looking at the next-to-last
1130 // remainder, which is the gcd(*this,modulo) as calculated by the Euclidean
1131 // algorithm.
1132 if (r[i] != 1)
1133 return APInt(BitWidth, 0);
1134
1135 // The next-to-last t is the multiplicative inverse. However, we are
Craig Topper3fbecad2017-05-11 17:57:43 +00001136 // interested in a positive inverse. Calculate a positive one from a negative
Wojciech Matyjewicz41b744d2008-06-23 19:39:50 +00001137 // one if necessary. A simple addition of the modulo suffices because
Wojciech Matyjewiczf0d21cd2008-07-20 15:55:14 +00001138 // abs(t[i]) is known to be less than *this/2 (see the link above).
Craig Topperdbd62192017-05-11 18:40:53 +00001139 if (t[i].isNegative())
1140 t[i] += modulo;
1141
1142 return std::move(t[i]);
Wojciech Matyjewicz41b744d2008-06-23 19:39:50 +00001143}
1144
Jay Foadfe0c6482009-04-30 10:15:35 +00001145/// Calculate the magic numbers required to implement a signed integer division
1146/// by a constant as a sequence of multiplies, adds and shifts. Requires that
1147/// the divisor not be 0, 1, or -1. Taken from "Hacker's Delight", Henry S.
1148/// Warren, Jr., chapter 10.
1149APInt::ms APInt::magic() const {
1150 const APInt& d = *this;
1151 unsigned p;
1152 APInt ad, anc, delta, q1, r1, q2, r2, t;
Jay Foadfe0c6482009-04-30 10:15:35 +00001153 APInt signedMin = APInt::getSignedMinValue(d.getBitWidth());
Jay Foadfe0c6482009-04-30 10:15:35 +00001154 struct ms mag;
Eric Christopher820256b2009-08-21 04:06:45 +00001155
Jay Foadfe0c6482009-04-30 10:15:35 +00001156 ad = d.abs();
1157 t = signedMin + (d.lshr(d.getBitWidth() - 1));
1158 anc = t - 1 - t.urem(ad); // absolute value of nc
1159 p = d.getBitWidth() - 1; // initialize p
1160 q1 = signedMin.udiv(anc); // initialize q1 = 2p/abs(nc)
1161 r1 = signedMin - q1*anc; // initialize r1 = rem(2p,abs(nc))
1162 q2 = signedMin.udiv(ad); // initialize q2 = 2p/abs(d)
1163 r2 = signedMin - q2*ad; // initialize r2 = rem(2p,abs(d))
1164 do {
1165 p = p + 1;
1166 q1 = q1<<1; // update q1 = 2p/abs(nc)
1167 r1 = r1<<1; // update r1 = rem(2p/abs(nc))
1168 if (r1.uge(anc)) { // must be unsigned comparison
1169 q1 = q1 + 1;
1170 r1 = r1 - anc;
1171 }
1172 q2 = q2<<1; // update q2 = 2p/abs(d)
1173 r2 = r2<<1; // update r2 = rem(2p/abs(d))
1174 if (r2.uge(ad)) { // must be unsigned comparison
1175 q2 = q2 + 1;
1176 r2 = r2 - ad;
1177 }
1178 delta = ad - r2;
Cameron Zwarich8731d0c2011-02-21 00:22:02 +00001179 } while (q1.ult(delta) || (q1 == delta && r1 == 0));
Eric Christopher820256b2009-08-21 04:06:45 +00001180
Jay Foadfe0c6482009-04-30 10:15:35 +00001181 mag.m = q2 + 1;
1182 if (d.isNegative()) mag.m = -mag.m; // resulting magic number
1183 mag.s = p - d.getBitWidth(); // resulting shift
1184 return mag;
1185}
1186
1187/// Calculate the magic numbers required to implement an unsigned integer
1188/// division by a constant as a sequence of multiplies, adds and shifts.
1189/// Requires that the divisor not be 0. Taken from "Hacker's Delight", Henry
1190/// S. Warren, Jr., chapter 10.
Benjamin Kramer09a51ba2011-03-17 20:39:06 +00001191/// LeadingZeros can be used to simplify the calculation if the upper bits
Chris Lattner0ab5e2c2011-04-15 05:18:47 +00001192/// of the divided value are known zero.
Benjamin Kramer09a51ba2011-03-17 20:39:06 +00001193APInt::mu APInt::magicu(unsigned LeadingZeros) const {
Jay Foadfe0c6482009-04-30 10:15:35 +00001194 const APInt& d = *this;
1195 unsigned p;
1196 APInt nc, delta, q1, r1, q2, r2;
1197 struct mu magu;
1198 magu.a = 0; // initialize "add" indicator
Benjamin Kramer09a51ba2011-03-17 20:39:06 +00001199 APInt allOnes = APInt::getAllOnesValue(d.getBitWidth()).lshr(LeadingZeros);
Jay Foadfe0c6482009-04-30 10:15:35 +00001200 APInt signedMin = APInt::getSignedMinValue(d.getBitWidth());
1201 APInt signedMax = APInt::getSignedMaxValue(d.getBitWidth());
1202
Benjamin Kramer3aab6a82012-07-11 18:31:59 +00001203 nc = allOnes - (allOnes - d).urem(d);
Jay Foadfe0c6482009-04-30 10:15:35 +00001204 p = d.getBitWidth() - 1; // initialize p
1205 q1 = signedMin.udiv(nc); // initialize q1 = 2p/nc
1206 r1 = signedMin - q1*nc; // initialize r1 = rem(2p,nc)
1207 q2 = signedMax.udiv(d); // initialize q2 = (2p-1)/d
1208 r2 = signedMax - q2*d; // initialize r2 = rem((2p-1),d)
1209 do {
1210 p = p + 1;
1211 if (r1.uge(nc - r1)) {
1212 q1 = q1 + q1 + 1; // update q1
1213 r1 = r1 + r1 - nc; // update r1
1214 }
1215 else {
1216 q1 = q1+q1; // update q1
1217 r1 = r1+r1; // update r1
1218 }
1219 if ((r2 + 1).uge(d - r2)) {
1220 if (q2.uge(signedMax)) magu.a = 1;
1221 q2 = q2+q2 + 1; // update q2
1222 r2 = r2+r2 + 1 - d; // update r2
1223 }
1224 else {
1225 if (q2.uge(signedMin)) magu.a = 1;
1226 q2 = q2+q2; // update q2
1227 r2 = r2+r2 + 1; // update r2
1228 }
1229 delta = d - 1 - r2;
1230 } while (p < d.getBitWidth()*2 &&
1231 (q1.ult(delta) || (q1 == delta && r1 == 0)));
1232 magu.m = q2 + 1; // resulting magic number
1233 magu.s = p - d.getBitWidth(); // resulting shift
1234 return magu;
1235}
1236
Reid Spencerfb77b2b2007-02-20 08:51:03 +00001237/// Implementation of Knuth's Algorithm D (Division of nonnegative integers)
1238/// from "Art of Computer Programming, Volume 2", section 4.3.1, p. 272. The
1239/// variables here have the same names as in the algorithm. Comments explain
1240/// the algorithm and any deviation from it.
Craig Topper6271bc72017-05-10 18:15:20 +00001241static void KnuthDiv(uint32_t *u, uint32_t *v, uint32_t *q, uint32_t* r,
Chris Lattner77527f52009-01-21 18:09:24 +00001242 unsigned m, unsigned n) {
Reid Spencerfb77b2b2007-02-20 08:51:03 +00001243 assert(u && "Must provide dividend");
1244 assert(v && "Must provide divisor");
1245 assert(q && "Must provide quotient");
Yaron Keren39fc5a62015-03-26 19:45:19 +00001246 assert(u != v && u != q && v != q && "Must use different memory");
Reid Spencerfb77b2b2007-02-20 08:51:03 +00001247 assert(n>1 && "n must be > 1");
1248
Yaron Keren39fc5a62015-03-26 19:45:19 +00001249 // b denotes the base of the number system. In our case b is 2^32.
George Burgess IV381fc0e2016-08-25 01:05:08 +00001250 const uint64_t b = uint64_t(1) << 32;
Reid Spencerfb77b2b2007-02-20 08:51:03 +00001251
Craig Topper03106bb2017-11-24 20:29:04 +00001252// The DEBUG macros here tend to be spam in the debug output if you're not
1253// debugging this code. Disable them unless KNUTH_DEBUG is defined.
Tim Northoverb3766452018-08-06 11:43:11 +00001254#ifdef KNUTH_DEBUG
1255#define DEBUG_KNUTH(X) LLVM_DEBUG(X)
1256#else
1257#define DEBUG_KNUTH(X) do {} while(false)
Craig Topper03106bb2017-11-24 20:29:04 +00001258#endif
1259
Tim Northoverb3766452018-08-06 11:43:11 +00001260 DEBUG_KNUTH(dbgs() << "KnuthDiv: m=" << m << " n=" << n << '\n');
1261 DEBUG_KNUTH(dbgs() << "KnuthDiv: original:");
1262 DEBUG_KNUTH(for (int i = m + n; i >= 0; i--) dbgs() << " " << u[i]);
1263 DEBUG_KNUTH(dbgs() << " by");
1264 DEBUG_KNUTH(for (int i = n; i > 0; i--) dbgs() << " " << v[i - 1]);
1265 DEBUG_KNUTH(dbgs() << '\n');
Eric Christopher820256b2009-08-21 04:06:45 +00001266 // D1. [Normalize.] Set d = b / (v[n-1] + 1) and multiply all the digits of
1267 // u and v by d. Note that we have taken Knuth's advice here to use a power
1268 // of 2 value for d such that d * v[n-1] >= b/2 (b is the base). A power of
1269 // 2 allows us to shift instead of multiply and it is easy to determine the
Reid Spencerfb77b2b2007-02-20 08:51:03 +00001270 // shift amount from the leading zeros. We are basically normalizing the u
1271 // and v so that its high bits are shifted to the top of v's range without
1272 // overflow. Note that this can require an extra word in u so that u must
1273 // be of length m+n+1.
Michael J. Spencerdf1ecbd72013-05-24 22:23:49 +00001274 unsigned shift = countLeadingZeros(v[n-1]);
Craig Topper6271bc72017-05-10 18:15:20 +00001275 uint32_t v_carry = 0;
1276 uint32_t u_carry = 0;
Reid Spencerfb77b2b2007-02-20 08:51:03 +00001277 if (shift) {
Chris Lattner77527f52009-01-21 18:09:24 +00001278 for (unsigned i = 0; i < m+n; ++i) {
Craig Topper6271bc72017-05-10 18:15:20 +00001279 uint32_t u_tmp = u[i] >> (32 - shift);
Reid Spencerfb77b2b2007-02-20 08:51:03 +00001280 u[i] = (u[i] << shift) | u_carry;
1281 u_carry = u_tmp;
Reid Spencer100502d2007-02-17 03:16:00 +00001282 }
Chris Lattner77527f52009-01-21 18:09:24 +00001283 for (unsigned i = 0; i < n; ++i) {
Craig Topper6271bc72017-05-10 18:15:20 +00001284 uint32_t v_tmp = v[i] >> (32 - shift);
Reid Spencerfb77b2b2007-02-20 08:51:03 +00001285 v[i] = (v[i] << shift) | v_carry;
1286 v_carry = v_tmp;
1287 }
1288 }
1289 u[m+n] = u_carry;
Yaron Keren39fc5a62015-03-26 19:45:19 +00001290
Tim Northoverb3766452018-08-06 11:43:11 +00001291 DEBUG_KNUTH(dbgs() << "KnuthDiv: normal:");
1292 DEBUG_KNUTH(for (int i = m + n; i >= 0; i--) dbgs() << " " << u[i]);
1293 DEBUG_KNUTH(dbgs() << " by");
1294 DEBUG_KNUTH(for (int i = n; i > 0; i--) dbgs() << " " << v[i - 1]);
1295 DEBUG_KNUTH(dbgs() << '\n');
Reid Spencerfb77b2b2007-02-20 08:51:03 +00001296
1297 // D2. [Initialize j.] Set j to m. This is the loop counter over the places.
1298 int j = m;
1299 do {
Tim Northoverb3766452018-08-06 11:43:11 +00001300 DEBUG_KNUTH(dbgs() << "KnuthDiv: quotient digit #" << j << '\n');
Eric Christopher820256b2009-08-21 04:06:45 +00001301 // D3. [Calculate q'.].
Reid Spencerfb77b2b2007-02-20 08:51:03 +00001302 // Set qp = (u[j+n]*b + u[j+n-1]) / v[n-1]. (qp=qprime=q')
1303 // Set rp = (u[j+n]*b + u[j+n-1]) % v[n-1]. (rp=rprime=r')
1304 // Now test if qp == b or qp*v[n-2] > b*rp + u[j+n-2]; if so, decrease
Craig Topper4b83b4d2017-05-13 00:35:30 +00001305 // qp by 1, increase rp by v[n-1], and repeat this test if rp < b. The test
Reid Spencerfb77b2b2007-02-20 08:51:03 +00001306 // on v[n-2] determines at high speed most of the cases in which the trial
Eric Christopher820256b2009-08-21 04:06:45 +00001307 // value qp is one too large, and it eliminates all cases where qp is two
1308 // too large.
Craig Topper2c9a7062017-05-13 07:14:17 +00001309 uint64_t dividend = Make_64(u[j+n], u[j+n-1]);
Tim Northoverb3766452018-08-06 11:43:11 +00001310 DEBUG_KNUTH(dbgs() << "KnuthDiv: dividend == " << dividend << '\n');
Reid Spencercb292e42007-02-23 01:57:13 +00001311 uint64_t qp = dividend / v[n-1];
1312 uint64_t rp = dividend % v[n-1];
Reid Spencerfb77b2b2007-02-20 08:51:03 +00001313 if (qp == b || qp*v[n-2] > b*rp + u[j+n-2]) {
1314 qp--;
1315 rp += v[n-1];
Reid Spencerdf6cf5a2007-02-24 10:01:42 +00001316 if (rp < b && (qp == b || qp*v[n-2] > b*rp + u[j+n-2]))
Reid Spencera5e0d202007-02-24 03:58:46 +00001317 qp--;
Reid Spencercb292e42007-02-23 01:57:13 +00001318 }
Tim Northoverb3766452018-08-06 11:43:11 +00001319 DEBUG_KNUTH(dbgs() << "KnuthDiv: qp == " << qp << ", rp == " << rp << '\n');
Reid Spencerfb77b2b2007-02-20 08:51:03 +00001320
Reid Spencercb292e42007-02-23 01:57:13 +00001321 // D4. [Multiply and subtract.] Replace (u[j+n]u[j+n-1]...u[j]) with
1322 // (u[j+n]u[j+n-1]..u[j]) - qp * (v[n-1]...v[1]v[0]). This computation
1323 // consists of a simple multiplication by a one-place number, combined with
Eric Christopher820256b2009-08-21 04:06:45 +00001324 // a subtraction.
Yaron Keren39fc5a62015-03-26 19:45:19 +00001325 // The digits (u[j+n]...u[j]) should be kept positive; if the result of
1326 // this step is actually negative, (u[j+n]...u[j]) should be left as the
1327 // true value plus b**(n+1), namely as the b's complement of
1328 // the true value, and a "borrow" to the left should be remembered.
Pawel Bylica86ac4472015-04-24 07:38:39 +00001329 int64_t borrow = 0;
Chris Lattner77527f52009-01-21 18:09:24 +00001330 for (unsigned i = 0; i < n; ++i) {
Pawel Bylica86ac4472015-04-24 07:38:39 +00001331 uint64_t p = uint64_t(qp) * uint64_t(v[i]);
Craig Topper2c9a7062017-05-13 07:14:17 +00001332 int64_t subres = int64_t(u[j+i]) - borrow - Lo_32(p);
1333 u[j+i] = Lo_32(subres);
1334 borrow = Hi_32(p) - Hi_32(subres);
Tim Northoverb3766452018-08-06 11:43:11 +00001335 DEBUG_KNUTH(dbgs() << "KnuthDiv: u[j+i] = " << u[j + i]
Nicola Zaghend34e60c2018-05-14 12:53:11 +00001336 << ", borrow = " << borrow << '\n');
Reid Spencera5e0d202007-02-24 03:58:46 +00001337 }
Pawel Bylica86ac4472015-04-24 07:38:39 +00001338 bool isNeg = u[j+n] < borrow;
Craig Topper2c9a7062017-05-13 07:14:17 +00001339 u[j+n] -= Lo_32(borrow);
Pawel Bylica86ac4472015-04-24 07:38:39 +00001340
Tim Northoverb3766452018-08-06 11:43:11 +00001341 DEBUG_KNUTH(dbgs() << "KnuthDiv: after subtraction:");
1342 DEBUG_KNUTH(for (int i = m + n; i >= 0; i--) dbgs() << " " << u[i]);
1343 DEBUG_KNUTH(dbgs() << '\n');
Reid Spencerfb77b2b2007-02-20 08:51:03 +00001344
Eric Christopher820256b2009-08-21 04:06:45 +00001345 // D5. [Test remainder.] Set q[j] = qp. If the result of step D4 was
Reid Spencerfb77b2b2007-02-20 08:51:03 +00001346 // negative, go to step D6; otherwise go on to step D7.
Craig Topper2c9a7062017-05-13 07:14:17 +00001347 q[j] = Lo_32(qp);
Reid Spenceraa8dcfe2007-02-26 07:44:38 +00001348 if (isNeg) {
Eric Christopher820256b2009-08-21 04:06:45 +00001349 // D6. [Add back]. The probability that this step is necessary is very
Reid Spencerfb77b2b2007-02-20 08:51:03 +00001350 // small, on the order of only 2/b. Make sure that test data accounts for
Eric Christopher820256b2009-08-21 04:06:45 +00001351 // this possibility. Decrease q[j] by 1
Reid Spencercb292e42007-02-23 01:57:13 +00001352 q[j]--;
Eric Christopher820256b2009-08-21 04:06:45 +00001353 // and add (0v[n-1]...v[1]v[0]) to (u[j+n]u[j+n-1]...u[j+1]u[j]).
1354 // A carry will occur to the left of u[j+n], and it should be ignored
Reid Spencercb292e42007-02-23 01:57:13 +00001355 // since it cancels with the borrow that occurred in D4.
1356 bool carry = false;
Chris Lattner77527f52009-01-21 18:09:24 +00001357 for (unsigned i = 0; i < n; i++) {
Craig Topper6271bc72017-05-10 18:15:20 +00001358 uint32_t limit = std::min(u[j+i],v[i]);
Reid Spencerfb77b2b2007-02-20 08:51:03 +00001359 u[j+i] += v[i] + carry;
Reid Spencera5e0d202007-02-24 03:58:46 +00001360 carry = u[j+i] < limit || (carry && u[j+i] == limit);
Reid Spencerfb77b2b2007-02-20 08:51:03 +00001361 }
Reid Spencera5e0d202007-02-24 03:58:46 +00001362 u[j+n] += carry;
Reid Spencerfb77b2b2007-02-20 08:51:03 +00001363 }
Tim Northoverb3766452018-08-06 11:43:11 +00001364 DEBUG_KNUTH(dbgs() << "KnuthDiv: after correction:");
1365 DEBUG_KNUTH(for (int i = m + n; i >= 0; i--) dbgs() << " " << u[i]);
1366 DEBUG_KNUTH(dbgs() << "\nKnuthDiv: digit result = " << q[j] << '\n');
Reid Spencerfb77b2b2007-02-20 08:51:03 +00001367
Nicola Zaghend34e60c2018-05-14 12:53:11 +00001368 // D7. [Loop on j.] Decrease j by one. Now if j >= 0, go back to D3.
Reid Spencercb292e42007-02-23 01:57:13 +00001369 } while (--j >= 0);
Reid Spencerfb77b2b2007-02-20 08:51:03 +00001370
Tim Northoverb3766452018-08-06 11:43:11 +00001371 DEBUG_KNUTH(dbgs() << "KnuthDiv: quotient:");
1372 DEBUG_KNUTH(for (int i = m; i >= 0; i--) dbgs() << " " << q[i]);
1373 DEBUG_KNUTH(dbgs() << '\n');
Reid Spencera5e0d202007-02-24 03:58:46 +00001374
Reid Spencerfb77b2b2007-02-20 08:51:03 +00001375 // D8. [Unnormalize]. Now q[...] is the desired quotient, and the desired
1376 // remainder may be obtained by dividing u[...] by d. If r is non-null we
1377 // compute the remainder (urem uses this).
1378 if (r) {
1379 // The value d is expressed by the "shift" value above since we avoided
1380 // multiplication by d by using a shift left. So, all we have to do is
Simon Pilgrim0099beb2017-03-09 13:57:04 +00001381 // shift right here.
Reid Spencer468ad9112007-02-24 20:38:01 +00001382 if (shift) {
Craig Topper6271bc72017-05-10 18:15:20 +00001383 uint32_t carry = 0;
Tim Northoverb3766452018-08-06 11:43:11 +00001384 DEBUG_KNUTH(dbgs() << "KnuthDiv: remainder:");
Reid Spencer468ad9112007-02-24 20:38:01 +00001385 for (int i = n-1; i >= 0; i--) {
1386 r[i] = (u[i] >> shift) | carry;
1387 carry = u[i] << (32 - shift);
Tim Northoverb3766452018-08-06 11:43:11 +00001388 DEBUG_KNUTH(dbgs() << " " << r[i]);
Reid Spencer468ad9112007-02-24 20:38:01 +00001389 }
1390 } else {
1391 for (int i = n-1; i >= 0; i--) {
1392 r[i] = u[i];
Tim Northoverb3766452018-08-06 11:43:11 +00001393 DEBUG_KNUTH(dbgs() << " " << r[i]);
Reid Spencer468ad9112007-02-24 20:38:01 +00001394 }
Reid Spencerfb77b2b2007-02-20 08:51:03 +00001395 }
Tim Northoverb3766452018-08-06 11:43:11 +00001396 DEBUG_KNUTH(dbgs() << '\n');
Reid Spencerfb77b2b2007-02-20 08:51:03 +00001397 }
Tim Northoverb3766452018-08-06 11:43:11 +00001398 DEBUG_KNUTH(dbgs() << '\n');
Reid Spencerfb77b2b2007-02-20 08:51:03 +00001399}
1400
Craig Topper8885f932017-05-19 16:43:54 +00001401void APInt::divide(const WordType *LHS, unsigned lhsWords, const WordType *RHS,
1402 unsigned rhsWords, WordType *Quotient, WordType *Remainder) {
Reid Spencerfb77b2b2007-02-20 08:51:03 +00001403 assert(lhsWords >= rhsWords && "Fractional result");
1404
Eric Christopher820256b2009-08-21 04:06:45 +00001405 // First, compose the values into an array of 32-bit words instead of
Reid Spencerfb77b2b2007-02-20 08:51:03 +00001406 // 64-bit words. This is a necessity of both the "short division" algorithm
Dan Gohman4a618822010-02-10 16:03:48 +00001407 // and the Knuth "classical algorithm" which requires there to be native
Eric Christopher820256b2009-08-21 04:06:45 +00001408 // operations for +, -, and * on an m bit value with an m*2 bit result. We
1409 // can't use 64-bit operands here because we don't have native results of
1410 // 128-bits. Furthermore, casting the 64-bit values to 32-bit values won't
Reid Spencerfb77b2b2007-02-20 08:51:03 +00001411 // work on large-endian machines.
Chris Lattner77527f52009-01-21 18:09:24 +00001412 unsigned n = rhsWords * 2;
1413 unsigned m = (lhsWords * 2) - n;
Reid Spencer522ca7c2007-02-25 01:56:07 +00001414
1415 // Allocate space for the temporary values we need either on the stack, if
1416 // it will fit, or on the heap if it won't.
Craig Topper6271bc72017-05-10 18:15:20 +00001417 uint32_t SPACE[128];
1418 uint32_t *U = nullptr;
1419 uint32_t *V = nullptr;
1420 uint32_t *Q = nullptr;
1421 uint32_t *R = nullptr;
Reid Spencer522ca7c2007-02-25 01:56:07 +00001422 if ((Remainder?4:3)*n+2*m+1 <= 128) {
1423 U = &SPACE[0];
1424 V = &SPACE[m+n+1];
1425 Q = &SPACE[(m+n+1) + n];
1426 if (Remainder)
1427 R = &SPACE[(m+n+1) + n + (m+n)];
1428 } else {
Craig Topper6271bc72017-05-10 18:15:20 +00001429 U = new uint32_t[m + n + 1];
1430 V = new uint32_t[n];
1431 Q = new uint32_t[m+n];
Reid Spencer522ca7c2007-02-25 01:56:07 +00001432 if (Remainder)
Craig Topper6271bc72017-05-10 18:15:20 +00001433 R = new uint32_t[n];
Reid Spencer522ca7c2007-02-25 01:56:07 +00001434 }
1435
1436 // Initialize the dividend
Craig Topper6271bc72017-05-10 18:15:20 +00001437 memset(U, 0, (m+n+1)*sizeof(uint32_t));
Reid Spencerfb77b2b2007-02-20 08:51:03 +00001438 for (unsigned i = 0; i < lhsWords; ++i) {
Craig Topper8885f932017-05-19 16:43:54 +00001439 uint64_t tmp = LHS[i];
Craig Topper6271bc72017-05-10 18:15:20 +00001440 U[i * 2] = Lo_32(tmp);
1441 U[i * 2 + 1] = Hi_32(tmp);
Reid Spencerfb77b2b2007-02-20 08:51:03 +00001442 }
1443 U[m+n] = 0; // this extra word is for "spill" in the Knuth algorithm.
1444
Reid Spencer522ca7c2007-02-25 01:56:07 +00001445 // Initialize the divisor
Craig Topper6271bc72017-05-10 18:15:20 +00001446 memset(V, 0, (n)*sizeof(uint32_t));
Reid Spencerfb77b2b2007-02-20 08:51:03 +00001447 for (unsigned i = 0; i < rhsWords; ++i) {
Craig Topper8885f932017-05-19 16:43:54 +00001448 uint64_t tmp = RHS[i];
Craig Topper6271bc72017-05-10 18:15:20 +00001449 V[i * 2] = Lo_32(tmp);
1450 V[i * 2 + 1] = Hi_32(tmp);
Reid Spencerfb77b2b2007-02-20 08:51:03 +00001451 }
1452
Reid Spencer522ca7c2007-02-25 01:56:07 +00001453 // initialize the quotient and remainder
Craig Topper6271bc72017-05-10 18:15:20 +00001454 memset(Q, 0, (m+n) * sizeof(uint32_t));
Reid Spencer522ca7c2007-02-25 01:56:07 +00001455 if (Remainder)
Craig Topper6271bc72017-05-10 18:15:20 +00001456 memset(R, 0, n * sizeof(uint32_t));
Reid Spencerfb77b2b2007-02-20 08:51:03 +00001457
Eric Christopher820256b2009-08-21 04:06:45 +00001458 // Now, adjust m and n for the Knuth division. n is the number of words in
Reid Spencerfb77b2b2007-02-20 08:51:03 +00001459 // the divisor. m is the number of words by which the dividend exceeds the
Eric Christopher820256b2009-08-21 04:06:45 +00001460 // divisor (i.e. m+n is the length of the dividend). These sizes must not
Reid Spencerfb77b2b2007-02-20 08:51:03 +00001461 // contain any zero words or the Knuth algorithm fails.
1462 for (unsigned i = n; i > 0 && V[i-1] == 0; i--) {
1463 n--;
1464 m++;
1465 }
1466 for (unsigned i = m+n; i > 0 && U[i-1] == 0; i--)
1467 m--;
1468
1469 // If we're left with only a single word for the divisor, Knuth doesn't work
1470 // so we implement the short division algorithm here. This is much simpler
1471 // and faster because we are certain that we can divide a 64-bit quantity
1472 // by a 32-bit quantity at hardware speed and short division is simply a
1473 // series of such operations. This is just like doing short division but we
1474 // are using base 2^32 instead of base 10.
1475 assert(n != 0 && "Divide by zero?");
1476 if (n == 1) {
Craig Topper6271bc72017-05-10 18:15:20 +00001477 uint32_t divisor = V[0];
1478 uint32_t remainder = 0;
Craig Topper6a1d0202017-05-15 22:01:03 +00001479 for (int i = m; i >= 0; i--) {
Craig Topper6271bc72017-05-10 18:15:20 +00001480 uint64_t partial_dividend = Make_64(remainder, U[i]);
Reid Spencerfb77b2b2007-02-20 08:51:03 +00001481 if (partial_dividend == 0) {
1482 Q[i] = 0;
1483 remainder = 0;
1484 } else if (partial_dividend < divisor) {
1485 Q[i] = 0;
Craig Topper6271bc72017-05-10 18:15:20 +00001486 remainder = Lo_32(partial_dividend);
Reid Spencerfb77b2b2007-02-20 08:51:03 +00001487 } else if (partial_dividend == divisor) {
1488 Q[i] = 1;
1489 remainder = 0;
1490 } else {
Craig Topper6271bc72017-05-10 18:15:20 +00001491 Q[i] = Lo_32(partial_dividend / divisor);
1492 remainder = Lo_32(partial_dividend - (Q[i] * divisor));
Reid Spencerfb77b2b2007-02-20 08:51:03 +00001493 }
1494 }
1495 if (R)
1496 R[0] = remainder;
1497 } else {
1498 // Now we're ready to invoke the Knuth classical divide algorithm. In this
1499 // case n > 1.
1500 KnuthDiv(U, V, Q, R, m, n);
1501 }
1502
1503 // If the caller wants the quotient
1504 if (Quotient) {
Craig Topper8885f932017-05-19 16:43:54 +00001505 for (unsigned i = 0; i < lhsWords; ++i)
1506 Quotient[i] = Make_64(Q[i*2+1], Q[i*2]);
Reid Spencerfb77b2b2007-02-20 08:51:03 +00001507 }
1508
1509 // If the caller wants the remainder
1510 if (Remainder) {
Craig Topper8885f932017-05-19 16:43:54 +00001511 for (unsigned i = 0; i < rhsWords; ++i)
1512 Remainder[i] = Make_64(R[i*2+1], R[i*2]);
Reid Spencerfb77b2b2007-02-20 08:51:03 +00001513 }
1514
1515 // Clean up the memory we allocated.
Reid Spencer522ca7c2007-02-25 01:56:07 +00001516 if (U != &SPACE[0]) {
1517 delete [] U;
1518 delete [] V;
1519 delete [] Q;
1520 delete [] R;
1521 }
Reid Spencer100502d2007-02-17 03:16:00 +00001522}
1523
Craig Topper8885f932017-05-19 16:43:54 +00001524APInt APInt::udiv(const APInt &RHS) const {
Reid Spencera32372d12007-02-17 00:18:01 +00001525 assert(BitWidth == RHS.BitWidth && "Bit widths must be the same");
Reid Spencer39867762007-02-17 02:07:07 +00001526
1527 // First, deal with the easy case
1528 if (isSingleWord()) {
Craig Topperb339c6d2017-05-03 15:46:24 +00001529 assert(RHS.U.VAL != 0 && "Divide by zero?");
1530 return APInt(BitWidth, U.VAL / RHS.U.VAL);
Zhou Shengfbf61ea2007-02-08 14:35:19 +00001531 }
Reid Spencer39867762007-02-17 02:07:07 +00001532
Reid Spencer39867762007-02-17 02:07:07 +00001533 // Get some facts about the LHS and RHS number of bits and words
Craig Topper62de0392017-05-10 07:50:15 +00001534 unsigned lhsWords = getNumWords(getActiveBits());
Craig Topperb1a71ca2017-05-12 21:45:50 +00001535 unsigned rhsBits = RHS.getActiveBits();
1536 unsigned rhsWords = getNumWords(rhsBits);
1537 assert(rhsWords && "Divided by zero???");
Reid Spencer39867762007-02-17 02:07:07 +00001538
1539 // Deal with some degenerate cases
Eric Christopher820256b2009-08-21 04:06:45 +00001540 if (!lhsWords)
Reid Spencer58a6a432007-02-21 08:21:52 +00001541 // 0 / X ===> 0
Eric Christopher820256b2009-08-21 04:06:45 +00001542 return APInt(BitWidth, 0);
Craig Topperb1a71ca2017-05-12 21:45:50 +00001543 if (rhsBits == 1)
1544 // X / 1 ===> X
1545 return *this;
Craig Topper24ae6952017-05-08 23:49:49 +00001546 if (lhsWords < rhsWords || this->ult(RHS))
Sylvestre Ledru91ce36c2012-09-27 10:14:43 +00001547 // X / Y ===> 0, iff X < Y
Reid Spencer58a6a432007-02-21 08:21:52 +00001548 return APInt(BitWidth, 0);
Craig Topper24ae6952017-05-08 23:49:49 +00001549 if (*this == RHS)
Reid Spencer58a6a432007-02-21 08:21:52 +00001550 // X / X ===> 1
1551 return APInt(BitWidth, 1);
Craig Topper06da0812017-05-12 18:18:57 +00001552 if (lhsWords == 1) // rhsWords is 1 if lhsWords is 1.
Reid Spencer39867762007-02-17 02:07:07 +00001553 // All high words are zero, just use native divide
Craig Topperb339c6d2017-05-03 15:46:24 +00001554 return APInt(BitWidth, this->U.pVal[0] / RHS.U.pVal[0]);
Reid Spencerfb77b2b2007-02-20 08:51:03 +00001555
1556 // We have to compute it the hard way. Invoke the Knuth divide algorithm.
Craig Topper8885f932017-05-19 16:43:54 +00001557 APInt Quotient(BitWidth, 0); // to hold result.
1558 divide(U.pVal, lhsWords, RHS.U.pVal, rhsWords, Quotient.U.pVal, nullptr);
1559 return Quotient;
1560}
1561
1562APInt APInt::udiv(uint64_t RHS) const {
1563 assert(RHS != 0 && "Divide by zero?");
1564
1565 // First, deal with the easy case
1566 if (isSingleWord())
1567 return APInt(BitWidth, U.VAL / RHS);
1568
1569 // Get some facts about the LHS words.
1570 unsigned lhsWords = getNumWords(getActiveBits());
1571
1572 // Deal with some degenerate cases
1573 if (!lhsWords)
1574 // 0 / X ===> 0
1575 return APInt(BitWidth, 0);
1576 if (RHS == 1)
1577 // X / 1 ===> X
1578 return *this;
1579 if (this->ult(RHS))
1580 // X / Y ===> 0, iff X < Y
1581 return APInt(BitWidth, 0);
1582 if (*this == RHS)
1583 // X / X ===> 1
1584 return APInt(BitWidth, 1);
1585 if (lhsWords == 1) // rhsWords is 1 if lhsWords is 1.
1586 // All high words are zero, just use native divide
1587 return APInt(BitWidth, this->U.pVal[0] / RHS);
1588
1589 // We have to compute it the hard way. Invoke the Knuth divide algorithm.
1590 APInt Quotient(BitWidth, 0); // to hold result.
1591 divide(U.pVal, lhsWords, &RHS, 1, Quotient.U.pVal, nullptr);
Reid Spencerfb77b2b2007-02-20 08:51:03 +00001592 return Quotient;
Zhou Shengfbf61ea2007-02-08 14:35:19 +00001593}
1594
Jakub Staszak6605c602013-02-20 00:17:42 +00001595APInt APInt::sdiv(const APInt &RHS) const {
1596 if (isNegative()) {
1597 if (RHS.isNegative())
1598 return (-(*this)).udiv(-RHS);
1599 return -((-(*this)).udiv(RHS));
1600 }
1601 if (RHS.isNegative())
1602 return -(this->udiv(-RHS));
1603 return this->udiv(RHS);
1604}
1605
Craig Topper8885f932017-05-19 16:43:54 +00001606APInt APInt::sdiv(int64_t RHS) const {
1607 if (isNegative()) {
1608 if (RHS < 0)
1609 return (-(*this)).udiv(-RHS);
1610 return -((-(*this)).udiv(RHS));
1611 }
1612 if (RHS < 0)
1613 return -(this->udiv(-RHS));
1614 return this->udiv(RHS);
1615}
1616
1617APInt APInt::urem(const APInt &RHS) const {
Reid Spencera32372d12007-02-17 00:18:01 +00001618 assert(BitWidth == RHS.BitWidth && "Bit widths must be the same");
Reid Spencer39867762007-02-17 02:07:07 +00001619 if (isSingleWord()) {
Craig Topperb339c6d2017-05-03 15:46:24 +00001620 assert(RHS.U.VAL != 0 && "Remainder by zero?");
1621 return APInt(BitWidth, U.VAL % RHS.U.VAL);
Zhou Shengfbf61ea2007-02-08 14:35:19 +00001622 }
Reid Spencer39867762007-02-17 02:07:07 +00001623
Reid Spencer58a6a432007-02-21 08:21:52 +00001624 // Get some facts about the LHS
Craig Topper62de0392017-05-10 07:50:15 +00001625 unsigned lhsWords = getNumWords(getActiveBits());
Reid Spencer39867762007-02-17 02:07:07 +00001626
1627 // Get some facts about the RHS
Craig Topperb1a71ca2017-05-12 21:45:50 +00001628 unsigned rhsBits = RHS.getActiveBits();
1629 unsigned rhsWords = getNumWords(rhsBits);
Reid Spencer39867762007-02-17 02:07:07 +00001630 assert(rhsWords && "Performing remainder operation by zero ???");
1631
Reid Spencer39867762007-02-17 02:07:07 +00001632 // Check the degenerate cases
Craig Topper24ae6952017-05-08 23:49:49 +00001633 if (lhsWords == 0)
Reid Spencer58a6a432007-02-21 08:21:52 +00001634 // 0 % Y ===> 0
1635 return APInt(BitWidth, 0);
Craig Topperb1a71ca2017-05-12 21:45:50 +00001636 if (rhsBits == 1)
1637 // X % 1 ===> 0
1638 return APInt(BitWidth, 0);
Craig Topper24ae6952017-05-08 23:49:49 +00001639 if (lhsWords < rhsWords || this->ult(RHS))
Sylvestre Ledru91ce36c2012-09-27 10:14:43 +00001640 // X % Y ===> X, iff X < Y
Reid Spencer58a6a432007-02-21 08:21:52 +00001641 return *this;
Craig Topper24ae6952017-05-08 23:49:49 +00001642 if (*this == RHS)
Reid Spencer39867762007-02-17 02:07:07 +00001643 // X % X == 0;
Reid Spencer58a6a432007-02-21 08:21:52 +00001644 return APInt(BitWidth, 0);
Craig Topper24ae6952017-05-08 23:49:49 +00001645 if (lhsWords == 1)
Reid Spencer39867762007-02-17 02:07:07 +00001646 // All high words are zero, just use native remainder
Craig Topperb339c6d2017-05-03 15:46:24 +00001647 return APInt(BitWidth, U.pVal[0] % RHS.U.pVal[0]);
Reid Spencerfb77b2b2007-02-20 08:51:03 +00001648
Reid Spencer4c50b522007-05-13 23:44:59 +00001649 // We have to compute it the hard way. Invoke the Knuth divide algorithm.
Craig Topper8885f932017-05-19 16:43:54 +00001650 APInt Remainder(BitWidth, 0);
1651 divide(U.pVal, lhsWords, RHS.U.pVal, rhsWords, nullptr, Remainder.U.pVal);
1652 return Remainder;
1653}
1654
1655uint64_t APInt::urem(uint64_t RHS) const {
1656 assert(RHS != 0 && "Remainder by zero?");
1657
1658 if (isSingleWord())
1659 return U.VAL % RHS;
1660
1661 // Get some facts about the LHS
1662 unsigned lhsWords = getNumWords(getActiveBits());
1663
1664 // Check the degenerate cases
1665 if (lhsWords == 0)
1666 // 0 % Y ===> 0
1667 return 0;
1668 if (RHS == 1)
1669 // X % 1 ===> 0
1670 return 0;
1671 if (this->ult(RHS))
1672 // X % Y ===> X, iff X < Y
1673 return getZExtValue();
1674 if (*this == RHS)
1675 // X % X == 0;
1676 return 0;
1677 if (lhsWords == 1)
1678 // All high words are zero, just use native remainder
1679 return U.pVal[0] % RHS;
1680
1681 // We have to compute it the hard way. Invoke the Knuth divide algorithm.
1682 uint64_t Remainder;
1683 divide(U.pVal, lhsWords, &RHS, 1, nullptr, &Remainder);
Reid Spencerfb77b2b2007-02-20 08:51:03 +00001684 return Remainder;
Zhou Shengfbf61ea2007-02-08 14:35:19 +00001685}
Reid Spencer100502d2007-02-17 03:16:00 +00001686
Jakub Staszak6605c602013-02-20 00:17:42 +00001687APInt APInt::srem(const APInt &RHS) const {
1688 if (isNegative()) {
1689 if (RHS.isNegative())
1690 return -((-(*this)).urem(-RHS));
1691 return -((-(*this)).urem(RHS));
1692 }
1693 if (RHS.isNegative())
1694 return this->urem(-RHS);
1695 return this->urem(RHS);
1696}
1697
Craig Topper8885f932017-05-19 16:43:54 +00001698int64_t APInt::srem(int64_t RHS) const {
1699 if (isNegative()) {
1700 if (RHS < 0)
1701 return -((-(*this)).urem(-RHS));
1702 return -((-(*this)).urem(RHS));
1703 }
1704 if (RHS < 0)
1705 return this->urem(-RHS);
1706 return this->urem(RHS);
1707}
1708
Eric Christopher820256b2009-08-21 04:06:45 +00001709void APInt::udivrem(const APInt &LHS, const APInt &RHS,
Reid Spencer4c50b522007-05-13 23:44:59 +00001710 APInt &Quotient, APInt &Remainder) {
David Majnemer7f039202014-12-14 09:41:56 +00001711 assert(LHS.BitWidth == RHS.BitWidth && "Bit widths must be the same");
Craig Topper2579c7c2017-05-12 21:45:44 +00001712 unsigned BitWidth = LHS.BitWidth;
David Majnemer7f039202014-12-14 09:41:56 +00001713
1714 // First, deal with the easy case
1715 if (LHS.isSingleWord()) {
Craig Topperb339c6d2017-05-03 15:46:24 +00001716 assert(RHS.U.VAL != 0 && "Divide by zero?");
1717 uint64_t QuotVal = LHS.U.VAL / RHS.U.VAL;
1718 uint64_t RemVal = LHS.U.VAL % RHS.U.VAL;
Craig Topper2579c7c2017-05-12 21:45:44 +00001719 Quotient = APInt(BitWidth, QuotVal);
1720 Remainder = APInt(BitWidth, RemVal);
David Majnemer7f039202014-12-14 09:41:56 +00001721 return;
1722 }
1723
Reid Spencer4c50b522007-05-13 23:44:59 +00001724 // Get some size facts about the dividend and divisor
Craig Topper62de0392017-05-10 07:50:15 +00001725 unsigned lhsWords = getNumWords(LHS.getActiveBits());
Craig Topperb1a71ca2017-05-12 21:45:50 +00001726 unsigned rhsBits = RHS.getActiveBits();
1727 unsigned rhsWords = getNumWords(rhsBits);
Craig Topper4bdd6212017-05-12 18:19:01 +00001728 assert(rhsWords && "Performing divrem operation by zero ???");
Reid Spencer4c50b522007-05-13 23:44:59 +00001729
1730 // Check the degenerate cases
Eric Christopher820256b2009-08-21 04:06:45 +00001731 if (lhsWords == 0) {
Krzysztof Parzyszek55a0dce2018-07-19 18:07:56 +00001732 Quotient = APInt(BitWidth, 0); // 0 / Y ===> 0
1733 Remainder = APInt(BitWidth, 0); // 0 % Y ===> 0
Reid Spencer4c50b522007-05-13 23:44:59 +00001734 return;
Eric Christopher820256b2009-08-21 04:06:45 +00001735 }
1736
Craig Topperb1a71ca2017-05-12 21:45:50 +00001737 if (rhsBits == 1) {
Krzysztof Parzyszek55a0dce2018-07-19 18:07:56 +00001738 Quotient = LHS; // X / 1 ===> X
1739 Remainder = APInt(BitWidth, 0); // X % 1 ===> 0
Craig Topperb1a71ca2017-05-12 21:45:50 +00001740 }
1741
Eric Christopher820256b2009-08-21 04:06:45 +00001742 if (lhsWords < rhsWords || LHS.ult(RHS)) {
Krzysztof Parzyszek55a0dce2018-07-19 18:07:56 +00001743 Remainder = LHS; // X % Y ===> X, iff X < Y
1744 Quotient = APInt(BitWidth, 0); // X / Y ===> 0, iff X < Y
Reid Spencer4c50b522007-05-13 23:44:59 +00001745 return;
Eric Christopher820256b2009-08-21 04:06:45 +00001746 }
1747
Reid Spencer4c50b522007-05-13 23:44:59 +00001748 if (LHS == RHS) {
Krzysztof Parzyszek55a0dce2018-07-19 18:07:56 +00001749 Quotient = APInt(BitWidth, 1); // X / X ===> 1
1750 Remainder = APInt(BitWidth, 0); // X % X ===> 0;
Reid Spencer4c50b522007-05-13 23:44:59 +00001751 return;
Eric Christopher820256b2009-08-21 04:06:45 +00001752 }
1753
Craig Topper8885f932017-05-19 16:43:54 +00001754 // Make sure there is enough space to hold the results.
1755 // NOTE: This assumes that reallocate won't affect any bits if it doesn't
1756 // change the size. This is necessary if Quotient or Remainder is aliased
1757 // with LHS or RHS.
1758 Quotient.reallocate(BitWidth);
1759 Remainder.reallocate(BitWidth);
1760
Craig Topper06da0812017-05-12 18:18:57 +00001761 if (lhsWords == 1) { // rhsWords is 1 if lhsWords is 1.
Reid Spencer4c50b522007-05-13 23:44:59 +00001762 // There is only one word to consider so use the native versions.
Craig Topper93eabae2017-05-10 18:15:14 +00001763 uint64_t lhsValue = LHS.U.pVal[0];
1764 uint64_t rhsValue = RHS.U.pVal[0];
Craig Topper87694032017-05-12 07:21:09 +00001765 Quotient = lhsValue / rhsValue;
1766 Remainder = lhsValue % rhsValue;
Reid Spencer4c50b522007-05-13 23:44:59 +00001767 return;
1768 }
1769
1770 // Okay, lets do it the long way
Craig Topper8885f932017-05-19 16:43:54 +00001771 divide(LHS.U.pVal, lhsWords, RHS.U.pVal, rhsWords, Quotient.U.pVal,
1772 Remainder.U.pVal);
1773 // Clear the rest of the Quotient and Remainder.
1774 std::memset(Quotient.U.pVal + lhsWords, 0,
1775 (getNumWords(BitWidth) - lhsWords) * APINT_WORD_SIZE);
1776 std::memset(Remainder.U.pVal + rhsWords, 0,
1777 (getNumWords(BitWidth) - rhsWords) * APINT_WORD_SIZE);
1778}
1779
1780void APInt::udivrem(const APInt &LHS, uint64_t RHS, APInt &Quotient,
1781 uint64_t &Remainder) {
1782 assert(RHS != 0 && "Divide by zero?");
1783 unsigned BitWidth = LHS.BitWidth;
1784
1785 // First, deal with the easy case
1786 if (LHS.isSingleWord()) {
1787 uint64_t QuotVal = LHS.U.VAL / RHS;
1788 Remainder = LHS.U.VAL % RHS;
1789 Quotient = APInt(BitWidth, QuotVal);
1790 return;
1791 }
1792
1793 // Get some size facts about the dividend and divisor
1794 unsigned lhsWords = getNumWords(LHS.getActiveBits());
1795
1796 // Check the degenerate cases
1797 if (lhsWords == 0) {
Krzysztof Parzyszek55a0dce2018-07-19 18:07:56 +00001798 Quotient = APInt(BitWidth, 0); // 0 / Y ===> 0
1799 Remainder = 0; // 0 % Y ===> 0
Craig Topper8885f932017-05-19 16:43:54 +00001800 return;
1801 }
1802
1803 if (RHS == 1) {
Krzysztof Parzyszek55a0dce2018-07-19 18:07:56 +00001804 Quotient = LHS; // X / 1 ===> X
1805 Remainder = 0; // X % 1 ===> 0
1806 return;
Craig Topper8885f932017-05-19 16:43:54 +00001807 }
1808
1809 if (LHS.ult(RHS)) {
Krzysztof Parzyszek55a0dce2018-07-19 18:07:56 +00001810 Remainder = LHS.getZExtValue(); // X % Y ===> X, iff X < Y
1811 Quotient = APInt(BitWidth, 0); // X / Y ===> 0, iff X < Y
Craig Topper8885f932017-05-19 16:43:54 +00001812 return;
1813 }
1814
1815 if (LHS == RHS) {
Krzysztof Parzyszek55a0dce2018-07-19 18:07:56 +00001816 Quotient = APInt(BitWidth, 1); // X / X ===> 1
1817 Remainder = 0; // X % X ===> 0;
Craig Topper8885f932017-05-19 16:43:54 +00001818 return;
1819 }
1820
1821 // Make sure there is enough space to hold the results.
1822 // NOTE: This assumes that reallocate won't affect any bits if it doesn't
1823 // change the size. This is necessary if Quotient is aliased with LHS.
1824 Quotient.reallocate(BitWidth);
1825
1826 if (lhsWords == 1) { // rhsWords is 1 if lhsWords is 1.
1827 // There is only one word to consider so use the native versions.
1828 uint64_t lhsValue = LHS.U.pVal[0];
1829 Quotient = lhsValue / RHS;
1830 Remainder = lhsValue % RHS;
1831 return;
1832 }
1833
1834 // Okay, lets do it the long way
1835 divide(LHS.U.pVal, lhsWords, &RHS, 1, Quotient.U.pVal, &Remainder);
1836 // Clear the rest of the Quotient.
1837 std::memset(Quotient.U.pVal + lhsWords, 0,
1838 (getNumWords(BitWidth) - lhsWords) * APINT_WORD_SIZE);
Reid Spencer4c50b522007-05-13 23:44:59 +00001839}
1840
Jakub Staszak6605c602013-02-20 00:17:42 +00001841void APInt::sdivrem(const APInt &LHS, const APInt &RHS,
1842 APInt &Quotient, APInt &Remainder) {
1843 if (LHS.isNegative()) {
1844 if (RHS.isNegative())
1845 APInt::udivrem(-LHS, -RHS, Quotient, Remainder);
1846 else {
1847 APInt::udivrem(-LHS, RHS, Quotient, Remainder);
Craig Topperb3c1f562017-05-11 07:02:04 +00001848 Quotient.negate();
Jakub Staszak6605c602013-02-20 00:17:42 +00001849 }
Craig Topperb3c1f562017-05-11 07:02:04 +00001850 Remainder.negate();
Jakub Staszak6605c602013-02-20 00:17:42 +00001851 } else if (RHS.isNegative()) {
1852 APInt::udivrem(LHS, -RHS, Quotient, Remainder);
Craig Topperb3c1f562017-05-11 07:02:04 +00001853 Quotient.negate();
Jakub Staszak6605c602013-02-20 00:17:42 +00001854 } else {
1855 APInt::udivrem(LHS, RHS, Quotient, Remainder);
1856 }
1857}
1858
Craig Topper8885f932017-05-19 16:43:54 +00001859void APInt::sdivrem(const APInt &LHS, int64_t RHS,
1860 APInt &Quotient, int64_t &Remainder) {
1861 uint64_t R = Remainder;
1862 if (LHS.isNegative()) {
1863 if (RHS < 0)
1864 APInt::udivrem(-LHS, -RHS, Quotient, R);
1865 else {
1866 APInt::udivrem(-LHS, RHS, Quotient, R);
1867 Quotient.negate();
1868 }
1869 R = -R;
1870 } else if (RHS < 0) {
1871 APInt::udivrem(LHS, -RHS, Quotient, R);
1872 Quotient.negate();
1873 } else {
1874 APInt::udivrem(LHS, RHS, Quotient, R);
1875 }
1876 Remainder = R;
1877}
1878
Chris Lattner2c819b02010-10-13 23:54:10 +00001879APInt APInt::sadd_ov(const APInt &RHS, bool &Overflow) const {
Chris Lattner79bdd882010-10-13 23:46:33 +00001880 APInt Res = *this+RHS;
1881 Overflow = isNonNegative() == RHS.isNonNegative() &&
1882 Res.isNonNegative() != isNonNegative();
1883 return Res;
1884}
1885
Chris Lattner698661c2010-10-14 00:05:07 +00001886APInt APInt::uadd_ov(const APInt &RHS, bool &Overflow) const {
1887 APInt Res = *this+RHS;
1888 Overflow = Res.ult(RHS);
1889 return Res;
1890}
1891
Chris Lattner2c819b02010-10-13 23:54:10 +00001892APInt APInt::ssub_ov(const APInt &RHS, bool &Overflow) const {
Chris Lattner79bdd882010-10-13 23:46:33 +00001893 APInt Res = *this - RHS;
1894 Overflow = isNonNegative() != RHS.isNonNegative() &&
1895 Res.isNonNegative() != isNonNegative();
1896 return Res;
1897}
1898
Chris Lattner698661c2010-10-14 00:05:07 +00001899APInt APInt::usub_ov(const APInt &RHS, bool &Overflow) const {
Chris Lattnerb9681ad2010-10-14 00:30:00 +00001900 APInt Res = *this-RHS;
1901 Overflow = Res.ugt(*this);
Chris Lattner698661c2010-10-14 00:05:07 +00001902 return Res;
1903}
1904
Chris Lattner2c819b02010-10-13 23:54:10 +00001905APInt APInt::sdiv_ov(const APInt &RHS, bool &Overflow) const {
Chris Lattner79bdd882010-10-13 23:46:33 +00001906 // MININT/-1 --> overflow.
1907 Overflow = isMinSignedValue() && RHS.isAllOnesValue();
1908 return sdiv(RHS);
1909}
1910
Chris Lattner2c819b02010-10-13 23:54:10 +00001911APInt APInt::smul_ov(const APInt &RHS, bool &Overflow) const {
Chris Lattner79bdd882010-10-13 23:46:33 +00001912 APInt Res = *this * RHS;
Simon Pilgrim4c0ea9d2017-02-23 16:07:04 +00001913
Chris Lattner79bdd882010-10-13 23:46:33 +00001914 if (*this != 0 && RHS != 0)
1915 Overflow = Res.sdiv(RHS) != *this || Res.sdiv(*this) != RHS;
1916 else
1917 Overflow = false;
1918 return Res;
1919}
1920
Frits van Bommel0bb2ad22011-03-27 14:26:13 +00001921APInt APInt::umul_ov(const APInt &RHS, bool &Overflow) const {
Fangrui Songacc76412019-04-19 02:06:06 +00001922 if (countLeadingZeros() + RHS.countLeadingZeros() + 2 <= BitWidth) {
1923 Overflow = true;
1924 return *this * RHS;
1925 }
Frits van Bommel0bb2ad22011-03-27 14:26:13 +00001926
Fangrui Songacc76412019-04-19 02:06:06 +00001927 APInt Res = lshr(1) * RHS;
1928 Overflow = Res.isNegative();
1929 Res <<= 1;
1930 if ((*this)[0]) {
1931 Res += RHS;
1932 if (Res.ult(RHS))
1933 Overflow = true;
1934 }
Frits van Bommel0bb2ad22011-03-27 14:26:13 +00001935 return Res;
1936}
1937
David Majnemera2521382014-10-13 21:48:30 +00001938APInt APInt::sshl_ov(const APInt &ShAmt, bool &Overflow) const {
1939 Overflow = ShAmt.uge(getBitWidth());
Chris Lattner79bdd882010-10-13 23:46:33 +00001940 if (Overflow)
David Majnemera2521382014-10-13 21:48:30 +00001941 return APInt(BitWidth, 0);
Chris Lattner79bdd882010-10-13 23:46:33 +00001942
1943 if (isNonNegative()) // Don't allow sign change.
David Majnemera2521382014-10-13 21:48:30 +00001944 Overflow = ShAmt.uge(countLeadingZeros());
Chris Lattner79bdd882010-10-13 23:46:33 +00001945 else
David Majnemera2521382014-10-13 21:48:30 +00001946 Overflow = ShAmt.uge(countLeadingOnes());
Simon Pilgrim4c0ea9d2017-02-23 16:07:04 +00001947
Chris Lattner79bdd882010-10-13 23:46:33 +00001948 return *this << ShAmt;
1949}
1950
David Majnemera2521382014-10-13 21:48:30 +00001951APInt APInt::ushl_ov(const APInt &ShAmt, bool &Overflow) const {
1952 Overflow = ShAmt.uge(getBitWidth());
1953 if (Overflow)
1954 return APInt(BitWidth, 0);
1955
1956 Overflow = ShAmt.ugt(countLeadingZeros());
1957
1958 return *this << ShAmt;
1959}
1960
Sanjay Patel7ef0b312018-11-20 16:47:59 +00001961APInt APInt::sadd_sat(const APInt &RHS) const {
1962 bool Overflow;
1963 APInt Res = sadd_ov(RHS, Overflow);
1964 if (!Overflow)
1965 return Res;
Chris Lattner79bdd882010-10-13 23:46:33 +00001966
Sanjay Patel7ef0b312018-11-20 16:47:59 +00001967 return isNegative() ? APInt::getSignedMinValue(BitWidth)
1968 : APInt::getSignedMaxValue(BitWidth);
1969}
1970
1971APInt APInt::uadd_sat(const APInt &RHS) const {
1972 bool Overflow;
1973 APInt Res = uadd_ov(RHS, Overflow);
1974 if (!Overflow)
1975 return Res;
1976
1977 return APInt::getMaxValue(BitWidth);
1978}
1979
1980APInt APInt::ssub_sat(const APInt &RHS) const {
1981 bool Overflow;
1982 APInt Res = ssub_ov(RHS, Overflow);
1983 if (!Overflow)
1984 return Res;
1985
1986 return isNegative() ? APInt::getSignedMinValue(BitWidth)
1987 : APInt::getSignedMaxValue(BitWidth);
1988}
1989
1990APInt APInt::usub_sat(const APInt &RHS) const {
1991 bool Overflow;
1992 APInt Res = usub_ov(RHS, Overflow);
1993 if (!Overflow)
1994 return Res;
1995
1996 return APInt(BitWidth, 0);
1997}
Chris Lattner79bdd882010-10-13 23:46:33 +00001998
1999
Benjamin Kramer92d89982010-07-14 22:38:02 +00002000void APInt::fromString(unsigned numbits, StringRef str, uint8_t radix) {
Reid Spencer1ba83352007-02-21 03:55:44 +00002001 // Check our assumptions here
Erick Tryzelaar1264bcb2009-08-21 03:15:14 +00002002 assert(!str.empty() && "Invalid string length");
Simon Pilgrim4c0ea9d2017-02-23 16:07:04 +00002003 assert((radix == 10 || radix == 8 || radix == 16 || radix == 2 ||
Douglas Gregor663c0682011-09-14 15:54:46 +00002004 radix == 36) &&
2005 "Radix should be 2, 8, 10, 16, or 36!");
Erick Tryzelaar1264bcb2009-08-21 03:15:14 +00002006
Daniel Dunbar3a1efd112009-08-13 02:33:34 +00002007 StringRef::iterator p = str.begin();
2008 size_t slen = str.size();
2009 bool isNeg = *p == '-';
Erick Tryzelaar1264bcb2009-08-21 03:15:14 +00002010 if (*p == '-' || *p == '+') {
Daniel Dunbar3a1efd112009-08-13 02:33:34 +00002011 p++;
2012 slen--;
Eric Christopher43a1dec2009-08-21 04:10:31 +00002013 assert(slen && "String is only a sign, needs a value.");
Daniel Dunbar3a1efd112009-08-13 02:33:34 +00002014 }
Chris Lattnerdad2d092007-05-03 18:15:36 +00002015 assert((slen <= numbits || radix != 2) && "Insufficient bit width");
Chris Lattnerb869a0a2009-04-25 18:34:04 +00002016 assert(((slen-1)*3 <= numbits || radix != 8) && "Insufficient bit width");
2017 assert(((slen-1)*4 <= numbits || radix != 16) && "Insufficient bit width");
Dan Gohmanb452d4e2010-03-24 19:38:02 +00002018 assert((((slen-1)*64)/22 <= numbits || radix != 10) &&
2019 "Insufficient bit width");
Reid Spencer1ba83352007-02-21 03:55:44 +00002020
Craig Topperb339c6d2017-05-03 15:46:24 +00002021 // Allocate memory if needed
2022 if (isSingleWord())
2023 U.VAL = 0;
2024 else
2025 U.pVal = getClearedMemory(getNumWords());
Reid Spencer1ba83352007-02-21 03:55:44 +00002026
2027 // Figure out if we can shift instead of multiply
Chris Lattner77527f52009-01-21 18:09:24 +00002028 unsigned shift = (radix == 16 ? 4 : radix == 8 ? 3 : radix == 2 ? 1 : 0);
Reid Spencer1ba83352007-02-21 03:55:44 +00002029
Reid Spencer1ba83352007-02-21 03:55:44 +00002030 // Enter digit traversal loop
Daniel Dunbar3a1efd112009-08-13 02:33:34 +00002031 for (StringRef::iterator e = str.end(); p != e; ++p) {
Erick Tryzelaardadb15712009-08-21 03:15:28 +00002032 unsigned digit = getDigit(*p, radix);
Erick Tryzelaar60964092009-08-21 06:48:37 +00002033 assert(digit < radix && "Invalid character in digit string");
Reid Spencer1ba83352007-02-21 03:55:44 +00002034
Reid Spencera93c9812007-05-16 19:18:22 +00002035 // Shift or multiply the value by the radix
Chris Lattnerb869a0a2009-04-25 18:34:04 +00002036 if (slen > 1) {
2037 if (shift)
2038 *this <<= shift;
2039 else
Craig Topperf15bec52017-05-08 04:55:12 +00002040 *this *= radix;
Chris Lattnerb869a0a2009-04-25 18:34:04 +00002041 }
Reid Spencer1ba83352007-02-21 03:55:44 +00002042
2043 // Add in the digit we just interpreted
Craig Topperb7d8faa2017-04-02 06:59:38 +00002044 *this += digit;
Reid Spencer100502d2007-02-17 03:16:00 +00002045 }
Reid Spencerb6b5cc32007-02-25 23:44:53 +00002046 // If its negative, put it in two's complement form
Craig Topperef0114c2017-05-10 20:01:38 +00002047 if (isNeg)
2048 this->negate();
Reid Spencer100502d2007-02-17 03:16:00 +00002049}
Reid Spencerfb77b2b2007-02-20 08:51:03 +00002050
Chris Lattner17f71652008-08-17 07:19:36 +00002051void APInt::toString(SmallVectorImpl<char> &Str, unsigned Radix,
Ted Kremenekb05f02e2011-06-15 00:51:55 +00002052 bool Signed, bool formatAsCLiteral) const {
Simon Pilgrim4c0ea9d2017-02-23 16:07:04 +00002053 assert((Radix == 10 || Radix == 8 || Radix == 16 || Radix == 2 ||
Douglas Gregor663c0682011-09-14 15:54:46 +00002054 Radix == 36) &&
Dylan Noblesmith1c419ff2011-12-16 20:36:31 +00002055 "Radix should be 2, 8, 10, 16, or 36!");
Eric Christopher820256b2009-08-21 04:06:45 +00002056
Ted Kremenekb05f02e2011-06-15 00:51:55 +00002057 const char *Prefix = "";
2058 if (formatAsCLiteral) {
2059 switch (Radix) {
2060 case 2:
2061 // Binary literals are a non-standard extension added in gcc 4.3:
2062 // http://gcc.gnu.org/onlinedocs/gcc-4.3.0/gcc/Binary-constants.html
2063 Prefix = "0b";
2064 break;
2065 case 8:
2066 Prefix = "0";
2067 break;
Dylan Noblesmith1c419ff2011-12-16 20:36:31 +00002068 case 10:
2069 break; // No prefix
Ted Kremenekb05f02e2011-06-15 00:51:55 +00002070 case 16:
2071 Prefix = "0x";
2072 break;
Dylan Noblesmith1c419ff2011-12-16 20:36:31 +00002073 default:
2074 llvm_unreachable("Invalid radix!");
Ted Kremenekb05f02e2011-06-15 00:51:55 +00002075 }
2076 }
2077
Chris Lattner17f71652008-08-17 07:19:36 +00002078 // First, check for a zero value and just short circuit the logic below.
2079 if (*this == 0) {
Ted Kremenekb05f02e2011-06-15 00:51:55 +00002080 while (*Prefix) {
2081 Str.push_back(*Prefix);
2082 ++Prefix;
2083 };
Chris Lattner17f71652008-08-17 07:19:36 +00002084 Str.push_back('0');
2085 return;
2086 }
Eric Christopher820256b2009-08-21 04:06:45 +00002087
Douglas Gregor663c0682011-09-14 15:54:46 +00002088 static const char Digits[] = "0123456789ABCDEFGHIJKLMNOPQRSTUVWXYZ";
Eric Christopher820256b2009-08-21 04:06:45 +00002089
Reid Spencerfb77b2b2007-02-20 08:51:03 +00002090 if (isSingleWord()) {
Chris Lattner17f71652008-08-17 07:19:36 +00002091 char Buffer[65];
Craig Toppere6a23182017-05-24 07:00:55 +00002092 char *BufPtr = std::end(Buffer);
Eric Christopher820256b2009-08-21 04:06:45 +00002093
Chris Lattner17f71652008-08-17 07:19:36 +00002094 uint64_t N;
Chris Lattnerb91c9032010-08-18 00:33:47 +00002095 if (!Signed) {
Chris Lattner17f71652008-08-17 07:19:36 +00002096 N = getZExtValue();
Chris Lattnerb91c9032010-08-18 00:33:47 +00002097 } else {
2098 int64_t I = getSExtValue();
2099 if (I >= 0) {
2100 N = I;
2101 } else {
2102 Str.push_back('-');
2103 N = -(uint64_t)I;
2104 }
Reid Spencerfb77b2b2007-02-20 08:51:03 +00002105 }
Eric Christopher820256b2009-08-21 04:06:45 +00002106
Ted Kremenekb05f02e2011-06-15 00:51:55 +00002107 while (*Prefix) {
2108 Str.push_back(*Prefix);
2109 ++Prefix;
2110 };
2111
Chris Lattner17f71652008-08-17 07:19:36 +00002112 while (N) {
2113 *--BufPtr = Digits[N % Radix];
2114 N /= Radix;
2115 }
Craig Toppere6a23182017-05-24 07:00:55 +00002116 Str.append(BufPtr, std::end(Buffer));
Chris Lattner17f71652008-08-17 07:19:36 +00002117 return;
Reid Spencerfb77b2b2007-02-20 08:51:03 +00002118 }
2119
Chris Lattner17f71652008-08-17 07:19:36 +00002120 APInt Tmp(*this);
Eric Christopher820256b2009-08-21 04:06:45 +00002121
Chris Lattner17f71652008-08-17 07:19:36 +00002122 if (Signed && isNegative()) {
Reid Spencerfb77b2b2007-02-20 08:51:03 +00002123 // They want to print the signed version and it is a negative value
2124 // Flip the bits and add one to turn it into the equivalent positive
2125 // value and put a '-' in the result.
Craig Topperef0114c2017-05-10 20:01:38 +00002126 Tmp.negate();
Chris Lattner17f71652008-08-17 07:19:36 +00002127 Str.push_back('-');
Reid Spencerfb77b2b2007-02-20 08:51:03 +00002128 }
Eric Christopher820256b2009-08-21 04:06:45 +00002129
Ted Kremenekb05f02e2011-06-15 00:51:55 +00002130 while (*Prefix) {
2131 Str.push_back(*Prefix);
2132 ++Prefix;
2133 };
2134
Chris Lattner17f71652008-08-17 07:19:36 +00002135 // We insert the digits backward, then reverse them to get the right order.
2136 unsigned StartDig = Str.size();
Eric Christopher820256b2009-08-21 04:06:45 +00002137
2138 // For the 2, 8 and 16 bit cases, we can just shift instead of divide
2139 // because the number of bits per digit (1, 3 and 4 respectively) divides
Craig Topperd7ed50d2017-04-02 06:59:36 +00002140 // equally. We just shift until the value is zero.
Douglas Gregor663c0682011-09-14 15:54:46 +00002141 if (Radix == 2 || Radix == 8 || Radix == 16) {
Chris Lattner17f71652008-08-17 07:19:36 +00002142 // Just shift tmp right for each digit width until it becomes zero
2143 unsigned ShiftAmt = (Radix == 16 ? 4 : (Radix == 8 ? 3 : 1));
2144 unsigned MaskAmt = Radix - 1;
Eric Christopher820256b2009-08-21 04:06:45 +00002145
Craig Topperecb97da2017-05-10 18:15:24 +00002146 while (Tmp.getBoolValue()) {
Chris Lattner17f71652008-08-17 07:19:36 +00002147 unsigned Digit = unsigned(Tmp.getRawData()[0]) & MaskAmt;
2148 Str.push_back(Digits[Digit]);
Craig Topperfc947bc2017-04-18 17:14:21 +00002149 Tmp.lshrInPlace(ShiftAmt);
Chris Lattner17f71652008-08-17 07:19:36 +00002150 }
2151 } else {
Craig Topperecb97da2017-05-10 18:15:24 +00002152 while (Tmp.getBoolValue()) {
Craig Topper8885f932017-05-19 16:43:54 +00002153 uint64_t Digit;
2154 udivrem(Tmp, Radix, Tmp, Digit);
Chris Lattner17f71652008-08-17 07:19:36 +00002155 assert(Digit < Radix && "divide failed");
2156 Str.push_back(Digits[Digit]);
Chris Lattner17f71652008-08-17 07:19:36 +00002157 }
Reid Spencerfb77b2b2007-02-20 08:51:03 +00002158 }
Eric Christopher820256b2009-08-21 04:06:45 +00002159
Chris Lattner17f71652008-08-17 07:19:36 +00002160 // Reverse the digits before returning.
2161 std::reverse(Str.begin()+StartDig, Str.end());
Reid Spencerfb77b2b2007-02-20 08:51:03 +00002162}
2163
Pawel Bylica6eeeac72015-04-06 13:31:39 +00002164/// Returns the APInt as a std::string. Note that this is an inefficient method.
2165/// It is better to pass in a SmallVector/SmallString to the methods above.
Chris Lattner17f71652008-08-17 07:19:36 +00002166std::string APInt::toString(unsigned Radix = 10, bool Signed = true) const {
2167 SmallString<40> S;
Ted Kremenekb05f02e2011-06-15 00:51:55 +00002168 toString(S, Radix, Signed, /* formatAsCLiteral = */false);
Daniel Dunbar8b0b1152009-08-19 20:07:03 +00002169 return S.str();
Reid Spencer1ba83352007-02-21 03:55:44 +00002170}
Chris Lattner6b695682007-08-16 15:56:55 +00002171
Aaron Ballman615eb472017-10-15 14:32:27 +00002172#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
Yaron Kereneb2a2542016-01-29 20:50:44 +00002173LLVM_DUMP_METHOD void APInt::dump() const {
Chris Lattner17f71652008-08-17 07:19:36 +00002174 SmallString<40> S, U;
2175 this->toStringUnsigned(U);
2176 this->toStringSigned(S);
David Greenef32fcb42010-01-05 01:28:52 +00002177 dbgs() << "APInt(" << BitWidth << "b, "
Davide Italiano5a473d22017-01-31 21:26:18 +00002178 << U << "u " << S << "s)\n";
Chris Lattner17f71652008-08-17 07:19:36 +00002179}
Matthias Braun8c209aa2017-01-28 02:02:38 +00002180#endif
Chris Lattner17f71652008-08-17 07:19:36 +00002181
Chris Lattner0c19df42008-08-23 22:23:09 +00002182void APInt::print(raw_ostream &OS, bool isSigned) const {
Chris Lattner17f71652008-08-17 07:19:36 +00002183 SmallString<40> S;
Ted Kremenekb05f02e2011-06-15 00:51:55 +00002184 this->toString(S, 10, isSigned, /* formatAsCLiteral = */false);
Yaron Keren92e1b622015-03-18 10:17:07 +00002185 OS << S;
Chris Lattner17f71652008-08-17 07:19:36 +00002186}
2187
Chris Lattner6b695682007-08-16 15:56:55 +00002188// This implements a variety of operations on a representation of
2189// arbitrary precision, two's-complement, bignum integer values.
2190
Chris Lattner96cffa62009-08-23 23:11:28 +00002191// Assumed by lowHalf, highHalf, partMSB and partLSB. A fairly safe
2192// and unrestricting assumption.
Craig Topper55229b72017-04-02 19:17:22 +00002193static_assert(APInt::APINT_BITS_PER_WORD % 2 == 0,
2194 "Part width must be divisible by 2!");
Chris Lattner6b695682007-08-16 15:56:55 +00002195
2196/* Some handy functions local to this file. */
Chris Lattner6b695682007-08-16 15:56:55 +00002197
Craig Topper76f42462017-03-28 05:32:53 +00002198/* Returns the integer part with the least significant BITS set.
2199 BITS cannot be zero. */
Craig Topper55229b72017-04-02 19:17:22 +00002200static inline APInt::WordType lowBitMask(unsigned bits) {
2201 assert(bits != 0 && bits <= APInt::APINT_BITS_PER_WORD);
Chris Lattnerfe02c1f2007-08-20 22:49:32 +00002202
Craig Topper55229b72017-04-02 19:17:22 +00002203 return ~(APInt::WordType) 0 >> (APInt::APINT_BITS_PER_WORD - bits);
Craig Topper76f42462017-03-28 05:32:53 +00002204}
Chris Lattnerfe02c1f2007-08-20 22:49:32 +00002205
Craig Topper76f42462017-03-28 05:32:53 +00002206/* Returns the value of the lower half of PART. */
Craig Topper55229b72017-04-02 19:17:22 +00002207static inline APInt::WordType lowHalf(APInt::WordType part) {
2208 return part & lowBitMask(APInt::APINT_BITS_PER_WORD / 2);
Craig Topper76f42462017-03-28 05:32:53 +00002209}
Chris Lattnerfe02c1f2007-08-20 22:49:32 +00002210
Craig Topper76f42462017-03-28 05:32:53 +00002211/* Returns the value of the upper half of PART. */
Craig Topper55229b72017-04-02 19:17:22 +00002212static inline APInt::WordType highHalf(APInt::WordType part) {
2213 return part >> (APInt::APINT_BITS_PER_WORD / 2);
Craig Topper76f42462017-03-28 05:32:53 +00002214}
Chris Lattnerfe02c1f2007-08-20 22:49:32 +00002215
Craig Topper76f42462017-03-28 05:32:53 +00002216/* Returns the bit number of the most significant set bit of a part.
2217 If the input number has no bits set -1U is returned. */
Craig Topper55229b72017-04-02 19:17:22 +00002218static unsigned partMSB(APInt::WordType value) {
Craig Topper76f42462017-03-28 05:32:53 +00002219 return findLastSet(value, ZB_Max);
2220}
Chris Lattner6b695682007-08-16 15:56:55 +00002221
Craig Topper76f42462017-03-28 05:32:53 +00002222/* Returns the bit number of the least significant set bit of a
2223 part. If the input number has no bits set -1U is returned. */
Craig Topper55229b72017-04-02 19:17:22 +00002224static unsigned partLSB(APInt::WordType value) {
Craig Topper76f42462017-03-28 05:32:53 +00002225 return findFirstSet(value, ZB_Max);
Alexander Kornienkof00654e2015-06-23 09:49:53 +00002226}
Chris Lattner6b695682007-08-16 15:56:55 +00002227
2228/* Sets the least significant part of a bignum to the input value, and
2229 zeroes out higher parts. */
Craig Topper55229b72017-04-02 19:17:22 +00002230void APInt::tcSet(WordType *dst, WordType part, unsigned parts) {
Dan Gohmanb452d4e2010-03-24 19:38:02 +00002231 assert(parts > 0);
Neil Boothb6182162007-10-08 13:47:12 +00002232
Chris Lattner6b695682007-08-16 15:56:55 +00002233 dst[0] = part;
Craig Topperb0038162017-03-28 05:32:52 +00002234 for (unsigned i = 1; i < parts; i++)
Chris Lattner6b695682007-08-16 15:56:55 +00002235 dst[i] = 0;
2236}
2237
2238/* Assign one bignum to another. */
Craig Topper55229b72017-04-02 19:17:22 +00002239void APInt::tcAssign(WordType *dst, const WordType *src, unsigned parts) {
Craig Topperb0038162017-03-28 05:32:52 +00002240 for (unsigned i = 0; i < parts; i++)
Chris Lattner6b695682007-08-16 15:56:55 +00002241 dst[i] = src[i];
2242}
2243
2244/* Returns true if a bignum is zero, false otherwise. */
Craig Topper55229b72017-04-02 19:17:22 +00002245bool APInt::tcIsZero(const WordType *src, unsigned parts) {
Craig Topperb0038162017-03-28 05:32:52 +00002246 for (unsigned i = 0; i < parts; i++)
Chris Lattner6b695682007-08-16 15:56:55 +00002247 if (src[i])
2248 return false;
2249
2250 return true;
2251}
2252
2253/* Extract the given bit of a bignum; returns 0 or 1. */
Craig Topper55229b72017-04-02 19:17:22 +00002254int APInt::tcExtractBit(const WordType *parts, unsigned bit) {
Craig Topper00b47ee2017-04-02 19:35:18 +00002255 return (parts[whichWord(bit)] & maskBit(bit)) != 0;
Chris Lattner6b695682007-08-16 15:56:55 +00002256}
2257
John McCalldcb9a7a2010-02-28 02:51:25 +00002258/* Set the given bit of a bignum. */
Craig Topper55229b72017-04-02 19:17:22 +00002259void APInt::tcSetBit(WordType *parts, unsigned bit) {
Craig Topper00b47ee2017-04-02 19:35:18 +00002260 parts[whichWord(bit)] |= maskBit(bit);
Chris Lattner6b695682007-08-16 15:56:55 +00002261}
2262
John McCalldcb9a7a2010-02-28 02:51:25 +00002263/* Clears the given bit of a bignum. */
Craig Topper55229b72017-04-02 19:17:22 +00002264void APInt::tcClearBit(WordType *parts, unsigned bit) {
Craig Topper00b47ee2017-04-02 19:35:18 +00002265 parts[whichWord(bit)] &= ~maskBit(bit);
John McCalldcb9a7a2010-02-28 02:51:25 +00002266}
2267
Neil Boothc8b650a2007-10-06 00:43:45 +00002268/* Returns the bit number of the least significant set bit of a
2269 number. If the input number has no bits set -1U is returned. */
Craig Topper55229b72017-04-02 19:17:22 +00002270unsigned APInt::tcLSB(const WordType *parts, unsigned n) {
Craig Topperb0038162017-03-28 05:32:52 +00002271 for (unsigned i = 0; i < n; i++) {
2272 if (parts[i] != 0) {
2273 unsigned lsb = partLSB(parts[i]);
Chris Lattner6b695682007-08-16 15:56:55 +00002274
Craig Topper55229b72017-04-02 19:17:22 +00002275 return lsb + i * APINT_BITS_PER_WORD;
Craig Topperb0038162017-03-28 05:32:52 +00002276 }
Chris Lattner6b695682007-08-16 15:56:55 +00002277 }
2278
2279 return -1U;
2280}
2281
Neil Boothc8b650a2007-10-06 00:43:45 +00002282/* Returns the bit number of the most significant set bit of a number.
2283 If the input number has no bits set -1U is returned. */
Craig Topper55229b72017-04-02 19:17:22 +00002284unsigned APInt::tcMSB(const WordType *parts, unsigned n) {
Chris Lattner6b695682007-08-16 15:56:55 +00002285 do {
Dan Gohmanb452d4e2010-03-24 19:38:02 +00002286 --n;
Chris Lattner6b695682007-08-16 15:56:55 +00002287
Dan Gohmanb452d4e2010-03-24 19:38:02 +00002288 if (parts[n] != 0) {
Craig Topperb0038162017-03-28 05:32:52 +00002289 unsigned msb = partMSB(parts[n]);
Chris Lattner6b695682007-08-16 15:56:55 +00002290
Craig Topper55229b72017-04-02 19:17:22 +00002291 return msb + n * APINT_BITS_PER_WORD;
Dan Gohmanb452d4e2010-03-24 19:38:02 +00002292 }
Chris Lattner6b695682007-08-16 15:56:55 +00002293 } while (n);
2294
2295 return -1U;
2296}
2297
Neil Boothb6182162007-10-08 13:47:12 +00002298/* Copy the bit vector of width srcBITS from SRC, starting at bit
2299 srcLSB, to DST, of dstCOUNT parts, such that the bit srcLSB becomes
2300 the least significant bit of DST. All high bits above srcBITS in
2301 DST are zero-filled. */
2302void
Craig Topper55229b72017-04-02 19:17:22 +00002303APInt::tcExtract(WordType *dst, unsigned dstCount, const WordType *src,
Craig Topper6a8518082017-03-28 05:32:55 +00002304 unsigned srcBits, unsigned srcLSB) {
Craig Topper55229b72017-04-02 19:17:22 +00002305 unsigned dstParts = (srcBits + APINT_BITS_PER_WORD - 1) / APINT_BITS_PER_WORD;
Dan Gohmanb452d4e2010-03-24 19:38:02 +00002306 assert(dstParts <= dstCount);
Neil Boothb6182162007-10-08 13:47:12 +00002307
Craig Topper55229b72017-04-02 19:17:22 +00002308 unsigned firstSrcPart = srcLSB / APINT_BITS_PER_WORD;
Neil Boothb6182162007-10-08 13:47:12 +00002309 tcAssign (dst, src + firstSrcPart, dstParts);
2310
Craig Topper55229b72017-04-02 19:17:22 +00002311 unsigned shift = srcLSB % APINT_BITS_PER_WORD;
Neil Boothb6182162007-10-08 13:47:12 +00002312 tcShiftRight (dst, dstParts, shift);
2313
Craig Topper55229b72017-04-02 19:17:22 +00002314 /* We now have (dstParts * APINT_BITS_PER_WORD - shift) bits from SRC
Neil Boothb6182162007-10-08 13:47:12 +00002315 in DST. If this is less that srcBits, append the rest, else
2316 clear the high bits. */
Craig Topper55229b72017-04-02 19:17:22 +00002317 unsigned n = dstParts * APINT_BITS_PER_WORD - shift;
Neil Boothb6182162007-10-08 13:47:12 +00002318 if (n < srcBits) {
Craig Topper55229b72017-04-02 19:17:22 +00002319 WordType mask = lowBitMask (srcBits - n);
Neil Boothb6182162007-10-08 13:47:12 +00002320 dst[dstParts - 1] |= ((src[firstSrcPart + dstParts] & mask)
Craig Topper55229b72017-04-02 19:17:22 +00002321 << n % APINT_BITS_PER_WORD);
Neil Boothb6182162007-10-08 13:47:12 +00002322 } else if (n > srcBits) {
Craig Topper55229b72017-04-02 19:17:22 +00002323 if (srcBits % APINT_BITS_PER_WORD)
2324 dst[dstParts - 1] &= lowBitMask (srcBits % APINT_BITS_PER_WORD);
Neil Boothb6182162007-10-08 13:47:12 +00002325 }
2326
2327 /* Clear high parts. */
2328 while (dstParts < dstCount)
2329 dst[dstParts++] = 0;
2330}
2331
Chris Lattner6b695682007-08-16 15:56:55 +00002332/* DST += RHS + C where C is zero or one. Returns the carry flag. */
Craig Topper55229b72017-04-02 19:17:22 +00002333APInt::WordType APInt::tcAdd(WordType *dst, const WordType *rhs,
2334 WordType c, unsigned parts) {
Chris Lattner6b695682007-08-16 15:56:55 +00002335 assert(c <= 1);
2336
Craig Topperb0038162017-03-28 05:32:52 +00002337 for (unsigned i = 0; i < parts; i++) {
Craig Topper55229b72017-04-02 19:17:22 +00002338 WordType l = dst[i];
Chris Lattner6b695682007-08-16 15:56:55 +00002339 if (c) {
2340 dst[i] += rhs[i] + 1;
2341 c = (dst[i] <= l);
2342 } else {
2343 dst[i] += rhs[i];
2344 c = (dst[i] < l);
2345 }
2346 }
2347
2348 return c;
2349}
2350
Craig Topper92fc4772017-04-13 04:36:06 +00002351/// This function adds a single "word" integer, src, to the multiple
2352/// "word" integer array, dst[]. dst[] is modified to reflect the addition and
2353/// 1 is returned if there is a carry out, otherwise 0 is returned.
2354/// @returns the carry of the addition.
2355APInt::WordType APInt::tcAddPart(WordType *dst, WordType src,
2356 unsigned parts) {
2357 for (unsigned i = 0; i < parts; ++i) {
2358 dst[i] += src;
2359 if (dst[i] >= src)
2360 return 0; // No need to carry so exit early.
2361 src = 1; // Carry one to next digit.
2362 }
2363
2364 return 1;
2365}
2366
Chris Lattner6b695682007-08-16 15:56:55 +00002367/* DST -= RHS + C where C is zero or one. Returns the carry flag. */
Craig Topper55229b72017-04-02 19:17:22 +00002368APInt::WordType APInt::tcSubtract(WordType *dst, const WordType *rhs,
2369 WordType c, unsigned parts) {
Chris Lattner6b695682007-08-16 15:56:55 +00002370 assert(c <= 1);
2371
Craig Topperb0038162017-03-28 05:32:52 +00002372 for (unsigned i = 0; i < parts; i++) {
Craig Topper55229b72017-04-02 19:17:22 +00002373 WordType l = dst[i];
Chris Lattner6b695682007-08-16 15:56:55 +00002374 if (c) {
2375 dst[i] -= rhs[i] + 1;
2376 c = (dst[i] >= l);
2377 } else {
2378 dst[i] -= rhs[i];
2379 c = (dst[i] > l);
2380 }
2381 }
2382
2383 return c;
2384}
2385
Craig Topper92fc4772017-04-13 04:36:06 +00002386/// This function subtracts a single "word" (64-bit word), src, from
2387/// the multi-word integer array, dst[], propagating the borrowed 1 value until
2388/// no further borrowing is needed or it runs out of "words" in dst. The result
2389/// is 1 if "borrowing" exhausted the digits in dst, or 0 if dst was not
2390/// exhausted. In other words, if src > dst then this function returns 1,
2391/// otherwise 0.
2392/// @returns the borrow out of the subtraction
2393APInt::WordType APInt::tcSubtractPart(WordType *dst, WordType src,
2394 unsigned parts) {
2395 for (unsigned i = 0; i < parts; ++i) {
2396 WordType Dst = dst[i];
2397 dst[i] -= src;
2398 if (src <= Dst)
2399 return 0; // No need to borrow so exit early.
2400 src = 1; // We have to "borrow 1" from next "word"
2401 }
2402
2403 return 1;
2404}
2405
Chris Lattner6b695682007-08-16 15:56:55 +00002406/* Negate a bignum in-place. */
Craig Topper55229b72017-04-02 19:17:22 +00002407void APInt::tcNegate(WordType *dst, unsigned parts) {
Chris Lattner6b695682007-08-16 15:56:55 +00002408 tcComplement(dst, parts);
2409 tcIncrement(dst, parts);
2410}
2411
Neil Boothc8b650a2007-10-06 00:43:45 +00002412/* DST += SRC * MULTIPLIER + CARRY if add is true
2413 DST = SRC * MULTIPLIER + CARRY if add is false
Chris Lattner6b695682007-08-16 15:56:55 +00002414
2415 Requires 0 <= DSTPARTS <= SRCPARTS + 1. If DST overlaps SRC
2416 they must start at the same point, i.e. DST == SRC.
2417
2418 If DSTPARTS == SRCPARTS + 1 no overflow occurs and zero is
2419 returned. Otherwise DST is filled with the least significant
2420 DSTPARTS parts of the result, and if all of the omitted higher
2421 parts were zero return zero, otherwise overflow occurred and
2422 return one. */
Craig Topper55229b72017-04-02 19:17:22 +00002423int APInt::tcMultiplyPart(WordType *dst, const WordType *src,
2424 WordType multiplier, WordType carry,
Craig Topper6a8518082017-03-28 05:32:55 +00002425 unsigned srcParts, unsigned dstParts,
2426 bool add) {
Chris Lattner6b695682007-08-16 15:56:55 +00002427 /* Otherwise our writes of DST kill our later reads of SRC. */
2428 assert(dst <= src || dst >= src + srcParts);
2429 assert(dstParts <= srcParts + 1);
2430
2431 /* N loops; minimum of dstParts and srcParts. */
Craig Topper0cbab7c2017-05-08 06:34:39 +00002432 unsigned n = std::min(dstParts, srcParts);
Chris Lattner6b695682007-08-16 15:56:55 +00002433
Craig Topperc96a84d2017-05-08 06:34:41 +00002434 for (unsigned i = 0; i < n; i++) {
Craig Topper55229b72017-04-02 19:17:22 +00002435 WordType low, mid, high, srcPart;
Chris Lattner6b695682007-08-16 15:56:55 +00002436
2437 /* [ LOW, HIGH ] = MULTIPLIER * SRC[i] + DST[i] + CARRY.
2438
2439 This cannot overflow, because
2440
2441 (n - 1) * (n - 1) + 2 (n - 1) = (n - 1) * (n + 1)
2442
2443 which is less than n^2. */
2444
2445 srcPart = src[i];
2446
Craig Topper6a8518082017-03-28 05:32:55 +00002447 if (multiplier == 0 || srcPart == 0) {
Chris Lattner6b695682007-08-16 15:56:55 +00002448 low = carry;
2449 high = 0;
2450 } else {
2451 low = lowHalf(srcPart) * lowHalf(multiplier);
2452 high = highHalf(srcPart) * highHalf(multiplier);
2453
2454 mid = lowHalf(srcPart) * highHalf(multiplier);
2455 high += highHalf(mid);
Craig Topper55229b72017-04-02 19:17:22 +00002456 mid <<= APINT_BITS_PER_WORD / 2;
Chris Lattner6b695682007-08-16 15:56:55 +00002457 if (low + mid < low)
2458 high++;
2459 low += mid;
2460
2461 mid = highHalf(srcPart) * lowHalf(multiplier);
2462 high += highHalf(mid);
Craig Topper55229b72017-04-02 19:17:22 +00002463 mid <<= APINT_BITS_PER_WORD / 2;
Chris Lattner6b695682007-08-16 15:56:55 +00002464 if (low + mid < low)
2465 high++;
2466 low += mid;
2467
2468 /* Now add carry. */
2469 if (low + carry < low)
2470 high++;
2471 low += carry;
2472 }
2473
2474 if (add) {
2475 /* And now DST[i], and store the new low part there. */
2476 if (low + dst[i] < low)
2477 high++;
2478 dst[i] += low;
2479 } else
2480 dst[i] = low;
2481
2482 carry = high;
2483 }
2484
Craig Topperc96a84d2017-05-08 06:34:41 +00002485 if (srcParts < dstParts) {
Chris Lattner6b695682007-08-16 15:56:55 +00002486 /* Full multiplication, there is no overflow. */
Craig Topperc96a84d2017-05-08 06:34:41 +00002487 assert(srcParts + 1 == dstParts);
2488 dst[srcParts] = carry;
Chris Lattner6b695682007-08-16 15:56:55 +00002489 return 0;
Chris Lattner6b695682007-08-16 15:56:55 +00002490 }
Craig Toppera6c142a2017-05-08 06:34:36 +00002491
2492 /* We overflowed if there is carry. */
2493 if (carry)
2494 return 1;
2495
2496 /* We would overflow if any significant unwritten parts would be
2497 non-zero. This is true if any remaining src parts are non-zero
2498 and the multiplier is non-zero. */
2499 if (multiplier)
Craig Topperc96a84d2017-05-08 06:34:41 +00002500 for (unsigned i = dstParts; i < srcParts; i++)
Craig Toppera6c142a2017-05-08 06:34:36 +00002501 if (src[i])
2502 return 1;
2503
2504 /* We fitted in the narrow destination. */
2505 return 0;
Chris Lattner6b695682007-08-16 15:56:55 +00002506}
2507
2508/* DST = LHS * RHS, where DST has the same width as the operands and
2509 is filled with the least significant parts of the result. Returns
2510 one if overflow occurred, otherwise zero. DST must be disjoint
2511 from both operands. */
Craig Topper55229b72017-04-02 19:17:22 +00002512int APInt::tcMultiply(WordType *dst, const WordType *lhs,
2513 const WordType *rhs, unsigned parts) {
Chris Lattner6b695682007-08-16 15:56:55 +00002514 assert(dst != lhs && dst != rhs);
2515
Craig Topperb0038162017-03-28 05:32:52 +00002516 int overflow = 0;
Chris Lattner6b695682007-08-16 15:56:55 +00002517 tcSet(dst, 0, parts);
2518
Craig Topperb0038162017-03-28 05:32:52 +00002519 for (unsigned i = 0; i < parts; i++)
Chris Lattner6b695682007-08-16 15:56:55 +00002520 overflow |= tcMultiplyPart(&dst[i], lhs, rhs[i], 0, parts,
2521 parts - i, true);
2522
2523 return overflow;
2524}
2525
Craig Topper0acb6652017-05-09 16:47:33 +00002526/// DST = LHS * RHS, where DST has width the sum of the widths of the
2527/// operands. No overflow occurs. DST must be disjoint from both operands.
2528void APInt::tcFullMultiply(WordType *dst, const WordType *lhs,
2529 const WordType *rhs, unsigned lhsParts,
2530 unsigned rhsParts) {
Neil Booth0ea72a92007-10-06 00:24:48 +00002531 /* Put the narrower number on the LHS for less loops below. */
Craig Toppera6c142a2017-05-08 06:34:36 +00002532 if (lhsParts > rhsParts)
Neil Booth0ea72a92007-10-06 00:24:48 +00002533 return tcFullMultiply (dst, rhs, lhs, rhsParts, lhsParts);
Chris Lattner6b695682007-08-16 15:56:55 +00002534
Craig Toppera6c142a2017-05-08 06:34:36 +00002535 assert(dst != lhs && dst != rhs);
Chris Lattner6b695682007-08-16 15:56:55 +00002536
Craig Toppera6c142a2017-05-08 06:34:36 +00002537 tcSet(dst, 0, rhsParts);
Chris Lattner6b695682007-08-16 15:56:55 +00002538
Craig Toppera6c142a2017-05-08 06:34:36 +00002539 for (unsigned i = 0; i < lhsParts; i++)
2540 tcMultiplyPart(&dst[i], rhs, lhs[i], 0, rhsParts, rhsParts + 1, true);
Chris Lattner6b695682007-08-16 15:56:55 +00002541}
2542
2543/* If RHS is zero LHS and REMAINDER are left unchanged, return one.
2544 Otherwise set LHS to LHS / RHS with the fractional part discarded,
2545 set REMAINDER to the remainder, return zero. i.e.
2546
2547 OLD_LHS = RHS * LHS + REMAINDER
2548
2549 SCRATCH is a bignum of the same size as the operands and result for
2550 use by the routine; its contents need not be initialized and are
2551 destroyed. LHS, REMAINDER and SCRATCH must be distinct.
2552*/
Craig Topper55229b72017-04-02 19:17:22 +00002553int APInt::tcDivide(WordType *lhs, const WordType *rhs,
2554 WordType *remainder, WordType *srhs,
Craig Topper6a8518082017-03-28 05:32:55 +00002555 unsigned parts) {
Chris Lattner6b695682007-08-16 15:56:55 +00002556 assert(lhs != remainder && lhs != srhs && remainder != srhs);
2557
Craig Topperb0038162017-03-28 05:32:52 +00002558 unsigned shiftCount = tcMSB(rhs, parts) + 1;
Chris Lattnerfe02c1f2007-08-20 22:49:32 +00002559 if (shiftCount == 0)
Chris Lattner6b695682007-08-16 15:56:55 +00002560 return true;
2561
Craig Topper55229b72017-04-02 19:17:22 +00002562 shiftCount = parts * APINT_BITS_PER_WORD - shiftCount;
2563 unsigned n = shiftCount / APINT_BITS_PER_WORD;
2564 WordType mask = (WordType) 1 << (shiftCount % APINT_BITS_PER_WORD);
Chris Lattner6b695682007-08-16 15:56:55 +00002565
2566 tcAssign(srhs, rhs, parts);
2567 tcShiftLeft(srhs, parts, shiftCount);
2568 tcAssign(remainder, lhs, parts);
2569 tcSet(lhs, 0, parts);
2570
2571 /* Loop, subtracting SRHS if REMAINDER is greater and adding that to
2572 the total. */
Dan Gohmanb452d4e2010-03-24 19:38:02 +00002573 for (;;) {
Craig Toppera584af52017-05-10 07:50:17 +00002574 int compare = tcCompare(remainder, srhs, parts);
2575 if (compare >= 0) {
2576 tcSubtract(remainder, srhs, 0, parts);
2577 lhs[n] |= mask;
2578 }
Chris Lattner6b695682007-08-16 15:56:55 +00002579
Craig Toppera584af52017-05-10 07:50:17 +00002580 if (shiftCount == 0)
2581 break;
2582 shiftCount--;
2583 tcShiftRight(srhs, parts, 1);
2584 if ((mask >>= 1) == 0) {
2585 mask = (WordType) 1 << (APINT_BITS_PER_WORD - 1);
2586 n--;
2587 }
Chris Lattner6b695682007-08-16 15:56:55 +00002588 }
2589
2590 return false;
2591}
2592
Craig Toppera8a4f0d2017-04-18 04:39:48 +00002593/// Shift a bignum left Cound bits in-place. Shifted in bits are zero. There are
2594/// no restrictions on Count.
2595void APInt::tcShiftLeft(WordType *Dst, unsigned Words, unsigned Count) {
2596 // Don't bother performing a no-op shift.
2597 if (!Count)
2598 return;
Chris Lattner6b695682007-08-16 15:56:55 +00002599
Craig Topperc6b05682017-04-24 17:00:22 +00002600 // WordShift is the inter-part shift; BitShift is the intra-part shift.
Craig Toppera8a4f0d2017-04-18 04:39:48 +00002601 unsigned WordShift = std::min(Count / APINT_BITS_PER_WORD, Words);
2602 unsigned BitShift = Count % APINT_BITS_PER_WORD;
Chris Lattner6b695682007-08-16 15:56:55 +00002603
Craig Toppera8a4f0d2017-04-18 04:39:48 +00002604 // Fastpath for moving by whole words.
2605 if (BitShift == 0) {
2606 std::memmove(Dst + WordShift, Dst, (Words - WordShift) * APINT_WORD_SIZE);
2607 } else {
2608 while (Words-- > WordShift) {
2609 Dst[Words] = Dst[Words - WordShift] << BitShift;
2610 if (Words > WordShift)
2611 Dst[Words] |=
2612 Dst[Words - WordShift - 1] >> (APINT_BITS_PER_WORD - BitShift);
Neil Boothb6182162007-10-08 13:47:12 +00002613 }
Neil Boothb6182162007-10-08 13:47:12 +00002614 }
Craig Toppera8a4f0d2017-04-18 04:39:48 +00002615
2616 // Fill in the remainder with 0s.
2617 std::memset(Dst, 0, WordShift * APINT_WORD_SIZE);
Chris Lattner6b695682007-08-16 15:56:55 +00002618}
2619
Craig Topper9575d8f2017-04-17 21:43:43 +00002620/// Shift a bignum right Count bits in-place. Shifted in bits are zero. There
2621/// are no restrictions on Count.
2622void APInt::tcShiftRight(WordType *Dst, unsigned Words, unsigned Count) {
2623 // Don't bother performing a no-op shift.
2624 if (!Count)
2625 return;
Chris Lattner6b695682007-08-16 15:56:55 +00002626
Craig Topperc6b05682017-04-24 17:00:22 +00002627 // WordShift is the inter-part shift; BitShift is the intra-part shift.
Craig Topper9575d8f2017-04-17 21:43:43 +00002628 unsigned WordShift = std::min(Count / APINT_BITS_PER_WORD, Words);
2629 unsigned BitShift = Count % APINT_BITS_PER_WORD;
Chris Lattner6b695682007-08-16 15:56:55 +00002630
Craig Topper9575d8f2017-04-17 21:43:43 +00002631 unsigned WordsToMove = Words - WordShift;
2632 // Fastpath for moving by whole words.
2633 if (BitShift == 0) {
2634 std::memmove(Dst, Dst + WordShift, WordsToMove * APINT_WORD_SIZE);
2635 } else {
2636 for (unsigned i = 0; i != WordsToMove; ++i) {
2637 Dst[i] = Dst[i + WordShift] >> BitShift;
2638 if (i + 1 != WordsToMove)
2639 Dst[i] |= Dst[i + WordShift + 1] << (APINT_BITS_PER_WORD - BitShift);
Neil Boothb6182162007-10-08 13:47:12 +00002640 }
Chris Lattner6b695682007-08-16 15:56:55 +00002641 }
Craig Topper9575d8f2017-04-17 21:43:43 +00002642
2643 // Fill in the remainder with 0s.
2644 std::memset(Dst + WordsToMove, 0, WordShift * APINT_WORD_SIZE);
Chris Lattner6b695682007-08-16 15:56:55 +00002645}
2646
2647/* Bitwise and of two bignums. */
Craig Topper55229b72017-04-02 19:17:22 +00002648void APInt::tcAnd(WordType *dst, const WordType *rhs, unsigned parts) {
Craig Topperb0038162017-03-28 05:32:52 +00002649 for (unsigned i = 0; i < parts; i++)
Chris Lattner6b695682007-08-16 15:56:55 +00002650 dst[i] &= rhs[i];
2651}
2652
2653/* Bitwise inclusive or of two bignums. */
Craig Topper55229b72017-04-02 19:17:22 +00002654void APInt::tcOr(WordType *dst, const WordType *rhs, unsigned parts) {
Craig Topperb0038162017-03-28 05:32:52 +00002655 for (unsigned i = 0; i < parts; i++)
Chris Lattner6b695682007-08-16 15:56:55 +00002656 dst[i] |= rhs[i];
2657}
2658
2659/* Bitwise exclusive or of two bignums. */
Craig Topper55229b72017-04-02 19:17:22 +00002660void APInt::tcXor(WordType *dst, const WordType *rhs, unsigned parts) {
Craig Topperb0038162017-03-28 05:32:52 +00002661 for (unsigned i = 0; i < parts; i++)
Chris Lattner6b695682007-08-16 15:56:55 +00002662 dst[i] ^= rhs[i];
2663}
2664
2665/* Complement a bignum in-place. */
Craig Topper55229b72017-04-02 19:17:22 +00002666void APInt::tcComplement(WordType *dst, unsigned parts) {
Craig Topperb0038162017-03-28 05:32:52 +00002667 for (unsigned i = 0; i < parts; i++)
Chris Lattner6b695682007-08-16 15:56:55 +00002668 dst[i] = ~dst[i];
2669}
2670
2671/* Comparison (unsigned) of two bignums. */
Craig Topper55229b72017-04-02 19:17:22 +00002672int APInt::tcCompare(const WordType *lhs, const WordType *rhs,
Craig Topper6a8518082017-03-28 05:32:55 +00002673 unsigned parts) {
Chris Lattner6b695682007-08-16 15:56:55 +00002674 while (parts) {
Craig Topper99cfe4f2017-04-01 21:50:06 +00002675 parts--;
Craig Topper1dc8fc82017-04-21 16:13:15 +00002676 if (lhs[parts] != rhs[parts])
2677 return (lhs[parts] > rhs[parts]) ? 1 : -1;
Craig Topper99cfe4f2017-04-01 21:50:06 +00002678 }
Chris Lattner6b695682007-08-16 15:56:55 +00002679
2680 return 0;
2681}
2682
Chris Lattner6b695682007-08-16 15:56:55 +00002683/* Set the least significant BITS bits of a bignum, clear the
2684 rest. */
Craig Topper55229b72017-04-02 19:17:22 +00002685void APInt::tcSetLeastSignificantBits(WordType *dst, unsigned parts,
Craig Topper6a8518082017-03-28 05:32:55 +00002686 unsigned bits) {
Craig Topperb0038162017-03-28 05:32:52 +00002687 unsigned i = 0;
Craig Topper55229b72017-04-02 19:17:22 +00002688 while (bits > APINT_BITS_PER_WORD) {
2689 dst[i++] = ~(WordType) 0;
2690 bits -= APINT_BITS_PER_WORD;
Chris Lattner6b695682007-08-16 15:56:55 +00002691 }
2692
2693 if (bits)
Craig Topper55229b72017-04-02 19:17:22 +00002694 dst[i++] = ~(WordType) 0 >> (APINT_BITS_PER_WORD - bits);
Chris Lattner6b695682007-08-16 15:56:55 +00002695
2696 while (i < parts)
2697 dst[i++] = 0;
2698}
Tim Shen802c31c2018-06-25 23:49:20 +00002699
2700APInt llvm::APIntOps::RoundingUDiv(const APInt &A, const APInt &B,
2701 APInt::Rounding RM) {
2702 // Currently udivrem always rounds down.
2703 switch (RM) {
2704 case APInt::Rounding::DOWN:
2705 case APInt::Rounding::TOWARD_ZERO:
2706 return A.udiv(B);
2707 case APInt::Rounding::UP: {
2708 APInt Quo, Rem;
2709 APInt::udivrem(A, B, Quo, Rem);
2710 if (Rem == 0)
2711 return Quo;
2712 return Quo + 1;
2713 }
2714 }
Simon Pilgrim9b3b0fe2018-06-26 09:31:18 +00002715 llvm_unreachable("Unknown APInt::Rounding enum");
Tim Shen802c31c2018-06-25 23:49:20 +00002716}
2717
2718APInt llvm::APIntOps::RoundingSDiv(const APInt &A, const APInt &B,
2719 APInt::Rounding RM) {
2720 switch (RM) {
2721 case APInt::Rounding::DOWN:
2722 case APInt::Rounding::UP: {
2723 APInt Quo, Rem;
2724 APInt::sdivrem(A, B, Quo, Rem);
2725 if (Rem == 0)
2726 return Quo;
2727 // This algorithm deals with arbitrary rounding mode used by sdivrem.
2728 // We want to check whether the non-integer part of the mathematical value
2729 // is negative or not. If the non-integer part is negative, we need to round
2730 // down from Quo; otherwise, if it's positive or 0, we return Quo, as it's
2731 // already rounded down.
2732 if (RM == APInt::Rounding::DOWN) {
2733 if (Rem.isNegative() != B.isNegative())
2734 return Quo - 1;
2735 return Quo;
2736 }
2737 if (Rem.isNegative() != B.isNegative())
2738 return Quo;
2739 return Quo + 1;
2740 }
2741 // Currently sdiv rounds twards zero.
2742 case APInt::Rounding::TOWARD_ZERO:
2743 return A.sdiv(B);
2744 }
Simon Pilgrim9b3b0fe2018-06-26 09:31:18 +00002745 llvm_unreachable("Unknown APInt::Rounding enum");
Tim Shen802c31c2018-06-25 23:49:20 +00002746}
Krzysztof Parzyszek90f32492018-08-02 19:13:35 +00002747
2748Optional<APInt>
2749llvm::APIntOps::SolveQuadraticEquationWrap(APInt A, APInt B, APInt C,
2750 unsigned RangeWidth) {
2751 unsigned CoeffWidth = A.getBitWidth();
2752 assert(CoeffWidth == B.getBitWidth() && CoeffWidth == C.getBitWidth());
2753 assert(RangeWidth <= CoeffWidth &&
2754 "Value range width should be less than coefficient width");
2755 assert(RangeWidth > 1 && "Value range bit width should be > 1");
2756
2757 LLVM_DEBUG(dbgs() << __func__ << ": solving " << A << "x^2 + " << B
2758 << "x + " << C << ", rw:" << RangeWidth << '\n');
2759
2760 // Identify 0 as a (non)solution immediately.
2761 if (C.sextOrTrunc(RangeWidth).isNullValue() ) {
2762 LLVM_DEBUG(dbgs() << __func__ << ": zero solution\n");
2763 return APInt(CoeffWidth, 0);
2764 }
2765
2766 // The result of APInt arithmetic has the same bit width as the operands,
2767 // so it can actually lose high bits. A product of two n-bit integers needs
2768 // 2n-1 bits to represent the full value.
2769 // The operation done below (on quadratic coefficients) that can produce
2770 // the largest value is the evaluation of the equation during bisection,
2771 // which needs 3 times the bitwidth of the coefficient, so the total number
2772 // of required bits is 3n.
2773 //
2774 // The purpose of this extension is to simulate the set Z of all integers,
2775 // where n+1 > n for all n in Z. In Z it makes sense to talk about positive
2776 // and negative numbers (not so much in a modulo arithmetic). The method
2777 // used to solve the equation is based on the standard formula for real
2778 // numbers, and uses the concepts of "positive" and "negative" with their
2779 // usual meanings.
2780 CoeffWidth *= 3;
2781 A = A.sext(CoeffWidth);
2782 B = B.sext(CoeffWidth);
2783 C = C.sext(CoeffWidth);
2784
2785 // Make A > 0 for simplicity. Negate cannot overflow at this point because
2786 // the bit width has increased.
2787 if (A.isNegative()) {
2788 A.negate();
2789 B.negate();
2790 C.negate();
2791 }
2792
2793 // Solving an equation q(x) = 0 with coefficients in modular arithmetic
2794 // is really solving a set of equations q(x) = kR for k = 0, 1, 2, ...,
2795 // and R = 2^BitWidth.
2796 // Since we're trying not only to find exact solutions, but also values
2797 // that "wrap around", such a set will always have a solution, i.e. an x
2798 // that satisfies at least one of the equations, or such that |q(x)|
2799 // exceeds kR, while |q(x-1)| for the same k does not.
2800 //
2801 // We need to find a value k, such that Ax^2 + Bx + C = kR will have a
2802 // positive solution n (in the above sense), and also such that the n
2803 // will be the least among all solutions corresponding to k = 0, 1, ...
2804 // (more precisely, the least element in the set
2805 // { n(k) | k is such that a solution n(k) exists }).
2806 //
2807 // Consider the parabola (over real numbers) that corresponds to the
2808 // quadratic equation. Since A > 0, the arms of the parabola will point
2809 // up. Picking different values of k will shift it up and down by R.
2810 //
2811 // We want to shift the parabola in such a way as to reduce the problem
2812 // of solving q(x) = kR to solving shifted_q(x) = 0.
2813 // (The interesting solutions are the ceilings of the real number
2814 // solutions.)
2815 APInt R = APInt::getOneBitSet(CoeffWidth, RangeWidth);
2816 APInt TwoA = 2 * A;
2817 APInt SqrB = B * B;
2818 bool PickLow;
2819
Krzysztof Parzyszekdfd5fad2018-08-02 19:38:18 +00002820 auto RoundUp = [] (const APInt &V, const APInt &A) -> APInt {
Krzysztof Parzyszek90f32492018-08-02 19:13:35 +00002821 assert(A.isStrictlyPositive());
2822 APInt T = V.abs().urem(A);
2823 if (T.isNullValue())
2824 return V;
2825 return V.isNegative() ? V+T : V+(A-T);
2826 };
2827
2828 // The vertex of the parabola is at -B/2A, but since A > 0, it's negative
2829 // iff B is positive.
2830 if (B.isNonNegative()) {
2831 // If B >= 0, the vertex it at a negative location (or at 0), so in
2832 // order to have a non-negative solution we need to pick k that makes
2833 // C-kR negative. To satisfy all the requirements for the solution
2834 // that we are looking for, it needs to be closest to 0 of all k.
2835 C = C.srem(R);
2836 if (C.isStrictlyPositive())
2837 C -= R;
2838 // Pick the greater solution.
2839 PickLow = false;
2840 } else {
2841 // If B < 0, the vertex is at a positive location. For any solution
2842 // to exist, the discriminant must be non-negative. This means that
2843 // C-kR <= B^2/4A is a necessary condition for k, i.e. there is a
2844 // lower bound on values of k: kR >= C - B^2/4A.
2845 APInt LowkR = C - SqrB.udiv(2*TwoA); // udiv because all values > 0.
2846 // Round LowkR up (towards +inf) to the nearest kR.
2847 LowkR = RoundUp(LowkR, R);
2848
2849 // If there exists k meeting the condition above, and such that
2850 // C-kR > 0, there will be two positive real number solutions of
2851 // q(x) = kR. Out of all such values of k, pick the one that makes
2852 // C-kR closest to 0, (i.e. pick maximum k such that C-kR > 0).
2853 // In other words, find maximum k such that LowkR <= kR < C.
2854 if (C.sgt(LowkR)) {
2855 // If LowkR < C, then such a k is guaranteed to exist because
2856 // LowkR itself is a multiple of R.
2857 C -= -RoundUp(-C, R); // C = C - RoundDown(C, R)
2858 // Pick the smaller solution.
2859 PickLow = true;
2860 } else {
2861 // If C-kR < 0 for all potential k's, it means that one solution
2862 // will be negative, while the other will be positive. The positive
2863 // solution will shift towards 0 if the parabola is moved up.
2864 // Pick the kR closest to the lower bound (i.e. make C-kR closest
2865 // to 0, or in other words, out of all parabolas that have solutions,
2866 // pick the one that is the farthest "up").
2867 // Since LowkR is itself a multiple of R, simply take C-LowkR.
2868 C -= LowkR;
2869 // Pick the greater solution.
2870 PickLow = false;
2871 }
2872 }
2873
2874 LLVM_DEBUG(dbgs() << __func__ << ": updated coefficients " << A << "x^2 + "
2875 << B << "x + " << C << ", rw:" << RangeWidth << '\n');
2876
2877 APInt D = SqrB - 4*A*C;
2878 assert(D.isNonNegative() && "Negative discriminant");
2879 APInt SQ = D.sqrt();
2880
2881 APInt Q = SQ * SQ;
2882 bool InexactSQ = Q != D;
2883 // The calculated SQ may actually be greater than the exact (non-integer)
2884 // value. If that's the case, decremement SQ to get a value that is lower.
2885 if (Q.sgt(D))
2886 SQ -= 1;
2887
2888 APInt X;
2889 APInt Rem;
2890
2891 // SQ is rounded down (i.e SQ * SQ <= D), so the roots may be inexact.
2892 // When using the quadratic formula directly, the calculated low root
2893 // may be greater than the exact one, since we would be subtracting SQ.
2894 // To make sure that the calculated root is not greater than the exact
2895 // one, subtract SQ+1 when calculating the low root (for inexact value
2896 // of SQ).
2897 if (PickLow)
2898 APInt::sdivrem(-B - (SQ+InexactSQ), TwoA, X, Rem);
2899 else
2900 APInt::sdivrem(-B + SQ, TwoA, X, Rem);
2901
2902 // The updated coefficients should be such that the (exact) solution is
2903 // positive. Since APInt division rounds towards 0, the calculated one
2904 // can be 0, but cannot be negative.
2905 assert(X.isNonNegative() && "Solution should be non-negative");
2906
2907 if (!InexactSQ && Rem.isNullValue()) {
2908 LLVM_DEBUG(dbgs() << __func__ << ": solution (root): " << X << '\n');
2909 return X;
2910 }
2911
2912 assert((SQ*SQ).sle(D) && "SQ = |_sqrt(D)_|, so SQ*SQ <= D");
2913 // The exact value of the square root of D should be between SQ and SQ+1.
2914 // This implies that the solution should be between that corresponding to
2915 // SQ (i.e. X) and that corresponding to SQ+1.
2916 //
2917 // The calculated X cannot be greater than the exact (real) solution.
2918 // Actually it must be strictly less than the exact solution, while
2919 // X+1 will be greater than or equal to it.
2920
2921 APInt VX = (A*X + B)*X + C;
2922 APInt VY = VX + TwoA*X + A + B;
2923 bool SignChange = VX.isNegative() != VY.isNegative() ||
2924 VX.isNullValue() != VY.isNullValue();
2925 // If the sign did not change between X and X+1, X is not a valid solution.
2926 // This could happen when the actual (exact) roots don't have an integer
2927 // between them, so they would both be contained between X and X+1.
2928 if (!SignChange) {
2929 LLVM_DEBUG(dbgs() << __func__ << ": no valid solution\n");
2930 return None;
2931 }
2932
2933 X += 1;
2934 LLVM_DEBUG(dbgs() << __func__ << ": solution (wrap): " << X << '\n');
2935 return X;
2936}
Erik Pilkingtoneee944e2019-07-02 18:28:13 +00002937
2938/// StoreIntToMemory - Fills the StoreBytes bytes of memory starting from Dst
2939/// with the integer held in IntVal.
2940void llvm::StoreIntToMemory(const APInt &IntVal, uint8_t *Dst,
2941 unsigned StoreBytes) {
2942 assert((IntVal.getBitWidth()+7)/8 >= StoreBytes && "Integer too small!");
2943 const uint8_t *Src = (const uint8_t *)IntVal.getRawData();
2944
2945 if (sys::IsLittleEndianHost) {
2946 // Little-endian host - the source is ordered from LSB to MSB. Order the
2947 // destination from LSB to MSB: Do a straight copy.
2948 memcpy(Dst, Src, StoreBytes);
2949 } else {
2950 // Big-endian host - the source is an array of 64 bit words ordered from
2951 // LSW to MSW. Each word is ordered from MSB to LSB. Order the destination
2952 // from MSB to LSB: Reverse the word order, but not the bytes in a word.
2953 while (StoreBytes > sizeof(uint64_t)) {
2954 StoreBytes -= sizeof(uint64_t);
2955 // May not be aligned so use memcpy.
2956 memcpy(Dst + StoreBytes, Src, sizeof(uint64_t));
2957 Src += sizeof(uint64_t);
2958 }
2959
2960 memcpy(Dst, Src + sizeof(uint64_t) - StoreBytes, StoreBytes);
2961 }
2962}
2963
2964/// LoadIntFromMemory - Loads the integer stored in the LoadBytes bytes starting
2965/// from Src into IntVal, which is assumed to be wide enough and to hold zero.
2966void llvm::LoadIntFromMemory(APInt &IntVal, uint8_t *Src, unsigned LoadBytes) {
2967 assert((IntVal.getBitWidth()+7)/8 >= LoadBytes && "Integer too small!");
2968 uint8_t *Dst = reinterpret_cast<uint8_t *>(
2969 const_cast<uint64_t *>(IntVal.getRawData()));
2970
2971 if (sys::IsLittleEndianHost)
2972 // Little-endian host - the destination must be ordered from LSB to MSB.
2973 // The source is ordered from LSB to MSB: Do a straight copy.
2974 memcpy(Dst, Src, LoadBytes);
2975 else {
2976 // Big-endian - the destination is an array of 64 bit words ordered from
2977 // LSW to MSW. Each word must be ordered from MSB to LSB. The source is
2978 // ordered from MSB to LSB: Reverse the word order, but not the bytes in
2979 // a word.
2980 while (LoadBytes > sizeof(uint64_t)) {
2981 LoadBytes -= sizeof(uint64_t);
2982 // May not be aligned so use memcpy.
2983 memcpy(Dst, Src + LoadBytes, sizeof(uint64_t));
2984 Dst += sizeof(uint64_t);
2985 }
2986
2987 memcpy(Dst + sizeof(uint64_t) - LoadBytes, Src, LoadBytes);
2988 }
2989}