APInt.cpp source code [llvm_projects/llvm/lib/Support/APInt.cpp]

1	//===-- APInt.cpp - Implement APInt class ---------------------------------===//
2	//
3	// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4	// See https://llvm.org/LICENSE.txt for license information.
5	// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6	//
7	//===----------------------------------------------------------------------===//
8	//
9	// This file implements a class to represent arbitrary precision integer
10	// constant values and provide a variety of arithmetic operations on them.
11	//
12	//===----------------------------------------------------------------------===//
13
14	#include "llvm/ADT/APInt.h"
15	#include "llvm/ADT/ArrayRef.h"
16	#include "llvm/ADT/FoldingSet.h"
17	#include "llvm/ADT/Hashing.h"
18	#include "llvm/ADT/Sequence.h"
19	#include "llvm/ADT/SmallString.h"
20	#include "llvm/ADT/StringRef.h"
21	#include "llvm/ADT/bit.h"
22	#include "llvm/Support/Alignment.h"
23	#include "llvm/Support/Debug.h"
24	#include "llvm/Support/ErrorHandling.h"
25	#include "llvm/Support/MathExtras.h"
26	#include "llvm/Support/SwapByteOrder.h"
27	#include "llvm/Support/raw_ostream.h"
28	#include <cmath>
29	#include <optional>
30
31	using namespace llvm;
32
33	#define DEBUG_TYPE "apint"
34
/// Allocates an array of \p numWords 64-bit words with `new[]` and returns it
/// value-initialized, i.e. with every word set to zero. The array must be
/// released with `delete[]`.
inline static uint64_t *getClearedMemory(unsigned numWords) {
  uint64_t *Words = new uint64_t[numWords]();
  return Words;
}
40
/// Allocates an array of \p numWords 64-bit words with `new[]`. The contents
/// are left uninitialized; callers are expected to overwrite every word. The
/// array must be released with `delete[]`.
inline static uint64_t *getMemory(unsigned numWords) {
  uint64_t *Words = new uint64_t[numWords];
  return Words;
}
46
/// Converts the character \p cdigit to its numeric value in base \p radix.
///
/// For radix 16 and 36 the letters 'A'.. / 'a'.. are accepted in addition to
/// the decimal digits; for every other radix only characters in the range
/// ['0', '0' + radix) are accepted.
///
/// \returns the digit value, or UINT_MAX if \p cdigit is not a valid digit.
inline static unsigned getDigit(char cdigit, uint8_t radix) {
  if (radix == 16 || radix == 36) {
    // The subtractions are done in unsigned arithmetic, so characters below
    // the base character wrap to huge values and fail the range checks.
    const unsigned Decimal = cdigit - '0';
    if (Decimal <= 9)
      return Decimal;

    // Index of the last letter that is a valid digit: 5 ('F') or 25 ('Z').
    const unsigned LastLetter = radix - 11U;

    const unsigned Upper = cdigit - 'A';
    if (Upper <= LastLetter)
      return Upper + 10;

    const unsigned Lower = cdigit - 'a';
    if (Lower <= LastLetter)
      return Lower + 10;

    // Neither a decimal digit nor an accepted letter.
    return UINT_MAX;
  }

  const unsigned Value = cdigit - '0';
  if (Value < radix)
    return Value;

  return UINT_MAX;
}
73
74
75	void APInt::initSlowCase(uint64_t val, bool isSigned) {
76	if (isSigned && int64_t(val) < `0`) {
77	U.pVal = getMemory(numWords: getNumWords());
78	U.pVal[`0`] = val;
79	memset(s: &U.pVal[`1`], c: `0xFF`, n: APINT_WORD_SIZE * (getNumWords() - `1`));
80	clearUnusedBits();
81	} else {
82	U.pVal = getClearedMemory(numWords: getNumWords());
83	U.pVal[`0`] = val;
84	}
85	}
86
87	void APInt::initSlowCase(const APInt& that) {
88	U.pVal = getMemory(numWords: getNumWords());
89	memcpy(dest: U.pVal, src: that.U.pVal, n: getNumWords() * APINT_WORD_SIZE);
90	}
91
92	void APInt::initFromArray(ArrayRef<uint64_t> bigVal) {
93	assert(bigVal.data() && "Null pointer detected!");
94	if (isSingleWord())
95	U.VAL = bigVal [`0`];
96	else {
97	// Get memory, cleared to 0
98	U.pVal = getClearedMemory(numWords: getNumWords());
99	// Calculate the number of words to copy
100	unsigned words = std::min<unsigned>(a: bigVal.size(), b: getNumWords());
101	// Copy the words from bigVal to pVal
102	memcpy(dest: U.pVal, src: bigVal.data(), n: words * APINT_WORD_SIZE);
103	}
104	// Make sure unused high bits are cleared
105	clearUnusedBits();
106	}
107
108	APInt::APInt(unsigned numBits, ArrayRef<uint64_t> bigVal) : BitWidth(numBits) {
109	initFromArray(bigVal);
110	}
111
112	APInt::APInt(unsigned numBits, unsigned numWords, const uint64_t bigVal[])
113	: BitWidth(numBits) {
114	initFromArray(bigVal: ArrayRef(bigVal, numWords));
115	}
116
117	APInt::APInt(unsigned numbits, StringRef Str, uint8_t radix)
118	: BitWidth(numbits) {
119	fromString(numBits: numbits, str: Str, radix);
120	}
121
122	void APInt::reallocate(unsigned NewBitWidth) {
123	// If the number of words is the same we can just change the width and stop.
124	if (getNumWords() == getNumWords(BitWidth: NewBitWidth)) {
125	BitWidth = NewBitWidth;
126	return;
127	}
128
129	// If we have an allocation, delete it.
130	if (!isSingleWord())
131	delete [] U.pVal;
132
133	// Update BitWidth.
134	BitWidth = NewBitWidth;
135
136	// If we are supposed to have an allocation, create it.
137	if (!isSingleWord())
138	U.pVal = getMemory(numWords: getNumWords());
139	}
140
141	void APInt::assignSlowCase(const APInt &RHS) {
142	// Don't do anything for X = X
143	if (this == &RHS)
144	return;
145
146	// Adjust the bit width and handle allocations as necessary.
147	reallocate(NewBitWidth: RHS.getBitWidth());
148
149	// Copy the data.
150	if (isSingleWord())
151	U.VAL = RHS.U.VAL;
152	else
153	memcpy(dest: U.pVal, src: RHS.U.pVal, n: getNumWords() * APINT_WORD_SIZE);
154	}
155
156	/// This method 'profiles' an APInt for use with FoldingSet.
157	void APInt::Profile(FoldingSetNodeID& ID) const {
158	ID.AddInteger(I: BitWidth);
159
160	if (isSingleWord()) {
161	ID.AddInteger(I: U.VAL);
162	return;
163	}
164
165	unsigned NumWords = getNumWords();
166	for (unsigned i = `0`; i < NumWords; ++i)
167	ID.AddInteger(I: U.pVal[i]);
168	}
169
170	bool APInt::isAligned(Align A) const {
171	if (isZero())
172	return true;
173	const unsigned TrailingZeroes = countr_zero();
174	const unsigned MinimumTrailingZeroes = Log2(A);
175	return TrailingZeroes >= MinimumTrailingZeroes;
176	}
177
178	/// Prefix increment operator. Increments the APInt by one.
179	APInt& APInt::operator++() {
180	if (isSingleWord())
181	++U.VAL;
182	else
183	tcIncrement(dst: U.pVal, parts: getNumWords());
184	return clearUnusedBits();
185	}
186
187	/// Prefix decrement operator. Decrements the APInt by one.
188	APInt& APInt::operator--() {
189	if (isSingleWord())
190	--U.VAL;
191	else
192	tcDecrement(dst: U.pVal, parts: getNumWords());
193	return clearUnusedBits();
194	}
195
196	/// Adds the RHS APInt to this APInt.
197	/// @returns this, after addition of RHS.
198	/// Addition assignment operator.
199	APInt& APInt::operator+=(const APInt& RHS) {
200	assert(BitWidth == RHS.BitWidth && "Bit widths must be the same");
201	if (isSingleWord())
202	U.VAL += RHS.U.VAL;
203	else
204	tcAdd(U.pVal, RHS.U.pVal, carry: `0`, getNumWords());
205	return clearUnusedBits();
206	}
207
208	APInt& APInt::operator+=(uint64_t RHS) {
209	if (isSingleWord())
210	U.VAL += RHS;
211	else
212	tcAddPart(U.pVal, RHS, getNumWords());
213	return clearUnusedBits();
214	}
215
216	/// Subtracts the RHS APInt from this APInt
217	/// @returns this, after subtraction
218	/// Subtraction assignment operator.
219	APInt& APInt::operator-=(const APInt& RHS) {
220	assert(BitWidth == RHS.BitWidth && "Bit widths must be the same");
221	if (isSingleWord())
222	U.VAL -= RHS.U.VAL;
223	else
224	tcSubtract(U.pVal, RHS.U.pVal, carry: `0`, getNumWords());
225	return clearUnusedBits();
226	}
227
228	APInt& APInt::operator-=(uint64_t RHS) {
229	if (isSingleWord())
230	U.VAL -= RHS;
231	else
232	tcSubtractPart(U.pVal, RHS, getNumWords());
233	return clearUnusedBits();
234	}
235
236	APInt APInt::operator(const* APInt& RHS) const {
237	assert(BitWidth == RHS.BitWidth && "Bit widths must be the same");
238	if (isSingleWord())
239	return APInt (BitWidth, U.VAL * RHS.U.VAL, /isSigned=/false,
240	/implicitTrunc=/true);
241
242	APInt Result(getMemory(numWords: getNumWords()), getBitWidth());
243	tcMultiply(Result.U.pVal, U.pVal, RHS.U.pVal, getNumWords());
244	Result.clearUnusedBits();
245	return Result;
246	}
247
248	void APInt::andAssignSlowCase(const APInt &RHS) {
249	WordType dst = U.pVal, rhs = RHS.U.pVal;
250	for (size_t i = `0`, e = getNumWords(); i != e; ++i)
251	dst[i] &= rhs[i];
252	}
253
254	void APInt::orAssignSlowCase(const APInt &RHS) {
255	WordType dst = U.pVal, rhs = RHS.U.pVal;
256	for (size_t i = `0`, e = getNumWords(); i != e; ++i)
257	dst[i] \|= rhs[i];
258	}
259
260	void APInt::xorAssignSlowCase(const APInt &RHS) {
261	WordType dst = U.pVal, rhs = RHS.U.pVal;
262	for (size_t i = `0`, e = getNumWords(); i != e; ++i)
263	dst[i] ^= rhs[i];
264	}
265
266	APInt &APInt::operator=(const* APInt &RHS) {
267	*this = *this * RHS;
268	return *this;
269	}
270
271	APInt& APInt::operator*=(uint64_t RHS) {
272	if (isSingleWord()) {
273	U.VAL *= RHS;
274	} else {
275	unsigned NumWords = getNumWords();
276	tcMultiplyPart(dst: U.pVal, src: U.pVal, multiplier: RHS, carry: `0`, srcParts: NumWords, dstParts: NumWords, add: false);
277	}
278	return clearUnusedBits();
279	}
280
281	bool APInt::equalSlowCase(const APInt &RHS) const {
282	return std::equal(first1: U.pVal, last1: U.pVal + getNumWords(), first2: RHS.U.pVal);
283	}
284
285	int APInt::compare(const APInt& RHS) const {
286	assert(BitWidth == RHS.BitWidth && "Bit widths must be same for comparison");
287	if (isSingleWord())
288	return U.VAL < RHS.U.VAL ? -`1` : U.VAL > RHS.U.VAL;
289
290	return tcCompare(U.pVal, RHS.U.pVal, getNumWords());
291	}
292
293	int APInt::compareSigned(const APInt& RHS) const {
294	assert(BitWidth == RHS.BitWidth && "Bit widths must be same for comparison");
295	if (isSingleWord()) {
296	int64_t lhsSext = SignExtend64(X: U.VAL, B: BitWidth);
297	int64_t rhsSext = SignExtend64(X: RHS.U.VAL, B: BitWidth);
298	return lhsSext < rhsSext ? -`1` : lhsSext > rhsSext;
299	}
300
301	bool lhsNeg = isNegative();
302	bool rhsNeg = RHS.isNegative();
303
304	// If the sign bits don't match, then (LHS < RHS) if LHS is negative
305	if (lhsNeg != rhsNeg)
306	return lhsNeg ? -`1` : `1`;
307
308	// Otherwise we can just use an unsigned comparison, because even negative
309	// numbers compare correctly this way if both have the same signed-ness.
310	return tcCompare(U.pVal, RHS.U.pVal, getNumWords());
311	}
312
313	void APInt::setBitsSlowCase(unsigned loBit, unsigned hiBit) {
314	unsigned loWord = whichWord(bitPosition: loBit);
315	unsigned hiWord = whichWord(bitPosition: hiBit);
316
317	// Create an initial mask for the low word with zeros below loBit.
318	uint64_t loMask = WORDTYPE_MAX << whichBit(bitPosition: loBit);
319
320	// If hiBit is not aligned, we need a high mask.
321	unsigned hiShiftAmt = whichBit(bitPosition: hiBit);
322	if (hiShiftAmt != `0`) {
323	// Create a high mask with zeros above hiBit.
324	uint64_t hiMask = WORDTYPE_MAX >> (APINT_BITS_PER_WORD - hiShiftAmt);
325	// If loWord and hiWord are equal, then we combine the masks. Otherwise,
326	// set the bits in hiWord.
327	if (hiWord == loWord)
328	loMask &= hiMask;
329	else
330	U.pVal[hiWord] \|= hiMask;
331	}
332	// Apply the mask to the low word.
333	U.pVal[loWord] \|= loMask;
334
335	// Fill any words between loWord and hiWord with all ones.
336	for (unsigned word = loWord + `1`; word < hiWord; ++word)
337	U.pVal[word] = WORDTYPE_MAX;
338	}
339
340	void APInt::clearBitsSlowCase(unsigned LoBit, unsigned HiBit) {
341	unsigned LoWord = whichWord(bitPosition: LoBit);
342	unsigned HiWord = whichWord(bitPosition: HiBit);
343
344	// Create an initial mask for the low word with ones below loBit.
345	uint64_t LoMask = ~(WORDTYPE_MAX << whichBit(bitPosition: LoBit));
346
347	// If HiBit is not aligned, we need a high mask.
348	unsigned HiShiftAmt = whichBit(bitPosition: HiBit);
349	if (HiShiftAmt != `0`) {
350	// Create a high mask with ones above HiBit.
351	uint64_t HiMask = ~(WORDTYPE_MAX >> (APINT_BITS_PER_WORD - HiShiftAmt));
352	// If LoWord and HiWord are equal, then we combine the masks. Otherwise,
353	// clear the bits in HiWord.
354	if (HiWord == LoWord)
355	LoMask \|= HiMask;
356	else
357	U.pVal[HiWord] &= HiMask;
358	}
359	// Apply the mask to the low word.
360	U.pVal[LoWord] &= LoMask;
361
362	// Fill any words between LoWord and HiWord with all zeros.
363	for (unsigned Word = LoWord + `1`; Word < HiWord; ++Word)
364	U.pVal[Word] = `0`;
365	}
366
367	// Complement a bignum in-place.
368	static void tcComplement(APInt::WordType dst, unsigned* parts) {
369	for (unsigned i = `0`; i < parts; i++)
370	dst[i] = ~dst[i];
371	}
372
373	/// Toggle every bit to its opposite value.
374	void APInt::flipAllBitsSlowCase() {
375	tcComplement(dst: U.pVal, parts: getNumWords());
376	clearUnusedBits();
377	}
378
379	/// Concatenate the bits from "NewLSB" onto the bottom of this. This is*
380	/// equivalent to:
381	/// (this->zext(NewWidth) << NewLSB.getBitWidth()) \| NewLSB.zext(NewWidth)
382	/// In the slow case, we know the result is large.
383	APInt APInt::concatSlowCase(const APInt &NewLSB) const {
384	unsigned NewWidth = getBitWidth() + NewLSB.getBitWidth();
385	APInt Result = NewLSB.zext(width: NewWidth);
386	Result.insertBits(SubBits: *this, bitPosition: NewLSB.getBitWidth());
387	return Result;
388	}
389
390	/// Toggle a given bit to its opposite value whose position is given
391	/// as "bitPosition".
392	/// Toggles a given bit to its opposite value.
393	void APInt::flipBit(unsigned bitPosition) {
394	assert(bitPosition < BitWidth && "Out of the bit-width range!");
395	setBitVal(BitPosition: bitPosition, BitValue: !(*this)[bitPosition]);
396	}
397
398	void APInt::insertBits(const APInt &subBits, unsigned bitPosition) {
399	unsigned subBitWidth = subBits.getBitWidth();
400	assert((subBitWidth + bitPosition) <= BitWidth && "Illegal bit insertion");
401
402	// inserting no bits is a noop.
403	if (subBitWidth == `0`)
404	return;
405
406	// Insertion is a direct copy.
407	if (subBitWidth == BitWidth) {
408	*this = subBits;
409	return;
410	}
411
412	// Single word result can be done as a direct bitmask.
413	if (isSingleWord()) {
414	uint64_t mask = WORDTYPE_MAX >> (APINT_BITS_PER_WORD - subBitWidth);
415	U.VAL &= ~(mask << bitPosition);
416	U.VAL \|= (subBits.U.VAL << bitPosition);
417	return;
418	}
419
420	unsigned loBit = whichBit(bitPosition);
421	unsigned loWord = whichWord(bitPosition);
422	unsigned hi1Word = whichWord(bitPosition: bitPosition + subBitWidth - `1`);
423
424	// Insertion within a single word can be done as a direct bitmask.
425	if (loWord == hi1Word) {
426	uint64_t mask = WORDTYPE_MAX >> (APINT_BITS_PER_WORD - subBitWidth);
427	U.pVal[loWord] &= ~(mask << loBit);
428	U.pVal[loWord] \|= (subBits.U.VAL << loBit);
429	return;
430	}
431
432	// Insert on word boundaries.
433	if (loBit == `0`) {
434	// Direct copy whole words.
435	unsigned numWholeSubWords = subBitWidth / APINT_BITS_PER_WORD;
436	memcpy(dest: U.pVal + loWord, src: subBits.getRawData(),
437	n: numWholeSubWords * APINT_WORD_SIZE);
438
439	// Mask+insert remaining bits.
440	unsigned remainingBits = subBitWidth % APINT_BITS_PER_WORD;
441	if (remainingBits != `0`) {
442	uint64_t mask = WORDTYPE_MAX >> (APINT_BITS_PER_WORD - remainingBits);
443	U.pVal[hi1Word] &= ~mask;
444	U.pVal[hi1Word] \|= subBits.getWord(bitPosition: subBitWidth - `1`);
445	}
446	return;
447	}
448
449	// General case - set/clear individual bits in dst based on src.
450	// TODO - there is scope for optimization here, but at the moment this code
451	// path is barely used so prefer readability over performance.
452	for (unsigned i = `0`; i != subBitWidth; ++i)
453	setBitVal(BitPosition: bitPosition + i, BitValue: subBits [i]);
454	}
455
456	void APInt::insertBits(uint64_t subBits, unsigned bitPosition, unsigned numBits) {
457	uint64_t maskBits = maskTrailingOnes<uint64_t>(N: numBits);
458	subBits &= maskBits;
459	if (isSingleWord()) {
460	U.VAL &= ~(maskBits << bitPosition);
461	U.VAL \|= subBits << bitPosition;
462	return;
463	}
464
465	unsigned loBit = whichBit(bitPosition);
466	unsigned loWord = whichWord(bitPosition);
467	unsigned hiWord = whichWord(bitPosition: bitPosition + numBits - `1`);
468	if (loWord == hiWord) {
469	U.pVal[loWord] &= ~(maskBits << loBit);
470	U.pVal[loWord] \|= subBits << loBit;
471	return;
472	}
473
474	static_assert(`8` * sizeof(WordType) <= `64`, "This code assumes only two words affected");
475	unsigned wordBits = `8` * sizeof(WordType);
476	U.pVal[loWord] &= ~(maskBits << loBit);
477	U.pVal[loWord] \|= subBits << loBit;
478
479	U.pVal[hiWord] &= ~(maskBits >> (wordBits - loBit));
480	U.pVal[hiWord] \|= subBits >> (wordBits - loBit);
481	}
482
483	APInt APInt::extractBits(unsigned numBits, unsigned bitPosition) const {
484	assert(bitPosition < BitWidth && (numBits + bitPosition) <= BitWidth &&
485	"Illegal bit extraction");
486
487	if (isSingleWord())
488	return APInt (numBits, U.VAL >> bitPosition, /isSigned=/false,
489	/implicitTrunc=/true);
490
491	unsigned loBit = whichBit(bitPosition);
492	unsigned loWord = whichWord(bitPosition);
493	unsigned hiWord = whichWord(bitPosition: bitPosition + numBits - `1`);
494
495	// Single word result extracting bits from a single word source.
496	if (loWord == hiWord)
497	return APInt (numBits, U.pVal[loWord] >> loBit, /isSigned=/false,
498	/implicitTrunc=/true);
499
500	// Extracting bits that start on a source word boundary can be done
501	// as a fast memory copy.
502	if (loBit == `0`)
503	return APInt (numBits, ArrayRef(U.pVal + loWord, `1` + hiWord - loWord));
504
505	// General case - shift + copy source words directly into place.
506	APInt Result(numBits, `0`);
507	unsigned NumSrcWords = getNumWords();
508	unsigned NumDstWords = Result.getNumWords();
509
510	uint64_t *DestPtr = Result.isSingleWord() ? &Result.U.VAL : Result.U.pVal;
511	for (unsigned word = `0`; word < NumDstWords; ++word) {
512	uint64_t w0 = U.pVal[loWord + word];
513	uint64_t w1 =
514	(loWord + word + `1`) < NumSrcWords ? U.pVal[loWord + word + `1`] : `0`;
515	DestPtr[word] = (w0 >> loBit) \| (w1 << (APINT_BITS_PER_WORD - loBit));
516	}
517
518	return Result.clearUnusedBits();
519	}
520
521	uint64_t APInt::extractBitsAsZExtValue(unsigned numBits,
522	unsigned bitPosition) const {
523	assert(bitPosition < BitWidth && (numBits + bitPosition) <= BitWidth &&
524	"Illegal bit extraction");
525	assert(numBits <= `64` && "Illegal bit extraction");
526
527	uint64_t maskBits = maskTrailingOnes<uint64_t>(N: numBits);
528	if (isSingleWord())
529	return (U.VAL >> bitPosition) & maskBits;
530
531	static_assert(APINT_BITS_PER_WORD >= `64`,
532	"This code assumes only two words affected");
533	unsigned loBit = whichBit(bitPosition);
534	unsigned loWord = whichWord(bitPosition);
535	unsigned hiWord = whichWord(bitPosition: bitPosition + numBits - `1`);
536	if (loWord == hiWord)
537	return (U.pVal[loWord] >> loBit) & maskBits;
538
539	uint64_t retBits = U.pVal[loWord] >> loBit;
540	retBits \|= U.pVal[hiWord] << (APINT_BITS_PER_WORD - loBit);
541	retBits &= maskBits;
542	return retBits;
543	}
544
545	unsigned APInt::getSufficientBitsNeeded(StringRef Str, uint8_t Radix) {
546	assert(!Str.empty() && "Invalid string length");
547	size_t StrLen = Str.size();
548
549	// Each computation below needs to know if it's negative.
550	unsigned IsNegative = false;
551	if (Str [`0`] == `'-'` \|\| Str [`0`] == `'+'`) {
552	IsNegative = Str [`0`] == `'-'`;
553	StrLen--;
554	assert(StrLen && "String is only a sign, needs a value.");
555	}
556
557	// For radixes of power-of-two values, the bits required is accurately and
558	// easily computed.
559	if (Radix == `2`)
560	return StrLen + IsNegative;
561	if (Radix == `8`)
562	return StrLen * `3` + IsNegative;
563	if (Radix == `16`)
564	return StrLen * `4` + IsNegative;
565
566	// Compute a sufficient number of bits that is always large enough but might
567	// be too large. This avoids the assertion in the constructor. This
568	// calculation doesn't work appropriately for the numbers 0-9, so just use 4
569	// bits in that case.
570	if (Radix == `10`)
571	return (StrLen == `1` ? `4` : StrLen * `64` / `18`) + IsNegative;
572
573	assert(Radix == `36`);
574	return (StrLen == `1` ? `7` : StrLen * `16` / `3`) + IsNegative;
575	}
576
577	unsigned APInt::getBitsNeeded(StringRef str, uint8_t radix) {
578	// Compute a sufficient number of bits that is always large enough but might
579	// be too large.
580	unsigned sufficient = getSufficientBitsNeeded(Str: str, Radix: radix);
581
582	// For bases 2, 8, and 16, the sufficient number of bits is exact and we can
583	// return the value directly. For bases 10 and 36, we need to do extra work.
584	if (radix == `2` \|\| radix == `8` \|\| radix == `16`)
585	return sufficient;
586
587	// This is grossly inefficient but accurate. We could probably do something
588	// with a computation of roughly slen64/20 and then adjust by the value of*
589	// the first few digits. But, I'm not sure how accurate that could be.
590	size_t slen = str.size();
591
592	// Each computation below needs to know if it's negative.
593	StringRef::iterator p = str.begin();
594	unsigned isNegative = *p == `'-'`;
595	if (p == `'-'` \|\| p == `'+'`) {
596	p++;
597	slen--;
598	assert(slen && "String is only a sign, needs a value.");
599	}
600
601
602	// Convert to the actual binary value.
603	APInt tmp(sufficient, StringRef (p, slen), radix);
604
605	// Compute how many bits are required. If the log is infinite, assume we need
606	// just bit. If the log is exact and value is negative, then the value is
607	// MinSignedValue with (log + 1) bits.
608	unsigned log = tmp.logBase2();
609	if (log == (unsigned)-`1`) {
610	return isNegative + `1`;
611	} else if (isNegative && tmp.isPowerOf2()) {
612	return isNegative + log;
613	} else {
614	return isNegative + log + `1`;
615	}
616	}
617
618	hash_code llvm::hash_value(const APInt &Arg) {
619	if (Arg.isSingleWord())
620	return hash_combine(args: Arg.BitWidth, args: Arg.U.VAL);
621
622	return hash_combine(
623	args: Arg.BitWidth,
624	args: hash_combine_range(first: Arg.U.pVal, last: Arg.U.pVal + Arg.getNumWords()));
625	}
626
627	unsigned DenseMapInfo<APInt, void>::getHashValue(const APInt &Key) {
628	return static_cast<unsigned>(hash_value(Arg: Key));
629	}
630
631	bool APInt::isSplat(unsigned SplatSizeInBits) const {
632	assert(getBitWidth() % SplatSizeInBits == `0` &&
633	"SplatSizeInBits must divide width!");
634	// We can check that all parts of an integer are equal by making use of a
635	// little trick: rotate and check if it's still the same value.
636	return *this == rotl(rotateAmt: SplatSizeInBits);
637	}
638
639	/// This function returns the high "numBits" bits of this APInt.
640	APInt APInt::getHiBits(unsigned numBits) const {
641	return this->lshr(shiftAmt: BitWidth - numBits);
642	}
643
644	/// This function returns the low "numBits" bits of this APInt.
645	APInt APInt::getLoBits(unsigned numBits) const {
646	APInt Result(getLowBitsSet(numBits: BitWidth, loBitsSet: numBits));
647	Result &= *this;
648	return Result;
649	}
650
651	/// Return a value containing V broadcasted over NewLen bits.
652	APInt APInt::getSplat(unsigned NewLen, const APInt &V) {
653	assert(NewLen >= V.getBitWidth() && "Can't splat to smaller bit width!");
654
655	APInt Val = V.zext(width: NewLen);
656	for (unsigned I = V.getBitWidth(); I < NewLen; I <<= `1`)
657	Val \|= Val << I;
658
659	return Val;
660	}
661
662	unsigned APInt::countLeadingZerosSlowCase() const {
663	unsigned Count = `0`;
664	for (int i = getNumWords() - `1`; i >= `0`; --i) {
665	uint64_t V = U.pVal[i];
666	if (V == `0`)
667	Count += APINT_BITS_PER_WORD;
668	else {
669	Count += llvm::countl_zero(Val: V);
670	break;
671	}
672	}
673	// Adjust for unused bits in the most significant word (they are zero).
674	unsigned Mod = BitWidth % APINT_BITS_PER_WORD;
675	Count -= Mod > `0` ? APINT_BITS_PER_WORD - Mod : `0`;
676	return Count;
677	}
678
679	unsigned APInt::countLeadingOnesSlowCase() const {
680	unsigned highWordBits = BitWidth % APINT_BITS_PER_WORD;
681	unsigned shift;
682	if (!highWordBits) {
683	highWordBits = APINT_BITS_PER_WORD;
684	shift = `0`;
685	} else {
686	shift = APINT_BITS_PER_WORD - highWordBits;
687	}
688	int i = getNumWords() - `1`;
689	unsigned Count = llvm::countl_one(Value: U.pVal[i] << shift);
690	if (Count == highWordBits) {
691	for (i--; i >= `0`; --i) {
692	if (U.pVal[i] == WORDTYPE_MAX)
693	Count += APINT_BITS_PER_WORD;
694	else {
695	Count += llvm::countl_one(Value: U.pVal[i]);
696	break;
697	}
698	}
699	}
700	return Count;
701	}
702
703	unsigned APInt::countTrailingZerosSlowCase() const {
704	unsigned Count = `0`;
705	unsigned i = `0`;
706	for (; i < getNumWords() && U.pVal[i] == `0`; ++i)
707	Count += APINT_BITS_PER_WORD;
708	if (i < getNumWords())
709	Count += llvm::countr_zero(Val: U.pVal[i]);
710	return std::min(a: Count, b: BitWidth);
711	}
712
713	unsigned APInt::countTrailingOnesSlowCase() const {
714	unsigned Count = `0`;
715	unsigned i = `0`;
716	for (; i < getNumWords() && U.pVal[i] == WORDTYPE_MAX; ++i)
717	Count += APINT_BITS_PER_WORD;
718	if (i < getNumWords())
719	Count += llvm::countr_one(Value: U.pVal[i]);
720	assert(Count <= BitWidth);
721	return Count;
722	}
723
724	unsigned APInt::countPopulationSlowCase() const {
725	unsigned Count = `0`;
726	for (unsigned i = `0`; i < getNumWords(); ++i)
727	Count += llvm::popcount(Value: U.pVal[i]);
728	return Count;
729	}
730
731	bool APInt::isPowerOf2SlowCase() const {
732	unsigned Count = `0`;
733	for (unsigned i = `0`; i < getNumWords(); ++i) {
734	Count += llvm::popcount(Value: U.pVal[i]);
735	if (Count > `1`)
736	return false;
737	}
738	return Count == `1`;
739	}
740
741	bool APInt::intersectsSlowCase(const APInt &RHS) const {
742	for (unsigned i = `0`, e = getNumWords(); i != e; ++i)
743	if ((U.pVal[i] & RHS.U.pVal[i]) != `0`)
744	return true;
745
746	return false;
747	}
748
749	bool APInt::isSubsetOfSlowCase(const APInt &RHS) const {
750	for (unsigned i = `0`, e = getNumWords(); i != e; ++i)
751	if ((U.pVal[i] & ~RHS.U.pVal[i]) != `0`)
752	return false;
753
754	return true;
755	}
756
757	bool APInt::isInverseOfSlowCase(const APInt &RHS) const {
758	const unsigned Last = getNumWords() - `1`;
759	for (unsigned I = `0`; I != Last; ++I)
760	if ((U.pVal[I] ^ RHS.U.pVal[I]) != WORDTYPE_MAX)
761	return false;
762
763	unsigned TailBits = BitWidth - Last * APINT_BITS_PER_WORD;
764	WordType TailMask = llvm::maskTrailingOnes<WordType>(N: TailBits);
765	return (U.pVal[Last] ^ RHS.U.pVal[Last]) == TailMask;
766	}
767
768	APInt APInt::byteSwap() const {
769	assert(BitWidth >= `16` && BitWidth % `8` == `0` && "Cannot byteswap!");
770	if (BitWidth == `16`)
771	return APInt (BitWidth, llvm::byteswap<uint16_t>(V: U.VAL));
772	if (BitWidth == `32`)
773	return APInt (BitWidth, llvm::byteswap<uint32_t>(V: U.VAL));
774	if (BitWidth <= `64`) {
775	uint64_t Tmp1 = llvm::byteswap<uint64_t>(V: U.VAL);
776	Tmp1 >>= (`64` - BitWidth);
777	return APInt (BitWidth, Tmp1);
778	}
779
780	APInt Result(getNumWords() * APINT_BITS_PER_WORD, `0`);
781	for (unsigned I = `0`, N = getNumWords(); I != N; ++I)
782	Result.U.pVal[I] = llvm::byteswap<uint64_t>(V: U.pVal[N - I - `1`]);
783	if (Result.BitWidth != BitWidth) {
784	Result.lshrInPlace(ShiftAmt: Result.BitWidth - BitWidth);
785	Result.BitWidth = BitWidth;
786	}
787	return Result;
788	}
789
790	APInt APInt::reverseBits() const {
791	if (isSingleWord()) {
792	switch (BitWidth) {
793	case `64`:
794	return APInt (BitWidth, llvm::reverseBits<uint64_t>(Val: U.VAL));
795	case `32`:
796	return APInt (BitWidth, llvm::reverseBits<uint32_t>(Val: U.VAL));
797	case `16`:
798	return APInt (BitWidth, llvm::reverseBits<uint16_t>(Val: U.VAL));
799	case `8`:
800	return APInt (BitWidth, llvm::reverseBits<uint8_t>(Val: U.VAL));
801	case `1`: // fallthrough
802	case `0`:
803	return *this;
804	default:
805	return APInt (BitWidth,
806	llvm::reverseBits<uint64_t>(Val: U.VAL) >> (`64` - BitWidth));
807	}
808	}
809
810	APInt Result(BitWidth, `0`);
811	unsigned NumWords = getNumWords();
812	unsigned ExcessBits = NumWords * APINT_BITS_PER_WORD - BitWidth;
813	if (ExcessBits == `0`) {
814	// Fast path. No cross-word shift needed.
815	for (unsigned I = `0`; I < NumWords; ++I)
816	Result.U.pVal[I] = llvm::reverseBits<uint64_t>(Val: U.pVal[NumWords - `1` - I]);
817	return Result;
818	}
819	// Holds reversed bits of the previous (more significant) word.
820	uint64_t PrevRev = llvm::reverseBits<uint64_t>(Val: U.pVal[NumWords - `1`]);
821	for (unsigned I = `0`; I < NumWords - `1`; ++I) {
822	uint64_t CurrRev = llvm::reverseBits<uint64_t>(Val: U.pVal[NumWords - `2` - I]);
823	Result.U.pVal[I] = (PrevRev >> ExcessBits) \| (CurrRev << (`64` - ExcessBits));
824	PrevRev = CurrRev;
825	}
826	Result.U.pVal[NumWords - `1`] = PrevRev >> ExcessBits;
827	return Result;
828	}
829
830	APInt llvm::APIntOps::GreatestCommonDivisor(APInt A, APInt B) {
831	// Fast-path a common case.
832	if (A == B) return A;
833
834	// Corner cases: if either operand is zero, the other is the gcd.
835	if (!A) return B;
836	if (!B) return A;
837
838	// Count common powers of 2 and remove all other powers of 2.
839	unsigned Pow2;
840	{
841	unsigned Pow2_A = A.countr_zero();
842	unsigned Pow2_B = B.countr_zero();
843	if (Pow2_A > Pow2_B) {
844	A.lshrInPlace(ShiftAmt: Pow2_A - Pow2_B);
845	Pow2 = Pow2_B;
846	} else if (Pow2_B > Pow2_A) {
847	B.lshrInPlace(ShiftAmt: Pow2_B - Pow2_A);
848	Pow2 = Pow2_A;
849	} else {
850	Pow2 = Pow2_A;
851	}
852	}
853
854	// Both operands are odd multiples of 2^Pow_2:
855	//
856	// gcd(a, b) = gcd(\|a - b\| / 2^i, min(a, b))
857	//
858	// This is a modified version of Stein's algorithm, taking advantage of
859	// efficient countTrailingZeros().
860	while (A != B) {
861	if (A.ugt(RHS: B)) {
862	A -= B;
863	A.lshrInPlace(ShiftAmt: A.countr_zero() - Pow2);
864	} else {
865	B -= A;
866	B.lshrInPlace(ShiftAmt: B.countr_zero() - Pow2);
867	}
868	}
869
870	return A;
871	}
872
873	APInt llvm::APIntOps::RoundDoubleToAPInt(double Double, unsigned width) {
874	uint64_t I = bit_cast<uint64_t>(from: Double);
875
876	// Get the sign bit from the highest order bit
877	bool isNeg = I >> `63`;
878
879	// Get the 11-bit exponent and adjust for the 1023 bit bias
880	int64_t exp = ((I >> `52`) & `0x7ff`) - `1023`;
881
882	// If the exponent is negative, the value is < 0 so just return 0.
883	if (exp < `0`)
884	return APInt (width, `0u`);
885
886	// Extract the mantissa by clearing the top 12 bits (sign + exponent).
887	uint64_t mantissa = (I & (~`0ULL` >> `12`)) \| `1ULL` << `52`;
888
889	// If the exponent doesn't shift all bits out of the mantissa
890	if (exp < `52`)
891	return isNeg ? -APInt (width, mantissa >> (`52` - exp)) :
892	APInt (width, mantissa >> (`52` - exp));
893
894	// If the client didn't provide enough bits for us to shift the mantissa into
895	// then the result is undefined, just return 0
896	if (width <= exp - `52`)
897	return APInt (width, `0`);
898
899	// Otherwise, we have to shift the mantissa bits up to the right location
900	APInt Tmp(width, mantissa);
901	Tmp <<= (unsigned)exp - `52`;
902	return isNeg ? -Tmp : Tmp;
903	}
904
905	/// This function converts this APInt to a double.
906	/// The layout for double is as following (IEEE Standard 754):
907	/// --------------------------------------
908	/// \| Sign Exponent Fraction Bias \|
909	/// \|-------------------------------------- \|
910	/// \| 1[63] 11[62-52] 52[51-00] 1023 \|
911	/// --------------------------------------
912	double APInt::roundToDouble(bool isSigned) const {
913	// Handle the simple case where the value is contained in one uint64_t.
914	// It is wrong to optimize getWord(0) to VAL; there might be more than one word.
915	if (isSingleWord() \|\| getActiveBits() <= APINT_BITS_PER_WORD) {
916	if (isSigned) {
917	int64_t sext = SignExtend64(X: getWord(bitPosition: `0`), B: BitWidth);
918	return double(sext);
919	}
920	return double(getWord(bitPosition: `0`));
921	}
922
923	// Determine if the value is negative.
924	bool isNeg = isSigned ? (*this)[BitWidth-`1`] : false;
925
926	// Construct the absolute value if we're negative.
927	APInt Tmp(isNeg ? -(*this) : (*this));
928
929	// Figure out how many bits we're using.
930	unsigned n = Tmp.getActiveBits();
931
932	// The exponent (without bias normalization) is just the number of bits
933	// we are using. Note that the sign bit is gone since we constructed the
934	// absolute value.
935	uint64_t exp = n;
936
937	// Return infinity for exponent overflow
938	if (exp > `1023`) {
939	if (!isSigned \|\| !isNeg)
940	return std::numeric_limits<double>::infinity();
941	else
942	return -std::numeric_limits<double>::infinity();
943	}
944	exp += `1023`; // Increment for 1023 bias
945
946	// Number of bits in mantissa is 52. To obtain the mantissa value, we must
947	// extract the high 52 bits from the correct words in pVal.
948	uint64_t mantissa;
949	unsigned hiWord = whichWord(bitPosition: n-`1`);
950	if (hiWord == `0`) {
951	mantissa = Tmp.U.pVal[`0`];
952	if (n > `52`)
953	mantissa >>= n - `52`; // shift down, we want the top 52 bits.
954	} else {
955	assert(hiWord > `0` && "huh?");
956	uint64_t hibits = Tmp.U.pVal[hiWord] << (`52` - n % APINT_BITS_PER_WORD);
957	uint64_t lobits = Tmp.U.pVal[hiWord-`1`] >> (`11` + n % APINT_BITS_PER_WORD);
958	mantissa = hibits \| lobits;
959	}
960
961	// The leading bit of mantissa is implicit, so get rid of it.
962	uint64_t sign = isNeg ? (`1ULL` << (APINT_BITS_PER_WORD - `1`)) : `0`;
963	uint64_t I = sign \| (exp << `52`) \| mantissa;
964	return bit_cast<double>(from: I);
965	}
966
967	// Truncate to new width.
968	APInt APInt::trunc(unsigned width) const {
969	assert(width <= BitWidth && "Invalid APInt Truncate request");
970
971	if (width <= APINT_BITS_PER_WORD)
972	return APInt (width, getRawData()[`0`], /isSigned=/false,
973	/implicitTrunc=/true);
974
975	if (width == BitWidth)
976	return *this;
977
978	APInt Result(getMemory(numWords: getNumWords(BitWidth: width)), width);
979
980	// Copy full words.
981	unsigned i;
982	for (i = `0`; i != width / APINT_BITS_PER_WORD; i++)
983	Result.U.pVal[i] = U.pVal[i];
984
985	// Truncate and copy any partial word.
986	unsigned bits = (`0` - width) % APINT_BITS_PER_WORD;
987	if (bits != `0`)
988	Result.U.pVal[i] = U.pVal[i] << bits >> bits;
989
990	return Result;
991	}
992
993	// Truncate to new width with unsigned saturation.
994	APInt APInt::truncUSat(unsigned width) const {
995	assert(width <= BitWidth && "Invalid APInt Truncate request");
996
997	// Can we just losslessly truncate it?
998	if (isIntN(N: width))
999	return trunc(width);
1000	// If not, then just return the new limit.
1001	return APInt::getMaxValue(numBits: width);
1002	}
1003
1004	// Truncate to new width with signed saturation to signed result.
1005	APInt APInt::truncSSat(unsigned width) const {
1006	assert(width <= BitWidth && "Invalid APInt Truncate request");
1007
1008	// Can we just losslessly truncate it?
1009	if (isSignedIntN(N: width))
1010	return trunc(width);
1011	// If not, then just return the new limits.
1012	return isNegative() ? APInt::getSignedMinValue(numBits: width)
1013	: APInt::getSignedMaxValue(numBits: width);
1014	}
1015
1016	// Truncate to new width with signed saturation to unsigned result.
1017	APInt APInt::truncSSatU(unsigned width) const {
1018	assert(width <= BitWidth && "Invalid APInt Truncate request");
1019
1020	// Can we just losslessly truncate it?
1021	if (isIntN(N: width))
1022	return trunc(width);
1023	// If not, then just return the new limits.
1024	return isNegative() ? APInt::getZero(numBits: width) : APInt::getMaxValue(numBits: width);
1025	}
1026
1027	// Sign extend to a new width.
1028	APInt APInt::sext(unsigned Width) const {
1029	assert(Width >= BitWidth && "Invalid APInt SignExtend request");
1030
1031	if (Width <= APINT_BITS_PER_WORD)
1032	return APInt (Width, SignExtend64(X: U.VAL, B: BitWidth), /isSigned=/true);
1033
1034	if (Width == BitWidth)
1035	return *this;
1036
1037	APInt Result(getMemory(numWords: getNumWords(BitWidth: Width)), Width);
1038
1039	// Copy words.
1040	std::memcpy(dest: Result.U.pVal, src: getRawData(), n: getNumWords() * APINT_WORD_SIZE);
1041
1042	// Sign extend the last word since there may be unused bits in the input.
1043	Result.U.pVal[getNumWords() - `1`] =
1044	SignExtend64(X: Result.U.pVal[getNumWords() - `1`],
1045	B: ((BitWidth - `1`) % APINT_BITS_PER_WORD) + `1`);
1046
1047	// Fill with sign bits.
1048	std::memset(s: Result.U.pVal + getNumWords(), c: isNegative() ? -`1` : `0`,
1049	n: (Result.getNumWords() - getNumWords()) * APINT_WORD_SIZE);
1050	Result.clearUnusedBits();
1051	return Result;
1052	}
1053
1054	// Zero extend to a new width.
1055	APInt APInt::zext(unsigned width) const {
1056	assert(width >= BitWidth && "Invalid APInt ZeroExtend request");
1057
1058	if (width <= APINT_BITS_PER_WORD)
1059	return APInt (width, U.VAL);
1060
1061	if (width == BitWidth)
1062	return *this;
1063
1064	APInt Result(getMemory(numWords: getNumWords(BitWidth: width)), width);
1065
1066	// Copy words.
1067	std::memcpy(dest: Result.U.pVal, src: getRawData(), n: getNumWords() * APINT_WORD_SIZE);
1068
1069	// Zero remaining words.
1070	std::memset(s: Result.U.pVal + getNumWords(), c: `0`,
1071	n: (Result.getNumWords() - getNumWords()) * APINT_WORD_SIZE);
1072
1073	return Result;
1074	}
1075
1076	APInt APInt::zextOrTrunc(unsigned width) const {
1077	if (BitWidth < width)
1078	return zext(width);
1079	if (BitWidth > width)
1080	return trunc(width);
1081	return *this;
1082	}
1083
1084	APInt APInt::sextOrTrunc(unsigned width) const {
1085	if (BitWidth < width)
1086	return sext(Width: width);
1087	if (BitWidth > width)
1088	return trunc(width);
1089	return *this;
1090	}
1091
1092	/// Arithmetic right-shift this APInt by shiftAmt.
1093	/// Arithmetic right-shift function.
1094	void APInt::ashrInPlace(const APInt &shiftAmt) {
1095	ashrInPlace(ShiftAmt: (unsigned)shiftAmt.getLimitedValue(Limit: BitWidth));
1096	}
1097
1098	/// Arithmetic right-shift this APInt by shiftAmt.
1099	/// Arithmetic right-shift function.
1100	void APInt::ashrSlowCase(unsigned ShiftAmt) {
1101	// Don't bother performing a no-op shift.
1102	if (!ShiftAmt)
1103	return;
1104
1105	// Save the original sign bit for later.
1106	bool Negative = isNegative();
1107
1108	// WordShift is the inter-part shift; BitShift is intra-part shift.
1109	unsigned WordShift = ShiftAmt / APINT_BITS_PER_WORD;
1110	unsigned BitShift = ShiftAmt % APINT_BITS_PER_WORD;
1111
1112	unsigned WordsToMove = getNumWords() - WordShift;
1113	if (WordsToMove != `0`) {
1114	// Sign extend the last word to fill in the unused bits.
1115	U.pVal[getNumWords() - `1`] = SignExtend64(
1116	X: U.pVal[getNumWords() - `1`], B: ((BitWidth - `1`) % APINT_BITS_PER_WORD) + `1`);
1117
1118	// Fastpath for moving by whole words.
1119	if (BitShift == `0`) {
1120	std::memmove(dest: U.pVal, src: U.pVal + WordShift, n: WordsToMove * APINT_WORD_SIZE);
1121	} else {
1122	// Move the words containing significant bits.
1123	for (unsigned i = `0`; i != WordsToMove - `1`; ++i)
1124	U.pVal[i] = (U.pVal[i + WordShift] >> BitShift) \|
1125	(U.pVal[i + WordShift + `1`] << (APINT_BITS_PER_WORD - BitShift));
1126
1127	// Handle the last word which has no high bits to copy. Use an arithmetic
1128	// shift to preserve the sign bit.
1129	U.pVal[WordsToMove - `1`] =
1130	(int64_t)U.pVal[WordShift + WordsToMove - `1`] >> BitShift;
1131	}
1132	}
1133
1134	// Fill in the remainder based on the original sign.
1135	std::memset(s: U.pVal + WordsToMove, c: Negative ? -`1` : `0`,
1136	n: WordShift * APINT_WORD_SIZE);
1137	clearUnusedBits();
1138	}
1139
1140	/// Logical right-shift this APInt by shiftAmt.
1141	/// Logical right-shift function.
1142	void APInt::lshrInPlace(const APInt &shiftAmt) {
1143	lshrInPlace(ShiftAmt: (unsigned)shiftAmt.getLimitedValue(Limit: BitWidth));
1144	}
1145
1146	/// Logical right-shift this APInt by shiftAmt.
1147	/// Logical right-shift function.
1148	void APInt::lshrSlowCase(unsigned ShiftAmt) {
1149	tcShiftRight(U.pVal, Words: getNumWords(), Count: ShiftAmt);
1150	}
1151
1152	/// Left-shift this APInt by shiftAmt.
1153	/// Left-shift function.
1154	APInt &APInt::operator<<=(const APInt &shiftAmt) {
1155	// It's undefined behavior in C to shift by BitWidth or greater.
1156	*this <<= (unsigned)shiftAmt.getLimitedValue(Limit: BitWidth);
1157	return *this;
1158	}
1159
1160	void APInt::shlSlowCase(unsigned ShiftAmt) {
1161	tcShiftLeft(U.pVal, Words: getNumWords(), Count: ShiftAmt);
1162	clearUnusedBits();
1163	}
1164
1165	// Calculate the rotate amount modulo the bit width.
1166	static unsigned rotateModulo(unsigned BitWidth, const APInt &rotateAmt) {
1167	if (LLVM_UNLIKELY(BitWidth == `0`))
1168	return `0`;
1169	unsigned rotBitWidth = rotateAmt.getBitWidth();
1170	APInt rot = rotateAmt;
1171	if (rotBitWidth < BitWidth) {
1172	// Extend the rotate APInt, so that the urem doesn't divide by 0.
1173	// e.g. APInt(1, 32) would give APInt(1, 0).
1174	rot = rotateAmt.zext(width: BitWidth);
1175	}
1176	rot = rot.urem(RHS: APInt (rot.getBitWidth(), BitWidth));
1177	return rot.getLimitedValue(Limit: BitWidth);
1178	}
1179
1180	APInt APInt::rotl(const APInt &rotateAmt) const {
1181	return rotl(rotateAmt: rotateModulo(BitWidth, rotateAmt));
1182	}
1183
1184	APInt APInt::rotl(unsigned rotateAmt) const {
1185	if (LLVM_UNLIKELY(BitWidth == `0`))
1186	return *this;
1187	rotateAmt %= BitWidth;
1188	if (rotateAmt == `0`)
1189	return *this;
1190	return shl(shiftAmt: rotateAmt) \| lshr(shiftAmt: BitWidth - rotateAmt);
1191	}
1192
1193	APInt APInt::rotr(const APInt &rotateAmt) const {
1194	return rotr(rotateAmt: rotateModulo(BitWidth, rotateAmt));
1195	}
1196
1197	APInt APInt::rotr(unsigned rotateAmt) const {
1198	if (BitWidth == `0`)
1199	return *this;
1200	rotateAmt %= BitWidth;
1201	if (rotateAmt == `0`)
1202	return *this;
1203	return lshr(shiftAmt: rotateAmt) \| shl(shiftAmt: BitWidth - rotateAmt);
1204	}
1205
1206	/// \returns the nearest log base 2 of this APInt. Ties round up.
1207	///
1208	/// NOTE: When we have a BitWidth of 1, we define:
1209	///
1210	/// log2(0) = UINT32_MAX
1211	/// log2(1) = 0
1212	///
1213	/// to get around any mathematical concerns resulting from
1214	/// referencing 2 in a space where 2 does no exist.
1215	unsigned APInt::nearestLogBase2() const {
1216	// Special case when we have a bitwidth of 1. If VAL is 1, then we
1217	// get 0. If VAL is 0, we get WORDTYPE_MAX which gets truncated to
1218	// UINT32_MAX.
1219	if (BitWidth == `1`)
1220	return U.VAL - `1`;
1221
1222	// Handle the zero case.
1223	if (isZero())
1224	return UINT32_MAX;
1225
1226	// The non-zero case is handled by computing:
1227	//
1228	// nearestLogBase2(x) = logBase2(x) + x[logBase2(x)-1].
1229	//
1230	// where x[i] is referring to the value of the ith bit of x.
1231	unsigned lg = logBase2();
1232	return lg + unsigned((*this)[lg - `1`]);
1233	}
1234
1235	// Square Root - this method computes and returns the square root of "this".
1236	// Three mechanisms are used for computation. For small values (<= 5 bits),
1237	// a table lookup is done. This gets some performance for common cases. For
1238	// values using less than 52 bits, the value is converted to double and then
1239	// the libc sqrt function is called. The result is rounded and then converted
1240	// back to a uint64_t which is then used to construct the result. Finally,
1241	// the Babylonian method for computing square roots is used.
1242	APInt APInt::sqrtFloor() const {
1243
1244	// Determine the magnitude of the value.
1245	unsigned magnitude = getActiveBits();
1246
1247	// Use a fast table for some small values. This also gets rid of some
1248	// rounding errors in libc sqrt for small values.
1249	if (magnitude <= `5`) {
1250	static const uint8_t results[`32`] = {
1251	/ 0 / `0`,
1252	/ 1- 3 / `1`, `1`, `1`,
1253	/ 4- 8 / `2`, `2`, `2`, `2`, `2`,
1254	/ 9-15 / `3`, `3`, `3`, `3`, `3`, `3`, `3`,
1255	/ 16-24 / `4`, `4`, `4`, `4`, `4`, `4`, `4`, `4`, `4`,
1256	/ 25-31 / `5`, `5`, `5`, `5`, `5`, `5`, `5`,
1257	};
1258	return APInt (BitWidth, results[ (isSingleWord() ? U.VAL : U.pVal[`0`]) ]);
1259	}
1260
1261	// If the magnitude of the value fits in less than 52 bits (the precision of
1262	// an IEEE double precision floating point value), then we can use the
1263	// libc sqrt function which will probably use a hardware sqrt computation.
1264	// This should be faster than the algorithm below.
1265	if (magnitude < `52`) {
1266	return APInt (
1267	BitWidth,
1268	uint64_t(::floor(x: ::sqrt(x: double(isSingleWord() ? U.VAL : U.pVal[`0`])))));
1269	}
1270
1271	// Okay, all the short cuts are exhausted. We must compute it. The following
1272	// is a classical Babylonian method for computing the square root. This code
1273	// was adapted to APInt from a wikipedia article on such computations.
1274	// See http://www.wikipedia.org/ and go to the page named
1275	// Calculate_an_integer_square_root.
1276	unsigned nbits = BitWidth, i = `4`;
1277	APInt testy(BitWidth, `16`);
1278	APInt x_old(BitWidth, `1`);
1279	APInt x_new(BitWidth, `0`);
1280	APInt two(BitWidth, `2`);
1281
1282	// Select a good starting value using binary logarithms.
1283	for (;; i += `2`, testy = testy.shl(shiftAmt: `2`))
1284	if (i >= nbits \|\| this->ule(RHS: testy)) {
1285	x_old = x_old.shl(shiftAmt: i / `2`);
1286	break;
1287	}
1288
1289	// Use the Babylonian method to arrive at the integer square root:
1290	for (;;) {
1291	x_new = (this->udiv(RHS: x_old) + x_old).udiv(RHS: two);
1292	if (x_old.ule(RHS: x_new))
1293	break;
1294	x_old = x_new;
1295	}
1296	return x_old;
1297	}
1298
1299	/// \returns the multiplicative inverse of an odd APInt modulo 2^BitWidth.
1300	APInt APInt::multiplicativeInverse() const {
1301	assert((*this)[`0`] &&
1302	"multiplicative inverse is only defined for odd numbers!");
1303
1304	// Use Newton's method.
1305	APInt Factor = *this;
1306	APInt T;
1307	while (!(T = *this * Factor).isOne())
1308	Factor *= `2` - std::move(T);
1309	return Factor;
1310	}
1311
1312	/// Implementation of Knuth's Algorithm D (Division of nonnegative integers)
1313	/// from "Art of Computer Programming, Volume 2", section 4.3.1, p. 272. The
1314	/// variables here have the same names as in the algorithm. Comments explain
1315	/// the algorithm and any deviation from it.
1316	static void KnuthDiv(uint32_t u, uint32_t v, uint32_t q, uint32_t r,
1317	unsigned m, unsigned n) {
1318	assert(u && "Must provide dividend");
1319	assert(v && "Must provide divisor");
1320	assert(q && "Must provide quotient");
1321	assert(u != v && u != q && v != q && "Must use different memory");
1322	assert(n>`1` && "n must be > 1");
1323
1324	// b denotes the base of the number system. In our case b is 2^32.
1325	const uint64_t b = uint64_t(`1`) << `32`;
1326
1327	// The DEBUG macros here tend to be spam in the debug output if you're not
1328	// debugging this code. Disable them unless KNUTH_DEBUG is defined.
1329	#ifdef KNUTH_DEBUG
1330	#define DEBUG_KNUTH(X) LLVM_DEBUG(X)
1331	#else
1332	#define DEBUG_KNUTH(X) do {} while(false)
1333	#endif
1334
1335	DEBUG_KNUTH(dbgs() << "KnuthDiv: m=" << m << " n=" << n << `'\n'`);
1336	DEBUG_KNUTH(dbgs() << "KnuthDiv: original:");
1337	DEBUG_KNUTH(for (int i = m + n; i >= `0`; i--) dbgs() << " " << u[i]);
1338	DEBUG_KNUTH(dbgs() << " by");
1339	DEBUG_KNUTH(for (int i = n; i > `0`; i--) dbgs() << " " << v[i - `1`]);
1340	DEBUG_KNUTH(dbgs() << `'\n'`);
1341	// D1. [Normalize.] Set d = b / (v[n-1] + 1) and multiply all the digits of
1342	// u and v by d. Note that we have taken Knuth's advice here to use a power
1343	// of 2 value for d such that d v[n-1] >= b/2 (b is the base). A power of*
1344	// 2 allows us to shift instead of multiply and it is easy to determine the
1345	// shift amount from the leading zeros. We are basically normalizing the u
1346	// and v so that its high bits are shifted to the top of v's range without
1347	// overflow. Note that this can require an extra word in u so that u must
1348	// be of length m+n+1.
1349	unsigned shift = llvm::countl_zero(Val: v[n - `1`]);
1350	uint32_t v_carry = `0`;
1351	uint32_t u_carry = `0`;
1352	if (shift) {
1353	for (unsigned i = `0`; i < m+n; ++i) {
1354	uint32_t u_tmp = u[i] >> (`32` - shift);
1355	u[i] = (u[i] << shift) \| u_carry;
1356	u_carry = u_tmp;
1357	}
1358	for (unsigned i = `0`; i < n; ++i) {
1359	uint32_t v_tmp = v[i] >> (`32` - shift);
1360	v[i] = (v[i] << shift) \| v_carry;
1361	v_carry = v_tmp;
1362	}
1363	}
1364	u[m+n] = u_carry;
1365
1366	DEBUG_KNUTH(dbgs() << "KnuthDiv: normal:");
1367	DEBUG_KNUTH(for (int i = m + n; i >= `0`; i--) dbgs() << " " << u[i]);
1368	DEBUG_KNUTH(dbgs() << " by");
1369	DEBUG_KNUTH(for (int i = n; i > `0`; i--) dbgs() << " " << v[i - `1`]);
1370	DEBUG_KNUTH(dbgs() << `'\n'`);
1371
1372	// D2. [Initialize j.] Set j to m. This is the loop counter over the places.
1373	int j = m;
1374	do {
1375	DEBUG_KNUTH(dbgs() << "KnuthDiv: quotient digit #" << j << `'\n'`);
1376	// D3. [Calculate q'.].
1377	// Set qp = (u[j+n]b + u[j+n-1]) / v[n-1]. (qp=qprime=q')*
1378	// Set rp = (u[j+n]b + u[j+n-1]) % v[n-1]. (rp=rprime=r')*
1379	// Now test if qp == b or qpv[n-2] > brp + u[j+n-2]; if so, decrease
1380	// qp by 1, increase rp by v[n-1], and repeat this test if rp < b. The test
1381	// on v[n-2] determines at high speed most of the cases in which the trial
1382	// value qp is one too large, and it eliminates all cases where qp is two
1383	// too large.
1384	uint64_t dividend = Make_64(High: u[j+n], Low: u[j+n-`1`]);
1385	DEBUG_KNUTH(dbgs() << "KnuthDiv: dividend == " << dividend << `'\n'`);
1386	uint64_t qp = dividend / v[n-`1`];
1387	uint64_t rp = dividend % v[n-`1`];
1388	if (qp == b \|\| qpv[n-`2`] > brp + u[j+n-`2`]) {
1389	qp--;
1390	rp += v[n-`1`];
1391	if (rp < b && (qp == b \|\| qpv[n-`2`] > brp + u[j+n-`2`]))
1392	qp--;
1393	}
1394	DEBUG_KNUTH(dbgs() << "KnuthDiv: qp == " << qp << ", rp == " << rp << `'\n'`);
1395
1396	// D4. [Multiply and subtract.] Replace (u[j+n]u[j+n-1]...u[j]) with
1397	// (u[j+n]u[j+n-1]..u[j]) - qp (v[n-1]...v[1]v[0]). This computation*
1398	// consists of a simple multiplication by a one-place number, combined with
1399	// a subtraction.
1400	// The digits (u[j+n]...u[j]) should be kept positive; if the result of
1401	// this step is actually negative, (u[j+n]...u[j]) should be left as the
1402	// true value plus b(n+1), namely as the b's complement of
1403	// the true value, and a "borrow" to the left should be remembered.
1404	int64_t borrow = `0`;
1405	for (unsigned i = `0`; i < n; ++i) {
1406	uint64_t p = qp * uint64_t(v[i]);
1407	int64_t subres = int64_t(u[j+i]) - borrow - Lo_32(Value: p);
1408	u[j+i] = Lo_32(Value: subres);
1409	borrow = Hi_32(Value: p) - Hi_32(Value: subres);
1410	DEBUG_KNUTH(dbgs() << "KnuthDiv: u[j+i] = " << u[j + i]
1411	<< ", borrow = " << borrow << `'\n'`);
1412	}
1413	bool isNeg = u[j+n] < borrow;
1414	u[j+n] -= Lo_32(Value: borrow);
1415
1416	DEBUG_KNUTH(dbgs() << "KnuthDiv: after subtraction:");
1417	DEBUG_KNUTH(for (int i = m + n; i >= `0`; i--) dbgs() << " " << u[i]);
1418	DEBUG_KNUTH(dbgs() << `'\n'`);
1419
1420	// D5. [Test remainder.] Set q[j] = qp. If the result of step D4 was
1421	// negative, go to step D6; otherwise go on to step D7.
1422	q[j] = Lo_32(Value: qp);
1423	if (isNeg) {
1424	// D6. [Add back]. The probability that this step is necessary is very
1425	// small, on the order of only 2/b. Make sure that test data accounts for
1426	// this possibility. Decrease q[j] by 1
1427	q[j]--;
1428	// and add (0v[n-1]...v[1]v[0]) to (u[j+n]u[j+n-1]...u[j+1]u[j]).
1429	// A carry will occur to the left of u[j+n], and it should be ignored
1430	// since it cancels with the borrow that occurred in D4.
1431	bool carry = false;
1432	for (unsigned i = `0`; i < n; i++) {
1433	uint32_t limit = std::min(a: u[j+i],b: v[i]);
1434	u[j+i] += v[i] + carry;
1435	carry = u[j+i] < limit \|\| (carry && u[j+i] == limit);
1436	}
1437	u[j+n] += carry;
1438	}
1439	DEBUG_KNUTH(dbgs() << "KnuthDiv: after correction:");
1440	DEBUG_KNUTH(for (int i = m + n; i >= `0`; i--) dbgs() << " " << u[i]);
1441	DEBUG_KNUTH(dbgs() << "\nKnuthDiv: digit result = " << q[j] << `'\n'`);
1442
1443	// D7. [Loop on j.] Decrease j by one. Now if j >= 0, go back to D3.
1444	} while (--j >= `0`);
1445
1446	DEBUG_KNUTH(dbgs() << "KnuthDiv: quotient:");
1447	DEBUG_KNUTH(for (int i = m; i >= `0`; i--) dbgs() << " " << q[i]);
1448	DEBUG_KNUTH(dbgs() << `'\n'`);
1449
1450	// D8. [Unnormalize]. Now q[...] is the desired quotient, and the desired
1451	// remainder may be obtained by dividing u[...] by d. If r is non-null we
1452	// compute the remainder (urem uses this).
1453	if (r) {
1454	// The value d is expressed by the "shift" value above since we avoided
1455	// multiplication by d by using a shift left. So, all we have to do is
1456	// shift right here.
1457	if (shift) {
1458	uint32_t carry = `0`;
1459	DEBUG_KNUTH(dbgs() << "KnuthDiv: remainder:");
1460	for (int i = n-`1`; i >= `0`; i--) {
1461	r[i] = (u[i] >> shift) \| carry;
1462	carry = u[i] << (`32` - shift);
1463	DEBUG_KNUTH(dbgs() << " " << r[i]);
1464	}
1465	} else {
1466	for (int i = n-`1`; i >= `0`; i--) {
1467	r[i] = u[i];
1468	DEBUG_KNUTH(dbgs() << " " << r[i]);
1469	}
1470	}
1471	DEBUG_KNUTH(dbgs() << `'\n'`);
1472	}
1473	DEBUG_KNUTH(dbgs() << `'\n'`);
1474	}
1475
1476	void APInt::divide(const WordType LHS, unsigned* lhsWords, const WordType *RHS,
1477	unsigned rhsWords, WordType Quotient, WordType Remainder) {
1478	assert(lhsWords >= rhsWords && "Fractional result");
1479
1480	// First, compose the values into an array of 32-bit words instead of
1481	// 64-bit words. This is a necessity of both the "short division" algorithm
1482	// and the Knuth "classical algorithm" which requires there to be native
1483	// operations for +, -, and on an m bit value with an m2 bit result. We
1484	// can't use 64-bit operands here because we don't have native results of
1485	// 128-bits. Furthermore, casting the 64-bit values to 32-bit values won't
1486	// work on large-endian machines.
1487	unsigned n = rhsWords * `2`;
1488	unsigned m = (lhsWords * `2`) - n;
1489
1490	// Allocate space for the temporary values we need either on the stack, if
1491	// it will fit, or on the heap if it won't.
1492	uint32_t SPACE[`128`];
1493	uint32_t U = nullptr*;
1494	uint32_t V = nullptr*;
1495	uint32_t Q = nullptr*;
1496	uint32_t R = nullptr*;
1497	if ((Remainder?`4`:`3`)n+`2`m+`1` <= `128`) {
1498	U = &SPACE[`0`];
1499	V = &SPACE[m+n+`1`];
1500	Q = &SPACE[(m+n+`1`) + n];
1501	if (Remainder)
1502	R = &SPACE[(m+n+`1`) + n + (m+n)];
1503	} else {
1504	U = new uint32_t[m + n + `1`];
1505	V = new uint32_t[n];
1506	Q = new uint32_t[m+n];
1507	if (Remainder)
1508	R = new uint32_t[n];
1509	}
1510
1511	// Initialize the dividend
1512	memset(s: U, c: `0`, n: (m+n+`1`)*sizeof(uint32_t));
1513	for (unsigned i = `0`; i < lhsWords; ++i) {
1514	uint64_t tmp = LHS[i];
1515	U[i * `2`] = Lo_32(Value: tmp);
1516	U[i * `2` + `1`] = Hi_32(Value: tmp);
1517	}
1518	U[m+n] = `0`; // this extra word is for "spill" in the Knuth algorithm.
1519
1520	// Initialize the divisor
1521	memset(s: V, c: `0`, n: (n)*sizeof(uint32_t));
1522	for (unsigned i = `0`; i < rhsWords; ++i) {
1523	uint64_t tmp = RHS[i];
1524	V[i * `2`] = Lo_32(Value: tmp);
1525	V[i * `2` + `1`] = Hi_32(Value: tmp);
1526	}
1527
1528	// initialize the quotient and remainder
1529	memset(s: Q, c: `0`, n: (m+n) * sizeof(uint32_t));
1530	if (Remainder)
1531	memset(s: R, c: `0`, n: n * sizeof(uint32_t));
1532
1533	// Now, adjust m and n for the Knuth division. n is the number of words in
1534	// the divisor. m is the number of words by which the dividend exceeds the
1535	// divisor (i.e. m+n is the length of the dividend). These sizes must not
1536	// contain any zero words or the Knuth algorithm fails.
1537	for (unsigned i = n; i > `0` && V[i-`1`] == `0`; i--) {
1538	n--;
1539	m++;
1540	}
1541	for (unsigned i = m+n; i > `0` && U[i-`1`] == `0`; i--)
1542	m--;
1543
1544	// If we're left with only a single word for the divisor, Knuth doesn't work
1545	// so we implement the short division algorithm here. This is much simpler
1546	// and faster because we are certain that we can divide a 64-bit quantity
1547	// by a 32-bit quantity at hardware speed and short division is simply a
1548	// series of such operations. This is just like doing short division but we
1549	// are using base 2^32 instead of base 10.
1550	assert(n != `0` && "Divide by zero?");
1551	if (n == `1`) {
1552	uint32_t divisor = V[`0`];
1553	uint32_t remainder = `0`;
1554	for (int i = m; i >= `0`; i--) {
1555	uint64_t partial_dividend = Make_64(High: remainder, Low: U[i]);
1556	if (partial_dividend == `0`) {
1557	Q[i] = `0`;
1558	remainder = `0`;
1559	} else if (partial_dividend < divisor) {
1560	Q[i] = `0`;
1561	remainder = Lo_32(Value: partial_dividend);
1562	} else if (partial_dividend == divisor) {
1563	Q[i] = `1`;
1564	remainder = `0`;
1565	} else {
1566	Q[i] = Lo_32(Value: partial_dividend / divisor);
1567	remainder = Lo_32(Value: partial_dividend - (Q[i] * divisor));
1568	}
1569	}
1570	if (R)
1571	R[`0`] = remainder;
1572	} else {
1573	// Now we're ready to invoke the Knuth classical divide algorithm. In this
1574	// case n > 1.
1575	KnuthDiv(u: U, v: V, q: Q, r: R, m, n);
1576	}
1577
1578	// If the caller wants the quotient
1579	if (Quotient) {
1580	for (unsigned i = `0`; i < lhsWords; ++i)
1581	Quotient[i] = Make_64(High: Q[i`2`+`1`], Low: Q[i`2`]);
1582	}
1583
1584	// If the caller wants the remainder
1585	if (Remainder) {
1586	for (unsigned i = `0`; i < rhsWords; ++i)
1587	Remainder[i] = Make_64(High: R[i`2`+`1`], Low: R[i`2`]);
1588	}
1589
1590	// Clean up the memory we allocated.
1591	if (U != &SPACE[`0`]) {
1592	delete [] U;
1593	delete [] V;
1594	delete [] Q;
1595	delete [] R;
1596	}
1597	}
1598
1599	APInt APInt::udiv(const APInt &RHS) const {
1600	assert(BitWidth == RHS.BitWidth && "Bit widths must be the same");
1601
1602	// First, deal with the easy case
1603	if (isSingleWord()) {
1604	assert(RHS.U.VAL != `0` && "Divide by zero?");
1605	return APInt (BitWidth, U.VAL / RHS.U.VAL);
1606	}
1607
1608	// Get some facts about the LHS and RHS number of bits and words
1609	unsigned lhsWords = getNumWords(BitWidth: getActiveBits());
1610	unsigned rhsBits = RHS.getActiveBits();
1611	unsigned rhsWords = getNumWords(BitWidth: rhsBits);
1612	assert(rhsWords && "Divided by zero???");
1613
1614	// Deal with some degenerate cases
1615	if (!lhsWords)
1616	// 0 / X ===> 0
1617	return APInt (BitWidth, `0`);
1618	if (rhsBits == `1`)
1619	// X / 1 ===> X
1620	return *this;
1621	if (lhsWords < rhsWords \|\| this->ult(RHS))
1622	// X / Y ===> 0, iff X < Y
1623	return APInt (BitWidth, `0`);
1624	if (*this == RHS)
1625	// X / X ===> 1
1626	return APInt (BitWidth, `1`);
1627	if (lhsWords == `1`) // rhsWords is 1 if lhsWords is 1.
1628	// All high words are zero, just use native divide
1629	return APInt (BitWidth, this->U.pVal[`0`] / RHS.U.pVal[`0`]);
1630
1631	// We have to compute it the hard way. Invoke the Knuth divide algorithm.
1632	APInt Quotient(BitWidth, `0`); // to hold result.
1633	divide(LHS: U.pVal, lhsWords, RHS: RHS.U.pVal, rhsWords, Quotient: Quotient.U.pVal, Remainder: nullptr);
1634	return Quotient;
1635	}
1636
1637	APInt APInt::udiv(uint64_t RHS) const {
1638	assert(RHS != `0` && "Divide by zero?");
1639
1640	// First, deal with the easy case
1641	if (isSingleWord())
1642	return APInt (BitWidth, U.VAL / RHS);
1643
1644	// Get some facts about the LHS words.
1645	unsigned lhsWords = getNumWords(BitWidth: getActiveBits());
1646
1647	// Deal with some degenerate cases
1648	if (!lhsWords)
1649	// 0 / X ===> 0
1650	return APInt (BitWidth, `0`);
1651	if (RHS == `1`)
1652	// X / 1 ===> X
1653	return *this;
1654	if (this->ult(RHS))
1655	// X / Y ===> 0, iff X < Y
1656	return APInt (BitWidth, `0`);
1657	if (*this == RHS)
1658	// X / X ===> 1
1659	return APInt (BitWidth, `1`);
1660	if (lhsWords == `1`) // rhsWords is 1 if lhsWords is 1.
1661	// All high words are zero, just use native divide
1662	return APInt (BitWidth, this->U.pVal[`0`] / RHS);
1663
1664	// We have to compute it the hard way. Invoke the Knuth divide algorithm.
1665	APInt Quotient(BitWidth, `0`); // to hold result.
1666	divide(LHS: U.pVal, lhsWords, RHS: &RHS, rhsWords: `1`, Quotient: Quotient.U.pVal, Remainder: nullptr);
1667	return Quotient;
1668	}
1669
1670	APInt APInt::sdiv(const APInt &RHS) const {
1671	if (isNegative()) {
1672	if (RHS.isNegative())
1673	return (-(*this)).udiv(RHS: -RHS);
1674	return -((-(*this)).udiv(RHS));
1675	}
1676	if (RHS.isNegative())
1677	return -(this->udiv(RHS: -RHS));
1678	return this->udiv(RHS);
1679	}
1680
1681	APInt APInt::sdiv(int64_t RHS) const {
1682	if (isNegative()) {
1683	if (RHS < `0`)
1684	return (-(*this)).udiv(RHS: -RHS);
1685	return -((-(*this)).udiv(RHS));
1686	}
1687	if (RHS < `0`)
1688	return -(this->udiv(RHS: -RHS));
1689	return this->udiv(RHS);
1690	}
1691
1692	APInt APInt::urem(const APInt &RHS) const {
1693	assert(BitWidth == RHS.BitWidth && "Bit widths must be the same");
1694	if (isSingleWord()) {
1695	assert(RHS.U.VAL != `0` && "Remainder by zero?");
1696	return APInt (BitWidth, U.VAL % RHS.U.VAL);
1697	}
1698
1699	// Get some facts about the LHS
1700	unsigned lhsWords = getNumWords(BitWidth: getActiveBits());
1701
1702	// Get some facts about the RHS
1703	unsigned rhsBits = RHS.getActiveBits();
1704	unsigned rhsWords = getNumWords(BitWidth: rhsBits);
1705	assert(rhsWords && "Performing remainder operation by zero ???");
1706
1707	// Check the degenerate cases
1708	if (lhsWords == `0`)
1709	// 0 % Y ===> 0
1710	return APInt (BitWidth, `0`);
1711	if (rhsBits == `1`)
1712	// X % 1 ===> 0
1713	return APInt (BitWidth, `0`);
1714	if (lhsWords < rhsWords \|\| this->ult(RHS))
1715	// X % Y ===> X, iff X < Y
1716	return *this;
1717	if (*this == RHS)
1718	// X % X == 0;
1719	return APInt (BitWidth, `0`);
1720	if (lhsWords == `1`)
1721	// All high words are zero, just use native remainder
1722	return APInt (BitWidth, U.pVal[`0`] % RHS.U.pVal[`0`]);
1723	if (RHS.isPowerOf2()) {
1724	// X % 2^w ===> X & (2^w - 1)
1725	APInt Result(*this);
1726	Result.clearBits(LoBit: RHS.logBase2(), HiBit: BitWidth);
1727	return Result;
1728	}
1729
1730	// We have to compute it the hard way. Invoke the Knuth divide algorithm.
1731	APInt Remainder(BitWidth, `0`);
1732	divide(LHS: U.pVal, lhsWords, RHS: RHS.U.pVal, rhsWords, Quotient: nullptr, Remainder: Remainder.U.pVal);
1733	return Remainder;
1734	}
1735
1736	uint64_t APInt::urem(uint64_t RHS) const {
1737	assert(RHS != `0` && "Remainder by zero?");
1738
1739	if (isSingleWord())
1740	return U.VAL % RHS;
1741
1742	// Get some facts about the LHS
1743	unsigned lhsWords = getNumWords(BitWidth: getActiveBits());
1744
1745	// Check the degenerate cases
1746	if (lhsWords == `0`)
1747	// 0 % Y ===> 0
1748	return `0`;
1749	if (RHS == `1`)
1750	// X % 1 ===> 0
1751	return `0`;
1752	if (this->ult(RHS))
1753	// X % Y ===> X, iff X < Y
1754	return getZExtValue();
1755	if (*this == RHS)
1756	// X % X == 0;
1757	return `0`;
1758	if (lhsWords == `1`)
1759	// All high words are zero, just use native remainder
1760	return U.pVal[`0`] % RHS;
1761	if (llvm::isPowerOf2_64(Value: RHS))
1762	// X % 2^w ===> X & (2^w - 1)
1763	return U.pVal[`0`] & (RHS - `1`);
1764
1765	// We have to compute it the hard way. Invoke the Knuth divide algorithm.
1766	uint64_t Remainder;
1767	divide(LHS: U.pVal, lhsWords, RHS: &RHS, rhsWords: `1`, Quotient: nullptr, Remainder: &Remainder);
1768	return Remainder;
1769	}
1770
1771	APInt APInt::srem(const APInt &RHS) const {
1772	if (isNegative()) {
1773	if (RHS.isNegative())
1774	return -((-(*this)).urem(RHS: -RHS));
1775	return -((-(*this)).urem(RHS));
1776	}
1777	if (RHS.isNegative())
1778	return this->urem(RHS: -RHS);
1779	return this->urem(RHS);
1780	}
1781
1782	int64_t APInt::srem(int64_t RHS) const {
1783	if (isNegative()) {
1784	if (RHS < `0`)
1785	return -((-(*this)).urem(RHS: -RHS));
1786	return -((-(*this)).urem(RHS));
1787	}
1788	if (RHS < `0`)
1789	return this->urem(RHS: -RHS);
1790	return this->urem(RHS);
1791	}
1792
1793	void APInt::udivrem(const APInt &LHS, const APInt &RHS,
1794	APInt &Quotient, APInt &Remainder) {
1795	assert(LHS.BitWidth == RHS.BitWidth && "Bit widths must be the same");
1796	unsigned BitWidth = LHS.BitWidth;
1797
1798	// First, deal with the easy case
1799	if (LHS.isSingleWord()) {
1800	assert(RHS.U.VAL != `0` && "Divide by zero?");
1801	uint64_t QuotVal = LHS.U.VAL / RHS.U.VAL;
1802	uint64_t RemVal = LHS.U.VAL % RHS.U.VAL;
1803	Quotient = APInt (BitWidth, QuotVal);
1804	Remainder = APInt (BitWidth, RemVal);
1805	return;
1806	}
1807
1808	// Get some size facts about the dividend and divisor
1809	unsigned lhsWords = getNumWords(BitWidth: LHS.getActiveBits());
1810	unsigned rhsBits = RHS.getActiveBits();
1811	unsigned rhsWords = getNumWords(BitWidth: rhsBits);
1812	assert(rhsWords && "Performing divrem operation by zero ???");
1813
1814	// Check the degenerate cases
1815	if (lhsWords == `0`) {
1816	Quotient = APInt (BitWidth, `0`); // 0 / Y ===> 0
1817	Remainder = APInt (BitWidth, `0`); // 0 % Y ===> 0
1818	return;
1819	}
1820
1821	if (rhsBits == `1`) {
1822	Quotient = LHS; // X / 1 ===> X
1823	Remainder = APInt (BitWidth, `0`); // X % 1 ===> 0
1824	}
1825
1826	if (lhsWords < rhsWords \|\| LHS.ult(RHS)) {
1827	Remainder = LHS; // X % Y ===> X, iff X < Y
1828	Quotient = APInt (BitWidth, `0`); // X / Y ===> 0, iff X < Y
1829	return;
1830	}
1831
1832	if (LHS == RHS) {
1833	Quotient = APInt (BitWidth, `1`); // X / X ===> 1
1834	Remainder = APInt (BitWidth, `0`); // X % X ===> 0;
1835	return;
1836	}
1837
1838	// Make sure there is enough space to hold the results.
1839	// NOTE: This assumes that reallocate won't affect any bits if it doesn't
1840	// change the size. This is necessary if Quotient or Remainder is aliased
1841	// with LHS or RHS.
1842	Quotient.reallocate(NewBitWidth: BitWidth);
1843	Remainder.reallocate(NewBitWidth: BitWidth);
1844
1845	if (lhsWords == `1`) { // rhsWords is 1 if lhsWords is 1.
1846	// There is only one word to consider so use the native versions.
1847	uint64_t lhsValue = LHS.U.pVal[`0`];
1848	uint64_t rhsValue = RHS.U.pVal[`0`];
1849	Quotient = lhsValue / rhsValue;
1850	Remainder = lhsValue % rhsValue;
1851	return;
1852	}
1853
1854	// Okay, lets do it the long way
1855	divide(LHS: LHS.U.pVal, lhsWords, RHS: RHS.U.pVal, rhsWords, Quotient: Quotient.U.pVal,
1856	Remainder: Remainder.U.pVal);
1857	// Clear the rest of the Quotient and Remainder.
1858	std::memset(s: Quotient.U.pVal + lhsWords, c: `0`,
1859	n: (getNumWords(BitWidth) - lhsWords) * APINT_WORD_SIZE);
1860	std::memset(s: Remainder.U.pVal + rhsWords, c: `0`,
1861	n: (getNumWords(BitWidth) - rhsWords) * APINT_WORD_SIZE);
1862	}
1863
1864	void APInt::udivrem(const APInt &LHS, uint64_t RHS, APInt &Quotient,
1865	uint64_t &Remainder) {
1866	assert(RHS != `0` && "Divide by zero?");
1867	unsigned BitWidth = LHS.BitWidth;
1868
1869	// First, deal with the easy case
1870	if (LHS.isSingleWord()) {
1871	uint64_t QuotVal = LHS.U.VAL / RHS;
1872	Remainder = LHS.U.VAL % RHS;
1873	Quotient = APInt (BitWidth, QuotVal);
1874	return;
1875	}
1876
1877	// Get some size facts about the dividend and divisor
1878	unsigned lhsWords = getNumWords(BitWidth: LHS.getActiveBits());
1879
1880	// Check the degenerate cases
1881	if (lhsWords == `0`) {
1882	Quotient = APInt (BitWidth, `0`); // 0 / Y ===> 0
1883	Remainder = `0`; // 0 % Y ===> 0
1884	return;
1885	}
1886
1887	if (RHS == `1`) {
1888	Quotient = LHS; // X / 1 ===> X
1889	Remainder = `0`; // X % 1 ===> 0
1890	return;
1891	}
1892
1893	if (LHS.ult(RHS)) {
1894	Remainder = LHS.getZExtValue(); // X % Y ===> X, iff X < Y
1895	Quotient = APInt (BitWidth, `0`); // X / Y ===> 0, iff X < Y
1896	return;
1897	}
1898
1899	if (LHS == RHS) {
1900	Quotient = APInt (BitWidth, `1`); // X / X ===> 1
1901	Remainder = `0`; // X % X ===> 0;
1902	return;
1903	}
1904
1905	// Make sure there is enough space to hold the results.
1906	// NOTE: This assumes that reallocate won't affect any bits if it doesn't
1907	// change the size. This is necessary if Quotient is aliased with LHS.
1908	Quotient.reallocate(NewBitWidth: BitWidth);
1909
1910	if (lhsWords == `1`) { // rhsWords is 1 if lhsWords is 1.
1911	// There is only one word to consider so use the native versions.
1912	uint64_t lhsValue = LHS.U.pVal[`0`];
1913	Quotient = lhsValue / RHS;
1914	Remainder = lhsValue % RHS;
1915	return;
1916	}
1917
1918	// Okay, lets do it the long way
1919	divide(LHS: LHS.U.pVal, lhsWords, RHS: &RHS, rhsWords: `1`, Quotient: Quotient.U.pVal, Remainder: &Remainder);
1920	// Clear the rest of the Quotient.
1921	std::memset(s: Quotient.U.pVal + lhsWords, c: `0`,
1922	n: (getNumWords(BitWidth) - lhsWords) * APINT_WORD_SIZE);
1923	}
1924
1925	void APInt::sdivrem(const APInt &LHS, const APInt &RHS,
1926	APInt &Quotient, APInt &Remainder) {
1927	if (LHS.isNegative()) {
1928	if (RHS.isNegative())
1929	APInt::udivrem(LHS: -LHS, RHS: -RHS, Quotient, Remainder);
1930	else {
1931	APInt::udivrem(LHS: -LHS, RHS, Quotient, Remainder);
1932	Quotient.negate();
1933	}
1934	Remainder.negate();
1935	} else if (RHS.isNegative()) {
1936	APInt::udivrem(LHS, RHS: -RHS, Quotient, Remainder);
1937	Quotient.negate();
1938	} else {
1939	APInt::udivrem(LHS, RHS, Quotient, Remainder);
1940	}
1941	}
1942
1943	void APInt::sdivrem(const APInt &LHS, int64_t RHS,
1944	APInt &Quotient, int64_t &Remainder) {
1945	uint64_t R = Remainder;
1946	if (LHS.isNegative()) {
1947	if (RHS < `0`)
1948	APInt::udivrem(LHS: -LHS, RHS: -RHS, Quotient, Remainder&: R);
1949	else {
1950	APInt::udivrem(LHS: -LHS, RHS, Quotient, Remainder&: R);
1951	Quotient.negate();
1952	}
1953	R = -R;
1954	} else if (RHS < `0`) {
1955	APInt::udivrem(LHS, RHS: -RHS, Quotient, Remainder&: R);
1956	Quotient.negate();
1957	} else {
1958	APInt::udivrem(LHS, RHS, Quotient, Remainder&: R);
1959	}
1960	Remainder = R;
1961	}
1962
1963	APInt APInt::sadd_ov(const APInt &RHS, bool &Overflow) const {
1964	APInt Res = *this+RHS;
1965	Overflow = isNonNegative() == RHS.isNonNegative() &&
1966	Res.isNonNegative() != isNonNegative();
1967	return Res;
1968	}
1969
1970	APInt APInt::uadd_ov(const APInt &RHS, bool &Overflow) const {
1971	APInt Res = *this+RHS;
1972	Overflow = Res.ult(RHS);
1973	return Res;
1974	}
1975
1976	APInt APInt::ssub_ov(const APInt &RHS, bool &Overflow) const {
1977	APInt Res = *this - RHS;
1978	Overflow = isNonNegative() != RHS.isNonNegative() &&
1979	Res.isNonNegative() != isNonNegative();
1980	return Res;
1981	}
1982
1983	APInt APInt::usub_ov(const APInt &RHS, bool &Overflow) const {
1984	APInt Res = *this-RHS;
1985	Overflow = Res.ugt(RHS: *this);
1986	return Res;
1987	}
1988
1989	APInt APInt::sdiv_ov(const APInt &RHS, bool &Overflow) const {
1990	// MININT/-1 --> overflow.
1991	Overflow = isMinSignedValue() && RHS.isAllOnes();
1992	return sdiv(RHS);
1993	}
1994
1995	APInt APInt::smul_ov(const APInt &RHS, bool &Overflow) const {
1996	APInt Res = *this * RHS;
1997
1998	if (RHS != `0`)
1999	Overflow = Res.sdiv(RHS) != *this \|\|
2000	(isMinSignedValue() && RHS.isAllOnes());
2001	else
2002	Overflow = false;
2003	return Res;
2004	}
2005
2006	APInt APInt::umul_ov(const APInt &RHS, bool &Overflow) const {
2007	if (countl_zero() + RHS.countl_zero() + `2` <= BitWidth) {
2008	Overflow = true;
2009	return *this * RHS;
2010	}
2011
2012	APInt Res = lshr(shiftAmt: `1`) * RHS;
2013	Overflow = Res.isNegative();
2014	Res <<= `1`;
2015	if ((*this)[`0`]) {
2016	Res += RHS;
2017	if (Res.ult(RHS))
2018	Overflow = true;
2019	}
2020	return Res;
2021	}
2022
2023	APInt APInt::sshl_ov(const APInt &ShAmt, bool &Overflow) const {
2024	return sshl_ov(Amt: ShAmt.getLimitedValue(Limit: getBitWidth()), Overflow);
2025	}
2026
2027	APInt APInt::sshl_ov(unsigned ShAmt, bool &Overflow) const {
2028	Overflow = ShAmt >= getBitWidth();
2029	if (Overflow)
2030	return APInt (BitWidth, `0`);
2031
2032	if (isNonNegative()) // Don't allow sign change.
2033	Overflow = ShAmt >= countl_zero();
2034	else
2035	Overflow = ShAmt >= countl_one();
2036
2037	return *this << ShAmt;
2038	}
2039
2040	APInt APInt::ushl_ov(const APInt &ShAmt, bool &Overflow) const {
2041	return ushl_ov(Amt: ShAmt.getLimitedValue(Limit: getBitWidth()), Overflow);
2042	}
2043
2044	APInt APInt::ushl_ov(unsigned ShAmt, bool &Overflow) const {
2045	Overflow = ShAmt >= getBitWidth();
2046	if (Overflow)
2047	return APInt (BitWidth, `0`);
2048
2049	Overflow = ShAmt > countl_zero();
2050
2051	return *this << ShAmt;
2052	}
2053
2054	APInt APInt::sfloordiv_ov(const APInt &RHS, bool &Overflow) const {
2055	APInt quotient = sdiv_ov(RHS, Overflow);
2056	if ((quotient * RHS != *this) && (isNegative() != RHS.isNegative()))
2057	return quotient - `1`;
2058	return quotient;
2059	}
2060
2061	APInt APInt::sadd_sat(const APInt &RHS) const {
2062	bool Overflow;
2063	APInt Res = sadd_ov(RHS, Overflow);
2064	if (!Overflow)
2065	return Res;
2066
2067	return isNegative() ? APInt::getSignedMinValue(numBits: BitWidth)
2068	: APInt::getSignedMaxValue(numBits: BitWidth);
2069	}
2070
2071	APInt APInt::uadd_sat(const APInt &RHS) const {
2072	bool Overflow;
2073	APInt Res = uadd_ov(RHS, Overflow);
2074	if (!Overflow)
2075	return Res;
2076
2077	return APInt::getMaxValue(numBits: BitWidth);
2078	}
2079
2080	APInt APInt::ssub_sat(const APInt &RHS) const {
2081	bool Overflow;
2082	APInt Res = ssub_ov(RHS, Overflow);
2083	if (!Overflow)
2084	return Res;
2085
2086	return isNegative() ? APInt::getSignedMinValue(numBits: BitWidth)
2087	: APInt::getSignedMaxValue(numBits: BitWidth);
2088	}
2089
2090	APInt APInt::usub_sat(const APInt &RHS) const {
2091	bool Overflow;
2092	APInt Res = usub_ov(RHS, Overflow);
2093	if (!Overflow)
2094	return Res;
2095
2096	return APInt (BitWidth, `0`);
2097	}
2098
2099	APInt APInt::smul_sat(const APInt &RHS) const {
2100	bool Overflow;
2101	APInt Res = smul_ov(RHS, Overflow);
2102	if (!Overflow)
2103	return Res;
2104
2105	// The result is negative if one and only one of inputs is negative.
2106	bool ResIsNegative = isNegative() ^ RHS.isNegative();
2107
2108	return ResIsNegative ? APInt::getSignedMinValue(numBits: BitWidth)
2109	: APInt::getSignedMaxValue(numBits: BitWidth);
2110	}
2111
2112	APInt APInt::umul_sat(const APInt &RHS) const {
2113	bool Overflow;
2114	APInt Res = umul_ov(RHS, Overflow);
2115	if (!Overflow)
2116	return Res;
2117
2118	return APInt::getMaxValue(numBits: BitWidth);
2119	}
2120
2121	APInt APInt::sshl_sat(const APInt &RHS) const {
2122	return sshl_sat(RHS: RHS.getLimitedValue(Limit: getBitWidth()));
2123	}
2124
2125	APInt APInt::sshl_sat(unsigned RHS) const {
2126	bool Overflow;
2127	APInt Res = sshl_ov(ShAmt: RHS, Overflow);
2128	if (!Overflow)
2129	return Res;
2130
2131	return isNegative() ? APInt::getSignedMinValue(numBits: BitWidth)
2132	: APInt::getSignedMaxValue(numBits: BitWidth);
2133	}
2134
2135	APInt APInt::ushl_sat(const APInt &RHS) const {
2136	return ushl_sat(RHS: RHS.getLimitedValue(Limit: getBitWidth()));
2137	}
2138
2139	APInt APInt::ushl_sat(unsigned RHS) const {
2140	bool Overflow;
2141	APInt Res = ushl_ov(ShAmt: RHS, Overflow);
2142	if (!Overflow)
2143	return Res;
2144
2145	return APInt::getMaxValue(numBits: BitWidth);
2146	}
2147
2148	void APInt::fromString(unsigned numbits, StringRef str, uint8_t radix) {
2149	// Check our assumptions here
2150	assert(!str.empty() && "Invalid string length");
2151	assert((radix == `10` \|\| radix == `8` \|\| radix == `16` \|\| radix == `2` \|\|
2152	radix == `36`) &&
2153	"Radix should be 2, 8, 10, 16, or 36!");
2154
2155	StringRef::iterator p = str.begin();
2156	size_t slen = str.size();
2157	bool isNeg = *p == `'-'`;
2158	if (p == `'-'` \|\| p == `'+'`) {
2159	p++;
2160	slen--;
2161	assert(slen && "String is only a sign, needs a value.");
2162	}
2163	assert((slen <= numbits \|\| radix != `2`) && "Insufficient bit width");
2164	assert(((slen-`1`)*`3` <= numbits \|\| radix != `8`) && "Insufficient bit width");
2165	assert(((slen-`1`)*`4` <= numbits \|\| radix != `16`) && "Insufficient bit width");
2166	assert((((slen-`1`)*`64`)/`22` <= numbits \|\| radix != `10`) &&
2167	"Insufficient bit width");
2168
2169	// Allocate memory if needed
2170	if (isSingleWord())
2171	U.VAL = `0`;
2172	else
2173	U.pVal = getClearedMemory(numWords: getNumWords());
2174
2175	// Figure out if we can shift instead of multiply
2176	unsigned shift = (radix == `16` ? `4` : radix == `8` ? `3` : radix == `2` ? `1` : `0`);
2177
2178	// Enter digit traversal loop
2179	for (StringRef::iterator e = str.end(); p != e; ++p) {
2180	unsigned digit = getDigit(cdigit: *p, radix);
2181	assert(digit < radix && "Invalid character in digit string");
2182
2183	// Shift or multiply the value by the radix
2184	if (slen > `1`) {
2185	if (shift)
2186	*this <<= shift;
2187	else
2188	*this *= radix;
2189	}
2190
2191	// Add in the digit we just interpreted
2192	*this += digit;
2193	}
2194	// If its negative, put it in two's complement form
2195	if (isNeg)
2196	this->negate();
2197	}
2198
2199	void APInt::toString(SmallVectorImpl<char> &Str, unsigned Radix, bool Signed,
2200	bool formatAsCLiteral, bool UpperCase,
2201	bool InsertSeparators) const {
2202	assert((Radix == `10` \|\| Radix == `8` \|\| Radix == `16` \|\| Radix == `2` \|\|
2203	Radix == `36`) &&
2204	"Radix should be 2, 8, 10, 16, or 36!");
2205
2206	const char *Prefix = "";
2207	if (formatAsCLiteral) {
2208	switch (Radix) {
2209	case `2`:
2210	// Binary literals are a non-standard extension added in gcc 4.3:
2211	// http://gcc.gnu.org/onlinedocs/gcc-4.3.0/gcc/Binary-constants.html
2212	Prefix = "0b";
2213	break;
2214	case `8`:
2215	Prefix = "0";
2216	break;
2217	case `10`:
2218	break; // No prefix
2219	case `16`:
2220	Prefix = "0x";
2221	break;
2222	default:
2223	llvm_unreachable("Invalid radix!");
2224	}
2225	}
2226
2227	// Number of digits in a group between separators.
2228	unsigned Grouping = (Radix == `8` \|\| Radix == `10`) ? `3` : `4`;
2229
2230	// First, check for a zero value and just short circuit the logic below.
2231	if (isZero()) {
2232	while (*Prefix) {
2233	Str.push_back(Elt: *Prefix);
2234	++Prefix;
2235	};
2236	Str.push_back(Elt: `'0'`);
2237	return;
2238	}
2239
2240	static const char BothDigits[] = "0123456789abcdefghijklmnopqrstuvwxyz"
2241	"0123456789ABCDEFGHIJKLMNOPQRSTUVWXYZ";
2242	const char *Digits = BothDigits + (UpperCase ? `36` : `0`);
2243
2244	if (isSingleWord()) {
2245	char Buffer[`65`];
2246	char *BufPtr = std::end(arr&: Buffer);
2247
2248	uint64_t N;
2249	if (!Signed) {
2250	N = getZExtValue();
2251	} else {
2252	int64_t I = getSExtValue();
2253	if (I >= `0`) {
2254	N = I;
2255	} else {
2256	Str.push_back(Elt: `'-'`);
2257	N = -(uint64_t)I;
2258	}
2259	}
2260
2261	while (*Prefix) {
2262	Str.push_back(Elt: *Prefix);
2263	++Prefix;
2264	};
2265
2266	int Pos = `0`;
2267	while (N) {
2268	if (InsertSeparators && Pos % Grouping == `0` && Pos > `0`)
2269	*--BufPtr = `'\''`;
2270	*--BufPtr = Digits[N % Radix];
2271	N /= Radix;
2272	Pos++;
2273	}
2274	Str.append(in_start: BufPtr, in_end: std::end(arr&: Buffer));
2275	return;
2276	}
2277
2278	APInt Tmp(*this);
2279
2280	if (Signed && isNegative()) {
2281	// They want to print the signed version and it is a negative value
2282	// Flip the bits and add one to turn it into the equivalent positive
2283	// value and put a '-' in the result.
2284	Tmp.negate();
2285	Str.push_back(Elt: `'-'`);
2286	}
2287
2288	while (*Prefix) {
2289	Str.push_back(Elt: *Prefix);
2290	++Prefix;
2291	}
2292
2293	// We insert the digits backward, then reverse them to get the right order.
2294	unsigned StartDig = Str.size();
2295
2296	// For the 2, 8 and 16 bit cases, we can just shift instead of divide
2297	// because the number of bits per digit (1, 3 and 4 respectively) divides
2298	// equally. We just shift until the value is zero.
2299	if (Radix == `2` \|\| Radix == `8` \|\| Radix == `16`) {
2300	// Just shift tmp right for each digit width until it becomes zero
2301	unsigned ShiftAmt = (Radix == `16` ? `4` : (Radix == `8` ? `3` : `1`));
2302	unsigned MaskAmt = Radix - `1`;
2303
2304	int Pos = `0`;
2305	while (Tmp.getBoolValue()) {
2306	unsigned Digit = unsigned(Tmp.getRawData()[`0`]) & MaskAmt;
2307	if (InsertSeparators && Pos % Grouping == `0` && Pos > `0`)
2308	Str.push_back(Elt: `'\''`);
2309
2310	Str.push_back(Elt: Digits[Digit]);
2311	Tmp.lshrInPlace(ShiftAmt);
2312	Pos++;
2313	}
2314	} else {
2315	int Pos = `0`;
2316	while (Tmp.getBoolValue()) {
2317	uint64_t Digit;
2318	udivrem(LHS: Tmp, RHS: Radix, Quotient&: Tmp, Remainder&: Digit);
2319	assert(Digit < Radix && "divide failed");
2320	if (InsertSeparators && Pos % Grouping == `0` && Pos > `0`)
2321	Str.push_back(Elt: `'\''`);
2322
2323	Str.push_back(Elt: Digits[Digit]);
2324	Pos++;
2325	}
2326	}
2327
2328	// Reverse the digits before returning.
2329	std::reverse(first: Str.begin()+StartDig, last: Str.end());
2330	}
2331
2332	#if !defined(NDEBUG) \|\| defined(LLVM_ENABLE_DUMP)
2333	LLVM_DUMP_METHOD void APInt::dump() const {
2334	SmallString<`40`> S, U;
2335	this->toStringUnsigned(U);
2336	this->toStringSigned(S);
2337	dbgs() << "APInt(" << BitWidth << "b, "
2338	<< U << "u " << S << "s)\n";
2339	}
2340	#endif
2341
2342	void APInt::print(raw_ostream &OS, bool isSigned) const {
2343	SmallString<`40`> S;
2344	this->toString(Str&: S, Radix: `10`, Signed: isSigned, / formatAsCLiteral = /false);
2345	OS << S;
2346	}
2347
2348	// This implements a variety of operations on a representation of
2349	// arbitrary precision, two's-complement, bignum integer values.
2350
2351	// Assumed by lowHalf, highHalf, partMSB and partLSB. A fairly safe
2352	// and unrestricting assumption.
2353	static_assert(APInt::APINT_BITS_PER_WORD % `2` == `0`,
2354	"Part width must be divisible by 2!");
2355
2356	// Returns the integer part with the least significant BITS set.
2357	// BITS cannot be zero.
2358	static inline APInt::WordType lowBitMask(unsigned bits) {
2359	assert(bits != `0` && bits <= APInt::APINT_BITS_PER_WORD);
2360	return ~(APInt::WordType) `0` >> (APInt::APINT_BITS_PER_WORD - bits);
2361	}
2362
2363	/// Returns the value of the lower half of PART.
2364	static inline APInt::WordType lowHalf(APInt::WordType part) {
2365	return part & lowBitMask(bits: APInt::APINT_BITS_PER_WORD / `2`);
2366	}
2367
2368	/// Returns the value of the upper half of PART.
2369	static inline APInt::WordType highHalf(APInt::WordType part) {
2370	return part >> (APInt::APINT_BITS_PER_WORD / `2`);
2371	}
2372
2373	/// Sets the least significant part of a bignum to the input value, and zeroes
2374	/// out higher parts.
2375	void APInt::tcSet(WordType dst, WordType part, unsigned* parts) {
2376	assert(parts > `0`);
2377	dst[`0`] = part;
2378	for (unsigned i = `1`; i < parts; i++)
2379	dst[i] = `0`;
2380	}
2381
2382	/// Assign one bignum to another.
2383	void APInt::tcAssign(WordType dst, const* WordType src, unsigned* parts) {
2384	for (unsigned i = `0`; i < parts; i++)
2385	dst[i] = src[i];
2386	}
2387
2388	/// Returns true if a bignum is zero, false otherwise.
2389	bool APInt::tcIsZero(const WordType src, unsigned* parts) {
2390	for (unsigned i = `0`; i < parts; i++)
2391	if (src[i])
2392	return false;
2393
2394	return true;
2395	}
2396
2397	/// Extract the given bit of a bignum; returns 0 or 1.
2398	int APInt::tcExtractBit(const WordType parts, unsigned* bit) {
2399	return (parts[whichWord(bitPosition: bit)] & maskBit(bitPosition: bit)) != `0`;
2400	}
2401
2402	/// Set the given bit of a bignum.
2403	void APInt::tcSetBit(WordType parts, unsigned* bit) {
2404	parts[whichWord(bitPosition: bit)] \|= maskBit(bitPosition: bit);
2405	}
2406
2407	/// Clears the given bit of a bignum.
2408	void APInt::tcClearBit(WordType parts, unsigned* bit) {
2409	parts[whichWord(bitPosition: bit)] &= ~maskBit(bitPosition: bit);
2410	}
2411
2412	/// Returns the bit number of the least significant set bit of a number. If the
2413	/// input number has no bits set UINT_MAX is returned.
2414	unsigned APInt::tcLSB(const WordType parts, unsigned* n) {
2415	for (unsigned i = `0`; i < n; i++) {
2416	if (parts[i] != `0`) {
2417	unsigned lsb = llvm::countr_zero(Val: parts[i]);
2418	return lsb + i * APINT_BITS_PER_WORD;
2419	}
2420	}
2421
2422	return UINT_MAX;
2423	}
2424
2425	/// Returns the bit number of the most significant set bit of a number.
2426	/// If the input number has no bits set UINT_MAX is returned.
2427	unsigned APInt::tcMSB(const WordType parts, unsigned* n) {
2428	do {
2429	--n;
2430
2431	if (parts[n] != `0`) {
2432	static_assert(sizeof(parts[n]) <= sizeof(uint64_t));
2433	unsigned msb = llvm::Log2_64(Value: parts[n]);
2434
2435	return msb + n * APINT_BITS_PER_WORD;
2436	}
2437	} while (n);
2438
2439	return UINT_MAX;
2440	}
2441
2442	/// Copy the bit vector of width srcBITS from SRC, starting at bit srcLSB, to
2443	/// DST, of dstCOUNT parts, such that the bit srcLSB becomes the least
2444	/// significant bit of DST. All high bits above srcBITS in DST are zero-filled.
2445	/// /*
2446	void
2447	APInt::tcExtract(WordType dst, unsigned* dstCount, const WordType *src,
2448	unsigned srcBits, unsigned srcLSB) {
2449	unsigned dstParts = (srcBits + APINT_BITS_PER_WORD - `1`) / APINT_BITS_PER_WORD;
2450	assert(dstParts <= dstCount);
2451
2452	unsigned firstSrcPart = srcLSB / APINT_BITS_PER_WORD;
2453	tcAssign(dst, src: src + firstSrcPart, parts: dstParts);
2454
2455	unsigned shift = srcLSB % APINT_BITS_PER_WORD;
2456	tcShiftRight(dst, Words: dstParts, Count: shift);
2457
2458	// We now have (dstParts APINT_BITS_PER_WORD - shift) bits from SRC*
2459	// in DST. If this is less that srcBits, append the rest, else
2460	// clear the high bits.
2461	unsigned n = dstParts * APINT_BITS_PER_WORD - shift;
2462	if (n < srcBits) {
2463	WordType mask = lowBitMask (bits: srcBits - n);
2464	dst[dstParts - `1`] \|= ((src[firstSrcPart + dstParts] & mask)
2465	<< n % APINT_BITS_PER_WORD);
2466	} else if (n > srcBits) {
2467	if (srcBits % APINT_BITS_PER_WORD)
2468	dst[dstParts - `1`] &= lowBitMask (bits: srcBits % APINT_BITS_PER_WORD);
2469	}
2470
2471	// Clear high parts.
2472	while (dstParts < dstCount)
2473	dst[dstParts++] = `0`;
2474	}
2475
2476	//// DST += RHS + C where C is zero or one. Returns the carry flag.
2477	APInt::WordType APInt::tcAdd(WordType dst, const* WordType *rhs,
2478	WordType c, unsigned parts) {
2479	assert(c <= `1`);
2480
2481	for (unsigned i = `0`; i < parts; i++) {
2482	WordType l = dst[i];
2483	if (c) {
2484	dst[i] += rhs[i] + `1`;
2485	c = (dst[i] <= l);
2486	} else {
2487	dst[i] += rhs[i];
2488	c = (dst[i] < l);
2489	}
2490	}
2491
2492	return c;
2493	}
2494
2495	/// This function adds a single "word" integer, src, to the multiple
2496	/// "word" integer array, dst[]. dst[] is modified to reflect the addition and
2497	/// 1 is returned if there is a carry out, otherwise 0 is returned.
2498	/// @returns the carry of the addition.
2499	APInt::WordType APInt::tcAddPart(WordType *dst, WordType src,
2500	unsigned parts) {
2501	for (unsigned i = `0`; i < parts; ++i) {
2502	dst[i] += src;
2503	if (dst[i] >= src)
2504	return `0`; // No need to carry so exit early.
2505	src = `1`; // Carry one to next digit.
2506	}
2507
2508	return `1`;
2509	}
2510
2511	/// DST -= RHS + C where C is zero or one. Returns the carry flag.
2512	APInt::WordType APInt::tcSubtract(WordType dst, const* WordType *rhs,
2513	WordType c, unsigned parts) {
2514	assert(c <= `1`);
2515
2516	for (unsigned i = `0`; i < parts; i++) {
2517	WordType l = dst[i];
2518	if (c) {
2519	dst[i] -= rhs[i] + `1`;
2520	c = (dst[i] >= l);
2521	} else {
2522	dst[i] -= rhs[i];
2523	c = (dst[i] > l);
2524	}
2525	}
2526
2527	return c;
2528	}
2529
2530	/// This function subtracts a single "word" (64-bit word), src, from
2531	/// the multi-word integer array, dst[], propagating the borrowed 1 value until
2532	/// no further borrowing is needed or it runs out of "words" in dst. The result
2533	/// is 1 if "borrowing" exhausted the digits in dst, or 0 if dst was not
2534	/// exhausted. In other words, if src > dst then this function returns 1,
2535	/// otherwise 0.
2536	/// @returns the borrow out of the subtraction
2537	APInt::WordType APInt::tcSubtractPart(WordType *dst, WordType src,
2538	unsigned parts) {
2539	for (unsigned i = `0`; i < parts; ++i) {
2540	WordType Dst = dst[i];
2541	dst[i] -= src;
2542	if (src <= Dst)
2543	return `0`; // No need to borrow so exit early.
2544	src = `1`; // We have to "borrow 1" from next "word"
2545	}
2546
2547	return `1`;
2548	}
2549
2550	/// Negate a bignum in-place.
2551	void APInt::tcNegate(WordType dst, unsigned* parts) {
2552	tcComplement(dst, parts);
2553	tcIncrement(dst, parts);
2554	}
2555
2556	/// DST += SRC MULTIPLIER + CARRY if add is true*
2557	/// DST = SRC MULTIPLIER + CARRY if add is false*
2558	/// Requires 0 <= DSTPARTS <= SRCPARTS + 1. If DST overlaps SRC
2559	/// they must start at the same point, i.e. DST == SRC.
2560	/// If DSTPARTS == SRCPARTS + 1 no overflow occurs and zero is
2561	/// returned. Otherwise DST is filled with the least significant
2562	/// DSTPARTS parts of the result, and if all of the omitted higher
2563	/// parts were zero return zero, otherwise overflow occurred and
2564	/// return one.
2565	int APInt::tcMultiplyPart(WordType dst, const* WordType *src,
2566	WordType multiplier, WordType carry,
2567	unsigned srcParts, unsigned dstParts,
2568	bool add) {
2569	// Otherwise our writes of DST kill our later reads of SRC.
2570	assert(dst <= src \|\| dst >= src + srcParts);
2571	assert(dstParts <= srcParts + `1`);
2572
2573	// N loops; minimum of dstParts and srcParts.
2574	unsigned n = std::min(a: dstParts, b: srcParts);
2575
2576	for (unsigned i = `0`; i < n; i++) {
2577	// [LOW, HIGH] = MULTIPLIER SRC[i] + DST[i] + CARRY.*
2578	// This cannot overflow, because:
2579	// (n - 1) (n - 1) + 2 (n - 1) = (n - 1) * (n + 1)*
2580	// which is less than n^2.
2581	WordType srcPart = src[i];
2582	WordType low, mid, high;
2583	if (multiplier == `0` \|\| srcPart == `0`) {
2584	low = carry;
2585	high = `0`;
2586	} else {
2587	low = lowHalf(part: srcPart) * lowHalf(part: multiplier);
2588	high = highHalf(part: srcPart) * highHalf(part: multiplier);
2589
2590	mid = lowHalf(part: srcPart) * highHalf(part: multiplier);
2591	high += highHalf(part: mid);
2592	mid <<= APINT_BITS_PER_WORD / `2`;
2593	if (low + mid < low)
2594	high++;
2595	low += mid;
2596
2597	mid = highHalf(part: srcPart) * lowHalf(part: multiplier);
2598	high += highHalf(part: mid);
2599	mid <<= APINT_BITS_PER_WORD / `2`;
2600	if (low + mid < low)
2601	high++;
2602	low += mid;
2603
2604	// Now add carry.
2605	if (low + carry < low)
2606	high++;
2607	low += carry;
2608	}
2609
2610	if (add) {
2611	// And now DST[i], and store the new low part there.
2612	if (low + dst[i] < low)
2613	high++;
2614	dst[i] += low;
2615	} else {
2616	dst[i] = low;
2617	}
2618
2619	carry = high;
2620	}
2621
2622	if (srcParts < dstParts) {
2623	// Full multiplication, there is no overflow.
2624	assert(srcParts + `1` == dstParts);
2625	dst[srcParts] = carry;
2626	return `0`;
2627	}
2628
2629	// We overflowed if there is carry.
2630	if (carry)
2631	return `1`;
2632
2633	// We would overflow if any significant unwritten parts would be
2634	// non-zero. This is true if any remaining src parts are non-zero
2635	// and the multiplier is non-zero.
2636	if (multiplier)
2637	for (unsigned i = dstParts; i < srcParts; i++)
2638	if (src[i])
2639	return `1`;
2640
2641	// We fitted in the narrow destination.
2642	return `0`;
2643	}
2644
2645	/// DST = LHS RHS, where DST has the same width as the operands and*
2646	/// is filled with the least significant parts of the result. Returns
2647	/// one if overflow occurred, otherwise zero. DST must be disjoint
2648	/// from both operands.
2649	int APInt::tcMultiply(WordType dst, const* WordType *lhs,
2650	const WordType rhs, unsigned* parts) {
2651	assert(dst != lhs && dst != rhs);
2652
2653	int overflow = `0`;
2654
2655	for (unsigned i = `0`; i < parts; i++) {
2656	// Don't accumulate on the first iteration so we don't need to initalize
2657	// dst to 0.
2658	overflow \|=
2659	tcMultiplyPart(dst: &dst[i], src: lhs, multiplier: rhs[i], carry: `0`, srcParts: parts, dstParts: parts - i, add: i != `0`);
2660	}
2661
2662	return overflow;
2663	}
2664
2665	/// DST = LHS RHS, where DST has width the sum of the widths of the*
2666	/// operands. No overflow occurs. DST must be disjoint from both operands.
2667	void APInt::tcFullMultiply(WordType dst, const* WordType *lhs,
2668	const WordType rhs, unsigned* lhsParts,
2669	unsigned rhsParts) {
2670	// Put the narrower number on the LHS for less loops below.
2671	if (lhsParts > rhsParts)
2672	return tcFullMultiply (dst, lhs: rhs, rhs: lhs, lhsParts: rhsParts, rhsParts: lhsParts);
2673
2674	assert(dst != lhs && dst != rhs);
2675
2676	for (unsigned i = `0`; i < lhsParts; i++) {
2677	// Don't accumulate on the first iteration so we don't need to initalize
2678	// dst to 0.
2679	tcMultiplyPart(dst: &dst[i], src: rhs, multiplier: lhs[i], carry: `0`, srcParts: rhsParts, dstParts: rhsParts + `1`, add: i != `0`);
2680	}
2681	}
2682
2683	// If RHS is zero LHS and REMAINDER are left unchanged, return one.
2684	// Otherwise set LHS to LHS / RHS with the fractional part discarded,
2685	// set REMAINDER to the remainder, return zero. i.e.
2686	//
2687	// OLD_LHS = RHS LHS + REMAINDER*
2688	//
2689	// SCRATCH is a bignum of the same size as the operands and result for
2690	// use by the routine; its contents need not be initialized and are
2691	// destroyed. LHS, REMAINDER and SCRATCH must be distinct.
2692	int APInt::tcDivide(WordType lhs, const* WordType *rhs,
2693	WordType remainder, WordType srhs,
2694	unsigned parts) {
2695	assert(lhs != remainder && lhs != srhs && remainder != srhs);
2696
2697	unsigned shiftCount = tcMSB(parts: rhs, n: parts) + `1`;
2698	if (shiftCount == `0`)
2699	return true;
2700
2701	shiftCount = parts * APINT_BITS_PER_WORD - shiftCount;
2702	unsigned n = shiftCount / APINT_BITS_PER_WORD;
2703	WordType mask = (WordType) `1` << (shiftCount % APINT_BITS_PER_WORD);
2704
2705	tcAssign(dst: srhs, src: rhs, parts);
2706	tcShiftLeft(srhs, Words: parts, Count: shiftCount);
2707	tcAssign(dst: remainder, src: lhs, parts);
2708	tcSet(dst: lhs, part: `0`, parts);
2709
2710	// Loop, subtracting SRHS if REMAINDER is greater and adding that to the
2711	// total.
2712	for (;;) {
2713	int compare = tcCompare(remainder, srhs, parts);
2714	if (compare >= `0`) {
2715	tcSubtract(dst: remainder, rhs: srhs, c: `0`, parts);
2716	lhs[n] \|= mask;
2717	}
2718
2719	if (shiftCount == `0`)
2720	break;
2721	shiftCount--;
2722	tcShiftRight(srhs, Words: parts, Count: `1`);
2723	if ((mask >>= `1`) == `0`) {
2724	mask = (WordType) `1` << (APINT_BITS_PER_WORD - `1`);
2725	n--;
2726	}
2727	}
2728
2729	return false;
2730	}
2731
2732	/// Shift a bignum left Count bits in-place. Shifted in bits are zero. There are
2733	/// no restrictions on Count.
2734	void APInt::tcShiftLeft(WordType Dst, unsigned* Words, unsigned Count) {
2735	// Don't bother performing a no-op shift.
2736	if (!Count)
2737	return;
2738
2739	// WordShift is the inter-part shift; BitShift is the intra-part shift.
2740	unsigned WordShift = std::min(a: Count / APINT_BITS_PER_WORD, b: Words);
2741	unsigned BitShift = Count % APINT_BITS_PER_WORD;
2742
2743	// Fastpath for moving by whole words.
2744	if (BitShift == `0`) {
2745	std::memmove(dest: Dst + WordShift, src: Dst, n: (Words - WordShift) * APINT_WORD_SIZE);
2746	} else {
2747	while (Words-- > WordShift) {
2748	Dst[Words] = Dst[Words - WordShift] << BitShift;
2749	if (Words > WordShift)
2750	Dst[Words] \|=
2751	Dst[Words - WordShift - `1`] >> (APINT_BITS_PER_WORD - BitShift);
2752	}
2753	}
2754
2755	// Fill in the remainder with 0s.
2756	std::memset(s: Dst, c: `0`, n: WordShift * APINT_WORD_SIZE);
2757	}
2758
2759	/// Shift a bignum right Count bits in-place. Shifted in bits are zero. There
2760	/// are no restrictions on Count.
2761	void APInt::tcShiftRight(WordType Dst, unsigned* Words, unsigned Count) {
2762	// Don't bother performing a no-op shift.
2763	if (!Count)
2764	return;
2765
2766	// WordShift is the inter-part shift; BitShift is the intra-part shift.
2767	unsigned WordShift = std::min(a: Count / APINT_BITS_PER_WORD, b: Words);
2768	unsigned BitShift = Count % APINT_BITS_PER_WORD;
2769
2770	unsigned WordsToMove = Words - WordShift;
2771	// Fastpath for moving by whole words.
2772	if (BitShift == `0`) {
2773	std::memmove(dest: Dst, src: Dst + WordShift, n: WordsToMove * APINT_WORD_SIZE);
2774	} else {
2775	for (unsigned i = `0`; i != WordsToMove; ++i) {
2776	Dst[i] = Dst[i + WordShift] >> BitShift;
2777	if (i + `1` != WordsToMove)
2778	Dst[i] \|= Dst[i + WordShift + `1`] << (APINT_BITS_PER_WORD - BitShift);
2779	}
2780	}
2781
2782	// Fill in the remainder with 0s.
2783	std::memset(s: Dst + WordsToMove, c: `0`, n: WordShift * APINT_WORD_SIZE);
2784	}
2785
2786	// Comparison (unsigned) of two bignums.
2787	int APInt::tcCompare(const WordType lhs, const* WordType *rhs,
2788	unsigned parts) {
2789	while (parts) {
2790	parts--;
2791	if (lhs[parts] != rhs[parts])
2792	return (lhs[parts] > rhs[parts]) ? `1` : -`1`;
2793	}
2794
2795	return `0`;
2796	}
2797
2798	APInt llvm::APIntOps::RoundingUDiv(const APInt &A, const APInt &B,
2799	APInt::Rounding RM) {
2800	// Currently udivrem always rounds down.
2801	switch (RM) {
2802	case APInt::Rounding::DOWN:
2803	case APInt::Rounding::TOWARD_ZERO:
2804	return A.udiv(RHS: B);
2805	case APInt::Rounding::UP: {
2806	APInt Quo, Rem;
2807	APInt::udivrem(LHS: A, RHS: B, Quotient&: Quo, Remainder&: Rem);
2808	if (Rem.isZero())
2809	return Quo;
2810	return Quo + `1`;
2811	}
2812	}
2813	llvm_unreachable("Unknown APInt::Rounding enum");
2814	}
2815
2816	APInt llvm::APIntOps::RoundingSDiv(const APInt &A, const APInt &B,
2817	APInt::Rounding RM) {
2818	switch (RM) {
2819	case APInt::Rounding::DOWN:
2820	case APInt::Rounding::UP: {
2821	APInt Quo, Rem;
2822	APInt::sdivrem(LHS: A, RHS: B, Quotient&: Quo, Remainder&: Rem);
2823	if (Rem.isZero())
2824	return Quo;
2825	// This algorithm deals with arbitrary rounding mode used by sdivrem.
2826	// We want to check whether the non-integer part of the mathematical value
2827	// is negative or not. If the non-integer part is negative, we need to round
2828	// down from Quo; otherwise, if it's positive or 0, we return Quo, as it's
2829	// already rounded down.
2830	if (RM == APInt::Rounding::DOWN) {
2831	if (Rem.isNegative() != B.isNegative())
2832	return Quo - `1`;
2833	return Quo;
2834	}
2835	if (Rem.isNegative() != B.isNegative())
2836	return Quo;
2837	return Quo + `1`;
2838	}
2839	// Currently sdiv rounds towards zero.
2840	case APInt::Rounding::TOWARD_ZERO:
2841	return A.sdiv(RHS: B);
2842	}
2843	llvm_unreachable("Unknown APInt::Rounding enum");
2844	}
2845
2846	std::optional<APInt>
2847	llvm::APIntOps::SolveQuadraticEquationWrap(APInt A, APInt B, APInt C,
2848	unsigned RangeWidth) {
2849	unsigned CoeffWidth = A.getBitWidth();
2850	assert(CoeffWidth == B.getBitWidth() && CoeffWidth == C.getBitWidth());
2851	assert(RangeWidth <= CoeffWidth &&
2852	"Value range width should be less than coefficient width");
2853	assert(RangeWidth > `1` && "Value range bit width should be > 1");
2854
2855	LLVM_DEBUG(dbgs() << __func__ << ": solving " << A << "x^2 + " << B
2856	<< "x + " << C << ", rw:" << RangeWidth << `'\n'`);
2857
2858	// Identify 0 as a (non)solution immediately.
2859	if (C.sextOrTrunc(width: RangeWidth).isZero()) {
2860	LLVM_DEBUG(dbgs() << __func__ << ": zero solution\n");
2861	return APInt (CoeffWidth, `0`);
2862	}
2863
2864	// The result of APInt arithmetic has the same bit width as the operands,
2865	// so it can actually lose high bits. A product of two n-bit integers needs
2866	// 2n-1 bits to represent the full value.
2867	// The operation done below (on quadratic coefficients) that can produce
2868	// the largest value is the evaluation of the equation during bisection,
2869	// which needs 3 times the bitwidth of the coefficient, so the total number
2870	// of required bits is 3n.
2871	//
2872	// The purpose of this extension is to simulate the set Z of all integers,
2873	// where n+1 > n for all n in Z. In Z it makes sense to talk about positive
2874	// and negative numbers (not so much in a modulo arithmetic). The method
2875	// used to solve the equation is based on the standard formula for real
2876	// numbers, and uses the concepts of "positive" and "negative" with their
2877	// usual meanings.
2878	CoeffWidth *= `3`;
2879	A = A.sext(Width: CoeffWidth);
2880	B = B.sext(Width: CoeffWidth);
2881	C = C.sext(Width: CoeffWidth);
2882
2883	// Make A > 0 for simplicity. Negate cannot overflow at this point because
2884	// the bit width has increased.
2885	if (A.isNegative()) {
2886	A.negate();
2887	B.negate();
2888	C.negate();
2889	}
2890
2891	// Solving an equation q(x) = 0 with coefficients in modular arithmetic
2892	// is really solving a set of equations q(x) = kR for k = 0, 1, 2, ...,
2893	// and R = 2^BitWidth.
2894	// Since we're trying not only to find exact solutions, but also values
2895	// that "wrap around", such a set will always have a solution, i.e. an x
2896	// that satisfies at least one of the equations, or such that \|q(x)\|
2897	// exceeds kR, while \|q(x-1)\| for the same k does not.
2898	//
2899	// We need to find a value k, such that Ax^2 + Bx + C = kR will have a
2900	// positive solution n (in the above sense), and also such that the n
2901	// will be the least among all solutions corresponding to k = 0, 1, ...
2902	// (more precisely, the least element in the set
2903	// { n(k) \| k is such that a solution n(k) exists }).
2904	//
2905	// Consider the parabola (over real numbers) that corresponds to the
2906	// quadratic equation. Since A > 0, the arms of the parabola will point
2907	// up. Picking different values of k will shift it up and down by R.
2908	//
2909	// We want to shift the parabola in such a way as to reduce the problem
2910	// of solving q(x) = kR to solving shifted_q(x) = 0.
2911	// (The interesting solutions are the ceilings of the real number
2912	// solutions.)
2913	APInt R = APInt::getOneBitSet(numBits: CoeffWidth, BitNo: RangeWidth);
2914	APInt TwoA = `2` * A;
2915	APInt SqrB = B * B;
2916	bool PickLow;
2917
2918	auto RoundUp = [] (const APInt &V, const APInt &A) -> APInt {
2919	assert(A.isStrictlyPositive());
2920	APInt T = V.abs().urem(RHS: A);
2921	if (T.isZero())
2922	return V;
2923	return V.isNegative() ? V +T : V +(A -T);
2924	};
2925
2926	// The vertex of the parabola is at -B/2A, but since A > 0, it's negative
2927	// iff B is positive.
2928	if (B.isNonNegative()) {
2929	// If B >= 0, the vertex it at a negative location (or at 0), so in
2930	// order to have a non-negative solution we need to pick k that makes
2931	// C-kR negative. To satisfy all the requirements for the solution
2932	// that we are looking for, it needs to be closest to 0 of all k.
2933	C = C.srem(RHS: R);
2934	if (C.isStrictlyPositive())
2935	C -= R;
2936	// Pick the greater solution.
2937	PickLow = false;
2938	} else {
2939	// If B < 0, the vertex is at a positive location. For any solution
2940	// to exist, the discriminant must be non-negative. This means that
2941	// C-kR <= B^2/4A is a necessary condition for k, i.e. there is a
2942	// lower bound on values of k: kR >= C - B^2/4A.
2943	APInt LowkR = C - SqrB.udiv(RHS: `2`TwoA); // udiv because all values > 0.*
2944	// Round LowkR up (towards +inf) to the nearest kR.
2945	LowkR = RoundUp (LowkR, R);
2946
2947	// If there exists k meeting the condition above, and such that
2948	// C-kR > 0, there will be two positive real number solutions of
2949	// q(x) = kR. Out of all such values of k, pick the one that makes
2950	// C-kR closest to 0, (i.e. pick maximum k such that C-kR > 0).
2951	// In other words, find maximum k such that LowkR <= kR < C.
2952	if (C.sgt(RHS: LowkR)) {
2953	// If LowkR < C, then such a k is guaranteed to exist because
2954	// LowkR itself is a multiple of R.
2955	C -= -RoundUp (-C, R); // C = C - RoundDown(C, R)
2956	// Pick the smaller solution.
2957	PickLow = true;
2958	} else {
2959	// If C-kR < 0 for all potential k's, it means that one solution
2960	// will be negative, while the other will be positive. The positive
2961	// solution will shift towards 0 if the parabola is moved up.
2962	// Pick the kR closest to the lower bound (i.e. make C-kR closest
2963	// to 0, or in other words, out of all parabolas that have solutions,
2964	// pick the one that is the farthest "up").
2965	// Since LowkR is itself a multiple of R, simply take C-LowkR.
2966	C -= LowkR;
2967	// Pick the greater solution.
2968	PickLow = false;
2969	}
2970	}
2971
2972	LLVM_DEBUG(dbgs() << __func__ << ": updated coefficients " << A << "x^2 + "
2973	<< B << "x + " << C << ", rw:" << RangeWidth << `'\n'`);
2974
2975	APInt D = SqrB - `4`A C;
2976	assert(D.isNonNegative() && "Negative discriminant");
2977	APInt SQ = D.sqrtFloor();
2978
2979	APInt Q = SQ * SQ;
2980	bool InexactSQ = Q != D;
2981
2982	APInt X;
2983	APInt Rem;
2984
2985	// SQ is rounded down (i.e SQ SQ <= D), so the roots may be inexact.*
2986	// When using the quadratic formula directly, the calculated low root
2987	// may be greater than the exact one, since we would be subtracting SQ.
2988	// To make sure that the calculated root is not greater than the exact
2989	// one, subtract SQ+1 when calculating the low root (for inexact value
2990	// of SQ).
2991	if (PickLow)
2992	APInt::sdivrem(LHS: -B - (SQ +InexactSQ), RHS: TwoA, Quotient&: X, Remainder&: Rem);
2993	else
2994	APInt::sdivrem(LHS: -B + SQ, RHS: TwoA, Quotient&: X, Remainder&: Rem);
2995
2996	// The updated coefficients should be such that the (exact) solution is
2997	// positive. Since APInt division rounds towards 0, the calculated one
2998	// can be 0, but cannot be negative.
2999	assert(X.isNonNegative() && "Solution should be non-negative");
3000
3001	if (!InexactSQ && Rem.isZero()) {
3002	LLVM_DEBUG(dbgs() << __func__ << ": solution (root): " << X << `'\n'`);
3003	return X;
3004	}
3005
3006	assert((SQSQ).sle(D) && "SQ = \|_sqrt(D)_\|, so SQSQ <= D");
3007	// The exact value of the square root of D should be between SQ and SQ+1.
3008	// This implies that the solution should be between that corresponding to
3009	// SQ (i.e. X) and that corresponding to SQ+1.
3010	//
3011	// The calculated X cannot be greater than the exact (real) solution.
3012	// Actually it must be strictly less than the exact solution, while
3013	// X+1 will be greater than or equal to it.
3014
3015	APInt VX = (A X + B)X + C;
3016	APInt VY = VX + TwoA *X + A + B;
3017	bool SignChange =
3018	VX.isNegative() != VY.isNegative() \|\| VX.isZero() != VY.isZero();
3019	// If the sign did not change between X and X+1, X is not a valid solution.
3020	// This could happen when the actual (exact) roots don't have an integer
3021	// between them, so they would both be contained between X and X+1.
3022	if (!SignChange) {
3023	LLVM_DEBUG(dbgs() << __func__ << ": no valid solution\n");
3024	return std::nullopt;
3025	}
3026
3027	X += `1`;
3028	LLVM_DEBUG(dbgs() << __func__ << ": solution (wrap): " << X << `'\n'`);
3029	return X;
3030	}
3031
3032	std::optional<unsigned>
3033	llvm::APIntOps::GetMostSignificantDifferentBit(const APInt &A, const APInt &B) {
3034	assert(A.getBitWidth() == B.getBitWidth() && "Must have the same bitwidth");
3035	if (A == B)
3036	return std::nullopt;
3037	return A.getBitWidth() - ((A ^ B).countl_zero() + `1`);
3038	}
3039
3040	APInt llvm::APIntOps::ScaleBitMask(const APInt &A, unsigned NewBitWidth,
3041	bool MatchAllBits) {
3042	unsigned OldBitWidth = A.getBitWidth();
3043	assert((((OldBitWidth % NewBitWidth) == `0`) \|\|
3044	((NewBitWidth % OldBitWidth) == `0`)) &&
3045	"One size should be a multiple of the other one. "
3046	"Can't do fractional scaling.");
3047
3048	// Check for matching bitwidths.
3049	if (OldBitWidth == NewBitWidth)
3050	return A;
3051
3052	APInt NewA = APInt::getZero(numBits: NewBitWidth);
3053
3054	// Check for null input.
3055	if (A.isZero())
3056	return NewA;
3057
3058	if (NewBitWidth > OldBitWidth) {
3059	// Repeat bits.
3060	unsigned Scale = NewBitWidth / OldBitWidth;
3061	for (unsigned i = `0`; i != OldBitWidth; ++i)
3062	if (A [i])
3063	NewA.setBits(loBit: i * Scale, hiBit: (i + `1`) * Scale);
3064	} else {
3065	unsigned Scale = OldBitWidth / NewBitWidth;
3066	for (unsigned i = `0`; i != NewBitWidth; ++i) {
3067	if (MatchAllBits) {
3068	if (A.extractBits(numBits: Scale, bitPosition: i * Scale).isAllOnes())
3069	NewA.setBit(i);
3070	} else {
3071	if (!A.extractBits(numBits: Scale, bitPosition: i * Scale).isZero())
3072	NewA.setBit(i);
3073	}
3074	}
3075	}
3076
3077	return NewA;
3078	}
3079
3080	/// StoreIntToMemory - Fills the StoreBytes bytes of memory starting from Dst
3081	/// with the integer held in IntVal.
3082	void llvm::StoreIntToMemory(const APInt &IntVal, uint8_t *Dst,
3083	unsigned StoreBytes) {
3084	assert((IntVal.getBitWidth()+`7`)/`8` >= StoreBytes && "Integer too small!");
3085	const uint8_t Src = (const* uint8_t *)IntVal.getRawData();
3086
3087	if (sys::IsLittleEndianHost) {
3088	// Little-endian host - the source is ordered from LSB to MSB. Order the
3089	// destination from LSB to MSB: Do a straight copy.
3090	memcpy(dest: Dst, src: Src, n: StoreBytes);
3091	} else {
3092	// Big-endian host - the source is an array of 64 bit words ordered from
3093	// LSW to MSW. Each word is ordered from MSB to LSB. Order the destination
3094	// from MSB to LSB: Reverse the word order, but not the bytes in a word.
3095	while (StoreBytes > sizeof(uint64_t)) {
3096	StoreBytes -= sizeof(uint64_t);
3097	// May not be aligned so use memcpy.
3098	memcpy(dest: Dst + StoreBytes, src: Src, n: sizeof(uint64_t));
3099	Src += sizeof(uint64_t);
3100	}
3101
3102	memcpy(dest: Dst, src: Src + sizeof(uint64_t) - StoreBytes, n: StoreBytes);
3103	}
3104	}
3105
3106	/// LoadIntFromMemory - Loads the integer stored in the LoadBytes bytes starting
3107	/// from Src into IntVal, which is assumed to be wide enough and to hold zero.
3108	void llvm::LoadIntFromMemory(APInt &IntVal, const uint8_t *Src,
3109	unsigned LoadBytes) {
3110	assert((IntVal.getBitWidth()+`7`)/`8` >= LoadBytes && "Integer too small!");
3111	uint8_t Dst = reinterpret_cast<uint8_t >(
3112	const_cast<uint64_t *>(IntVal.getRawData()));
3113
3114	if (sys::IsLittleEndianHost)
3115	// Little-endian host - the destination must be ordered from LSB to MSB.
3116	// The source is ordered from LSB to MSB: Do a straight copy.
3117	memcpy(dest: Dst, src: Src, n: LoadBytes);
3118	else {
3119	// Big-endian - the destination is an array of 64 bit words ordered from
3120	// LSW to MSW. Each word must be ordered from MSB to LSB. The source is
3121	// ordered from MSB to LSB: Reverse the word order, but not the bytes in
3122	// a word.
3123	while (LoadBytes > sizeof(uint64_t)) {
3124	LoadBytes -= sizeof(uint64_t);
3125	// May not be aligned so use memcpy.
3126	memcpy(dest: Dst, src: Src + LoadBytes, n: sizeof(uint64_t));
3127	Dst += sizeof(uint64_t);
3128	}
3129
3130	memcpy(dest: Dst + sizeof(uint64_t) - LoadBytes, src: Src, n: LoadBytes);
3131	}
3132	}
3133
3134	APInt APIntOps::avgFloorS(const APInt &C1, const APInt &C2) {
3135	// Return floor((C1 + C2) / 2)
3136	return (C1 & C2) + (C1 ^ C2).ashr(ShiftAmt: `1`);
3137	}
3138
3139	APInt APIntOps::avgFloorU(const APInt &C1, const APInt &C2) {
3140	// Return floor((C1 + C2) / 2)
3141	return (C1 & C2) + (C1 ^ C2).lshr(shiftAmt: `1`);
3142	}
3143
3144	APInt APIntOps::avgCeilS(const APInt &C1, const APInt &C2) {
3145	// Return ceil((C1 + C2) / 2)
3146	return (C1 \| C2) - (C1 ^ C2).ashr(ShiftAmt: `1`);
3147	}
3148
3149	APInt APIntOps::avgCeilU(const APInt &C1, const APInt &C2) {
3150	// Return ceil((C1 + C2) / 2)
3151	return (C1 \| C2) - (C1 ^ C2).lshr(shiftAmt: `1`);
3152	}
3153
3154	APInt APIntOps::mulhs(const APInt &C1, const APInt &C2) {
3155	assert(C1.getBitWidth() == C2.getBitWidth() && "Unequal bitwidths");
3156	unsigned FullWidth = C1.getBitWidth() * `2`;
3157	APInt C1Ext = C1.sext(Width: FullWidth);
3158	APInt C2Ext = C2.sext(Width: FullWidth);
3159	return (C1Ext * C2Ext).extractBits(numBits: C1.getBitWidth(), bitPosition: C1.getBitWidth());
3160	}
3161
3162	APInt APIntOps::mulhu(const APInt &C1, const APInt &C2) {
3163	assert(C1.getBitWidth() == C2.getBitWidth() && "Unequal bitwidths");
3164	unsigned FullWidth = C1.getBitWidth() * `2`;
3165	APInt C1Ext = C1.zext(width: FullWidth);
3166	APInt C2Ext = C2.zext(width: FullWidth);
3167	return (C1Ext * C2Ext).extractBits(numBits: C1.getBitWidth(), bitPosition: C1.getBitWidth());
3168	}
3169
3170	APInt APIntOps::mulsExtended(const APInt &C1, const APInt &C2) {
3171	assert(C1.getBitWidth() == C2.getBitWidth() && "Unequal bitwidths");
3172	unsigned FullWidth = C1.getBitWidth() * `2`;
3173	APInt C1Ext = C1.sext(Width: FullWidth);
3174	APInt C2Ext = C2.sext(Width: FullWidth);
3175	return C1Ext * C2Ext;
3176	}
3177
3178	APInt APIntOps::muluExtended(const APInt &C1, const APInt &C2) {
3179	assert(C1.getBitWidth() == C2.getBitWidth() && "Unequal bitwidths");
3180	unsigned FullWidth = C1.getBitWidth() * `2`;
3181	APInt C1Ext = C1.zext(width: FullWidth);
3182	APInt C2Ext = C2.zext(width: FullWidth);
3183	return C1Ext * C2Ext;
3184	}
3185
3186	APInt APIntOps::pow(const APInt &X, int64_t N) {
3187	assert(N >= `0` && "negative exponents not supported.");
3188	APInt Acc = APInt (X.getBitWidth(), `1`);
3189	if (N == `0`)
3190	return Acc;
3191	APInt Base = X;
3192	int64_t RemainingExponent = N;
3193	while (RemainingExponent > `0`) {
3194	while (RemainingExponent % `2` == `0`) {
3195	Base *= Base;
3196	RemainingExponent /= `2`;
3197	}
3198	--RemainingExponent;
3199	Acc *= Base;
3200	}
3201	return Acc;
3202	}
3203
3204	APInt llvm::APIntOps::fshl(const APInt &Hi, const APInt &Lo,
3205	const APInt &Shift) {
3206	assert(Hi.getBitWidth() == Lo.getBitWidth());
3207	unsigned ShiftAmt = rotateModulo(BitWidth: Hi.getBitWidth(), rotateAmt: Shift);
3208	if (ShiftAmt == `0`)
3209	return Hi;
3210	return Hi.shl(shiftAmt: ShiftAmt) \| Lo.lshr(shiftAmt: Hi.getBitWidth() - ShiftAmt);
3211	}
3212
3213	APInt llvm::APIntOps::fshr(const APInt &Hi, const APInt &Lo,
3214	const APInt &Shift) {
3215	assert(Hi.getBitWidth() == Lo.getBitWidth());
3216	unsigned ShiftAmt = rotateModulo(BitWidth: Hi.getBitWidth(), rotateAmt: Shift);
3217	if (ShiftAmt == `0`)
3218	return Lo;
3219	return Hi.shl(shiftAmt: Hi.getBitWidth() - ShiftAmt) \| Lo.lshr(shiftAmt: ShiftAmt);
3220	}
3221
3222	APInt llvm::APIntOps::clmul(const APInt &LHS, const APInt &RHS) {
3223	unsigned BW = LHS.getBitWidth();
3224	assert(BW == RHS.getBitWidth() && "Operand mismatch");
3225	APInt Result(BW, `0`);
3226	for (unsigned I : seq(Size: std::min(a: RHS.getActiveBits(), b: BW - LHS.countr_zero())))
3227	if (RHS [I])
3228	Result ^= LHS << I;
3229	return Result;
3230	}
3231
3232	APInt llvm::APIntOps::clmulr(const APInt &LHS, const APInt &RHS) {
3233	assert(LHS.getBitWidth() == RHS.getBitWidth());
3234	return clmul(LHS: LHS.reverseBits(), RHS: RHS.reverseBits()).reverseBits();
3235	}
3236
3237	APInt llvm::APIntOps::clmulh(const APInt &LHS, const APInt &RHS) {
3238	assert(LHS.getBitWidth() == RHS.getBitWidth());
3239	return clmulr(LHS, RHS).lshr(shiftAmt: `1`);
3240	}
3241
3242	APInt llvm::APIntOps::pext(const APInt &Val, const APInt &Mask) {
3243	unsigned BW = Val.getBitWidth();
3244	assert(BW == Mask.getBitWidth() && "Operand mismatch");
3245	APInt Result = APInt::getZero(numBits: BW);
3246	for (unsigned I = `0`, P = `0`; I != BW; ++I)
3247	if (Mask [I])
3248	Result.setBitVal(BitPosition: P++, BitValue: Val [I]);
3249	return Result;
3250	}
3251
3252	APInt llvm::APIntOps::pdep(const APInt &Val, const APInt &Mask) {
3253	unsigned BW = Val.getBitWidth();
3254	assert(BW == Mask.getBitWidth() && "Operand mismatch");
3255	APInt Result = APInt::getZero(numBits: BW);
3256	for (unsigned I = `0`, P = `0`; I != BW; ++I)
3257	if (Mask [I])
3258	Result.setBitVal(BitPosition: I, BitValue: Val [P++]);
3259	return Result;
3260	}
3261

Browse the source code of llvm_projects/llvm/lib/Support/APInt.cpp