| 1 | //==-- AArch64ISelLowering.h - AArch64 DAG Lowering Interface ----*- C++ -*-==// |
| 2 | // |
| 3 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. |
| 4 | // See https://llvm.org/LICENSE.txt for license information. |
| 5 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception |
| 6 | // |
| 7 | //===----------------------------------------------------------------------===// |
| 8 | // |
| 9 | // This file defines the interfaces that AArch64 uses to lower LLVM code into a |
| 10 | // selection DAG. |
| 11 | // |
| 12 | //===----------------------------------------------------------------------===// |
| 13 | |
| 14 | #ifndef LLVM_LIB_TARGET_AARCH64_AARCH64ISELLOWERING_H |
| 15 | #define LLVM_LIB_TARGET_AARCH64_AARCH64ISELLOWERING_H |
| 16 | |
| 17 | #include "llvm/CodeGen/CallingConvLower.h" |
| 18 | #include "llvm/CodeGen/MachineFunction.h" |
| 19 | #include "llvm/CodeGen/SelectionDAG.h" |
| 20 | #include "llvm/CodeGen/TargetLowering.h" |
| 21 | #include "llvm/IR/CallingConv.h" |
| 22 | #include "llvm/IR/Instruction.h" |
| 23 | |
| 24 | namespace llvm { |
| 25 | |
| 26 | class AArch64TargetMachine; |
| 27 | |
| 28 | namespace AArch64 { |
| 29 | /// Possible values of current rounding mode, which is specified in bits |
| 30 | /// 23:22 of FPCR. |
| 31 | enum Rounding { |
| 32 | RN = 0, // Round to Nearest |
| 33 | RP = 1, // Round towards Plus infinity |
| 34 | RM = 2, // Round towards Minus infinity |
| 35 | RZ = 3, // Round towards Zero |
| 36 | rmMask = 3 // Bit mask selecting rounding mode |
| 37 | }; |
| 38 | |
| 39 | // Bit position of rounding mode bits in FPCR. |
| 40 | const unsigned RoundingBitsPos = 22; |
| 41 | |
| 42 | // Reserved bits should be preserved when modifying FPCR. |
| 43 | const uint64_t ReservedFPControlBits = 0xfffffffff80040f8; |
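| | // For example, the current rounding mode can be read with an expression like |
| | //   (FPCR >> RoundingBitsPos) & rmMask |
| | // which yields one of the Rounding values above; when writing FPCR, all bits |
| | // covered by ReservedFPControlBits must be left unchanged (illustrative note, |
| | // not the lowering code itself). |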
| 44 | |
| 45 | // Registers used to pass function arguments. |
| 46 | ArrayRef<MCPhysReg> getGPRArgRegs(); |
| 47 | ArrayRef<MCPhysReg> getFPRArgRegs(); |
| 48 | |
| 49 | /// Maximum allowed number of unprobed bytes above SP at an ABI |
| 50 | /// boundary. |
| 51 | const unsigned StackProbeMaxUnprobedStack = 1024; |
| 52 | |
| 53 | /// Maximum number of iterations to unroll for a constant size probing loop. |
| 54 | const unsigned StackProbeMaxLoopUnroll = 4; |
| 55 | |
| 56 | } // namespace AArch64 |
| 57 | |
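| | // Address-space numbers used to model mixed-size pointers: PTR32_SPTR and |
| | // PTR32_UPTR are sign- and zero-extended 32-bit pointers (e.g. from the |
| | // __ptr32 extension mentioned in getPointerTy() below), while PTR64 is an |
| | // explicit 64-bit pointer. |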
| 58 | namespace ARM64AS { |
| 59 | enum : unsigned { PTR32_SPTR = 270, PTR32_UPTR = 271, PTR64 = 272 }; |
| 60 | } |
| 61 | |
| 62 | class AArch64Subtarget; |
| 63 | |
| 64 | class AArch64TargetLowering : public TargetLowering { |
| 65 | public: |
| 66 | explicit AArch64TargetLowering(const TargetMachine &TM, |
| 67 | const AArch64Subtarget &STI); |
| 68 | |
| 69 | const AArch64TargetMachine &getTM() const; |
| 70 | |
| 71 | /// Control the following reassociation of operands: (op (op x, c1), y) -> (op |
| 72 | /// (op x, y), c1) where N0 is (op x, c1) and N1 is y. |
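| | /// For example, (add (add x, 42), y) may become (add (add x, y), 42) when |
| | /// this hook reports the reassociation as profitable. |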
| 73 | bool isReassocProfitable(SelectionDAG &DAG, SDValue N0, |
| 74 | SDValue N1) const override; |
| 75 | |
| 76 | /// Selects the correct CCAssignFn for a given CallingConvention value. |
| 77 | CCAssignFn *CCAssignFnForCall(CallingConv::ID CC, bool IsVarArg) const; |
| 78 | |
| 79 | /// Selects the correct CCAssignFn for a given CallingConvention value. |
| 80 | CCAssignFn *CCAssignFnForReturn(CallingConv::ID CC) const; |
| 81 | |
| 82 | /// Determine which of the bits specified in Mask are known to be either zero |
| 83 | /// or one and return them in the KnownZero/KnownOne bitsets. |
| 84 | void computeKnownBitsForTargetNode(const SDValue Op, KnownBits &Known, |
| 85 | const APInt &DemandedElts, |
| 86 | const SelectionDAG &DAG, |
| 87 | unsigned Depth = 0) const override; |
| 88 | |
| 89 | unsigned ComputeNumSignBitsForTargetNode(SDValue Op, |
| 90 | const APInt &DemandedElts, |
| 91 | const SelectionDAG &DAG, |
| 92 | unsigned Depth) const override; |
| 93 | |
| 94 | MVT getPointerTy(const DataLayout &DL, uint32_t AS = 0) const override { |
| 95 | if ((AS == ARM64AS::PTR32_SPTR) || (AS == ARM64AS::PTR32_UPTR)) { |
| 96 | // These are 32-bit pointers created using the `__ptr32` extension or |
| 97 | // similar. They are handled by marking them as being in a different |
| 98 | // address space, and will be extended to 64-bits when used as the target |
| 99 | // of a load or store operation, or cast to a 64-bit pointer type. |
| 100 | return MVT::i32; |
| 101 | } else { |
| 102 | // Returning i64 unconditionally here (i.e. even for ILP32) means that the |
| 103 | // *DAG* representation of pointers will always be 64-bits. They will be |
| 104 | // truncated and extended when transferred to memory, but the 64-bit DAG |
| 105 | // allows us to use AArch64's addressing modes much more easily. |
| 106 | return MVT::i64; |
| 107 | } |
| 108 | } |
| 109 | |
| 110 | unsigned getVectorIdxWidth(const DataLayout &DL) const override { |
| 111 | // The VectorIdx type is i64 under both the standard and ILP32 ABIs. |
| 112 | return 64; |
| 113 | } |
| 114 | |
| 115 | bool targetShrinkDemandedConstant(SDValue Op, const APInt &DemandedBits, |
| 116 | const APInt &DemandedElts, |
| 117 | TargetLoweringOpt &TLO) const override; |
| 118 | |
| 119 | MVT getScalarShiftAmountTy(const DataLayout &DL, EVT) const override; |
| 120 | |
| 121 | /// Returns true if the target allows unaligned memory accesses of the |
| 122 | /// specified type. |
| 123 | bool allowsMisalignedMemoryAccesses( |
| 124 | EVT VT, unsigned AddrSpace = 0, Align Alignment = Align(1), |
| 125 | MachineMemOperand::Flags Flags = MachineMemOperand::MONone, |
| 126 | unsigned *Fast = nullptr) const override; |
| 127 | /// LLT variant. |
| 128 | bool allowsMisalignedMemoryAccesses(LLT Ty, unsigned AddrSpace, |
| 129 | Align Alignment, |
| 130 | MachineMemOperand::Flags Flags, |
| 131 | unsigned *Fast = nullptr) const override; |
| 132 | |
| 133 | /// Provide custom lowering hooks for some operations. |
| 134 | SDValue LowerOperation(SDValue Op, SelectionDAG &DAG) const override; |
| 135 | |
| 136 | SDValue PerformDAGCombine(SDNode *N, DAGCombinerInfo &DCI) const override; |
| 137 | |
| 138 | /// This method returns a target specific FastISel object, or null if the |
| 139 | /// target does not support "fast" ISel. |
| 140 | FastISel * |
| 141 | createFastISel(FunctionLoweringInfo &funcInfo, |
| 142 | const TargetLibraryInfo *libInfo, |
| 143 | const LibcallLoweringInfo *libcallLowering) const override; |
| 144 | |
| 145 | bool isOffsetFoldingLegal(const GlobalAddressSDNode *GA) const override; |
| 146 | |
| 147 | bool isFPImmLegal(const APFloat &Imm, EVT VT, |
| 148 | bool ForCodeSize) const override; |
| 149 | |
| 150 | /// Return true if the given shuffle mask can be codegen'd directly, or if it |
| 151 | /// should be stack expanded. |
| 152 | bool isShuffleMaskLegal(ArrayRef<int> M, EVT VT) const override; |
| 153 | |
| 154 | /// Similar to isShuffleMaskLegal. Return true if the given 'select with zero' |
| 155 | /// shuffle mask can be codegen'd directly. |
| 156 | bool isVectorClearMaskLegal(ArrayRef<int> M, EVT VT) const override; |
| 157 | |
| 158 | /// Return the ISD::SETCC ValueType. |
| 159 | EVT getSetCCResultType(const DataLayout &DL, LLVMContext &Context, |
| 160 | EVT VT) const override; |
| 161 | |
| 162 | SDValue ReconstructShuffle(SDValue Op, SelectionDAG &DAG) const; |
| 163 | |
| 164 | MachineBasicBlock *EmitF128CSEL(MachineInstr &MI, |
| 165 | MachineBasicBlock *BB) const; |
| 166 | |
| 167 | MachineBasicBlock *EmitLoweredCatchRet(MachineInstr &MI, |
| 168 | MachineBasicBlock *BB) const; |
| 169 | |
| 170 | MachineBasicBlock *EmitDynamicProbedAlloc(MachineInstr &MI, |
| 171 | MachineBasicBlock *MBB) const; |
| 172 | |
| 173 | MachineBasicBlock *EmitCheckMatchingVL(MachineInstr &MI, |
| 174 | MachineBasicBlock *MBB) const; |
| 175 | |
| 176 | MachineBasicBlock *EmitTileLoad(unsigned Opc, unsigned BaseReg, |
| 177 | MachineInstr &MI, |
| 178 | MachineBasicBlock *BB) const; |
| 179 | MachineBasicBlock *EmitFill(MachineInstr &MI, MachineBasicBlock *BB) const; |
| 180 | MachineBasicBlock *EmitZAInstr(unsigned Opc, unsigned BaseReg, |
| 181 | MachineInstr &MI, MachineBasicBlock *BB) const; |
| 182 | MachineBasicBlock *EmitZTInstr(MachineInstr &MI, MachineBasicBlock *BB, |
| 183 | unsigned Opcode, bool Op0IsDef) const; |
| 184 | MachineBasicBlock *EmitZero(MachineInstr &MI, MachineBasicBlock *BB) const; |
| 185 | |
| 186 | // Note: The following group of functions are only used as part of the old SME |
| 187 | // ABI lowering. They will be removed once -aarch64-new-sme-abi=true is the |
| 188 | // default. |
| 189 | MachineBasicBlock *EmitInitTPIDR2Object(MachineInstr &MI, |
| 190 | MachineBasicBlock *BB) const; |
| 191 | MachineBasicBlock *EmitAllocateZABuffer(MachineInstr &MI, |
| 192 | MachineBasicBlock *BB) const; |
| 193 | MachineBasicBlock *EmitAllocateSMESaveBuffer(MachineInstr &MI, |
| 194 | MachineBasicBlock *BB) const; |
| 195 | MachineBasicBlock *EmitGetSMESaveSize(MachineInstr &MI, |
| 196 | MachineBasicBlock *BB) const; |
| 197 | MachineBasicBlock *EmitEntryPStateSM(MachineInstr &MI, |
| 198 | MachineBasicBlock *BB) const; |
| 199 | |
| 200 | /// Replace (0, vreg) discriminator components with the operands of blend |
| 201 | /// or with (immediate, NoRegister) when possible. |
| 202 | void fixupPtrauthDiscriminator(MachineInstr &MI, MachineBasicBlock *BB, |
| 203 | MachineOperand &IntDiscOp, |
| 204 | MachineOperand &AddrDiscOp, |
| 205 | const TargetRegisterClass *AddrDiscRC) const; |
| 206 | |
| 207 | MachineBasicBlock * |
| 208 | EmitInstrWithCustomInserter(MachineInstr &MI, |
| 209 | MachineBasicBlock *MBB) const override; |
| 210 | |
| 211 | void getTgtMemIntrinsic(SmallVectorImpl<IntrinsicInfo> &Infos, |
| 212 | const CallBase &I, MachineFunction &MF, |
| 213 | unsigned Intrinsic) const override; |
| 214 | |
| 215 | bool shouldReduceLoadWidth(SDNode *Load, ISD::LoadExtType ExtTy, EVT NewVT, |
| 216 | std::optional<unsigned> ByteOffset) const override; |
| 217 | |
| 218 | bool shouldRemoveRedundantExtend(SDValue Op) const override; |
| 219 | |
| 220 | bool isTruncateFree(Type *Ty1, Type *Ty2) const override; |
| 221 | bool isTruncateFree(EVT VT1, EVT VT2) const override; |
| 222 | |
| 223 | bool isProfitableToHoist(Instruction *I) const override; |
| 224 | |
| 225 | bool isZExtFree(Type *Ty1, Type *Ty2) const override; |
| 226 | bool isZExtFree(EVT VT1, EVT VT2) const override; |
| 227 | bool isZExtFree(SDValue Val, EVT VT2) const override; |
| 228 | |
| 229 | bool optimizeExtendOrTruncateConversion( |
| 230 | Instruction *I, Loop *L, const TargetTransformInfo &TTI) const override; |
| 231 | |
| 232 | bool hasPairedLoad(EVT LoadedType, Align &RequiredAlignment) const override; |
| 233 | |
| 234 | unsigned getMaxSupportedInterleaveFactor() const override { return 4; } |
| 235 | |
| 236 | bool lowerInterleavedLoad(Instruction *Load, Value *Mask, |
| 237 | ArrayRef<ShuffleVectorInst *> Shuffles, |
| 238 | ArrayRef<unsigned> Indices, unsigned Factor, |
| 239 | const APInt &GapMask) const override; |
| 240 | bool lowerInterleavedStore(Instruction *Store, Value *Mask, |
| 241 | ShuffleVectorInst *SVI, unsigned Factor, |
| 242 | const APInt &GapMask) const override; |
| 243 | |
| 244 | bool lowerDeinterleaveIntrinsicToLoad(Instruction *Load, Value *Mask, |
| 245 | IntrinsicInst *DI) const override; |
| 246 | |
| 247 | bool lowerInterleaveIntrinsicToStore( |
| 248 | Instruction *Store, Value *Mask, |
| 249 | ArrayRef<Value *> InterleaveValues) const override; |
| 250 | |
| 251 | bool isLegalAddImmediate(int64_t) const override; |
| 252 | bool isLegalAddScalableImmediate(int64_t) const override; |
| 253 | bool isLegalICmpImmediate(int64_t) const override; |
| 254 | |
| 255 | bool isMulAddWithConstProfitable(SDValue AddNode, |
| 256 | SDValue ConstNode) const override; |
| 257 | |
| 258 | bool shouldConsiderGEPOffsetSplit() const override; |
| 259 | |
| 260 | EVT getOptimalMemOpType(LLVMContext &Context, const MemOp &Op, |
| 261 | const AttributeList &FuncAttributes) const override; |
| 262 | |
| 263 | LLT getOptimalMemOpLLT(const MemOp &Op, |
| 264 | const AttributeList &FuncAttributes) const override; |
| 265 | |
| 266 | bool findOptimalMemOpLowering(LLVMContext &Context, std::vector<EVT> &MemOps, |
| 267 | unsigned Limit, const MemOp &Op, unsigned DstAS, |
| 268 | unsigned SrcAS, |
| 269 | const AttributeList &FuncAttributes, |
| 270 | EVT *LargestVT = nullptr) const override; |
| 271 | |
| 272 | /// Return true if the addressing mode represented by AM is legal for this |
| 273 | /// target, for a load/store of the specified type. |
| 274 | bool isLegalAddressingMode(const DataLayout &DL, const AddrMode &AM, Type *Ty, |
| 275 | unsigned AS, |
| 276 | Instruction *I = nullptr) const override; |
| 277 | |
| 278 | int64_t getPreferredLargeGEPBaseOffset(int64_t MinOffset, |
| 279 | int64_t MaxOffset) const override; |
| 280 | |
| 281 | /// Return true if an FMA operation is faster than a pair of fmul and fadd |
| 282 | /// instructions. fmuladd intrinsics will be expanded to FMAs when this method |
| 283 | /// returns true; otherwise, fmuladd is expanded to fmul + fadd. |
| 284 | bool isFMAFasterThanFMulAndFAdd(const MachineFunction &MF, |
| 285 | EVT VT) const override; |
| 286 | bool isFMAFasterThanFMulAndFAdd(const Function &F, Type *Ty) const override; |
| 287 | |
| 288 | bool generateFMAsInMachineCombiner(EVT VT, |
| 289 | CodeGenOptLevel OptLevel) const override; |
| 290 | |
| 291 | /// Return true if the target has native support for |
| 292 | /// the specified value type and it is 'desirable' to use the type for the |
| 293 | /// given node type. |
| 294 | bool isTypeDesirableForOp(unsigned Opc, EVT VT) const override; |
| 295 | |
| 296 | const MCPhysReg *getScratchRegisters(CallingConv::ID CC) const override; |
| 297 | ArrayRef<MCPhysReg> getRoundingControlRegisters() const override; |
| 298 | |
| 299 | /// Returns false if N is a bit extraction pattern of (X >> C) & Mask. |
| 300 | bool isDesirableToCommuteWithShift(const SDNode *N, |
| 301 | CombineLevel Level) const override; |
| 302 | |
| 303 | bool isDesirableToPullExtFromShl(const MachineInstr &MI) const override { |
| 304 | return false; |
| 305 | } |
| 306 | |
| 307 | /// Returns false if N is a bit extraction pattern of (X >> C) & Mask. |
| 308 | bool isDesirableToCommuteXorWithShift(const SDNode *N) const override; |
| 309 | |
| 310 | /// Return true if it is profitable to fold a pair of shifts into a mask. |
| 311 | bool shouldFoldConstantShiftPairToMask(const SDNode *N) const override; |
| 312 | |
| 313 | /// Return true if folding a mask x & (-1 << y) into the shift pair (x >> y) << y is profitable. |
| 314 | bool shouldFoldMaskToVariableShiftPair(SDValue Y) const override { |
| 315 | EVT VT = Y.getValueType(); |
| 316 | |
| 317 | if (VT.isVector()) |
| 318 | return false; |
| 319 | |
| 320 | return VT.getScalarSizeInBits() <= 64; |
| 321 | } |
| 322 | |
| 323 | bool shouldFoldSelectWithIdentityConstant(unsigned BinOpcode, EVT VT, |
| 324 | unsigned SelectOpcode, SDValue X, |
| 325 | SDValue Y) const override; |
| 326 | |
| 327 | /// Returns true if it is beneficial to convert a load of a constant |
| 328 | /// to just the constant itself. |
| 329 | bool shouldConvertConstantLoadToIntImm(const APInt &Imm, |
| 330 | Type *Ty) const override; |
| 331 | |
| 332 | /// Return true if EXTRACT_SUBVECTOR is cheap for this result type |
| 333 | /// with this index. |
| 334 | bool isExtractSubvectorCheap(EVT ResVT, EVT SrcVT, |
| 335 | unsigned Index) const override; |
| 336 | |
| 337 | bool shouldFormOverflowOp(unsigned Opcode, EVT VT, |
| 338 | bool MathUsed) const override { |
| 339 | // Using overflow ops for overflow checks only should be beneficial on |
| 340 | // AArch64. |
| 341 | return TargetLowering::shouldFormOverflowOp(Opcode, VT, /*MathUsed=*/true); |
| 342 | } |
| 343 | |
| 344 | // Return true if the target wants to optimize the mul overflow intrinsic |
| 345 | // for the given \p VT. |
| 346 | bool shouldOptimizeMulOverflowWithZeroHighBits(LLVMContext &Context, |
| 347 | EVT VT) const override; |
| 348 | |
| 349 | Value *emitLoadLinked(IRBuilderBase &Builder, Type *ValueTy, Value *Addr, |
| 350 | AtomicOrdering Ord) const override; |
| 351 | Value *emitStoreConditional(IRBuilderBase &Builder, Value *Val, Value *Addr, |
| 352 | AtomicOrdering Ord) const override; |
| 353 | |
| 354 | void emitAtomicCmpXchgNoStoreLLBalance(IRBuilderBase &Builder) const override; |
| 355 | |
| 356 | bool isOpSuitableForLDPSTP(const Instruction *I) const; |
| 357 | bool isOpSuitableForLSE128(const Instruction *I) const; |
| 358 | bool isOpSuitableForRCPC3(const Instruction *I) const; |
| 359 | bool shouldInsertFencesForAtomic(const Instruction *I) const override; |
| 360 | bool shouldInsertTrailingSeqCstFenceForAtomicStore( |
| 361 | const Instruction *I) const override; |
| 362 | |
| 363 | TargetLoweringBase::AtomicExpansionKind |
| 364 | shouldExpandAtomicLoadInIR(LoadInst *LI) const override; |
| 365 | TargetLoweringBase::AtomicExpansionKind |
| 366 | shouldExpandAtomicStoreInIR(StoreInst *SI) const override; |
| 367 | TargetLoweringBase::AtomicExpansionKind |
| 368 | shouldExpandAtomicRMWInIR(const AtomicRMWInst *AI) const override; |
| 369 | |
| 370 | TargetLoweringBase::AtomicExpansionKind |
| 371 | shouldExpandAtomicCmpXchgInIR(const AtomicCmpXchgInst *AI) const override; |
| 372 | |
| 373 | bool useLoadStackGuardNode(const Module &M) const override; |
| 374 | TargetLoweringBase::LegalizeTypeAction |
| 375 | getPreferredVectorAction(MVT VT) const override; |
| 376 | |
| 377 | /// If the target has a standard location for the stack protector cookie, |
| 378 | /// returns the address of that location. Otherwise, returns nullptr. |
| 379 | Value *getIRStackGuard(IRBuilderBase &IRB, |
| 380 | const LibcallLoweringInfo &Libcalls) const override; |
| 381 | |
| 382 | void |
| 383 | insertSSPDeclarations(Module &M, |
| 384 | const LibcallLoweringInfo &Libcalls) const override; |
| 385 | |
| 386 | /// If the target has a standard location for the unsafe stack pointer, |
| 387 | /// returns the address of that location. Otherwise, returns nullptr. |
| 388 | Value *getSafeStackPointerLocation( |
| 389 | IRBuilderBase &IRB, const LibcallLoweringInfo &Libcalls) const override; |
| 390 | |
| 391 | /// If a physical register, this returns the register that receives the |
| 392 | /// exception address on entry to an EH pad. |
| 393 | Register |
| 394 | getExceptionPointerRegister(const Constant *PersonalityFn) const override; |
| 395 | |
| 396 | /// If a physical register, this returns the register that receives the |
| 397 | /// exception typeid on entry to a landing pad. |
| 398 | Register |
| 399 | getExceptionSelectorRegister(const Constant *PersonalityFn) const override; |
| 400 | |
| 401 | bool isIntDivCheap(EVT VT, AttributeList Attr) const override; |
| 402 | |
| 403 | bool canMergeStoresTo(unsigned AddressSpace, EVT MemVT, |
| 404 | const MachineFunction &MF) const override; |
| 405 | |
| 406 | bool isCheapToSpeculateCttz(Type *) const override { |
| 407 | return true; |
| 408 | } |
| 409 | |
| 410 | bool isCheapToSpeculateCtlz(Type *) const override { |
| 411 | return true; |
| 412 | } |
| 413 | |
| 414 | bool isMaskAndCmp0FoldingBeneficial(const Instruction &AndI) const override; |
| 415 | |
| 416 | bool hasAndNotCompare(SDValue V) const override { |
| 417 | // We can use bics for any scalar. |
| 418 | return V.getValueType().isScalarInteger(); |
| 419 | } |
| 420 | |
| 421 | bool hasAndNot(SDValue Y) const override { |
| 422 | EVT VT = Y.getValueType(); |
| 423 | |
| 424 | if (!VT.isVector()) |
| 425 | return hasAndNotCompare(Y); |
| 426 | |
| 427 | if (VT.isScalableVector()) |
| 428 | return true; |
| 429 | |
| 430 | return VT.getFixedSizeInBits() >= 64; // vector 'bic' |
| 431 | } |
| 432 | |
| 433 | bool shouldProduceAndByConstByHoistingConstFromShiftsLHSOfAnd( |
| 434 | SDValue X, ConstantSDNode *XC, ConstantSDNode *CC, SDValue Y, |
| 435 | unsigned OldShiftOpcode, unsigned NewShiftOpcode, |
| 436 | SelectionDAG &DAG) const override; |
| 437 | |
| 438 | ShiftLegalizationStrategy |
| 439 | preferredShiftLegalizationStrategy(SelectionDAG &DAG, SDNode *N, |
| 440 | unsigned ExpansionFactor) const override; |
| 441 | |
| 442 | bool shouldTransformSignedTruncationCheck(EVT XVT, |
| 443 | unsigned KeptBits) const override { |
| 444 | // For vectors, we don't have a preference. |
| 445 | if (XVT.isVector()) |
| 446 | return false; |
| 447 | |
| 448 | auto VTIsOk = [](EVT VT) -> bool { |
| 449 | return VT == MVT::i8 || VT == MVT::i16 || VT == MVT::i32 || |
| 450 | VT == MVT::i64; |
| 451 | }; |
| 452 | |
| 453 | // We are ok with KeptBitsVT being byte/word/dword, what SXT supports. |
| 454 | // XVT will be larger than KeptBitsVT. |
| 455 | MVT KeptBitsVT = MVT::getIntegerVT(KeptBits); |
| 456 | return VTIsOk(XVT) && VTIsOk(KeptBitsVT); |
| 457 | } |
| 458 | |
| 459 | bool preferIncOfAddToSubOfNot(EVT VT) const override; |
| 460 | |
| 461 | bool shouldConvertFpToSat(unsigned Op, EVT FPVT, EVT VT) const override; |
| 462 | |
| 463 | bool preferSelectsOverBooleanArithmetic(EVT VT) const override; |
| 464 | |
| 465 | bool isComplexDeinterleavingSupported() const override; |
| 466 | bool isComplexDeinterleavingOperationSupported( |
| 467 | ComplexDeinterleavingOperation Operation, Type *Ty) const override; |
| 468 | |
| 469 | Value *createComplexDeinterleavingIR( |
| 470 | IRBuilderBase &B, ComplexDeinterleavingOperation OperationType, |
| 471 | ComplexDeinterleavingRotation Rotation, Value *InputA, Value *InputB, |
| 472 | Value *Accumulator = nullptr) const override; |
| 473 | |
| 474 | bool supportSplitCSR(MachineFunction *MF) const override { |
| 475 | return MF->getFunction().getCallingConv() == CallingConv::CXX_FAST_TLS && |
| 476 | MF->getFunction().hasFnAttribute(Attribute::NoUnwind); |
| 477 | } |
| 478 | void initializeSplitCSR(MachineBasicBlock *Entry) const override; |
| 479 | void insertCopiesSplitCSR( |
| 480 | MachineBasicBlock *Entry, |
| 481 | const SmallVectorImpl<MachineBasicBlock *> &Exits) const override; |
| 482 | |
| 483 | bool supportSwiftError() const override { |
| 484 | return true; |
| 485 | } |
| 486 | |
| 487 | bool supportPtrAuthBundles() const override { return true; } |
| 488 | |
| 489 | bool supportKCFIBundles() const override { return true; } |
| 490 | |
| 491 | MachineInstr *EmitKCFICheck(MachineBasicBlock &MBB, |
| 492 | MachineBasicBlock::instr_iterator &MBBI, |
| 493 | const TargetInstrInfo *TII) const override; |
| 494 | |
| 495 | bool shallExtractConstSplatVectorElementToStore( |
| 496 | Type *VectorTy, unsigned ElemSizeInBits, unsigned &Index) const override; |
| 497 | |
| 498 | /// Enable aggressive FMA fusion on targets that want it. |
| 499 | bool enableAggressiveFMAFusion(EVT VT) const override; |
| 500 | |
| 501 | bool aggressivelyPreferBuildVectorSources(EVT VecVT) const override { |
| 502 | return true; |
| 503 | } |
| 504 | |
| 505 | /// Returns the size of the platform's va_list object. |
| 506 | unsigned getVaListSizeInBits(const DataLayout &DL) const override; |
| 507 | |
| 508 | /// Returns true if \p VecTy is a legal interleaved access type. This |
| 509 | /// function checks the vector element type and the overall width of the |
| 510 | /// vector. |
| 511 | bool isLegalInterleavedAccessType(VectorType *VecTy, const DataLayout &DL, |
| 512 | bool &UseScalable) const; |
| 513 | |
| 514 | /// Returns the number of interleaved accesses that will be generated when |
| 515 | /// lowering accesses of the given type. |
| 516 | unsigned getNumInterleavedAccesses(VectorType *VecTy, const DataLayout &DL, |
| 517 | bool UseScalable) const; |
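| | // For example, a 256-bit fixed-length vector access is typically split into |
| | // two 128-bit interleaved accesses on a NEON target (illustrative; the exact |
| | // count depends on the element type and on whether SVE lowering is used). |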
| 518 | |
| 519 | MachineMemOperand::Flags getTargetMMOFlags( |
| 520 | const Instruction &I) const override; |
| 521 | |
| 522 | bool functionArgumentNeedsConsecutiveRegisters( |
| 523 | Type *Ty, CallingConv::ID CallConv, bool isVarArg, |
| 524 | const DataLayout &DL) const override; |
| 525 | |
| 526 | /// Used for exception handling on Win64. |
| 527 | bool needsFixedCatchObjects() const override; |
| 528 | |
| 529 | bool fallBackToDAGISel(const Instruction &Inst) const override; |
| 530 | |
| 531 | /// SVE code generation for fixed length vectors does not custom lower |
| 532 | /// BUILD_VECTOR. This makes BUILD_VECTOR legalisation a source of stores to |
| 533 | /// merge. However, merging them creates a BUILD_VECTOR that is just as |
| 534 | /// illegal as the original, thus leading to an infinite legalisation loop. |
| 535 | /// NOTE: Once BUILD_VECTOR is legal or can be custom lowered for all legal |
| 536 | /// vector types this override can be removed. |
| 537 | bool mergeStoresAfterLegalization(EVT VT) const override; |
| 538 | |
| 539 | // If the platform/function should have a redzone, return the size in bytes. |
| 540 | unsigned getRedZoneSize(const Function &F) const { |
| 541 | if (F.hasFnAttribute(Attribute::NoRedZone)) |
| 542 | return 0; |
| 543 | return 128; |
| 544 | } |
| 545 | |
| 546 | bool isAllActivePredicate(SelectionDAG &DAG, SDValue N) const; |
| 547 | EVT getPromotedVTForPredicate(EVT VT) const; |
| 548 | |
| 549 | EVT getAsmOperandValueType(const DataLayout &DL, Type *Ty, |
| 550 | bool AllowUnknown = false) const override; |
| 551 | |
| 552 | bool shouldExpandGetActiveLaneMask(EVT VT, EVT OpVT) const override; |
| 553 | |
| 554 | bool shouldExpandCttzElements(EVT VT) const override; |
| 555 | |
| 556 | bool shouldExpandVectorMatch(EVT VT, unsigned SearchSize) const override; |
| 557 | |
| 558 | /// If a change in streaming mode is required on entry to/return from a |
| 559 | /// function call it emits and returns the corresponding SMSTART or SMSTOP |
| 560 | /// node. \p Condition should be one of the enum values from |
| 561 | /// AArch64SME::ToggleCondition. |
| 562 | SDValue changeStreamingMode(SelectionDAG &DAG, SDLoc DL, bool Enable, |
| 563 | SDValue Chain, SDValue InGlue, unsigned Condition, |
| 564 | bool InsertVectorLengthCheck = false) const; |
| 565 | |
| 566 | bool isVScaleKnownToBeAPowerOfTwo() const override { return true; } |
| 567 | |
| 568 | // Normally SVE is only used for byte size vectors that do not fit within a |
| 569 | // NEON vector. This changes when OverrideNEON is true, allowing SVE to be |
| 570 | // used for 64-bit and 128-bit vectors as well. |
| 571 | bool useSVEForFixedLengthVectorVT(EVT VT, bool OverrideNEON = false) const; |
| 572 | |
| 573 | // Follow NEON ABI rules even when using SVE for fixed length vectors. |
| 574 | MVT getRegisterTypeForCallingConv(LLVMContext &Context, CallingConv::ID CC, |
| 575 | EVT VT) const override; |
| 576 | unsigned getNumRegistersForCallingConv(LLVMContext &Context, |
| 577 | CallingConv::ID CC, |
| 578 | EVT VT) const override; |
| 579 | unsigned getVectorTypeBreakdownForCallingConv(LLVMContext &Context, |
| 580 | CallingConv::ID CC, EVT VT, |
| 581 | EVT &IntermediateVT, |
| 582 | unsigned &NumIntermediates, |
| 583 | MVT &RegisterVT) const override; |
| 584 | |
| 585 | /// True if stack clash protection is enabled for this function. |
| 586 | bool hasInlineStackProbe(const MachineFunction &MF) const override; |
| 587 | |
| 588 | /// In AArch64, true if FEAT_CPA is present. Allows pointer arithmetic |
| 589 | /// semantics to be preserved for instruction selection. |
| 590 | bool shouldPreservePtrArith(const Function &F, EVT PtrVT) const override; |
| 591 | |
| 592 | private: |
| 593 | /// Keep a pointer to the AArch64Subtarget around so that we can |
| 594 | /// make the right decision when generating code for different targets. |
| 595 | const AArch64Subtarget *Subtarget; |
| 596 | |
| 597 | bool isExtFreeImpl(const Instruction *Ext) const override; |
| 598 | |
| 599 | void addTypeForNEON(MVT VT); |
| 600 | void addTypeForFixedLengthSVE(MVT VT); |
| 601 | void addDRType(MVT VT); |
| 602 | void addQRType(MVT VT); |
| 603 | |
| 604 | bool shouldExpandBuildVectorWithShuffles(EVT, unsigned) const override; |
| 605 | |
| 606 | SDValue lowerEHPadEntry(SDValue Chain, SDLoc const &DL, |
| 607 | SelectionDAG &DAG) const override; |
| 608 | |
| 609 | SDValue LowerFormalArguments(SDValue Chain, CallingConv::ID CallConv, |
| 610 | bool isVarArg, |
| 611 | const SmallVectorImpl<ISD::InputArg> &Ins, |
| 612 | const SDLoc &DL, SelectionDAG &DAG, |
| 613 | SmallVectorImpl<SDValue> &InVals) const override; |
| 614 | |
| 615 | void AdjustInstrPostInstrSelection(MachineInstr &MI, |
| 616 | SDNode *Node) const override; |
| 617 | |
| 618 | SDValue LowerCall(CallLoweringInfo & /*CLI*/, |
| 619 | SmallVectorImpl<SDValue> &InVals) const override; |
| 620 | |
| 621 | SDValue LowerCallResult(SDValue Chain, SDValue InGlue, |
| 622 | CallingConv::ID CallConv, bool isVarArg, |
| 623 | const SmallVectorImpl<CCValAssign> &RVLocs, |
| 624 | const SDLoc &DL, SelectionDAG &DAG, |
| 625 | SmallVectorImpl<SDValue> &InVals, bool isThisReturn, |
| 626 | SDValue ThisVal, bool RequiresSMChange) const; |
| 627 | |
| 628 | SDValue LowerLOAD(SDValue Op, SelectionDAG &DAG) const; |
| 629 | SDValue LowerSTORE(SDValue Op, SelectionDAG &DAG) const; |
| 630 | SDValue LowerStore128(SDValue Op, SelectionDAG &DAG) const; |
| 631 | SDValue LowerABS(SDValue Op, SelectionDAG &DAG) const; |
| 632 | SDValue LowerFMUL(SDValue Op, SelectionDAG &DAG) const; |
| 633 | SDValue LowerFMA(SDValue Op, SelectionDAG &DAG) const; |
| 634 | |
| 635 | SDValue LowerMGATHER(SDValue Op, SelectionDAG &DAG) const; |
| 636 | SDValue LowerMSCATTER(SDValue Op, SelectionDAG &DAG) const; |
| 637 | |
| 638 | SDValue LowerMLOAD(SDValue Op, SelectionDAG &DAG) const; |
| 639 | |
| 640 | SDValue LowerVECTOR_COMPRESS(SDValue Op, SelectionDAG &DAG) const; |
| 641 | |
| 642 | SDValue LowerINTRINSIC_W_CHAIN(SDValue Op, SelectionDAG &DAG) const; |
| 643 | SDValue LowerINTRINSIC_WO_CHAIN(SDValue Op, SelectionDAG &DAG) const; |
| 644 | SDValue LowerINTRINSIC_VOID(SDValue Op, SelectionDAG &DAG) const; |
| 645 | |
| 646 | bool |
| 647 | isEligibleForTailCallOptimization(const CallLoweringInfo &CLI) const; |
| 648 | |
| 649 | /// Finds the incoming stack arguments which overlap the given fixed stack |
| 650 | /// object and incorporates their load into the current chain. This prevents |
| 651 | /// an upcoming store from clobbering the stack argument before it's used. |
| 652 | SDValue addTokenForArgument(SDValue Chain, SelectionDAG &DAG, |
| 653 | MachineFrameInfo &MFI, int ClobberedFI) const; |
| 654 | |
| 655 | bool DoesCalleeRestoreStack(CallingConv::ID CallCC, bool TailCallOpt) const; |
| 656 | |
| 657 | void saveVarArgRegisters(CCState &CCInfo, SelectionDAG &DAG, const SDLoc &DL, |
| 658 | SDValue &Chain) const; |
| 659 | |
| 660 | bool CanLowerReturn(CallingConv::ID CallConv, MachineFunction &MF, |
| 661 | bool isVarArg, |
| 662 | const SmallVectorImpl<ISD::OutputArg> &Outs, |
| 663 | LLVMContext &Context, const Type *RetTy) const override; |
| 664 | |
| 665 | SDValue LowerReturn(SDValue Chain, CallingConv::ID CallConv, bool isVarArg, |
| 666 | const SmallVectorImpl<ISD::OutputArg> &Outs, |
| 667 | const SmallVectorImpl<SDValue> &OutVals, const SDLoc &DL, |
| 668 | SelectionDAG &DAG) const override; |
| 669 | |
| 670 | SDValue getTargetNode(GlobalAddressSDNode *N, EVT Ty, SelectionDAG &DAG, |
| 671 | unsigned Flag) const; |
| 672 | SDValue getTargetNode(JumpTableSDNode *N, EVT Ty, SelectionDAG &DAG, |
| 673 | unsigned Flag) const; |
| 674 | SDValue getTargetNode(ConstantPoolSDNode *N, EVT Ty, SelectionDAG &DAG, |
| 675 | unsigned Flag) const; |
| 676 | SDValue getTargetNode(BlockAddressSDNode *N, EVT Ty, SelectionDAG &DAG, |
| 677 | unsigned Flag) const; |
| 678 | SDValue getTargetNode(ExternalSymbolSDNode *N, EVT Ty, SelectionDAG &DAG, |
| 679 | unsigned Flag) const; |
| 680 | template <class NodeTy> |
| 681 | SDValue getGOT(NodeTy *N, SelectionDAG &DAG, unsigned Flags = 0) const; |
| 682 | template <class NodeTy> |
| 683 | SDValue getAddrLarge(NodeTy *N, SelectionDAG &DAG, unsigned Flags = 0) const; |
| 684 | template <class NodeTy> |
| 685 | SDValue getAddr(NodeTy *N, SelectionDAG &DAG, unsigned Flags = 0) const; |
| 686 | template <class NodeTy> |
| 687 | SDValue getAddrTiny(NodeTy *N, SelectionDAG &DAG, unsigned Flags = 0) const; |
| 688 | SDValue LowerADDROFRETURNADDR(SDValue Op, SelectionDAG &DAG) const; |
| 689 | SDValue LowerGlobalAddress(SDValue Op, SelectionDAG &DAG) const; |
| 690 | SDValue LowerGlobalTLSAddress(SDValue Op, SelectionDAG &DAG) const; |
| 691 | SDValue LowerDarwinGlobalTLSAddress(SDValue Op, SelectionDAG &DAG) const; |
| 692 | SDValue LowerELFGlobalTLSAddress(SDValue Op, SelectionDAG &DAG) const; |
| 693 | SDValue LowerELFTLSLocalExec(const GlobalValue *GV, SDValue ThreadBase, |
| 694 | const SDLoc &DL, SelectionDAG &DAG) const; |
| 695 | SDValue LowerELFTLSDescCallSeq(SDValue SymAddr, const SDLoc &DL, |
| 696 | SelectionDAG &DAG) const; |
| 697 | SDValue LowerWindowsGlobalTLSAddress(SDValue Op, SelectionDAG &DAG) const; |
| 698 | SDValue LowerPtrAuthGlobalAddress(SDValue Op, SelectionDAG &DAG) const; |
| 699 | SDValue LowerSETCC(SDValue Op, SelectionDAG &DAG) const; |
| 700 | SDValue LowerSETCCCARRY(SDValue Op, SelectionDAG &DAG) const; |
| 701 | SDValue LowerBR_CC(SDValue Op, SelectionDAG &DAG) const; |
| 702 | SDValue LowerSELECT(SDValue Op, SelectionDAG &DAG) const; |
| 703 | SDValue LowerSELECT_CC(SDValue Op, SelectionDAG &DAG) const; |
| 704 | SDValue LowerSELECT_CC(ISD::CondCode CC, SDValue LHS, SDValue RHS, |
| 705 | SDValue TVal, SDValue FVal, |
| 706 | iterator_range<SDNode::user_iterator> Users, |
| 707 | SDNodeFlags Flags, const SDLoc &dl, |
| 708 | SelectionDAG &DAG) const; |
| 709 | SDValue LowerINIT_TRAMPOLINE(SDValue Op, SelectionDAG &DAG) const; |
| 710 | SDValue LowerADJUST_TRAMPOLINE(SDValue Op, SelectionDAG &DAG) const; |
| 711 | SDValue LowerJumpTable(SDValue Op, SelectionDAG &DAG) const; |
| 712 | SDValue LowerBR_JT(SDValue Op, SelectionDAG &DAG) const; |
| 713 | SDValue LowerBRIND(SDValue Op, SelectionDAG &DAG) const; |
| 714 | SDValue LowerConstantPool(SDValue Op, SelectionDAG &DAG) const; |
| 715 | SDValue LowerBlockAddress(SDValue Op, SelectionDAG &DAG) const; |
| 716 | SDValue LowerAAPCS_VASTART(SDValue Op, SelectionDAG &DAG) const; |
| 717 | SDValue LowerDarwin_VASTART(SDValue Op, SelectionDAG &DAG) const; |
| 718 | SDValue LowerWin64_VASTART(SDValue Op, SelectionDAG &DAG) const; |
| 719 | SDValue LowerVASTART(SDValue Op, SelectionDAG &DAG) const; |
| 720 | SDValue LowerVACOPY(SDValue Op, SelectionDAG &DAG) const; |
| 721 | SDValue LowerVAARG(SDValue Op, SelectionDAG &DAG) const; |
| 722 | SDValue LowerFRAMEADDR(SDValue Op, SelectionDAG &DAG) const; |
| 723 | SDValue LowerSPONENTRY(SDValue Op, SelectionDAG &DAG) const; |
| 724 | SDValue LowerRETURNADDR(SDValue Op, SelectionDAG &DAG) const; |
| 725 | SDValue LowerGET_ROUNDING(SDValue Op, SelectionDAG &DAG) const; |
| 726 | SDValue LowerSET_ROUNDING(SDValue Op, SelectionDAG &DAG) const; |
| 727 | SDValue LowerGET_FPMODE(SDValue Op, SelectionDAG &DAG) const; |
| 728 | SDValue LowerSET_FPMODE(SDValue Op, SelectionDAG &DAG) const; |
| 729 | SDValue LowerRESET_FPMODE(SDValue Op, SelectionDAG &DAG) const; |
| 730 | SDValue LowerINSERT_VECTOR_ELT(SDValue Op, SelectionDAG &DAG) const; |
| 731 | SDValue LowerEXTRACT_VECTOR_ELT(SDValue Op, SelectionDAG &DAG) const; |
| 732 | SDValue LowerBUILD_VECTOR(SDValue Op, SelectionDAG &DAG) const; |
| 733 | SDValue LowerEXTEND_VECTOR_INREG(SDValue Op, SelectionDAG &DAG) const; |
| 734 | SDValue LowerZERO_EXTEND_VECTOR_INREG(SDValue Op, SelectionDAG &DAG) const; |
| 735 | SDValue LowerVECTOR_SHUFFLE(SDValue Op, SelectionDAG &DAG) const; |
| 736 | SDValue LowerSPLAT_VECTOR(SDValue Op, SelectionDAG &DAG) const; |
| 737 | SDValue LowerDUPQLane(SDValue Op, SelectionDAG &DAG) const; |
| 738 | SDValue LowerToPredicatedOp(SDValue Op, SelectionDAG &DAG, |
| 739 | unsigned NewOp) const; |
| 740 | SDValue LowerToScalableOp(SDValue Op, SelectionDAG &DAG) const; |
| 741 | SDValue LowerVECTOR_SPLICE(SDValue Op, SelectionDAG &DAG) const; |
| 742 | SDValue LowerEXTRACT_SUBVECTOR(SDValue Op, SelectionDAG &DAG) const; |
| 743 | SDValue LowerINSERT_SUBVECTOR(SDValue Op, SelectionDAG &DAG) const; |
| 744 | SDValue LowerVECTOR_DEINTERLEAVE(SDValue Op, SelectionDAG &DAG) const; |
| 745 | SDValue LowerVECTOR_INTERLEAVE(SDValue Op, SelectionDAG &DAG) const; |
| 746 | SDValue LowerVECTOR_HISTOGRAM(SDValue Op, SelectionDAG &DAG) const; |
| 747 | SDValue LowerPARTIAL_REDUCE_MLA(SDValue Op, SelectionDAG &DAG) const; |
| 748 | SDValue LowerGET_ACTIVE_LANE_MASK(SDValue Op, SelectionDAG &DAG) const; |
| 749 | SDValue LowerDIV(SDValue Op, SelectionDAG &DAG) const; |
| 750 | SDValue LowerMUL(SDValue Op, SelectionDAG &DAG) const; |
| 751 | SDValue LowerVectorSRA_SRL_SHL(SDValue Op, SelectionDAG &DAG) const; |
| 752 | SDValue LowerShiftParts(SDValue Op, SelectionDAG &DAG) const; |
| 753 | SDValue LowerVSETCC(SDValue Op, SelectionDAG &DAG) const; |
| 754 | SDValue LowerCTPOP_PARITY(SDValue Op, SelectionDAG &DAG) const; |
| 755 | SDValue LowerCTTZ(SDValue Op, SelectionDAG &DAG) const; |
| 756 | SDValue LowerBitreverse(SDValue Op, SelectionDAG &DAG) const; |
| 757 | SDValue LowerMinMax(SDValue Op, SelectionDAG &DAG) const; |
| 758 | SDValue LowerFCOPYSIGN(SDValue Op, SelectionDAG &DAG) const; |
| 759 | SDValue LowerFP_EXTEND(SDValue Op, SelectionDAG &DAG) const; |
| 760 | SDValue LowerFP_ROUND(SDValue Op, SelectionDAG &DAG) const; |
| 761 | SDValue LowerVectorFP_TO_INT(SDValue Op, SelectionDAG &DAG) const; |
| 762 | SDValue LowerVectorFP_TO_INT_SAT(SDValue Op, SelectionDAG &DAG) const; |
| 763 | SDValue LowerFP_TO_INT(SDValue Op, SelectionDAG &DAG) const; |
| 764 | SDValue LowerFP_TO_INT_SAT(SDValue Op, SelectionDAG &DAG) const; |
| 765 | SDValue LowerVectorXRINT(SDValue Op, SelectionDAG &DAG) const; |
| 766 | SDValue LowerINT_TO_FP(SDValue Op, SelectionDAG &DAG) const; |
| 767 | SDValue LowerVectorINT_TO_FP(SDValue Op, SelectionDAG &DAG) const; |
| 768 | SDValue LowerVectorOR(SDValue Op, SelectionDAG &DAG) const; |
| 769 | SDValue LowerXOR(SDValue Op, SelectionDAG &DAG) const; |
| 770 | SDValue LowerCONCAT_VECTORS(SDValue Op, SelectionDAG &DAG) const; |
| 771 | SDValue LowerLOOP_DEPENDENCE_MASK(SDValue Op, SelectionDAG &DAG) const; |
| 772 | SDValue LowerBITCAST(SDValue Op, SelectionDAG &DAG) const; |
| 773 | SDValue LowerVSCALE(SDValue Op, SelectionDAG &DAG) const; |
| 774 | SDValue LowerTRUNCATE(SDValue Op, SelectionDAG &DAG) const; |
| 775 | SDValue LowerVECREDUCE(SDValue Op, SelectionDAG &DAG) const; |
| 776 | SDValue LowerVECREDUCE_MUL(SDValue Op, SelectionDAG &DAG) const; |
| 777 | SDValue LowerATOMIC_LOAD_AND(SDValue Op, SelectionDAG &DAG) const; |
| 778 | SDValue LowerWindowsDYNAMIC_STACKALLOC(SDValue Op, SelectionDAG &DAG) const; |
| 779 | SDValue LowerInlineDYNAMIC_STACKALLOC(SDValue Op, SelectionDAG &DAG) const; |
| 780 | SDValue LowerDYNAMIC_STACKALLOC(SDValue Op, SelectionDAG &DAG) const; |
| 781 | SDValue LowerMSTORE(SDValue Op, SelectionDAG &DAG) const; |
| 782 | |
| 783 | SDValue LowerAVG(SDValue Op, SelectionDAG &DAG, unsigned NewOp) const; |
| 784 | |
| 785 | SDValue LowerFixedLengthVectorIntDivideToSVE(SDValue Op, |
| 786 | SelectionDAG &DAG) const; |
| 787 | SDValue LowerFixedLengthVectorIntExtendToSVE(SDValue Op, |
| 788 | SelectionDAG &DAG) const; |
| 789 | SDValue LowerFixedLengthVectorLoadToSVE(SDValue Op, SelectionDAG &DAG) const; |
| 790 | SDValue LowerFixedLengthVectorMLoadToSVE(SDValue Op, SelectionDAG &DAG) const; |
| 791 | SDValue LowerVECREDUCE_SEQ_FADD(SDValue ScalarOp, SelectionDAG &DAG) const; |
| 792 | SDValue LowerPredReductionToSVE(SDValue ScalarOp, SelectionDAG &DAG) const; |
| 793 | SDValue LowerReductionToSVE(unsigned Opcode, SDValue ScalarOp, |
| 794 | SelectionDAG &DAG) const; |
| 795 | SDValue LowerFixedLengthVectorSelectToSVE(SDValue Op, SelectionDAG &DAG) const; |
| 796 | SDValue LowerFixedLengthVectorSetccToSVE(SDValue Op, SelectionDAG &DAG) const; |
| 797 | SDValue LowerFixedLengthVectorStoreToSVE(SDValue Op, SelectionDAG &DAG) const; |
| 798 | SDValue LowerFixedLengthVectorMStoreToSVE(SDValue Op, |
| 799 | SelectionDAG &DAG) const; |
| 800 | SDValue LowerFixedLengthVectorTruncateToSVE(SDValue Op, |
| 801 | SelectionDAG &DAG) const; |
| 802 | SDValue LowerFixedLengthExtractVectorElt(SDValue Op, SelectionDAG &DAG) const; |
| 803 | SDValue LowerFixedLengthInsertVectorElt(SDValue Op, SelectionDAG &DAG) const; |
| 804 | SDValue LowerFixedLengthBitcastToSVE(SDValue Op, SelectionDAG &DAG) const; |
| 805 | SDValue LowerFixedLengthConcatVectorsToSVE(SDValue Op, |
| 806 | SelectionDAG &DAG) const; |
| 807 | SDValue LowerFixedLengthFPExtendToSVE(SDValue Op, SelectionDAG &DAG) const; |
| 808 | SDValue LowerFixedLengthFPRoundToSVE(SDValue Op, SelectionDAG &DAG) const; |
| 809 | SDValue LowerFixedLengthIntToFPToSVE(SDValue Op, SelectionDAG &DAG) const; |
| 810 | SDValue LowerFixedLengthFPToIntToSVE(SDValue Op, SelectionDAG &DAG) const; |
| 811 | SDValue LowerFixedLengthVECTOR_SHUFFLEToSVE(SDValue Op, |
| 812 | SelectionDAG &DAG) const; |
| 813 | SDValue LowerFixedLengthBuildVectorToSVE(SDValue Op, SelectionDAG &DAG) const; |
| 814 | SDValue LowerFixedLengthVectorCompressToSVE(SDValue Op, |
| 815 | SelectionDAG &DAG) const; |
| 816 | |
| 817 | SDValue BuildSDIVPow2(SDNode *N, const APInt &Divisor, SelectionDAG &DAG, |
| 818 | SmallVectorImpl<SDNode *> &Created) const override; |
| 819 | SDValue BuildSREMPow2(SDNode *N, const APInt &Divisor, SelectionDAG &DAG, |
| 820 | SmallVectorImpl<SDNode *> &Created) const override; |
| 821 | SDValue getSqrtEstimate(SDValue Operand, SelectionDAG &DAG, int Enabled, |
| 822 | int &ExtraSteps, bool &UseOneConst, |
| 823 | bool Reciprocal) const override; |
| 824 | SDValue getRecipEstimate(SDValue Operand, SelectionDAG &DAG, int Enabled, |
| 825 | int &ExtraSteps) const override; |
| 826 | SDValue getSqrtInputTest(SDValue Operand, SelectionDAG &DAG, |
| 827 | const DenormalMode &Mode) const override; |
| 828 | SDValue getSqrtResultForDenormInput(SDValue Operand, |
| 829 | SelectionDAG &DAG) const override; |
| 830 | unsigned combineRepeatedFPDivisors() const override; |
| 831 | |
| 832 | ConstraintType getConstraintType(StringRef Constraint) const override; |
| 833 | Register getRegisterByName(const char* RegName, LLT VT, |
| 834 | const MachineFunction &MF) const override; |
| 835 | |
| 836 | /// Examine constraint string and operand type and determine a weight value. |
| 837 | /// The operand object must already have been set up with the operand type. |
| 838 | ConstraintWeight |
| 839 | getSingleConstraintMatchWeight(AsmOperandInfo &info, |
| 840 | const char *constraint) const override; |
| 841 | |
| 842 | std::pair<unsigned, const TargetRegisterClass *> |
| 843 | getRegForInlineAsmConstraint(const TargetRegisterInfo *TRI, |
| 844 | StringRef Constraint, MVT VT) const override; |
| 845 | |
| 846 | const char *LowerXConstraint(EVT ConstraintVT) const override; |
| 847 | |
| 848 | void LowerAsmOperandForConstraint(SDValue Op, StringRef Constraint, |
| 849 | std::vector<SDValue> &Ops, |
| 850 | SelectionDAG &DAG) const override; |
| 851 | |
| 852 | InlineAsm::ConstraintCode |
| 853 | getInlineAsmMemConstraint(StringRef ConstraintCode) const override { |
| 854 | if (ConstraintCode == "Q") |
| 855 | return InlineAsm::ConstraintCode::Q; |
| 856 | // FIXME: clang has code for 'Ump', 'Utf', 'Usa', and 'Ush' but these are |
| 857 | // followed by llvm_unreachable so we'll leave them unimplemented in |
| 858 | // the backend for now. |
| 859 | return TargetLowering::getInlineAsmMemConstraint(ConstraintCode); |
| 860 | } |
| 861 | |
| 862 | /// Handle Lowering flag assembly outputs. |
| 863 | SDValue LowerAsmOutputForConstraint(SDValue &Chain, SDValue &Flag, |
| 864 | const SDLoc &DL, |
| 865 | const AsmOperandInfo &Constraint, |
| 866 | SelectionDAG &DAG) const override; |
| 867 | |
| 868 | bool shouldExtendGSIndex(EVT VT, EVT &EltTy) const override; |
| 869 | bool shouldRemoveExtendFromGSIndex(SDValue Extend, EVT DataVT) const override; |
| 870 | bool isVectorLoadExtDesirable(SDValue ExtVal) const override; |
| 871 | bool isUsedByReturnOnly(SDNode *N, SDValue &Chain) const override; |
| 872 | bool mayBeEmittedAsTailCall(const CallInst *CI) const override; |
| 873 | bool getIndexedAddressParts(SDNode *N, SDNode *Op, SDValue &Base, |
| 874 | SDValue &Offset, SelectionDAG &DAG) const; |
| 875 | bool getPreIndexedAddressParts(SDNode *N, SDValue &Base, SDValue &Offset, |
| 876 | ISD::MemIndexedMode &AM, |
| 877 | SelectionDAG &DAG) const override; |
| 878 | bool getPostIndexedAddressParts(SDNode *N, SDNode *Op, SDValue &Base, |
| 879 | SDValue &Offset, ISD::MemIndexedMode &AM, |
| 880 | SelectionDAG &DAG) const override; |
| 881 | bool isIndexingLegal(MachineInstr &MI, Register Base, Register Offset, |
| 882 | bool IsPre, MachineRegisterInfo &MRI) const override; |
| 883 | |
| 884 | void ReplaceNodeResults(SDNode *N, SmallVectorImpl<SDValue> &Results, |
| 885 | SelectionDAG &DAG) const override; |
| 886 | void ReplaceBITCASTResults(SDNode *N, SmallVectorImpl<SDValue> &Results, |
| 887 | SelectionDAG &DAG) const; |
| 888 | void ReplaceExtractSubVectorResults(SDNode *N, |
| 889 | SmallVectorImpl<SDValue> &Results, |
| 890 | SelectionDAG &DAG) const; |
| 891 | void ReplaceGetActiveLaneMaskResults(SDNode *N, |
| 892 | SmallVectorImpl<SDValue> &Results, |
| 893 | SelectionDAG &DAG) const; |
| 894 | |
| 895 | bool shouldNormalizeToSelectSequence(LLVMContext &, EVT) const override; |
| 896 | |
| 897 | void finalizeLowering(MachineFunction &MF) const override; |
| 898 | |
| 899 | bool shouldLocalize(const MachineInstr &MI, |
| 900 | const TargetTransformInfo *TTI) const override; |
| 901 | |
| 902 | bool SimplifyDemandedBitsForTargetNode(SDValue Op, |
| 903 | const APInt &OriginalDemandedBits, |
| 904 | const APInt &OriginalDemandedElts, |
| 905 | KnownBits &Known, |
| 906 | TargetLoweringOpt &TLO, |
| 907 | unsigned Depth) const override; |
| 908 | |
| 909 | bool canCreateUndefOrPoisonForTargetNode(SDValue Op, |
| 910 | const APInt &DemandedElts, |
| 911 | const SelectionDAG &DAG, |
| 912 | bool PoisonOnly, bool ConsiderFlags, |
| 913 | unsigned Depth) const override; |
| 914 | |
| 915 | bool isTargetCanonicalConstantNode(SDValue Op) const override; |
| 916 | |
| 917 | // With the exception of data-predicate transitions, no instructions are |
| 918 | // required to cast between legal scalable vector types. However: |
| 919 | // 1. Packed and unpacked types have different bit lengths, meaning BITCAST |
| 920 | // is not universally useable. |
| 921 | // 2. Most unpacked integer types are not legal and thus integer extends |
| 922 | // cannot be used to convert between unpacked and packed types. |
| 923 | // These can make "bitcasting" a multiphase process. REINTERPRET_CAST is used |
| 924 | // to transition between unpacked and packed types of the same element type, |
| 925 | // with BITCAST used otherwise. |
| 926 | // This function does not handle predicate bitcasts. |
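| | // For example, a cast from nxv2f32 (unpacked) to nxv2i64 may be emitted as a |
| | // REINTERPRET_CAST to the packed nxv4f32 followed by a BITCAST to nxv2i64 |
| | // (illustrative sketch of the multiphase process described above). |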
| 927 | SDValue getSVESafeBitCast(EVT VT, SDValue Op, SelectionDAG &DAG) const; |
| 928 | |
| 929 | // Returns the runtime value for PSTATE.SM by generating a call to |
| 930 | // __arm_sme_state. |
| 931 | SDValue getRuntimePStateSM(SelectionDAG &DAG, SDValue Chain, SDLoc DL, |
| 932 | EVT VT) const; |
| 933 | |
| 934 | bool preferScalarizeSplat(SDNode *N) const override; |
| 935 | |
| 936 | unsigned getMinimumJumpTableEntries() const override; |
| 937 | |
| 938 | bool shouldScalarizeBinop(SDValue VecOp) const override { |
| 939 | return VecOp.getOpcode() == ISD::SETCC; |
| 940 | } |
| 941 | |
| 942 | bool hasMultipleConditionRegisters(EVT VT) const override { |
| 943 | return VT.isScalableVector(); |
| 944 | } |
| 945 | }; |
| 946 | |
| 947 | namespace AArch64 { |
| 948 | FastISel *createFastISel(FunctionLoweringInfo &funcInfo, |
| 949 | const TargetLibraryInfo *libInfo, |
| 950 | const LibcallLoweringInfo *libcallLowering); |
| 951 | } // end namespace AArch64 |
| 952 | |
| 953 | } // end namespace llvm |
| 954 | |
| 955 | #endif |
| 956 | |