1//===--- CGCall.cpp - Encapsulate calling convention details --------------===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8//
9// These classes wrap the information about a call or function
10// definition used to handle ABI compliancy.
11//
12//===----------------------------------------------------------------------===//
13
14#include "CGCall.h"
15#include "ABIInfo.h"
16#include "ABIInfoImpl.h"
17#include "CGBlocks.h"
18#include "CGCXXABI.h"
19#include "CGCleanup.h"
20#include "CGDebugInfo.h"
21#include "CGRecordLayout.h"
22#include "CodeGenFunction.h"
23#include "CodeGenModule.h"
24#include "CodeGenPGO.h"
25#include "TargetInfo.h"
26#include "clang/AST/Attr.h"
27#include "clang/AST/Decl.h"
28#include "clang/AST/DeclCXX.h"
29#include "clang/AST/DeclObjC.h"
30#include "clang/AST/RecordLayout.h"
31#include "clang/Basic/CodeGenOptions.h"
32#include "clang/Basic/TargetInfo.h"
33#include "clang/CodeGen/CGFunctionInfo.h"
34#include "clang/CodeGen/SwiftCallingConv.h"
35#include "llvm/ADT/STLExtras.h"
36#include "llvm/ADT/StringExtras.h"
37#include "llvm/Analysis/ValueTracking.h"
38#include "llvm/IR/Assumptions.h"
39#include "llvm/IR/AttributeMask.h"
40#include "llvm/IR/Attributes.h"
41#include "llvm/IR/CallingConv.h"
42#include "llvm/IR/DataLayout.h"
43#include "llvm/IR/DebugInfoMetadata.h"
44#include "llvm/IR/InlineAsm.h"
45#include "llvm/IR/IntrinsicInst.h"
46#include "llvm/IR/Intrinsics.h"
47#include "llvm/IR/Type.h"
48#include "llvm/Transforms/Utils/Local.h"
49#include <optional>
50using namespace clang;
51using namespace CodeGen;
52
53/***/
54
/// Translate a Clang AST calling convention into the matching LLVM IR
/// calling convention. Conventions LLVM has no dedicated lowering for
/// (and any unrecognized value) fall back to the default C convention.
unsigned CodeGenTypes::ClangCallConvToLLVMCallConv(CallingConv CC) {
  switch (CC) {
  default:
    return llvm::CallingConv::C;
  case CC_X86StdCall:
    return llvm::CallingConv::X86_StdCall;
  case CC_X86FastCall:
    return llvm::CallingConv::X86_FastCall;
  case CC_X86RegCall:
    return llvm::CallingConv::X86_RegCall;
  case CC_X86ThisCall:
    return llvm::CallingConv::X86_ThisCall;
  case CC_Win64:
    return llvm::CallingConv::Win64;
  case CC_X86_64SysV:
    return llvm::CallingConv::X86_64_SysV;
  case CC_AAPCS:
    return llvm::CallingConv::ARM_AAPCS;
  case CC_AAPCS_VFP:
    return llvm::CallingConv::ARM_AAPCS_VFP;
  case CC_IntelOclBicc:
    return llvm::CallingConv::Intel_OCL_BI;
  // TODO: Add support for __pascal to LLVM.
  case CC_X86Pascal:
    return llvm::CallingConv::C;
  // TODO: Add support for __vectorcall to LLVM.
  case CC_X86VectorCall:
    return llvm::CallingConv::X86_VectorCall;
  case CC_AArch64VectorCall:
    return llvm::CallingConv::AArch64_VectorCall;
  case CC_AArch64SVEPCS:
    return llvm::CallingConv::AArch64_SVE_VectorCall;
  case CC_SpirFunction:
    return llvm::CallingConv::SPIR_FUNC;
  // Device kernels use whatever convention the target chooses.
  case CC_DeviceKernel:
    return CGM.getTargetCodeGenInfo().getDeviceKernelCallingConv();
  case CC_PreserveMost:
    return llvm::CallingConv::PreserveMost;
  case CC_PreserveAll:
    return llvm::CallingConv::PreserveAll;
  case CC_Swift:
    return llvm::CallingConv::Swift;
  // swiftasynccall lowers to LLVM's tail-callable swifttailcc.
  case CC_SwiftAsync:
    return llvm::CallingConv::SwiftTail;
  case CC_M68kRTD:
    return llvm::CallingConv::M68k_RTD;
  case CC_PreserveNone:
    return llvm::CallingConv::PreserveNone;
  // clang-format off
  case CC_RISCVVectorCall: return llvm::CallingConv::RISCV_VectorCall;
  // clang-format on
  // Expand one case per supported RISC-V VLS ABI_VLEN value.
#define CC_VLS_CASE(ABI_VLEN)                                                  \
  case CC_RISCVVLSCall_##ABI_VLEN:                                             \
    return llvm::CallingConv::RISCV_VLSCall_##ABI_VLEN;
  CC_VLS_CASE(32)
  CC_VLS_CASE(64)
  CC_VLS_CASE(128)
  CC_VLS_CASE(256)
  CC_VLS_CASE(512)
  CC_VLS_CASE(1024)
  CC_VLS_CASE(2048)
  CC_VLS_CASE(4096)
  CC_VLS_CASE(8192)
  CC_VLS_CASE(16384)
  CC_VLS_CASE(32768)
  CC_VLS_CASE(65536)
#undef CC_VLS_CASE
  }
}
124
125/// Derives the 'this' type for codegen purposes, i.e. ignoring method CVR
126/// qualification. Either or both of RD and MD may be null. A null RD indicates
127/// that there is no meaningful 'this' type, and a null MD can occur when
128/// calling a method pointer.
129CanQualType CodeGenTypes::DeriveThisType(const CXXRecordDecl *RD,
130 const CXXMethodDecl *MD) {
131 CanQualType RecTy;
132 if (RD)
133 RecTy = Context.getCanonicalTagType(TD: RD);
134 else
135 RecTy = Context.VoidTy;
136
137 if (MD)
138 RecTy = CanQualType::CreateUnsafe(Other: Context.getAddrSpaceQualType(
139 T: RecTy, AddressSpace: MD->getMethodQualifiers().getAddressSpace()));
140 return Context.getPointerType(T: RecTy);
141}
142
143/// Returns the canonical formal type of the given C++ method.
144static CanQual<FunctionProtoType> GetFormalType(const CXXMethodDecl *MD) {
145 return MD->getType()
146 ->getCanonicalTypeUnqualified()
147 .getAs<FunctionProtoType>();
148}
149
150/// Returns the "extra-canonicalized" return type, which discards
151/// qualifiers on the return type. Codegen doesn't care about them,
152/// and it makes ABI code a little easier to be able to assume that
153/// all parameter and return types are top-level unqualified.
154static CanQualType GetReturnType(QualType RetTy) {
155 return RetTy->getCanonicalTypeUnqualified();
156}
157
158/// Arrange the argument and result information for a value of the given
159/// unprototyped freestanding function type.
160const CGFunctionInfo &
161CodeGenTypes::arrangeFreeFunctionType(CanQual<FunctionNoProtoType> FTNP) {
162 // When translating an unprototyped function type, always use a
163 // variadic type.
164 return arrangeLLVMFunctionInfo(returnType: FTNP->getReturnType().getUnqualifiedType(),
165 opts: FnInfoOpts::None, argTypes: {}, info: FTNP->getExtInfo(), paramInfos: {},
166 args: RequiredArgs(0));
167}
168
169static void addExtParameterInfosForCall(
170 llvm::SmallVectorImpl<FunctionProtoType::ExtParameterInfo> &paramInfos,
171 const FunctionProtoType *proto, unsigned prefixArgs, unsigned totalArgs) {
172 assert(proto->hasExtParameterInfos());
173 assert(paramInfos.size() <= prefixArgs);
174 assert(proto->getNumParams() + prefixArgs <= totalArgs);
175
176 paramInfos.reserve(N: totalArgs);
177
178 // Add default infos for any prefix args that don't already have infos.
179 paramInfos.resize(N: prefixArgs);
180
181 // Add infos for the prototype.
182 for (const auto &ParamInfo : proto->getExtParameterInfos()) {
183 paramInfos.push_back(Elt: ParamInfo);
184 // pass_object_size params have no parameter info.
185 if (ParamInfo.hasPassObjectSize())
186 paramInfos.emplace_back();
187 }
188
189 assert(paramInfos.size() <= totalArgs &&
190 "Did we forget to insert pass_object_size args?");
191 // Add default infos for the variadic and/or suffix arguments.
192 paramInfos.resize(N: totalArgs);
193}
194
195/// Adds the formal parameters in FPT to the given prefix. If any parameter in
196/// FPT has pass_object_size attrs, then we'll add parameters for those, too.
197static void appendParameterTypes(
198 const CodeGenTypes &CGT, SmallVectorImpl<CanQualType> &prefix,
199 SmallVectorImpl<FunctionProtoType::ExtParameterInfo> &paramInfos,
200 CanQual<FunctionProtoType> FPT) {
201 // Fast path: don't touch param info if we don't need to.
202 if (!FPT->hasExtParameterInfos()) {
203 assert(paramInfos.empty() &&
204 "We have paramInfos, but the prototype doesn't?");
205 prefix.append(in_start: FPT->param_type_begin(), in_end: FPT->param_type_end());
206 return;
207 }
208
209 unsigned PrefixSize = prefix.size();
210 // In the vast majority of cases, we'll have precisely FPT->getNumParams()
211 // parameters; the only thing that can change this is the presence of
212 // pass_object_size. So, we preallocate for the common case.
213 prefix.reserve(N: prefix.size() + FPT->getNumParams());
214
215 auto ExtInfos = FPT->getExtParameterInfos();
216 assert(ExtInfos.size() == FPT->getNumParams());
217 for (unsigned I = 0, E = FPT->getNumParams(); I != E; ++I) {
218 prefix.push_back(Elt: FPT->getParamType(i: I));
219 if (ExtInfos[I].hasPassObjectSize())
220 prefix.push_back(Elt: CGT.getContext().getCanonicalSizeType());
221 }
222
223 addExtParameterInfosForCall(paramInfos, proto: FPT.getTypePtr(), prefixArgs: PrefixSize,
224 totalArgs: prefix.size());
225}
226
227using ExtParameterInfoList =
228 SmallVector<FunctionProtoType::ExtParameterInfo, 16>;
229
230/// Arrange the LLVM function layout for a value of the given function
231/// type, on top of any implicit parameters already stored.
232static const CGFunctionInfo &
233arrangeLLVMFunctionInfo(CodeGenTypes &CGT, bool instanceMethod,
234 SmallVectorImpl<CanQualType> &prefix,
235 CanQual<FunctionProtoType> FTP) {
236 ExtParameterInfoList paramInfos;
237 RequiredArgs Required = RequiredArgs::forPrototypePlus(prototype: FTP, additional: prefix.size());
238 appendParameterTypes(CGT, prefix, paramInfos, FPT: FTP);
239 CanQualType resultType = FTP->getReturnType().getUnqualifiedType();
240
241 FnInfoOpts opts =
242 instanceMethod ? FnInfoOpts::IsInstanceMethod : FnInfoOpts::None;
243 return CGT.arrangeLLVMFunctionInfo(returnType: resultType, opts, argTypes: prefix,
244 info: FTP->getExtInfo(), paramInfos, args: Required);
245}
246
247using CanQualTypeList = SmallVector<CanQualType, 16>;
248
249/// Arrange the argument and result information for a value of the
250/// given freestanding function type.
251const CGFunctionInfo &
252CodeGenTypes::arrangeFreeFunctionType(CanQual<FunctionProtoType> FTP) {
253 CanQualTypeList argTypes;
254 return ::arrangeLLVMFunctionInfo(CGT&: *this, /*instanceMethod=*/false, prefix&: argTypes,
255 FTP);
256}
257
/// Determine the Clang calling convention for the given Objective-C method
/// from its attributes. Attributes are checked in a fixed priority order;
/// the first one present wins and CC_C is the fallback.
/// IsTargetDefaultMSABI controls how ms_abi/sysv_abi resolve: the attribute
/// that names the target's native ABI is a no-op (CC_C).
static CallingConv getCallingConventionForDecl(const ObjCMethodDecl *D,
                                               bool IsTargetDefaultMSABI) {
  // Set the appropriate calling convention for the Function.
  if (D->hasAttr<StdCallAttr>())
    return CC_X86StdCall;

  if (D->hasAttr<FastCallAttr>())
    return CC_X86FastCall;

  if (D->hasAttr<RegCallAttr>())
    return CC_X86RegCall;

  if (D->hasAttr<ThisCallAttr>())
    return CC_X86ThisCall;

  if (D->hasAttr<VectorCallAttr>())
    return CC_X86VectorCall;

  if (D->hasAttr<PascalAttr>())
    return CC_X86Pascal;

  // pcs("aapcs") vs pcs("aapcs-vfp").
  if (PcsAttr *PCS = D->getAttr<PcsAttr>())
    return (PCS->getPCS() == PcsAttr::AAPCS ? CC_AAPCS : CC_AAPCS_VFP);

  if (D->hasAttr<AArch64VectorPcsAttr>())
    return CC_AArch64VectorCall;

  if (D->hasAttr<AArch64SVEPcsAttr>())
    return CC_AArch64SVEPCS;

  if (D->hasAttr<DeviceKernelAttr>())
    return CC_DeviceKernel;

  if (D->hasAttr<IntelOclBiccAttr>())
    return CC_IntelOclBicc;

  if (D->hasAttr<MSABIAttr>())
    return IsTargetDefaultMSABI ? CC_C : CC_Win64;

  if (D->hasAttr<SysVABIAttr>())
    return IsTargetDefaultMSABI ? CC_X86_64SysV : CC_C;

  if (D->hasAttr<PreserveMostAttr>())
    return CC_PreserveMost;

  if (D->hasAttr<PreserveAllAttr>())
    return CC_PreserveAll;

  if (D->hasAttr<M68kRTDAttr>())
    return CC_M68kRTD;

  if (D->hasAttr<PreserveNoneAttr>())
    return CC_PreserveNone;

  if (D->hasAttr<RISCVVectorCCAttr>())
    return CC_RISCVVectorCall;

  // riscv_vls_cc(N): select the VLS convention matching the attribute's
  // ABI_VLEN argument.
  if (RISCVVLSCCAttr *PCS = D->getAttr<RISCVVLSCCAttr>()) {
    switch (PCS->getVectorWidth()) {
    default:
      llvm_unreachable("Invalid RISC-V VLS ABI VLEN");
#define CC_VLS_CASE(ABI_VLEN)                                                  \
  case ABI_VLEN:                                                               \
    return CC_RISCVVLSCall_##ABI_VLEN;
      CC_VLS_CASE(32)
      CC_VLS_CASE(64)
      CC_VLS_CASE(128)
      CC_VLS_CASE(256)
      CC_VLS_CASE(512)
      CC_VLS_CASE(1024)
      CC_VLS_CASE(2048)
      CC_VLS_CASE(4096)
      CC_VLS_CASE(8192)
      CC_VLS_CASE(16384)
      CC_VLS_CASE(32768)
      CC_VLS_CASE(65536)
#undef CC_VLS_CASE
    }
  }

  // No convention attribute: use the default C convention.
  return CC_C;
}
340
341/// Arrange the argument and result information for a call to an
342/// unknown C++ non-static member function of the given abstract type.
343/// (A null RD means we don't have any meaningful "this" argument type,
344/// so fall back to a generic pointer type).
345/// The member function must be an ordinary function, i.e. not a
346/// constructor or destructor.
347const CGFunctionInfo &
348CodeGenTypes::arrangeCXXMethodType(const CXXRecordDecl *RD,
349 const FunctionProtoType *FTP,
350 const CXXMethodDecl *MD) {
351 CanQualTypeList argTypes;
352
353 // Add the 'this' pointer.
354 argTypes.push_back(Elt: DeriveThisType(RD, MD));
355
356 return ::arrangeLLVMFunctionInfo(
357 CGT&: *this, /*instanceMethod=*/true, prefix&: argTypes,
358 FTP: FTP->getCanonicalTypeUnqualified().getAs<FunctionProtoType>());
359}
360
361/// Set calling convention for CUDA/HIP kernel.
362static void setCUDAKernelCallingConvention(CanQualType &FTy, CodeGenModule &CGM,
363 const FunctionDecl *FD) {
364 if (FD->hasAttr<CUDAGlobalAttr>()) {
365 const FunctionType *FT = FTy->getAs<FunctionType>();
366 CGM.getTargetCodeGenInfo().setCUDAKernelCallingConvention(FT);
367 FTy = FT->getCanonicalTypeUnqualified();
368 }
369}
370
371/// Arrange the argument and result information for a declaration or
372/// definition of the given C++ non-static member function. The
373/// member function must be an ordinary function, i.e. not a
374/// constructor or destructor.
375const CGFunctionInfo &
376CodeGenTypes::arrangeCXXMethodDeclaration(const CXXMethodDecl *MD) {
377 assert(!isa<CXXConstructorDecl>(MD) && "wrong method for constructors!");
378 assert(!isa<CXXDestructorDecl>(MD) && "wrong method for destructors!");
379
380 CanQualType FT = GetFormalType(MD).getAs<Type>();
381 setCUDAKernelCallingConvention(FTy&: FT, CGM, FD: MD);
382 auto prototype = FT.getAs<FunctionProtoType>();
383
384 if (MD->isImplicitObjectMemberFunction()) {
385 // The abstract case is perfectly fine.
386 const CXXRecordDecl *ThisType =
387 getCXXABI().getThisArgumentTypeForMethod(GD: MD);
388 return arrangeCXXMethodType(RD: ThisType, FTP: prototype.getTypePtr(), MD);
389 }
390
391 return arrangeFreeFunctionType(FTP: prototype);
392}
393
394bool CodeGenTypes::inheritingCtorHasParams(
395 const InheritedConstructor &Inherited, CXXCtorType Type) {
396 // Parameters are unnecessary if we're constructing a base class subobject
397 // and the inherited constructor lives in a virtual base.
398 return Type == Ctor_Complete ||
399 !Inherited.getShadowDecl()->constructsVirtualBase() ||
400 !Target.getCXXABI().hasConstructorVariants();
401}
402
403const CGFunctionInfo &
404CodeGenTypes::arrangeCXXStructorDeclaration(GlobalDecl GD) {
405 auto *MD = cast<CXXMethodDecl>(Val: GD.getDecl());
406
407 CanQualTypeList argTypes;
408 ExtParameterInfoList paramInfos;
409
410 const CXXRecordDecl *ThisType = getCXXABI().getThisArgumentTypeForMethod(GD);
411 argTypes.push_back(Elt: DeriveThisType(RD: ThisType, MD));
412
413 bool PassParams = true;
414
415 if (auto *CD = dyn_cast<CXXConstructorDecl>(Val: MD)) {
416 // A base class inheriting constructor doesn't get forwarded arguments
417 // needed to construct a virtual base (or base class thereof).
418 if (auto Inherited = CD->getInheritedConstructor())
419 PassParams = inheritingCtorHasParams(Inherited, Type: GD.getCtorType());
420 }
421
422 CanQual<FunctionProtoType> FTP = GetFormalType(MD);
423
424 // Add the formal parameters.
425 if (PassParams)
426 appendParameterTypes(CGT: *this, prefix&: argTypes, paramInfos, FPT: FTP);
427
428 CGCXXABI::AddedStructorArgCounts AddedArgs =
429 getCXXABI().buildStructorSignature(GD, ArgTys&: argTypes);
430 if (!paramInfos.empty()) {
431 // Note: prefix implies after the first param.
432 if (AddedArgs.Prefix)
433 paramInfos.insert(I: paramInfos.begin() + 1, NumToInsert: AddedArgs.Prefix,
434 Elt: FunctionProtoType::ExtParameterInfo{});
435 if (AddedArgs.Suffix)
436 paramInfos.append(NumInputs: AddedArgs.Suffix,
437 Elt: FunctionProtoType::ExtParameterInfo{});
438 }
439
440 RequiredArgs required =
441 (PassParams && MD->isVariadic() ? RequiredArgs(argTypes.size())
442 : RequiredArgs::All);
443
444 FunctionType::ExtInfo extInfo = FTP->getExtInfo();
445 CanQualType resultType = getCXXABI().HasThisReturn(GD) ? argTypes.front()
446 : getCXXABI().hasMostDerivedReturn(GD)
447 ? CGM.getContext().VoidPtrTy
448 : Context.VoidTy;
449 return arrangeLLVMFunctionInfo(returnType: resultType, opts: FnInfoOpts::IsInstanceMethod,
450 argTypes, info: extInfo, paramInfos, args: required);
451}
452
453static CanQualTypeList getArgTypesForCall(ASTContext &ctx,
454 const CallArgList &args) {
455 CanQualTypeList argTypes;
456 for (auto &arg : args)
457 argTypes.push_back(Elt: ctx.getCanonicalParamType(T: arg.Ty));
458 return argTypes;
459}
460
461static CanQualTypeList getArgTypesForDeclaration(ASTContext &ctx,
462 const FunctionArgList &args) {
463 CanQualTypeList argTypes;
464 for (auto &arg : args)
465 argTypes.push_back(Elt: ctx.getCanonicalParamType(T: arg->getType()));
466 return argTypes;
467}
468
469static ExtParameterInfoList
470getExtParameterInfosForCall(const FunctionProtoType *proto, unsigned prefixArgs,
471 unsigned totalArgs) {
472 ExtParameterInfoList result;
473 if (proto->hasExtParameterInfos()) {
474 addExtParameterInfosForCall(paramInfos&: result, proto, prefixArgs, totalArgs);
475 }
476 return result;
477}
478
479/// Arrange a call to a C++ method, passing the given arguments.
480///
481/// ExtraPrefixArgs is the number of ABI-specific args passed after the `this`
482/// parameter.
483/// ExtraSuffixArgs is the number of ABI-specific args passed at the end of
484/// args.
485/// PassProtoArgs indicates whether `args` has args for the parameters in the
486/// given CXXConstructorDecl.
487const CGFunctionInfo &CodeGenTypes::arrangeCXXConstructorCall(
488 const CallArgList &args, const CXXConstructorDecl *D, CXXCtorType CtorKind,
489 unsigned ExtraPrefixArgs, unsigned ExtraSuffixArgs, bool PassProtoArgs) {
490 CanQualTypeList ArgTypes;
491 for (const auto &Arg : args)
492 ArgTypes.push_back(Elt: Context.getCanonicalParamType(T: Arg.Ty));
493
494 // +1 for implicit this, which should always be args[0].
495 unsigned TotalPrefixArgs = 1 + ExtraPrefixArgs;
496
497 CanQual<FunctionProtoType> FPT = GetFormalType(MD: D);
498 RequiredArgs Required = PassProtoArgs
499 ? RequiredArgs::forPrototypePlus(
500 prototype: FPT, additional: TotalPrefixArgs + ExtraSuffixArgs)
501 : RequiredArgs::All;
502
503 GlobalDecl GD(D, CtorKind);
504 CanQualType ResultType = getCXXABI().HasThisReturn(GD) ? ArgTypes.front()
505 : getCXXABI().hasMostDerivedReturn(GD)
506 ? CGM.getContext().VoidPtrTy
507 : Context.VoidTy;
508
509 FunctionType::ExtInfo Info = FPT->getExtInfo();
510 ExtParameterInfoList ParamInfos;
511 // If the prototype args are elided, we should only have ABI-specific args,
512 // which never have param info.
513 if (PassProtoArgs && FPT->hasExtParameterInfos()) {
514 // ABI-specific suffix arguments are treated the same as variadic arguments.
515 addExtParameterInfosForCall(paramInfos&: ParamInfos, proto: FPT.getTypePtr(), prefixArgs: TotalPrefixArgs,
516 totalArgs: ArgTypes.size());
517 }
518
519 return arrangeLLVMFunctionInfo(returnType: ResultType, opts: FnInfoOpts::IsInstanceMethod,
520 argTypes: ArgTypes, info: Info, paramInfos: ParamInfos, args: Required);
521}
522
523/// Arrange the argument and result information for the declaration or
524/// definition of the given function.
525const CGFunctionInfo &
526CodeGenTypes::arrangeFunctionDeclaration(const GlobalDecl GD) {
527 const FunctionDecl *FD = cast<FunctionDecl>(Val: GD.getDecl());
528 if (const CXXMethodDecl *MD = dyn_cast<CXXMethodDecl>(Val: FD))
529 if (MD->isImplicitObjectMemberFunction())
530 return arrangeCXXMethodDeclaration(MD);
531
532 CanQualType FTy = FD->getType()->getCanonicalTypeUnqualified();
533
534 assert(isa<FunctionType>(FTy));
535 setCUDAKernelCallingConvention(FTy, CGM, FD);
536
537 if (DeviceKernelAttr::isOpenCLSpelling(A: FD->getAttr<DeviceKernelAttr>()) &&
538 GD.getKernelReferenceKind() == KernelReferenceKind::Stub) {
539 const FunctionType *FT = FTy->getAs<FunctionType>();
540 CGM.getTargetCodeGenInfo().setOCLKernelStubCallingConvention(FT);
541 FTy = FT->getCanonicalTypeUnqualified();
542 }
543
544 // When declaring a function without a prototype, always use a
545 // non-variadic type.
546 if (CanQual<FunctionNoProtoType> noProto = FTy.getAs<FunctionNoProtoType>()) {
547 return arrangeLLVMFunctionInfo(returnType: noProto->getReturnType(), opts: FnInfoOpts::None,
548 argTypes: {}, info: noProto->getExtInfo(), paramInfos: {},
549 args: RequiredArgs::All);
550 }
551
552 return arrangeFreeFunctionType(FTP: FTy.castAs<FunctionProtoType>());
553}
554
555/// Arrange the argument and result information for the declaration or
556/// definition of an Objective-C method.
557const CGFunctionInfo &
558CodeGenTypes::arrangeObjCMethodDeclaration(const ObjCMethodDecl *MD) {
559 // It happens that this is the same as a call with no optional
560 // arguments, except also using the formal 'self' type.
561 return arrangeObjCMessageSendSignature(MD, receiverType: MD->getSelfDecl()->getType());
562}
563
564/// Arrange the argument and result information for the function type
565/// through which to perform a send to the given Objective-C method,
566/// using the given receiver type. The receiver type is not always
567/// the 'self' type of the method or even an Objective-C pointer type.
568/// This is *not* the right method for actually performing such a
569/// message send, due to the possibility of optional arguments.
570const CGFunctionInfo &
571CodeGenTypes::arrangeObjCMessageSendSignature(const ObjCMethodDecl *MD,
572 QualType receiverType) {
573 CanQualTypeList argTys;
574 ExtParameterInfoList extParamInfos(MD->isDirectMethod() ? 1 : 2);
575 argTys.push_back(Elt: Context.getCanonicalParamType(T: receiverType));
576 if (!MD->isDirectMethod())
577 argTys.push_back(Elt: Context.getCanonicalParamType(T: Context.getObjCSelType()));
578 for (const auto *I : MD->parameters()) {
579 argTys.push_back(Elt: Context.getCanonicalParamType(T: I->getType()));
580 auto extParamInfo = FunctionProtoType::ExtParameterInfo().withIsNoEscape(
581 NoEscape: I->hasAttr<NoEscapeAttr>());
582 extParamInfos.push_back(Elt: extParamInfo);
583 }
584
585 FunctionType::ExtInfo einfo;
586 bool IsTargetDefaultMSABI =
587 getContext().getTargetInfo().getTriple().isOSWindows() ||
588 getContext().getTargetInfo().getTriple().isUEFI();
589 einfo = einfo.withCallingConv(
590 cc: getCallingConventionForDecl(D: MD, IsTargetDefaultMSABI));
591
592 if (getContext().getLangOpts().ObjCAutoRefCount &&
593 MD->hasAttr<NSReturnsRetainedAttr>())
594 einfo = einfo.withProducesResult(producesResult: true);
595
596 RequiredArgs required =
597 (MD->isVariadic() ? RequiredArgs(argTys.size()) : RequiredArgs::All);
598
599 return arrangeLLVMFunctionInfo(returnType: GetReturnType(RetTy: MD->getReturnType()),
600 opts: FnInfoOpts::None, argTypes: argTys, info: einfo, paramInfos: extParamInfos,
601 args: required);
602}
603
604const CGFunctionInfo &
605CodeGenTypes::arrangeUnprototypedObjCMessageSend(QualType returnType,
606 const CallArgList &args) {
607 CanQualTypeList argTypes = getArgTypesForCall(ctx&: Context, args);
608 FunctionType::ExtInfo einfo;
609
610 return arrangeLLVMFunctionInfo(returnType: GetReturnType(RetTy: returnType), opts: FnInfoOpts::None,
611 argTypes, info: einfo, paramInfos: {}, args: RequiredArgs::All);
612}
613
614const CGFunctionInfo &CodeGenTypes::arrangeGlobalDeclaration(GlobalDecl GD) {
615 // FIXME: Do we need to handle ObjCMethodDecl?
616 if (isa<CXXConstructorDecl>(Val: GD.getDecl()) ||
617 isa<CXXDestructorDecl>(Val: GD.getDecl()))
618 return arrangeCXXStructorDeclaration(GD);
619
620 return arrangeFunctionDeclaration(GD);
621}
622
623/// Arrange a thunk that takes 'this' as the first parameter followed by
624/// varargs. Return a void pointer, regardless of the actual return type.
625/// The body of the thunk will end in a musttail call to a function of the
626/// correct type, and the caller will bitcast the function to the correct
627/// prototype.
628const CGFunctionInfo &
629CodeGenTypes::arrangeUnprototypedMustTailThunk(const CXXMethodDecl *MD) {
630 assert(MD->isVirtual() && "only methods have thunks");
631 CanQual<FunctionProtoType> FTP = GetFormalType(MD);
632 CanQualType ArgTys[] = {DeriveThisType(RD: MD->getParent(), MD)};
633 return arrangeLLVMFunctionInfo(returnType: Context.VoidTy, opts: FnInfoOpts::None, argTypes: ArgTys,
634 info: FTP->getExtInfo(), paramInfos: {}, args: RequiredArgs(1));
635}
636
637const CGFunctionInfo &
638CodeGenTypes::arrangeMSCtorClosure(const CXXConstructorDecl *CD,
639 CXXCtorType CT) {
640 assert(CT == Ctor_CopyingClosure || CT == Ctor_DefaultClosure);
641
642 CanQual<FunctionProtoType> FTP = GetFormalType(MD: CD);
643 SmallVector<CanQualType, 2> ArgTys;
644 const CXXRecordDecl *RD = CD->getParent();
645 ArgTys.push_back(Elt: DeriveThisType(RD, MD: CD));
646 if (CT == Ctor_CopyingClosure)
647 ArgTys.push_back(Elt: *FTP->param_type_begin());
648 if (RD->getNumVBases() > 0)
649 ArgTys.push_back(Elt: Context.IntTy);
650 CallingConv CC = Context.getDefaultCallingConvention(
651 /*IsVariadic=*/false, /*IsCXXMethod=*/true);
652 return arrangeLLVMFunctionInfo(returnType: Context.VoidTy, opts: FnInfoOpts::IsInstanceMethod,
653 argTypes: ArgTys, info: FunctionType::ExtInfo(CC), paramInfos: {},
654 args: RequiredArgs::All);
655}
656
657/// Arrange a call as unto a free function, except possibly with an
658/// additional number of formal parameters considered required.
659static const CGFunctionInfo &
660arrangeFreeFunctionLikeCall(CodeGenTypes &CGT, CodeGenModule &CGM,
661 const CallArgList &args, const FunctionType *fnType,
662 unsigned numExtraRequiredArgs, bool chainCall) {
663 assert(args.size() >= numExtraRequiredArgs);
664
665 ExtParameterInfoList paramInfos;
666
667 // In most cases, there are no optional arguments.
668 RequiredArgs required = RequiredArgs::All;
669
670 // If we have a variadic prototype, the required arguments are the
671 // extra prefix plus the arguments in the prototype.
672 if (const FunctionProtoType *proto = dyn_cast<FunctionProtoType>(Val: fnType)) {
673 if (proto->isVariadic())
674 required = RequiredArgs::forPrototypePlus(prototype: proto, additional: numExtraRequiredArgs);
675
676 if (proto->hasExtParameterInfos())
677 addExtParameterInfosForCall(paramInfos, proto, prefixArgs: numExtraRequiredArgs,
678 totalArgs: args.size());
679
680 // If we don't have a prototype at all, but we're supposed to
681 // explicitly use the variadic convention for unprototyped calls,
682 // treat all of the arguments as required but preserve the nominal
683 // possibility of variadics.
684 } else if (CGM.getTargetCodeGenInfo().isNoProtoCallVariadic(
685 args, fnType: cast<FunctionNoProtoType>(Val: fnType))) {
686 required = RequiredArgs(args.size());
687 }
688
689 CanQualTypeList argTypes;
690 for (const auto &arg : args)
691 argTypes.push_back(Elt: CGT.getContext().getCanonicalParamType(T: arg.Ty));
692 FnInfoOpts opts = chainCall ? FnInfoOpts::IsChainCall : FnInfoOpts::None;
693 return CGT.arrangeLLVMFunctionInfo(returnType: GetReturnType(RetTy: fnType->getReturnType()),
694 opts, argTypes, info: fnType->getExtInfo(),
695 paramInfos, args: required);
696}
697
698/// Figure out the rules for calling a function with the given formal
699/// type using the given arguments. The arguments are necessary
700/// because the function might be unprototyped, in which case it's
701/// target-dependent in crazy ways.
702const CGFunctionInfo &CodeGenTypes::arrangeFreeFunctionCall(
703 const CallArgList &args, const FunctionType *fnType, bool chainCall) {
704 return arrangeFreeFunctionLikeCall(CGT&: *this, CGM, args, fnType,
705 numExtraRequiredArgs: chainCall ? 1 : 0, chainCall);
706}
707
708/// A block function is essentially a free function with an
709/// extra implicit argument.
710const CGFunctionInfo &
711CodeGenTypes::arrangeBlockFunctionCall(const CallArgList &args,
712 const FunctionType *fnType) {
713 return arrangeFreeFunctionLikeCall(CGT&: *this, CGM, args, fnType, numExtraRequiredArgs: 1,
714 /*chainCall=*/false);
715}
716
717const CGFunctionInfo &
718CodeGenTypes::arrangeBlockFunctionDeclaration(const FunctionProtoType *proto,
719 const FunctionArgList &params) {
720 ExtParameterInfoList paramInfos =
721 getExtParameterInfosForCall(proto, prefixArgs: 1, totalArgs: params.size());
722 CanQualTypeList argTypes = getArgTypesForDeclaration(ctx&: Context, args: params);
723
724 return arrangeLLVMFunctionInfo(returnType: GetReturnType(RetTy: proto->getReturnType()),
725 opts: FnInfoOpts::None, argTypes,
726 info: proto->getExtInfo(), paramInfos,
727 args: RequiredArgs::forPrototypePlus(prototype: proto, additional: 1));
728}
729
730const CGFunctionInfo &
731CodeGenTypes::arrangeBuiltinFunctionCall(QualType resultType,
732 const CallArgList &args) {
733 CanQualTypeList argTypes;
734 for (const auto &Arg : args)
735 argTypes.push_back(Elt: Context.getCanonicalParamType(T: Arg.Ty));
736 return arrangeLLVMFunctionInfo(returnType: GetReturnType(RetTy: resultType), opts: FnInfoOpts::None,
737 argTypes, info: FunctionType::ExtInfo(),
738 /*paramInfos=*/{}, args: RequiredArgs::All);
739}
740
741const CGFunctionInfo &
742CodeGenTypes::arrangeBuiltinFunctionDeclaration(QualType resultType,
743 const FunctionArgList &args) {
744 CanQualTypeList argTypes = getArgTypesForDeclaration(ctx&: Context, args);
745
746 return arrangeLLVMFunctionInfo(returnType: GetReturnType(RetTy: resultType), opts: FnInfoOpts::None,
747 argTypes, info: FunctionType::ExtInfo(), paramInfos: {},
748 args: RequiredArgs::All);
749}
750
751const CGFunctionInfo &CodeGenTypes::arrangeBuiltinFunctionDeclaration(
752 CanQualType resultType, ArrayRef<CanQualType> argTypes) {
753 return arrangeLLVMFunctionInfo(returnType: resultType, opts: FnInfoOpts::None, argTypes,
754 info: FunctionType::ExtInfo(), paramInfos: {},
755 args: RequiredArgs::All);
756}
757
758const CGFunctionInfo &CodeGenTypes::arrangeDeviceKernelCallerDeclaration(
759 QualType resultType, const FunctionArgList &args) {
760 CanQualTypeList argTypes = getArgTypesForDeclaration(ctx&: Context, args);
761
762 return arrangeLLVMFunctionInfo(returnType: GetReturnType(RetTy: resultType), opts: FnInfoOpts::None,
763 argTypes,
764 info: FunctionType::ExtInfo(CC_DeviceKernel),
765 /*paramInfos=*/{}, args: RequiredArgs::All);
766}
767
768/// Arrange a call to a C++ method, passing the given arguments.
769///
770/// numPrefixArgs is the number of ABI-specific prefix arguments we have. It
771/// does not count `this`.
772const CGFunctionInfo &CodeGenTypes::arrangeCXXMethodCall(
773 const CallArgList &args, const FunctionProtoType *proto,
774 RequiredArgs required, unsigned numPrefixArgs) {
775 assert(numPrefixArgs + 1 <= args.size() &&
776 "Emitting a call with less args than the required prefix?");
777 // Add one to account for `this`. It's a bit awkward here, but we don't count
778 // `this` in similar places elsewhere.
779 ExtParameterInfoList paramInfos =
780 getExtParameterInfosForCall(proto, prefixArgs: numPrefixArgs + 1, totalArgs: args.size());
781
782 CanQualTypeList argTypes = getArgTypesForCall(ctx&: Context, args);
783
784 FunctionType::ExtInfo info = proto->getExtInfo();
785 return arrangeLLVMFunctionInfo(returnType: GetReturnType(RetTy: proto->getReturnType()),
786 opts: FnInfoOpts::IsInstanceMethod, argTypes, info,
787 paramInfos, args: required);
788}
789
790const CGFunctionInfo &CodeGenTypes::arrangeNullaryFunction() {
791 return arrangeLLVMFunctionInfo(returnType: getContext().VoidTy, opts: FnInfoOpts::None, argTypes: {},
792 info: FunctionType::ExtInfo(), paramInfos: {},
793 args: RequiredArgs::All);
794}
795
796const CGFunctionInfo &CodeGenTypes::arrangeCall(const CGFunctionInfo &signature,
797 const CallArgList &args) {
798 assert(signature.arg_size() <= args.size());
799 if (signature.arg_size() == args.size())
800 return signature;
801
802 ExtParameterInfoList paramInfos;
803 auto sigParamInfos = signature.getExtParameterInfos();
804 if (!sigParamInfos.empty()) {
805 paramInfos.append(in_start: sigParamInfos.begin(), in_end: sigParamInfos.end());
806 paramInfos.resize(N: args.size());
807 }
808
809 CanQualTypeList argTypes = getArgTypesForCall(ctx&: Context, args);
810
811 assert(signature.getRequiredArgs().allowsOptionalArgs());
812 FnInfoOpts opts = FnInfoOpts::None;
813 if (signature.isInstanceMethod())
814 opts |= FnInfoOpts::IsInstanceMethod;
815 if (signature.isChainCall())
816 opts |= FnInfoOpts::IsChainCall;
817 if (signature.isDelegateCall())
818 opts |= FnInfoOpts::IsDelegateCall;
819 return arrangeLLVMFunctionInfo(returnType: signature.getReturnType(), opts, argTypes,
820 info: signature.getExtInfo(), paramInfos,
821 args: signature.getRequiredArgs());
822}
823
namespace clang {
namespace CodeGen {
// Forward declaration; the definition lives with the SPIR/SPIR-V target
// lowering code rather than in this file.
void computeSPIRKernelABIInfo(CodeGenModule &CGM, CGFunctionInfo &FI);
} // namespace CodeGen
} // namespace clang
829
/// Arrange the argument and result information for an abstract value
/// of a given function type. This is the method which all of the
/// above functions ultimately defer to.
///
/// Results are uniqued in the FunctionInfos folding set, so repeated
/// requests for the same signature return the same CGFunctionInfo.
const CGFunctionInfo &CodeGenTypes::arrangeLLVMFunctionInfo(
    CanQualType resultType, FnInfoOpts opts, ArrayRef<CanQualType> argTypes,
    FunctionType::ExtInfo info,
    ArrayRef<FunctionProtoType::ExtParameterInfo> paramInfos,
    RequiredArgs required) {
  assert(llvm::all_of(argTypes,
                      [](CanQualType T) { return T.isCanonicalAsParam(); }));

  // Lookup or create unique function info.
  llvm::FoldingSetNodeID ID;
  // Decompose the option bitmask into the individual flags used both for
  // profiling and for constructing the node.
  bool isInstanceMethod =
      (opts & FnInfoOpts::IsInstanceMethod) == FnInfoOpts::IsInstanceMethod;
  bool isChainCall =
      (opts & FnInfoOpts::IsChainCall) == FnInfoOpts::IsChainCall;
  bool isDelegateCall =
      (opts & FnInfoOpts::IsDelegateCall) == FnInfoOpts::IsDelegateCall;
  CGFunctionInfo::Profile(ID, InstanceMethod: isInstanceMethod, ChainCall: isChainCall, IsDelegateCall: isDelegateCall,
                          info, paramInfos, required, resultType, argTypes);

  void *insertPos = nullptr;
  CGFunctionInfo *FI = FunctionInfos.FindNodeOrInsertPos(ID, InsertPos&: insertPos);
  if (FI)
    return *FI;

  unsigned CC = ClangCallConvToLLVMCallConv(CC: info.getCC());

  // Construct the function info. We co-allocate the ArgInfos.
  FI = CGFunctionInfo::create(llvmCC: CC, instanceMethod: isInstanceMethod, chainCall: isChainCall, delegateCall: isDelegateCall,
                              extInfo: info, paramInfos, resultType, argTypes, required);
  // Insert before computing ABI info, so a recursive request for the same
  // signature finds this node instead of recursing forever.
  FunctionInfos.InsertNode(N: FI, InsertPos: insertPos);

  bool inserted = FunctionsBeingProcessed.insert(Ptr: FI).second;
  (void)inserted;
  assert(inserted && "Recursively being processed?");

  // Compute ABI information.
  if (CC == llvm::CallingConv::SPIR_KERNEL) {
    // Force target independent argument handling for the host visible
    // kernel functions.
    computeSPIRKernelABIInfo(CGM, FI&: *FI);
  } else if (info.getCC() == CC_Swift || info.getCC() == CC_SwiftAsync) {
    // Swift calling conventions use their own classification logic.
    swiftcall::computeABIInfo(CGM, FI&: *FI);
  } else {
    CGM.getABIInfo().computeInfo(FI&: *FI);
  }

  // Loop over all of the computed argument and return value info. If any of
  // them are direct or extend without a specified coerce type, specify the
  // default now.
  ABIArgInfo &retInfo = FI->getReturnInfo();
  if (retInfo.canHaveCoerceToType() && retInfo.getCoerceToType() == nullptr)
    retInfo.setCoerceToType(ConvertType(T: FI->getReturnType()));

  for (auto &I : FI->arguments())
    if (I.info.canHaveCoerceToType() && I.info.getCoerceToType() == nullptr)
      I.info.setCoerceToType(ConvertType(T: I.type));

  bool erased = FunctionsBeingProcessed.erase(Ptr: FI);
  (void)erased;
  assert(erased && "Not in set?");

  return *FI;
}
896
/// Allocate and initialize a CGFunctionInfo node. The ArgInfo array (one
/// slot for the return type plus one per argument) and the optional
/// ExtParameterInfo array are co-allocated as trailing objects in a single
/// heap allocation.
CGFunctionInfo *CGFunctionInfo::create(unsigned llvmCC, bool instanceMethod,
                                       bool chainCall, bool delegateCall,
                                       const FunctionType::ExtInfo &info,
                                       ArrayRef<ExtParameterInfo> paramInfos,
                                       CanQualType resultType,
                                       ArrayRef<CanQualType> argTypes,
                                       RequiredArgs required) {
  assert(paramInfos.empty() || paramInfos.size() == argTypes.size());
  assert(!required.allowsOptionalArgs() ||
         required.getNumRequiredArgs() <= argTypes.size());

  // The "+ 1" reserves the leading ArgInfo slot for the return type.
  void *buffer = operator new(totalSizeToAlloc<ArgInfo, ExtParameterInfo>(
      Counts: argTypes.size() + 1, Counts: paramInfos.size()));

  CGFunctionInfo *FI = new (buffer) CGFunctionInfo();
  FI->CallingConvention = llvmCC;
  // EffectiveCallingConvention starts identical; the ABI computation may
  // later override it.
  FI->EffectiveCallingConvention = llvmCC;
  FI->ASTCallingConvention = info.getCC();
  FI->InstanceMethod = instanceMethod;
  FI->ChainCall = chainCall;
  FI->DelegateCall = delegateCall;
  FI->CmseNSCall = info.getCmseNSCall();
  FI->NoReturn = info.getNoReturn();
  FI->ReturnsRetained = info.getProducesResult();
  FI->NoCallerSavedRegs = info.getNoCallerSavedRegs();
  FI->NoCfCheck = info.getNoCfCheck();
  FI->Required = required;
  FI->HasRegParm = info.getHasRegParm();
  FI->RegParm = info.getRegParm();
  FI->ArgStruct = nullptr;
  FI->ArgStructAlign = 0;
  FI->NumArgs = argTypes.size();
  FI->HasExtParameterInfos = !paramInfos.empty();
  // Slot 0 of the args buffer holds the return type; arguments follow at
  // index i + 1.
  FI->getArgsBuffer()[0].type = resultType;
  FI->MaxVectorWidth = 0;
  for (unsigned i = 0, e = argTypes.size(); i != e; ++i)
    FI->getArgsBuffer()[i + 1].type = argTypes[i];
  for (unsigned i = 0, e = paramInfos.size(); i != e; ++i)
    FI->getExtParameterInfosBuffer()[i] = paramInfos[i];
  return FI;
}
938
939/***/
940
namespace {
// ABIArgInfo::Expand implementation.

// Specifies the way QualType passed as ABIArgInfo::Expand is expanded.
struct TypeExpansion {
  enum TypeExpansionKind {
    // Elements of constant arrays are expanded recursively.
    TEK_ConstantArray,
    // Record fields are expanded recursively (but if record is a union, only
    // the field with the largest size is expanded).
    TEK_Record,
    // For complex types, real and imaginary parts are expanded recursively.
    TEK_Complex,
    // All other types are not expandable.
    TEK_None
  };

  // Discriminator for LLVM-style RTTI (isa<>/dyn_cast<> via classof below).
  const TypeExpansionKind Kind;

  TypeExpansion(TypeExpansionKind K) : Kind(K) {}
  // Virtual so derived expansions are destroyed correctly when deleted
  // through std::unique_ptr<TypeExpansion>.
  virtual ~TypeExpansion() {}
};

// Expansion of a constant array: NumElts copies of EltTy.
struct ConstantArrayExpansion : TypeExpansion {
  QualType EltTy;
  uint64_t NumElts;

  ConstantArrayExpansion(QualType EltTy, uint64_t NumElts)
      : TypeExpansion(TEK_ConstantArray), EltTy(EltTy), NumElts(NumElts) {}
  static bool classof(const TypeExpansion *TE) {
    return TE->Kind == TEK_ConstantArray;
  }
};

// Expansion of a record: its (non-virtual) bases followed by its fields.
struct RecordExpansion : TypeExpansion {
  SmallVector<const CXXBaseSpecifier *, 1> Bases;

  SmallVector<const FieldDecl *, 1> Fields;

  RecordExpansion(SmallVector<const CXXBaseSpecifier *, 1> &&Bases,
                  SmallVector<const FieldDecl *, 1> &&Fields)
      : TypeExpansion(TEK_Record), Bases(std::move(Bases)),
        Fields(std::move(Fields)) {}
  static bool classof(const TypeExpansion *TE) {
    return TE->Kind == TEK_Record;
  }
};

// Expansion of a _Complex into its element type (emitted twice: real, imag).
struct ComplexExpansion : TypeExpansion {
  QualType EltTy;

  ComplexExpansion(QualType EltTy) : TypeExpansion(TEK_Complex), EltTy(EltTy) {}
  static bool classof(const TypeExpansion *TE) {
    return TE->Kind == TEK_Complex;
  }
};

// Marker for types that are not expanded at all.
struct NoExpansion : TypeExpansion {
  NoExpansion() : TypeExpansion(TEK_None) {}
  static bool classof(const TypeExpansion *TE) { return TE->Kind == TEK_None; }
};
} // namespace
1003
/// Classify how \p Ty is flattened when passed or returned as
/// ABIArgInfo::Expand: constant arrays expand per element, records per
/// base/field, _Complex into (real, imag), and everything else stays a
/// single value (NoExpansion).
static std::unique_ptr<TypeExpansion>
getTypeExpansion(QualType Ty, const ASTContext &Context) {
  if (const ConstantArrayType *AT = Context.getAsConstantArrayType(T: Ty)) {
    return std::make_unique<ConstantArrayExpansion>(args: AT->getElementType(),
                                                    args: AT->getZExtSize());
  }
  if (const auto *RD = Ty->getAsRecordDecl()) {
    SmallVector<const CXXBaseSpecifier *, 1> Bases;
    SmallVector<const FieldDecl *, 1> Fields;
    assert(!RD->hasFlexibleArrayMember() &&
           "Cannot expand structure with flexible array.");
    if (RD->isUnion()) {
      // Unions can be here only in degenerative cases - all the fields are same
      // after flattening. Thus we have to use the "largest" field.
      const FieldDecl *LargestFD = nullptr;
      CharUnits UnionSize = CharUnits::Zero();

      for (const auto *FD : RD->fields()) {
        if (FD->isZeroLengthBitField())
          continue;
        assert(!FD->isBitField() &&
               "Cannot expand structure with bit-field members.");
        CharUnits FieldSize = Context.getTypeSizeInChars(T: FD->getType());
        if (UnionSize < FieldSize) {
          UnionSize = FieldSize;
          LargestFD = FD;
        }
      }
      if (LargestFD)
        Fields.push_back(Elt: LargestFD);
    } else {
      if (const auto *CXXRD = dyn_cast<CXXRecordDecl>(Val: RD)) {
        assert(!CXXRD->isDynamicClass() &&
               "cannot expand vtable pointers in dynamic classes");
        // Record the bases first so expansion order mirrors layout order.
        llvm::append_range(C&: Bases, R: llvm::make_pointer_range(Range: CXXRD->bases()));
      }

      for (const auto *FD : RD->fields()) {
        if (FD->isZeroLengthBitField())
          continue;
        assert(!FD->isBitField() &&
               "Cannot expand structure with bit-field members.");
        Fields.push_back(Elt: FD);
      }
    }
    return std::make_unique<RecordExpansion>(args: std::move(Bases),
                                             args: std::move(Fields));
  }
  if (const ComplexType *CT = Ty->getAs<ComplexType>()) {
    return std::make_unique<ComplexExpansion>(args: CT->getElementType());
  }
  return std::make_unique<NoExpansion>();
}
1057
1058static int getExpansionSize(QualType Ty, const ASTContext &Context) {
1059 auto Exp = getTypeExpansion(Ty, Context);
1060 if (auto CAExp = dyn_cast<ConstantArrayExpansion>(Val: Exp.get())) {
1061 return CAExp->NumElts * getExpansionSize(Ty: CAExp->EltTy, Context);
1062 }
1063 if (auto RExp = dyn_cast<RecordExpansion>(Val: Exp.get())) {
1064 int Res = 0;
1065 for (auto BS : RExp->Bases)
1066 Res += getExpansionSize(Ty: BS->getType(), Context);
1067 for (auto FD : RExp->Fields)
1068 Res += getExpansionSize(Ty: FD->getType(), Context);
1069 return Res;
1070 }
1071 if (isa<ComplexExpansion>(Val: Exp.get()))
1072 return 2;
1073 assert(isa<NoExpansion>(Exp.get()));
1074 return 1;
1075}
1076
/// Append the flattened sequence of IR types for an expanded value of type
/// \p Ty through the output iterator \p TI, in the same order the expanded
/// values are emitted. A _Complex contributes two elements (real, imag).
void CodeGenTypes::getExpandedTypes(
    QualType Ty, SmallVectorImpl<llvm::Type *>::iterator &TI) {
  auto Exp = getTypeExpansion(Ty, Context);
  if (auto CAExp = dyn_cast<ConstantArrayExpansion>(Val: Exp.get())) {
    for (int i = 0, n = CAExp->NumElts; i < n; i++) {
      getExpandedTypes(Ty: CAExp->EltTy, TI);
    }
  } else if (auto RExp = dyn_cast<RecordExpansion>(Val: Exp.get())) {
    // Bases before fields, matching getTypeExpansion's ordering.
    for (auto BS : RExp->Bases)
      getExpandedTypes(Ty: BS->getType(), TI);
    for (auto FD : RExp->Fields)
      getExpandedTypes(Ty: FD->getType(), TI);
  } else if (auto CExp = dyn_cast<ComplexExpansion>(Val: Exp.get())) {
    llvm::Type *EltTy = ConvertType(T: CExp->EltTy);
    *TI++ = EltTy;
    *TI++ = EltTy;
  } else {
    assert(isa<NoExpansion>(Exp.get()));
    *TI++ = ConvertType(T: Ty);
  }
}
1098
1099static void forConstantArrayExpansion(CodeGenFunction &CGF,
1100 ConstantArrayExpansion *CAE,
1101 Address BaseAddr,
1102 llvm::function_ref<void(Address)> Fn) {
1103 for (int i = 0, n = CAE->NumElts; i < n; i++) {
1104 Address EltAddr = CGF.Builder.CreateConstGEP2_32(Addr: BaseAddr, Idx0: 0, Idx1: i);
1105 Fn(EltAddr);
1106 }
1107}
1108
/// Reassemble an expanded parameter: consume consecutive IR function
/// arguments from \p AI and store them into the corresponding pieces of the
/// aggregate lvalue \p LV, recursing in the same order getTypeExpansion()
/// flattened the type.
void CodeGenFunction::ExpandTypeFromArgs(QualType Ty, LValue LV,
                                         llvm::Function::arg_iterator &AI) {
  assert(LV.isSimple() &&
         "Unexpected non-simple lvalue during struct expansion.");

  auto Exp = getTypeExpansion(Ty, Context: getContext());
  if (auto CAExp = dyn_cast<ConstantArrayExpansion>(Val: Exp.get())) {
    forConstantArrayExpansion(
        CGF&: *this, CAE: CAExp, BaseAddr: LV.getAddress(), Fn: [&](Address EltAddr) {
          LValue LV = MakeAddrLValue(Addr: EltAddr, T: CAExp->EltTy);
          ExpandTypeFromArgs(Ty: CAExp->EltTy, LV, AI);
        });
  } else if (auto RExp = dyn_cast<RecordExpansion>(Val: Exp.get())) {
    Address This = LV.getAddress();
    for (const CXXBaseSpecifier *BS : RExp->Bases) {
      // Perform a single step derived-to-base conversion.
      Address Base =
          GetAddressOfBaseClass(Value: This, Derived: Ty->getAsCXXRecordDecl(), PathBegin: &BS, PathEnd: &BS + 1,
                                /*NullCheckValue=*/false, Loc: SourceLocation());
      LValue SubLV = MakeAddrLValue(Addr: Base, T: BS->getType());

      // Recurse onto bases.
      ExpandTypeFromArgs(Ty: BS->getType(), LV: SubLV, AI);
    }
    for (auto FD : RExp->Fields) {
      // FIXME: What are the right qualifiers here?
      LValue SubLV = EmitLValueForFieldInitialization(Base: LV, Field: FD);
      ExpandTypeFromArgs(Ty: FD->getType(), LV: SubLV, AI);
    }
  } else if (isa<ComplexExpansion>(Val: Exp.get())) {
    // A complex value consumes two IR arguments: real then imaginary.
    auto realValue = &*AI++;
    auto imagValue = &*AI++;
    EmitStoreOfComplex(V: ComplexPairTy(realValue, imagValue), dest: LV, /*init*/ isInit: true);
  } else {
    // Call EmitStoreOfScalar except when the lvalue is a bitfield to emit a
    // primitive store.
    assert(isa<NoExpansion>(Exp.get()));
    llvm::Value *Arg = &*AI++;
    if (LV.isBitField()) {
      EmitStoreThroughLValue(Src: RValue::get(V: Arg), Dst: LV);
    } else {
      // TODO: currently there are some places are inconsistent in what LLVM
      // pointer type they use (see D118744). Once clang uses opaque pointers
      // all LLVM pointer types will be the same and we can remove this check.
      if (Arg->getType()->isPointerTy()) {
        Address Addr = LV.getAddress();
        Arg = Builder.CreateBitCast(V: Arg, DestTy: Addr.getElementType());
      }
      EmitStoreOfScalar(value: Arg, lvalue: LV);
    }
  }
}
1161
/// Flatten the call argument \p Arg of type \p Ty into individual IR call
/// operands, writing them into \p IRCallArgs starting at \p IRCallArgPos.
/// This is the caller-side mirror of ExpandTypeFromArgs and must emit values
/// in the same order.
void CodeGenFunction::ExpandTypeToArgs(
    QualType Ty, CallArg Arg, llvm::FunctionType *IRFuncTy,
    SmallVectorImpl<llvm::Value *> &IRCallArgs, unsigned &IRCallArgPos) {
  auto Exp = getTypeExpansion(Ty, Context: getContext());
  if (auto CAExp = dyn_cast<ConstantArrayExpansion>(Val: Exp.get())) {
    Address Addr = Arg.hasLValue() ? Arg.getKnownLValue().getAddress()
                                   : Arg.getKnownRValue().getAggregateAddress();
    forConstantArrayExpansion(CGF&: *this, CAE: CAExp, BaseAddr: Addr, Fn: [&](Address EltAddr) {
      CallArg EltArg =
          CallArg(convertTempToRValue(addr: EltAddr, type: CAExp->EltTy, Loc: SourceLocation()),
                  CAExp->EltTy);
      ExpandTypeToArgs(Ty: CAExp->EltTy, Arg: EltArg, IRFuncTy, IRCallArgs,
                       IRCallArgPos);
    });
  } else if (auto RExp = dyn_cast<RecordExpansion>(Val: Exp.get())) {
    Address This = Arg.hasLValue() ? Arg.getKnownLValue().getAddress()
                                   : Arg.getKnownRValue().getAggregateAddress();
    for (const CXXBaseSpecifier *BS : RExp->Bases) {
      // Perform a single step derived-to-base conversion.
      Address Base =
          GetAddressOfBaseClass(Value: This, Derived: Ty->getAsCXXRecordDecl(), PathBegin: &BS, PathEnd: &BS + 1,
                                /*NullCheckValue=*/false, Loc: SourceLocation());
      CallArg BaseArg = CallArg(RValue::getAggregate(addr: Base), BS->getType());

      // Recurse onto bases.
      ExpandTypeToArgs(Ty: BS->getType(), Arg: BaseArg, IRFuncTy, IRCallArgs,
                       IRCallArgPos);
    }

    LValue LV = MakeAddrLValue(Addr: This, T: Ty);
    for (auto FD : RExp->Fields) {
      CallArg FldArg =
          CallArg(EmitRValueForField(LV, FD, Loc: SourceLocation()), FD->getType());
      ExpandTypeToArgs(Ty: FD->getType(), Arg: FldArg, IRFuncTy, IRCallArgs,
                       IRCallArgPos);
    }
  } else if (isa<ComplexExpansion>(Val: Exp.get())) {
    // A complex value occupies two consecutive IR operand slots.
    ComplexPairTy CV = Arg.getKnownRValue().getComplexVal();
    IRCallArgs[IRCallArgPos++] = CV.first;
    IRCallArgs[IRCallArgPos++] = CV.second;
  } else {
    assert(isa<NoExpansion>(Exp.get()));
    auto RV = Arg.getKnownRValue();
    assert(RV.isScalar() &&
           "Unexpected non-scalar rvalue during struct expansion.");

    // Insert a bitcast as needed.
    llvm::Value *V = RV.getScalarVal();
    if (IRCallArgPos < IRFuncTy->getNumParams() &&
        V->getType() != IRFuncTy->getParamType(i: IRCallArgPos))
      V = Builder.CreateBitCast(V, DestTy: IRFuncTy->getParamType(i: IRCallArgPos));

    IRCallArgs[IRCallArgPos++] = V;
  }
}
1217
1218/// Create a temporary allocation for the purposes of coercion.
1219static RawAddress CreateTempAllocaForCoercion(CodeGenFunction &CGF,
1220 llvm::Type *Ty,
1221 CharUnits MinAlign,
1222 const Twine &Name = "tmp") {
1223 // Don't use an alignment that's worse than what LLVM would prefer.
1224 auto PrefAlign = CGF.CGM.getDataLayout().getPrefTypeAlign(Ty);
1225 CharUnits Align = std::max(a: MinAlign, b: CharUnits::fromQuantity(Quantity: PrefAlign));
1226
1227 return CGF.CreateTempAlloca(Ty, align: Align, Name: Name + ".coerce");
1228}
1229
1230/// EnterStructPointerForCoercedAccess - Given a struct pointer that we are
1231/// accessing some number of bytes out of it, try to gep into the struct to get
1232/// at its inner goodness. Dive as deep as possible without entering an element
1233/// with an in-memory size smaller than DstSize.
1234static Address EnterStructPointerForCoercedAccess(Address SrcPtr,
1235 llvm::StructType *SrcSTy,
1236 uint64_t DstSize,
1237 CodeGenFunction &CGF) {
1238 // We can't dive into a zero-element struct.
1239 if (SrcSTy->getNumElements() == 0)
1240 return SrcPtr;
1241
1242 llvm::Type *FirstElt = SrcSTy->getElementType(N: 0);
1243
1244 // If the first elt is at least as large as what we're looking for, or if the
1245 // first element is the same size as the whole struct, we can enter it. The
1246 // comparison must be made on the store size and not the alloca size. Using
1247 // the alloca size may overstate the size of the load.
1248 uint64_t FirstEltSize = CGF.CGM.getDataLayout().getTypeStoreSize(Ty: FirstElt);
1249 if (FirstEltSize < DstSize &&
1250 FirstEltSize < CGF.CGM.getDataLayout().getTypeStoreSize(Ty: SrcSTy))
1251 return SrcPtr;
1252
1253 // GEP into the first element.
1254 SrcPtr = CGF.Builder.CreateStructGEP(Addr: SrcPtr, Index: 0, Name: "coerce.dive");
1255
1256 // If the first element is a struct, recurse.
1257 llvm::Type *SrcTy = SrcPtr.getElementType();
1258 if (llvm::StructType *SrcSTy = dyn_cast<llvm::StructType>(Val: SrcTy))
1259 return EnterStructPointerForCoercedAccess(SrcPtr, SrcSTy, DstSize, CGF);
1260
1261 return SrcPtr;
1262}
1263
1264/// CoerceIntOrPtrToIntOrPtr - Convert a value Val to the specific Ty where both
1265/// are either integers or pointers. This does a truncation of the value if it
1266/// is too large or a zero extension if it is too small.
1267///
1268/// This behaves as if the value were coerced through memory, so on big-endian
1269/// targets the high bits are preserved in a truncation, while little-endian
1270/// targets preserve the low bits.
1271static llvm::Value *CoerceIntOrPtrToIntOrPtr(llvm::Value *Val, llvm::Type *Ty,
1272 CodeGenFunction &CGF) {
1273 if (Val->getType() == Ty)
1274 return Val;
1275
1276 if (isa<llvm::PointerType>(Val: Val->getType())) {
1277 // If this is Pointer->Pointer avoid conversion to and from int.
1278 if (isa<llvm::PointerType>(Val: Ty))
1279 return CGF.Builder.CreateBitCast(V: Val, DestTy: Ty, Name: "coerce.val");
1280
1281 // Convert the pointer to an integer so we can play with its width.
1282 Val = CGF.Builder.CreatePtrToInt(V: Val, DestTy: CGF.IntPtrTy, Name: "coerce.val.pi");
1283 }
1284
1285 llvm::Type *DestIntTy = Ty;
1286 if (isa<llvm::PointerType>(Val: DestIntTy))
1287 DestIntTy = CGF.IntPtrTy;
1288
1289 if (Val->getType() != DestIntTy) {
1290 const llvm::DataLayout &DL = CGF.CGM.getDataLayout();
1291 if (DL.isBigEndian()) {
1292 // Preserve the high bits on big-endian targets.
1293 // That is what memory coercion does.
1294 uint64_t SrcSize = DL.getTypeSizeInBits(Ty: Val->getType());
1295 uint64_t DstSize = DL.getTypeSizeInBits(Ty: DestIntTy);
1296
1297 if (SrcSize > DstSize) {
1298 Val = CGF.Builder.CreateLShr(LHS: Val, RHS: SrcSize - DstSize, Name: "coerce.highbits");
1299 Val = CGF.Builder.CreateTrunc(V: Val, DestTy: DestIntTy, Name: "coerce.val.ii");
1300 } else {
1301 Val = CGF.Builder.CreateZExt(V: Val, DestTy: DestIntTy, Name: "coerce.val.ii");
1302 Val = CGF.Builder.CreateShl(LHS: Val, RHS: DstSize - SrcSize, Name: "coerce.highbits");
1303 }
1304 } else {
1305 // Little-endian targets preserve the low bits. No shifts required.
1306 Val = CGF.Builder.CreateIntCast(V: Val, DestTy: DestIntTy, isSigned: false, Name: "coerce.val.ii");
1307 }
1308 }
1309
1310 if (isa<llvm::PointerType>(Val: Ty))
1311 Val = CGF.Builder.CreateIntToPtr(V: Val, DestTy: Ty, Name: "coerce.val.ip");
1312 return Val;
1313}
1314
/// Load a coerced value from \p Src when the source type contains PFP fields.
/// Returns nullptr when \p SrcFETy has no PFP fields, signalling the caller
/// to use the normal coercion path.
///
/// NOTE(review): PFP appears to be a pointer-field-protection scheme where
/// protected pointer fields must be accessed through
/// EmitAddressOfPFPField rather than plain GEPs — confirm against the PFP
/// feature documentation; findPFPFields/EmitAddressOfPFPField are defined
/// elsewhere.
static llvm::Value *CreatePFPCoercedLoad(Address Src, QualType SrcFETy,
                                         llvm::Type *Ty, CodeGenFunction &CGF) {
  std::vector<PFPField> PFPFields = CGF.getContext().findPFPFields(Ty: SrcFETy);
  if (PFPFields.empty())
    return nullptr;

  auto LoadCoercedField = [&](CharUnits Offset,
                              llvm::Type *FieldType) -> llvm::Value * {
    // Check whether the field at Offset is a PFP field. This function is called
    // in ascending order of offset, and PFPFields is sorted by offset. This
    // means that we only need to check the first element (and remove it from
    // PFPFields if matching).
    if (!PFPFields.empty() && PFPFields[0].Offset == Offset) {
      auto FieldAddr = CGF.EmitAddressOfPFPField(RecordPtr: Src, Field: PFPFields[0]);
      llvm::Value *FieldVal = CGF.Builder.CreateLoad(Addr: FieldAddr);
      if (isa<llvm::IntegerType>(Val: FieldType))
        FieldVal = CGF.Builder.CreatePtrToInt(V: FieldVal, DestTy: FieldType);
      PFPFields.erase(position: PFPFields.begin());
      return FieldVal;
    }
    // Not a PFP field: plain byte-offset load of FieldType.
    auto FieldAddr =
        CGF.Builder
            .CreateConstInBoundsByteGEP(Addr: Src.withElementType(ElemTy: CGF.Int8Ty), Offset)
            .withElementType(ElemTy: FieldType);
    return CGF.Builder.CreateLoad(Addr: FieldAddr);
  };

  // The types handled by this function are the only ones that may be generated
  // by AArch64ABIInfo::classify{Argument,Return}Type for struct types with
  // pointers. PFP is only supported on AArch64.
  if (isa<llvm::IntegerType>(Val: Ty) || isa<llvm::PointerType>(Val: Ty)) {
    // Single-register case: the coerced value is exactly the first PFP field.
    auto Addr = CGF.EmitAddressOfPFPField(RecordPtr: Src, Field: PFPFields[0]);
    llvm::Value *Val = CGF.Builder.CreateLoad(Addr);
    if (isa<llvm::IntegerType>(Val: Ty))
      Val = CGF.Builder.CreatePtrToInt(V: Val, DestTy: Ty);
    return Val;
  }
  // Array case: build the coerced array value one word at a time.
  auto *AT = cast<llvm::ArrayType>(Val: Ty);
  auto *ET = AT->getElementType();
  CharUnits WordSize = CGF.getContext().toCharUnitsFromBits(
      BitSize: CGF.CGM.getDataLayout().getTypeSizeInBits(Ty: ET));
  CharUnits Offset = CharUnits::Zero();
  llvm::Value *Val = llvm::PoisonValue::get(T: AT);
  for (unsigned Idx = 0; Idx != AT->getNumElements(); ++Idx, Offset += WordSize)
    Val = CGF.Builder.CreateInsertValue(Agg: Val, Val: LoadCoercedField(Offset, ET), Idxs: Idx);
  return Val;
}
1362
/// CreateCoercedLoad - Create a load from \arg SrcPtr interpreted as
/// a pointer to an object of type \arg Ty, known to be aligned to
/// \arg SrcAlign bytes.
///
/// This safely handles the case when the src type is smaller than the
/// destination type; in this situation the values of bits which not
/// present in the src are undefined.
static llvm::Value *CreateCoercedLoad(Address Src, QualType SrcFETy,
                                      llvm::Type *Ty, CodeGenFunction &CGF) {
  llvm::Type *SrcTy = Src.getElementType();

  // If SrcTy and Ty are the same, just do a load.
  if (SrcTy == Ty)
    return CGF.Builder.CreateLoad(Addr: Src);

  // Types with PFP fields need their protected pointers loaded specially.
  if (llvm::Value *V = CreatePFPCoercedLoad(Src, SrcFETy, Ty, CGF))
    return V;

  llvm::TypeSize DstSize = CGF.CGM.getDataLayout().getTypeAllocSize(Ty);

  // Try to dive into the source struct to reach a leaf of at least DstSize.
  if (llvm::StructType *SrcSTy = dyn_cast<llvm::StructType>(Val: SrcTy)) {
    Src = EnterStructPointerForCoercedAccess(SrcPtr: Src, SrcSTy,
                                             DstSize: DstSize.getFixedValue(), CGF);
    SrcTy = Src.getElementType();
  }

  llvm::TypeSize SrcSize = CGF.CGM.getDataLayout().getTypeAllocSize(Ty: SrcTy);

  // If the source and destination are integer or pointer types, just do an
  // extension or truncation to the desired type.
  if ((isa<llvm::IntegerType>(Val: Ty) || isa<llvm::PointerType>(Val: Ty)) &&
      (isa<llvm::IntegerType>(Val: SrcTy) || isa<llvm::PointerType>(Val: SrcTy))) {
    llvm::Value *Load = CGF.Builder.CreateLoad(Addr: Src);
    return CoerceIntOrPtrToIntOrPtr(Val: Load, Ty, CGF);
  }

  // If load is legal, just bitcast the src pointer.
  if (!SrcSize.isScalable() && !DstSize.isScalable() &&
      SrcSize.getFixedValue() >= DstSize.getFixedValue()) {
    // Generally SrcSize is never greater than DstSize, since this means we are
    // losing bits. However, this can happen in cases where the structure has
    // additional padding, for example due to a user specified alignment.
    //
    // FIXME: Assert that we aren't truncating non-padding bits when have access
    // to that information.
    Src = Src.withElementType(ElemTy: Ty);
    return CGF.Builder.CreateLoad(Addr: Src);
  }

  // If coercing a fixed vector to a scalable vector for ABI compatibility, and
  // the types match, use the llvm.vector.insert intrinsic to perform the
  // conversion.
  if (auto *ScalableDstTy = dyn_cast<llvm::ScalableVectorType>(Val: Ty)) {
    if (auto *FixedSrcTy = dyn_cast<llvm::FixedVectorType>(Val: SrcTy)) {
      // If we are casting a fixed i8 vector to a scalable i1 predicate
      // vector, use a vector insert and bitcast the result.
      if (ScalableDstTy->getElementType()->isIntegerTy(Bitwidth: 1) &&
          FixedSrcTy->getElementType()->isIntegerTy(Bitwidth: 8)) {
        // Re-express the destination as a scalable i8 vector with 1/8 the
        // element count so the insert operates on matching element types.
        ScalableDstTy = llvm::ScalableVectorType::get(
            ElementType: FixedSrcTy->getElementType(),
            MinNumElts: llvm::divideCeil(
                Numerator: ScalableDstTy->getElementCount().getKnownMinValue(), Denominator: 8));
      }
      if (ScalableDstTy->getElementType() == FixedSrcTy->getElementType()) {
        auto *Load = CGF.Builder.CreateLoad(Addr: Src);
        auto *PoisonVec = llvm::PoisonValue::get(T: ScalableDstTy);
        llvm::Value *Result = CGF.Builder.CreateInsertVector(
            DstType: ScalableDstTy, SrcVec: PoisonVec, SubVec: Load, Idx: uint64_t(0), Name: "cast.scalable");
        ScalableDstTy = cast<llvm::ScalableVectorType>(
            Val: llvm::VectorType::getWithSizeAndScalar(SizeTy: ScalableDstTy, EltTy: Ty));
        if (Result->getType() != ScalableDstTy)
          Result = CGF.Builder.CreateBitCast(V: Result, DestTy: ScalableDstTy);
        if (Result->getType() != Ty)
          Result = CGF.Builder.CreateExtractVector(DstType: Ty, SrcVec: Result, Idx: uint64_t(0));
        return Result;
      }
    }
  }

  // Otherwise do coercion through memory. This is stupid, but simple.
  RawAddress Tmp =
      CreateTempAllocaForCoercion(CGF, Ty, MinAlign: Src.getAlignment(), Name: Src.getName());
  CGF.Builder.CreateMemCpy(
      Dst: Tmp.getPointer(), DstAlign: Tmp.getAlignment().getAsAlign(),
      Src: Src.emitRawPointer(CGF), SrcAlign: Src.getAlignment().getAsAlign(),
      Size: llvm::ConstantInt::get(Ty: CGF.IntPtrTy, V: SrcSize.getKnownMinValue()));
  return CGF.Builder.CreateLoad(Addr: Tmp);
}
1451
/// Store the coerced value \p Src into \p Dst when the destination type
/// contains PFP fields. Returns false when \p SrcFETy has no PFP fields,
/// signalling the caller to use the normal coercion path.
///
/// NOTE(review): counterpart of CreatePFPCoercedLoad — protected pointer
/// fields are written through EmitAddressOfPFPField; confirm semantics
/// against the PFP feature documentation.
static bool CreatePFPCoercedStore(llvm::Value *Src, QualType SrcFETy,
                                  Address Dst, CodeGenFunction &CGF) {
  std::vector<PFPField> PFPFields = CGF.getContext().findPFPFields(Ty: SrcFETy);
  if (PFPFields.empty())
    return false;

  llvm::Type *SrcTy = Src->getType();
  // Called in ascending offset order; PFPFields is sorted by offset, so only
  // the front element needs checking (and popping on a match).
  auto StoreCoercedField = [&](CharUnits Offset, llvm::Value *FieldVal) {
    if (!PFPFields.empty() && PFPFields[0].Offset == Offset) {
      auto FieldAddr = CGF.EmitAddressOfPFPField(RecordPtr: Dst, Field: PFPFields[0]);
      if (isa<llvm::IntegerType>(Val: FieldVal->getType()))
        FieldVal = CGF.Builder.CreateIntToPtr(V: FieldVal, DestTy: CGF.VoidPtrTy);
      CGF.Builder.CreateStore(Val: FieldVal, Addr: FieldAddr);
      PFPFields.erase(position: PFPFields.begin());
    } else {
      // Not a PFP field: plain byte-offset store.
      auto FieldAddr = CGF.Builder
                           .CreateConstInBoundsByteGEP(
                               Addr: Dst.withElementType(ElemTy: CGF.Int8Ty), Offset)
                           .withElementType(ElemTy: FieldVal->getType());
      CGF.Builder.CreateStore(Val: FieldVal, Addr: FieldAddr);
    }
  };

  // The types handled by this function are the only ones that may be generated
  // by AArch64ABIInfo::classify{Argument,Return}Type for struct types with
  // pointers. PFP is only supported on AArch64.
  if (isa<llvm::IntegerType>(Val: SrcTy) || isa<llvm::PointerType>(Val: SrcTy)) {
    // Single-register case: the whole value is the first PFP field.
    if (isa<llvm::IntegerType>(Val: SrcTy))
      Src = CGF.Builder.CreateIntToPtr(V: Src, DestTy: CGF.VoidPtrTy);
    auto Addr = CGF.EmitAddressOfPFPField(RecordPtr: Dst, Field: PFPFields[0]);
    CGF.Builder.CreateStore(Val: Src, Addr);
  } else {
    // Array case: scatter the coerced array one word at a time.
    auto *AT = cast<llvm::ArrayType>(Val: SrcTy);
    auto *ET = AT->getElementType();
    CharUnits WordSize = CGF.getContext().toCharUnitsFromBits(
        BitSize: CGF.CGM.getDataLayout().getTypeSizeInBits(Ty: ET));
    CharUnits Offset = CharUnits::Zero();
    for (unsigned i = 0; i != AT->getNumElements(); ++i, Offset += WordSize)
      StoreCoercedField(Offset, CGF.Builder.CreateExtractValue(Agg: Src, Idxs: i));
  }
  return true;
}
1494
/// Store the coerced value \p Src into \p Dst, an object of \p DstSize bytes.
/// Mirror of CreateCoercedLoad: picks between a direct store, elementwise
/// struct stores, int<->pointer coercion, or a memcpy through a temporary.
/// Each emitted store is registered with the current source atom for debug
/// info (Key Instructions).
void CodeGenFunction::CreateCoercedStore(llvm::Value *Src, QualType SrcFETy,
                                         Address Dst, llvm::TypeSize DstSize,
                                         bool DstIsVolatile) {
  // Nothing to store into a zero-sized destination.
  if (!DstSize)
    return;

  llvm::Type *SrcTy = Src->getType();
  llvm::TypeSize SrcSize = CGM.getDataLayout().getTypeAllocSize(Ty: SrcTy);

  // GEP into structs to try to make types match.
  // FIXME: This isn't really that useful with opaque types, but it impacts a
  // lot of regression tests.
  if (SrcTy != Dst.getElementType()) {
    if (llvm::StructType *DstSTy =
            dyn_cast<llvm::StructType>(Val: Dst.getElementType())) {
      assert(!SrcSize.isScalable());
      Dst = EnterStructPointerForCoercedAccess(SrcPtr: Dst, SrcSTy: DstSTy,
                                               DstSize: SrcSize.getFixedValue(), CGF&: *this);
    }
  }

  // Destinations with PFP fields need their protected pointers stored
  // specially.
  if (CreatePFPCoercedStore(Src, SrcFETy, Dst, CGF&: *this))
    return;

  if (SrcSize.isScalable() || SrcSize <= DstSize) {
    if (SrcTy->isIntegerTy() && Dst.getElementType()->isPointerTy() &&
        SrcSize == CGM.getDataLayout().getTypeAllocSize(Ty: Dst.getElementType())) {
      // If the value is supposed to be a pointer, convert it before storing it.
      Src = CoerceIntOrPtrToIntOrPtr(Val: Src, Ty: Dst.getElementType(), CGF&: *this);
      auto *I = Builder.CreateStore(Val: Src, Addr: Dst, IsVolatile: DstIsVolatile);
      addInstToCurrentSourceAtom(KeyInstruction: I, Backup: Src);
    } else if (llvm::StructType *STy =
                   dyn_cast<llvm::StructType>(Val: Src->getType())) {
      // Prefer scalar stores to first-class aggregate stores.
      Dst = Dst.withElementType(ElemTy: SrcTy);
      for (unsigned i = 0, e = STy->getNumElements(); i != e; ++i) {
        Address EltPtr = Builder.CreateStructGEP(Addr: Dst, Index: i);
        llvm::Value *Elt = Builder.CreateExtractValue(Agg: Src, Idxs: i);
        auto *I = Builder.CreateStore(Val: Elt, Addr: EltPtr, IsVolatile: DstIsVolatile);
        addInstToCurrentSourceAtom(KeyInstruction: I, Backup: Elt);
      }
    } else {
      auto *I =
          Builder.CreateStore(Val: Src, Addr: Dst.withElementType(ElemTy: SrcTy), IsVolatile: DstIsVolatile);
      addInstToCurrentSourceAtom(KeyInstruction: I, Backup: Src);
    }
  } else if (SrcTy->isIntegerTy()) {
    // If the source is a simple integer, coerce it directly.
    llvm::Type *DstIntTy = Builder.getIntNTy(N: DstSize.getFixedValue() * 8);
    Src = CoerceIntOrPtrToIntOrPtr(Val: Src, Ty: DstIntTy, CGF&: *this);
    auto *I =
        Builder.CreateStore(Val: Src, Addr: Dst.withElementType(ElemTy: DstIntTy), IsVolatile: DstIsVolatile);
    addInstToCurrentSourceAtom(KeyInstruction: I, Backup: Src);
  } else {
    // Otherwise do coercion through memory. This is stupid, but
    // simple.

    // Generally SrcSize is never greater than DstSize, since this means we are
    // losing bits. However, this can happen in cases where the structure has
    // additional padding, for example due to a user specified alignment.
    //
    // FIXME: Assert that we aren't truncating non-padding bits when have access
    // to that information.
    RawAddress Tmp =
        CreateTempAllocaForCoercion(CGF&: *this, Ty: SrcTy, MinAlign: Dst.getAlignment());
    Builder.CreateStore(Val: Src, Addr: Tmp);
    auto *I = Builder.CreateMemCpy(
        Dst: Dst.emitRawPointer(CGF&: *this), DstAlign: Dst.getAlignment().getAsAlign(),
        Src: Tmp.getPointer(), SrcAlign: Tmp.getAlignment().getAsAlign(),
        Size: Builder.CreateTypeSize(Ty: IntPtrTy, Size: DstSize));
    addInstToCurrentSourceAtom(KeyInstruction: I, Backup: Src);
  }
}
1568
1569static Address emitAddressAtOffset(CodeGenFunction &CGF, Address addr,
1570 const ABIArgInfo &info) {
1571 if (unsigned offset = info.getDirectOffset()) {
1572 addr = addr.withElementType(ElemTy: CGF.Int8Ty);
1573 addr = CGF.Builder.CreateConstInBoundsByteGEP(
1574 Addr: addr, Offset: CharUnits::fromQuantity(Quantity: offset));
1575 addr = addr.withElementType(ElemTy: info.getCoerceToType());
1576 }
1577 return addr;
1578}
1579
/// Try to coerce \p V, a value of scalable vector type \p FromTy, to the
/// fixed-length vector type \p ToTy by extracting the leading fixed-length
/// subvector. Returns the (possibly rewritten) value and a flag saying
/// whether the coercion was actually performed.
static std::pair<llvm::Value *, bool>
CoerceScalableToFixed(CodeGenFunction &CGF, llvm::FixedVectorType *ToTy,
                      llvm::ScalableVectorType *FromTy, llvm::Value *V,
                      StringRef Name = "") {
  // If we are casting a scalable i1 predicate vector to a fixed i8
  // vector, first bitcast the source.
  if (FromTy->getElementType()->isIntegerTy(Bitwidth: 1) &&
      ToTy->getElementType() == CGF.Builder.getInt8Ty()) {
    // An i1 element count that is not a multiple of 8 cannot be bitcast to
    // i8 directly; pad the predicate out with zero lanes first.
    if (!FromTy->getElementCount().isKnownMultipleOf(RHS: 8)) {
      FromTy = llvm::ScalableVectorType::get(
          ElementType: FromTy->getElementType(),
          MinNumElts: llvm::alignTo<8>(Value: FromTy->getElementCount().getKnownMinValue()));
      llvm::Value *ZeroVec = llvm::Constant::getNullValue(Ty: FromTy);
      V = CGF.Builder.CreateInsertVector(DstType: FromTy, SrcVec: ZeroVec, SubVec: V, Idx: uint64_t(0));
    }
    // Reinterpret each group of 8 predicate bits as one i8 lane.
    FromTy = llvm::ScalableVectorType::get(
        ElementType: ToTy->getElementType(),
        MinNumElts: FromTy->getElementCount().getKnownMinValue() / 8);
    V = CGF.Builder.CreateBitCast(V, DestTy: FromTy);
  }
  // With matching element types we can extract the fixed-width prefix.
  if (FromTy->getElementType() == ToTy->getElementType()) {
    V->setName(Name + ".coerce");
    V = CGF.Builder.CreateExtractVector(DstType: ToTy, SrcVec: V, Idx: uint64_t(0), Name: "cast.fixed");
    return {V, true};
  }
  // Element types differ: report that no coercion happened.
  return {V, false};
}
1607
namespace {

/// Encapsulates information about the way function arguments from
/// CGFunctionInfo should be passed to actual LLVM IR function.
class ClangToLLVMArgMapping {
  static const unsigned InvalidIndex = ~0U;
  // IR index of the inalloca argument, or InvalidIndex if there is none.
  unsigned InallocaArgNo;
  // IR index of the sret (indirect return) argument, or InvalidIndex.
  unsigned SRetArgNo;
  // Total number of IR arguments, including padding/sret/inalloca slots.
  unsigned TotalIRArgs;

  /// Arguments of LLVM IR function corresponding to single Clang argument.
  struct IRArgs {
    unsigned PaddingArgIndex;
    // Argument is expanded to IR arguments at positions
    // [FirstArgIndex, FirstArgIndex + NumberOfArgs).
    unsigned FirstArgIndex;
    unsigned NumberOfArgs;

    IRArgs()
        : PaddingArgIndex(InvalidIndex), FirstArgIndex(InvalidIndex),
          NumberOfArgs(0) {}
  };

  // One IRArgs entry per Clang-level argument, indexed by Clang arg number.
  SmallVector<IRArgs, 8> ArgInfo;

public:
  // Builds the full mapping eagerly; when OnlyRequiredArgs is set, variadic
  // extras beyond the required arguments are not mapped.
  ClangToLLVMArgMapping(const ASTContext &Context, const CGFunctionInfo &FI,
                        bool OnlyRequiredArgs = false)
      : InallocaArgNo(InvalidIndex), SRetArgNo(InvalidIndex), TotalIRArgs(0),
        ArgInfo(OnlyRequiredArgs ? FI.getNumRequiredArgs() : FI.arg_size()) {
    construct(Context, FI, OnlyRequiredArgs);
  }

  bool hasInallocaArg() const { return InallocaArgNo != InvalidIndex; }
  unsigned getInallocaArgNo() const {
    assert(hasInallocaArg());
    return InallocaArgNo;
  }

  bool hasSRetArg() const { return SRetArgNo != InvalidIndex; }
  unsigned getSRetArgNo() const {
    assert(hasSRetArg());
    return SRetArgNo;
  }

  unsigned totalIRArgs() const { return TotalIRArgs; }

  bool hasPaddingArg(unsigned ArgNo) const {
    assert(ArgNo < ArgInfo.size());
    return ArgInfo[ArgNo].PaddingArgIndex != InvalidIndex;
  }
  unsigned getPaddingArgNo(unsigned ArgNo) const {
    assert(hasPaddingArg(ArgNo));
    return ArgInfo[ArgNo].PaddingArgIndex;
  }

  /// Returns index of first IR argument corresponding to ArgNo, and their
  /// quantity.
  std::pair<unsigned, unsigned> getIRArgs(unsigned ArgNo) const {
    assert(ArgNo < ArgInfo.size());
    return std::make_pair(x: ArgInfo[ArgNo].FirstArgIndex,
                          y: ArgInfo[ArgNo].NumberOfArgs);
  }

private:
  void construct(const ASTContext &Context, const CGFunctionInfo &FI,
                 bool OnlyRequiredArgs);
};
1676
// Walks the Clang arguments in order, assigning consecutive IR argument
// indices according to each argument's ABI classification.
void ClangToLLVMArgMapping::construct(const ASTContext &Context,
                                      const CGFunctionInfo &FI,
                                      bool OnlyRequiredArgs) {
  unsigned IRArgNo = 0;
  bool SwapThisWithSRet = false;
  const ABIArgInfo &RetAI = FI.getReturnInfo();

  // An indirect return takes an sret pointer slot; some ABIs place it after
  // the 'this' argument rather than first.
  if (RetAI.getKind() == ABIArgInfo::Indirect) {
    SwapThisWithSRet = RetAI.isSRetAfterThis();
    SRetArgNo = SwapThisWithSRet ? 1 : IRArgNo++;
  }

  unsigned ArgNo = 0;
  unsigned NumArgs = OnlyRequiredArgs ? FI.getNumRequiredArgs() : FI.arg_size();
  for (CGFunctionInfo::const_arg_iterator I = FI.arg_begin(); ArgNo < NumArgs;
       ++I, ++ArgNo) {
    assert(I != FI.arg_end());
    QualType ArgType = I->type;
    const ABIArgInfo &AI = I->info;
    // Collect data about IR arguments corresponding to Clang argument ArgNo.
    auto &IRArgs = ArgInfo[ArgNo];

    // Padding (for alignment) occupies its own IR slot before the argument.
    if (AI.getPaddingType())
      IRArgs.PaddingArgIndex = IRArgNo++;

    switch (AI.getKind()) {
    case ABIArgInfo::TargetSpecific:
    case ABIArgInfo::Extend:
    case ABIArgInfo::Direct: {
      // FIXME: handle sseregparm someday...
      // A flattenable struct is split into one IR argument per field.
      llvm::StructType *STy = dyn_cast<llvm::StructType>(Val: AI.getCoerceToType());
      if (AI.isDirect() && AI.getCanBeFlattened() && STy) {
        IRArgs.NumberOfArgs = STy->getNumElements();
      } else {
        IRArgs.NumberOfArgs = 1;
      }
      break;
    }
    case ABIArgInfo::Indirect:
    case ABIArgInfo::IndirectAliased:
      IRArgs.NumberOfArgs = 1;
      break;
    case ABIArgInfo::Ignore:
    case ABIArgInfo::InAlloca:
      // ignore and inalloca doesn't have matching LLVM parameters.
      IRArgs.NumberOfArgs = 0;
      break;
    case ABIArgInfo::CoerceAndExpand:
      IRArgs.NumberOfArgs = AI.getCoerceAndExpandTypeSequence().size();
      break;
    case ABIArgInfo::Expand:
      IRArgs.NumberOfArgs = getExpansionSize(Ty: ArgType, Context);
      break;
    }

    if (IRArgs.NumberOfArgs > 0) {
      IRArgs.FirstArgIndex = IRArgNo;
      IRArgNo += IRArgs.NumberOfArgs;
    }

    // Skip over the sret parameter when it comes second. We already handled it
    // above.
    if (IRArgNo == 1 && SwapThisWithSRet)
      IRArgNo++;
  }
  assert(ArgNo == ArgInfo.size());

  // The inalloca pointer, if used, is always the last IR argument.
  if (FI.usesInAlloca())
    InallocaArgNo = IRArgNo++;

  TotalIRArgs = IRArgNo;
}
} // namespace
1750
1751/***/
1752
1753bool CodeGenModule::ReturnTypeUsesSRet(const CGFunctionInfo &FI) {
1754 const auto &RI = FI.getReturnInfo();
1755 return RI.isIndirect() || (RI.isInAlloca() && RI.getInAllocaSRet());
1756}
1757
1758bool CodeGenModule::ReturnTypeHasInReg(const CGFunctionInfo &FI) {
1759 const auto &RI = FI.getReturnInfo();
1760 return RI.getInReg();
1761}
1762
1763bool CodeGenModule::ReturnSlotInterferesWithArgs(const CGFunctionInfo &FI) {
1764 return ReturnTypeUsesSRet(FI) &&
1765 getTargetCodeGenInfo().doesReturnSlotInterfereWithArgs();
1766}
1767
1768bool CodeGenModule::ReturnTypeUsesFPRet(QualType ResultType) {
1769 if (const BuiltinType *BT = ResultType->getAs<BuiltinType>()) {
1770 switch (BT->getKind()) {
1771 default:
1772 return false;
1773 case BuiltinType::Float:
1774 return getTarget().useObjCFPRetForRealType(T: FloatModeKind::Float);
1775 case BuiltinType::Double:
1776 return getTarget().useObjCFPRetForRealType(T: FloatModeKind::Double);
1777 case BuiltinType::LongDouble:
1778 return getTarget().useObjCFPRetForRealType(T: FloatModeKind::LongDouble);
1779 }
1780 }
1781
1782 return false;
1783}
1784
1785bool CodeGenModule::ReturnTypeUsesFP2Ret(QualType ResultType) {
1786 if (const ComplexType *CT = ResultType->getAs<ComplexType>()) {
1787 if (const BuiltinType *BT = CT->getElementType()->getAs<BuiltinType>()) {
1788 if (BT->getKind() == BuiltinType::LongDouble)
1789 return getTarget().useObjCFP2RetForComplexLongDouble();
1790 }
1791 }
1792
1793 return false;
1794}
1795
1796llvm::FunctionType *CodeGenTypes::GetFunctionType(GlobalDecl GD) {
1797 const CGFunctionInfo &FI = arrangeGlobalDeclaration(GD);
1798 return GetFunctionType(Info: FI);
1799}
1800
/// Lower \p FI to an LLVM function type, mapping the Clang-level return and
/// argument ABI classifications onto IR parameter slots via
/// ClangToLLVMArgMapping.
llvm::FunctionType *CodeGenTypes::GetFunctionType(const CGFunctionInfo &FI) {

  // Guard against recursive lowering of the same signature.
  bool Inserted = FunctionsBeingProcessed.insert(Ptr: &FI).second;
  (void)Inserted;
  assert(Inserted && "Recursively being processed?");

  // Lower the return type according to its ABI classification.
  llvm::Type *resultType = nullptr;
  const ABIArgInfo &retAI = FI.getReturnInfo();
  switch (retAI.getKind()) {
  case ABIArgInfo::Expand:
  case ABIArgInfo::IndirectAliased:
    llvm_unreachable("Invalid ABI kind for return argument");

  case ABIArgInfo::TargetSpecific:
  case ABIArgInfo::Extend:
  case ABIArgInfo::Direct:
    resultType = retAI.getCoerceToType();
    break;

  case ABIArgInfo::InAlloca:
    if (retAI.getInAllocaSRet()) {
      // sret things on win32 aren't void, they return the sret pointer.
      QualType ret = FI.getReturnType();
      unsigned addressSpace = CGM.getTypes().getTargetAddressSpace(T: ret);
      resultType = llvm::PointerType::get(C&: getLLVMContext(), AddressSpace: addressSpace);
    } else {
      resultType = llvm::Type::getVoidTy(C&: getLLVMContext());
    }
    break;

  case ABIArgInfo::Indirect:
  case ABIArgInfo::Ignore:
    resultType = llvm::Type::getVoidTy(C&: getLLVMContext());
    break;

  case ABIArgInfo::CoerceAndExpand:
    resultType = retAI.getUnpaddedCoerceAndExpandType();
    break;
  }

  // Only required (non-variadic-extra) arguments appear in the IR type.
  ClangToLLVMArgMapping IRFunctionArgs(getContext(), FI, true);
  SmallVector<llvm::Type *, 8> ArgTypes(IRFunctionArgs.totalIRArgs());

  // Add type for sret argument.
  if (IRFunctionArgs.hasSRetArg()) {
    ArgTypes[IRFunctionArgs.getSRetArgNo()] = llvm::PointerType::get(
        C&: getLLVMContext(), AddressSpace: FI.getReturnInfo().getIndirectAddrSpace());
  }

  // Add type for inalloca argument.
  if (IRFunctionArgs.hasInallocaArg())
    ArgTypes[IRFunctionArgs.getInallocaArgNo()] =
        llvm::PointerType::getUnqual(C&: getLLVMContext());

  // Add in all of the required arguments.
  unsigned ArgNo = 0;
  CGFunctionInfo::const_arg_iterator it = FI.arg_begin(),
                                     ie = it + FI.getNumRequiredArgs();
  for (; it != ie; ++it, ++ArgNo) {
    const ABIArgInfo &ArgInfo = it->info;

    // Insert a padding type to ensure proper alignment.
    if (IRFunctionArgs.hasPaddingArg(ArgNo))
      ArgTypes[IRFunctionArgs.getPaddingArgNo(ArgNo)] =
          ArgInfo.getPaddingType();

    unsigned FirstIRArg, NumIRArgs;
    std::tie(args&: FirstIRArg, args&: NumIRArgs) = IRFunctionArgs.getIRArgs(ArgNo);

    switch (ArgInfo.getKind()) {
    case ABIArgInfo::Ignore:
    case ABIArgInfo::InAlloca:
      assert(NumIRArgs == 0);
      break;

    case ABIArgInfo::Indirect:
      assert(NumIRArgs == 1);
      // indirect arguments are always on the stack, which is alloca addr space.
      ArgTypes[FirstIRArg] = llvm::PointerType::get(
          C&: getLLVMContext(), AddressSpace: CGM.getDataLayout().getAllocaAddrSpace());
      break;
    case ABIArgInfo::IndirectAliased:
      assert(NumIRArgs == 1);
      ArgTypes[FirstIRArg] = llvm::PointerType::get(
          C&: getLLVMContext(), AddressSpace: ArgInfo.getIndirectAddrSpace());
      break;
    case ABIArgInfo::TargetSpecific:
    case ABIArgInfo::Extend:
    case ABIArgInfo::Direct: {
      // Fast-isel and the optimizer generally like scalar values better than
      // FCAs, so we flatten them if this is safe to do for this argument.
      llvm::Type *argType = ArgInfo.getCoerceToType();
      llvm::StructType *st = dyn_cast<llvm::StructType>(Val: argType);
      if (st && ArgInfo.isDirect() && ArgInfo.getCanBeFlattened()) {
        assert(NumIRArgs == st->getNumElements());
        for (unsigned i = 0, e = st->getNumElements(); i != e; ++i)
          ArgTypes[FirstIRArg + i] = st->getElementType(N: i);
      } else {
        assert(NumIRArgs == 1);
        ArgTypes[FirstIRArg] = argType;
      }
      break;
    }

    case ABIArgInfo::CoerceAndExpand: {
      // Each element of the coercion sequence becomes its own IR argument.
      auto ArgTypesIter = ArgTypes.begin() + FirstIRArg;
      for (auto *EltTy : ArgInfo.getCoerceAndExpandTypeSequence()) {
        *ArgTypesIter++ = EltTy;
      }
      assert(ArgTypesIter == ArgTypes.begin() + FirstIRArg + NumIRArgs);
      break;
    }

    case ABIArgInfo::Expand:
      // Recursively expand the Clang type into its scalar components.
      auto ArgTypesIter = ArgTypes.begin() + FirstIRArg;
      getExpandedTypes(Ty: it->type, TI&: ArgTypesIter);
      assert(ArgTypesIter == ArgTypes.begin() + FirstIRArg + NumIRArgs);
      break;
    }
  }

  bool Erased = FunctionsBeingProcessed.erase(Ptr: &FI);
  (void)Erased;
  assert(Erased && "Not in set?");

  return llvm::FunctionType::get(Result: resultType, Params: ArgTypes, isVarArg: FI.isVariadic());
}
1928
1929llvm::Type *CodeGenTypes::GetFunctionTypeForVTable(GlobalDecl GD) {
1930 const CXXMethodDecl *MD = cast<CXXMethodDecl>(Val: GD.getDecl());
1931 const FunctionProtoType *FPT = MD->getType()->castAs<FunctionProtoType>();
1932
1933 if (!isFuncTypeConvertible(FT: FPT))
1934 return llvm::StructType::get(Context&: getLLVMContext());
1935
1936 return GetFunctionType(GD);
1937}
1938
1939static void AddAttributesFromFunctionProtoType(ASTContext &Ctx,
1940 llvm::AttrBuilder &FuncAttrs,
1941 const FunctionProtoType *FPT) {
1942 if (!FPT)
1943 return;
1944
1945 if (!isUnresolvedExceptionSpec(ESpecType: FPT->getExceptionSpecType()) &&
1946 FPT->isNothrow())
1947 FuncAttrs.addAttribute(Val: llvm::Attribute::NoUnwind);
1948
1949 unsigned SMEBits = FPT->getAArch64SMEAttributes();
1950 if (SMEBits & FunctionType::SME_PStateSMEnabledMask)
1951 FuncAttrs.addAttribute(A: "aarch64_pstate_sm_enabled");
1952 if (SMEBits & FunctionType::SME_PStateSMCompatibleMask)
1953 FuncAttrs.addAttribute(A: "aarch64_pstate_sm_compatible");
1954 if (SMEBits & FunctionType::SME_AgnosticZAStateMask)
1955 FuncAttrs.addAttribute(A: "aarch64_za_state_agnostic");
1956
1957 // ZA
1958 if (FunctionType::getArmZAState(AttrBits: SMEBits) == FunctionType::ARM_Preserves)
1959 FuncAttrs.addAttribute(A: "aarch64_preserves_za");
1960 if (FunctionType::getArmZAState(AttrBits: SMEBits) == FunctionType::ARM_In)
1961 FuncAttrs.addAttribute(A: "aarch64_in_za");
1962 if (FunctionType::getArmZAState(AttrBits: SMEBits) == FunctionType::ARM_Out)
1963 FuncAttrs.addAttribute(A: "aarch64_out_za");
1964 if (FunctionType::getArmZAState(AttrBits: SMEBits) == FunctionType::ARM_InOut)
1965 FuncAttrs.addAttribute(A: "aarch64_inout_za");
1966
1967 // ZT0
1968 if (FunctionType::getArmZT0State(AttrBits: SMEBits) == FunctionType::ARM_Preserves)
1969 FuncAttrs.addAttribute(A: "aarch64_preserves_zt0");
1970 if (FunctionType::getArmZT0State(AttrBits: SMEBits) == FunctionType::ARM_In)
1971 FuncAttrs.addAttribute(A: "aarch64_in_zt0");
1972 if (FunctionType::getArmZT0State(AttrBits: SMEBits) == FunctionType::ARM_Out)
1973 FuncAttrs.addAttribute(A: "aarch64_out_zt0");
1974 if (FunctionType::getArmZT0State(AttrBits: SMEBits) == FunctionType::ARM_InOut)
1975 FuncAttrs.addAttribute(A: "aarch64_inout_zt0");
1976}
1977
1978static void AddAttributesFromOMPAssumes(llvm::AttrBuilder &FuncAttrs,
1979 const Decl *Callee) {
1980 if (!Callee)
1981 return;
1982
1983 SmallVector<StringRef, 4> Attrs;
1984
1985 for (const OMPAssumeAttr *AA : Callee->specific_attrs<OMPAssumeAttr>())
1986 AA->getAssumption().split(A&: Attrs, Separator: ",");
1987
1988 if (!Attrs.empty())
1989 FuncAttrs.addAttribute(A: llvm::AssumptionAttrKey,
1990 V: llvm::join(Begin: Attrs.begin(), End: Attrs.end(), Separator: ","));
1991}
1992
1993bool CodeGenModule::MayDropFunctionReturn(const ASTContext &Context,
1994 QualType ReturnType) const {
1995 // We can't just discard the return value for a record type with a
1996 // complex destructor or a non-trivially copyable type.
1997 if (const RecordType *RT =
1998 ReturnType.getCanonicalType()->getAsCanonical<RecordType>()) {
1999 if (const auto *ClassDecl = dyn_cast<CXXRecordDecl>(Val: RT->getDecl()))
2000 return ClassDecl->hasTrivialDestructor();
2001 }
2002 return ReturnType.isTriviallyCopyableType(Context);
2003}
2004
2005static bool HasStrictReturn(const CodeGenModule &Module, QualType RetTy,
2006 const Decl *TargetDecl) {
2007 // As-is msan can not tolerate noundef mismatch between caller and
2008 // implementation. Mismatch is possible for e.g. indirect calls from C-caller
2009 // into C++. Such mismatches lead to confusing false reports. To avoid
2010 // expensive workaround on msan we enforce initialization event in uncommon
2011 // cases where it's allowed.
2012 if (Module.getLangOpts().Sanitize.has(K: SanitizerKind::Memory))
2013 return true;
2014 // C++ explicitly makes returning undefined values UB. C's rule only applies
2015 // to used values, so we never mark them noundef for now.
2016 if (!Module.getLangOpts().CPlusPlus)
2017 return false;
2018 if (TargetDecl) {
2019 if (const FunctionDecl *FDecl = dyn_cast<FunctionDecl>(Val: TargetDecl)) {
2020 if (FDecl->isExternC())
2021 return false;
2022 } else if (const VarDecl *VDecl = dyn_cast<VarDecl>(Val: TargetDecl)) {
2023 // Function pointer.
2024 if (VDecl->isExternC())
2025 return false;
2026 }
2027 }
2028
2029 // We don't want to be too aggressive with the return checking, unless
2030 // it's explicit in the code opts or we're using an appropriate sanitizer.
2031 // Try to respect what the programmer intended.
2032 return Module.getCodeGenOpts().StrictReturn ||
2033 !Module.MayDropFunctionReturn(Context: Module.getContext(), ReturnType: RetTy) ||
2034 Module.getLangOpts().Sanitize.has(K: SanitizerKind::Return);
2035}
2036
2037/// Add denormal-fp-math and denormal-fp-math-f32 as appropriate for the
2038/// requested denormal behavior, accounting for the overriding behavior of the
2039/// -f32 case.
2040static void addDenormalModeAttrs(llvm::DenormalMode FPDenormalMode,
2041 llvm::DenormalMode FP32DenormalMode,
2042 llvm::AttrBuilder &FuncAttrs) {
2043 llvm::DenormalFPEnv FPEnv(FPDenormalMode, FP32DenormalMode);
2044 if (FPEnv != llvm::DenormalFPEnv::getDefault())
2045 FuncAttrs.addDenormalFPEnvAttr(Mode: FPEnv);
2046}
2047
2048/// Add default attributes to a function, which have merge semantics under
2049/// -mlink-builtin-bitcode and should not simply overwrite any existing
2050/// attributes in the linked library.
2051static void
2052addMergableDefaultFunctionAttributes(const CodeGenOptions &CodeGenOpts,
2053 llvm::AttrBuilder &FuncAttrs) {
2054 addDenormalModeAttrs(FPDenormalMode: CodeGenOpts.FPDenormalMode, FP32DenormalMode: CodeGenOpts.FP32DenormalMode,
2055 FuncAttrs);
2056}
2057
/// Populate \p FuncAttrs with the default attributes implied purely by the
/// codegen and language options (no per-declaration information). When
/// \p AttrOnCallSite is set, only call-site-appropriate attributes are
/// added; otherwise definition-side attributes are added as well.
static void getTrivialDefaultFunctionAttributes(
    StringRef Name, bool HasOptnone, const CodeGenOptions &CodeGenOpts,
    const LangOptions &LangOpts, bool AttrOnCallSite,
    llvm::AttrBuilder &FuncAttrs) {
  // OptimizeNoneAttr takes precedence over -Os or -Oz. No warning needed.
  if (!HasOptnone) {
    if (CodeGenOpts.OptimizeSize)
      FuncAttrs.addAttribute(Val: llvm::Attribute::OptimizeForSize);
    if (CodeGenOpts.OptimizeSize == 2)
      FuncAttrs.addAttribute(Val: llvm::Attribute::MinSize);
  }

  if (CodeGenOpts.DisableRedZone)
    FuncAttrs.addAttribute(Val: llvm::Attribute::NoRedZone);
  if (CodeGenOpts.IndirectTlsSegRefs)
    FuncAttrs.addAttribute(A: "indirect-tls-seg-refs");
  if (CodeGenOpts.NoImplicitFloat)
    FuncAttrs.addAttribute(Val: llvm::Attribute::NoImplicitFloat);

  if (AttrOnCallSite) {
    // Attributes that should go on the call site only.
    // FIXME: Look for 'BuiltinAttr' on the function rather than re-checking
    // the -fno-builtin-foo list.
    if (!CodeGenOpts.SimplifyLibCalls || LangOpts.isNoBuiltinFunc(Name))
      FuncAttrs.addAttribute(Val: llvm::Attribute::NoBuiltin);
    if (!CodeGenOpts.TrapFuncName.empty())
      FuncAttrs.addAttribute(A: "trap-func-name", V: CodeGenOpts.TrapFuncName);
  } else {
    // Attributes that only make sense on a function definition.
    switch (CodeGenOpts.getFramePointer()) {
    case CodeGenOptions::FramePointerKind::None:
      // This is the default behavior.
      break;
    case CodeGenOptions::FramePointerKind::Reserved:
    case CodeGenOptions::FramePointerKind::NonLeafNoReserve:
    case CodeGenOptions::FramePointerKind::NonLeaf:
    case CodeGenOptions::FramePointerKind::All:
      FuncAttrs.addAttribute(A: "frame-pointer",
                             V: CodeGenOptions::getFramePointerKindName(
                                 Kind: CodeGenOpts.getFramePointer()));
    }

    if (CodeGenOpts.LessPreciseFPMAD)
      FuncAttrs.addAttribute(A: "less-precise-fpmad", V: "true");

    if (CodeGenOpts.NullPointerIsValid)
      FuncAttrs.addAttribute(Val: llvm::Attribute::NullPointerIsValid);

    if (LangOpts.getDefaultExceptionMode() == LangOptions::FPE_Ignore)
      FuncAttrs.addAttribute(A: "no-trapping-math", V: "true");

    // TODO: Are these all needed?
    // unsafe/inf/nan/nsz are handled by instruction-level FastMathFlags.
    if (CodeGenOpts.SoftFloat)
      FuncAttrs.addAttribute(A: "use-soft-float", V: "true");
    FuncAttrs.addAttribute(A: "stack-protector-buffer-size",
                           V: llvm::utostr(X: CodeGenOpts.SSPBufferSize));
    if (LangOpts.NoSignedZero)
      FuncAttrs.addAttribute(A: "no-signed-zeros-fp-math", V: "true");

    // TODO: Reciprocal estimate codegen options should apply to instructions?
    const std::vector<std::string> &Recips = CodeGenOpts.Reciprocals;
    if (!Recips.empty())
      FuncAttrs.addAttribute(A: "reciprocal-estimates", V: llvm::join(R: Recips, Separator: ","));

    if (!CodeGenOpts.PreferVectorWidth.empty() &&
        CodeGenOpts.PreferVectorWidth != "none")
      FuncAttrs.addAttribute(A: "prefer-vector-width",
                             V: CodeGenOpts.PreferVectorWidth);

    if (CodeGenOpts.StackRealignment)
      FuncAttrs.addAttribute(A: "stackrealign");
    if (CodeGenOpts.Backchain)
      FuncAttrs.addAttribute(A: "backchain");
    if (CodeGenOpts.EnableSegmentedStacks)
      FuncAttrs.addAttribute(A: "split-stack");

    if (CodeGenOpts.SpeculativeLoadHardening)
      FuncAttrs.addAttribute(Val: llvm::Attribute::SpeculativeLoadHardening);

    // Add zero-call-used-regs attribute.
    switch (CodeGenOpts.getZeroCallUsedRegs()) {
    case llvm::ZeroCallUsedRegs::ZeroCallUsedRegsKind::Skip:
      FuncAttrs.removeAttribute(A: "zero-call-used-regs");
      break;
    case llvm::ZeroCallUsedRegs::ZeroCallUsedRegsKind::UsedGPRArg:
      FuncAttrs.addAttribute(A: "zero-call-used-regs", V: "used-gpr-arg");
      break;
    case llvm::ZeroCallUsedRegs::ZeroCallUsedRegsKind::UsedGPR:
      FuncAttrs.addAttribute(A: "zero-call-used-regs", V: "used-gpr");
      break;
    case llvm::ZeroCallUsedRegs::ZeroCallUsedRegsKind::UsedArg:
      FuncAttrs.addAttribute(A: "zero-call-used-regs", V: "used-arg");
      break;
    case llvm::ZeroCallUsedRegs::ZeroCallUsedRegsKind::Used:
      FuncAttrs.addAttribute(A: "zero-call-used-regs", V: "used");
      break;
    case llvm::ZeroCallUsedRegs::ZeroCallUsedRegsKind::AllGPRArg:
      FuncAttrs.addAttribute(A: "zero-call-used-regs", V: "all-gpr-arg");
      break;
    case llvm::ZeroCallUsedRegs::ZeroCallUsedRegsKind::AllGPR:
      FuncAttrs.addAttribute(A: "zero-call-used-regs", V: "all-gpr");
      break;
    case llvm::ZeroCallUsedRegs::ZeroCallUsedRegsKind::AllArg:
      FuncAttrs.addAttribute(A: "zero-call-used-regs", V: "all-arg");
      break;
    case llvm::ZeroCallUsedRegs::ZeroCallUsedRegsKind::All:
      FuncAttrs.addAttribute(A: "zero-call-used-regs", V: "all");
      break;
    }
  }

  if (LangOpts.assumeFunctionsAreConvergent()) {
    // Conservatively, mark all functions and calls in CUDA and OpenCL as
    // convergent (meaning, they may call an intrinsically convergent op, such
    // as __syncthreads() / barrier(), and so can't have certain optimizations
    // applied around them). LLVM will remove this attribute where it safely
    // can.
    FuncAttrs.addAttribute(Val: llvm::Attribute::Convergent);
  }

  // TODO: NoUnwind attribute should be added for other GPU modes HIP,
  // OpenMP offload. AFAIK, neither of them support exceptions in device code.
  if ((LangOpts.CUDA && LangOpts.CUDAIsDevice) || LangOpts.OpenCL ||
      LangOpts.SYCLIsDevice) {
    FuncAttrs.addAttribute(Val: llvm::Attribute::NoUnwind);
  }

  if (CodeGenOpts.SaveRegParams && !AttrOnCallSite)
    FuncAttrs.addAttribute(A: "save-reg-params");

  // User-specified -mllvm style default function attributes ("key=value").
  for (StringRef Attr : CodeGenOpts.DefaultFunctionAttrs) {
    StringRef Var, Value;
    std::tie(args&: Var, args&: Value) = Attr.split(Separator: '=');
    FuncAttrs.addAttribute(A: Var, V: Value);
  }

  // Branch protection (BTI/PAC) attributes derived from the language options.
  TargetInfo::BranchProtectionInfo BPI(LangOpts);
  TargetCodeGenInfo::initBranchProtectionFnAttributes(BPI, FuncAttrs);
}
2197
/// Merges `target-features` from \TargetOpts and \F, and sets the result in
/// \FuncAttr
/// * features from \F are always kept
/// * a feature from \TargetOpts is kept if itself and its opposite are absent
/// from \F
static void
overrideFunctionFeaturesWithTargetFeatures(llvm::AttrBuilder &FuncAttr,
                                           const llvm::Function &F,
                                           const TargetOptions &TargetOpts) {
  auto FFeatures = F.getFnAttribute(Kind: "target-features");

  // Feature names (without the +/- prefix) claimed so far; first writer wins.
  llvm::StringSet<> MergedNames;
  SmallVector<StringRef> MergedFeatures;
  MergedFeatures.reserve(N: TargetOpts.Features.size());

  // Appends every feature whose bare name has not been claimed yet. Because
  // the function's own features are processed first, they take precedence
  // over the ones from TargetOpts.
  auto AddUnmergedFeatures = [&](auto &&FeatureRange) {
    for (StringRef Feature : FeatureRange) {
      if (Feature.empty())
        continue;
      assert(Feature[0] == '+' || Feature[0] == '-');
      StringRef Name = Feature.drop_front(N: 1);
      bool Merged = !MergedNames.insert(key: Name).second;
      if (!Merged)
        MergedFeatures.push_back(Elt: Feature);
    }
  };

  if (FFeatures.isValid())
    AddUnmergedFeatures(llvm::split(Str: FFeatures.getValueAsString(), Separator: ','));
  AddUnmergedFeatures(TargetOpts.Features);

  if (!MergedFeatures.empty()) {
    // Sort for a deterministic attribute string.
    llvm::sort(C&: MergedFeatures);
    FuncAttr.addAttribute(A: "target-features", V: llvm::join(R&: MergedFeatures, Separator: ","));
  }
}
2234
/// Merge this translation unit's default function-definition attributes
/// (CPU, tune-CPU, trivial defaults, denormal environment, target features)
/// into \p F, as needed when linking builtin bitcode.
void CodeGen::mergeDefaultFunctionDefinitionAttributes(
    llvm::Function &F, const CodeGenOptions &CodeGenOpts,
    const LangOptions &LangOpts, const TargetOptions &TargetOpts,
    bool WillInternalize) {

  llvm::AttrBuilder FuncAttrs(F.getContext());
  // Here we only extract the options that are relevant compared to the version
  // from GetCPUAndFeaturesAttributes.
  if (!TargetOpts.CPU.empty())
    FuncAttrs.addAttribute(A: "target-cpu", V: TargetOpts.CPU);
  if (!TargetOpts.TuneCPU.empty())
    FuncAttrs.addAttribute(A: "tune-cpu", V: TargetOpts.TuneCPU);

  ::getTrivialDefaultFunctionAttributes(Name: F.getName(), HasOptnone: F.hasOptNone(),
                                        CodeGenOpts, LangOpts,
                                        /*AttrOnCallSite=*/false, FuncAttrs);

  if (!WillInternalize && F.isInterposable()) {
    // Do not promote "dynamic" denormal-fp-math to this translation unit's
    // setting for weak functions that won't be internalized. The user has no
    // real control for how builtin bitcode is linked, so we shouldn't assume
    // later copies will use a consistent mode.
    F.addFnAttrs(Attrs: FuncAttrs);
    return;
  }

  llvm::AttributeMask AttrsToRemove;

  // Merge the denormal environment from this TU's options with the one the
  // function already carries; the callee's mode participates in the merge.
  llvm::DenormalFPEnv OptsFPEnv(CodeGenOpts.FPDenormalMode,
                                CodeGenOpts.FP32DenormalMode);
  llvm::DenormalFPEnv MergedFPEnv =
      OptsFPEnv.mergeCalleeMode(Callee: F.getDenormalFPEnv());

  if (MergedFPEnv == llvm::DenormalFPEnv::getDefault()) {
    // Default environment: drop the attribute entirely.
    AttrsToRemove.addAttribute(Val: llvm::Attribute::DenormalFPEnv);
  } else {
    // Overwrite existing attribute
    FuncAttrs.addDenormalFPEnvAttr(Mode: MergedFPEnv);
  }

  F.removeFnAttrs(Attrs: AttrsToRemove);

  overrideFunctionFeaturesWithTargetFeatures(FuncAttr&: FuncAttrs, F, TargetOpts);

  F.addFnAttrs(Attrs: FuncAttrs);
}
2281
2282void CodeGenModule::getTrivialDefaultFunctionAttributes(
2283 StringRef Name, bool HasOptnone, bool AttrOnCallSite,
2284 llvm::AttrBuilder &FuncAttrs) {
2285 ::getTrivialDefaultFunctionAttributes(Name, HasOptnone, CodeGenOpts: getCodeGenOpts(),
2286 LangOpts: getLangOpts(), AttrOnCallSite,
2287 FuncAttrs);
2288}
2289
2290void CodeGenModule::getDefaultFunctionAttributes(StringRef Name,
2291 bool HasOptnone,
2292 bool AttrOnCallSite,
2293 llvm::AttrBuilder &FuncAttrs) {
2294 getTrivialDefaultFunctionAttributes(Name, HasOptnone, AttrOnCallSite,
2295 FuncAttrs);
2296
2297 if (!AttrOnCallSite)
2298 TargetCodeGenInfo::initPointerAuthFnAttributes(Opts: CodeGenOpts.PointerAuth,
2299 FuncAttrs);
2300
2301 // If we're just getting the default, get the default values for mergeable
2302 // attributes.
2303 if (!AttrOnCallSite)
2304 addMergableDefaultFunctionAttributes(CodeGenOpts, FuncAttrs);
2305}
2306
2307void CodeGenModule::addDefaultFunctionDefinitionAttributes(
2308 llvm::AttrBuilder &attrs) {
2309 getDefaultFunctionAttributes(/*function name*/ Name: "", /*optnone*/ HasOptnone: false,
2310 /*for call*/ AttrOnCallSite: false, FuncAttrs&: attrs);
2311 GetCPUAndFeaturesAttributes(GD: GlobalDecl(), AttrBuilder&: attrs);
2312}
2313
2314static void addNoBuiltinAttributes(llvm::AttrBuilder &FuncAttrs,
2315 const LangOptions &LangOpts,
2316 const NoBuiltinAttr *NBA = nullptr) {
2317 auto AddNoBuiltinAttr = [&FuncAttrs](StringRef BuiltinName) {
2318 SmallString<32> AttributeName;
2319 AttributeName += "no-builtin-";
2320 AttributeName += BuiltinName;
2321 FuncAttrs.addAttribute(A: AttributeName);
2322 };
2323
2324 // First, handle the language options passed through -fno-builtin.
2325 if (LangOpts.NoBuiltin) {
2326 // -fno-builtin disables them all.
2327 FuncAttrs.addAttribute(A: "no-builtins");
2328 return;
2329 }
2330
2331 // Then, add attributes for builtins specified through -fno-builtin-<name>.
2332 llvm::for_each(Range: LangOpts.NoBuiltinFuncs, F: AddNoBuiltinAttr);
2333
2334 // Now, let's check the __attribute__((no_builtin("...")) attribute added to
2335 // the source.
2336 if (!NBA)
2337 return;
2338
2339 // If there is a wildcard in the builtin names specified through the
2340 // attribute, disable them all.
2341 if (llvm::is_contained(Range: NBA->builtinNames(), Element: "*")) {
2342 FuncAttrs.addAttribute(A: "no-builtins");
2343 return;
2344 }
2345
2346 // And last, add the rest of the builtin names.
2347 llvm::for_each(Range: NBA->builtinNames(), F: AddNoBuiltinAttr);
2348}
2349
/// Decide whether a value of Clang type \p QTy, lowered with ABI
/// classification \p AI, may be marked noundef in IR. \p CheckCoerce controls
/// whether the ABI coercion type is compared against the memory type (it is
/// disabled when recursing into element types).
static bool DetermineNoUndef(QualType QTy, CodeGenTypes &Types,
                             const llvm::DataLayout &DL, const ABIArgInfo &AI,
                             bool CheckCoerce = true) {
  llvm::Type *Ty = Types.ConvertTypeForMem(T: QTy);
  // Indirect values are passed as pointers, which must be valid.
  if (AI.getKind() == ABIArgInfo::Indirect ||
      AI.getKind() == ABIArgInfo::IndirectAliased)
    return true;
  // Sign/zero extension requires defined bits to extend.
  if (AI.getKind() == ABIArgInfo::Extend && !AI.isNoExt())
    return true;
  if (!DL.typeSizeEqualsStoreSize(Ty))
    // TODO: This will result in a modest amount of values not marked noundef
    // when they could be. We care about values that *invisibly* contain undef
    // bits from the perspective of LLVM IR.
    return false;
  if (CheckCoerce && AI.canHaveCoerceToType()) {
    llvm::Type *CoerceTy = AI.getCoerceToType();
    if (llvm::TypeSize::isKnownGT(LHS: DL.getTypeSizeInBits(Ty: CoerceTy),
                                  RHS: DL.getTypeSizeInBits(Ty)))
      // If we're coercing to a type with a greater size than the canonical one,
      // we're introducing new undef bits.
      // Coercing to a type of smaller or equal size is ok, as we know that
      // there's no internal padding (typeSizeEqualsStoreSize).
      return false;
  }
  if (QTy->isBitIntType())
    return true;
  if (QTy->isReferenceType())
    return true;
  if (QTy->isNullPtrType())
    return false;
  if (QTy->isMemberPointerType())
    // TODO: Some member pointers are `noundef`, but it depends on the ABI. For
    // now, never mark them.
    return false;
  if (QTy->isScalarType()) {
    // Complex values are noundef iff their element type is.
    if (const ComplexType *Complex = dyn_cast<ComplexType>(Val&: QTy))
      return DetermineNoUndef(QTy: Complex->getElementType(), Types, DL, AI, CheckCoerce: false);
    return true;
  }
  // Aggregate-like types: recurse into the element type.
  if (const VectorType *Vector = dyn_cast<VectorType>(Val&: QTy))
    return DetermineNoUndef(QTy: Vector->getElementType(), Types, DL, AI, CheckCoerce: false);
  if (const MatrixType *Matrix = dyn_cast<MatrixType>(Val&: QTy))
    return DetermineNoUndef(QTy: Matrix->getElementType(), Types, DL, AI, CheckCoerce: false);
  if (const ArrayType *Array = dyn_cast<ArrayType>(Val&: QTy))
    return DetermineNoUndef(QTy: Array->getElementType(), Types, DL, AI, CheckCoerce: false);

  // TODO: Some structs may be `noundef`, in specific situations.
  return false;
}
2399
2400/// Check if the argument of a function has maybe_undef attribute.
2401static bool IsArgumentMaybeUndef(const Decl *TargetDecl,
2402 unsigned NumRequiredArgs, unsigned ArgNo) {
2403 const auto *FD = dyn_cast_or_null<FunctionDecl>(Val: TargetDecl);
2404 if (!FD)
2405 return false;
2406
2407 // Assume variadic arguments do not have maybe_undef attribute.
2408 if (ArgNo >= NumRequiredArgs)
2409 return false;
2410
2411 // Check if argument has maybe_undef attribute.
2412 if (ArgNo < FD->getNumParams()) {
2413 const ParmVarDecl *Param = FD->getParamDecl(i: ArgNo);
2414 if (Param && Param->hasAttr<MaybeUndefAttr>())
2415 return true;
2416 }
2417
2418 return false;
2419}
2420
2421/// Test if it's legal to apply nofpclass for the given parameter type and it's
2422/// lowered IR type.
2423static bool canApplyNoFPClass(const ABIArgInfo &AI, QualType ParamType,
2424 bool IsReturn) {
2425 // Should only apply to FP types in the source, not ABI promoted.
2426 if (!ParamType->hasFloatingRepresentation())
2427 return false;
2428
2429 // The promoted-to IR type also needs to support nofpclass.
2430 llvm::Type *IRTy = AI.getCoerceToType();
2431 if (llvm::AttributeFuncs::isNoFPClassCompatibleType(Ty: IRTy))
2432 return true;
2433
2434 if (llvm::StructType *ST = dyn_cast<llvm::StructType>(Val: IRTy)) {
2435 return !IsReturn && AI.getCanBeFlattened() &&
2436 llvm::all_of(Range: ST->elements(),
2437 P: llvm::AttributeFuncs::isNoFPClassCompatibleType);
2438 }
2439
2440 return false;
2441}
2442
2443/// Return the nofpclass mask that can be applied to floating-point parameters.
2444static llvm::FPClassTest getNoFPClassTestMask(const LangOptions &LangOpts) {
2445 llvm::FPClassTest Mask = llvm::fcNone;
2446 if (LangOpts.NoHonorInfs)
2447 Mask |= llvm::fcInf;
2448 if (LangOpts.NoHonorNaNs)
2449 Mask |= llvm::fcNan;
2450 return Mask;
2451}
2452
2453void CodeGenModule::AdjustMemoryAttribute(StringRef Name,
2454 CGCalleeInfo CalleeInfo,
2455 llvm::AttributeList &Attrs) {
2456 if (Attrs.getMemoryEffects().getModRef() == llvm::ModRefInfo::NoModRef) {
2457 Attrs = Attrs.removeFnAttribute(C&: getLLVMContext(), Kind: llvm::Attribute::Memory);
2458 llvm::Attribute MemoryAttr = llvm::Attribute::getWithMemoryEffects(
2459 Context&: getLLVMContext(), ME: llvm::MemoryEffects::writeOnly());
2460 Attrs = Attrs.addFnAttribute(C&: getLLVMContext(), Attr: MemoryAttr);
2461 }
2462}
2463
/// Construct the IR attribute list of a function or call.
///
/// When adding an attribute, please consider where it should be handled:
///
///   - getDefaultFunctionAttributes is for attributes that are essentially
///     part of the global target configuration (but perhaps can be
///     overridden on a per-function basis).  Adding attributes there
///     will cause them to also be set in frontends that build on Clang's
///     target-configuration logic, as well as for code defined in library
///     modules such as CUDA's libdevice.
///
///   - ConstructAttributeList builds on top of getDefaultFunctionAttributes
///     and adds declaration-specific, convention-specific, and
///     frontend-specific logic.  The last is of particular importance:
///     attributes that restrict how the frontend generates code must be
///     added here rather than getDefaultFunctionAttributes.
///
void CodeGenModule::ConstructAttributeList(StringRef Name,
                                           const CGFunctionInfo &FI,
                                           CGCalleeInfo CalleeInfo,
                                           llvm::AttributeList &AttrList,
                                           unsigned &CallingConv,
                                           bool AttrOnCallSite, bool IsThunk) {
  llvm::AttrBuilder FuncAttrs(getLLVMContext());
  llvm::AttrBuilder RetAttrs(getLLVMContext());

  // Collect function IR attributes from the CC lowering.
  // We'll collect the parameter and result attributes later.
  CallingConv = FI.getEffectiveCallingConvention();
  if (FI.isNoReturn())
    FuncAttrs.addAttribute(Val: llvm::Attribute::NoReturn);
  if (FI.isCmseNSCall())
    FuncAttrs.addAttribute(A: "cmse_nonsecure_call");

  // Collect function IR attributes from the callee prototype if we have one.
  AddAttributesFromFunctionProtoType(Ctx&: getContext(), FuncAttrs,
                                     FPT: CalleeInfo.getCalleeFunctionProtoType());
  const Decl *TargetDecl = CalleeInfo.getCalleeDecl().getDecl();

  // Attach assumption attributes to the declaration. If this is a call
  // site, attach assumptions from the caller to the call as well.
  AddAttributesFromOMPAssumes(FuncAttrs, Callee: TargetDecl);

  bool HasOptnone = false;
  // The NoBuiltinAttr attached to the target FunctionDecl.
  const NoBuiltinAttr *NBA = nullptr;

  // Some ABIs may result in additional accesses to arguments that may
  // otherwise not be present.
  // Memory attribute to place on pointer arguments of const/pure functions
  // (set below when those attributes are seen).
  std::optional<llvm::Attribute::AttrKind> MemAttrForPtrArgs;
  bool AddedPotentialArgAccess = false;
  // Record that the callee may access argument memory (sret, byval,
  // inalloca, varargs); widens any existing memory(...) attribute by argmem.
  auto AddPotentialArgAccess = [&]() {
    AddedPotentialArgAccess = true;
    llvm::Attribute A = FuncAttrs.getAttribute(Kind: llvm::Attribute::Memory);
    if (A.isValid())
      FuncAttrs.addMemoryAttr(ME: A.getMemoryEffects() |
                                  llvm::MemoryEffects::argMemOnly());
  };

  // Collect function IR attributes based on declaration-specific
  // information.
  // FIXME: handle sseregparm someday...
  if (TargetDecl) {
    if (TargetDecl->hasAttr<ReturnsTwiceAttr>())
      FuncAttrs.addAttribute(Val: llvm::Attribute::ReturnsTwice);
    if (TargetDecl->hasAttr<NoThrowAttr>())
      FuncAttrs.addAttribute(Val: llvm::Attribute::NoUnwind);
    if (TargetDecl->hasAttr<NoReturnAttr>())
      FuncAttrs.addAttribute(Val: llvm::Attribute::NoReturn);
    if (TargetDecl->hasAttr<ColdAttr>())
      FuncAttrs.addAttribute(Val: llvm::Attribute::Cold);
    if (TargetDecl->hasAttr<HotAttr>())
      FuncAttrs.addAttribute(Val: llvm::Attribute::Hot);
    if (TargetDecl->hasAttr<NoDuplicateAttr>())
      FuncAttrs.addAttribute(Val: llvm::Attribute::NoDuplicate);
    if (TargetDecl->hasAttr<ConvergentAttr>())
      FuncAttrs.addAttribute(Val: llvm::Attribute::Convergent);

    if (const FunctionDecl *Fn = dyn_cast<FunctionDecl>(Val: TargetDecl)) {
      AddAttributesFromFunctionProtoType(
          Ctx&: getContext(), FuncAttrs, FPT: Fn->getType()->getAs<FunctionProtoType>());
      if (AttrOnCallSite && Fn->isReplaceableGlobalAllocationFunction()) {
        // A sane operator new returns a non-aliasing pointer.
        auto Kind = Fn->getDeclName().getCXXOverloadedOperator();
        if (getCodeGenOpts().AssumeSaneOperatorNew &&
            (Kind == OO_New || Kind == OO_Array_New))
          RetAttrs.addAttribute(Val: llvm::Attribute::NoAlias);
      }
      const CXXMethodDecl *MD = dyn_cast<CXXMethodDecl>(Val: Fn);
      const bool IsVirtualCall = MD && MD->isVirtual();
      // Don't use [[noreturn]], _Noreturn or [[no_builtin]] for a call to a
      // virtual function. These attributes are not inherited by overloads.
      if (!(AttrOnCallSite && IsVirtualCall)) {
        if (Fn->isNoReturn())
          FuncAttrs.addAttribute(Val: llvm::Attribute::NoReturn);
        NBA = Fn->getAttr<NoBuiltinAttr>();
      }
    }

    if (isa<FunctionDecl>(Val: TargetDecl) || isa<VarDecl>(Val: TargetDecl)) {
      // Only place nomerge attribute on call sites, never functions. This
      // allows it to work on indirect virtual function calls.
      if (AttrOnCallSite && TargetDecl->hasAttr<NoMergeAttr>())
        FuncAttrs.addAttribute(Val: llvm::Attribute::NoMerge);
    }

    // 'const', 'pure' and 'noalias' attributed functions are also nounwind.
    if (TargetDecl->hasAttr<ConstAttr>()) {
      FuncAttrs.addMemoryAttr(ME: llvm::MemoryEffects::none());
      FuncAttrs.addAttribute(Val: llvm::Attribute::NoUnwind);
      // gcc specifies that 'const' functions have greater restrictions than
      // 'pure' functions, so they also cannot have infinite loops.
      FuncAttrs.addAttribute(Val: llvm::Attribute::WillReturn);
      MemAttrForPtrArgs = llvm::Attribute::ReadNone;
    } else if (TargetDecl->hasAttr<PureAttr>()) {
      FuncAttrs.addMemoryAttr(ME: llvm::MemoryEffects::readOnly());
      FuncAttrs.addAttribute(Val: llvm::Attribute::NoUnwind);
      // gcc specifies that 'pure' functions cannot have infinite loops.
      FuncAttrs.addAttribute(Val: llvm::Attribute::WillReturn);
      MemAttrForPtrArgs = llvm::Attribute::ReadOnly;
    } else if (TargetDecl->hasAttr<NoAliasAttr>()) {
      FuncAttrs.addMemoryAttr(ME: llvm::MemoryEffects::inaccessibleOrArgMemOnly());
      FuncAttrs.addAttribute(Val: llvm::Attribute::NoUnwind);
    }
    if (const auto *RA = TargetDecl->getAttr<RestrictAttr>();
        RA && RA->getDeallocator() == nullptr)
      RetAttrs.addAttribute(Val: llvm::Attribute::NoAlias);
    if (TargetDecl->hasAttr<ReturnsNonNullAttr>() &&
        !CodeGenOpts.NullPointerIsValid)
      RetAttrs.addAttribute(Val: llvm::Attribute::NonNull);
    if (TargetDecl->hasAttr<AnyX86NoCallerSavedRegistersAttr>())
      FuncAttrs.addAttribute(A: "no_caller_saved_registers");
    if (TargetDecl->hasAttr<AnyX86NoCfCheckAttr>())
      FuncAttrs.addAttribute(Val: llvm::Attribute::NoCfCheck);
    if (TargetDecl->hasAttr<LeafAttr>())
      FuncAttrs.addAttribute(Val: llvm::Attribute::NoCallback);
    if (TargetDecl->hasAttr<BPFFastCallAttr>())
      FuncAttrs.addAttribute(A: "bpf_fastcall");

    HasOptnone = TargetDecl->hasAttr<OptimizeNoneAttr>();
    if (auto *AllocSize = TargetDecl->getAttr<AllocSizeAttr>()) {
      std::optional<unsigned> NumElemsParam;
      if (AllocSize->getNumElemsParam().isValid())
        NumElemsParam = AllocSize->getNumElemsParam().getLLVMIndex();
      FuncAttrs.addAllocSizeAttr(ElemSizeArg: AllocSize->getElemSizeParam().getLLVMIndex(),
                                 NumElemsArg: NumElemsParam);
    }

    // OpenCL v2.0 work groups may be either uniform or non-uniform.
    // '-cl-uniform-work-group-size' compile option gets a hint
    // to the compiler that the global work-size be a multiple of
    // the work-group size specified to clEnqueueNDRangeKernel
    // (i.e. work groups are uniform).
    if (getLangOpts().OffloadUniformBlock)
      FuncAttrs.addAttribute(A: "uniform-work-group-size");

    if (TargetDecl->hasAttr<ArmLocallyStreamingAttr>())
      FuncAttrs.addAttribute(A: "aarch64_pstate_sm_body");

    if (auto *ModularFormat = TargetDecl->getAttr<ModularFormatAttr>()) {
      // NOTE(review): assumes a FormatAttr always accompanies
      // ModularFormatAttr (Format is dereferenced unchecked below) —
      // presumably enforced by Sema; confirm, else this is a null deref.
      FormatAttr *Format = TargetDecl->getAttr<FormatAttr>();
      StringRef Type = Format->getType()->getName();
      std::string FormatIdx = std::to_string(val: Format->getFormatIdx());
      std::string FirstArg = std::to_string(val: Format->getFirstArg());
      SmallVector<StringRef> Args = {
          Type, FormatIdx, FirstArg,
          ModularFormat->getModularImplFn()->getName(),
          ModularFormat->getImplName()};
      llvm::append_range(C&: Args, R: ModularFormat->aspects());
      FuncAttrs.addAttribute(A: "modular-format", V: llvm::join(R&: Args, Separator: ","));
    }
  }

  // Attach "no-builtins" attributes to:
  // * call sites: both `nobuiltin` and "no-builtins" or "no-builtin-<name>".
  // * definitions: "no-builtins" or "no-builtin-<name>" only.
  // The attributes can come from:
  // * LangOpts: -ffreestanding, -fno-builtin, -fno-builtin-<name>
  // * FunctionDecl attributes: __attribute__((no_builtin(...)))
  addNoBuiltinAttributes(FuncAttrs, LangOpts: getLangOpts(), NBA);

  // Collect function IR attributes based on global settings.
  getDefaultFunctionAttributes(Name, HasOptnone, AttrOnCallSite, FuncAttrs);

  // Override some default IR attributes based on declaration-specific
  // information.
  if (TargetDecl) {
    if (TargetDecl->hasAttr<NoSpeculativeLoadHardeningAttr>())
      FuncAttrs.removeAttribute(Val: llvm::Attribute::SpeculativeLoadHardening);
    if (TargetDecl->hasAttr<SpeculativeLoadHardeningAttr>())
      FuncAttrs.addAttribute(Val: llvm::Attribute::SpeculativeLoadHardening);
    if (TargetDecl->hasAttr<NoSplitStackAttr>())
      FuncAttrs.removeAttribute(A: "split-stack");
    if (TargetDecl->hasAttr<ZeroCallUsedRegsAttr>()) {
      // A function "__attribute__((...))" overrides the command-line flag.
      auto Kind =
          TargetDecl->getAttr<ZeroCallUsedRegsAttr>()->getZeroCallUsedRegs();
      FuncAttrs.removeAttribute(A: "zero-call-used-regs");
      FuncAttrs.addAttribute(
          A: "zero-call-used-regs",
          V: ZeroCallUsedRegsAttr::ConvertZeroCallUsedRegsKindToStr(Val: Kind));
    }

    // Add NonLazyBind attribute to function declarations when -fno-plt
    // is used.
    // FIXME: what if we just haven't processed the function definition
    // yet, or if it's an external definition like C99 inline?
    if (CodeGenOpts.NoPLT) {
      if (auto *Fn = dyn_cast<FunctionDecl>(Val: TargetDecl)) {
        if (!Fn->isDefined() && !AttrOnCallSite) {
          FuncAttrs.addAttribute(Val: llvm::Attribute::NonLazyBind);
        }
      }
    }
    // Remove 'convergent' if requested.
    if (TargetDecl->hasAttr<NoConvergentAttr>())
      FuncAttrs.removeAttribute(Val: llvm::Attribute::Convergent);
  }

  // Add "sample-profile-suffix-elision-policy" attribute for internal linkage
  // functions with -funique-internal-linkage-names.
  if (TargetDecl && CodeGenOpts.UniqueInternalLinkageNames) {
    if (const auto *FD = dyn_cast_or_null<FunctionDecl>(Val: TargetDecl)) {
      if (!FD->isExternallyVisible())
        FuncAttrs.addAttribute(A: "sample-profile-suffix-elision-policy",
                               V: "selected");
    }
  }

  // Collect non-call-site function IR attributes from declaration-specific
  // information.
  if (!AttrOnCallSite) {
    if (TargetDecl && TargetDecl->hasAttr<CmseNSEntryAttr>())
      FuncAttrs.addAttribute(A: "cmse_nonsecure_entry");

    // Whether tail calls are enabled.
    auto shouldDisableTailCalls = [&] {
      // Should this be honored in getDefaultFunctionAttributes?
      if (CodeGenOpts.DisableTailCalls)
        return true;

      if (!TargetDecl)
        return false;

      if (TargetDecl->hasAttr<DisableTailCallsAttr>() ||
          TargetDecl->hasAttr<AnyX86InterruptAttr>())
        return true;

      if (CodeGenOpts.NoEscapingBlockTailCalls) {
        if (const auto *BD = dyn_cast<BlockDecl>(Val: TargetDecl))
          if (!BD->doesNotEscape())
            return true;
      }

      return false;
    };
    if (shouldDisableTailCalls())
      FuncAttrs.addAttribute(A: "disable-tail-calls", V: "true");

    // These functions require the returns_twice attribute for correct codegen,
    // but the attribute may not be added if -fno-builtin is specified. We
    // explicitly add that attribute here.
    static const llvm::StringSet<> ReturnsTwiceFn{
        "_setjmpex", "setjmp",      "_setjmp", "vfork",
        "sigsetjmp", "__sigsetjmp", "savectx", "getcontext"};
    if (ReturnsTwiceFn.contains(key: Name))
      FuncAttrs.addAttribute(Val: llvm::Attribute::ReturnsTwice);

    // CPU/feature overrides.  addDefaultFunctionDefinitionAttributes
    // handles these separately to set them based on the global defaults.
    GetCPUAndFeaturesAttributes(GD: CalleeInfo.getCalleeDecl(), AttrBuilder&: FuncAttrs);

    // Windows hotpatching support
    if (!MSHotPatchFunctions.empty()) {
      bool IsHotPatched = llvm::binary_search(Range&: MSHotPatchFunctions, Value&: Name);
      if (IsHotPatched)
        FuncAttrs.addAttribute(A: "marked_for_windows_hot_patching");
    }
  }

  // Mark functions that are replaceable by the loader.
  if (CodeGenOpts.isLoaderReplaceableFunctionName(FuncName: Name))
    FuncAttrs.addAttribute(A: "loader-replaceable");

  // Collect attributes from arguments and return values.
  ClangToLLVMArgMapping IRFunctionArgs(getContext(), FI);

  QualType RetTy = FI.getReturnType();
  const ABIArgInfo &RetAI = FI.getReturnInfo();
  const llvm::DataLayout &DL = getDataLayout();

  // Determine if the return type could be partially undef
  if (CodeGenOpts.EnableNoundefAttrs &&
      HasStrictReturn(Module: *this, RetTy, TargetDecl)) {
    if (!RetTy->isVoidType() && RetAI.getKind() != ABIArgInfo::Indirect &&
        DetermineNoUndef(QTy: RetTy, Types&: getTypes(), DL, AI: RetAI))
      RetAttrs.addAttribute(Val: llvm::Attribute::NoUndef);
  }

  switch (RetAI.getKind()) {
  case ABIArgInfo::Extend:
    if (RetAI.isSignExt())
      RetAttrs.addAttribute(Val: llvm::Attribute::SExt);
    else if (RetAI.isZeroExt())
      RetAttrs.addAttribute(Val: llvm::Attribute::ZExt);
    else
      RetAttrs.addAttribute(Val: llvm::Attribute::NoExt);
    [[fallthrough]];
  case ABIArgInfo::TargetSpecific:
  case ABIArgInfo::Direct:
    if (RetAI.getInReg())
      RetAttrs.addAttribute(Val: llvm::Attribute::InReg);

    if (canApplyNoFPClass(AI: RetAI, ParamType: RetTy, IsReturn: true))
      RetAttrs.addNoFPClassAttr(NoFPClassMask: getNoFPClassTestMask(LangOpts: getLangOpts()));

    break;
  case ABIArgInfo::Ignore:
    break;

  case ABIArgInfo::InAlloca:
  case ABIArgInfo::Indirect: {
    // inalloca and sret disable readnone and readonly
    AddPotentialArgAccess();
    break;
  }

  case ABIArgInfo::CoerceAndExpand:
    break;

  case ABIArgInfo::Expand:
  case ABIArgInfo::IndirectAliased:
    llvm_unreachable("Invalid ABI kind for return argument");
  }

  if (!IsThunk) {
    // FIXME: fix this properly, https://reviews.llvm.org/D100388
    if (const auto *RefTy = RetTy->getAs<ReferenceType>()) {
      QualType PTy = RefTy->getPointeeType();
      if (!PTy->isIncompleteType() && PTy->isConstantSizeType())
        RetAttrs.addDereferenceableAttr(
            Bytes: getMinimumObjectSize(Ty: PTy).getQuantity());
      if (getTypes().getTargetAddressSpace(T: PTy) == 0 &&
          !CodeGenOpts.NullPointerIsValid)
        RetAttrs.addAttribute(Val: llvm::Attribute::NonNull);
      if (PTy->isObjectType()) {
        llvm::Align Alignment =
            getNaturalPointeeTypeAlignment(T: RetTy).getAsAlign();
        RetAttrs.addAlignmentAttr(Align: Alignment);
      }
    }
  }

  // Tracks whether the IR sret slot has been claimed, either by the return
  // value or later by a Swift indirect result.
  bool hasUsedSRet = false;
  SmallVector<llvm::AttributeSet, 4> ArgAttrs(IRFunctionArgs.totalIRArgs());

  // Attach attributes to sret.
  if (IRFunctionArgs.hasSRetArg()) {
    llvm::AttrBuilder SRETAttrs(getLLVMContext());
    SRETAttrs.addStructRetAttr(Ty: getTypes().ConvertTypeForMem(T: RetTy));
    SRETAttrs.addAttribute(Val: llvm::Attribute::Writable);
    SRETAttrs.addAttribute(Val: llvm::Attribute::DeadOnUnwind);
    hasUsedSRet = true;
    if (RetAI.getInReg())
      SRETAttrs.addAttribute(Val: llvm::Attribute::InReg);
    SRETAttrs.addAlignmentAttr(Align: RetAI.getIndirectAlign().getQuantity());
    ArgAttrs[IRFunctionArgs.getSRetArgNo()] =
        llvm::AttributeSet::get(C&: getLLVMContext(), B: SRETAttrs);
  }

  // Attach attributes to inalloca argument.
  if (IRFunctionArgs.hasInallocaArg()) {
    llvm::AttrBuilder Attrs(getLLVMContext());
    Attrs.addInAllocaAttr(Ty: FI.getArgStruct());
    ArgAttrs[IRFunctionArgs.getInallocaArgNo()] =
        llvm::AttributeSet::get(C&: getLLVMContext(), B: Attrs);
  }

  // Apply `nonnull`, `dereferenceable(N)` and `align N` to the `this` argument,
  // unless this is a thunk function. Add dead_on_return to the `this` argument
  // in base class destructors to aid in DSE.
  // FIXME: fix this properly, https://reviews.llvm.org/D100388
  if (FI.isInstanceMethod() && !IRFunctionArgs.hasInallocaArg() &&
      !FI.arg_begin()->type->isVoidPointerType() && !IsThunk) {
    auto IRArgs = IRFunctionArgs.getIRArgs(ArgNo: 0);

    assert(IRArgs.second == 1 && "Expected only a single `this` pointer.");

    llvm::AttrBuilder Attrs(getLLVMContext());

    QualType ThisTy = FI.arg_begin()->type.getTypePtr()->getPointeeType();

    if (!CodeGenOpts.NullPointerIsValid &&
        getTypes().getTargetAddressSpace(T: FI.arg_begin()->type) == 0) {
      Attrs.addAttribute(Val: llvm::Attribute::NonNull);
      Attrs.addDereferenceableAttr(Bytes: getMinimumObjectSize(Ty: ThisTy).getQuantity());
    } else {
      // FIXME dereferenceable should be correct here, regardless of
      // NullPointerIsValid. However, dereferenceable currently does not always
      // respect NullPointerIsValid and may imply nonnull and break the program.
      // See https://reviews.llvm.org/D66618 for discussions.
      Attrs.addDereferenceableOrNullAttr(
          Bytes: getMinimumObjectSize(
              Ty: FI.arg_begin()->type.castAs<PointerType>()->getPointeeType())
              .getQuantity());
    }

    llvm::Align Alignment =
        getNaturalTypeAlignment(T: ThisTy, /*BaseInfo=*/nullptr,
                                /*TBAAInfo=*/nullptr, /*forPointeeType=*/true)
            .getAsAlign();
    Attrs.addAlignmentAttr(Align: Alignment);

    const auto *DD = dyn_cast_if_present<CXXDestructorDecl>(
        Val: CalleeInfo.getCalleeDecl().getDecl());
    // Do not annotate vector deleting destructors with dead_on_return as the
    // this pointer in that case points to an array which we cannot
    // statically know the size of. Also do not mark deleting destructors
    // dead_on_return as then we might delete stores inside of a user-defined
    // operator delete implementation if it gets inlined, which would be
    // incorrect as the object's lifetime has already ended and the operator
    // delete implementation is allowed to manipulate the underlying storage.
    if (DD &&
        CalleeInfo.getCalleeDecl().getDtorType() !=
            CXXDtorType::Dtor_VectorDeleting &&
        CalleeInfo.getCalleeDecl().getDtorType() !=
            CXXDtorType::Dtor_Deleting &&
        CodeGenOpts.StrictLifetimes) {
      const CXXRecordDecl *ClassDecl =
          dyn_cast<CXXRecordDecl>(Val: DD->getDeclContext());
      // We cannot add dead_on_return if we have virtual base classes because
      // they will generally still be live after the base object destructor.
      if (ClassDecl->getNumVBases() == 0)
        Attrs.addDeadOnReturnAttr(Info: llvm::DeadOnReturnInfo(
            Context.getASTRecordLayout(D: ClassDecl).getDataSize().getQuantity()));
    }

    ArgAttrs[IRArgs.first] = llvm::AttributeSet::get(C&: getLLVMContext(), B: Attrs);
  }

  unsigned ArgNo = 0;
  for (CGFunctionInfo::const_arg_iterator I = FI.arg_begin(), E = FI.arg_end();
       I != E; ++I, ++ArgNo) {
    QualType ParamType = I->type;
    const ABIArgInfo &AI = I->info;
    llvm::AttrBuilder Attrs(getLLVMContext());

    // Add attribute for padding argument, if necessary.
    if (IRFunctionArgs.hasPaddingArg(ArgNo)) {
      if (AI.getPaddingInReg()) {
        ArgAttrs[IRFunctionArgs.getPaddingArgNo(ArgNo)] =
            llvm::AttributeSet::get(C&: getLLVMContext(),
                                    B: llvm::AttrBuilder(getLLVMContext())
                                        .addAttribute(Val: llvm::Attribute::InReg));
      }
    }

    // Decide whether the argument we're handling could be partially undef
    if (CodeGenOpts.EnableNoundefAttrs &&
        DetermineNoUndef(QTy: ParamType, Types&: getTypes(), DL, AI)) {
      Attrs.addAttribute(Val: llvm::Attribute::NoUndef);
    }

    // 'restrict' -> 'noalias' is done in EmitFunctionProlog when we
    // have the corresponding parameter variable.  It doesn't make
    // sense to do it here because parameters are so messed up.
    switch (AI.getKind()) {
    case ABIArgInfo::Extend:
      if (AI.isSignExt())
        Attrs.addAttribute(Val: llvm::Attribute::SExt);
      else if (AI.isZeroExt())
        Attrs.addAttribute(Val: llvm::Attribute::ZExt);
      else
        Attrs.addAttribute(Val: llvm::Attribute::NoExt);
      [[fallthrough]];
    case ABIArgInfo::TargetSpecific:
    case ABIArgInfo::Direct:
      if (ArgNo == 0 && FI.isChainCall())
        Attrs.addAttribute(Val: llvm::Attribute::Nest);
      else if (AI.getInReg())
        Attrs.addAttribute(Val: llvm::Attribute::InReg);
      Attrs.addStackAlignmentAttr(Align: llvm::MaybeAlign(AI.getDirectAlign()));

      if (canApplyNoFPClass(AI, ParamType, IsReturn: false))
        Attrs.addNoFPClassAttr(NoFPClassMask: getNoFPClassTestMask(LangOpts: getLangOpts()));
      break;
    case ABIArgInfo::Indirect: {
      if (AI.getInReg())
        Attrs.addAttribute(Val: llvm::Attribute::InReg);

      // HLSL out and inout parameters must not be marked with ByVal or
      // DeadOnReturn attributes because stores to these parameters by the
      // callee are visible to the caller.
      if (auto ParamABI = FI.getExtParameterInfo(argIndex: ArgNo).getABI();
          ParamABI != ParameterABI::HLSLOut &&
          ParamABI != ParameterABI::HLSLInOut) {

        // Depending on the ABI, this may be either a byval or a dead_on_return
        // argument.
        if (AI.getIndirectByVal()) {
          Attrs.addByValAttr(Ty: getTypes().ConvertTypeForMem(T: ParamType));
        } else {
          // Add dead_on_return when the object's lifetime ends in the callee.
          // This includes trivially-destructible objects, as well as objects
          // whose destruction / clean-up is carried out within the callee
          // (e.g., Obj-C ARC-managed structs, MSVC callee-destroyed objects).
          if (!ParamType.isDestructedType() || !ParamType->isRecordType() ||
              ParamType->castAsRecordDecl()->isParamDestroyedInCallee())
            Attrs.addDeadOnReturnAttr(Info: llvm::DeadOnReturnInfo());
        }
      }

      auto *Decl = ParamType->getAsRecordDecl();
      if (CodeGenOpts.PassByValueIsNoAlias && Decl &&
          Decl->getArgPassingRestrictions() ==
              RecordArgPassingKind::CanPassInRegs)
        // When calling the function, the pointer passed in will be the only
        // reference to the underlying object. Mark it accordingly.
        Attrs.addAttribute(Val: llvm::Attribute::NoAlias);

      // TODO: We could add the byref attribute if not byval, but it would
      // require updating many testcases.

      CharUnits Align = AI.getIndirectAlign();

      // In a byval argument, it is important that the required
      // alignment of the type is honored, as LLVM might be creating a
      // *new* stack object, and needs to know what alignment to give
      // it. (Sometimes it can deduce a sensible alignment on its own,
      // but not if clang decides it must emit a packed struct, or the
      // user specifies increased alignment requirements.)
      //
      // This is different from indirect *not* byval, where the object
      // exists already, and the align attribute is purely
      // informative.
      assert(!Align.isZero());

      // For now, only add this when we have a byval argument.
      // TODO: be less lazy about updating test cases.
      if (AI.getIndirectByVal())
        Attrs.addAlignmentAttr(Align: Align.getQuantity());

      // byval disables readnone and readonly.
      AddPotentialArgAccess();
      break;
    }
    case ABIArgInfo::IndirectAliased: {
      CharUnits Align = AI.getIndirectAlign();
      Attrs.addByRefAttr(Ty: getTypes().ConvertTypeForMem(T: ParamType));
      Attrs.addAlignmentAttr(Align: Align.getQuantity());
      break;
    }
    case ABIArgInfo::Ignore:
    case ABIArgInfo::Expand:
    case ABIArgInfo::CoerceAndExpand:
      break;

    case ABIArgInfo::InAlloca:
      // inalloca disables readnone and readonly.
      AddPotentialArgAccess();
      continue;
    }

    if (const auto *RefTy = ParamType->getAs<ReferenceType>()) {
      QualType PTy = RefTy->getPointeeType();
      if (!PTy->isIncompleteType() && PTy->isConstantSizeType())
        Attrs.addDereferenceableAttr(Bytes: getMinimumObjectSize(Ty: PTy).getQuantity());
      if (getTypes().getTargetAddressSpace(T: PTy) == 0 &&
          !CodeGenOpts.NullPointerIsValid)
        Attrs.addAttribute(Val: llvm::Attribute::NonNull);
      if (PTy->isObjectType()) {
        llvm::Align Alignment =
            getNaturalPointeeTypeAlignment(T: ParamType).getAsAlign();
        Attrs.addAlignmentAttr(Align: Alignment);
      }
    }

    // From OpenCL spec v3.0.10 section 6.3.5 Alignment of Types:
    // > For arguments to a __kernel function declared to be a pointer to a
    // > data type, the OpenCL compiler can assume that the pointee is always
    // > appropriately aligned as required by the data type.
    if (TargetDecl &&
        DeviceKernelAttr::isOpenCLSpelling(
            A: TargetDecl->getAttr<DeviceKernelAttr>()) &&
        ParamType->isPointerType()) {
      QualType PTy = ParamType->getPointeeType();
      if (!PTy->isIncompleteType() && PTy->isConstantSizeType()) {
        llvm::Align Alignment =
            getNaturalPointeeTypeAlignment(T: ParamType).getAsAlign();
        Attrs.addAlignmentAttr(Align: Alignment);
      }
    }

    switch (FI.getExtParameterInfo(argIndex: ArgNo).getABI()) {
    case ParameterABI::HLSLOut:
    case ParameterABI::HLSLInOut:
      Attrs.addAttribute(Val: llvm::Attribute::NoAlias);
      break;
    case ParameterABI::Ordinary:
      break;

    case ParameterABI::SwiftIndirectResult: {
      // Add 'sret' if we haven't already used it for something, but
      // only if the result is void.
      if (!hasUsedSRet && RetTy->isVoidType()) {
        Attrs.addStructRetAttr(Ty: getTypes().ConvertTypeForMem(T: ParamType));
        hasUsedSRet = true;
      }

      // Add 'noalias' in either case.
      Attrs.addAttribute(Val: llvm::Attribute::NoAlias);

      // Add 'dereferenceable' and 'alignment'.
      auto PTy = ParamType->getPointeeType();
      if (!PTy->isIncompleteType() && PTy->isConstantSizeType()) {
        auto info = getContext().getTypeInfoInChars(T: PTy);
        Attrs.addDereferenceableAttr(Bytes: info.Width.getQuantity());
        Attrs.addAlignmentAttr(Align: info.Align.getAsAlign());
      }
      break;
    }

    case ParameterABI::SwiftErrorResult:
      Attrs.addAttribute(Val: llvm::Attribute::SwiftError);
      break;

    case ParameterABI::SwiftContext:
      Attrs.addAttribute(Val: llvm::Attribute::SwiftSelf);
      break;

    case ParameterABI::SwiftAsyncContext:
      Attrs.addAttribute(Val: llvm::Attribute::SwiftAsync);
      break;
    }

    if (FI.getExtParameterInfo(argIndex: ArgNo).isNoEscape())
      Attrs.addCapturesAttr(CI: llvm::CaptureInfo::none());

    if (Attrs.hasAttributes()) {
      unsigned FirstIRArg, NumIRArgs;
      std::tie(args&: FirstIRArg, args&: NumIRArgs) = IRFunctionArgs.getIRArgs(ArgNo);
      for (unsigned i = 0; i < NumIRArgs; i++)
        ArgAttrs[FirstIRArg + i] = ArgAttrs[FirstIRArg + i].addAttributes(
            C&: getLLVMContext(), AS: llvm::AttributeSet::get(C&: getLLVMContext(), B: Attrs));
    }
  }
  assert(ArgNo == FI.arg_size());

  // We can't see all potential arguments in a varargs declaration; treat them
  // as if they can access memory.
  if (!AttrOnCallSite && FI.isVariadic())
    AddPotentialArgAccess();

  // If the callee is const/pure and any ABI lowering above forced argument
  // memory access, annotate each pointer-typed IR argument with the matching
  // readnone/readonly attribute.
  ArgNo = 0;
  if (AddedPotentialArgAccess && MemAttrForPtrArgs) {
    llvm::FunctionType *FunctionType = getTypes().GetFunctionType(FI);
    for (CGFunctionInfo::const_arg_iterator I = FI.arg_begin(),
                                            E = FI.arg_end();
         I != E; ++I, ++ArgNo) {
      if (I->info.isDirect() || I->info.isExpand() ||
          I->info.isCoerceAndExpand()) {
        unsigned FirstIRArg, NumIRArgs;
        std::tie(args&: FirstIRArg, args&: NumIRArgs) = IRFunctionArgs.getIRArgs(ArgNo);
        for (unsigned i = FirstIRArg; i < FirstIRArg + NumIRArgs; ++i) {
          // The index may be out-of-bounds if the callee is a varargs
          // function.
          //
          // FIXME: We can compute the types of varargs arguments without going
          // through the function type, but the relevant code isn't exposed
          // in a way that can be called from here.
          if (i < FunctionType->getNumParams() &&
              FunctionType->getParamType(i)->isPointerTy()) {
            ArgAttrs[i] =
                ArgAttrs[i].addAttribute(C&: getLLVMContext(), Kind: *MemAttrForPtrArgs);
          }
        }
      }
    }
  }

  AttrList = llvm::AttributeList::get(
      C&: getLLVMContext(), FnAttrs: llvm::AttributeSet::get(C&: getLLVMContext(), B: FuncAttrs),
      RetAttrs: llvm::AttributeSet::get(C&: getLLVMContext(), B: RetAttrs), ArgAttrs);
}
3148
3149/// An argument came in as a promoted argument; demote it back to its
3150/// declared type.
3151static llvm::Value *emitArgumentDemotion(CodeGenFunction &CGF,
3152 const VarDecl *var,
3153 llvm::Value *value) {
3154 llvm::Type *varType = CGF.ConvertType(T: var->getType());
3155
3156 // This can happen with promotions that actually don't change the
3157 // underlying type, like the enum promotions.
3158 if (value->getType() == varType)
3159 return value;
3160
3161 assert((varType->isIntegerTy() || varType->isFloatingPointTy()) &&
3162 "unexpected promotion type");
3163
3164 if (isa<llvm::IntegerType>(Val: varType))
3165 return CGF.Builder.CreateTrunc(V: value, DestTy: varType, Name: "arg.unpromote");
3166
3167 return CGF.Builder.CreateFPCast(V: value, DestTy: varType, Name: "arg.unpromote");
3168}
3169
3170/// Returns the attribute (either parameter attribute, or function
3171/// attribute), which declares argument ArgNo to be non-null.
3172static const NonNullAttr *getNonNullAttr(const Decl *FD, const ParmVarDecl *PVD,
3173 QualType ArgType, unsigned ArgNo) {
3174 // FIXME: __attribute__((nonnull)) can also be applied to:
3175 // - references to pointers, where the pointee is known to be
3176 // nonnull (apparently a Clang extension)
3177 // - transparent unions containing pointers
3178 // In the former case, LLVM IR cannot represent the constraint. In
3179 // the latter case, we have no guarantee that the transparent union
3180 // is in fact passed as a pointer.
3181 if (!ArgType->isAnyPointerType() && !ArgType->isBlockPointerType())
3182 return nullptr;
3183 // First, check attribute on parameter itself.
3184 if (PVD) {
3185 if (auto ParmNNAttr = PVD->getAttr<NonNullAttr>())
3186 return ParmNNAttr;
3187 }
3188 // Check function attributes.
3189 if (!FD)
3190 return nullptr;
3191 for (const auto *NNAttr : FD->specific_attrs<NonNullAttr>()) {
3192 if (NNAttr->isNonNull(IdxAST: ArgNo))
3193 return NNAttr;
3194 }
3195 return nullptr;
3196}
3197
3198namespace {
3199struct CopyBackSwiftError final : EHScopeStack::Cleanup {
3200 Address Temp;
3201 Address Arg;
3202 CopyBackSwiftError(Address temp, Address arg) : Temp(temp), Arg(arg) {}
3203 void Emit(CodeGenFunction &CGF, Flags flags) override {
3204 llvm::Value *errorValue = CGF.Builder.CreateLoad(Addr: Temp);
3205 CGF.Builder.CreateStore(Val: errorValue, Addr: Arg);
3206 }
3207};
3208} // namespace
3209
/// Emit the function prologue: bind each Clang-level parameter declaration
/// in Args to the corresponding incoming LLVM IR argument(s) of Fn, as
/// dictated by the per-argument ABI classification in FI (inalloca,
/// indirect, direct/extend, coerce-and-expand, expand, target-specific, or
/// ignore), materializing allocas and copies as needed, and finally emit
/// the parameter declarations in the ABI-appropriate order.
void CodeGenFunction::EmitFunctionProlog(const CGFunctionInfo &FI,
                                         llvm::Function *Fn,
                                         const FunctionArgList &Args) {
  if (CurCodeDecl && CurCodeDecl->hasAttr<NakedAttr>())
    // Naked functions don't have prologues.
    return;

  // If this is an implicit-return-zero function, go ahead and
  // initialize the return value. TODO: it might be nice to have
  // a more general mechanism for this that didn't require synthesized
  // return statements.
  if (const FunctionDecl *FD = dyn_cast_or_null<FunctionDecl>(Val: CurCodeDecl)) {
    if (FD->hasImplicitReturnZero()) {
      QualType RetTy = FD->getReturnType().getUnqualifiedType();
      llvm::Type *LLVMTy = CGM.getTypes().ConvertType(T: RetTy);
      llvm::Constant *Zero = llvm::Constant::getNullValue(Ty: LLVMTy);
      Builder.CreateStore(Val: Zero, Addr: ReturnValue);
    }
  }

  // FIXME: We no longer need the types from FunctionArgList; lift up and
  // simplify.

  ClangToLLVMArgMapping IRFunctionArgs(CGM.getContext(), FI);
  assert(Fn->arg_size() == IRFunctionArgs.totalIRArgs());

  // If we're using inalloca, all the memory arguments are GEPs off of the last
  // parameter, which is a pointer to the complete memory area.
  Address ArgStruct = Address::invalid();
  if (IRFunctionArgs.hasInallocaArg())
    ArgStruct = Address(Fn->getArg(i: IRFunctionArgs.getInallocaArgNo()),
                        FI.getArgStruct(), FI.getArgStructAlignment());

  // Name the struct return parameter.
  if (IRFunctionArgs.hasSRetArg()) {
    auto AI = Fn->getArg(i: IRFunctionArgs.getSRetArgNo());
    AI->setName("agg.result");
    AI->addAttr(Kind: llvm::Attribute::NoAlias);
  }

  // Track if we received the parameter as a pointer (indirect, byval, or
  // inalloca). If already have a pointer, EmitParmDecl doesn't need to copy it
  // into a local alloca for us.
  SmallVector<ParamValue, 16> ArgVals;
  ArgVals.reserve(N: Args.size());

  // Create a pointer value for every parameter declaration. This usually
  // entails copying one or more LLVM IR arguments into an alloca. Don't push
  // any cleanups or do anything that might unwind. We do that separately, so
  // we can push the cleanups in the correct order for the ABI.
  assert(FI.arg_size() == Args.size() &&
         "Mismatch between function signature & arguments.");
  unsigned ArgNo = 0;
  CGFunctionInfo::const_arg_iterator info_it = FI.arg_begin();
  for (FunctionArgList::const_iterator i = Args.begin(), e = Args.end(); i != e;
       ++i, ++info_it, ++ArgNo) {
    const VarDecl *Arg = *i;
    const ABIArgInfo &ArgI = info_it->info;

    bool isPromoted =
        isa<ParmVarDecl>(Val: Arg) && cast<ParmVarDecl>(Val: Arg)->isKNRPromoted();
    // We are converting from ABIArgInfo type to VarDecl type directly, unless
    // the parameter is promoted. In this case we convert to
    // CGFunctionInfo::ArgInfo type with subsequent argument demotion.
    QualType Ty = isPromoted ? info_it->type : Arg->getType();
    assert(hasScalarEvaluationKind(Ty) ==
           hasScalarEvaluationKind(Arg->getType()));

    unsigned FirstIRArg, NumIRArgs;
    std::tie(args&: FirstIRArg, args&: NumIRArgs) = IRFunctionArgs.getIRArgs(ArgNo);

    // Dispatch on the ABI classification of this argument.
    switch (ArgI.getKind()) {
    case ABIArgInfo::InAlloca: {
      assert(NumIRArgs == 0);
      // The argument lives in a field of the inalloca struct; just compute
      // its address there (loading through one level of indirection if the
      // field holds a pointer to the real argument).
      auto FieldIndex = ArgI.getInAllocaFieldIndex();
      Address V =
          Builder.CreateStructGEP(Addr: ArgStruct, Index: FieldIndex, Name: Arg->getName());
      if (ArgI.getInAllocaIndirect())
        V = Address(Builder.CreateLoad(Addr: V), ConvertTypeForMem(T: Ty),
                    getContext().getTypeAlignInChars(T: Ty));
      ArgVals.push_back(Elt: ParamValue::forIndirect(addr: V));
      break;
    }

    case ABIArgInfo::Indirect:
    case ABIArgInfo::IndirectAliased: {
      assert(NumIRArgs == 1);
      Address ParamAddr = makeNaturalAddressForPointer(
          Ptr: Fn->getArg(i: FirstIRArg), T: Ty, Alignment: ArgI.getIndirectAlign(), ForPointeeType: false, BaseInfo: nullptr,
          TBAAInfo: nullptr, IsKnownNonNull: KnownNonNull);

      if (!hasScalarEvaluationKind(T: Ty)) {
        // Aggregates and complex variables are accessed by reference. All we
        // need to do is realign the value, if requested. Also, if the address
        // may be aliased, copy it to ensure that the parameter variable is
        // mutable and has a unique address, as C requires.
        if (ArgI.getIndirectRealign() || ArgI.isIndirectAliased()) {
          RawAddress AlignedTemp = CreateMemTemp(T: Ty, Name: "coerce");

          // Copy from the incoming argument pointer to the temporary with the
          // appropriate alignment.
          //
          // FIXME: We should have a common utility for generating an aggregate
          // copy.
          CharUnits Size = getContext().getTypeSizeInChars(T: Ty);
          Builder.CreateMemCpy(
              Dst: AlignedTemp.getPointer(), DstAlign: AlignedTemp.getAlignment().getAsAlign(),
              Src: ParamAddr.emitRawPointer(CGF&: *this),
              SrcAlign: ParamAddr.getAlignment().getAsAlign(),
              Size: llvm::ConstantInt::get(Ty: IntPtrTy, V: Size.getQuantity()));
          ParamAddr = AlignedTemp;
        }
        ArgVals.push_back(Elt: ParamValue::forIndirect(addr: ParamAddr));
      } else {
        // Load scalar value from indirect argument.
        llvm::Value *V =
            EmitLoadOfScalar(Addr: ParamAddr, Volatile: false, Ty, Loc: Arg->getBeginLoc());

        if (isPromoted)
          V = emitArgumentDemotion(CGF&: *this, var: Arg, value: V);
        ArgVals.push_back(Elt: ParamValue::forDirect(value: V));
      }
      break;
    }

    case ABIArgInfo::Extend:
    case ABIArgInfo::Direct: {
      auto AI = Fn->getArg(i: FirstIRArg);
      llvm::Type *LTy = ConvertType(T: Arg->getType());

      // Prepare parameter attributes. So far, only attributes for pointer
      // parameters are prepared. See
      // http://llvm.org/docs/LangRef.html#paramattrs.
      if (ArgI.getDirectOffset() == 0 && LTy->isPointerTy() &&
          ArgI.getCoerceToType()->isPointerTy()) {
        assert(NumIRArgs == 1);

        if (const ParmVarDecl *PVD = dyn_cast<ParmVarDecl>(Val: Arg)) {
          // Set `nonnull` attribute if any.
          if (getNonNullAttr(FD: CurCodeDecl, PVD, ArgType: PVD->getType(),
                             ArgNo: PVD->getFunctionScopeIndex()) &&
              !CGM.getCodeGenOpts().NullPointerIsValid)
            AI->addAttr(Kind: llvm::Attribute::NonNull);

          QualType OTy = PVD->getOriginalType();
          if (const auto *ArrTy = getContext().getAsConstantArrayType(T: OTy)) {
            // A C99 array parameter declaration with the static keyword also
            // indicates dereferenceability, and if the size is constant we can
            // use the dereferenceable attribute (which requires the size in
            // bytes).
            if (ArrTy->getSizeModifier() == ArraySizeModifier::Static) {
              QualType ETy = ArrTy->getElementType();
              llvm::Align Alignment =
                  CGM.getNaturalTypeAlignment(T: ETy).getAsAlign();
              AI->addAttrs(B&: llvm::AttrBuilder(getLLVMContext())
                               .addAlignmentAttr(Align: Alignment));
              uint64_t ArrSize = ArrTy->getZExtSize();
              if (!ETy->isIncompleteType() && ETy->isConstantSizeType() &&
                  ArrSize) {
                llvm::AttrBuilder Attrs(getLLVMContext());
                Attrs.addDereferenceableAttr(
                    Bytes: getContext().getTypeSizeInChars(T: ETy).getQuantity() *
                    ArrSize);
                AI->addAttrs(B&: Attrs);
              } else if (getContext().getTargetInfo().getNullPointerValue(
                             AddrSpace: ETy.getAddressSpace()) == 0 &&
                         !CGM.getCodeGenOpts().NullPointerIsValid) {
                AI->addAttr(Kind: llvm::Attribute::NonNull);
              }
            }
          } else if (const auto *ArrTy =
                         getContext().getAsVariableArrayType(T: OTy)) {
            // For C99 VLAs with the static keyword, we don't know the size so
            // we can't use the dereferenceable attribute, but in addrspace(0)
            // we know that it must be nonnull.
            if (ArrTy->getSizeModifier() == ArraySizeModifier::Static) {
              QualType ETy = ArrTy->getElementType();
              llvm::Align Alignment =
                  CGM.getNaturalTypeAlignment(T: ETy).getAsAlign();
              AI->addAttrs(B&: llvm::AttrBuilder(getLLVMContext())
                               .addAlignmentAttr(Align: Alignment));
              if (!getTypes().getTargetAddressSpace(T: ETy) &&
                  !CGM.getCodeGenOpts().NullPointerIsValid)
                AI->addAttr(Kind: llvm::Attribute::NonNull);
            }
          }

          // Set `align` attribute if any.
          const auto *AVAttr = PVD->getAttr<AlignValueAttr>();
          if (!AVAttr)
            if (const auto *TOTy = OTy->getAs<TypedefType>())
              AVAttr = TOTy->getDecl()->getAttr<AlignValueAttr>();
          if (AVAttr && !SanOpts.has(K: SanitizerKind::Alignment)) {
            // If alignment-assumption sanitizer is enabled, we do *not* add
            // alignment attribute here, but emit normal alignment assumption,
            // so the UBSAN check could function.
            llvm::ConstantInt *AlignmentCI =
                cast<llvm::ConstantInt>(Val: EmitScalarExpr(E: AVAttr->getAlignment()));
            uint64_t AlignmentInt =
                AlignmentCI->getLimitedValue(Limit: llvm::Value::MaximumAlignment);
            if (AI->getParamAlign().valueOrOne() < AlignmentInt) {
              // Only strengthen an existing (weaker) alignment; replace it
              // with the attribute-specified one.
              AI->removeAttr(Kind: llvm::Attribute::AttrKind::Alignment);
              AI->addAttrs(B&: llvm::AttrBuilder(getLLVMContext())
                               .addAlignmentAttr(Align: llvm::Align(AlignmentInt)));
            }
          }
        }

        // Set 'noalias' if an argument type has the `restrict` qualifier.
        if (Arg->getType().isRestrictQualified())
          AI->addAttr(Kind: llvm::Attribute::NoAlias);
      }

      // Prepare the argument value. If we have the trivial case, handle it
      // with no muss and fuss.
      if (!isa<llvm::StructType>(Val: ArgI.getCoerceToType()) &&
          ArgI.getCoerceToType() == ConvertType(T: Ty) &&
          ArgI.getDirectOffset() == 0) {
        assert(NumIRArgs == 1);

        // LLVM expects swifterror parameters to be used in very restricted
        // ways. Copy the value into a less-restricted temporary.
        llvm::Value *V = AI;
        if (FI.getExtParameterInfo(argIndex: ArgNo).getABI() ==
            ParameterABI::SwiftErrorResult) {
          QualType pointeeTy = Ty->getPointeeType();
          assert(pointeeTy->isPointerType());
          RawAddress temp =
              CreateMemTemp(T: pointeeTy, Align: getPointerAlign(), Name: "swifterror.temp");
          Address arg = makeNaturalAddressForPointer(
              Ptr: V, T: pointeeTy, Alignment: getContext().getTypeAlignInChars(T: pointeeTy));
          llvm::Value *incomingErrorValue = Builder.CreateLoad(Addr: arg);
          Builder.CreateStore(Val: incomingErrorValue, Addr: temp);
          V = temp.getPointer();

          // Push a cleanup to copy the value back at the end of the function.
          // The convention does not guarantee that the value will be written
          // back if the function exits with an unwind exception.
          EHStack.pushCleanup<CopyBackSwiftError>(Kind: NormalCleanup, A: temp, A: arg);
        }

        // Ensure the argument is the correct type.
        if (V->getType() != ArgI.getCoerceToType())
          V = Builder.CreateBitCast(V, DestTy: ArgI.getCoerceToType());

        if (isPromoted)
          V = emitArgumentDemotion(CGF&: *this, var: Arg, value: V);

        // Because of merging of function types from multiple decls it is
        // possible for the type of an argument to not match the corresponding
        // type in the function type. Since we are codegening the callee
        // in here, add a cast to the argument type.
        llvm::Type *LTy = ConvertType(T: Arg->getType());
        if (V->getType() != LTy)
          V = Builder.CreateBitCast(V, DestTy: LTy);

        ArgVals.push_back(Elt: ParamValue::forDirect(value: V));
        break;
      }

      // VLST arguments are coerced to VLATs at the function boundary for
      // ABI consistency. If this is a VLST that was coerced to
      // a VLAT at the function boundary and the types match up, use
      // llvm.vector.extract to convert back to the original VLST.
      if (auto *VecTyTo = dyn_cast<llvm::FixedVectorType>(Val: ConvertType(T: Ty))) {
        llvm::Value *ArgVal = Fn->getArg(i: FirstIRArg);
        if (auto *VecTyFrom =
                dyn_cast<llvm::ScalableVectorType>(Val: ArgVal->getType())) {
          auto [Coerced, Extracted] = CoerceScalableToFixed(
              CGF&: *this, ToTy: VecTyTo, FromTy: VecTyFrom, V: ArgVal, Name: Arg->getName());
          if (Extracted) {
            assert(NumIRArgs == 1);
            ArgVals.push_back(Elt: ParamValue::forDirect(value: Coerced));
            break;
          }
        }
      }

      llvm::StructType *STy =
          dyn_cast<llvm::StructType>(Val: ArgI.getCoerceToType());
      Address Alloca =
          CreateMemTemp(T: Ty, Align: getContext().getDeclAlign(D: Arg), Name: Arg->getName());

      // Pointer to store into.
      Address Ptr = emitAddressAtOffset(CGF&: *this, addr: Alloca, info: ArgI);

      // Fast-isel and the optimizer generally like scalar values better than
      // FCAs, so we flatten them if this is safe to do for this argument.
      if (ArgI.isDirect() && ArgI.getCanBeFlattened() && STy &&
          STy->getNumElements() > 1) {
        llvm::TypeSize StructSize = CGM.getDataLayout().getTypeAllocSize(Ty: STy);
        llvm::TypeSize PtrElementSize =
            CGM.getDataLayout().getTypeAllocSize(Ty: Ptr.getElementType());
        if (StructSize.isScalable()) {
          assert(STy->containsHomogeneousScalableVectorTypes() &&
                 "ABI only supports structure with homogeneous scalable vector "
                 "type");
          assert(StructSize == PtrElementSize &&
                 "Only allow non-fractional movement of structure with"
                 "homogeneous scalable vector type");
          assert(STy->getNumElements() == NumIRArgs);

          // Rebuild the scalable aggregate from its per-element IR arguments
          // and store it whole.
          llvm::Value *LoadedStructValue = llvm::PoisonValue::get(T: STy);
          for (unsigned i = 0, e = STy->getNumElements(); i != e; ++i) {
            auto *AI = Fn->getArg(i: FirstIRArg + i);
            AI->setName(Arg->getName() + ".coerce" + Twine(i));
            LoadedStructValue =
                Builder.CreateInsertValue(Agg: LoadedStructValue, Val: AI, Idxs: i);
          }

          Builder.CreateStore(Val: LoadedStructValue, Addr: Ptr);
        } else {
          uint64_t SrcSize = StructSize.getFixedValue();
          uint64_t DstSize = PtrElementSize.getFixedValue();

          // If the coerced struct is larger than the destination, store into
          // a temporary first and memcpy only DstSize bytes across.
          Address AddrToStoreInto = Address::invalid();
          if (SrcSize <= DstSize) {
            AddrToStoreInto = Ptr.withElementType(ElemTy: STy);
          } else {
            AddrToStoreInto =
                CreateTempAlloca(Ty: STy, align: Alloca.getAlignment(), Name: "coerce");
          }

          assert(STy->getNumElements() == NumIRArgs);
          for (unsigned i = 0, e = STy->getNumElements(); i != e; ++i) {
            auto AI = Fn->getArg(i: FirstIRArg + i);
            AI->setName(Arg->getName() + ".coerce" + Twine(i));
            Address EltPtr = Builder.CreateStructGEP(Addr: AddrToStoreInto, Index: i);
            Builder.CreateStore(Val: AI, Addr: EltPtr);
          }

          if (SrcSize > DstSize) {
            Builder.CreateMemCpy(Dest: Ptr, Src: AddrToStoreInto, Size: DstSize);
          }

          // Structures with PFP fields require a coerced store to add any
          // pointer signatures.
          if (getContext().hasPFPFields(Ty)) {
            llvm::Value *Struct = Builder.CreateLoad(Addr: Ptr);
            CreatePFPCoercedStore(Src: Struct, SrcFETy: Ty, Dst: Ptr, CGF&: *this);
          }
        }
      } else {
        // Simple case, just do a coerced store of the argument into the alloca.
        assert(NumIRArgs == 1);
        auto AI = Fn->getArg(i: FirstIRArg);
        AI->setName(Arg->getName() + ".coerce");
        CreateCoercedStore(
            Src: AI, SrcFETy: Ty, Dst: Ptr,
            DstSize: llvm::TypeSize::getFixed(
                ExactSize: getContext().getTypeSizeInChars(T: Ty).getQuantity() -
                ArgI.getDirectOffset()),
            /*DstIsVolatile=*/false);
      }

      // Match to what EmitParmDecl is expecting for this type.
      if (CodeGenFunction::hasScalarEvaluationKind(T: Ty)) {
        llvm::Value *V =
            EmitLoadOfScalar(Addr: Alloca, Volatile: false, Ty, Loc: Arg->getBeginLoc());
        if (isPromoted)
          V = emitArgumentDemotion(CGF&: *this, var: Arg, value: V);
        ArgVals.push_back(Elt: ParamValue::forDirect(value: V));
      } else {
        ArgVals.push_back(Elt: ParamValue::forIndirect(addr: Alloca));
      }
      break;
    }

    case ABIArgInfo::CoerceAndExpand: {
      // Reconstruct into a temporary.
      Address alloca = CreateMemTemp(T: Ty, Align: getContext().getDeclAlign(D: Arg));
      ArgVals.push_back(Elt: ParamValue::forIndirect(addr: alloca));

      auto coercionType = ArgI.getCoerceAndExpandType();
      auto unpaddedCoercionType = ArgI.getUnpaddedCoerceAndExpandType();
      auto *unpaddedStruct = dyn_cast<llvm::StructType>(Val: unpaddedCoercionType);

      alloca = alloca.withElementType(ElemTy: coercionType);

      // Walk the coercion struct; padding elements consume no IR argument.
      unsigned argIndex = FirstIRArg;
      unsigned unpaddedIndex = 0;
      for (unsigned i = 0, e = coercionType->getNumElements(); i != e; ++i) {
        llvm::Type *eltType = coercionType->getElementType(N: i);
        if (ABIArgInfo::isPaddingForCoerceAndExpand(eltType))
          continue;

        auto eltAddr = Builder.CreateStructGEP(Addr: alloca, Index: i);
        llvm::Value *elt = Fn->getArg(i: argIndex++);

        auto paramType = unpaddedStruct
                             ? unpaddedStruct->getElementType(N: unpaddedIndex++)
                             : unpaddedCoercionType;

        if (auto *VecTyTo = dyn_cast<llvm::FixedVectorType>(Val: eltType)) {
          if (auto *VecTyFrom = dyn_cast<llvm::ScalableVectorType>(Val: paramType)) {
            bool Extracted;
            std::tie(args&: elt, args&: Extracted) = CoerceScalableToFixed(
                CGF&: *this, ToTy: VecTyTo, FromTy: VecTyFrom, V: elt, Name: elt->getName());
            assert(Extracted && "Unexpected scalable to fixed vector coercion");
          }
        }
        Builder.CreateStore(Val: elt, Addr: eltAddr);
      }
      assert(argIndex == FirstIRArg + NumIRArgs);
      break;
    }

    case ABIArgInfo::Expand: {
      // If this structure was expanded into multiple arguments then
      // we need to create a temporary and reconstruct it from the
      // arguments.
      Address Alloca = CreateMemTemp(T: Ty, Align: getContext().getDeclAlign(D: Arg));
      LValue LV = MakeAddrLValue(Addr: Alloca, T: Ty);
      ArgVals.push_back(Elt: ParamValue::forIndirect(addr: Alloca));

      auto FnArgIter = Fn->arg_begin() + FirstIRArg;
      ExpandTypeFromArgs(Ty, LV, AI&: FnArgIter);
      assert(FnArgIter == Fn->arg_begin() + FirstIRArg + NumIRArgs);
      for (unsigned i = 0, e = NumIRArgs; i != e; ++i) {
        auto AI = Fn->getArg(i: FirstIRArg + i);
        AI->setName(Arg->getName() + "." + Twine(i));
      }
      break;
    }

    case ABIArgInfo::TargetSpecific: {
      // Target-specific coercion: let the target's ABIInfo store the single
      // IR argument into the alloca.
      auto *AI = Fn->getArg(i: FirstIRArg);
      AI->setName(Arg->getName() + ".target_coerce");
      Address Alloca =
          CreateMemTemp(T: Ty, Align: getContext().getDeclAlign(D: Arg), Name: Arg->getName());
      Address Ptr = emitAddressAtOffset(CGF&: *this, addr: Alloca, info: ArgI);
      CGM.getABIInfo().createCoercedStore(Val: AI, DstAddr: Ptr, AI: ArgI, DestIsVolatile: false, CGF&: *this);
      if (CodeGenFunction::hasScalarEvaluationKind(T: Ty)) {
        llvm::Value *V =
            EmitLoadOfScalar(Addr: Alloca, Volatile: false, Ty, Loc: Arg->getBeginLoc());
        if (isPromoted) {
          V = emitArgumentDemotion(CGF&: *this, var: Arg, value: V);
        }
        ArgVals.push_back(Elt: ParamValue::forDirect(value: V));
      } else {
        ArgVals.push_back(Elt: ParamValue::forIndirect(addr: Alloca));
      }
      break;
    }
    case ABIArgInfo::Ignore:
      assert(NumIRArgs == 0);
      // Initialize the local variable appropriately.
      if (!hasScalarEvaluationKind(T: Ty)) {
        ArgVals.push_back(Elt: ParamValue::forIndirect(addr: CreateMemTemp(T: Ty)));
      } else {
        llvm::Value *U = llvm::UndefValue::get(T: ConvertType(T: Arg->getType()));
        ArgVals.push_back(Elt: ParamValue::forDirect(value: U));
      }
      break;
    }
  }

  // Emit the parameter declarations in the order required by the C++ ABI:
  // reversed when callee-destroyed arguments are destroyed left-to-right.
  if (getTarget().getCXXABI().areArgsDestroyedLeftToRightInCallee()) {
    for (int I = Args.size() - 1; I >= 0; --I)
      EmitParmDecl(D: *Args[I], Arg: ArgVals[I], ArgNo: I + 1);
  } else {
    for (unsigned I = 0, E = Args.size(); I != E; ++I)
      EmitParmDecl(D: *Args[I], Arg: ArgVals[I], ArgNo: I + 1);
  }
}
3675
3676static void eraseUnusedBitCasts(llvm::Instruction *insn) {
3677 while (insn->use_empty()) {
3678 llvm::BitCastInst *bitcast = dyn_cast<llvm::BitCastInst>(Val: insn);
3679 if (!bitcast)
3680 return;
3681
3682 // This is "safe" because we would have used a ConstantExpr otherwise.
3683 insn = cast<llvm::Instruction>(Val: bitcast->getOperand(i_nocapture: 0));
3684 bitcast->eraseFromParent();
3685 }
3686}
3687
/// Try to emit a fused autorelease of a return result.
///
/// Pattern-matches a trailing objc_retain /
/// objc_retainAutoreleasedReturnValue call (possibly wrapped in bitcasts)
/// that produced \p result, deletes the matched instructions, and returns
/// the replacement value — or nullptr if the pattern doesn't match.
static llvm::Value *tryEmitFusedAutoreleaseOfResult(CodeGenFunction &CGF,
                                                    llvm::Value *result) {
  // The insertion point must immediately follow the instruction that
  // produced the result; otherwise we can't safely walk backwards.
  llvm::BasicBlock *BB = CGF.Builder.GetInsertBlock();
  if (BB->empty())
    return nullptr;
  if (&BB->back() != result)
    return nullptr;

  llvm::Type *resultType = result->getType();

  // result is in a BasicBlock and is therefore an Instruction.
  llvm::Instruction *generator = cast<llvm::Instruction>(Val: result);

  SmallVector<llvm::Instruction *, 4> InstsToKill;

  // Look for:
  //  %generator = bitcast %type1* %generator2 to %type2*
  while (llvm::BitCastInst *bitcast = dyn_cast<llvm::BitCastInst>(Val: generator)) {
    // We would have emitted this as a constant if the operand weren't
    // an Instruction.
    generator = cast<llvm::Instruction>(Val: bitcast->getOperand(i_nocapture: 0));

    // Require the generator to be immediately followed by the cast.
    if (generator->getNextNode() != bitcast)
      return nullptr;

    InstsToKill.push_back(Elt: bitcast);
  }

  // Look for:
  //   %generator = call i8* @objc_retain(i8* %originalResult)
  // or
  //   %generator = call i8* @objc_retainAutoreleasedReturnValue(i8* %originalResult)
  llvm::CallInst *call = dyn_cast<llvm::CallInst>(Val: generator);
  if (!call)
    return nullptr;

  // True when the matched call was a plain objc_retain: we must then emit a
  // fused retain+autorelease below. False for
  // objc_retainAutoreleasedReturnValue, which simply cancels out against the
  // autorelease we were about to emit.
  bool doRetainAutorelease;

  if (call->getCalledOperand() == CGF.CGM.getObjCEntrypoints().objc_retain) {
    doRetainAutorelease = true;
  } else if (call->getCalledOperand() ==
             CGF.CGM.getObjCEntrypoints().objc_retainAutoreleasedReturnValue) {
    doRetainAutorelease = false;

    // If we emitted an assembly marker for this call (and the
    // ARCEntrypoints field should have been set if so), go looking
    // for that call. If we can't find it, we can't do this
    // optimization. But it should always be the immediately previous
    // instruction, unless we needed bitcasts around the call.
    if (CGF.CGM.getObjCEntrypoints().retainAutoreleasedReturnValueMarker) {
      llvm::Instruction *prev = call->getPrevNode();
      assert(prev);
      if (isa<llvm::BitCastInst>(Val: prev)) {
        prev = prev->getPrevNode();
        assert(prev);
      }
      assert(isa<llvm::CallInst>(prev));
      assert(cast<llvm::CallInst>(prev)->getCalledOperand() ==
             CGF.CGM.getObjCEntrypoints().retainAutoreleasedReturnValueMarker);
      InstsToKill.push_back(Elt: prev);
    }
  } else {
    return nullptr;
  }

  // The value being retained is the real result; the retain call dies.
  result = call->getArgOperand(i: 0);
  InstsToKill.push_back(Elt: call);

  // Keep killing bitcasts, for sanity. Note that we no longer care
  // about precise ordering as long as there's exactly one use.
  while (llvm::BitCastInst *bitcast = dyn_cast<llvm::BitCastInst>(Val: result)) {
    if (!bitcast->hasOneUse())
      break;
    InstsToKill.push_back(Elt: bitcast);
    result = bitcast->getOperand(i_nocapture: 0);
  }

  // Delete all the unnecessary instructions, from latest to earliest.
  for (auto *I : InstsToKill)
    I->eraseFromParent();

  // Do the fused retain/autorelease if we were asked to.
  if (doRetainAutorelease)
    result = CGF.EmitARCRetainAutoreleaseReturnValue(value: result);

  // Cast back to the result type.
  return CGF.Builder.CreateBitCast(V: result, DestTy: resultType);
}
3779
/// If this is a +1 of the value of an immutable 'self', remove it.
///
/// Returns the loaded 'self' (cast to the result type) when the retain was
/// removed, or nullptr when the pattern doesn't apply.
static llvm::Value *tryRemoveRetainOfSelf(CodeGenFunction &CGF,
                                          llvm::Value *result) {
  // This is only applicable to a method with an immutable 'self'.
  const ObjCMethodDecl *method =
      dyn_cast_or_null<ObjCMethodDecl>(Val: CGF.CurCodeDecl);
  if (!method)
    return nullptr;
  const VarDecl *self = method->getSelfDecl();
  if (!self->getType().isConstQualified())
    return nullptr;

  // Look for a retain call. Note: stripPointerCasts looks through returned arg
  // functions, which would cause us to miss the retain.
  llvm::CallInst *retainCall = dyn_cast<llvm::CallInst>(Val: result);
  if (!retainCall || retainCall->getCalledOperand() !=
                         CGF.CGM.getObjCEntrypoints().objc_retain)
    return nullptr;

  // Look for an ordinary load of 'self': it must be non-atomic, non-volatile,
  // and load directly from the local variable slot for 'self'.
  llvm::Value *retainedValue = retainCall->getArgOperand(i: 0);
  llvm::LoadInst *load =
      dyn_cast<llvm::LoadInst>(Val: retainedValue->stripPointerCasts());
  if (!load || load->isAtomic() || load->isVolatile() ||
      load->getPointerOperand() != CGF.GetAddrOfLocalVar(VD: self).getBasePointer())
    return nullptr;

  // Okay! Burn it all down. This relies for correctness on the
  // assumption that the retain is emitted as part of the return and
  // that thereafter everything is used "linearly".
  llvm::Type *resultType = result->getType();
  eraseUnusedBitCasts(insn: cast<llvm::Instruction>(Val: result));
  assert(retainCall->use_empty());
  retainCall->eraseFromParent();
  eraseUnusedBitCasts(insn: cast<llvm::Instruction>(Val: retainedValue));

  // Return the loaded 'self' directly, cast back to the expected result type.
  return CGF.Builder.CreateBitCast(V: load, DestTy: resultType);
}
3818
3819/// Emit an ARC autorelease of the result of a function.
3820///
3821/// \return the value to actually return from the function
3822static llvm::Value *emitAutoreleaseOfResult(CodeGenFunction &CGF,
3823 llvm::Value *result) {
3824 // If we're returning 'self', kill the initial retain. This is a
3825 // heuristic attempt to "encourage correctness" in the really unfortunate
3826 // case where we have a return of self during a dealloc and we desperately
3827 // need to avoid the possible autorelease.
3828 if (llvm::Value *self = tryRemoveRetainOfSelf(CGF, result))
3829 return self;
3830
3831 // At -O0, try to emit a fused retain/autorelease.
3832 if (CGF.shouldUseFusedARCCalls())
3833 if (llvm::Value *fused = tryEmitFusedAutoreleaseOfResult(CGF, result))
3834 return fused;
3835
3836 return CGF.EmitARCAutoreleaseReturnValue(value: result);
3837}
3838
/// Heuristically search for a dominating store to the return-value slot.
///
/// Returns the store when one is found whose block dominates the current
/// insertion point (checked only along single-predecessor chains), or
/// nullptr when no such store can be identified.
static llvm::StoreInst *findDominatingStoreToReturnValue(CodeGenFunction &CGF) {
  llvm::Value *ReturnValuePtr = CGF.ReturnValue.getBasePointer();

  // Check if a User is a store which pointerOperand is the ReturnValue.
  // We are looking for stores to the ReturnValue, not for stores of the
  // ReturnValue to some other location.
  auto GetStoreIfValid = [&CGF,
                          ReturnValuePtr](llvm::User *U) -> llvm::StoreInst * {
    auto *SI = dyn_cast<llvm::StoreInst>(Val: U);
    if (!SI || SI->getPointerOperand() != ReturnValuePtr ||
        SI->getValueOperand()->getType() != CGF.ReturnValue.getElementType())
      return nullptr;
    // These aren't actually possible for non-coerced returns, and we
    // only care about non-coerced returns on this code path.
    // All memory instructions inside __try block are volatile.
    assert(!SI->isAtomic() &&
           (!SI->isVolatile() || CGF.currentFunctionUsesSEHTry()));
    return SI;
  };
  // If there are multiple uses of the return-value slot, just check
  // for something immediately preceding the IP. Sometimes this can
  // happen with how we generate implicit-returns; it can also happen
  // with noreturn cleanups.
  if (!ReturnValuePtr->hasOneUse()) {
    llvm::BasicBlock *IP = CGF.Builder.GetInsertBlock();
    if (IP->empty())
      return nullptr;

    // Look at directly preceding instruction, skipping bitcasts, lifetime
    // markers, and fake uses and their operands.
    const llvm::Instruction *LoadIntoFakeUse = nullptr;
    for (llvm::Instruction &I : llvm::reverse(C&: *IP)) {
      // Ignore instructions that are just loads for fake uses; the load should
      // immediately precede the fake use, so we only need to remember the
      // operand for the last fake use seen.
      if (LoadIntoFakeUse == &I)
        continue;
      if (isa<llvm::BitCastInst>(Val: &I))
        continue;
      if (auto *II = dyn_cast<llvm::IntrinsicInst>(Val: &I)) {
        if (II->getIntrinsicID() == llvm::Intrinsic::lifetime_end)
          continue;

        if (II->getIntrinsicID() == llvm::Intrinsic::fake_use) {
          LoadIntoFakeUse = dyn_cast<llvm::Instruction>(Val: II->getArgOperand(i: 0));
          continue;
        }
      }
      // First non-skippable instruction: this is either our store or a
      // disqualifying instruction.
      return GetStoreIfValid(&I);
    }
    return nullptr;
  }

  llvm::StoreInst *store = GetStoreIfValid(ReturnValuePtr->user_back());
  if (!store)
    return nullptr;

  // Now do a quick-and-dirty dominance check: just walk up the
  // single-predecessors chain from the current insertion point.
  llvm::BasicBlock *StoreBB = store->getParent();
  llvm::BasicBlock *IP = CGF.Builder.GetInsertBlock();
  llvm::SmallPtrSet<llvm::BasicBlock *, 4> SeenBBs;
  while (IP != StoreBB) {
    // SeenBBs guards against looping forever on single-block cycles.
    if (!SeenBBs.insert(Ptr: IP).second || !(IP = IP->getSinglePredecessor()))
      return nullptr;
  }

  // Okay, the store's basic block dominates the insertion point; we
  // can do our thing.
  return store;
}
3911
3912// Helper functions for EmitCMSEClearRecord
3913
3914// Set the bits corresponding to a field having width `BitWidth` and located at
3915// offset `BitOffset` (from the least significant bit) within a storage unit of
3916// `Bits.size()` bytes. Each element of `Bits` corresponds to one target byte.
3917// Use little-endian layout, i.e.`Bits[0]` is the LSB.
3918static void setBitRange(SmallVectorImpl<uint64_t> &Bits, int BitOffset,
3919 int BitWidth, int CharWidth) {
3920 assert(CharWidth <= 64);
3921 assert(static_cast<unsigned>(BitWidth) <= Bits.size() * CharWidth);
3922
3923 int Pos = 0;
3924 if (BitOffset >= CharWidth) {
3925 Pos += BitOffset / CharWidth;
3926 BitOffset = BitOffset % CharWidth;
3927 }
3928
3929 const uint64_t Used = (uint64_t(1) << CharWidth) - 1;
3930 if (BitOffset + BitWidth >= CharWidth) {
3931 Bits[Pos++] |= (Used << BitOffset) & Used;
3932 BitWidth -= CharWidth - BitOffset;
3933 BitOffset = 0;
3934 }
3935
3936 while (BitWidth >= CharWidth) {
3937 Bits[Pos++] = Used;
3938 BitWidth -= CharWidth;
3939 }
3940
3941 if (BitWidth > 0)
3942 Bits[Pos++] |= (Used >> (CharWidth - BitWidth)) << BitOffset;
3943}
3944
3945// Set the bits corresponding to a field having width `BitWidth` and located at
3946// offset `BitOffset` (from the least significant bit) within a storage unit of
3947// `StorageSize` bytes, located at `StorageOffset` in `Bits`. Each element of
3948// `Bits` corresponds to one target byte. Use target endian layout.
3949static void setBitRange(SmallVectorImpl<uint64_t> &Bits, int StorageOffset,
3950 int StorageSize, int BitOffset, int BitWidth,
3951 int CharWidth, bool BigEndian) {
3952
3953 SmallVector<uint64_t, 8> TmpBits(StorageSize);
3954 setBitRange(Bits&: TmpBits, BitOffset, BitWidth, CharWidth);
3955
3956 if (BigEndian)
3957 std::reverse(first: TmpBits.begin(), last: TmpBits.end());
3958
3959 for (uint64_t V : TmpBits)
3960 Bits[StorageOffset++] |= V;
3961}
3962
3963static void setUsedBits(CodeGenModule &, QualType, int,
3964 SmallVectorImpl<uint64_t> &);
3965
// Set the bits in `Bits`, which correspond to the value representations of
// the actual members of the record type `RTy`. Note that this function does
// not handle base classes, virtual tables, etc, since they cannot happen in
// CMSE function arguments or return. The bit mask corresponds to the target
// memory layout, i.e. it's endian dependent.
static void setUsedBits(CodeGenModule &CGM, const RecordType *RTy, int Offset,
                        SmallVectorImpl<uint64_t> &Bits) {
  ASTContext &Context = CGM.getContext();
  int CharWidth = Context.getCharWidth();
  const RecordDecl *RD = RTy->getDecl()->getDefinition();
  const ASTRecordLayout &ASTLayout = Context.getASTRecordLayout(D: RD);
  const CGRecordLayout &Layout = CGM.getTypes().getCGRecordLayout(RD);

  int Idx = 0;
  for (auto I = RD->field_begin(), E = RD->field_end(); I != E; ++I, ++Idx) {
    const FieldDecl *F = *I;

    // Skip fields with no value representation: unnamed and zero-width
    // bit-fields are padding, and flexible array members occupy no storage
    // in the record itself.
    if (F->isUnnamedBitField() || F->isZeroLengthBitField() ||
        F->getType()->isIncompleteArrayType())
      continue;

    // Bit-fields: mark only the field's bits within its storage unit.
    if (F->isBitField()) {
      const CGBitFieldInfo &BFI = Layout.getBitFieldInfo(FD: F);
      setBitRange(Bits, StorageOffset: Offset + BFI.StorageOffset.getQuantity(),
                  StorageSize: BFI.StorageSize / CharWidth, BitOffset: BFI.Offset, BitWidth: BFI.Size, CharWidth,
                  BigEndian: CGM.getDataLayout().isBigEndian());
      continue;
    }

    // Ordinary fields: recurse on the field's type at its byte offset.
    setUsedBits(CGM, F->getType(),
                Offset + ASTLayout.getFieldOffset(FieldNo: Idx) / CharWidth, Bits);
  }
}
3999
4000// Set the bits in `Bits`, which correspond to the value representations of
4001// the elements of an array type `ATy`.
4002static void setUsedBits(CodeGenModule &CGM, const ConstantArrayType *ATy,
4003 int Offset, SmallVectorImpl<uint64_t> &Bits) {
4004 const ASTContext &Context = CGM.getContext();
4005
4006 QualType ETy = Context.getBaseElementType(VAT: ATy);
4007 int Size = Context.getTypeSizeInChars(T: ETy).getQuantity();
4008 SmallVector<uint64_t, 4> TmpBits(Size);
4009 setUsedBits(CGM, ETy, 0, TmpBits);
4010
4011 for (int I = 0, N = Context.getConstantArrayElementCount(CA: ATy); I < N; ++I) {
4012 auto Src = TmpBits.begin();
4013 auto Dst = Bits.begin() + Offset + I * Size;
4014 for (int J = 0; J < Size; ++J)
4015 *Dst++ |= *Src++;
4016 }
4017}
4018
4019// Set the bits in `Bits`, which correspond to the value representations of
4020// the type `QTy`.
4021static void setUsedBits(CodeGenModule &CGM, QualType QTy, int Offset,
4022 SmallVectorImpl<uint64_t> &Bits) {
4023 if (const auto *RTy = QTy->getAsCanonical<RecordType>())
4024 return setUsedBits(CGM, RTy, Offset, Bits);
4025
4026 ASTContext &Context = CGM.getContext();
4027 if (const auto *ATy = Context.getAsConstantArrayType(T: QTy))
4028 return setUsedBits(CGM, ATy, Offset, Bits);
4029
4030 int Size = Context.getTypeSizeInChars(T: QTy).getQuantity();
4031 if (Size <= 0)
4032 return;
4033
4034 std::fill_n(first: Bits.begin() + Offset, n: Size,
4035 value: (uint64_t(1) << Context.getCharWidth()) - 1);
4036}
4037
4038static uint64_t buildMultiCharMask(const SmallVectorImpl<uint64_t> &Bits,
4039 int Pos, int Size, int CharWidth,
4040 bool BigEndian) {
4041 assert(Size > 0);
4042 uint64_t Mask = 0;
4043 if (BigEndian) {
4044 for (auto P = Bits.begin() + Pos, E = Bits.begin() + Pos + Size; P != E;
4045 ++P)
4046 Mask = (Mask << CharWidth) | *P;
4047 } else {
4048 auto P = Bits.begin() + Pos + Size, End = Bits.begin() + Pos;
4049 do
4050 Mask = (Mask << CharWidth) | *--P;
4051 while (P != End);
4052 }
4053 return Mask;
4054}
4055
4056// Emit code to clear the bits in a record, which aren't a part of any user
4057// declared member, when the record is a function return.
4058llvm::Value *CodeGenFunction::EmitCMSEClearRecord(llvm::Value *Src,
4059 llvm::IntegerType *ITy,
4060 QualType QTy) {
4061 assert(Src->getType() == ITy);
4062 assert(ITy->getScalarSizeInBits() <= 64);
4063
4064 const llvm::DataLayout &DataLayout = CGM.getDataLayout();
4065 int Size = DataLayout.getTypeStoreSize(Ty: ITy);
4066 SmallVector<uint64_t, 4> Bits(Size);
4067 setUsedBits(CGM, RTy: QTy->castAsCanonical<RecordType>(), Offset: 0, Bits);
4068
4069 int CharWidth = CGM.getContext().getCharWidth();
4070 uint64_t Mask =
4071 buildMultiCharMask(Bits, Pos: 0, Size, CharWidth, BigEndian: DataLayout.isBigEndian());
4072
4073 return Builder.CreateAnd(LHS: Src, RHS: Mask, Name: "cmse.clear");
4074}
4075
// Emit code to clear the bits in a record, which aren't a part of any user
// declared member, when the record is a function argument. The record is
// passed as the LLVM array `Src` of type `ATy`; each array element is
// masked individually.
llvm::Value *CodeGenFunction::EmitCMSEClearRecord(llvm::Value *Src,
                                                  llvm::ArrayType *ATy,
                                                  QualType QTy) {
  const llvm::DataLayout &DataLayout = CGM.getDataLayout();
  int Size = DataLayout.getTypeStoreSize(Ty: ATy);
  SmallVector<uint64_t, 16> Bits(Size);
  setUsedBits(CGM, RTy: QTy->castAsCanonical<RecordType>(), Offset: 0, Bits);

  // Clear each element of the LLVM array.
  int CharWidth = CGM.getContext().getCharWidth();
  int CharsPerElt =
      ATy->getArrayElementType()->getScalarSizeInBits() / CharWidth;
  int MaskIndex = 0;
  llvm::Value *R = llvm::PoisonValue::get(T: ATy);
  for (int I = 0, N = ATy->getArrayNumElements(); I != N; ++I) {
    // Build the mask for this element's bytes, AND the element with it, and
    // insert the cleared element into the result aggregate.
    uint64_t Mask = buildMultiCharMask(Bits, Pos: MaskIndex, Size: CharsPerElt, CharWidth,
                                       BigEndian: DataLayout.isBigEndian());
    MaskIndex += CharsPerElt;
    llvm::Value *T0 = Builder.CreateExtractValue(Agg: Src, Idxs: I);
    llvm::Value *T1 = Builder.CreateAnd(LHS: T0, RHS: Mask, Name: "cmse.clear");
    R = Builder.CreateInsertValue(Agg: R, Val: T1, Idxs: I);
  }

  return R;
}
4103
/// Emit the return sequence for the current function, honoring the
/// return-value ABI classification in \p FI. \p EmitRetDbgLoc controls
/// whether the ret instruction may reuse the debug location of a dominating
/// store to the return slot; \p RetKeyInstructionsSourceAtom, when non-zero,
/// is the source atom the ret is attached to for Key Instructions.
void CodeGenFunction::EmitFunctionEpilog(
    const CGFunctionInfo &FI, bool EmitRetDbgLoc, SourceLocation EndLoc,
    uint64_t RetKeyInstructionsSourceAtom) {
  if (FI.isNoReturn()) {
    // Noreturn functions don't return.
    EmitUnreachable(Loc: EndLoc);
    return;
  }

  if (CurCodeDecl && CurCodeDecl->hasAttr<NakedAttr>()) {
    // Naked functions don't have epilogues.
    Builder.CreateUnreachable();
    return;
  }

  // Functions with no result always return void.
  if (!ReturnValue.isValid()) {
    auto *I = Builder.CreateRetVoid();
    if (RetKeyInstructionsSourceAtom)
      addInstToSpecificSourceAtom(KeyInstruction: I, Backup: nullptr, Atom: RetKeyInstructionsSourceAtom);
    else
      addInstToNewSourceAtom(KeyInstruction: I, Backup: nullptr);
    return;
  }

  llvm::DebugLoc RetDbgLoc;
  llvm::Value *RV = nullptr;
  QualType RetTy = FI.getReturnType();
  const ABIArgInfo &RetAI = FI.getReturnInfo();

  switch (RetAI.getKind()) {
  case ABIArgInfo::InAlloca:
    // Aggregates get evaluated directly into the destination. Sometimes we
    // need to return the sret value in a register, though.
    assert(hasAggregateEvaluationKind(RetTy));
    if (RetAI.getInAllocaSRet()) {
      // The inalloca struct is always the last argument; load the sret
      // pointer back out of its field so it can be returned in a register.
      llvm::Function::arg_iterator EI = CurFn->arg_end();
      --EI;
      llvm::Value *ArgStruct = &*EI;
      llvm::Value *SRet = Builder.CreateStructGEP(
          Ty: FI.getArgStruct(), Ptr: ArgStruct, Idx: RetAI.getInAllocaFieldIndex());
      llvm::Type *Ty =
          cast<llvm::GetElementPtrInst>(Val: SRet)->getResultElementType();
      RV = Builder.CreateAlignedLoad(Ty, Addr: SRet, Align: getPointerAlign(), Name: "sret");
    }
    break;

  case ABIArgInfo::Indirect: {
    // The caller passed a pointer to write the result through; it is the
    // first argument, or the second when it follows 'this'.
    auto AI = CurFn->arg_begin();
    if (RetAI.isSRetAfterThis())
      ++AI;
    switch (getEvaluationKind(T: RetTy)) {
    case TEK_Complex: {
      ComplexPairTy RT =
          EmitLoadOfComplex(src: MakeAddrLValue(Addr: ReturnValue, T: RetTy), loc: EndLoc);
      EmitStoreOfComplex(V: RT, dest: MakeNaturalAlignAddrLValue(V: &*AI, T: RetTy),
                         /*isInit*/ true);
      break;
    }
    case TEK_Aggregate:
      // Do nothing; aggregates get evaluated directly into the destination.
      break;
    case TEK_Scalar: {
      LValueBaseInfo BaseInfo;
      TBAAAccessInfo TBAAInfo;
      CharUnits Alignment =
          CGM.getNaturalTypeAlignment(T: RetTy, BaseInfo: &BaseInfo, TBAAInfo: &TBAAInfo);
      Address ArgAddr(&*AI, ConvertType(T: RetTy), Alignment);
      LValue ArgVal =
          LValue::MakeAddr(Addr: ArgAddr, type: RetTy, Context&: getContext(), BaseInfo, TBAAInfo);
      EmitStoreOfScalar(
          value: EmitLoadOfScalar(lvalue: MakeAddrLValue(Addr: ReturnValue, T: RetTy), Loc: EndLoc), lvalue: ArgVal,
          /*isInit*/ true);
      break;
    }
    }
    break;
  }

  case ABIArgInfo::Extend:
  case ABIArgInfo::Direct:
    if (RetAI.getCoerceToType() == ConvertType(T: RetTy) &&
        RetAI.getDirectOffset() == 0) {
      // The internal return value temp always will have pointer-to-return-type
      // type, just do a load.

      // If there is a dominating store to ReturnValue, we can elide
      // the load, zap the store, and usually zap the alloca.
      if (llvm::StoreInst *SI = findDominatingStoreToReturnValue(CGF&: *this)) {
        // Reuse the debug location from the store unless there is
        // cleanup code to be emitted between the store and return
        // instruction.
        if (EmitRetDbgLoc && !AutoreleaseResult)
          RetDbgLoc = SI->getDebugLoc();
        // Get the stored value and nuke the now-dead store.
        RV = SI->getValueOperand();
        SI->eraseFromParent();

        // Otherwise, we have to do a simple load.
      } else {
        RV = Builder.CreateLoad(Addr: ReturnValue);
      }
    } else {
      // If the value is offset in memory, apply the offset now.
      Address V = emitAddressAtOffset(CGF&: *this, addr: ReturnValue, info: RetAI);

      RV = CreateCoercedLoad(Src: V, SrcFETy: RetTy, Ty: RetAI.getCoerceToType(), CGF&: *this);
    }

    // In ARC, end functions that return a retainable type with a call
    // to objc_autoreleaseReturnValue.
    if (AutoreleaseResult) {
#ifndef NDEBUG
      // Type::isObjCRetainabletype has to be called on a QualType that hasn't
      // been stripped of the typedefs, so we cannot use RetTy here. Get the
      // original return type of FunctionDecl, CurCodeDecl, and BlockDecl from
      // CurCodeDecl or BlockInfo.
      QualType RT;

      if (auto *FD = dyn_cast<FunctionDecl>(CurCodeDecl))
        RT = FD->getReturnType();
      else if (auto *MD = dyn_cast<ObjCMethodDecl>(CurCodeDecl))
        RT = MD->getReturnType();
      else if (isa<BlockDecl>(CurCodeDecl))
        RT = BlockInfo->BlockExpression->getFunctionType()->getReturnType();
      else
        llvm_unreachable("Unexpected function/method type");

      assert(getLangOpts().ObjCAutoRefCount && !FI.isReturnsRetained() &&
             RT->isObjCRetainableType());
#endif
      RV = emitAutoreleaseOfResult(CGF&: *this, result: RV);
    }

    break;

  case ABIArgInfo::Ignore:
    break;

  case ABIArgInfo::CoerceAndExpand: {
    auto coercionType = RetAI.getCoerceAndExpandType();
    auto unpaddedCoercionType = RetAI.getUnpaddedCoerceAndExpandType();
    auto *unpaddedStruct = dyn_cast<llvm::StructType>(Val: unpaddedCoercionType);

    // Load all of the coerced elements out into results.
    llvm::SmallVector<llvm::Value *, 4> results;
    Address addr = ReturnValue.withElementType(ElemTy: coercionType);
    unsigned unpaddedIndex = 0;
    for (unsigned i = 0, e = coercionType->getNumElements(); i != e; ++i) {
      auto coercedEltType = coercionType->getElementType(N: i);
      // Padding elements exist only for layout; they carry no value.
      if (ABIArgInfo::isPaddingForCoerceAndExpand(eltType: coercedEltType))
        continue;

      auto eltAddr = Builder.CreateStructGEP(Addr: addr, Index: i);
      llvm::Value *elt = CreateCoercedLoad(
          Src: eltAddr, SrcFETy: RetTy,
          Ty: unpaddedStruct ? unpaddedStruct->getElementType(N: unpaddedIndex++)
                          : unpaddedCoercionType,
          CGF&: *this);
      results.push_back(Elt: elt);
    }

    // If we have one result, it's the single direct result type.
    if (results.size() == 1) {
      RV = results[0];

      // Otherwise, we need to make a first-class aggregate.
    } else {
      // Construct a return type that lacks padding elements.
      llvm::Type *returnType = RetAI.getUnpaddedCoerceAndExpandType();

      RV = llvm::PoisonValue::get(T: returnType);
      for (unsigned i = 0, e = results.size(); i != e; ++i) {
        RV = Builder.CreateInsertValue(Agg: RV, Val: results[i], Idxs: i);
      }
    }
    break;
  }
  case ABIArgInfo::TargetSpecific: {
    // Delegate the load entirely to the target's ABIInfo.
    Address V = emitAddressAtOffset(CGF&: *this, addr: ReturnValue, info: RetAI);
    RV = CGM.getABIInfo().createCoercedLoad(SrcAddr: V, AI: RetAI, CGF&: *this);
    break;
  }
  case ABIArgInfo::Expand:
  case ABIArgInfo::IndirectAliased:
    llvm_unreachable("Invalid ABI kind for return argument");
  }

  llvm::Instruction *Ret;
  if (RV) {
    if (CurFuncDecl && CurFuncDecl->hasAttr<CmseNSEntryAttr>()) {
      // For certain return types, clear padding bits, as they may reveal
      // sensitive information.
      // Small struct/union types are passed as integers.
      auto *ITy = dyn_cast<llvm::IntegerType>(Val: RV->getType());
      if (ITy != nullptr && isa<RecordType>(Val: RetTy.getCanonicalType()))
        RV = EmitCMSEClearRecord(Src: RV, ITy, QTy: RetTy);
    }
    EmitReturnValueCheck(RV);
    Ret = Builder.CreateRet(V: RV);
  } else {
    Ret = Builder.CreateRetVoid();
  }

  if (RetDbgLoc)
    Ret->setDebugLoc(std::move(RetDbgLoc));

  // Attach the ret to its Key Instructions source atom (a specific one if
  // the caller provided it, otherwise a fresh one).
  llvm::Value *Backup = RV ? Ret->getOperand(i: 0) : nullptr;
  if (RetKeyInstructionsSourceAtom)
    addInstToSpecificSourceAtom(KeyInstruction: Ret, Backup, Atom: RetKeyInstructionsSourceAtom);
  else
    addInstToNewSourceAtom(KeyInstruction: Ret, Backup);
}
4317
/// Emit a sanitizer check that the return value \p RV is non-null, when the
/// function carries a returns_nonnull attribute or a nullability annotation
/// and the corresponding sanitizer is enabled.
void CodeGenFunction::EmitReturnValueCheck(llvm::Value *RV) {
  // A current decl may not be available when emitting vtable thunks.
  if (!CurCodeDecl)
    return;

  // If the return block isn't reachable, neither is this check, so don't emit
  // it.
  if (ReturnBlock.isValid() && ReturnBlock.getBlock()->use_empty())
    return;

  ReturnsNonNullAttr *RetNNAttr = nullptr;
  if (SanOpts.has(K: SanitizerKind::ReturnsNonnullAttribute))
    RetNNAttr = CurCodeDecl->getAttr<ReturnsNonNullAttr>();

  if (!RetNNAttr && !requiresReturnValueNullabilityCheck())
    return;

  // Prefer the returns_nonnull attribute if it's present.
  SourceLocation AttrLoc;
  SanitizerKind::SanitizerOrdinal CheckKind;
  SanitizerHandler Handler;
  if (RetNNAttr) {
    assert(!requiresReturnValueNullabilityCheck() &&
           "Cannot check nullability and the nonnull attribute");
    AttrLoc = RetNNAttr->getLocation();
    CheckKind = SanitizerKind::SO_ReturnsNonnullAttribute;
    Handler = SanitizerHandler::NonnullReturn;
  } else {
    // Point the diagnostic at the nullability annotation on the return
    // type, if one can be found in the declarator's type source info.
    if (auto *DD = dyn_cast<DeclaratorDecl>(Val: CurCodeDecl))
      if (auto *TSI = DD->getTypeSourceInfo())
        if (auto FTL = TSI->getTypeLoc().getAsAdjusted<FunctionTypeLoc>())
          AttrLoc = FTL.getReturnLoc().findNullabilityLoc();
    CheckKind = SanitizerKind::SO_NullabilityReturn;
    Handler = SanitizerHandler::NullabilityReturn;
  }

  SanitizerDebugLocation SanScope(this, {CheckKind}, Handler);

  // Make sure the "return" source location is valid. If we're checking a
  // nullability annotation, make sure the preconditions for the check are met.
  llvm::BasicBlock *Check = createBasicBlock(name: "nullcheck");
  llvm::BasicBlock *NoCheck = createBasicBlock(name: "no.nullcheck");
  llvm::Value *SLocPtr = Builder.CreateLoad(Addr: ReturnLocation, Name: "return.sloc.load");
  llvm::Value *CanNullCheck = Builder.CreateIsNotNull(Arg: SLocPtr);
  if (requiresReturnValueNullabilityCheck())
    CanNullCheck =
        Builder.CreateAnd(LHS: CanNullCheck, RHS: RetValNullabilityPrecondition);
  Builder.CreateCondBr(Cond: CanNullCheck, True: Check, False: NoCheck);
  EmitBlock(BB: Check);

  // Now do the null check.
  llvm::Value *Cond = Builder.CreateIsNotNull(Arg: RV);
  llvm::Constant *StaticData[] = {EmitCheckSourceLocation(Loc: AttrLoc)};
  llvm::Value *DynamicData[] = {SLocPtr};
  EmitCheck(Checked: std::make_pair(x&: Cond, y&: CheckKind), Check: Handler, StaticArgs: StaticData, DynamicArgs: DynamicData);

  EmitBlock(BB: NoCheck);

#ifndef NDEBUG
  // The return location should not be used after the check has been emitted.
  ReturnLocation = Address::invalid();
#endif
}
4381
4382static bool isInAllocaArgument(CGCXXABI &ABI, QualType type) {
4383 const CXXRecordDecl *RD = type->getAsCXXRecordDecl();
4384 return RD && ABI.getRecordArgABI(RD) == CGCXXABI::RAA_DirectInMemory;
4385}
4386
4387static AggValueSlot createPlaceholderSlot(CodeGenFunction &CGF, QualType Ty) {
4388 // FIXME: Generate IR in one pass, rather than going back and fixing up these
4389 // placeholders.
4390 llvm::Type *IRTy = CGF.ConvertTypeForMem(T: Ty);
4391 llvm::Type *IRPtrTy = llvm::PointerType::getUnqual(C&: CGF.getLLVMContext());
4392 llvm::Value *Placeholder = llvm::PoisonValue::get(T: IRPtrTy);
4393
4394 // FIXME: When we generate this IR in one pass, we shouldn't need
4395 // this win32-specific alignment hack.
4396 CharUnits Align = CharUnits::fromQuantity(Quantity: 4);
4397 Placeholder = CGF.Builder.CreateAlignedLoad(Ty: IRPtrTy, Addr: Placeholder, Align);
4398
4399 return AggValueSlot::forAddr(
4400 addr: Address(Placeholder, IRTy, Align), quals: Ty.getQualifiers(),
4401 isDestructed: AggValueSlot::IsNotDestructed, needsGC: AggValueSlot::DoesNotNeedGCBarriers,
4402 isAliased: AggValueSlot::IsNotAliased, mayOverlap: AggValueSlot::DoesNotOverlap);
4403}
4404
/// Re-emit an already-lowered parameter \p param of the current function as a
/// call argument in \p args, for delegating the call onward with the same
/// arguments (e.g. delegating constructors, thunk-like forwarding).
void CodeGenFunction::EmitDelegateCallArg(CallArgList &args,
                                          const VarDecl *param,
                                          SourceLocation loc) {
  // StartFunction converted the ABI-lowered parameter(s) into a
  // local alloca. We need to turn that into an r-value suitable
  // for EmitCall.
  Address local = GetAddrOfLocalVar(VD: param);

  QualType type = param->getType();

  // GetAddrOfLocalVar returns a pointer-to-pointer for references,
  // but the argument needs to be the original pointer.
  if (type->isReferenceType()) {
    args.add(rvalue: RValue::get(V: Builder.CreateLoad(Addr: local)), type);

    // In ARC, move out of consumed arguments so that the release cleanup
    // entered by StartFunction doesn't cause an over-release. This isn't
    // optimal -O0 code generation, but it should get cleaned up when
    // optimization is enabled. This also assumes that delegate calls are
    // performed exactly once for a set of arguments, but that should be safe.
  } else if (getLangOpts().ObjCAutoRefCount &&
             param->hasAttr<NSConsumedAttr>() && type->isObjCRetainableType()) {
    // Null out the local slot so the cleanup releases null instead of the
    // value being handed off to the callee.
    llvm::Value *ptr = Builder.CreateLoad(Addr: local);
    auto null =
        llvm::ConstantPointerNull::get(T: cast<llvm::PointerType>(Val: ptr->getType()));
    Builder.CreateStore(Val: null, Addr: local);
    args.add(rvalue: RValue::get(V: ptr), type);

    // For the most part, we just need to load the alloca, except that
    // aggregate r-values are actually pointers to temporaries.
  } else {
    args.add(rvalue: convertTempToRValue(addr: local, type, Loc: loc), type);
  }

  // Deactivate the cleanup for the callee-destructed param that was pushed.
  if (type->isRecordType() && !CurFuncIsThunk &&
      type->castAsRecordDecl()->isParamDestroyedInCallee() &&
      param->needsDestruction(Ctx: getContext())) {
    EHScopeStack::stable_iterator cleanup =
        CalleeDestructedParamCleanups.lookup(Val: cast<ParmVarDecl>(Val: param));
    assert(cleanup.isValid() &&
           "cleanup for callee-destructed param not recorded");
    // This unreachable is a temporary marker which will be removed later.
    llvm::Instruction *isActive = Builder.CreateUnreachable();
    args.addArgCleanupDeactivation(Cleanup: cleanup, IsActiveIP: isActive);
  }
}
4452
4453static bool isProvablyNull(llvm::Value *addr) {
4454 return llvm::isa_and_nonnull<llvm::ConstantPointerNull>(Val: addr);
4455}
4456
4457static bool isProvablyNonNull(Address Addr, CodeGenFunction &CGF) {
4458 return llvm::isKnownNonZero(V: Addr.getBasePointer(), Q: CGF.CGM.getDataLayout());
4459}
4460
/// Emit the actual writing-back of a writeback: copy the value from the
/// temporary back into the original l-value after the call.
static void emitWriteback(CodeGenFunction &CGF,
                          const CallArgList::Writeback &writeback) {
  const LValue &srcLV = writeback.Source;
  Address srcAddr = srcLV.getAddress();
  assert(!isProvablyNull(srcAddr.getBasePointer()) &&
         "shouldn't have writeback for provably null argument");

  // If the writeback carries its own expression, emitting that expression is
  // the entire writeback; just end the temporary's lifetime afterwards.
  if (writeback.WritebackExpr) {
    CGF.EmitIgnoredExpr(E: writeback.WritebackExpr);
    CGF.EmitLifetimeEnd(Addr: writeback.Temporary.getBasePointer());
    return;
  }

  llvm::BasicBlock *contBB = nullptr;

  // If the argument wasn't provably non-null, we need to null check
  // before doing the store.
  bool provablyNonNull = isProvablyNonNull(Addr: srcAddr, CGF);

  if (!provablyNonNull) {
    llvm::BasicBlock *writebackBB = CGF.createBasicBlock(name: "icr.writeback");
    contBB = CGF.createBasicBlock(name: "icr.done");

    llvm::Value *isNull = CGF.Builder.CreateIsNull(Addr: srcAddr, Name: "icr.isnull");
    CGF.Builder.CreateCondBr(Cond: isNull, True: contBB, False: writebackBB);
    CGF.EmitBlock(BB: writebackBB);
  }

  // Load the value to writeback.
  llvm::Value *value = CGF.Builder.CreateLoad(Addr: writeback.Temporary);

  // Cast it back, in case we're writing an id to a Foo* or something.
  value = CGF.Builder.CreateBitCast(V: value, DestTy: srcAddr.getElementType(),
                                    Name: "icr.writeback-cast");

  // Perform the writeback.

  // If we have a "to use" value, it's something we need to emit a use
  // of. This has to be carefully threaded in: if it's done after the
  // release it's potentially undefined behavior (and the optimizer
  // will ignore it), and if it happens before the retain then the
  // optimizer could move the release there.
  if (writeback.ToUse) {
    assert(srcLV.getObjCLifetime() == Qualifiers::OCL_Strong);

    // Retain the new value. No need to block-copy here: the block's
    // being passed up the stack.
    value = CGF.EmitARCRetainNonBlock(value);

    // Emit the intrinsic use here.
    CGF.EmitARCIntrinsicUse(values: writeback.ToUse);

    // Load the old value (primitively).
    llvm::Value *oldValue = CGF.EmitLoadOfScalar(lvalue: srcLV, Loc: SourceLocation());

    // Put the new value in place (primitively).
    CGF.EmitStoreOfScalar(value, lvalue: srcLV, /*init*/ isInit: false);

    // Release the old value.
    CGF.EmitARCRelease(value: oldValue, precise: srcLV.isARCPreciseLifetime());

    // Otherwise, we can just do a normal lvalue store.
  } else {
    CGF.EmitStoreThroughLValue(Src: RValue::get(V: value), Dst: srcLV);
  }

  // Jump to the continuation block.
  if (!provablyNonNull)
    CGF.EmitBlock(BB: contBB);
}
4532
4533static void deactivateArgCleanupsBeforeCall(CodeGenFunction &CGF,
4534 const CallArgList &CallArgs) {
4535 ArrayRef<CallArgList::CallArgCleanup> Cleanups =
4536 CallArgs.getCleanupsToDeactivate();
4537 // Iterate in reverse to increase the likelihood of popping the cleanup.
4538 for (const auto &I : llvm::reverse(C&: Cleanups)) {
4539 CGF.DeactivateCleanupBlock(Cleanup: I.Cleanup, DominatingIP: I.IsActiveIP);
4540 I.IsActiveIP->eraseFromParent();
4541 }
4542}
4543
4544static const Expr *maybeGetUnaryAddrOfOperand(const Expr *E) {
4545 if (const UnaryOperator *uop = dyn_cast<UnaryOperator>(Val: E->IgnoreParens()))
4546 if (uop->getOpcode() == UO_AddrOf)
4547 return uop->getSubExpr();
4548 return nullptr;
4549}
4550
/// Emit an argument that's being passed call-by-writeback. That is,
/// we are passing the address of an __autoreleased temporary; it
/// might be copy-initialized with the current value of the given
/// address, but it will definitely be copied out of after the call.
static void emitWritebackArg(CodeGenFunction &CGF, CallArgList &args,
                             const ObjCIndirectCopyRestoreExpr *CRE) {
  LValue srcLV;

  // Make an optimistic effort to emit the address as an l-value.
  // This can fail if the argument expression is more complicated.
  if (const Expr *lvExpr = maybeGetUnaryAddrOfOperand(E: CRE->getSubExpr())) {
    srcLV = CGF.EmitLValue(E: lvExpr);

    // Otherwise, just emit it as a scalar.
  } else {
    Address srcAddr = CGF.EmitPointerWithAlignment(Addr: CRE->getSubExpr());

    QualType srcAddrType =
        CRE->getSubExpr()->getType()->castAs<PointerType>()->getPointeeType();
    srcLV = CGF.MakeAddrLValue(Addr: srcAddr, T: srcAddrType);
  }
  Address srcAddr = srcLV.getAddress();

  // The dest and src types don't necessarily match in LLVM terms
  // because of the crazy ObjC compatibility rules.

  llvm::PointerType *destType =
      cast<llvm::PointerType>(Val: CGF.ConvertType(T: CRE->getType()));
  llvm::Type *destElemType =
      CGF.ConvertTypeForMem(T: CRE->getType()->getPointeeType());

  // If the address is a constant null, just pass the appropriate null.
  if (isProvablyNull(addr: srcAddr.getBasePointer())) {
    args.add(rvalue: RValue::get(V: llvm::ConstantPointerNull::get(T: destType)),
             type: CRE->getType());
    return;
  }

  // Create the temporary.
  Address temp =
      CGF.CreateTempAlloca(Ty: destElemType, align: CGF.getPointerAlign(), Name: "icr.temp");
  // Loading an l-value can introduce a cleanup if the l-value is __weak,
  // and that cleanup will be conditional if we can't prove that the l-value
  // isn't null, so we need to register a dominating point so that the cleanups
  // system will make valid IR.
  CodeGenFunction::ConditionalEvaluation condEval(CGF);

  // Zero-initialize it if we're not doing a copy-initialization.
  bool shouldCopy = CRE->shouldCopy();
  if (!shouldCopy) {
    llvm::Value *null =
        llvm::ConstantPointerNull::get(T: cast<llvm::PointerType>(Val: destElemType));
    CGF.Builder.CreateStore(Val: null, Addr: temp);
  }

  llvm::BasicBlock *contBB = nullptr;
  llvm::BasicBlock *originBB = nullptr;

  // If the address is *not* known to be non-null, we need to switch.
  llvm::Value *finalArgument;

  bool provablyNonNull = isProvablyNonNull(Addr: srcAddr, CGF);

  if (provablyNonNull) {
    finalArgument = temp.emitRawPointer(CGF);
  } else {
    // Pass null through unchanged; otherwise pass the temporary's address.
    llvm::Value *isNull = CGF.Builder.CreateIsNull(Addr: srcAddr, Name: "icr.isnull");

    finalArgument = CGF.Builder.CreateSelect(
        C: isNull, True: llvm::ConstantPointerNull::get(T: destType),
        False: temp.emitRawPointer(CGF), Name: "icr.argument");

    // If we need to copy, then the load has to be conditional, which
    // means we need control flow.
    if (shouldCopy) {
      originBB = CGF.Builder.GetInsertBlock();
      contBB = CGF.createBasicBlock(name: "icr.cont");
      llvm::BasicBlock *copyBB = CGF.createBasicBlock(name: "icr.copy");
      CGF.Builder.CreateCondBr(Cond: isNull, True: contBB, False: copyBB);
      CGF.EmitBlock(BB: copyBB);
      condEval.begin(CGF);
    }
  }

  llvm::Value *valueToUse = nullptr;

  // Perform a copy if necessary.
  if (shouldCopy) {
    RValue srcRV = CGF.EmitLoadOfLValue(V: srcLV, Loc: SourceLocation());
    assert(srcRV.isScalar());

    llvm::Value *src = srcRV.getScalarVal();
    src = CGF.Builder.CreateBitCast(V: src, DestTy: destElemType, Name: "icr.cast");

    // Use an ordinary store, not a store-to-lvalue.
    CGF.Builder.CreateStore(Val: src, Addr: temp);

    // If optimization is enabled, and the value was held in a
    // __strong variable, we need to tell the optimizer that this
    // value has to stay alive until we're doing the store back.
    // This is because the temporary is effectively unretained,
    // and so otherwise we can violate the high-level semantics.
    if (CGF.CGM.getCodeGenOpts().OptimizationLevel != 0 &&
        srcLV.getObjCLifetime() == Qualifiers::OCL_Strong) {
      valueToUse = src;
    }
  }

  // Finish the control flow if we needed it.
  if (shouldCopy && !provablyNonNull) {
    llvm::BasicBlock *copyBB = CGF.Builder.GetInsertBlock();
    CGF.EmitBlock(BB: contBB);

    // Make a phi for the value to intrinsically use.
    if (valueToUse) {
      llvm::PHINode *phiToUse =
          CGF.Builder.CreatePHI(Ty: valueToUse->getType(), NumReservedValues: 2, Name: "icr.to-use");
      phiToUse->addIncoming(V: valueToUse, BB: copyBB);
      phiToUse->addIncoming(V: llvm::PoisonValue::get(T: valueToUse->getType()),
                            BB: originBB);
      valueToUse = phiToUse;
    }

    condEval.end(CGF);
  }

  // Record the writeback to perform after the call, then pass the argument.
  args.addWriteback(srcLV, temporary: temp, toUse: valueToUse);
  args.add(rvalue: RValue::get(V: finalArgument), type: CRE->getType());
}
4680
4681void CallArgList::allocateArgumentMemory(CodeGenFunction &CGF) {
4682 assert(!StackBase);
4683
4684 // Save the stack.
4685 StackBase = CGF.Builder.CreateStackSave(Name: "inalloca.save");
4686}
4687
4688void CallArgList::freeArgumentMemory(CodeGenFunction &CGF) const {
4689 if (StackBase) {
4690 // Restore the stack after the call.
4691 CGF.Builder.CreateStackRestore(Ptr: StackBase);
4692 }
4693}
4694
/// Emit a runtime null check for an argument passed to a parameter that is
/// declared nonnull (via the nonnull attribute or a _Nonnull nullability
/// annotation), when -fsanitize=nonnull-attribute or
/// -fsanitize=nullability-arg is enabled.
///
/// \param RV      the already-emitted argument value.
/// \param ArgType the type of the argument expression.
/// \param ArgLoc  source location of the argument, used in diagnostics.
/// \param AC      the callee (function or ObjC method), if known.
/// \param ParmNum index of the argument at the call site (including any
///                parameters the caller skipped).
void CodeGenFunction::EmitNonNullArgCheck(RValue RV, QualType ArgType,
                                          SourceLocation ArgLoc,
                                          AbstractCallee AC, unsigned ParmNum) {
  // Nothing to do without a callee decl or an active nonnull sanitizer.
  if (!AC.getDecl() || !(SanOpts.has(K: SanitizerKind::NonnullAttribute) ||
                         SanOpts.has(K: SanitizerKind::NullabilityArg)))
    return;

  // The param decl may be missing in a variadic function.
  auto PVD = ParmNum < AC.getNumParams() ? AC.getParamDecl(I: ParmNum) : nullptr;
  unsigned ArgNo = PVD ? PVD->getFunctionScopeIndex() : ParmNum;

  // Prefer the nonnull attribute if it's present.
  const NonNullAttr *NNAttr = nullptr;
  if (SanOpts.has(K: SanitizerKind::NonnullAttribute))
    NNAttr = getNonNullAttr(FD: AC.getDecl(), PVD, ArgType, ArgNo);

  // Otherwise fall back to a _Nonnull annotation on the parameter's type,
  // when the nullability sanitizer is on and the parameter is visible.
  bool CanCheckNullability = false;
  if (SanOpts.has(K: SanitizerKind::NullabilityArg) && !NNAttr && PVD &&
      !PVD->getType()->isRecordType()) {
    auto Nullability = PVD->getType()->getNullability();
    CanCheckNullability = Nullability &&
                          *Nullability == NullabilityKind::NonNull &&
                          PVD->getTypeSourceInfo();
  }

  if (!NNAttr && !CanCheckNullability)
    return;

  // Select the attribute location, sanitizer kind, and runtime handler for
  // whichever check applies.
  SourceLocation AttrLoc;
  SanitizerKind::SanitizerOrdinal CheckKind;
  SanitizerHandler Handler;
  if (NNAttr) {
    AttrLoc = NNAttr->getLocation();
    CheckKind = SanitizerKind::SO_NonnullAttribute;
    Handler = SanitizerHandler::NonnullArg;
  } else {
    AttrLoc = PVD->getTypeSourceInfo()->getTypeLoc().findNullabilityLoc();
    CheckKind = SanitizerKind::SO_NullabilityArg;
    Handler = SanitizerHandler::NullabilityArg;
  }

  // Emit the null check. The static data passed to the runtime is the
  // argument location, the attribute location, and the 1-based arg index.
  SanitizerDebugLocation SanScope(this, {CheckKind}, Handler);
  llvm::Value *Cond = EmitNonNullRValueCheck(RV, T: ArgType);
  llvm::Constant *StaticData[] = {
      EmitCheckSourceLocation(Loc: ArgLoc),
      EmitCheckSourceLocation(Loc: AttrLoc),
      llvm::ConstantInt::get(Ty: Int32Ty, V: ArgNo + 1),
  };
  EmitCheck(Checked: std::make_pair(x&: Cond, y&: CheckKind), Check: Handler, StaticArgs: StaticData, DynamicArgs: {});
}
4745
4746void CodeGenFunction::EmitNonNullArgCheck(Address Addr, QualType ArgType,
4747 SourceLocation ArgLoc,
4748 AbstractCallee AC, unsigned ParmNum) {
4749 if (!AC.getDecl() || !(SanOpts.has(K: SanitizerKind::NonnullAttribute) ||
4750 SanOpts.has(K: SanitizerKind::NullabilityArg)))
4751 return;
4752
4753 EmitNonNullArgCheck(RV: RValue::get(Addr, CGF&: *this), ArgType, ArgLoc, AC, ParmNum);
4754}
4755
4756// Check if the call is going to use the inalloca convention. This needs to
4757// agree with CGFunctionInfo::usesInAlloca. The CGFunctionInfo is arranged
4758// later, so we can't check it directly.
4759static bool hasInAllocaArgs(CodeGenModule &CGM, CallingConv ExplicitCC,
4760 ArrayRef<QualType> ArgTypes) {
4761 // The Swift calling conventions don't go through the target-specific
4762 // argument classification, they never use inalloca.
4763 // TODO: Consider limiting inalloca use to only calling conventions supported
4764 // by MSVC.
4765 if (ExplicitCC == CC_Swift || ExplicitCC == CC_SwiftAsync)
4766 return false;
4767 if (!CGM.getTarget().getCXXABI().isMicrosoft())
4768 return false;
4769 return llvm::any_of(Range&: ArgTypes, P: [&](QualType Ty) {
4770 return isInAllocaArgument(ABI&: CGM.getCXXABI(), type: Ty);
4771 });
4772}
4773
4774#ifndef NDEBUG
4775// Determine whether the given argument is an Objective-C method
4776// that may have type parameters in its signature.
4777static bool isObjCMethodWithTypeParams(const ObjCMethodDecl *method) {
4778 const DeclContext *dc = method->getDeclContext();
4779 if (const ObjCInterfaceDecl *classDecl = dyn_cast<ObjCInterfaceDecl>(dc)) {
4780 return classDecl->getTypeParamListAsWritten();
4781 }
4782
4783 if (const ObjCCategoryDecl *catDecl = dyn_cast<ObjCCategoryDecl>(dc)) {
4784 return catDecl->getTypeParamList();
4785 }
4786
4787 return false;
4788}
4789#endif
4790
/// EmitCallArgs - Emit call arguments for a function.
///
/// Collects the parameter types (from the prototype when available, falling
/// back to the argument expressions for variadic/unprototyped tails), picks
/// the ABI-mandated evaluation order, sets up inalloca argument memory if
/// needed, and emits each argument — including any implicit
/// pass_object_size companions and nonnull sanitizer checks.
void CodeGenFunction::EmitCallArgs(
    CallArgList &Args, PrototypeWrapper Prototype,
    llvm::iterator_range<CallExpr::const_arg_iterator> ArgRange,
    AbstractCallee AC, unsigned ParamsToSkip, EvaluationOrder Order) {
  SmallVector<QualType, 16> ArgTypes;

  assert((ParamsToSkip == 0 || Prototype.P) &&
         "Can't skip parameters if type info is not provided");

  // This variable only captures *explicitly* written conventions, not those
  // applied by default via command line flags or target defaults, such as
  // thiscall, aapcs, stdcall via -mrtd, etc. Computing that correctly would
  // require knowing if this is a C++ instance method or being able to see
  // unprototyped FunctionTypes.
  CallingConv ExplicitCC = CC_C;

  // First, if a prototype was provided, use those argument types.
  bool IsVariadic = false;
  if (Prototype.P) {
    // The prototype is either an ObjC method or a function prototype.
    const auto *MD = dyn_cast<const ObjCMethodDecl *>(Val&: Prototype.P);
    if (MD) {
      IsVariadic = MD->isVariadic();
      ExplicitCC = getCallingConventionForDecl(
          D: MD, IsTargetDefaultMSABI: CGM.getTarget().getTriple().isOSWindows());
      ArgTypes.assign(in_start: MD->param_type_begin() + ParamsToSkip,
                      in_end: MD->param_type_end());
    } else {
      const auto *FPT = cast<const FunctionProtoType *>(Val&: Prototype.P);
      IsVariadic = FPT->isVariadic();
      ExplicitCC = FPT->getExtInfo().getCC();
      ArgTypes.assign(in_start: FPT->param_type_begin() + ParamsToSkip,
                      in_end: FPT->param_type_end());
    }

#ifndef NDEBUG
    // Check that the prototyped types match the argument expression types.
    bool isGenericMethod = MD && isObjCMethodWithTypeParams(MD);
    CallExpr::const_arg_iterator Arg = ArgRange.begin();
    for (QualType Ty : ArgTypes) {
      assert(Arg != ArgRange.end() && "Running over edge of argument list!");
      QualType ParamTy = Ty.getNonReferenceType();
      QualType ArgTy = (*Arg)->getType();
      // Strip overflow-behavior wrappers before comparing canonical types.
      if (const auto *OBT = ParamTy->getAs<OverflowBehaviorType>())
        ParamTy = OBT->getUnderlyingType();
      if (const auto *OBT = ArgTy->getAs<OverflowBehaviorType>())
        ArgTy = OBT->getUnderlyingType();
      assert((isGenericMethod || Ty->isVariablyModifiedType() ||
              ParamTy->isObjCRetainableType() ||
              getContext().getCanonicalType(ParamTy).getTypePtr() ==
                  getContext().getCanonicalType(ArgTy).getTypePtr()) &&
             "type mismatch in call argument!");
      ++Arg;
    }

    // Either we've emitted all the call args, or we have a call to variadic
    // function.
    assert((Arg == ArgRange.end() || IsVariadic) &&
           "Extra arguments in non-variadic function!");
#endif
  }

  // If we still have any arguments, emit them using the type of the argument.
  for (auto *A : llvm::drop_begin(RangeOrContainer&: ArgRange, N: ArgTypes.size()))
    ArgTypes.push_back(Elt: IsVariadic ? getVarArgType(Arg: A) : A->getType());
  assert((int)ArgTypes.size() == (ArgRange.end() - ArgRange.begin()));

  // We must evaluate arguments from right to left in the MS C++ ABI,
  // because arguments are destroyed left to right in the callee. As a special
  // case, there are certain language constructs that require left-to-right
  // evaluation, and in those cases we consider the evaluation order requirement
  // to trump the "destruction order is reverse construction order" guarantee.
  bool LeftToRight =
      CGM.getTarget().getCXXABI().areArgsDestroyedLeftToRightInCallee()
          ? Order == EvaluationOrder::ForceLeftToRight
          : Order != EvaluationOrder::ForceRightToLeft;

  // If parameter I carries pass_object_size, emit the implicit size argument
  // right after the pointer argument it describes.
  auto MaybeEmitImplicitObjectSize = [&](unsigned I, const Expr *Arg,
                                         RValue EmittedArg) {
    if (!AC.hasFunctionDecl() || I >= AC.getNumParams())
      return;
    auto *PS = AC.getParamDecl(I)->getAttr<PassObjectSizeAttr>();
    if (PS == nullptr)
      return;

    const auto &Context = getContext();
    auto SizeTy = Context.getSizeType();
    auto T = Builder.getIntNTy(N: Context.getTypeSize(T: SizeTy));
    assert(EmittedArg.getScalarVal() && "We emitted nothing for the arg?");
    llvm::Value *V = evaluateOrEmitBuiltinObjectSize(
        E: Arg, Type: PS->getType(), ResType: T, EmittedE: EmittedArg.getScalarVal(), IsDynamic: PS->isDynamic());
    Args.add(rvalue: RValue::get(V), type: SizeTy);
    // If we're emitting args in reverse, be sure to do so with
    // pass_object_size, as well.
    if (!LeftToRight)
      std::swap(a&: Args.back(), b&: *(&Args.back() - 1));
  };

  // Insert a stack save if we're going to need any inalloca args.
  if (hasInAllocaArgs(CGM, ExplicitCC, ArgTypes)) {
    assert(getTarget().getTriple().getArch() == llvm::Triple::x86 &&
           "inalloca only supported on x86");
    Args.allocateArgumentMemory(CGF&: *this);
  }

  // Evaluate each argument in the appropriate order.
  size_t CallArgsStart = Args.size();
  for (unsigned I = 0, E = ArgTypes.size(); I != E; ++I) {
    unsigned Idx = LeftToRight ? I : E - I - 1;
    CallExpr::const_arg_iterator Arg = ArgRange.begin() + Idx;
    unsigned InitialArgSize = Args.size();
    // If *Arg is an ObjCIndirectCopyRestoreExpr, check that either the types of
    // the argument and parameter match or the objc method is parameterized.
    assert((!isa<ObjCIndirectCopyRestoreExpr>(*Arg) ||
            getContext().hasSameUnqualifiedType((*Arg)->getType(),
                                                ArgTypes[Idx]) ||
            (isa<ObjCMethodDecl>(AC.getDecl()) &&
             isObjCMethodWithTypeParams(cast<ObjCMethodDecl>(AC.getDecl())))) &&
           "Argument and parameter types don't match");
    EmitCallArg(args&: Args, E: *Arg, ArgType: ArgTypes[Idx]);
    // In particular, we depend on it being the last arg in Args, and the
    // objectsize bits depend on there only being one arg if !LeftToRight.
    assert(InitialArgSize + 1 == Args.size() &&
           "The code below depends on only adding one arg per EmitCallArg");
    (void)InitialArgSize;
    // Since pointer argument are never emitted as LValue, it is safe to emit
    // non-null argument check for r-value only.
    if (!Args.back().hasLValue()) {
      RValue RVArg = Args.back().getKnownRValue();
      EmitNonNullArgCheck(RV: RVArg, ArgType: ArgTypes[Idx], ArgLoc: (*Arg)->getExprLoc(), AC,
                          ParmNum: ParamsToSkip + Idx);
      // @llvm.objectsize should never have side-effects and shouldn't need
      // destruction/cleanups, so we can safely "emit" it after its arg,
      // regardless of right-to-leftness
      MaybeEmitImplicitObjectSize(Idx, *Arg, RVArg);
    }
  }

  if (!LeftToRight) {
    // Un-reverse the arguments we just evaluated so they match up with the LLVM
    // IR function.
    std::reverse(first: Args.begin() + CallArgsStart, last: Args.end());

    // Reverse the writebacks to match the MSVC ABI.
    Args.reverseWritebacks();
  }
}
4938
4939namespace {
4940
4941struct DestroyUnpassedArg final : EHScopeStack::Cleanup {
4942 DestroyUnpassedArg(Address Addr, QualType Ty) : Addr(Addr), Ty(Ty) {}
4943
4944 Address Addr;
4945 QualType Ty;
4946
4947 void Emit(CodeGenFunction &CGF, Flags flags) override {
4948 QualType::DestructionKind DtorKind = Ty.isDestructedType();
4949 if (DtorKind == QualType::DK_cxx_destructor) {
4950 const CXXDestructorDecl *Dtor = Ty->getAsCXXRecordDecl()->getDestructor();
4951 assert(!Dtor->isTrivial());
4952 CGF.EmitCXXDestructorCall(D: Dtor, Type: Dtor_Complete, /*for vbase*/ ForVirtualBase: false,
4953 /*Delegating=*/false, This: Addr, ThisTy: Ty);
4954 } else {
4955 CGF.callCStructDestructor(Dst: CGF.MakeAddrLValue(Addr, T: Ty));
4956 }
4957 }
4958};
4959
4960} // end anonymous namespace
4961
4962RValue CallArg::getRValue(CodeGenFunction &CGF) const {
4963 if (!HasLV)
4964 return RV;
4965 LValue Copy = CGF.MakeAddrLValue(Addr: CGF.CreateMemTemp(T: Ty), T: Ty);
4966 CGF.EmitAggregateCopy(Dest: Copy, Src: LV, EltTy: Ty, MayOverlap: AggValueSlot::DoesNotOverlap,
4967 isVolatile: LV.isVolatile());
4968 IsUsed = true;
4969 return RValue::getAggregate(addr: Copy.getAddress());
4970}
4971
4972void CallArg::copyInto(CodeGenFunction &CGF, Address Addr) const {
4973 LValue Dst = CGF.MakeAddrLValue(Addr, T: Ty);
4974 if (!HasLV && RV.isScalar())
4975 CGF.EmitStoreOfScalar(value: RV.getScalarVal(), lvalue: Dst, /*isInit=*/true);
4976 else if (!HasLV && RV.isComplex())
4977 CGF.EmitStoreOfComplex(V: RV.getComplexVal(), dest: Dst, /*init=*/isInit: true);
4978 else {
4979 auto Addr = HasLV ? LV.getAddress() : RV.getAggregateAddress();
4980 LValue SrcLV = CGF.MakeAddrLValue(Addr, T: Ty);
4981 // We assume that call args are never copied into subobjects.
4982 CGF.EmitAggregateCopy(Dest: Dst, Src: SrcLV, EltTy: Ty, MayOverlap: AggValueSlot::DoesNotOverlap,
4983 isVolatile: HasLV ? LV.isVolatileQualified()
4984 : RV.isVolatileQualified());
4985 }
4986 IsUsed = true;
4987}
4988
4989void CodeGenFunction::EmitWritebacks(const CallArgList &args) {
4990 for (const auto &I : args.writebacks())
4991 emitWriteback(CGF&: *this, writeback: I);
4992}
4993
/// Emit a single call argument expression \p E of type \p type and append it
/// to \p args, handling ObjC writeback arguments, HLSL out-params, reference
/// binding, and callee-destroyed aggregates.
void CodeGenFunction::EmitCallArg(CallArgList &args, const Expr *E,
                                  QualType type) {
  // Default-argument expressions carry their own locations; suppress
  // debug-location updates while emitting them.
  std::optional<DisableDebugLocationUpdates> Dis;
  if (isa<CXXDefaultArgExpr>(Val: E))
    Dis.emplace(args&: *this);
  if (const ObjCIndirectCopyRestoreExpr *CRE =
          dyn_cast<ObjCIndirectCopyRestoreExpr>(Val: E)) {
    assert(getLangOpts().ObjCAutoRefCount);
    return emitWritebackArg(CGF&: *this, args, CRE);
  }

  // Add writeback for HLSLOutParamExpr.
  // Needs to be before the assert below because HLSLOutArgExpr is an LValue
  // and is not a reference.
  if (const HLSLOutArgExpr *OE = dyn_cast<HLSLOutArgExpr>(Val: E)) {
    EmitHLSLOutArgExpr(E: OE, Args&: args, Ty: type);
    return;
  }

  assert(type->isReferenceType() == E->isGLValue() &&
         "reference binding to unmaterialized r-value!");

  // Reference parameters bind directly to the argument l-value.
  if (E->isGLValue()) {
    assert(E->getObjectKind() == OK_Ordinary);
    return args.add(rvalue: EmitReferenceBindingToExpr(E), type);
  }

  bool HasAggregateEvalKind = hasAggregateEvaluationKind(T: type);

  // In the Microsoft C++ ABI, aggregate arguments are destructed by the callee.
  // However, we still have to push an EH-only cleanup in case we unwind before
  // we make it to the call.
  if (type->isRecordType() &&
      type->castAsRecordDecl()->isParamDestroyedInCallee()) {
    // If we're using inalloca, use the argument memory. Otherwise, use a
    // temporary.
    AggValueSlot Slot = args.isUsingInAlloca()
                            ? createPlaceholderSlot(CGF&: *this, Ty: type)
                            : CreateAggTemp(T: type, Name: "agg.tmp");

    bool DestroyedInCallee = true, NeedsCleanup = true;
    if (const auto *RD = type->getAsCXXRecordDecl())
      DestroyedInCallee = RD->hasNonTrivialDestructor();
    else
      NeedsCleanup = type.isDestructedType();

    if (DestroyedInCallee)
      Slot.setExternallyDestructed();

    EmitAggExpr(E, AS: Slot);
    RValue RV = Slot.asRValue();
    args.add(rvalue: RV, type);

    if (DestroyedInCallee && NeedsCleanup) {
      // Create a no-op GEP between the placeholder and the cleanup so we can
      // RAUW it successfully. It also serves as a marker of the first
      // instruction where the cleanup is active.
      pushFullExprCleanup<DestroyUnpassedArg>(kind: NormalAndEHCleanup,
                                              A: Slot.getAddress(), A: type);
      // This unreachable is a temporary marker which will be removed later.
      llvm::Instruction *IsActive =
          Builder.CreateFlagLoad(Addr: llvm::Constant::getNullValue(Ty: Int8PtrTy));
      args.addArgCleanupDeactivation(Cleanup: EHStack.stable_begin(), IsActiveIP: IsActive);
    }
    return;
  }

  // For a plain lvalue-to-rvalue load of an aggregate, pass the source
  // l-value uncopied and let the call machinery decide if a copy is needed.
  if (HasAggregateEvalKind && isa<ImplicitCastExpr>(Val: E) &&
      cast<CastExpr>(Val: E)->getCastKind() == CK_LValueToRValue &&
      !type->isArrayParameterType() && !type.isNonTrivialToPrimitiveCopy()) {
    LValue L = EmitLValue(E: cast<CastExpr>(Val: E)->getSubExpr());
    assert(L.isSimple());
    args.addUncopiedAggregate(LV: L, type);
    return;
  }

  // Otherwise, emit the expression into a temporary and pass that along.
  args.add(rvalue: EmitAnyExprToTemp(E), type);
}
5072
5073QualType CodeGenFunction::getVarArgType(const Expr *Arg) {
5074 // System headers on Windows define NULL to 0 instead of 0LL on Win64. MSVC
5075 // implicitly widens null pointer constants that are arguments to varargs
5076 // functions to pointer-sized ints.
5077 if (!getTarget().getTriple().isOSWindows())
5078 return Arg->getType();
5079
5080 if (Arg->getType()->isIntegerType() &&
5081 getContext().getTypeSize(T: Arg->getType()) <
5082 getContext().getTargetInfo().getPointerWidth(AddrSpace: LangAS::Default) &&
5083 Arg->isNullPointerConstant(Ctx&: getContext(),
5084 NPC: Expr::NPC_ValueDependentIsNotNull)) {
5085 return getContext().getIntPtrType();
5086 }
5087
5088 return Arg->getType();
5089}
5090
5091// In ObjC ARC mode with no ObjC ARC exception safety, tell the ARC
5092// optimizer it can aggressively ignore unwind edges.
5093void CodeGenFunction::AddObjCARCExceptionMetadata(llvm::Instruction *Inst) {
5094 if (CGM.getCodeGenOpts().OptimizationLevel != 0 &&
5095 !CGM.getCodeGenOpts().ObjCAutoRefCountExceptions)
5096 Inst->setMetadata(Kind: "clang.arc.no_objc_arc_exceptions",
5097 Node: CGM.getNoObjCARCExceptionsMetadata());
5098}
5099
5100/// Emits a call to the given no-arguments nounwind runtime function.
5101llvm::CallInst *
5102CodeGenFunction::EmitNounwindRuntimeCall(llvm::FunctionCallee callee,
5103 const llvm::Twine &name) {
5104 return EmitNounwindRuntimeCall(callee, args: ArrayRef<llvm::Value *>(), name);
5105}
5106
5107/// Emits a call to the given nounwind runtime function.
5108llvm::CallInst *
5109CodeGenFunction::EmitNounwindRuntimeCall(llvm::FunctionCallee callee,
5110 ArrayRef<Address> args,
5111 const llvm::Twine &name) {
5112 SmallVector<llvm::Value *, 3> values;
5113 for (auto arg : args)
5114 values.push_back(Elt: arg.emitRawPointer(CGF&: *this));
5115 return EmitNounwindRuntimeCall(callee, args: values, name);
5116}
5117
5118llvm::CallInst *
5119CodeGenFunction::EmitNounwindRuntimeCall(llvm::FunctionCallee callee,
5120 ArrayRef<llvm::Value *> args,
5121 const llvm::Twine &name) {
5122 llvm::CallInst *call = EmitRuntimeCall(callee, args, name);
5123 call->setDoesNotThrow();
5124 return call;
5125}
5126
5127/// Emits a simple call (never an invoke) to the given no-arguments
5128/// runtime function.
5129llvm::CallInst *CodeGenFunction::EmitRuntimeCall(llvm::FunctionCallee callee,
5130 const llvm::Twine &name) {
5131 return EmitRuntimeCall(callee, args: {}, name);
5132}
5133
5134// Calls which may throw must have operand bundles indicating which funclet
5135// they are nested within.
5136SmallVector<llvm::OperandBundleDef, 1>
5137CodeGenFunction::getBundlesForFunclet(llvm::Value *Callee) {
5138 // There is no need for a funclet operand bundle if we aren't inside a
5139 // funclet.
5140 if (!CurrentFuncletPad)
5141 return (SmallVector<llvm::OperandBundleDef, 1>());
5142
5143 // Skip intrinsics which cannot throw (as long as they don't lower into
5144 // regular function calls in the course of IR transformations).
5145 if (auto *CalleeFn = dyn_cast<llvm::Function>(Val: Callee->stripPointerCasts())) {
5146 if (CalleeFn->isIntrinsic() && CalleeFn->doesNotThrow()) {
5147 auto IID = CalleeFn->getIntrinsicID();
5148 if (!llvm::IntrinsicInst::mayLowerToFunctionCall(IID))
5149 return (SmallVector<llvm::OperandBundleDef, 1>());
5150 }
5151 }
5152
5153 SmallVector<llvm::OperandBundleDef, 1> BundleList;
5154 BundleList.emplace_back(Args: "funclet", Args&: CurrentFuncletPad);
5155 return BundleList;
5156}
5157
5158/// Emits a simple call (never an invoke) to the given runtime function.
5159llvm::CallInst *CodeGenFunction::EmitRuntimeCall(llvm::FunctionCallee callee,
5160 ArrayRef<llvm::Value *> args,
5161 const llvm::Twine &name) {
5162 llvm::CallInst *call = Builder.CreateCall(
5163 Callee: callee, Args: args, OpBundles: getBundlesForFunclet(Callee: callee.getCallee()), Name: name);
5164 call->setCallingConv(getRuntimeCC());
5165
5166 if (CGM.shouldEmitConvergenceTokens() && call->isConvergent())
5167 return cast<llvm::CallInst>(Val: addConvergenceControlToken(Input: call));
5168 return call;
5169}
5170
5171/// Emits a call or invoke to the given noreturn runtime function.
5172void CodeGenFunction::EmitNoreturnRuntimeCallOrInvoke(
5173 llvm::FunctionCallee callee, ArrayRef<llvm::Value *> args) {
5174 SmallVector<llvm::OperandBundleDef, 1> BundleList =
5175 getBundlesForFunclet(Callee: callee.getCallee());
5176
5177 if (getInvokeDest()) {
5178 llvm::InvokeInst *invoke = Builder.CreateInvoke(
5179 Callee: callee, NormalDest: getUnreachableBlock(), UnwindDest: getInvokeDest(), Args: args, OpBundles: BundleList);
5180 invoke->setDoesNotReturn();
5181 invoke->setCallingConv(getRuntimeCC());
5182 } else {
5183 llvm::CallInst *call = Builder.CreateCall(Callee: callee, Args: args, OpBundles: BundleList);
5184 call->setDoesNotReturn();
5185 call->setCallingConv(getRuntimeCC());
5186 Builder.CreateUnreachable();
5187 }
5188}
5189
5190/// Emits a call or invoke instruction to the given nullary runtime function.
5191llvm::CallBase *
5192CodeGenFunction::EmitRuntimeCallOrInvoke(llvm::FunctionCallee callee,
5193 const Twine &name) {
5194 return EmitRuntimeCallOrInvoke(callee, args: {}, name);
5195}
5196
5197/// Emits a call or invoke instruction to the given runtime function.
5198llvm::CallBase *
5199CodeGenFunction::EmitRuntimeCallOrInvoke(llvm::FunctionCallee callee,
5200 ArrayRef<llvm::Value *> args,
5201 const Twine &name) {
5202 llvm::CallBase *call = EmitCallOrInvoke(Callee: callee, Args: args, Name: name);
5203 call->setCallingConv(getRuntimeCC());
5204 return call;
5205}
5206
5207/// Emits a call or invoke instruction to the given function, depending
5208/// on the current state of the EH stack.
5209llvm::CallBase *CodeGenFunction::EmitCallOrInvoke(llvm::FunctionCallee Callee,
5210 ArrayRef<llvm::Value *> Args,
5211 const Twine &Name) {
5212 llvm::BasicBlock *InvokeDest = getInvokeDest();
5213 SmallVector<llvm::OperandBundleDef, 1> BundleList =
5214 getBundlesForFunclet(Callee: Callee.getCallee());
5215
5216 llvm::CallBase *Inst;
5217 if (!InvokeDest)
5218 Inst = Builder.CreateCall(Callee, Args, OpBundles: BundleList, Name);
5219 else {
5220 llvm::BasicBlock *ContBB = createBasicBlock(name: "invoke.cont");
5221 Inst = Builder.CreateInvoke(Callee, NormalDest: ContBB, UnwindDest: InvokeDest, Args, OpBundles: BundleList,
5222 Name);
5223 EmitBlock(BB: ContBB);
5224 }
5225
5226 // In ObjC ARC mode with no ObjC ARC exception safety, tell the ARC
5227 // optimizer it can aggressively ignore unwind edges.
5228 if (CGM.getLangOpts().ObjCAutoRefCount)
5229 AddObjCARCExceptionMetadata(Inst);
5230
5231 return Inst;
5232}
5233
5234void CodeGenFunction::deferPlaceholderReplacement(llvm::Instruction *Old,
5235 llvm::Value *New) {
5236 DeferredReplacements.push_back(
5237 Elt: std::make_pair(x: llvm::WeakTrackingVH(Old), y&: New));
5238}
5239
namespace {

/// Specify given \p NewAlign as the alignment of return value attribute. If
/// such attribute already exists, re-set it to the maximal one of two options.
[[nodiscard]] llvm::AttributeList
maybeRaiseRetAlignmentAttribute(llvm::LLVMContext &Ctx,
                                const llvm::AttributeList &Attrs,
                                llvm::Align NewAlign) {
  llvm::Align CurAlign = Attrs.getRetAlignment().valueOrOne();
  // Keep the existing attribute when it is already at least as strong.
  if (CurAlign >= NewAlign)
    return Attrs;
  llvm::Attribute AlignAttr = llvm::Attribute::getWithAlignment(Context&: Ctx, Alignment: NewAlign);
  return Attrs.removeRetAttribute(C&: Ctx, Kind: llvm::Attribute::AttrKind::Alignment)
      .addRetAttribute(C&: Ctx, Attr: AlignAttr);
}

/// Base helper for emitting the return-value alignment implied by an
/// alignment attribute (`AssumeAlignedAttr` or `AllocAlignAttr`) on the
/// callee, either as a call-site return attribute or as an `@llvm.assume`.
/// The subclass constructor is responsible for populating Alignment/OffsetCI.
template <typename AlignedAttrTy> class AbstractAssumeAlignedAttrEmitter {
protected:
  CodeGenFunction &CGF;

  /// We do nothing if this is, or becomes, nullptr.
  const AlignedAttrTy *AA = nullptr;

  llvm::Value *Alignment = nullptr;      // May or may not be a constant.
  llvm::ConstantInt *OffsetCI = nullptr; // Constant, hopefully zero.

  AbstractAssumeAlignedAttrEmitter(CodeGenFunction &CGF_, const Decl *FuncDecl)
      : CGF(CGF_) {
    if (!FuncDecl)
      return;
    AA = FuncDecl->getAttr<AlignedAttrTy>();
  }

public:
  /// If we can, materialize the alignment as an attribute on return value.
  [[nodiscard]] llvm::AttributeList
  TryEmitAsCallSiteAttribute(const llvm::AttributeList &Attrs) {
    // The attribute form only works for a constant alignment with no offset,
    // and not under the alignment sanitizer (which wants an explicit check).
    if (!AA || OffsetCI || CGF.SanOpts.has(K: SanitizerKind::Alignment))
      return Attrs;
    const auto *AlignmentCI = dyn_cast<llvm::ConstantInt>(Val: Alignment);
    if (!AlignmentCI)
      return Attrs;
    // We may legitimately have non-power-of-2 alignment here.
    // If so, this is UB land, emit it via `@llvm.assume` instead.
    if (!AlignmentCI->getValue().isPowerOf2())
      return Attrs;
    llvm::AttributeList NewAttrs = maybeRaiseRetAlignmentAttribute(
        Ctx&: CGF.getLLVMContext(), Attrs,
        NewAlign: llvm::Align(
            AlignmentCI->getLimitedValue(Limit: llvm::Value::MaximumAlignment)));
    AA = nullptr; // We're done. Disallow doing anything else.
    return NewAttrs;
  }

  /// Emit alignment assumption.
  /// This is a general fallback that we take if either there is an offset,
  /// or the alignment is variable or we are sanitizing for alignment.
  void EmitAsAnAssumption(SourceLocation Loc, QualType RetTy, RValue &Ret) {
    if (!AA)
      return;
    CGF.emitAlignmentAssumption(Ret.getScalarVal(), RetTy, Loc,
                                AA->getLocation(), Alignment, OffsetCI);
    AA = nullptr; // We're done. Disallow doing anything else.
  }
};

/// Helper data structure to emit `AssumeAlignedAttr`.
class AssumeAlignedAttrEmitter final
    : public AbstractAssumeAlignedAttrEmitter<AssumeAlignedAttr> {
public:
  AssumeAlignedAttrEmitter(CodeGenFunction &CGF_, const Decl *FuncDecl)
      : AbstractAssumeAlignedAttrEmitter(CGF_, FuncDecl) {
    if (!AA)
      return;
    // It is guaranteed that the alignment/offset are constants.
    Alignment = cast<llvm::ConstantInt>(Val: CGF.EmitScalarExpr(E: AA->getAlignment()));
    if (Expr *Offset = AA->getOffset()) {
      OffsetCI = cast<llvm::ConstantInt>(Val: CGF.EmitScalarExpr(E: Offset));
      if (OffsetCI->isNullValue()) // Canonicalize zero offset to no offset.
        OffsetCI = nullptr;
    }
  }
};

/// Helper data structure to emit `AllocAlignAttr`.
class AllocAlignAttrEmitter final
    : public AbstractAssumeAlignedAttrEmitter<AllocAlignAttr> {
public:
  AllocAlignAttrEmitter(CodeGenFunction &CGF_, const Decl *FuncDecl,
                        const CallArgList &CallArgs)
      : AbstractAssumeAlignedAttrEmitter(CGF_, FuncDecl) {
    if (!AA)
      return;
    // Alignment may or may not be a constant, and that is okay.
    // It comes from the call argument named by the attribute's param index.
    Alignment = CallArgs[AA->getParamIndex().getLLVMIndex()]
                    .getRValue(CGF)
                    .getScalarVal();
  }
};

} // namespace
5341
5342static unsigned getMaxVectorWidth(const llvm::Type *Ty) {
5343 if (auto *VT = dyn_cast<llvm::VectorType>(Val: Ty))
5344 return VT->getPrimitiveSizeInBits().getKnownMinValue();
5345 if (auto *AT = dyn_cast<llvm::ArrayType>(Val: Ty))
5346 return getMaxVectorWidth(Ty: AT->getElementType());
5347
5348 unsigned MaxVectorWidth = 0;
5349 if (auto *ST = dyn_cast<llvm::StructType>(Val: Ty))
5350 for (auto *I : ST->elements())
5351 MaxVectorWidth = std::max(a: MaxVectorWidth, b: getMaxVectorWidth(Ty: I));
5352 return MaxVectorWidth;
5353}
5354
5355RValue CodeGenFunction::EmitCall(const CGFunctionInfo &CallInfo,
5356 const CGCallee &Callee,
5357 ReturnValueSlot ReturnValue,
5358 const CallArgList &CallArgs,
5359 llvm::CallBase **callOrInvoke, bool IsMustTail,
5360 SourceLocation Loc,
5361 bool IsVirtualFunctionPointerThunk) {
5362 // FIXME: We no longer need the types from CallArgs; lift up and simplify.
5363
5364 assert(Callee.isOrdinary() || Callee.isVirtual());
5365
5366 // Handle struct-return functions by passing a pointer to the
5367 // location that we would like to return into.
5368 QualType RetTy = CallInfo.getReturnType();
5369 const ABIArgInfo &RetAI = CallInfo.getReturnInfo();
5370
5371 llvm::FunctionType *IRFuncTy = getTypes().GetFunctionType(FI: CallInfo);
5372
5373 const Decl *TargetDecl = Callee.getAbstractInfo().getCalleeDecl().getDecl();
5374 if (const FunctionDecl *FD = dyn_cast_or_null<FunctionDecl>(Val: TargetDecl)) {
5375 // We can only guarantee that a function is called from the correct
5376 // context/function based on the appropriate target attributes,
5377 // so only check in the case where we have both always_inline and target
5378 // since otherwise we could be making a conditional call after a check for
5379 // the proper cpu features (and it won't cause code generation issues due to
5380 // function based code generation).
5381 if ((TargetDecl->hasAttr<AlwaysInlineAttr>() &&
5382 (TargetDecl->hasAttr<TargetAttr>() ||
5383 (CurFuncDecl && CurFuncDecl->hasAttr<TargetAttr>()))) ||
5384 (CurFuncDecl && CurFuncDecl->hasAttr<FlattenAttr>() &&
5385 (CurFuncDecl->hasAttr<TargetAttr>() ||
5386 TargetDecl->hasAttr<TargetAttr>())))
5387 checkTargetFeatures(Loc, TargetDecl: FD);
5388 }
5389
5390 // Some architectures (such as x86-64) have the ABI changed based on
5391 // attribute-target/features. Give them a chance to diagnose.
5392 const FunctionDecl *CallerDecl = dyn_cast_or_null<FunctionDecl>(Val: CurCodeDecl);
5393 const FunctionDecl *CalleeDecl = dyn_cast_or_null<FunctionDecl>(Val: TargetDecl);
5394 CGM.getTargetCodeGenInfo().checkFunctionCallABI(CGM, CallLoc: Loc, Caller: CallerDecl,
5395 Callee: CalleeDecl, Args: CallArgs, ReturnType: RetTy);
5396
5397 // 1. Set up the arguments.
5398
5399 // If we're using inalloca, insert the allocation after the stack save.
5400 // FIXME: Do this earlier rather than hacking it in here!
5401 RawAddress ArgMemory = RawAddress::invalid();
5402 if (llvm::StructType *ArgStruct = CallInfo.getArgStruct()) {
5403 const llvm::DataLayout &DL = CGM.getDataLayout();
5404 llvm::Instruction *IP = CallArgs.getStackBase();
5405 llvm::AllocaInst *AI;
5406 if (IP) {
5407 IP = IP->getNextNode();
5408 AI = new llvm::AllocaInst(ArgStruct, DL.getAllocaAddrSpace(), "argmem",
5409 IP->getIterator());
5410 } else {
5411 AI = CreateTempAlloca(Ty: ArgStruct, Name: "argmem");
5412 }
5413 auto Align = CallInfo.getArgStructAlignment();
5414 AI->setAlignment(Align.getAsAlign());
5415 AI->setUsedWithInAlloca(true);
5416 assert(AI->isUsedWithInAlloca() && !AI->isStaticAlloca());
5417 ArgMemory = RawAddress(AI, ArgStruct, Align);
5418 }
5419
5420 ClangToLLVMArgMapping IRFunctionArgs(CGM.getContext(), CallInfo);
5421 SmallVector<llvm::Value *, 16> IRCallArgs(IRFunctionArgs.totalIRArgs());
5422
5423 // If the call returns a temporary with struct return, create a temporary
5424 // alloca to hold the result, unless one is given to us.
5425 Address SRetPtr = Address::invalid();
5426 bool NeedSRetLifetimeEnd = false;
5427 if (RetAI.isIndirect() || RetAI.isInAlloca() || RetAI.isCoerceAndExpand()) {
5428 // For virtual function pointer thunks and musttail calls, we must always
5429 // forward an incoming SRet pointer to the callee, because a local alloca
5430 // would be de-allocated before the call. These cases both guarantee that
5431 // there will be an incoming SRet argument of the correct type.
5432 if ((IsVirtualFunctionPointerThunk || IsMustTail) && RetAI.isIndirect()) {
5433 SRetPtr = makeNaturalAddressForPointer(Ptr: CurFn->arg_begin() +
5434 IRFunctionArgs.getSRetArgNo(),
5435 T: RetTy, Alignment: CharUnits::fromQuantity(Quantity: 1));
5436 } else if (!ReturnValue.isNull()) {
5437 SRetPtr = ReturnValue.getAddress();
5438 } else {
5439 SRetPtr = CreateMemTempWithoutCast(T: RetTy, Name: "tmp");
5440 if (HaveInsertPoint() && ReturnValue.isUnused())
5441 NeedSRetLifetimeEnd = EmitLifetimeStart(Addr: SRetPtr.getBasePointer());
5442 }
5443 if (IRFunctionArgs.hasSRetArg()) {
5444 // A mismatch between the allocated return value's AS and the target's
5445 // chosen IndirectAS can happen e.g. when passing the this pointer through
5446 // a chain involving stores to / loads from the DefaultAS; we address this
5447 // here, symmetrically with the handling we have for normal pointer args.
5448 if (SRetPtr.getAddressSpace() != RetAI.getIndirectAddrSpace()) {
5449 llvm::Value *V = SRetPtr.getBasePointer();
5450 llvm::Type *Ty = llvm::PointerType::get(C&: getLLVMContext(),
5451 AddressSpace: RetAI.getIndirectAddrSpace());
5452
5453 SRetPtr = SRetPtr.withPointer(NewPointer: performAddrSpaceCast(Src: V, DestTy: Ty),
5454 IsKnownNonNull: SRetPtr.isKnownNonNull());
5455 }
5456 IRCallArgs[IRFunctionArgs.getSRetArgNo()] =
5457 getAsNaturalPointerTo(Addr: SRetPtr, PointeeType: RetTy);
5458 } else if (RetAI.isInAlloca()) {
5459 Address Addr =
5460 Builder.CreateStructGEP(Addr: ArgMemory, Index: RetAI.getInAllocaFieldIndex());
5461 Builder.CreateStore(Val: getAsNaturalPointerTo(Addr: SRetPtr, PointeeType: RetTy), Addr);
5462 }
5463 }
5464
5465 RawAddress swiftErrorTemp = RawAddress::invalid();
5466 Address swiftErrorArg = Address::invalid();
5467
5468 // When passing arguments using temporary allocas, we need to add the
5469 // appropriate lifetime markers. This vector keeps track of all the lifetime
5470 // markers that need to be ended right after the call.
5471 SmallVector<CallLifetimeEnd, 2> CallLifetimeEndAfterCall;
5472
5473 // Translate all of the arguments as necessary to match the IR lowering.
5474 assert(CallInfo.arg_size() == CallArgs.size() &&
5475 "Mismatch between function signature & arguments.");
5476 unsigned ArgNo = 0;
5477 CGFunctionInfo::const_arg_iterator info_it = CallInfo.arg_begin();
5478 for (CallArgList::const_iterator I = CallArgs.begin(), E = CallArgs.end();
5479 I != E; ++I, ++info_it, ++ArgNo) {
5480 const ABIArgInfo &ArgInfo = info_it->info;
5481
5482 // Insert a padding argument to ensure proper alignment.
5483 if (IRFunctionArgs.hasPaddingArg(ArgNo))
5484 IRCallArgs[IRFunctionArgs.getPaddingArgNo(ArgNo)] =
5485 llvm::UndefValue::get(T: ArgInfo.getPaddingType());
5486
5487 unsigned FirstIRArg, NumIRArgs;
5488 std::tie(args&: FirstIRArg, args&: NumIRArgs) = IRFunctionArgs.getIRArgs(ArgNo);
5489
5490 bool ArgHasMaybeUndefAttr =
5491 IsArgumentMaybeUndef(TargetDecl, NumRequiredArgs: CallInfo.getNumRequiredArgs(), ArgNo);
5492
5493 switch (ArgInfo.getKind()) {
5494 case ABIArgInfo::InAlloca: {
5495 assert(NumIRArgs == 0);
5496 assert(getTarget().getTriple().getArch() == llvm::Triple::x86);
5497 if (I->isAggregate()) {
5498 RawAddress Addr = I->hasLValue()
5499 ? I->getKnownLValue().getAddress()
5500 : I->getKnownRValue().getAggregateAddress();
5501 llvm::Instruction *Placeholder =
5502 cast<llvm::Instruction>(Val: Addr.getPointer());
5503
5504 if (!ArgInfo.getInAllocaIndirect()) {
5505 // Replace the placeholder with the appropriate argument slot GEP.
5506 CGBuilderTy::InsertPoint IP = Builder.saveIP();
5507 Builder.SetInsertPoint(Placeholder);
5508 Addr = Builder.CreateStructGEP(Addr: ArgMemory,
5509 Index: ArgInfo.getInAllocaFieldIndex());
5510 Builder.restoreIP(IP);
5511 } else {
5512 // For indirect things such as overaligned structs, replace the
5513 // placeholder with a regular aggregate temporary alloca. Store the
5514 // address of this alloca into the struct.
5515 Addr = CreateMemTemp(T: info_it->type, Name: "inalloca.indirect.tmp");
5516 Address ArgSlot = Builder.CreateStructGEP(
5517 Addr: ArgMemory, Index: ArgInfo.getInAllocaFieldIndex());
5518 Builder.CreateStore(Val: Addr.getPointer(), Addr: ArgSlot);
5519 }
5520 deferPlaceholderReplacement(Old: Placeholder, New: Addr.getPointer());
5521 } else if (ArgInfo.getInAllocaIndirect()) {
5522 // Make a temporary alloca and store the address of it into the argument
5523 // struct.
5524 RawAddress Addr = CreateMemTempWithoutCast(
5525 T: I->Ty, Align: getContext().getTypeAlignInChars(T: I->Ty),
5526 Name: "indirect-arg-temp");
5527 I->copyInto(CGF&: *this, Addr);
5528 Address ArgSlot =
5529 Builder.CreateStructGEP(Addr: ArgMemory, Index: ArgInfo.getInAllocaFieldIndex());
5530 Builder.CreateStore(Val: Addr.getPointer(), Addr: ArgSlot);
5531 } else {
5532 // Store the RValue into the argument struct.
5533 Address Addr =
5534 Builder.CreateStructGEP(Addr: ArgMemory, Index: ArgInfo.getInAllocaFieldIndex());
5535 Addr = Addr.withElementType(ElemTy: ConvertTypeForMem(T: I->Ty));
5536 I->copyInto(CGF&: *this, Addr);
5537 }
5538 break;
5539 }
5540
5541 case ABIArgInfo::Indirect:
5542 case ABIArgInfo::IndirectAliased: {
5543 assert(NumIRArgs == 1);
5544 if (I->isAggregate()) {
5545 // We want to avoid creating an unnecessary temporary+copy here;
5546 // however, we need one in three cases:
5547 // 1. If the argument is not byval, and we are required to copy the
5548 // source. (This case doesn't occur on any common architecture.)
5549 // 2. If the argument is byval, RV is not sufficiently aligned, and
5550 // we cannot force it to be sufficiently aligned.
5551 // 3. If the argument is byval, but RV is not located in default
5552 // or alloca address space.
5553 Address Addr = I->hasLValue()
5554 ? I->getKnownLValue().getAddress()
5555 : I->getKnownRValue().getAggregateAddress();
5556 CharUnits Align = ArgInfo.getIndirectAlign();
5557 const llvm::DataLayout *TD = &CGM.getDataLayout();
5558
5559 assert((FirstIRArg >= IRFuncTy->getNumParams() ||
5560 IRFuncTy->getParamType(FirstIRArg)->getPointerAddressSpace() ==
5561 TD->getAllocaAddrSpace()) &&
5562 "indirect argument must be in alloca address space");
5563
5564 bool NeedCopy = false;
5565 if (Addr.getAlignment() < Align &&
5566 llvm::getOrEnforceKnownAlignment(V: Addr.emitRawPointer(CGF&: *this),
5567 PrefAlign: Align.getAsAlign(),
5568 DL: *TD) < Align.getAsAlign()) {
5569 NeedCopy = true;
5570 } else if (I->hasLValue()) {
5571 auto LV = I->getKnownLValue();
5572
5573 bool isByValOrRef =
5574 ArgInfo.isIndirectAliased() || ArgInfo.getIndirectByVal();
5575
5576 if (!isByValOrRef ||
5577 (LV.getAlignment() < getContext().getTypeAlignInChars(T: I->Ty))) {
5578 NeedCopy = true;
5579 }
5580
5581 if (isByValOrRef && Addr.getType()->getAddressSpace() !=
5582 ArgInfo.getIndirectAddrSpace()) {
5583 NeedCopy = true;
5584 }
5585 }
5586
5587 if (!NeedCopy) {
5588 // Skip the extra memcpy call.
5589 llvm::Value *V = getAsNaturalPointerTo(Addr, PointeeType: I->Ty);
5590 auto *T = llvm::PointerType::get(C&: CGM.getLLVMContext(),
5591 AddressSpace: ArgInfo.getIndirectAddrSpace());
5592
5593 // FIXME: This should not depend on the language address spaces, and
5594 // only the contextual values. If the address space mismatches, see if
5595 // we can look through a cast to a compatible address space value,
5596 // otherwise emit a copy.
5597 llvm::Value *Val = performAddrSpaceCast(Src: V, DestTy: T);
5598 if (ArgHasMaybeUndefAttr)
5599 Val = Builder.CreateFreeze(V: Val);
5600 IRCallArgs[FirstIRArg] = Val;
5601 break;
5602 }
5603 } else if (I->getType()->isArrayParameterType()) {
5604 // Don't produce a temporary for ArrayParameterType arguments.
5605 // ArrayParameterType arguments are only created from
5606 // HLSL_ArrayRValue casts and HLSLOutArgExpr expressions, both
5607 // of which create temporaries already. This allows us to just use the
5608 // scalar for the decayed array pointer as the argument directly.
5609 IRCallArgs[FirstIRArg] = I->getKnownRValue().getScalarVal();
5610 break;
5611 }
5612
5613 // For non-aggregate args and aggregate args meeting conditions above
5614 // we need to create an aligned temporary, and copy to it.
5615 RawAddress AI = CreateMemTempWithoutCast(
5616 T: I->Ty, Align: ArgInfo.getIndirectAlign(), Name: "byval-temp");
5617 llvm::Value *Val = getAsNaturalPointerTo(Addr: AI, PointeeType: I->Ty);
5618 if (ArgHasMaybeUndefAttr)
5619 Val = Builder.CreateFreeze(V: Val);
5620 IRCallArgs[FirstIRArg] = Val;
5621
5622 // Emit lifetime markers for the temporary alloca and add cleanup code to
5623 // emit the end lifetime marker after the call.
5624 if (EmitLifetimeStart(Addr: AI.getPointer()))
5625 CallLifetimeEndAfterCall.emplace_back(Args&: AI);
5626
5627 // Generate the copy.
5628 I->copyInto(CGF&: *this, Addr: AI);
5629 break;
5630 }
5631
5632 case ABIArgInfo::Ignore:
5633 assert(NumIRArgs == 0);
5634 break;
5635
5636 case ABIArgInfo::Extend:
5637 case ABIArgInfo::Direct: {
5638 if (!isa<llvm::StructType>(Val: ArgInfo.getCoerceToType()) &&
5639 ArgInfo.getCoerceToType() == ConvertType(T: info_it->type) &&
5640 ArgInfo.getDirectOffset() == 0) {
5641 assert(NumIRArgs == 1);
5642 llvm::Value *V;
5643 if (!I->isAggregate())
5644 V = I->getKnownRValue().getScalarVal();
5645 else
5646 V = Builder.CreateLoad(
5647 Addr: I->hasLValue() ? I->getKnownLValue().getAddress()
5648 : I->getKnownRValue().getAggregateAddress());
5649
5650 // Implement swifterror by copying into a new swifterror argument.
5651 // We'll write back in the normal path out of the call.
5652 if (CallInfo.getExtParameterInfo(argIndex: ArgNo).getABI() ==
5653 ParameterABI::SwiftErrorResult) {
5654 assert(!swiftErrorTemp.isValid() && "multiple swifterror args");
5655
5656 QualType pointeeTy = I->Ty->getPointeeType();
5657 swiftErrorArg = makeNaturalAddressForPointer(
5658 Ptr: V, T: pointeeTy, Alignment: getContext().getTypeAlignInChars(T: pointeeTy));
5659
5660 swiftErrorTemp =
5661 CreateMemTemp(T: pointeeTy, Align: getPointerAlign(), Name: "swifterror.temp");
5662 V = swiftErrorTemp.getPointer();
5663 cast<llvm::AllocaInst>(Val: V)->setSwiftError(true);
5664
5665 llvm::Value *errorValue = Builder.CreateLoad(Addr: swiftErrorArg);
5666 Builder.CreateStore(Val: errorValue, Addr: swiftErrorTemp);
5667 }
5668
5669 // We might have to widen integers, but we should never truncate.
5670 if (ArgInfo.getCoerceToType() != V->getType() &&
5671 V->getType()->isIntegerTy())
5672 V = Builder.CreateZExt(V, DestTy: ArgInfo.getCoerceToType());
5673
5674 // The only plausible mismatch here would be for pointer address spaces.
5675 // We assume that the target has a reasonable mapping for the DefaultAS
5676 // (it can be casted to from incoming specific ASes), and insert an AS
5677 // cast to address the mismatch.
5678 if (FirstIRArg < IRFuncTy->getNumParams() &&
5679 V->getType() != IRFuncTy->getParamType(i: FirstIRArg)) {
5680 assert(V->getType()->isPointerTy() && "Only pointers can mismatch!");
5681 V = performAddrSpaceCast(Src: V, DestTy: IRFuncTy->getParamType(i: FirstIRArg));
5682 }
5683
5684 if (ArgHasMaybeUndefAttr)
5685 V = Builder.CreateFreeze(V);
5686 IRCallArgs[FirstIRArg] = V;
5687 break;
5688 }
5689
5690 llvm::StructType *STy =
5691 dyn_cast<llvm::StructType>(Val: ArgInfo.getCoerceToType());
5692
5693 // FIXME: Avoid the conversion through memory if possible.
5694 Address Src = Address::invalid();
5695 if (!I->isAggregate()) {
5696 Src = CreateMemTemp(T: I->Ty, Name: "coerce");
5697 I->copyInto(CGF&: *this, Addr: Src);
5698 } else {
5699 Src = I->hasLValue() ? I->getKnownLValue().getAddress()
5700 : I->getKnownRValue().getAggregateAddress();
5701 }
5702
5703 // If the value is offset in memory, apply the offset now.
5704 Src = emitAddressAtOffset(CGF&: *this, addr: Src, info: ArgInfo);
5705
5706 // Fast-isel and the optimizer generally like scalar values better than
5707 // FCAs, so we flatten them if this is safe to do for this argument.
5708 if (STy && ArgInfo.isDirect() && ArgInfo.getCanBeFlattened()) {
5709 llvm::Type *SrcTy = Src.getElementType();
5710 llvm::TypeSize SrcTypeSize =
5711 CGM.getDataLayout().getTypeAllocSize(Ty: SrcTy);
5712 llvm::TypeSize DstTypeSize = CGM.getDataLayout().getTypeAllocSize(Ty: STy);
5713 if (SrcTypeSize.isScalable()) {
5714 assert(STy->containsHomogeneousScalableVectorTypes() &&
5715 "ABI only supports structure with homogeneous scalable vector "
5716 "type");
5717 assert(SrcTypeSize == DstTypeSize &&
5718 "Only allow non-fractional movement of structure with "
5719 "homogeneous scalable vector type");
5720 assert(NumIRArgs == STy->getNumElements());
5721
5722 llvm::Value *StoredStructValue =
5723 Builder.CreateLoad(Addr: Src, Name: Src.getName() + ".tuple");
5724 for (unsigned i = 0, e = STy->getNumElements(); i != e; ++i) {
5725 llvm::Value *Extract = Builder.CreateExtractValue(
5726 Agg: StoredStructValue, Idxs: i, Name: Src.getName() + ".extract" + Twine(i));
5727 IRCallArgs[FirstIRArg + i] = Extract;
5728 }
5729 } else {
5730 uint64_t SrcSize = SrcTypeSize.getFixedValue();
5731 uint64_t DstSize = DstTypeSize.getFixedValue();
5732 bool HasPFPFields = getContext().hasPFPFields(Ty: I->Ty);
5733
5734 // If the source type is smaller than the destination type of the
5735 // coerce-to logic, copy the source value into a temp alloca the size
5736 // of the destination type to allow loading all of it. The bits past
5737 // the source value are left undef.
5738 if (HasPFPFields || SrcSize < DstSize) {
5739 Address TempAlloca = CreateTempAlloca(Ty: STy, align: Src.getAlignment(),
5740 Name: Src.getName() + ".coerce");
5741 if (HasPFPFields) {
5742 // Structures with PFP fields require a coerced load to remove any
5743 // pointer signatures.
5744 Builder.CreateStore(
5745 Val: CreatePFPCoercedLoad(Src, SrcFETy: I->Ty, Ty: ArgInfo.getCoerceToType(),
5746 CGF&: *this),
5747 Addr: TempAlloca);
5748 } else
5749 Builder.CreateMemCpy(Dest: TempAlloca, Src, Size: SrcSize);
5750 Src = TempAlloca;
5751 } else {
5752 Src = Src.withElementType(ElemTy: STy);
5753 }
5754
5755 assert(NumIRArgs == STy->getNumElements());
5756 for (unsigned i = 0, e = STy->getNumElements(); i != e; ++i) {
5757 Address EltPtr = Builder.CreateStructGEP(Addr: Src, Index: i);
5758 llvm::Value *LI = Builder.CreateLoad(Addr: EltPtr);
5759 if (ArgHasMaybeUndefAttr)
5760 LI = Builder.CreateFreeze(V: LI);
5761 IRCallArgs[FirstIRArg + i] = LI;
5762 }
5763 }
5764 } else {
5765 // In the simple case, just pass the coerced loaded value.
5766 assert(NumIRArgs == 1);
5767 llvm::Value *Load =
5768 CreateCoercedLoad(Src, SrcFETy: I->Ty, Ty: ArgInfo.getCoerceToType(), CGF&: *this);
5769
5770 if (CallInfo.isCmseNSCall()) {
5771 // For certain parameter types, clear padding bits, as they may reveal
5772 // sensitive information.
5773 // Small struct/union types are passed as integer arrays.
5774 auto *ATy = dyn_cast<llvm::ArrayType>(Val: Load->getType());
5775 if (ATy != nullptr && isa<RecordType>(Val: I->Ty.getCanonicalType()))
5776 Load = EmitCMSEClearRecord(Src: Load, ATy, QTy: I->Ty);
5777 }
5778
5779 if (ArgHasMaybeUndefAttr)
5780 Load = Builder.CreateFreeze(V: Load);
5781 IRCallArgs[FirstIRArg] = Load;
5782 }
5783
5784 break;
5785 }
5786
5787 case ABIArgInfo::CoerceAndExpand: {
5788 auto coercionType = ArgInfo.getCoerceAndExpandType();
5789 auto layout = CGM.getDataLayout().getStructLayout(Ty: coercionType);
5790 auto unpaddedCoercionType = ArgInfo.getUnpaddedCoerceAndExpandType();
5791 auto *unpaddedStruct = dyn_cast<llvm::StructType>(Val: unpaddedCoercionType);
5792
5793 Address addr = Address::invalid();
5794 RawAddress AllocaAddr = RawAddress::invalid();
5795 bool NeedLifetimeEnd = false;
5796 if (I->isAggregate()) {
5797 addr = I->hasLValue() ? I->getKnownLValue().getAddress()
5798 : I->getKnownRValue().getAggregateAddress();
5799
5800 } else {
5801 RValue RV = I->getKnownRValue();
5802 assert(RV.isScalar()); // complex should always just be direct
5803
5804 llvm::Type *scalarType = RV.getScalarVal()->getType();
5805 auto scalarAlign = CGM.getDataLayout().getPrefTypeAlign(Ty: scalarType);
5806
5807 // Materialize to a temporary.
5808 addr = CreateTempAlloca(Ty: RV.getScalarVal()->getType(),
5809 align: CharUnits::fromQuantity(Quantity: std::max(
5810 a: layout->getAlignment(), b: scalarAlign)),
5811 Name: "tmp",
5812 /*ArraySize=*/nullptr, Alloca: &AllocaAddr);
5813 NeedLifetimeEnd = EmitLifetimeStart(Addr: AllocaAddr.getPointer());
5814
5815 Builder.CreateStore(Val: RV.getScalarVal(), Addr: addr);
5816 }
5817
5818 addr = addr.withElementType(ElemTy: coercionType);
5819
5820 unsigned IRArgPos = FirstIRArg;
5821 unsigned unpaddedIndex = 0;
5822 for (unsigned i = 0, e = coercionType->getNumElements(); i != e; ++i) {
5823 llvm::Type *eltType = coercionType->getElementType(N: i);
5824 if (ABIArgInfo::isPaddingForCoerceAndExpand(eltType))
5825 continue;
5826 Address eltAddr = Builder.CreateStructGEP(Addr: addr, Index: i);
5827 llvm::Value *elt = CreateCoercedLoad(
5828 Src: eltAddr, SrcFETy: I->Ty,
5829 Ty: unpaddedStruct ? unpaddedStruct->getElementType(N: unpaddedIndex++)
5830 : unpaddedCoercionType,
5831 CGF&: *this);
5832 if (ArgHasMaybeUndefAttr)
5833 elt = Builder.CreateFreeze(V: elt);
5834 IRCallArgs[IRArgPos++] = elt;
5835 }
5836 assert(IRArgPos == FirstIRArg + NumIRArgs);
5837
5838 if (NeedLifetimeEnd)
5839 EmitLifetimeEnd(Addr: AllocaAddr.getPointer());
5840 break;
5841 }
5842
5843 case ABIArgInfo::Expand: {
5844 unsigned IRArgPos = FirstIRArg;
5845 ExpandTypeToArgs(Ty: I->Ty, Arg: *I, IRFuncTy, IRCallArgs, IRCallArgPos&: IRArgPos);
5846 assert(IRArgPos == FirstIRArg + NumIRArgs);
5847 break;
5848 }
5849
5850 case ABIArgInfo::TargetSpecific: {
5851 Address Src = Address::invalid();
5852 if (!I->isAggregate()) {
5853 Src = CreateMemTemp(T: I->Ty, Name: "target_coerce");
5854 I->copyInto(CGF&: *this, Addr: Src);
5855 } else {
5856 Src = I->hasLValue() ? I->getKnownLValue().getAddress()
5857 : I->getKnownRValue().getAggregateAddress();
5858 }
5859
5860 // If the value is offset in memory, apply the offset now.
5861 Src = emitAddressAtOffset(CGF&: *this, addr: Src, info: ArgInfo);
5862 llvm::Value *Load =
5863 CGM.getABIInfo().createCoercedLoad(SrcAddr: Src, AI: ArgInfo, CGF&: *this);
5864 IRCallArgs[FirstIRArg] = Load;
5865 break;
5866 }
5867 }
5868 }
5869
5870 const CGCallee &ConcreteCallee = Callee.prepareConcreteCallee(CGF&: *this);
5871 llvm::Value *CalleePtr = ConcreteCallee.getFunctionPointer();
5872
5873 // If we're using inalloca, set up that argument.
5874 if (ArgMemory.isValid()) {
5875 llvm::Value *Arg = ArgMemory.getPointer();
5876 assert(IRFunctionArgs.hasInallocaArg());
5877 IRCallArgs[IRFunctionArgs.getInallocaArgNo()] = Arg;
5878 }
5879
5880 // 2. Prepare the function pointer.
5881
5882 // If the callee is a bitcast of a non-variadic function to have a
5883 // variadic function pointer type, check to see if we can remove the
5884 // bitcast. This comes up with unprototyped functions.
5885 //
5886 // This makes the IR nicer, but more importantly it ensures that we
5887 // can inline the function at -O0 if it is marked always_inline.
5888 auto simplifyVariadicCallee = [](llvm::FunctionType *CalleeFT,
5889 llvm::Value *Ptr) -> llvm::Function * {
5890 if (!CalleeFT->isVarArg())
5891 return nullptr;
5892
5893 // Get underlying value if it's a bitcast
5894 if (llvm::ConstantExpr *CE = dyn_cast<llvm::ConstantExpr>(Val: Ptr)) {
5895 if (CE->getOpcode() == llvm::Instruction::BitCast)
5896 Ptr = CE->getOperand(i_nocapture: 0);
5897 }
5898
5899 llvm::Function *OrigFn = dyn_cast<llvm::Function>(Val: Ptr);
5900 if (!OrigFn)
5901 return nullptr;
5902
5903 llvm::FunctionType *OrigFT = OrigFn->getFunctionType();
5904
5905 // If the original type is variadic, or if any of the component types
5906 // disagree, we cannot remove the cast.
5907 if (OrigFT->isVarArg() ||
5908 OrigFT->getNumParams() != CalleeFT->getNumParams() ||
5909 OrigFT->getReturnType() != CalleeFT->getReturnType())
5910 return nullptr;
5911
5912 for (unsigned i = 0, e = OrigFT->getNumParams(); i != e; ++i)
5913 if (OrigFT->getParamType(i) != CalleeFT->getParamType(i))
5914 return nullptr;
5915
5916 return OrigFn;
5917 };
5918
5919 if (llvm::Function *OrigFn = simplifyVariadicCallee(IRFuncTy, CalleePtr)) {
5920 CalleePtr = OrigFn;
5921 IRFuncTy = OrigFn->getFunctionType();
5922 }
5923
5924 // 3. Perform the actual call.
5925
5926 // Deactivate any cleanups that we're supposed to do immediately before
5927 // the call.
5928 if (!CallArgs.getCleanupsToDeactivate().empty())
5929 deactivateArgCleanupsBeforeCall(CGF&: *this, CallArgs);
5930
5931 // Update the largest vector width if any arguments have vector types.
5932 for (unsigned i = 0; i < IRCallArgs.size(); ++i)
5933 LargestVectorWidth = std::max(a: LargestVectorWidth,
5934 b: getMaxVectorWidth(Ty: IRCallArgs[i]->getType()));
5935
5936 // Compute the calling convention and attributes.
5937 unsigned CallingConv;
5938 llvm::AttributeList Attrs;
5939 CGM.ConstructAttributeList(Name: CalleePtr->getName(), FI: CallInfo,
5940 CalleeInfo: Callee.getAbstractInfo(), AttrList&: Attrs, CallingConv,
5941 /*AttrOnCallSite=*/true,
5942 /*IsThunk=*/false);
5943
5944 if (CallingConv == llvm::CallingConv::X86_VectorCall &&
5945 getTarget().getTriple().isWindowsArm64EC()) {
5946 CGM.Error(loc: Loc, error: "__vectorcall calling convention is not currently "
5947 "supported");
5948 }
5949
5950 if (const FunctionDecl *FD = dyn_cast_or_null<FunctionDecl>(Val: CurFuncDecl)) {
5951 if (FD->hasAttr<StrictFPAttr>())
5952 // All calls within a strictfp function are marked strictfp
5953 Attrs = Attrs.addFnAttribute(C&: getLLVMContext(), Kind: llvm::Attribute::StrictFP);
5954
    // If -ffast-math is enabled and the function is guarded by an
    // '__attribute__((optnone))' attribute, adjust the memory attribute so the
    // BE emits the library call instead of the intrinsic.
5958 if (FD->hasAttr<OptimizeNoneAttr>() && getLangOpts().FastMath)
5959 CGM.AdjustMemoryAttribute(Name: CalleePtr->getName(), CalleeInfo: Callee.getAbstractInfo(),
5960 Attrs);
5961 }
5962 // Add call-site nomerge attribute if exists.
5963 if (InNoMergeAttributedStmt)
5964 Attrs = Attrs.addFnAttribute(C&: getLLVMContext(), Kind: llvm::Attribute::NoMerge);
5965
5966 // Add call-site noinline attribute if exists.
5967 if (InNoInlineAttributedStmt)
5968 Attrs = Attrs.addFnAttribute(C&: getLLVMContext(), Kind: llvm::Attribute::NoInline);
5969
5970 // Add call-site always_inline attribute if exists.
5971 // Note: This corresponds to the [[clang::always_inline]] statement attribute.
5972 if (InAlwaysInlineAttributedStmt &&
5973 !CGM.getTargetCodeGenInfo().wouldInliningViolateFunctionCallABI(
5974 Caller: CallerDecl, Callee: CalleeDecl))
5975 Attrs =
5976 Attrs.addFnAttribute(C&: getLLVMContext(), Kind: llvm::Attribute::AlwaysInline);
5977
5978 // Remove call-site convergent attribute if requested.
5979 if (InNoConvergentAttributedStmt)
5980 Attrs =
5981 Attrs.removeFnAttribute(C&: getLLVMContext(), Kind: llvm::Attribute::Convergent);
5982
5983 // Apply some call-site-specific attributes.
5984 // TODO: work this into building the attribute set.
5985
5986 // Apply always_inline to all calls within flatten functions.
5987 // FIXME: should this really take priority over __try, below?
5988 if (CurCodeDecl && CurCodeDecl->hasAttr<FlattenAttr>() &&
5989 !InNoInlineAttributedStmt &&
5990 !(TargetDecl && TargetDecl->hasAttr<NoInlineAttr>()) &&
5991 !CGM.getTargetCodeGenInfo().wouldInliningViolateFunctionCallABI(
5992 Caller: CallerDecl, Callee: CalleeDecl)) {
5993 Attrs =
5994 Attrs.addFnAttribute(C&: getLLVMContext(), Kind: llvm::Attribute::AlwaysInline);
5995 }
5996
5997 // Disable inlining inside SEH __try blocks.
5998 if (isSEHTryScope()) {
5999 Attrs = Attrs.addFnAttribute(C&: getLLVMContext(), Kind: llvm::Attribute::NoInline);
6000 }
6001
6002 // Decide whether to use a call or an invoke.
6003 bool CannotThrow;
6004 if (currentFunctionUsesSEHTry()) {
6005 // SEH cares about asynchronous exceptions, so everything can "throw."
6006 CannotThrow = false;
6007 } else if (isCleanupPadScope() &&
6008 EHPersonality::get(CGF&: *this).isMSVCXXPersonality()) {
6009 // The MSVC++ personality will implicitly terminate the program if an
6010 // exception is thrown during a cleanup outside of a try/catch.
6011 // We don't need to model anything in IR to get this behavior.
6012 CannotThrow = true;
6013 } else {
6014 // Otherwise, nounwind call sites will never throw.
6015 CannotThrow = Attrs.hasFnAttr(Kind: llvm::Attribute::NoUnwind);
6016
6017 if (auto *FPtr = dyn_cast<llvm::Function>(Val: CalleePtr))
6018 if (FPtr->hasFnAttribute(Kind: llvm::Attribute::NoUnwind))
6019 CannotThrow = true;
6020 }
6021
6022 // If we made a temporary, be sure to clean up after ourselves. Note that we
6023 // can't depend on being inside of an ExprWithCleanups, so we need to manually
6024 // pop this cleanup later on. Being eager about this is OK, since this
6025 // temporary is 'invisible' outside of the callee.
6026 if (NeedSRetLifetimeEnd)
6027 pushFullExprCleanup<CallLifetimeEnd>(kind: NormalEHLifetimeMarker, A: SRetPtr);
6028
6029 llvm::BasicBlock *InvokeDest = CannotThrow ? nullptr : getInvokeDest();
6030
6031 SmallVector<llvm::OperandBundleDef, 1> BundleList =
6032 getBundlesForFunclet(Callee: CalleePtr);
6033
6034 if (SanOpts.has(K: SanitizerKind::KCFI) &&
6035 !isa_and_nonnull<FunctionDecl>(Val: TargetDecl))
6036 EmitKCFIOperandBundle(Callee: ConcreteCallee, Bundles&: BundleList);
6037
6038 // Add the pointer-authentication bundle.
6039 EmitPointerAuthOperandBundle(Info: ConcreteCallee.getPointerAuthInfo(), Bundles&: BundleList);
6040
6041 if (const FunctionDecl *FD = dyn_cast_or_null<FunctionDecl>(Val: CurFuncDecl))
6042 if (FD->hasAttr<StrictFPAttr>())
6043 // All calls within a strictfp function are marked strictfp
6044 Attrs = Attrs.addFnAttribute(C&: getLLVMContext(), Kind: llvm::Attribute::StrictFP);
6045
6046 AssumeAlignedAttrEmitter AssumeAlignedAttrEmitter(*this, TargetDecl);
6047 Attrs = AssumeAlignedAttrEmitter.TryEmitAsCallSiteAttribute(Attrs);
6048
6049 AllocAlignAttrEmitter AllocAlignAttrEmitter(*this, TargetDecl, CallArgs);
6050 Attrs = AllocAlignAttrEmitter.TryEmitAsCallSiteAttribute(Attrs);
6051
6052 // Emit the actual call/invoke instruction.
6053 llvm::CallBase *CI;
6054 if (!InvokeDest) {
6055 CI = Builder.CreateCall(FTy: IRFuncTy, Callee: CalleePtr, Args: IRCallArgs, OpBundles: BundleList);
6056 } else {
6057 llvm::BasicBlock *Cont = createBasicBlock(name: "invoke.cont");
6058 CI = Builder.CreateInvoke(Ty: IRFuncTy, Callee: CalleePtr, NormalDest: Cont, UnwindDest: InvokeDest, Args: IRCallArgs,
6059 OpBundles: BundleList);
6060 EmitBlock(BB: Cont);
6061 }
6062 if (CI->getCalledFunction() && CI->getCalledFunction()->hasName() &&
6063 CI->getCalledFunction()->getName().starts_with(Prefix: "_Z4sqrt")) {
6064 SetSqrtFPAccuracy(CI);
6065 }
6066 if (callOrInvoke) {
6067 *callOrInvoke = CI;
6068 if (CGM.getCodeGenOpts().CallGraphSection) {
6069 QualType CST;
6070 if (TargetDecl && TargetDecl->getFunctionType())
6071 CST = QualType(TargetDecl->getFunctionType(), 0);
6072 else if (const auto *FPT =
6073 Callee.getAbstractInfo().getCalleeFunctionProtoType())
6074 CST = QualType(FPT, 0);
6075 else
6076 llvm_unreachable(
6077 "Cannot find the callee type to generate callee_type metadata.");
6078
6079 // Set type identifier metadata of indirect calls for call graph section.
6080 if (!CST.isNull())
6081 CGM.createCalleeTypeMetadataForIcall(QT: CST, CB: *callOrInvoke);
6082 }
6083 }
6084
6085 // If this is within a function that has the guard(nocf) attribute and is an
6086 // indirect call, add the "guard_nocf" attribute to this call to indicate that
6087 // Control Flow Guard checks should not be added, even if the call is inlined.
6088 if (const auto *FD = dyn_cast_or_null<FunctionDecl>(Val: CurFuncDecl)) {
6089 if (const auto *A = FD->getAttr<CFGuardAttr>()) {
6090 if (A->getGuard() == CFGuardAttr::GuardArg::nocf &&
6091 !CI->getCalledFunction())
6092 Attrs = Attrs.addFnAttribute(C&: getLLVMContext(), Kind: "guard_nocf");
6093 }
6094 }
6095
6096 // Apply the attributes and calling convention.
6097 CI->setAttributes(Attrs);
6098 CI->setCallingConv(static_cast<llvm::CallingConv::ID>(CallingConv));
6099
6100 // Apply various metadata.
6101
6102 if (!CI->getType()->isVoidTy())
6103 CI->setName("call");
6104
6105 if (CGM.shouldEmitConvergenceTokens() && CI->isConvergent())
6106 CI = addConvergenceControlToken(Input: CI);
6107
6108 // Update largest vector width from the return type.
6109 LargestVectorWidth =
6110 std::max(a: LargestVectorWidth, b: getMaxVectorWidth(Ty: CI->getType()));
6111
6112 // Insert instrumentation or attach profile metadata at indirect call sites.
6113 // For more details, see the comment before the definition of
6114 // IPVK_IndirectCallTarget in InstrProfData.inc.
6115 if (!CI->getCalledFunction())
6116 PGO->valueProfile(Builder, ValueKind: llvm::IPVK_IndirectCallTarget, ValueSite: CI, ValuePtr: CalleePtr);
6117
6118 // In ObjC ARC mode with no ObjC ARC exception safety, tell the ARC
6119 // optimizer it can aggressively ignore unwind edges.
6120 if (CGM.getLangOpts().ObjCAutoRefCount)
6121 AddObjCARCExceptionMetadata(Inst: CI);
6122
6123 // Set tail call kind if necessary.
6124 bool IsPPC = getTarget().getTriple().isPPC();
6125 bool IsMIPS = getTarget().getTriple().isMIPS();
6126 bool HasMips16 = false;
6127 if (IsMIPS) {
6128 const TargetOptions &TargetOpts = getTarget().getTargetOpts();
6129 HasMips16 = TargetOpts.FeatureMap.lookup(Key: "mips16");
6130 if (!HasMips16)
6131 HasMips16 = llvm::is_contained(Range: TargetOpts.Features, Element: "+mips16");
6132 }
6133 if (llvm::CallInst *Call = dyn_cast<llvm::CallInst>(Val: CI)) {
6134 if (TargetDecl && TargetDecl->hasAttr<NotTailCalledAttr>())
6135 Call->setTailCallKind(llvm::CallInst::TCK_NoTail);
6136 else if (IsMustTail) {
6137 if (IsPPC) {
6138 if (getTarget().getTriple().isOSAIX())
6139 CGM.getDiags().Report(Loc, DiagID: diag::err_aix_musttail_unsupported);
6140 else if (!getTarget().hasFeature(Feature: "pcrelative-memops")) {
6141 if (getTarget().hasFeature(Feature: "longcall"))
6142 CGM.getDiags().Report(Loc, DiagID: diag::err_ppc_impossible_musttail) << 0;
6143 else if (Call->isIndirectCall())
6144 CGM.getDiags().Report(Loc, DiagID: diag::err_ppc_impossible_musttail) << 1;
6145 else if (isa_and_nonnull<FunctionDecl>(Val: TargetDecl)) {
6146 if (!cast<FunctionDecl>(Val: TargetDecl)->isDefined())
            // The undefined callee may be a forward declaration. Without
            // knowing all symbols in the module, we won't know whether the
            // symbol is defined. Collect all these symbols to diagnose later.
6150 CGM.addUndefinedGlobalForTailCall(
6151 Global: {cast<FunctionDecl>(Val: TargetDecl), Loc});
6152 else {
6153 llvm::GlobalValue::LinkageTypes Linkage = CGM.getFunctionLinkage(
6154 GD: GlobalDecl(cast<FunctionDecl>(Val: TargetDecl)));
6155 if (llvm::GlobalValue::isWeakForLinker(Linkage) ||
6156 llvm::GlobalValue::isDiscardableIfUnused(Linkage))
6157 CGM.getDiags().Report(Loc, DiagID: diag::err_ppc_impossible_musttail)
6158 << 2;
6159 }
6160 }
6161 }
6162 }
6163 if (IsMIPS) {
6164 if (HasMips16)
6165 CGM.getDiags().Report(Loc, DiagID: diag::err_mips_impossible_musttail) << 0;
6166 else if (const auto *FD = dyn_cast_or_null<FunctionDecl>(Val: TargetDecl))
6167 CGM.addUndefinedGlobalForTailCall(Global: {FD, Loc});
6168 }
6169 Call->setTailCallKind(llvm::CallInst::TCK_MustTail);
6170 }
6171 }
6172
6173 // Add metadata for calls to MSAllocator functions
6174 if (getDebugInfo() && TargetDecl && TargetDecl->hasAttr<MSAllocatorAttr>())
6175 getDebugInfo()->addHeapAllocSiteMetadata(CallSite: CI, AllocatedTy: RetTy->getPointeeType(), Loc);
6176
6177 // Add srcloc metadata for [[gnu::error/warning]] diagnostics. When
6178 // ShowInliningChain is enabled, also track inline/static calls for the
6179 // heuristic fallback when debug info is not available. This heuristic is
6180 // conservative and best-effort since static or inline-annotated functions
6181 // are still not guaranteed to be inlined.
6182 if (TargetDecl) {
6183 bool NeedSrcLoc = TargetDecl->hasAttr<ErrorAttr>();
6184 if (!NeedSrcLoc && CGM.getCodeGenOpts().ShowInliningChain) {
6185 if (const auto *FD = dyn_cast<FunctionDecl>(Val: TargetDecl))
6186 NeedSrcLoc = FD->isInlined() || FD->hasAttr<AlwaysInlineAttr>() ||
6187 FD->getStorageClass() == SC_Static ||
6188 FD->isInAnonymousNamespace();
6189 }
6190 if (NeedSrcLoc) {
6191 auto *Line = llvm::ConstantInt::get(Ty: Int64Ty, V: Loc.getRawEncoding());
6192 auto *MD = llvm::ConstantAsMetadata::get(C: Line);
6193 CI->setMetadata(Kind: "srcloc", Node: llvm::MDNode::get(Context&: getLLVMContext(), MDs: {MD}));
6194 }
6195 }
6196
6197 // 4. Finish the call.
6198
6199 // If the call doesn't return, finish the basic block and clear the
6200 // insertion point; this allows the rest of IRGen to discard
6201 // unreachable code.
6202 if (CI->doesNotReturn()) {
6203 if (NeedSRetLifetimeEnd)
6204 PopCleanupBlock();
6205
6206 // Strip away the noreturn attribute to better diagnose unreachable UB.
6207 if (SanOpts.has(K: SanitizerKind::Unreachable)) {
6208 // Also remove from function since CallBase::hasFnAttr additionally checks
6209 // attributes of the called function.
6210 if (auto *F = CI->getCalledFunction())
6211 F->removeFnAttr(Kind: llvm::Attribute::NoReturn);
6212 CI->removeFnAttr(Kind: llvm::Attribute::NoReturn);
6213
6214 // Avoid incompatibility with ASan which relies on the `noreturn`
6215 // attribute to insert handler calls.
6216 if (SanOpts.hasOneOf(K: SanitizerKind::Address |
6217 SanitizerKind::KernelAddress)) {
6218 SanitizerScope SanScope(this);
6219 llvm::IRBuilder<>::InsertPointGuard IPGuard(Builder);
6220 Builder.SetInsertPoint(CI);
6221 auto *FnType = llvm::FunctionType::get(Result: CGM.VoidTy, /*isVarArg=*/false);
6222 llvm::FunctionCallee Fn =
6223 CGM.CreateRuntimeFunction(Ty: FnType, Name: "__asan_handle_no_return");
6224 EmitNounwindRuntimeCall(callee: Fn);
6225 }
6226 }
6227
6228 EmitUnreachable(Loc);
6229 Builder.ClearInsertionPoint();
6230
6231 // FIXME: For now, emit a dummy basic block because expr emitters in
6232 // generally are not ready to handle emitting expressions at unreachable
6233 // points.
6234 EnsureInsertPoint();
6235
6236 // Return a reasonable RValue.
6237 return GetUndefRValue(Ty: RetTy);
6238 }
6239
6240 // If this is a musttail call, return immediately. We do not branch to the
6241 // epilogue in this case.
6242 if (IsMustTail) {
6243 for (auto it = EHStack.find(sp: CurrentCleanupScopeDepth); it != EHStack.end();
6244 ++it) {
6245 EHCleanupScope *Cleanup = dyn_cast<EHCleanupScope>(Val: &*it);
6246 // Fake uses can be safely emitted immediately prior to the tail call, so
6247 // we choose to emit them just before the call here.
6248 if (Cleanup && Cleanup->isFakeUse()) {
6249 CGBuilderTy::InsertPointGuard IPG(Builder);
6250 Builder.SetInsertPoint(CI);
6251 Cleanup->getCleanup()->Emit(CGF&: *this, flags: EHScopeStack::Cleanup::Flags());
6252 } else if (!(Cleanup &&
6253 Cleanup->getCleanup()->isRedundantBeforeReturn())) {
6254 CGM.ErrorUnsupported(S: MustTailCall, Type: "tail call skipping over cleanups");
6255 }
6256 }
6257 if (CI->getType()->isVoidTy())
6258 Builder.CreateRetVoid();
6259 else
6260 Builder.CreateRet(V: CI);
6261 Builder.ClearInsertionPoint();
6262 EnsureInsertPoint();
6263 return GetUndefRValue(Ty: RetTy);
6264 }
6265
6266 // Perform the swifterror writeback.
6267 if (swiftErrorTemp.isValid()) {
6268 llvm::Value *errorResult = Builder.CreateLoad(Addr: swiftErrorTemp);
6269 Builder.CreateStore(Val: errorResult, Addr: swiftErrorArg);
6270 }
6271
6272 // Emit any call-associated writebacks immediately. Arguably this
6273 // should happen after any return-value munging.
6274 if (CallArgs.hasWritebacks())
6275 EmitWritebacks(args: CallArgs);
6276
6277 // The stack cleanup for inalloca arguments has to run out of the normal
6278 // lexical order, so deactivate it and run it manually here.
6279 CallArgs.freeArgumentMemory(CGF&: *this);
6280
6281 // Extract the return value.
6282 RValue Ret;
6283
6284 // If the current function is a virtual function pointer thunk, avoid copying
6285 // the return value of the musttail call to a temporary.
6286 if (IsVirtualFunctionPointerThunk) {
6287 Ret = RValue::get(V: CI);
6288 } else {
6289 Ret = [&] {
6290 switch (RetAI.getKind()) {
6291 case ABIArgInfo::CoerceAndExpand: {
6292 auto coercionType = RetAI.getCoerceAndExpandType();
6293
6294 Address addr = SRetPtr.withElementType(ElemTy: coercionType);
6295
6296 assert(CI->getType() == RetAI.getUnpaddedCoerceAndExpandType());
6297 bool requiresExtract = isa<llvm::StructType>(Val: CI->getType());
6298
6299 unsigned unpaddedIndex = 0;
6300 for (unsigned i = 0, e = coercionType->getNumElements(); i != e; ++i) {
6301 llvm::Type *eltType = coercionType->getElementType(N: i);
6302 if (ABIArgInfo::isPaddingForCoerceAndExpand(eltType))
6303 continue;
6304 Address eltAddr = Builder.CreateStructGEP(Addr: addr, Index: i);
6305 llvm::Value *elt = CI;
6306 if (requiresExtract)
6307 elt = Builder.CreateExtractValue(Agg: elt, Idxs: unpaddedIndex++);
6308 else
6309 assert(unpaddedIndex == 0);
6310 Builder.CreateStore(Val: elt, Addr: eltAddr);
6311 }
6312 [[fallthrough]];
6313 }
6314
6315 case ABIArgInfo::InAlloca:
6316 case ABIArgInfo::Indirect: {
6317 RValue ret = convertTempToRValue(addr: SRetPtr, type: RetTy, Loc: SourceLocation());
6318 if (NeedSRetLifetimeEnd)
6319 PopCleanupBlock();
6320 return ret;
6321 }
6322
6323 case ABIArgInfo::Ignore:
6324 // If we are ignoring an argument that had a result, make sure to
6325 // construct the appropriate return value for our caller.
6326 return GetUndefRValue(Ty: RetTy);
6327
6328 case ABIArgInfo::Extend:
6329 case ABIArgInfo::Direct: {
6330 llvm::Type *RetIRTy = ConvertType(T: RetTy);
6331 if (RetAI.getCoerceToType() == RetIRTy &&
6332 RetAI.getDirectOffset() == 0) {
6333 switch (getEvaluationKind(T: RetTy)) {
6334 case TEK_Complex: {
6335 llvm::Value *Real = Builder.CreateExtractValue(Agg: CI, Idxs: 0);
6336 llvm::Value *Imag = Builder.CreateExtractValue(Agg: CI, Idxs: 1);
6337 return RValue::getComplex(C: std::make_pair(x&: Real, y&: Imag));
6338 }
6339 case TEK_Aggregate:
6340 break;
6341 case TEK_Scalar: {
6342 // If the argument doesn't match, perform a bitcast to coerce it.
6343 // This can happen due to trivial type mismatches.
6344 llvm::Value *V = CI;
6345 if (V->getType() != RetIRTy)
6346 V = Builder.CreateBitCast(V, DestTy: RetIRTy);
6347 return RValue::get(V);
6348 }
6349 }
6350 }
6351
6352 // If coercing a fixed vector from a scalable vector for ABI
6353 // compatibility, and the types match, use the llvm.vector.extract
6354 // intrinsic to perform the conversion.
6355 if (auto *FixedDstTy = dyn_cast<llvm::FixedVectorType>(Val: RetIRTy)) {
6356 llvm::Value *V = CI;
6357 if (auto *ScalableSrcTy =
6358 dyn_cast<llvm::ScalableVectorType>(Val: V->getType())) {
6359 if (FixedDstTy->getElementType() ==
6360 ScalableSrcTy->getElementType()) {
6361 V = Builder.CreateExtractVector(DstType: FixedDstTy, SrcVec: V, Idx: uint64_t(0),
6362 Name: "cast.fixed");
6363 return RValue::get(V);
6364 }
6365 }
6366 }
6367
6368 Address DestPtr = ReturnValue.getValue();
6369 bool DestIsVolatile = ReturnValue.isVolatile();
6370 uint64_t DestSize =
6371 getContext().getTypeInfoDataSizeInChars(T: RetTy).Width.getQuantity();
6372
6373 if (!DestPtr.isValid()) {
6374 DestPtr = CreateMemTemp(T: RetTy, Name: "coerce");
6375 DestIsVolatile = false;
6376 DestSize = getContext().getTypeSizeInChars(T: RetTy).getQuantity();
6377 }
6378
6379 // An empty record can overlap other data (if declared with
6380 // no_unique_address); omit the store for such types - as there is no
6381 // actual data to store.
6382 if (!isEmptyRecord(Context&: getContext(), T: RetTy, AllowArrays: true)) {
6383 // If the value is offset in memory, apply the offset now.
6384 Address StorePtr = emitAddressAtOffset(CGF&: *this, addr: DestPtr, info: RetAI);
6385 CreateCoercedStore(
6386 Src: CI, SrcFETy: RetTy, Dst: StorePtr,
6387 DstSize: llvm::TypeSize::getFixed(ExactSize: DestSize - RetAI.getDirectOffset()),
6388 DstIsVolatile: DestIsVolatile);
6389 }
6390
6391 return convertTempToRValue(addr: DestPtr, type: RetTy, Loc: SourceLocation());
6392 }
6393
6394 case ABIArgInfo::TargetSpecific: {
6395 Address DestPtr = ReturnValue.getValue();
6396 Address StorePtr = emitAddressAtOffset(CGF&: *this, addr: DestPtr, info: RetAI);
6397 bool DestIsVolatile = ReturnValue.isVolatile();
6398 if (!DestPtr.isValid()) {
6399 DestPtr = CreateMemTemp(T: RetTy, Name: "target_coerce");
6400 DestIsVolatile = false;
6401 }
6402 CGM.getABIInfo().createCoercedStore(Val: CI, DstAddr: StorePtr, AI: RetAI, DestIsVolatile,
6403 CGF&: *this);
6404 return convertTempToRValue(addr: DestPtr, type: RetTy, Loc: SourceLocation());
6405 }
6406
6407 case ABIArgInfo::Expand:
6408 case ABIArgInfo::IndirectAliased:
6409 llvm_unreachable("Invalid ABI kind for return argument");
6410 }
6411
6412 llvm_unreachable("Unhandled ABIArgInfo::Kind");
6413 }();
6414 }
6415
6416 // Emit the assume_aligned check on the return value.
6417 if (Ret.isScalar() && TargetDecl) {
6418 AssumeAlignedAttrEmitter.EmitAsAnAssumption(Loc, RetTy, Ret);
6419 AllocAlignAttrEmitter.EmitAsAnAssumption(Loc, RetTy, Ret);
6420 }
6421
6422 // Explicitly call CallLifetimeEnd::Emit just to re-use the code even though
6423 // we can't use the full cleanup mechanism.
6424 for (CallLifetimeEnd &LifetimeEnd : CallLifetimeEndAfterCall)
6425 LifetimeEnd.Emit(CGF&: *this, /*Flags=*/flags: {});
6426
6427 if (!ReturnValue.isExternallyDestructed() &&
6428 RetTy.isDestructedType() == QualType::DK_nontrivial_c_struct)
6429 pushDestroy(dtorKind: QualType::DK_nontrivial_c_struct, addr: Ret.getAggregateAddress(),
6430 type: RetTy);
6431
  // Generate a function-declaration DISubprogram so it can be used
  // in debug info about call sites.
6434 if (CGDebugInfo *DI = getDebugInfo()) {
6435 // Ensure call site info would actually be emitted before collecting
6436 // further callee info.
6437 if (CalleeDecl && !CalleeDecl->hasAttr<NoDebugAttr>() &&
6438 DI->getCallSiteRelatedAttrs() != llvm::DINode::FlagZero) {
6439 CodeGenFunction CalleeCGF(CGM);
6440 const GlobalDecl &CalleeGlobalDecl =
6441 Callee.getAbstractInfo().getCalleeDecl();
6442 CalleeCGF.CurGD = CalleeGlobalDecl;
6443 FunctionArgList Args;
6444 QualType ResTy = CalleeCGF.BuildFunctionArgList(GD: CalleeGlobalDecl, Args);
6445 DI->EmitFuncDeclForCallSite(
6446 CallOrInvoke: CI, CalleeType: DI->getFunctionType(FD: CalleeDecl, RetTy: ResTy, Args), CalleeGlobalDecl);
6447 }
6448 // Generate call site target information.
6449 DI->addCallTargetIfVirtual(FD: CalleeDecl, CI);
6450 }
6451
6452 return Ret;
6453}
6454
6455CGCallee CGCallee::prepareConcreteCallee(CodeGenFunction &CGF) const {
6456 if (isVirtual()) {
6457 const CallExpr *CE = getVirtualCallExpr();
6458 return CGF.CGM.getCXXABI().getVirtualFunctionPointer(
6459 CGF, GD: getVirtualMethodDecl(), This: getThisAddress(), Ty: getVirtualFunctionType(),
6460 Loc: CE ? CE->getBeginLoc() : SourceLocation());
6461 }
6462
6463 return *this;
6464}
6465
6466/* VarArg handling */
6467
6468RValue CodeGenFunction::EmitVAArg(VAArgExpr *VE, Address &VAListAddr,
6469 AggValueSlot Slot) {
6470 VAListAddr = VE->isMicrosoftABI() ? EmitMSVAListRef(E: VE->getSubExpr())
6471 : EmitVAListRef(E: VE->getSubExpr());
6472 QualType Ty = VE->getType();
6473 if (Ty->isVariablyModifiedType())
6474 EmitVariablyModifiedType(Ty);
6475 if (VE->isMicrosoftABI())
6476 return CGM.getABIInfo().EmitMSVAArg(CGF&: *this, VAListAddr, Ty, Slot);
6477 return CGM.getABIInfo().EmitVAArg(CGF&: *this, VAListAddr, Ty, Slot);
6478}
6479
6480DisableDebugLocationUpdates::DisableDebugLocationUpdates(CodeGenFunction &CGF)
6481 : CGF(CGF) {
6482 CGF.disableDebugInfo();
6483}
6484
// Re-enable debug-info emission when the RAII scope ends, balancing the
// disableDebugInfo() call made by the constructor.
DisableDebugLocationUpdates::~DisableDebugLocationUpdates() {
  CGF.enableDebugInfo();
}
6488