| 1 | //===--- CGCall.cpp - Encapsulate calling convention details --------------===// | 
|---|
| 2 | // | 
|---|
| 3 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. | 
|---|
| 4 | // See https://llvm.org/LICENSE.txt for license information. | 
|---|
| 5 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception | 
|---|
| 6 | // | 
|---|
| 7 | //===----------------------------------------------------------------------===// | 
|---|
| 8 | // | 
|---|
| 9 | // These classes wrap the information about a call or function | 
|---|
| 10 | // definition used to handle ABI compliancy. | 
|---|
| 11 | // | 
|---|
| 12 | //===----------------------------------------------------------------------===// | 
|---|
| 13 |  | 
|---|
| 14 | #include "CGCall.h" | 
|---|
| 15 | #include "ABIInfo.h" | 
|---|
| 16 | #include "ABIInfoImpl.h" | 
|---|
| 17 | #include "CGBlocks.h" | 
|---|
| 18 | #include "CGCXXABI.h" | 
|---|
| 19 | #include "CGCleanup.h" | 
|---|
| 20 | #include "CGDebugInfo.h" | 
|---|
| 21 | #include "CGRecordLayout.h" | 
|---|
| 22 | #include "CodeGenFunction.h" | 
|---|
| 23 | #include "CodeGenModule.h" | 
|---|
| 24 | #include "CodeGenPGO.h" | 
|---|
| 25 | #include "TargetInfo.h" | 
|---|
| 26 | #include "clang/AST/Attr.h" | 
|---|
| 27 | #include "clang/AST/Decl.h" | 
|---|
| 28 | #include "clang/AST/DeclCXX.h" | 
|---|
| 29 | #include "clang/AST/DeclObjC.h" | 
|---|
| 30 | #include "clang/Basic/CodeGenOptions.h" | 
|---|
| 31 | #include "clang/Basic/TargetInfo.h" | 
|---|
| 32 | #include "clang/CodeGen/CGFunctionInfo.h" | 
|---|
| 33 | #include "clang/CodeGen/SwiftCallingConv.h" | 
|---|
| 34 | #include "llvm/ADT/StringExtras.h" | 
|---|
| 35 | #include "llvm/Analysis/ValueTracking.h" | 
|---|
| 36 | #include "llvm/IR/Assumptions.h" | 
|---|
| 37 | #include "llvm/IR/AttributeMask.h" | 
|---|
| 38 | #include "llvm/IR/Attributes.h" | 
|---|
| 39 | #include "llvm/IR/CallingConv.h" | 
|---|
| 40 | #include "llvm/IR/DataLayout.h" | 
|---|
| 41 | #include "llvm/IR/InlineAsm.h" | 
|---|
| 42 | #include "llvm/IR/IntrinsicInst.h" | 
|---|
| 43 | #include "llvm/IR/Intrinsics.h" | 
|---|
| 44 | #include "llvm/IR/Type.h" | 
|---|
| 45 | #include "llvm/Transforms/Utils/Local.h" | 
|---|
| 46 | #include <optional> | 
|---|
| 47 | using namespace clang; | 
|---|
| 48 | using namespace CodeGen; | 
|---|
| 49 |  | 
|---|
| 50 | /***/ | 
|---|
| 51 |  | 
|---|
| 52 | unsigned CodeGenTypes::ClangCallConvToLLVMCallConv(CallingConv CC) { | 
|---|
| 53 | switch (CC) { | 
|---|
| 54 | default: | 
|---|
| 55 | return llvm::CallingConv::C; | 
|---|
| 56 | case CC_X86StdCall: | 
|---|
| 57 | return llvm::CallingConv::X86_StdCall; | 
|---|
| 58 | case CC_X86FastCall: | 
|---|
| 59 | return llvm::CallingConv::X86_FastCall; | 
|---|
| 60 | case CC_X86RegCall: | 
|---|
| 61 | return llvm::CallingConv::X86_RegCall; | 
|---|
| 62 | case CC_X86ThisCall: | 
|---|
| 63 | return llvm::CallingConv::X86_ThisCall; | 
|---|
| 64 | case CC_Win64: | 
|---|
| 65 | return llvm::CallingConv::Win64; | 
|---|
| 66 | case CC_X86_64SysV: | 
|---|
| 67 | return llvm::CallingConv::X86_64_SysV; | 
|---|
| 68 | case CC_AAPCS: | 
|---|
| 69 | return llvm::CallingConv::ARM_AAPCS; | 
|---|
| 70 | case CC_AAPCS_VFP: | 
|---|
| 71 | return llvm::CallingConv::ARM_AAPCS_VFP; | 
|---|
| 72 | case CC_IntelOclBicc: | 
|---|
| 73 | return llvm::CallingConv::Intel_OCL_BI; | 
|---|
| 74 | // TODO: Add support for __pascal to LLVM. | 
|---|
| 75 | case CC_X86Pascal: | 
|---|
| 76 | return llvm::CallingConv::C; | 
|---|
| 77 | // TODO: Add support for __vectorcall to LLVM. | 
|---|
| 78 | case CC_X86VectorCall: | 
|---|
| 79 | return llvm::CallingConv::X86_VectorCall; | 
|---|
| 80 | case CC_AArch64VectorCall: | 
|---|
| 81 | return llvm::CallingConv::AArch64_VectorCall; | 
|---|
| 82 | case CC_AArch64SVEPCS: | 
|---|
| 83 | return llvm::CallingConv::AArch64_SVE_VectorCall; | 
|---|
| 84 | case CC_SpirFunction: | 
|---|
| 85 | return llvm::CallingConv::SPIR_FUNC; | 
|---|
| 86 | case CC_DeviceKernel: | 
|---|
| 87 | return CGM.getTargetCodeGenInfo().getDeviceKernelCallingConv(); | 
|---|
| 88 | case CC_PreserveMost: | 
|---|
| 89 | return llvm::CallingConv::PreserveMost; | 
|---|
| 90 | case CC_PreserveAll: | 
|---|
| 91 | return llvm::CallingConv::PreserveAll; | 
|---|
| 92 | case CC_Swift: | 
|---|
| 93 | return llvm::CallingConv::Swift; | 
|---|
| 94 | case CC_SwiftAsync: | 
|---|
| 95 | return llvm::CallingConv::SwiftTail; | 
|---|
| 96 | case CC_M68kRTD: | 
|---|
| 97 | return llvm::CallingConv::M68k_RTD; | 
|---|
| 98 | case CC_PreserveNone: | 
|---|
| 99 | return llvm::CallingConv::PreserveNone; | 
|---|
| 100 | // clang-format off | 
|---|
| 101 | case CC_RISCVVectorCall: return llvm::CallingConv::RISCV_VectorCall; | 
|---|
| 102 | // clang-format on | 
|---|
| 103 | #define CC_VLS_CASE(ABI_VLEN)                                                  \ | 
|---|
| 104 | case CC_RISCVVLSCall_##ABI_VLEN:                                             \ | 
|---|
| 105 | return llvm::CallingConv::RISCV_VLSCall_##ABI_VLEN; | 
|---|
| 106 | CC_VLS_CASE(32) | 
|---|
| 107 | CC_VLS_CASE(64) | 
|---|
| 108 | CC_VLS_CASE(128) | 
|---|
| 109 | CC_VLS_CASE(256) | 
|---|
| 110 | CC_VLS_CASE(512) | 
|---|
| 111 | CC_VLS_CASE(1024) | 
|---|
| 112 | CC_VLS_CASE(2048) | 
|---|
| 113 | CC_VLS_CASE(4096) | 
|---|
| 114 | CC_VLS_CASE(8192) | 
|---|
| 115 | CC_VLS_CASE(16384) | 
|---|
| 116 | CC_VLS_CASE(32768) | 
|---|
| 117 | CC_VLS_CASE(65536) | 
|---|
| 118 | #undef CC_VLS_CASE | 
|---|
| 119 | } | 
|---|
| 120 | } | 
|---|
| 121 |  | 
|---|
| 122 | /// Derives the 'this' type for codegen purposes, i.e. ignoring method CVR | 
|---|
| 123 | /// qualification. Either or both of RD and MD may be null. A null RD indicates | 
|---|
| 124 | /// that there is no meaningful 'this' type, and a null MD can occur when | 
|---|
| 125 | /// calling a method pointer. | 
|---|
| 126 | CanQualType CodeGenTypes::DeriveThisType(const CXXRecordDecl *RD, | 
|---|
| 127 | const CXXMethodDecl *MD) { | 
|---|
| 128 | QualType RecTy; | 
|---|
| 129 | if (RD) | 
|---|
| 130 | RecTy = Context.getTagDeclType(Decl: RD)->getCanonicalTypeInternal(); | 
|---|
| 131 | else | 
|---|
| 132 | RecTy = Context.VoidTy; | 
|---|
| 133 |  | 
|---|
| 134 | if (MD) | 
|---|
| 135 | RecTy = Context.getAddrSpaceQualType( | 
|---|
| 136 | T: RecTy, AddressSpace: MD->getMethodQualifiers().getAddressSpace()); | 
|---|
| 137 | return Context.getPointerType(T: CanQualType::CreateUnsafe(Other: RecTy)); | 
|---|
| 138 | } | 
|---|
| 139 |  | 
|---|
| 140 | /// Returns the canonical formal type of the given C++ method. | 
|---|
| 141 | static CanQual<FunctionProtoType> GetFormalType(const CXXMethodDecl *MD) { | 
|---|
| 142 | return MD->getType() | 
|---|
| 143 | ->getCanonicalTypeUnqualified() | 
|---|
| 144 | .getAs<FunctionProtoType>(); | 
|---|
| 145 | } | 
|---|
| 146 |  | 
|---|
| 147 | /// Returns the "extra-canonicalized" return type, which discards | 
|---|
| 148 | /// qualifiers on the return type.  Codegen doesn't care about them, | 
|---|
| 149 | /// and it makes ABI code a little easier to be able to assume that | 
|---|
| 150 | /// all parameter and return types are top-level unqualified. | 
|---|
| 151 | static CanQualType GetReturnType(QualType RetTy) { | 
|---|
| 152 | return RetTy->getCanonicalTypeUnqualified().getUnqualifiedType(); | 
|---|
| 153 | } | 
|---|
| 154 |  | 
|---|
| 155 | /// Arrange the argument and result information for a value of the given | 
|---|
| 156 | /// unprototyped freestanding function type. | 
|---|
| 157 | const CGFunctionInfo & | 
|---|
| 158 | CodeGenTypes::arrangeFreeFunctionType(CanQual<FunctionNoProtoType> FTNP) { | 
|---|
| 159 | // When translating an unprototyped function type, always use a | 
|---|
| 160 | // variadic type. | 
|---|
| 161 | return arrangeLLVMFunctionInfo(returnType: FTNP->getReturnType().getUnqualifiedType(), | 
|---|
| 162 | opts: FnInfoOpts::None, argTypes: {}, info: FTNP->getExtInfo(), paramInfos: {}, | 
|---|
| 163 | args: RequiredArgs(0)); | 
|---|
| 164 | } | 
|---|
| 165 |  | 
|---|
| 166 | static void addExtParameterInfosForCall( | 
|---|
| 167 | llvm::SmallVectorImpl<FunctionProtoType::ExtParameterInfo> ¶mInfos, | 
|---|
| 168 | const FunctionProtoType *proto, unsigned prefixArgs, unsigned totalArgs) { | 
|---|
| 169 | assert(proto->hasExtParameterInfos()); | 
|---|
| 170 | assert(paramInfos.size() <= prefixArgs); | 
|---|
| 171 | assert(proto->getNumParams() + prefixArgs <= totalArgs); | 
|---|
| 172 |  | 
|---|
| 173 | paramInfos.reserve(N: totalArgs); | 
|---|
| 174 |  | 
|---|
| 175 | // Add default infos for any prefix args that don't already have infos. | 
|---|
| 176 | paramInfos.resize(N: prefixArgs); | 
|---|
| 177 |  | 
|---|
| 178 | // Add infos for the prototype. | 
|---|
| 179 | for (const auto &ParamInfo : proto->getExtParameterInfos()) { | 
|---|
| 180 | paramInfos.push_back(Elt: ParamInfo); | 
|---|
| 181 | // pass_object_size params have no parameter info. | 
|---|
| 182 | if (ParamInfo.hasPassObjectSize()) | 
|---|
| 183 | paramInfos.emplace_back(); | 
|---|
| 184 | } | 
|---|
| 185 |  | 
|---|
| 186 | assert(paramInfos.size() <= totalArgs && | 
|---|
| 187 | "Did we forget to insert pass_object_size args?"); | 
|---|
| 188 | // Add default infos for the variadic and/or suffix arguments. | 
|---|
| 189 | paramInfos.resize(N: totalArgs); | 
|---|
| 190 | } | 
|---|
| 191 |  | 
|---|
| 192 | /// Adds the formal parameters in FPT to the given prefix. If any parameter in | 
|---|
| 193 | /// FPT has pass_object_size attrs, then we'll add parameters for those, too. | 
|---|
| 194 | static void appendParameterTypes( | 
|---|
| 195 | const CodeGenTypes &CGT, SmallVectorImpl<CanQualType> &prefix, | 
|---|
| 196 | SmallVectorImpl<FunctionProtoType::ExtParameterInfo> ¶mInfos, | 
|---|
| 197 | CanQual<FunctionProtoType> FPT) { | 
|---|
| 198 | // Fast path: don't touch param info if we don't need to. | 
|---|
| 199 | if (!FPT->hasExtParameterInfos()) { | 
|---|
| 200 | assert(paramInfos.empty() && | 
|---|
| 201 | "We have paramInfos, but the prototype doesn't?"); | 
|---|
| 202 | prefix.append(in_start: FPT->param_type_begin(), in_end: FPT->param_type_end()); | 
|---|
| 203 | return; | 
|---|
| 204 | } | 
|---|
| 205 |  | 
|---|
| 206 | unsigned PrefixSize = prefix.size(); | 
|---|
| 207 | // In the vast majority of cases, we'll have precisely FPT->getNumParams() | 
|---|
| 208 | // parameters; the only thing that can change this is the presence of | 
|---|
| 209 | // pass_object_size. So, we preallocate for the common case. | 
|---|
| 210 | prefix.reserve(N: prefix.size() + FPT->getNumParams()); | 
|---|
| 211 |  | 
|---|
| 212 | auto ExtInfos = FPT->getExtParameterInfos(); | 
|---|
| 213 | assert(ExtInfos.size() == FPT->getNumParams()); | 
|---|
| 214 | for (unsigned I = 0, E = FPT->getNumParams(); I != E; ++I) { | 
|---|
| 215 | prefix.push_back(Elt: FPT->getParamType(i: I)); | 
|---|
| 216 | if (ExtInfos[I].hasPassObjectSize()) | 
|---|
| 217 | prefix.push_back(Elt: CGT.getContext().getSizeType()); | 
|---|
| 218 | } | 
|---|
| 219 |  | 
|---|
| 220 | addExtParameterInfosForCall(paramInfos, proto: FPT.getTypePtr(), prefixArgs: PrefixSize, | 
|---|
| 221 | totalArgs: prefix.size()); | 
|---|
| 222 | } | 
|---|
| 223 |  | 
|---|
| 224 | using ExtParameterInfoList = | 
|---|
| 225 | SmallVector<FunctionProtoType::ExtParameterInfo, 16>; | 
|---|
| 226 |  | 
|---|
| 227 | /// Arrange the LLVM function layout for a value of the given function | 
|---|
| 228 | /// type, on top of any implicit parameters already stored. | 
|---|
| 229 | static const CGFunctionInfo & | 
|---|
| 230 | arrangeLLVMFunctionInfo(CodeGenTypes &CGT, bool instanceMethod, | 
|---|
| 231 | SmallVectorImpl<CanQualType> &prefix, | 
|---|
| 232 | CanQual<FunctionProtoType> FTP) { | 
|---|
| 233 | ExtParameterInfoList paramInfos; | 
|---|
| 234 | RequiredArgs Required = RequiredArgs::forPrototypePlus(prototype: FTP, additional: prefix.size()); | 
|---|
| 235 | appendParameterTypes(CGT, prefix, paramInfos, FPT: FTP); | 
|---|
| 236 | CanQualType resultType = FTP->getReturnType().getUnqualifiedType(); | 
|---|
| 237 |  | 
|---|
| 238 | FnInfoOpts opts = | 
|---|
| 239 | instanceMethod ? FnInfoOpts::IsInstanceMethod : FnInfoOpts::None; | 
|---|
| 240 | return CGT.arrangeLLVMFunctionInfo(returnType: resultType, opts, argTypes: prefix, | 
|---|
| 241 | info: FTP->getExtInfo(), paramInfos, args: Required); | 
|---|
| 242 | } | 
|---|
| 243 |  | 
|---|
| 244 | using CanQualTypeList = SmallVector<CanQualType, 16>; | 
|---|
| 245 |  | 
|---|
| 246 | /// Arrange the argument and result information for a value of the | 
|---|
| 247 | /// given freestanding function type. | 
|---|
| 248 | const CGFunctionInfo & | 
|---|
| 249 | CodeGenTypes::arrangeFreeFunctionType(CanQual<FunctionProtoType> FTP) { | 
|---|
| 250 | CanQualTypeList argTypes; | 
|---|
| 251 | return ::arrangeLLVMFunctionInfo(CGT&: *this, /*instanceMethod=*/false, prefix&: argTypes, | 
|---|
| 252 | FTP); | 
|---|
| 253 | } | 
|---|
| 254 |  | 
|---|
| 255 | static CallingConv getCallingConventionForDecl(const ObjCMethodDecl *D, | 
|---|
| 256 | bool IsTargetDefaultMSABI) { | 
|---|
| 257 | // Set the appropriate calling convention for the Function. | 
|---|
| 258 | if (D->hasAttr<StdCallAttr>()) | 
|---|
| 259 | return CC_X86StdCall; | 
|---|
| 260 |  | 
|---|
| 261 | if (D->hasAttr<FastCallAttr>()) | 
|---|
| 262 | return CC_X86FastCall; | 
|---|
| 263 |  | 
|---|
| 264 | if (D->hasAttr<RegCallAttr>()) | 
|---|
| 265 | return CC_X86RegCall; | 
|---|
| 266 |  | 
|---|
| 267 | if (D->hasAttr<ThisCallAttr>()) | 
|---|
| 268 | return CC_X86ThisCall; | 
|---|
| 269 |  | 
|---|
| 270 | if (D->hasAttr<VectorCallAttr>()) | 
|---|
| 271 | return CC_X86VectorCall; | 
|---|
| 272 |  | 
|---|
| 273 | if (D->hasAttr<PascalAttr>()) | 
|---|
| 274 | return CC_X86Pascal; | 
|---|
| 275 |  | 
|---|
| 276 | if (PcsAttr *PCS = D->getAttr<PcsAttr>()) | 
|---|
| 277 | return (PCS->getPCS() == PcsAttr::AAPCS ? CC_AAPCS : CC_AAPCS_VFP); | 
|---|
| 278 |  | 
|---|
| 279 | if (D->hasAttr<AArch64VectorPcsAttr>()) | 
|---|
| 280 | return CC_AArch64VectorCall; | 
|---|
| 281 |  | 
|---|
| 282 | if (D->hasAttr<AArch64SVEPcsAttr>()) | 
|---|
| 283 | return CC_AArch64SVEPCS; | 
|---|
| 284 |  | 
|---|
| 285 | if (D->hasAttr<DeviceKernelAttr>()) | 
|---|
| 286 | return CC_DeviceKernel; | 
|---|
| 287 |  | 
|---|
| 288 | if (D->hasAttr<IntelOclBiccAttr>()) | 
|---|
| 289 | return CC_IntelOclBicc; | 
|---|
| 290 |  | 
|---|
| 291 | if (D->hasAttr<MSABIAttr>()) | 
|---|
| 292 | return IsTargetDefaultMSABI ? CC_C : CC_Win64; | 
|---|
| 293 |  | 
|---|
| 294 | if (D->hasAttr<SysVABIAttr>()) | 
|---|
| 295 | return IsTargetDefaultMSABI ? CC_X86_64SysV : CC_C; | 
|---|
| 296 |  | 
|---|
| 297 | if (D->hasAttr<PreserveMostAttr>()) | 
|---|
| 298 | return CC_PreserveMost; | 
|---|
| 299 |  | 
|---|
| 300 | if (D->hasAttr<PreserveAllAttr>()) | 
|---|
| 301 | return CC_PreserveAll; | 
|---|
| 302 |  | 
|---|
| 303 | if (D->hasAttr<M68kRTDAttr>()) | 
|---|
| 304 | return CC_M68kRTD; | 
|---|
| 305 |  | 
|---|
| 306 | if (D->hasAttr<PreserveNoneAttr>()) | 
|---|
| 307 | return CC_PreserveNone; | 
|---|
| 308 |  | 
|---|
| 309 | if (D->hasAttr<RISCVVectorCCAttr>()) | 
|---|
| 310 | return CC_RISCVVectorCall; | 
|---|
| 311 |  | 
|---|
| 312 | if (RISCVVLSCCAttr *PCS = D->getAttr<RISCVVLSCCAttr>()) { | 
|---|
| 313 | switch (PCS->getVectorWidth()) { | 
|---|
| 314 | default: | 
|---|
| 315 | llvm_unreachable( "Invalid RISC-V VLS ABI VLEN"); | 
|---|
| 316 | #define CC_VLS_CASE(ABI_VLEN)                                                  \ | 
|---|
| 317 | case ABI_VLEN:                                                               \ | 
|---|
| 318 | return CC_RISCVVLSCall_##ABI_VLEN; | 
|---|
| 319 | CC_VLS_CASE(32) | 
|---|
| 320 | CC_VLS_CASE(64) | 
|---|
| 321 | CC_VLS_CASE(128) | 
|---|
| 322 | CC_VLS_CASE(256) | 
|---|
| 323 | CC_VLS_CASE(512) | 
|---|
| 324 | CC_VLS_CASE(1024) | 
|---|
| 325 | CC_VLS_CASE(2048) | 
|---|
| 326 | CC_VLS_CASE(4096) | 
|---|
| 327 | CC_VLS_CASE(8192) | 
|---|
| 328 | CC_VLS_CASE(16384) | 
|---|
| 329 | CC_VLS_CASE(32768) | 
|---|
| 330 | CC_VLS_CASE(65536) | 
|---|
| 331 | #undef CC_VLS_CASE | 
|---|
| 332 | } | 
|---|
| 333 | } | 
|---|
| 334 |  | 
|---|
| 335 | return CC_C; | 
|---|
| 336 | } | 
|---|
| 337 |  | 
|---|
| 338 | /// Arrange the argument and result information for a call to an | 
|---|
| 339 | /// unknown C++ non-static member function of the given abstract type. | 
|---|
| 340 | /// (A null RD means we don't have any meaningful "this" argument type, | 
|---|
| 341 | ///  so fall back to a generic pointer type). | 
|---|
| 342 | /// The member function must be an ordinary function, i.e. not a | 
|---|
| 343 | /// constructor or destructor. | 
|---|
| 344 | const CGFunctionInfo & | 
|---|
| 345 | CodeGenTypes::arrangeCXXMethodType(const CXXRecordDecl *RD, | 
|---|
| 346 | const FunctionProtoType *FTP, | 
|---|
| 347 | const CXXMethodDecl *MD) { | 
|---|
| 348 | CanQualTypeList argTypes; | 
|---|
| 349 |  | 
|---|
| 350 | // Add the 'this' pointer. | 
|---|
| 351 | argTypes.push_back(Elt: DeriveThisType(RD, MD)); | 
|---|
| 352 |  | 
|---|
| 353 | return ::arrangeLLVMFunctionInfo( | 
|---|
| 354 | CGT&: *this, /*instanceMethod=*/true, prefix&: argTypes, | 
|---|
| 355 | FTP: FTP->getCanonicalTypeUnqualified().getAs<FunctionProtoType>()); | 
|---|
| 356 | } | 
|---|
| 357 |  | 
|---|
| 358 | /// Set calling convention for CUDA/HIP kernel. | 
|---|
| 359 | static void setCUDAKernelCallingConvention(CanQualType &FTy, CodeGenModule &CGM, | 
|---|
| 360 | const FunctionDecl *FD) { | 
|---|
| 361 | if (FD->hasAttr<CUDAGlobalAttr>()) { | 
|---|
| 362 | const FunctionType *FT = FTy->getAs<FunctionType>(); | 
|---|
| 363 | CGM.getTargetCodeGenInfo().setCUDAKernelCallingConvention(FT); | 
|---|
| 364 | FTy = FT->getCanonicalTypeUnqualified(); | 
|---|
| 365 | } | 
|---|
| 366 | } | 
|---|
| 367 |  | 
|---|
| 368 | /// Arrange the argument and result information for a declaration or | 
|---|
| 369 | /// definition of the given C++ non-static member function.  The | 
|---|
| 370 | /// member function must be an ordinary function, i.e. not a | 
|---|
| 371 | /// constructor or destructor. | 
|---|
| 372 | const CGFunctionInfo & | 
|---|
| 373 | CodeGenTypes::arrangeCXXMethodDeclaration(const CXXMethodDecl *MD) { | 
|---|
| 374 | assert(!isa<CXXConstructorDecl>(MD) && "wrong method for constructors!"); | 
|---|
| 375 | assert(!isa<CXXDestructorDecl>(MD) && "wrong method for destructors!"); | 
|---|
| 376 |  | 
|---|
| 377 | CanQualType FT = GetFormalType(MD).getAs<Type>(); | 
|---|
| 378 | setCUDAKernelCallingConvention(FTy&: FT, CGM, FD: MD); | 
|---|
| 379 | auto prototype = FT.getAs<FunctionProtoType>(); | 
|---|
| 380 |  | 
|---|
| 381 | if (MD->isImplicitObjectMemberFunction()) { | 
|---|
| 382 | // The abstract case is perfectly fine. | 
|---|
| 383 | const CXXRecordDecl *ThisType = | 
|---|
| 384 | getCXXABI().getThisArgumentTypeForMethod(GD: MD); | 
|---|
| 385 | return arrangeCXXMethodType(RD: ThisType, FTP: prototype.getTypePtr(), MD); | 
|---|
| 386 | } | 
|---|
| 387 |  | 
|---|
| 388 | return arrangeFreeFunctionType(FTP: prototype); | 
|---|
| 389 | } | 
|---|
| 390 |  | 
|---|
| 391 | bool CodeGenTypes::inheritingCtorHasParams( | 
|---|
| 392 | const InheritedConstructor &Inherited, CXXCtorType Type) { | 
|---|
| 393 | // Parameters are unnecessary if we're constructing a base class subobject | 
|---|
| 394 | // and the inherited constructor lives in a virtual base. | 
|---|
| 395 | return Type == Ctor_Complete || | 
|---|
| 396 | !Inherited.getShadowDecl()->constructsVirtualBase() || | 
|---|
| 397 | !Target.getCXXABI().hasConstructorVariants(); | 
|---|
| 398 | } | 
|---|
| 399 |  | 
|---|
| 400 | const CGFunctionInfo & | 
|---|
| 401 | CodeGenTypes::arrangeCXXStructorDeclaration(GlobalDecl GD) { | 
|---|
| 402 | auto *MD = cast<CXXMethodDecl>(Val: GD.getDecl()); | 
|---|
| 403 |  | 
|---|
| 404 | CanQualTypeList argTypes; | 
|---|
| 405 | ExtParameterInfoList paramInfos; | 
|---|
| 406 |  | 
|---|
| 407 | const CXXRecordDecl *ThisType = getCXXABI().getThisArgumentTypeForMethod(GD); | 
|---|
| 408 | argTypes.push_back(Elt: DeriveThisType(RD: ThisType, MD)); | 
|---|
| 409 |  | 
|---|
| 410 | bool PassParams = true; | 
|---|
| 411 |  | 
|---|
| 412 | if (auto *CD = dyn_cast<CXXConstructorDecl>(Val: MD)) { | 
|---|
| 413 | // A base class inheriting constructor doesn't get forwarded arguments | 
|---|
| 414 | // needed to construct a virtual base (or base class thereof). | 
|---|
| 415 | if (auto Inherited = CD->getInheritedConstructor()) | 
|---|
| 416 | PassParams = inheritingCtorHasParams(Inherited, Type: GD.getCtorType()); | 
|---|
| 417 | } | 
|---|
| 418 |  | 
|---|
| 419 | CanQual<FunctionProtoType> FTP = GetFormalType(MD); | 
|---|
| 420 |  | 
|---|
| 421 | // Add the formal parameters. | 
|---|
| 422 | if (PassParams) | 
|---|
| 423 | appendParameterTypes(CGT: *this, prefix&: argTypes, paramInfos, FPT: FTP); | 
|---|
| 424 |  | 
|---|
| 425 | CGCXXABI::AddedStructorArgCounts AddedArgs = | 
|---|
| 426 | getCXXABI().buildStructorSignature(GD, ArgTys&: argTypes); | 
|---|
| 427 | if (!paramInfos.empty()) { | 
|---|
| 428 | // Note: prefix implies after the first param. | 
|---|
| 429 | if (AddedArgs.Prefix) | 
|---|
| 430 | paramInfos.insert(I: paramInfos.begin() + 1, NumToInsert: AddedArgs.Prefix, | 
|---|
| 431 | Elt: FunctionProtoType::ExtParameterInfo{}); | 
|---|
| 432 | if (AddedArgs.Suffix) | 
|---|
| 433 | paramInfos.append(NumInputs: AddedArgs.Suffix, | 
|---|
| 434 | Elt: FunctionProtoType::ExtParameterInfo{}); | 
|---|
| 435 | } | 
|---|
| 436 |  | 
|---|
| 437 | RequiredArgs required = | 
|---|
| 438 | (PassParams && MD->isVariadic() ? RequiredArgs(argTypes.size()) | 
|---|
| 439 | : RequiredArgs::All); | 
|---|
| 440 |  | 
|---|
| 441 | FunctionType::ExtInfo extInfo = FTP->getExtInfo(); | 
|---|
| 442 | CanQualType resultType = getCXXABI().HasThisReturn(GD) ? argTypes.front() | 
|---|
| 443 | : getCXXABI().hasMostDerivedReturn(GD) | 
|---|
| 444 | ? CGM.getContext().VoidPtrTy | 
|---|
| 445 | : Context.VoidTy; | 
|---|
| 446 | return arrangeLLVMFunctionInfo(returnType: resultType, opts: FnInfoOpts::IsInstanceMethod, | 
|---|
| 447 | argTypes, info: extInfo, paramInfos, args: required); | 
|---|
| 448 | } | 
|---|
| 449 |  | 
|---|
| 450 | static CanQualTypeList getArgTypesForCall(ASTContext &ctx, | 
|---|
| 451 | const CallArgList &args) { | 
|---|
| 452 | CanQualTypeList argTypes; | 
|---|
| 453 | for (auto &arg : args) | 
|---|
| 454 | argTypes.push_back(Elt: ctx.getCanonicalParamType(T: arg.Ty)); | 
|---|
| 455 | return argTypes; | 
|---|
| 456 | } | 
|---|
| 457 |  | 
|---|
| 458 | static CanQualTypeList getArgTypesForDeclaration(ASTContext &ctx, | 
|---|
| 459 | const FunctionArgList &args) { | 
|---|
| 460 | CanQualTypeList argTypes; | 
|---|
| 461 | for (auto &arg : args) | 
|---|
| 462 | argTypes.push_back(Elt: ctx.getCanonicalParamType(T: arg->getType())); | 
|---|
| 463 | return argTypes; | 
|---|
| 464 | } | 
|---|
| 465 |  | 
|---|
| 466 | static ExtParameterInfoList | 
|---|
| 467 | getExtParameterInfosForCall(const FunctionProtoType *proto, unsigned prefixArgs, | 
|---|
| 468 | unsigned totalArgs) { | 
|---|
| 469 | ExtParameterInfoList result; | 
|---|
| 470 | if (proto->hasExtParameterInfos()) { | 
|---|
| 471 | addExtParameterInfosForCall(paramInfos&: result, proto, prefixArgs, totalArgs); | 
|---|
| 472 | } | 
|---|
| 473 | return result; | 
|---|
| 474 | } | 
|---|
| 475 |  | 
|---|
| 476 | /// Arrange a call to a C++ method, passing the given arguments. | 
|---|
| 477 | /// | 
|---|
| 478 | /// ExtraPrefixArgs is the number of ABI-specific args passed after the `this` | 
|---|
| 479 | /// parameter. | 
|---|
| 480 | /// ExtraSuffixArgs is the number of ABI-specific args passed at the end of | 
|---|
| 481 | /// args. | 
|---|
| 482 | /// PassProtoArgs indicates whether `args` has args for the parameters in the | 
|---|
| 483 | /// given CXXConstructorDecl. | 
|---|
| 484 | const CGFunctionInfo &CodeGenTypes::arrangeCXXConstructorCall( | 
|---|
| 485 | const CallArgList &args, const CXXConstructorDecl *D, CXXCtorType CtorKind, | 
|---|
| 486 | unsigned , unsigned , bool PassProtoArgs) { | 
|---|
| 487 | CanQualTypeList ArgTypes; | 
|---|
| 488 | for (const auto &Arg : args) | 
|---|
| 489 | ArgTypes.push_back(Elt: Context.getCanonicalParamType(T: Arg.Ty)); | 
|---|
| 490 |  | 
|---|
| 491 | // +1 for implicit this, which should always be args[0]. | 
|---|
| 492 | unsigned TotalPrefixArgs = 1 + ExtraPrefixArgs; | 
|---|
| 493 |  | 
|---|
| 494 | CanQual<FunctionProtoType> FPT = GetFormalType(MD: D); | 
|---|
| 495 | RequiredArgs Required = PassProtoArgs | 
|---|
| 496 | ? RequiredArgs::forPrototypePlus( | 
|---|
| 497 | prototype: FPT, additional: TotalPrefixArgs + ExtraSuffixArgs) | 
|---|
| 498 | : RequiredArgs::All; | 
|---|
| 499 |  | 
|---|
| 500 | GlobalDecl GD(D, CtorKind); | 
|---|
| 501 | CanQualType ResultType = getCXXABI().HasThisReturn(GD) ? ArgTypes.front() | 
|---|
| 502 | : getCXXABI().hasMostDerivedReturn(GD) | 
|---|
| 503 | ? CGM.getContext().VoidPtrTy | 
|---|
| 504 | : Context.VoidTy; | 
|---|
| 505 |  | 
|---|
| 506 | FunctionType::ExtInfo Info = FPT->getExtInfo(); | 
|---|
| 507 | ExtParameterInfoList ParamInfos; | 
|---|
| 508 | // If the prototype args are elided, we should only have ABI-specific args, | 
|---|
| 509 | // which never have param info. | 
|---|
| 510 | if (PassProtoArgs && FPT->hasExtParameterInfos()) { | 
|---|
| 511 | // ABI-specific suffix arguments are treated the same as variadic arguments. | 
|---|
| 512 | addExtParameterInfosForCall(paramInfos&: ParamInfos, proto: FPT.getTypePtr(), prefixArgs: TotalPrefixArgs, | 
|---|
| 513 | totalArgs: ArgTypes.size()); | 
|---|
| 514 | } | 
|---|
| 515 |  | 
|---|
| 516 | return arrangeLLVMFunctionInfo(returnType: ResultType, opts: FnInfoOpts::IsInstanceMethod, | 
|---|
| 517 | argTypes: ArgTypes, info: Info, paramInfos: ParamInfos, args: Required); | 
|---|
| 518 | } | 
|---|
| 519 |  | 
|---|
| 520 | /// Arrange the argument and result information for the declaration or | 
|---|
| 521 | /// definition of the given function. | 
|---|
| 522 | const CGFunctionInfo & | 
|---|
| 523 | CodeGenTypes::arrangeFunctionDeclaration(const GlobalDecl GD) { | 
|---|
| 524 | const FunctionDecl *FD = cast<FunctionDecl>(Val: GD.getDecl()); | 
|---|
| 525 | if (const CXXMethodDecl *MD = dyn_cast<CXXMethodDecl>(Val: FD)) | 
|---|
| 526 | if (MD->isImplicitObjectMemberFunction()) | 
|---|
| 527 | return arrangeCXXMethodDeclaration(MD); | 
|---|
| 528 |  | 
|---|
| 529 | CanQualType FTy = FD->getType()->getCanonicalTypeUnqualified(); | 
|---|
| 530 |  | 
|---|
| 531 | assert(isa<FunctionType>(FTy)); | 
|---|
| 532 | setCUDAKernelCallingConvention(FTy, CGM, FD); | 
|---|
| 533 |  | 
|---|
| 534 | if (DeviceKernelAttr::isOpenCLSpelling(A: FD->getAttr<DeviceKernelAttr>()) && | 
|---|
| 535 | GD.getKernelReferenceKind() == KernelReferenceKind::Stub) { | 
|---|
| 536 | const FunctionType *FT = FTy->getAs<FunctionType>(); | 
|---|
| 537 | CGM.getTargetCodeGenInfo().setOCLKernelStubCallingConvention(FT); | 
|---|
| 538 | FTy = FT->getCanonicalTypeUnqualified(); | 
|---|
| 539 | } | 
|---|
| 540 |  | 
|---|
| 541 | // When declaring a function without a prototype, always use a | 
|---|
| 542 | // non-variadic type. | 
|---|
| 543 | if (CanQual<FunctionNoProtoType> noProto = FTy.getAs<FunctionNoProtoType>()) { | 
|---|
| 544 | return arrangeLLVMFunctionInfo(returnType: noProto->getReturnType(), opts: FnInfoOpts::None, | 
|---|
| 545 | argTypes: {}, info: noProto->getExtInfo(), paramInfos: {}, | 
|---|
| 546 | args: RequiredArgs::All); | 
|---|
| 547 | } | 
|---|
| 548 |  | 
|---|
| 549 | return arrangeFreeFunctionType(FTP: FTy.castAs<FunctionProtoType>()); | 
|---|
| 550 | } | 
|---|
| 551 |  | 
|---|
| 552 | /// Arrange the argument and result information for the declaration or | 
|---|
| 553 | /// definition of an Objective-C method. | 
|---|
| 554 | const CGFunctionInfo & | 
|---|
| 555 | CodeGenTypes::arrangeObjCMethodDeclaration(const ObjCMethodDecl *MD) { | 
|---|
| 556 | // It happens that this is the same as a call with no optional | 
|---|
| 557 | // arguments, except also using the formal 'self' type. | 
|---|
| 558 | return arrangeObjCMessageSendSignature(MD, receiverType: MD->getSelfDecl()->getType()); | 
|---|
| 559 | } | 
|---|
| 560 |  | 
|---|
| 561 | /// Arrange the argument and result information for the function type | 
|---|
| 562 | /// through which to perform a send to the given Objective-C method, | 
|---|
| 563 | /// using the given receiver type.  The receiver type is not always | 
|---|
| 564 | /// the 'self' type of the method or even an Objective-C pointer type. | 
|---|
| 565 | /// This is *not* the right method for actually performing such a | 
|---|
| 566 | /// message send, due to the possibility of optional arguments. | 
|---|
| 567 | const CGFunctionInfo & | 
|---|
| 568 | CodeGenTypes::arrangeObjCMessageSendSignature(const ObjCMethodDecl *MD, | 
|---|
| 569 | QualType receiverType) { | 
|---|
| 570 | CanQualTypeList argTys; | 
|---|
| 571 | ExtParameterInfoList extParamInfos(MD->isDirectMethod() ? 1 : 2); | 
|---|
| 572 | argTys.push_back(Elt: Context.getCanonicalParamType(T: receiverType)); | 
|---|
| 573 | if (!MD->isDirectMethod()) | 
|---|
| 574 | argTys.push_back(Elt: Context.getCanonicalParamType(T: Context.getObjCSelType())); | 
|---|
| 575 | for (const auto *I : MD->parameters()) { | 
|---|
| 576 | argTys.push_back(Elt: Context.getCanonicalParamType(T: I->getType())); | 
|---|
| 577 | auto extParamInfo = FunctionProtoType::ExtParameterInfo().withIsNoEscape( | 
|---|
| 578 | NoEscape: I->hasAttr<NoEscapeAttr>()); | 
|---|
| 579 | extParamInfos.push_back(Elt: extParamInfo); | 
|---|
| 580 | } | 
|---|
| 581 |  | 
|---|
| 582 | FunctionType::ExtInfo einfo; | 
|---|
| 583 | bool IsTargetDefaultMSABI = | 
|---|
| 584 | getContext().getTargetInfo().getTriple().isOSWindows() || | 
|---|
| 585 | getContext().getTargetInfo().getTriple().isUEFI(); | 
|---|
| 586 | einfo = einfo.withCallingConv( | 
|---|
| 587 | cc: getCallingConventionForDecl(D: MD, IsTargetDefaultMSABI)); | 
|---|
| 588 |  | 
|---|
| 589 | if (getContext().getLangOpts().ObjCAutoRefCount && | 
|---|
| 590 | MD->hasAttr<NSReturnsRetainedAttr>()) | 
|---|
| 591 | einfo = einfo.withProducesResult(producesResult: true); | 
|---|
| 592 |  | 
|---|
| 593 | RequiredArgs required = | 
|---|
| 594 | (MD->isVariadic() ? RequiredArgs(argTys.size()) : RequiredArgs::All); | 
|---|
| 595 |  | 
|---|
| 596 | return arrangeLLVMFunctionInfo(returnType: GetReturnType(RetTy: MD->getReturnType()), | 
|---|
| 597 | opts: FnInfoOpts::None, argTypes: argTys, info: einfo, paramInfos: extParamInfos, | 
|---|
| 598 | args: required); | 
|---|
| 599 | } | 
|---|
| 600 |  | 
|---|
| 601 | const CGFunctionInfo & | 
|---|
| 602 | CodeGenTypes::arrangeUnprototypedObjCMessageSend(QualType returnType, | 
|---|
| 603 | const CallArgList &args) { | 
|---|
| 604 | CanQualTypeList argTypes = getArgTypesForCall(ctx&: Context, args); | 
|---|
| 605 | FunctionType::ExtInfo einfo; | 
|---|
| 606 |  | 
|---|
| 607 | return arrangeLLVMFunctionInfo(returnType: GetReturnType(RetTy: returnType), opts: FnInfoOpts::None, | 
|---|
| 608 | argTypes, info: einfo, paramInfos: {}, args: RequiredArgs::All); | 
|---|
| 609 | } | 
|---|
| 610 |  | 
|---|
| 611 | const CGFunctionInfo &CodeGenTypes::arrangeGlobalDeclaration(GlobalDecl GD) { | 
|---|
| 612 | // FIXME: Do we need to handle ObjCMethodDecl? | 
|---|
| 613 | if (isa<CXXConstructorDecl>(Val: GD.getDecl()) || | 
|---|
| 614 | isa<CXXDestructorDecl>(Val: GD.getDecl())) | 
|---|
| 615 | return arrangeCXXStructorDeclaration(GD); | 
|---|
| 616 |  | 
|---|
| 617 | return arrangeFunctionDeclaration(GD); | 
|---|
| 618 | } | 
|---|
| 619 |  | 
|---|
| 620 | /// Arrange a thunk that takes 'this' as the first parameter followed by | 
|---|
| 621 | /// varargs.  Return a void pointer, regardless of the actual return type. | 
|---|
| 622 | /// The body of the thunk will end in a musttail call to a function of the | 
|---|
| 623 | /// correct type, and the caller will bitcast the function to the correct | 
|---|
| 624 | /// prototype. | 
|---|
| 625 | const CGFunctionInfo & | 
|---|
| 626 | CodeGenTypes::arrangeUnprototypedMustTailThunk(const CXXMethodDecl *MD) { | 
|---|
| 627 | assert(MD->isVirtual() && "only methods have thunks"); | 
|---|
| 628 | CanQual<FunctionProtoType> FTP = GetFormalType(MD); | 
|---|
| 629 | CanQualType ArgTys[] = {DeriveThisType(RD: MD->getParent(), MD)}; | 
|---|
| 630 | return arrangeLLVMFunctionInfo(returnType: Context.VoidTy, opts: FnInfoOpts::None, argTypes: ArgTys, | 
|---|
| 631 | info: FTP->getExtInfo(), paramInfos: {}, args: RequiredArgs(1)); | 
|---|
| 632 | } | 
|---|
| 633 |  | 
|---|
| 634 | const CGFunctionInfo & | 
|---|
| 635 | CodeGenTypes::arrangeMSCtorClosure(const CXXConstructorDecl *CD, | 
|---|
| 636 | CXXCtorType CT) { | 
|---|
| 637 | assert(CT == Ctor_CopyingClosure || CT == Ctor_DefaultClosure); | 
|---|
| 638 |  | 
|---|
| 639 | CanQual<FunctionProtoType> FTP = GetFormalType(MD: CD); | 
|---|
| 640 | SmallVector<CanQualType, 2> ArgTys; | 
|---|
| 641 | const CXXRecordDecl *RD = CD->getParent(); | 
|---|
| 642 | ArgTys.push_back(Elt: DeriveThisType(RD, MD: CD)); | 
|---|
| 643 | if (CT == Ctor_CopyingClosure) | 
|---|
| 644 | ArgTys.push_back(Elt: *FTP->param_type_begin()); | 
|---|
| 645 | if (RD->getNumVBases() > 0) | 
|---|
| 646 | ArgTys.push_back(Elt: Context.IntTy); | 
|---|
| 647 | CallingConv CC = Context.getDefaultCallingConvention( | 
|---|
| 648 | /*IsVariadic=*/false, /*IsCXXMethod=*/true); | 
|---|
| 649 | return arrangeLLVMFunctionInfo(returnType: Context.VoidTy, opts: FnInfoOpts::IsInstanceMethod, | 
|---|
| 650 | argTypes: ArgTys, info: FunctionType::ExtInfo(CC), paramInfos: {}, | 
|---|
| 651 | args: RequiredArgs::All); | 
|---|
| 652 | } | 
|---|
| 653 |  | 
|---|
| 654 | /// Arrange a call as unto a free function, except possibly with an | 
|---|
| 655 | /// additional number of formal parameters considered required. | 
|---|
| 656 | static const CGFunctionInfo & | 
|---|
| 657 | arrangeFreeFunctionLikeCall(CodeGenTypes &CGT, CodeGenModule &CGM, | 
|---|
| 658 | const CallArgList &args, const FunctionType *fnType, | 
|---|
| 659 | unsigned , bool chainCall) { | 
|---|
| 660 | assert(args.size() >= numExtraRequiredArgs); | 
|---|
| 661 |  | 
|---|
| 662 | ExtParameterInfoList paramInfos; | 
|---|
| 663 |  | 
|---|
| 664 | // In most cases, there are no optional arguments. | 
|---|
| 665 | RequiredArgs required = RequiredArgs::All; | 
|---|
| 666 |  | 
|---|
| 667 | // If we have a variadic prototype, the required arguments are the | 
|---|
| 668 | // extra prefix plus the arguments in the prototype. | 
|---|
| 669 | if (const FunctionProtoType *proto = dyn_cast<FunctionProtoType>(Val: fnType)) { | 
|---|
| 670 | if (proto->isVariadic()) | 
|---|
| 671 | required = RequiredArgs::forPrototypePlus(prototype: proto, additional: numExtraRequiredArgs); | 
|---|
| 672 |  | 
|---|
| 673 | if (proto->hasExtParameterInfos()) | 
|---|
| 674 | addExtParameterInfosForCall(paramInfos, proto, prefixArgs: numExtraRequiredArgs, | 
|---|
| 675 | totalArgs: args.size()); | 
|---|
| 676 |  | 
|---|
| 677 | // If we don't have a prototype at all, but we're supposed to | 
|---|
| 678 | // explicitly use the variadic convention for unprototyped calls, | 
|---|
| 679 | // treat all of the arguments as required but preserve the nominal | 
|---|
| 680 | // possibility of variadics. | 
|---|
| 681 | } else if (CGM.getTargetCodeGenInfo().isNoProtoCallVariadic( | 
|---|
| 682 | args, fnType: cast<FunctionNoProtoType>(Val: fnType))) { | 
|---|
| 683 | required = RequiredArgs(args.size()); | 
|---|
| 684 | } | 
|---|
| 685 |  | 
|---|
| 686 | CanQualTypeList argTypes; | 
|---|
| 687 | for (const auto &arg : args) | 
|---|
| 688 | argTypes.push_back(Elt: CGT.getContext().getCanonicalParamType(T: arg.Ty)); | 
|---|
| 689 | FnInfoOpts opts = chainCall ? FnInfoOpts::IsChainCall : FnInfoOpts::None; | 
|---|
| 690 | return CGT.arrangeLLVMFunctionInfo(returnType: GetReturnType(RetTy: fnType->getReturnType()), | 
|---|
| 691 | opts, argTypes, info: fnType->getExtInfo(), | 
|---|
| 692 | paramInfos, args: required); | 
|---|
| 693 | } | 
|---|
| 694 |  | 
|---|
| 695 | /// Figure out the rules for calling a function with the given formal | 
|---|
| 696 | /// type using the given arguments.  The arguments are necessary | 
|---|
| 697 | /// because the function might be unprototyped, in which case it's | 
|---|
| 698 | /// target-dependent in crazy ways. | 
|---|
| 699 | const CGFunctionInfo &CodeGenTypes::arrangeFreeFunctionCall( | 
|---|
| 700 | const CallArgList &args, const FunctionType *fnType, bool chainCall) { | 
|---|
| 701 | return arrangeFreeFunctionLikeCall(CGT&: *this, CGM, args, fnType, | 
|---|
| 702 | numExtraRequiredArgs: chainCall ? 1 : 0, chainCall); | 
|---|
| 703 | } | 
|---|
| 704 |  | 
|---|
| 705 | /// A block function is essentially a free function with an | 
|---|
| 706 | /// extra implicit argument. | 
|---|
| 707 | const CGFunctionInfo & | 
|---|
| 708 | CodeGenTypes::arrangeBlockFunctionCall(const CallArgList &args, | 
|---|
| 709 | const FunctionType *fnType) { | 
|---|
| 710 | return arrangeFreeFunctionLikeCall(CGT&: *this, CGM, args, fnType, numExtraRequiredArgs: 1, | 
|---|
| 711 | /*chainCall=*/false); | 
|---|
| 712 | } | 
|---|
| 713 |  | 
|---|
| 714 | const CGFunctionInfo & | 
|---|
| 715 | CodeGenTypes::arrangeBlockFunctionDeclaration(const FunctionProtoType *proto, | 
|---|
| 716 | const FunctionArgList ¶ms) { | 
|---|
| 717 | ExtParameterInfoList paramInfos = | 
|---|
| 718 | getExtParameterInfosForCall(proto, prefixArgs: 1, totalArgs: params.size()); | 
|---|
| 719 | CanQualTypeList argTypes = getArgTypesForDeclaration(ctx&: Context, args: params); | 
|---|
| 720 |  | 
|---|
| 721 | return arrangeLLVMFunctionInfo(returnType: GetReturnType(RetTy: proto->getReturnType()), | 
|---|
| 722 | opts: FnInfoOpts::None, argTypes, | 
|---|
| 723 | info: proto->getExtInfo(), paramInfos, | 
|---|
| 724 | args: RequiredArgs::forPrototypePlus(prototype: proto, additional: 1)); | 
|---|
| 725 | } | 
|---|
| 726 |  | 
|---|
| 727 | const CGFunctionInfo & | 
|---|
| 728 | CodeGenTypes::arrangeBuiltinFunctionCall(QualType resultType, | 
|---|
| 729 | const CallArgList &args) { | 
|---|
| 730 | CanQualTypeList argTypes; | 
|---|
| 731 | for (const auto &Arg : args) | 
|---|
| 732 | argTypes.push_back(Elt: Context.getCanonicalParamType(T: Arg.Ty)); | 
|---|
| 733 | return arrangeLLVMFunctionInfo(returnType: GetReturnType(RetTy: resultType), opts: FnInfoOpts::None, | 
|---|
| 734 | argTypes, info: FunctionType::ExtInfo(), | 
|---|
| 735 | /*paramInfos=*/{}, args: RequiredArgs::All); | 
|---|
| 736 | } | 
|---|
| 737 |  | 
|---|
| 738 | const CGFunctionInfo & | 
|---|
| 739 | CodeGenTypes::arrangeBuiltinFunctionDeclaration(QualType resultType, | 
|---|
| 740 | const FunctionArgList &args) { | 
|---|
| 741 | CanQualTypeList argTypes = getArgTypesForDeclaration(ctx&: Context, args); | 
|---|
| 742 |  | 
|---|
| 743 | return arrangeLLVMFunctionInfo(returnType: GetReturnType(RetTy: resultType), opts: FnInfoOpts::None, | 
|---|
| 744 | argTypes, info: FunctionType::ExtInfo(), paramInfos: {}, | 
|---|
| 745 | args: RequiredArgs::All); | 
|---|
| 746 | } | 
|---|
| 747 |  | 
|---|
| 748 | const CGFunctionInfo &CodeGenTypes::arrangeBuiltinFunctionDeclaration( | 
|---|
| 749 | CanQualType resultType, ArrayRef<CanQualType> argTypes) { | 
|---|
| 750 | return arrangeLLVMFunctionInfo(returnType: resultType, opts: FnInfoOpts::None, argTypes, | 
|---|
| 751 | info: FunctionType::ExtInfo(), paramInfos: {}, | 
|---|
| 752 | args: RequiredArgs::All); | 
|---|
| 753 | } | 
|---|
| 754 |  | 
|---|
| 755 | const CGFunctionInfo & | 
|---|
| 756 | CodeGenTypes::arrangeSYCLKernelCallerDeclaration(QualType resultType, | 
|---|
| 757 | const FunctionArgList &args) { | 
|---|
| 758 | CanQualTypeList argTypes = getArgTypesForDeclaration(ctx&: Context, args); | 
|---|
| 759 |  | 
|---|
| 760 | return arrangeLLVMFunctionInfo(returnType: GetReturnType(RetTy: resultType), opts: FnInfoOpts::None, | 
|---|
| 761 | argTypes, | 
|---|
| 762 | info: FunctionType::ExtInfo(CC_DeviceKernel), | 
|---|
| 763 | /*paramInfos=*/{}, args: RequiredArgs::All); | 
|---|
| 764 | } | 
|---|
| 765 |  | 
|---|
| 766 | /// Arrange a call to a C++ method, passing the given arguments. | 
|---|
| 767 | /// | 
|---|
| 768 | /// numPrefixArgs is the number of ABI-specific prefix arguments we have. It | 
|---|
| 769 | /// does not count `this`. | 
|---|
| 770 | const CGFunctionInfo &CodeGenTypes::arrangeCXXMethodCall( | 
|---|
| 771 | const CallArgList &args, const FunctionProtoType *proto, | 
|---|
| 772 | RequiredArgs required, unsigned numPrefixArgs) { | 
|---|
| 773 | assert(numPrefixArgs + 1 <= args.size() && | 
|---|
| 774 | "Emitting a call with less args than the required prefix?"); | 
|---|
| 775 | // Add one to account for `this`. It's a bit awkward here, but we don't count | 
|---|
| 776 | // `this` in similar places elsewhere. | 
|---|
| 777 | ExtParameterInfoList paramInfos = | 
|---|
| 778 | getExtParameterInfosForCall(proto, prefixArgs: numPrefixArgs + 1, totalArgs: args.size()); | 
|---|
| 779 |  | 
|---|
| 780 | CanQualTypeList argTypes = getArgTypesForCall(ctx&: Context, args); | 
|---|
| 781 |  | 
|---|
| 782 | FunctionType::ExtInfo info = proto->getExtInfo(); | 
|---|
| 783 | return arrangeLLVMFunctionInfo(returnType: GetReturnType(RetTy: proto->getReturnType()), | 
|---|
| 784 | opts: FnInfoOpts::IsInstanceMethod, argTypes, info, | 
|---|
| 785 | paramInfos, args: required); | 
|---|
| 786 | } | 
|---|
| 787 |  | 
|---|
| 788 | const CGFunctionInfo &CodeGenTypes::arrangeNullaryFunction() { | 
|---|
| 789 | return arrangeLLVMFunctionInfo(returnType: getContext().VoidTy, opts: FnInfoOpts::None, argTypes: {}, | 
|---|
| 790 | info: FunctionType::ExtInfo(), paramInfos: {}, | 
|---|
| 791 | args: RequiredArgs::All); | 
|---|
| 792 | } | 
|---|
| 793 |  | 
|---|
| 794 | const CGFunctionInfo &CodeGenTypes::arrangeCall(const CGFunctionInfo &signature, | 
|---|
| 795 | const CallArgList &args) { | 
|---|
| 796 | assert(signature.arg_size() <= args.size()); | 
|---|
| 797 | if (signature.arg_size() == args.size()) | 
|---|
| 798 | return signature; | 
|---|
| 799 |  | 
|---|
| 800 | ExtParameterInfoList paramInfos; | 
|---|
| 801 | auto sigParamInfos = signature.getExtParameterInfos(); | 
|---|
| 802 | if (!sigParamInfos.empty()) { | 
|---|
| 803 | paramInfos.append(in_start: sigParamInfos.begin(), in_end: sigParamInfos.end()); | 
|---|
| 804 | paramInfos.resize(N: args.size()); | 
|---|
| 805 | } | 
|---|
| 806 |  | 
|---|
| 807 | CanQualTypeList argTypes = getArgTypesForCall(ctx&: Context, args); | 
|---|
| 808 |  | 
|---|
| 809 | assert(signature.getRequiredArgs().allowsOptionalArgs()); | 
|---|
| 810 | FnInfoOpts opts = FnInfoOpts::None; | 
|---|
| 811 | if (signature.isInstanceMethod()) | 
|---|
| 812 | opts |= FnInfoOpts::IsInstanceMethod; | 
|---|
| 813 | if (signature.isChainCall()) | 
|---|
| 814 | opts |= FnInfoOpts::IsChainCall; | 
|---|
| 815 | if (signature.isDelegateCall()) | 
|---|
| 816 | opts |= FnInfoOpts::IsDelegateCall; | 
|---|
| 817 | return arrangeLLVMFunctionInfo(returnType: signature.getReturnType(), opts, argTypes, | 
|---|
| 818 | info: signature.getExtInfo(), paramInfos, | 
|---|
| 819 | args: signature.getRequiredArgs()); | 
|---|
| 820 | } | 
|---|
| 821 |  | 
|---|
| 822 | namespace clang { | 
|---|
| 823 | namespace CodeGen { | 
|---|
| 824 | void computeSPIRKernelABIInfo(CodeGenModule &CGM, CGFunctionInfo &FI); | 
|---|
| 825 | } | 
|---|
| 826 | } // namespace clang | 
|---|
| 827 |  | 
|---|
| 828 | /// Arrange the argument and result information for an abstract value | 
|---|
| 829 | /// of a given function type.  This is the method which all of the | 
|---|
| 830 | /// above functions ultimately defer to. | 
|---|
| 831 | const CGFunctionInfo &CodeGenTypes::arrangeLLVMFunctionInfo( | 
|---|
| 832 | CanQualType resultType, FnInfoOpts opts, ArrayRef<CanQualType> argTypes, | 
|---|
| 833 | FunctionType::ExtInfo info, | 
|---|
| 834 | ArrayRef<FunctionProtoType::ExtParameterInfo> paramInfos, | 
|---|
| 835 | RequiredArgs required) { | 
|---|
| 836 | assert(llvm::all_of(argTypes, | 
|---|
| 837 | [](CanQualType T) { return T.isCanonicalAsParam(); })); | 
|---|
| 838 |  | 
|---|
| 839 | // Lookup or create unique function info. | 
|---|
| 840 | llvm::FoldingSetNodeID ID; | 
|---|
| 841 | bool isInstanceMethod = | 
|---|
| 842 | (opts & FnInfoOpts::IsInstanceMethod) == FnInfoOpts::IsInstanceMethod; | 
|---|
| 843 | bool isChainCall = | 
|---|
| 844 | (opts & FnInfoOpts::IsChainCall) == FnInfoOpts::IsChainCall; | 
|---|
| 845 | bool isDelegateCall = | 
|---|
| 846 | (opts & FnInfoOpts::IsDelegateCall) == FnInfoOpts::IsDelegateCall; | 
|---|
| 847 | CGFunctionInfo::Profile(ID, InstanceMethod: isInstanceMethod, ChainCall: isChainCall, IsDelegateCall: isDelegateCall, | 
|---|
| 848 | info, paramInfos, required, resultType, argTypes); | 
|---|
| 849 |  | 
|---|
| 850 | void *insertPos = nullptr; | 
|---|
| 851 | CGFunctionInfo *FI = FunctionInfos.FindNodeOrInsertPos(ID, InsertPos&: insertPos); | 
|---|
| 852 | if (FI) | 
|---|
| 853 | return *FI; | 
|---|
| 854 |  | 
|---|
| 855 | unsigned CC = ClangCallConvToLLVMCallConv(CC: info.getCC()); | 
|---|
| 856 |  | 
|---|
| 857 | // Construct the function info.  We co-allocate the ArgInfos. | 
|---|
| 858 | FI = CGFunctionInfo::create(llvmCC: CC, instanceMethod: isInstanceMethod, chainCall: isChainCall, delegateCall: isDelegateCall, | 
|---|
| 859 | extInfo: info, paramInfos, resultType, argTypes, required); | 
|---|
| 860 | FunctionInfos.InsertNode(N: FI, InsertPos: insertPos); | 
|---|
| 861 |  | 
|---|
| 862 | bool inserted = FunctionsBeingProcessed.insert(Ptr: FI).second; | 
|---|
| 863 | (void)inserted; | 
|---|
| 864 | assert(inserted && "Recursively being processed?"); | 
|---|
| 865 |  | 
|---|
| 866 | // Compute ABI information. | 
|---|
| 867 | if (CC == llvm::CallingConv::SPIR_KERNEL) { | 
|---|
| 868 | // Force target independent argument handling for the host visible | 
|---|
| 869 | // kernel functions. | 
|---|
| 870 | computeSPIRKernelABIInfo(CGM, FI&: *FI); | 
|---|
| 871 | } else if (info.getCC() == CC_Swift || info.getCC() == CC_SwiftAsync) { | 
|---|
| 872 | swiftcall::computeABIInfo(CGM, FI&: *FI); | 
|---|
| 873 | } else { | 
|---|
| 874 | CGM.getABIInfo().computeInfo(FI&: *FI); | 
|---|
| 875 | } | 
|---|
| 876 |  | 
|---|
| 877 | // Loop over all of the computed argument and return value info.  If any of | 
|---|
| 878 | // them are direct or extend without a specified coerce type, specify the | 
|---|
| 879 | // default now. | 
|---|
| 880 | ABIArgInfo &retInfo = FI->getReturnInfo(); | 
|---|
| 881 | if (retInfo.canHaveCoerceToType() && retInfo.getCoerceToType() == nullptr) | 
|---|
| 882 | retInfo.setCoerceToType(ConvertType(T: FI->getReturnType())); | 
|---|
| 883 |  | 
|---|
| 884 | for (auto &I : FI->arguments()) | 
|---|
| 885 | if (I.info.canHaveCoerceToType() && I.info.getCoerceToType() == nullptr) | 
|---|
| 886 | I.info.setCoerceToType(ConvertType(T: I.type)); | 
|---|
| 887 |  | 
|---|
| 888 | bool erased = FunctionsBeingProcessed.erase(Ptr: FI); | 
|---|
| 889 | (void)erased; | 
|---|
| 890 | assert(erased && "Not in set?"); | 
|---|
| 891 |  | 
|---|
| 892 | return *FI; | 
|---|
| 893 | } | 
|---|
| 894 |  | 
|---|
| 895 | CGFunctionInfo *CGFunctionInfo::create(unsigned llvmCC, bool instanceMethod, | 
|---|
| 896 | bool chainCall, bool delegateCall, | 
|---|
| 897 | const FunctionType::ExtInfo &info, | 
|---|
| 898 | ArrayRef<ExtParameterInfo> paramInfos, | 
|---|
| 899 | CanQualType resultType, | 
|---|
| 900 | ArrayRef<CanQualType> argTypes, | 
|---|
| 901 | RequiredArgs required) { | 
|---|
| 902 | assert(paramInfos.empty() || paramInfos.size() == argTypes.size()); | 
|---|
| 903 | assert(!required.allowsOptionalArgs() || | 
|---|
| 904 | required.getNumRequiredArgs() <= argTypes.size()); | 
|---|
| 905 |  | 
|---|
| 906 | void *buffer = operator new(totalSizeToAlloc<ArgInfo, ExtParameterInfo>( | 
|---|
| 907 | Counts: argTypes.size() + 1, Counts: paramInfos.size())); | 
|---|
| 908 |  | 
|---|
| 909 | CGFunctionInfo *FI = new (buffer) CGFunctionInfo(); | 
|---|
| 910 | FI->CallingConvention = llvmCC; | 
|---|
| 911 | FI->EffectiveCallingConvention = llvmCC; | 
|---|
| 912 | FI->ASTCallingConvention = info.getCC(); | 
|---|
| 913 | FI->InstanceMethod = instanceMethod; | 
|---|
| 914 | FI->ChainCall = chainCall; | 
|---|
| 915 | FI->DelegateCall = delegateCall; | 
|---|
| 916 | FI->CmseNSCall = info.getCmseNSCall(); | 
|---|
| 917 | FI->NoReturn = info.getNoReturn(); | 
|---|
| 918 | FI->ReturnsRetained = info.getProducesResult(); | 
|---|
| 919 | FI->NoCallerSavedRegs = info.getNoCallerSavedRegs(); | 
|---|
| 920 | FI->NoCfCheck = info.getNoCfCheck(); | 
|---|
| 921 | FI->Required = required; | 
|---|
| 922 | FI->HasRegParm = info.getHasRegParm(); | 
|---|
| 923 | FI->RegParm = info.getRegParm(); | 
|---|
| 924 | FI->ArgStruct = nullptr; | 
|---|
| 925 | FI->ArgStructAlign = 0; | 
|---|
| 926 | FI->NumArgs = argTypes.size(); | 
|---|
| 927 | FI->HasExtParameterInfos = !paramInfos.empty(); | 
|---|
| 928 | FI->getArgsBuffer()[0].type = resultType; | 
|---|
| 929 | FI->MaxVectorWidth = 0; | 
|---|
| 930 | for (unsigned i = 0, e = argTypes.size(); i != e; ++i) | 
|---|
| 931 | FI->getArgsBuffer()[i + 1].type = argTypes[i]; | 
|---|
| 932 | for (unsigned i = 0, e = paramInfos.size(); i != e; ++i) | 
|---|
| 933 | FI->getExtParameterInfosBuffer()[i] = paramInfos[i]; | 
|---|
| 934 | return FI; | 
|---|
| 935 | } | 
|---|
| 936 |  | 
|---|
| 937 | /***/ | 
|---|
| 938 |  | 
|---|
| 939 | namespace { | 
|---|
| 940 | // ABIArgInfo::Expand implementation. | 
|---|
| 941 |  | 
|---|
| 942 | // Specifies the way QualType passed as ABIArgInfo::Expand is expanded. | 
|---|
| 943 | struct TypeExpansion { | 
|---|
| 944 | enum TypeExpansionKind { | 
|---|
| 945 | // Elements of constant arrays are expanded recursively. | 
|---|
| 946 | TEK_ConstantArray, | 
|---|
| 947 | // Record fields are expanded recursively (but if record is a union, only | 
|---|
| 948 | // the field with the largest size is expanded). | 
|---|
| 949 | TEK_Record, | 
|---|
| 950 | // For complex types, real and imaginary parts are expanded recursively. | 
|---|
| 951 | TEK_Complex, | 
|---|
| 952 | // All other types are not expandable. | 
|---|
| 953 | TEK_None | 
|---|
| 954 | }; | 
|---|
| 955 |  | 
|---|
| 956 | const TypeExpansionKind Kind; | 
|---|
| 957 |  | 
|---|
| 958 | TypeExpansion(TypeExpansionKind K) : Kind(K) {} | 
|---|
| 959 | virtual ~TypeExpansion() {} | 
|---|
| 960 | }; | 
|---|
| 961 |  | 
|---|
| 962 | struct ConstantArrayExpansion : TypeExpansion { | 
|---|
| 963 | QualType EltTy; | 
|---|
| 964 | uint64_t NumElts; | 
|---|
| 965 |  | 
|---|
| 966 | ConstantArrayExpansion(QualType EltTy, uint64_t NumElts) | 
|---|
| 967 | : TypeExpansion(TEK_ConstantArray), EltTy(EltTy), NumElts(NumElts) {} | 
|---|
| 968 | static bool classof(const TypeExpansion *TE) { | 
|---|
| 969 | return TE->Kind == TEK_ConstantArray; | 
|---|
| 970 | } | 
|---|
| 971 | }; | 
|---|
| 972 |  | 
|---|
| 973 | struct RecordExpansion : TypeExpansion { | 
|---|
| 974 | SmallVector<const CXXBaseSpecifier *, 1> Bases; | 
|---|
| 975 |  | 
|---|
| 976 | SmallVector<const FieldDecl *, 1> Fields; | 
|---|
| 977 |  | 
|---|
| 978 | RecordExpansion(SmallVector<const CXXBaseSpecifier *, 1> &&Bases, | 
|---|
| 979 | SmallVector<const FieldDecl *, 1> &&Fields) | 
|---|
| 980 | : TypeExpansion(TEK_Record), Bases(std::move(Bases)), | 
|---|
| 981 | Fields(std::move(Fields)) {} | 
|---|
| 982 | static bool classof(const TypeExpansion *TE) { | 
|---|
| 983 | return TE->Kind == TEK_Record; | 
|---|
| 984 | } | 
|---|
| 985 | }; | 
|---|
| 986 |  | 
|---|
| 987 | struct ComplexExpansion : TypeExpansion { | 
|---|
| 988 | QualType EltTy; | 
|---|
| 989 |  | 
|---|
| 990 | ComplexExpansion(QualType EltTy) : TypeExpansion(TEK_Complex), EltTy(EltTy) {} | 
|---|
| 991 | static bool classof(const TypeExpansion *TE) { | 
|---|
| 992 | return TE->Kind == TEK_Complex; | 
|---|
| 993 | } | 
|---|
| 994 | }; | 
|---|
| 995 |  | 
|---|
| 996 | struct NoExpansion : TypeExpansion { | 
|---|
| 997 | NoExpansion() : TypeExpansion(TEK_None) {} | 
|---|
| 998 | static bool classof(const TypeExpansion *TE) { return TE->Kind == TEK_None; } | 
|---|
| 999 | }; | 
|---|
| 1000 | } // namespace | 
|---|
| 1001 |  | 
|---|
| 1002 | static std::unique_ptr<TypeExpansion> | 
|---|
| 1003 | getTypeExpansion(QualType Ty, const ASTContext &Context) { | 
|---|
| 1004 | if (const ConstantArrayType *AT = Context.getAsConstantArrayType(T: Ty)) { | 
|---|
| 1005 | return std::make_unique<ConstantArrayExpansion>(args: AT->getElementType(), | 
|---|
| 1006 | args: AT->getZExtSize()); | 
|---|
| 1007 | } | 
|---|
| 1008 | if (const RecordType *RT = Ty->getAs<RecordType>()) { | 
|---|
| 1009 | SmallVector<const CXXBaseSpecifier *, 1> Bases; | 
|---|
| 1010 | SmallVector<const FieldDecl *, 1> Fields; | 
|---|
| 1011 | const RecordDecl *RD = RT->getDecl(); | 
|---|
| 1012 | assert(!RD->hasFlexibleArrayMember() && | 
|---|
| 1013 | "Cannot expand structure with flexible array."); | 
|---|
| 1014 | if (RD->isUnion()) { | 
|---|
| 1015 | // Unions can be here only in degenerative cases - all the fields are same | 
|---|
| 1016 | // after flattening. Thus we have to use the "largest" field. | 
|---|
| 1017 | const FieldDecl *LargestFD = nullptr; | 
|---|
| 1018 | CharUnits UnionSize = CharUnits::Zero(); | 
|---|
| 1019 |  | 
|---|
| 1020 | for (const auto *FD : RD->fields()) { | 
|---|
| 1021 | if (FD->isZeroLengthBitField()) | 
|---|
| 1022 | continue; | 
|---|
| 1023 | assert(!FD->isBitField() && | 
|---|
| 1024 | "Cannot expand structure with bit-field members."); | 
|---|
| 1025 | CharUnits FieldSize = Context.getTypeSizeInChars(T: FD->getType()); | 
|---|
| 1026 | if (UnionSize < FieldSize) { | 
|---|
| 1027 | UnionSize = FieldSize; | 
|---|
| 1028 | LargestFD = FD; | 
|---|
| 1029 | } | 
|---|
| 1030 | } | 
|---|
| 1031 | if (LargestFD) | 
|---|
| 1032 | Fields.push_back(Elt: LargestFD); | 
|---|
| 1033 | } else { | 
|---|
| 1034 | if (const auto *CXXRD = dyn_cast<CXXRecordDecl>(Val: RD)) { | 
|---|
| 1035 | assert(!CXXRD->isDynamicClass() && | 
|---|
| 1036 | "cannot expand vtable pointers in dynamic classes"); | 
|---|
| 1037 | llvm::append_range(C&: Bases, R: llvm::make_pointer_range(Range: CXXRD->bases())); | 
|---|
| 1038 | } | 
|---|
| 1039 |  | 
|---|
| 1040 | for (const auto *FD : RD->fields()) { | 
|---|
| 1041 | if (FD->isZeroLengthBitField()) | 
|---|
| 1042 | continue; | 
|---|
| 1043 | assert(!FD->isBitField() && | 
|---|
| 1044 | "Cannot expand structure with bit-field members."); | 
|---|
| 1045 | Fields.push_back(Elt: FD); | 
|---|
| 1046 | } | 
|---|
| 1047 | } | 
|---|
| 1048 | return std::make_unique<RecordExpansion>(args: std::move(Bases), | 
|---|
| 1049 | args: std::move(Fields)); | 
|---|
| 1050 | } | 
|---|
| 1051 | if (const ComplexType *CT = Ty->getAs<ComplexType>()) { | 
|---|
| 1052 | return std::make_unique<ComplexExpansion>(args: CT->getElementType()); | 
|---|
| 1053 | } | 
|---|
| 1054 | return std::make_unique<NoExpansion>(); | 
|---|
| 1055 | } | 
|---|
| 1056 |  | 
|---|
| 1057 | static int getExpansionSize(QualType Ty, const ASTContext &Context) { | 
|---|
| 1058 | auto Exp = getTypeExpansion(Ty, Context); | 
|---|
| 1059 | if (auto CAExp = dyn_cast<ConstantArrayExpansion>(Val: Exp.get())) { | 
|---|
| 1060 | return CAExp->NumElts * getExpansionSize(Ty: CAExp->EltTy, Context); | 
|---|
| 1061 | } | 
|---|
| 1062 | if (auto RExp = dyn_cast<RecordExpansion>(Val: Exp.get())) { | 
|---|
| 1063 | int Res = 0; | 
|---|
| 1064 | for (auto BS : RExp->Bases) | 
|---|
| 1065 | Res += getExpansionSize(Ty: BS->getType(), Context); | 
|---|
| 1066 | for (auto FD : RExp->Fields) | 
|---|
| 1067 | Res += getExpansionSize(Ty: FD->getType(), Context); | 
|---|
| 1068 | return Res; | 
|---|
| 1069 | } | 
|---|
| 1070 | if (isa<ComplexExpansion>(Val: Exp.get())) | 
|---|
| 1071 | return 2; | 
|---|
| 1072 | assert(isa<NoExpansion>(Exp.get())); | 
|---|
| 1073 | return 1; | 
|---|
| 1074 | } | 
|---|
| 1075 |  | 
|---|
| 1076 | void CodeGenTypes::getExpandedTypes( | 
|---|
| 1077 | QualType Ty, SmallVectorImpl<llvm::Type *>::iterator &TI) { | 
|---|
| 1078 | auto Exp = getTypeExpansion(Ty, Context); | 
|---|
| 1079 | if (auto CAExp = dyn_cast<ConstantArrayExpansion>(Val: Exp.get())) { | 
|---|
| 1080 | for (int i = 0, n = CAExp->NumElts; i < n; i++) { | 
|---|
| 1081 | getExpandedTypes(Ty: CAExp->EltTy, TI); | 
|---|
| 1082 | } | 
|---|
| 1083 | } else if (auto RExp = dyn_cast<RecordExpansion>(Val: Exp.get())) { | 
|---|
| 1084 | for (auto BS : RExp->Bases) | 
|---|
| 1085 | getExpandedTypes(Ty: BS->getType(), TI); | 
|---|
| 1086 | for (auto FD : RExp->Fields) | 
|---|
| 1087 | getExpandedTypes(Ty: FD->getType(), TI); | 
|---|
| 1088 | } else if (auto CExp = dyn_cast<ComplexExpansion>(Val: Exp.get())) { | 
|---|
| 1089 | llvm::Type *EltTy = ConvertType(T: CExp->EltTy); | 
|---|
| 1090 | *TI++ = EltTy; | 
|---|
| 1091 | *TI++ = EltTy; | 
|---|
| 1092 | } else { | 
|---|
| 1093 | assert(isa<NoExpansion>(Exp.get())); | 
|---|
| 1094 | *TI++ = ConvertType(T: Ty); | 
|---|
| 1095 | } | 
|---|
| 1096 | } | 
|---|
| 1097 |  | 
|---|
| 1098 | static void forConstantArrayExpansion(CodeGenFunction &CGF, | 
|---|
| 1099 | ConstantArrayExpansion *CAE, | 
|---|
| 1100 | Address BaseAddr, | 
|---|
| 1101 | llvm::function_ref<void(Address)> Fn) { | 
|---|
| 1102 | for (int i = 0, n = CAE->NumElts; i < n; i++) { | 
|---|
| 1103 | Address EltAddr = CGF.Builder.CreateConstGEP2_32(Addr: BaseAddr, Idx0: 0, Idx1: i); | 
|---|
| 1104 | Fn(EltAddr); | 
|---|
| 1105 | } | 
|---|
| 1106 | } | 
|---|
| 1107 |  | 
|---|
| 1108 | void CodeGenFunction::ExpandTypeFromArgs(QualType Ty, LValue LV, | 
|---|
| 1109 | llvm::Function::arg_iterator &AI) { | 
|---|
| 1110 | assert(LV.isSimple() && | 
|---|
| 1111 | "Unexpected non-simple lvalue during struct expansion."); | 
|---|
| 1112 |  | 
|---|
| 1113 | auto Exp = getTypeExpansion(Ty, Context: getContext()); | 
|---|
| 1114 | if (auto CAExp = dyn_cast<ConstantArrayExpansion>(Val: Exp.get())) { | 
|---|
| 1115 | forConstantArrayExpansion( | 
|---|
| 1116 | CGF&: *this, CAE: CAExp, BaseAddr: LV.getAddress(), Fn: [&](Address EltAddr) { | 
|---|
| 1117 | LValue LV = MakeAddrLValue(Addr: EltAddr, T: CAExp->EltTy); | 
|---|
| 1118 | ExpandTypeFromArgs(Ty: CAExp->EltTy, LV, AI); | 
|---|
| 1119 | }); | 
|---|
| 1120 | } else if (auto RExp = dyn_cast<RecordExpansion>(Val: Exp.get())) { | 
|---|
| 1121 | Address This = LV.getAddress(); | 
|---|
| 1122 | for (const CXXBaseSpecifier *BS : RExp->Bases) { | 
|---|
| 1123 | // Perform a single step derived-to-base conversion. | 
|---|
| 1124 | Address Base = | 
|---|
| 1125 | GetAddressOfBaseClass(Value: This, Derived: Ty->getAsCXXRecordDecl(), PathBegin: &BS, PathEnd: &BS + 1, | 
|---|
| 1126 | /*NullCheckValue=*/false, Loc: SourceLocation()); | 
|---|
| 1127 | LValue SubLV = MakeAddrLValue(Addr: Base, T: BS->getType()); | 
|---|
| 1128 |  | 
|---|
| 1129 | // Recurse onto bases. | 
|---|
| 1130 | ExpandTypeFromArgs(Ty: BS->getType(), LV: SubLV, AI); | 
|---|
| 1131 | } | 
|---|
| 1132 | for (auto FD : RExp->Fields) { | 
|---|
| 1133 | // FIXME: What are the right qualifiers here? | 
|---|
| 1134 | LValue SubLV = EmitLValueForFieldInitialization(Base: LV, Field: FD); | 
|---|
| 1135 | ExpandTypeFromArgs(Ty: FD->getType(), LV: SubLV, AI); | 
|---|
| 1136 | } | 
|---|
| 1137 | } else if (isa<ComplexExpansion>(Val: Exp.get())) { | 
|---|
| 1138 | auto realValue = &*AI++; | 
|---|
| 1139 | auto imagValue = &*AI++; | 
|---|
| 1140 | EmitStoreOfComplex(V: ComplexPairTy(realValue, imagValue), dest: LV, /*init*/ isInit: true); | 
|---|
| 1141 | } else { | 
|---|
| 1142 | // Call EmitStoreOfScalar except when the lvalue is a bitfield to emit a | 
|---|
| 1143 | // primitive store. | 
|---|
| 1144 | assert(isa<NoExpansion>(Exp.get())); | 
|---|
| 1145 | llvm::Value *Arg = &*AI++; | 
|---|
| 1146 | if (LV.isBitField()) { | 
|---|
| 1147 | EmitStoreThroughLValue(Src: RValue::get(V: Arg), Dst: LV); | 
|---|
| 1148 | } else { | 
|---|
| 1149 | // TODO: currently there are some places are inconsistent in what LLVM | 
|---|
| 1150 | // pointer type they use (see D118744). Once clang uses opaque pointers | 
|---|
| 1151 | // all LLVM pointer types will be the same and we can remove this check. | 
|---|
| 1152 | if (Arg->getType()->isPointerTy()) { | 
|---|
| 1153 | Address Addr = LV.getAddress(); | 
|---|
| 1154 | Arg = Builder.CreateBitCast(V: Arg, DestTy: Addr.getElementType()); | 
|---|
| 1155 | } | 
|---|
| 1156 | EmitStoreOfScalar(value: Arg, lvalue: LV); | 
|---|
| 1157 | } | 
|---|
| 1158 | } | 
|---|
| 1159 | } | 
|---|
| 1160 |  | 
|---|
| 1161 | void CodeGenFunction::ExpandTypeToArgs( | 
|---|
| 1162 | QualType Ty, CallArg Arg, llvm::FunctionType *IRFuncTy, | 
|---|
| 1163 | SmallVectorImpl<llvm::Value *> &IRCallArgs, unsigned &IRCallArgPos) { | 
|---|
| 1164 | auto Exp = getTypeExpansion(Ty, Context: getContext()); | 
|---|
| 1165 | if (auto CAExp = dyn_cast<ConstantArrayExpansion>(Val: Exp.get())) { | 
|---|
| 1166 | Address Addr = Arg.hasLValue() ? Arg.getKnownLValue().getAddress() | 
|---|
| 1167 | : Arg.getKnownRValue().getAggregateAddress(); | 
|---|
| 1168 | forConstantArrayExpansion(CGF&: *this, CAE: CAExp, BaseAddr: Addr, Fn: [&](Address EltAddr) { | 
|---|
| 1169 | CallArg EltArg = | 
|---|
| 1170 | CallArg(convertTempToRValue(addr: EltAddr, type: CAExp->EltTy, Loc: SourceLocation()), | 
|---|
| 1171 | CAExp->EltTy); | 
|---|
| 1172 | ExpandTypeToArgs(Ty: CAExp->EltTy, Arg: EltArg, IRFuncTy, IRCallArgs, | 
|---|
| 1173 | IRCallArgPos); | 
|---|
| 1174 | }); | 
|---|
| 1175 | } else if (auto RExp = dyn_cast<RecordExpansion>(Val: Exp.get())) { | 
|---|
| 1176 | Address This = Arg.hasLValue() ? Arg.getKnownLValue().getAddress() | 
|---|
| 1177 | : Arg.getKnownRValue().getAggregateAddress(); | 
|---|
| 1178 | for (const CXXBaseSpecifier *BS : RExp->Bases) { | 
|---|
| 1179 | // Perform a single step derived-to-base conversion. | 
|---|
| 1180 | Address Base = | 
|---|
| 1181 | GetAddressOfBaseClass(Value: This, Derived: Ty->getAsCXXRecordDecl(), PathBegin: &BS, PathEnd: &BS + 1, | 
|---|
| 1182 | /*NullCheckValue=*/false, Loc: SourceLocation()); | 
|---|
| 1183 | CallArg BaseArg = CallArg(RValue::getAggregate(addr: Base), BS->getType()); | 
|---|
| 1184 |  | 
|---|
| 1185 | // Recurse onto bases. | 
|---|
| 1186 | ExpandTypeToArgs(Ty: BS->getType(), Arg: BaseArg, IRFuncTy, IRCallArgs, | 
|---|
| 1187 | IRCallArgPos); | 
|---|
| 1188 | } | 
|---|
| 1189 |  | 
|---|
| 1190 | LValue LV = MakeAddrLValue(Addr: This, T: Ty); | 
|---|
| 1191 | for (auto FD : RExp->Fields) { | 
|---|
| 1192 | CallArg FldArg = | 
|---|
| 1193 | CallArg(EmitRValueForField(LV, FD, Loc: SourceLocation()), FD->getType()); | 
|---|
| 1194 | ExpandTypeToArgs(Ty: FD->getType(), Arg: FldArg, IRFuncTy, IRCallArgs, | 
|---|
| 1195 | IRCallArgPos); | 
|---|
| 1196 | } | 
|---|
| 1197 | } else if (isa<ComplexExpansion>(Val: Exp.get())) { | 
|---|
| 1198 | ComplexPairTy CV = Arg.getKnownRValue().getComplexVal(); | 
|---|
| 1199 | IRCallArgs[IRCallArgPos++] = CV.first; | 
|---|
| 1200 | IRCallArgs[IRCallArgPos++] = CV.second; | 
|---|
| 1201 | } else { | 
|---|
| 1202 | assert(isa<NoExpansion>(Exp.get())); | 
|---|
| 1203 | auto RV = Arg.getKnownRValue(); | 
|---|
| 1204 | assert(RV.isScalar() && | 
|---|
| 1205 | "Unexpected non-scalar rvalue during struct expansion."); | 
|---|
| 1206 |  | 
|---|
| 1207 | // Insert a bitcast as needed. | 
|---|
| 1208 | llvm::Value *V = RV.getScalarVal(); | 
|---|
| 1209 | if (IRCallArgPos < IRFuncTy->getNumParams() && | 
|---|
| 1210 | V->getType() != IRFuncTy->getParamType(i: IRCallArgPos)) | 
|---|
| 1211 | V = Builder.CreateBitCast(V, DestTy: IRFuncTy->getParamType(i: IRCallArgPos)); | 
|---|
| 1212 |  | 
|---|
| 1213 | IRCallArgs[IRCallArgPos++] = V; | 
|---|
| 1214 | } | 
|---|
| 1215 | } | 
|---|
| 1216 |  | 
|---|
| 1217 | /// Create a temporary allocation for the purposes of coercion. | 
|---|
| 1218 | static RawAddress CreateTempAllocaForCoercion(CodeGenFunction &CGF, | 
|---|
| 1219 | llvm::Type *Ty, | 
|---|
| 1220 | CharUnits MinAlign, | 
|---|
| 1221 | const Twine &Name = "tmp") { | 
|---|
| 1222 | // Don't use an alignment that's worse than what LLVM would prefer. | 
|---|
| 1223 | auto PrefAlign = CGF.CGM.getDataLayout().getPrefTypeAlign(Ty); | 
|---|
| 1224 | CharUnits Align = std::max(a: MinAlign, b: CharUnits::fromQuantity(Quantity: PrefAlign)); | 
|---|
| 1225 |  | 
|---|
| 1226 | return CGF.CreateTempAlloca(Ty, align: Align, Name: Name + ".coerce"); | 
|---|
| 1227 | } | 
|---|
| 1228 |  | 
|---|
| 1229 | /// EnterStructPointerForCoercedAccess - Given a struct pointer that we are | 
|---|
| 1230 | /// accessing some number of bytes out of it, try to gep into the struct to get | 
|---|
| 1231 | /// at its inner goodness.  Dive as deep as possible without entering an element | 
|---|
| 1232 | /// with an in-memory size smaller than DstSize. | 
|---|
| 1233 | static Address EnterStructPointerForCoercedAccess(Address SrcPtr, | 
|---|
| 1234 | llvm::StructType *SrcSTy, | 
|---|
| 1235 | uint64_t DstSize, | 
|---|
| 1236 | CodeGenFunction &CGF) { | 
|---|
| 1237 | // We can't dive into a zero-element struct. | 
|---|
| 1238 | if (SrcSTy->getNumElements() == 0) | 
|---|
| 1239 | return SrcPtr; | 
|---|
| 1240 |  | 
|---|
| 1241 | llvm::Type *FirstElt = SrcSTy->getElementType(N: 0); | 
|---|
| 1242 |  | 
|---|
| 1243 | // If the first elt is at least as large as what we're looking for, or if the | 
|---|
| 1244 | // first element is the same size as the whole struct, we can enter it. The | 
|---|
| 1245 | // comparison must be made on the store size and not the alloca size. Using | 
|---|
| 1246 | // the alloca size may overstate the size of the load. | 
|---|
| 1247 | uint64_t FirstEltSize = CGF.CGM.getDataLayout().getTypeStoreSize(Ty: FirstElt); | 
|---|
| 1248 | if (FirstEltSize < DstSize && | 
|---|
| 1249 | FirstEltSize < CGF.CGM.getDataLayout().getTypeStoreSize(Ty: SrcSTy)) | 
|---|
| 1250 | return SrcPtr; | 
|---|
| 1251 |  | 
|---|
| 1252 | // GEP into the first element. | 
|---|
| 1253 | SrcPtr = CGF.Builder.CreateStructGEP(Addr: SrcPtr, Index: 0, Name: "coerce.dive"); | 
|---|
| 1254 |  | 
|---|
| 1255 | // If the first element is a struct, recurse. | 
|---|
| 1256 | llvm::Type *SrcTy = SrcPtr.getElementType(); | 
|---|
| 1257 | if (llvm::StructType *SrcSTy = dyn_cast<llvm::StructType>(Val: SrcTy)) | 
|---|
| 1258 | return EnterStructPointerForCoercedAccess(SrcPtr, SrcSTy, DstSize, CGF); | 
|---|
| 1259 |  | 
|---|
| 1260 | return SrcPtr; | 
|---|
| 1261 | } | 
|---|
| 1262 |  | 
|---|
| 1263 | /// CoerceIntOrPtrToIntOrPtr - Convert a value Val to the specific Ty where both | 
|---|
| 1264 | /// are either integers or pointers.  This does a truncation of the value if it | 
|---|
| 1265 | /// is too large or a zero extension if it is too small. | 
|---|
| 1266 | /// | 
|---|
| 1267 | /// This behaves as if the value were coerced through memory, so on big-endian | 
|---|
| 1268 | /// targets the high bits are preserved in a truncation, while little-endian | 
|---|
| 1269 | /// targets preserve the low bits. | 
|---|
| 1270 | static llvm::Value *CoerceIntOrPtrToIntOrPtr(llvm::Value *Val, llvm::Type *Ty, | 
|---|
| 1271 | CodeGenFunction &CGF) { | 
|---|
| 1272 | if (Val->getType() == Ty) | 
|---|
| 1273 | return Val; | 
|---|
| 1274 |  | 
|---|
| 1275 | if (isa<llvm::PointerType>(Val: Val->getType())) { | 
|---|
| 1276 | // If this is Pointer->Pointer avoid conversion to and from int. | 
|---|
| 1277 | if (isa<llvm::PointerType>(Val: Ty)) | 
|---|
| 1278 | return CGF.Builder.CreateBitCast(V: Val, DestTy: Ty, Name: "coerce.val"); | 
|---|
| 1279 |  | 
|---|
| 1280 | // Convert the pointer to an integer so we can play with its width. | 
|---|
| 1281 | Val = CGF.Builder.CreatePtrToInt(V: Val, DestTy: CGF.IntPtrTy, Name: "coerce.val.pi"); | 
|---|
| 1282 | } | 
|---|
| 1283 |  | 
|---|
| 1284 | llvm::Type *DestIntTy = Ty; | 
|---|
| 1285 | if (isa<llvm::PointerType>(Val: DestIntTy)) | 
|---|
| 1286 | DestIntTy = CGF.IntPtrTy; | 
|---|
| 1287 |  | 
|---|
| 1288 | if (Val->getType() != DestIntTy) { | 
|---|
| 1289 | const llvm::DataLayout &DL = CGF.CGM.getDataLayout(); | 
|---|
| 1290 | if (DL.isBigEndian()) { | 
|---|
| 1291 | // Preserve the high bits on big-endian targets. | 
|---|
| 1292 | // That is what memory coercion does. | 
|---|
| 1293 | uint64_t SrcSize = DL.getTypeSizeInBits(Ty: Val->getType()); | 
|---|
| 1294 | uint64_t DstSize = DL.getTypeSizeInBits(Ty: DestIntTy); | 
|---|
| 1295 |  | 
|---|
| 1296 | if (SrcSize > DstSize) { | 
|---|
| 1297 | Val = CGF.Builder.CreateLShr(LHS: Val, RHS: SrcSize - DstSize, Name: "coerce.highbits"); | 
|---|
| 1298 | Val = CGF.Builder.CreateTrunc(V: Val, DestTy: DestIntTy, Name: "coerce.val.ii"); | 
|---|
| 1299 | } else { | 
|---|
| 1300 | Val = CGF.Builder.CreateZExt(V: Val, DestTy: DestIntTy, Name: "coerce.val.ii"); | 
|---|
| 1301 | Val = CGF.Builder.CreateShl(LHS: Val, RHS: DstSize - SrcSize, Name: "coerce.highbits"); | 
|---|
| 1302 | } | 
|---|
| 1303 | } else { | 
|---|
| 1304 | // Little-endian targets preserve the low bits. No shifts required. | 
|---|
| 1305 | Val = CGF.Builder.CreateIntCast(V: Val, DestTy: DestIntTy, isSigned: false, Name: "coerce.val.ii"); | 
|---|
| 1306 | } | 
|---|
| 1307 | } | 
|---|
| 1308 |  | 
|---|
| 1309 | if (isa<llvm::PointerType>(Val: Ty)) | 
|---|
| 1310 | Val = CGF.Builder.CreateIntToPtr(V: Val, DestTy: Ty, Name: "coerce.val.ip"); | 
|---|
| 1311 | return Val; | 
|---|
| 1312 | } | 
|---|
| 1313 |  | 
|---|
| 1314 | /// CreateCoercedLoad - Create a load from \arg SrcPtr interpreted as | 
|---|
| 1315 | /// a pointer to an object of type \arg Ty, known to be aligned to | 
|---|
| 1316 | /// \arg SrcAlign bytes. | 
|---|
| 1317 | /// | 
|---|
| 1318 | /// This safely handles the case when the src type is smaller than the | 
|---|
| 1319 | /// destination type; in this situation the values of bits which not | 
|---|
| 1320 | /// present in the src are undefined. | 
|---|
| 1321 | static llvm::Value *CreateCoercedLoad(Address Src, llvm::Type *Ty, | 
|---|
| 1322 | CodeGenFunction &CGF) { | 
|---|
| 1323 | llvm::Type *SrcTy = Src.getElementType(); | 
|---|
| 1324 |  | 
|---|
| 1325 | // If SrcTy and Ty are the same, just do a load. | 
|---|
| 1326 | if (SrcTy == Ty) | 
|---|
| 1327 | return CGF.Builder.CreateLoad(Addr: Src); | 
|---|
| 1328 |  | 
|---|
| 1329 | llvm::TypeSize DstSize = CGF.CGM.getDataLayout().getTypeAllocSize(Ty); | 
|---|
| 1330 |  | 
|---|
| 1331 | if (llvm::StructType *SrcSTy = dyn_cast<llvm::StructType>(Val: SrcTy)) { | 
|---|
| 1332 | Src = EnterStructPointerForCoercedAccess(SrcPtr: Src, SrcSTy, | 
|---|
| 1333 | DstSize: DstSize.getFixedValue(), CGF); | 
|---|
| 1334 | SrcTy = Src.getElementType(); | 
|---|
| 1335 | } | 
|---|
| 1336 |  | 
|---|
| 1337 | llvm::TypeSize SrcSize = CGF.CGM.getDataLayout().getTypeAllocSize(Ty: SrcTy); | 
|---|
| 1338 |  | 
|---|
| 1339 | // If the source and destination are integer or pointer types, just do an | 
|---|
| 1340 | // extension or truncation to the desired type. | 
|---|
| 1341 | if ((isa<llvm::IntegerType>(Val: Ty) || isa<llvm::PointerType>(Val: Ty)) && | 
|---|
| 1342 | (isa<llvm::IntegerType>(Val: SrcTy) || isa<llvm::PointerType>(Val: SrcTy))) { | 
|---|
| 1343 | llvm::Value *Load = CGF.Builder.CreateLoad(Addr: Src); | 
|---|
| 1344 | return CoerceIntOrPtrToIntOrPtr(Val: Load, Ty, CGF); | 
|---|
| 1345 | } | 
|---|
| 1346 |  | 
|---|
| 1347 | // If load is legal, just bitcast the src pointer. | 
|---|
| 1348 | if (!SrcSize.isScalable() && !DstSize.isScalable() && | 
|---|
| 1349 | SrcSize.getFixedValue() >= DstSize.getFixedValue()) { | 
|---|
| 1350 | // Generally SrcSize is never greater than DstSize, since this means we are | 
|---|
| 1351 | // losing bits. However, this can happen in cases where the structure has | 
|---|
| 1352 | // additional padding, for example due to a user specified alignment. | 
|---|
| 1353 | // | 
|---|
| 1354 | // FIXME: Assert that we aren't truncating non-padding bits when have access | 
|---|
| 1355 | // to that information. | 
|---|
| 1356 | Src = Src.withElementType(ElemTy: Ty); | 
|---|
| 1357 | return CGF.Builder.CreateLoad(Addr: Src); | 
|---|
| 1358 | } | 
|---|
| 1359 |  | 
|---|
| 1360 | // If coercing a fixed vector to a scalable vector for ABI compatibility, and | 
|---|
| 1361 | // the types match, use the llvm.vector.insert intrinsic to perform the | 
|---|
| 1362 | // conversion. | 
|---|
| 1363 | if (auto *ScalableDstTy = dyn_cast<llvm::ScalableVectorType>(Val: Ty)) { | 
|---|
| 1364 | if (auto *FixedSrcTy = dyn_cast<llvm::FixedVectorType>(Val: SrcTy)) { | 
|---|
| 1365 | // If we are casting a fixed i8 vector to a scalable i1 predicate | 
|---|
| 1366 | // vector, use a vector insert and bitcast the result. | 
|---|
| 1367 | if (ScalableDstTy->getElementType()->isIntegerTy(Bitwidth: 1) && | 
|---|
| 1368 | FixedSrcTy->getElementType()->isIntegerTy(Bitwidth: 8)) { | 
|---|
| 1369 | ScalableDstTy = llvm::ScalableVectorType::get( | 
|---|
| 1370 | ElementType: FixedSrcTy->getElementType(), | 
|---|
| 1371 | MinNumElts: llvm::divideCeil( | 
|---|
| 1372 | Numerator: ScalableDstTy->getElementCount().getKnownMinValue(), Denominator: 8)); | 
|---|
| 1373 | } | 
|---|
| 1374 | if (ScalableDstTy->getElementType() == FixedSrcTy->getElementType()) { | 
|---|
| 1375 | auto *Load = CGF.Builder.CreateLoad(Addr: Src); | 
|---|
| 1376 | auto *PoisonVec = llvm::PoisonValue::get(T: ScalableDstTy); | 
|---|
| 1377 | llvm::Value *Result = CGF.Builder.CreateInsertVector( | 
|---|
| 1378 | DstType: ScalableDstTy, SrcVec: PoisonVec, SubVec: Load, Idx: uint64_t(0), Name: "cast.scalable"); | 
|---|
| 1379 | ScalableDstTy = cast<llvm::ScalableVectorType>( | 
|---|
| 1380 | Val: llvm::VectorType::getWithSizeAndScalar(SizeTy: ScalableDstTy, EltTy: Ty)); | 
|---|
| 1381 | if (Result->getType() != ScalableDstTy) | 
|---|
| 1382 | Result = CGF.Builder.CreateBitCast(V: Result, DestTy: ScalableDstTy); | 
|---|
| 1383 | if (Result->getType() != Ty) | 
|---|
| 1384 | Result = CGF.Builder.CreateExtractVector(DstType: Ty, SrcVec: Result, Idx: uint64_t(0)); | 
|---|
| 1385 | return Result; | 
|---|
| 1386 | } | 
|---|
| 1387 | } | 
|---|
| 1388 | } | 
|---|
| 1389 |  | 
|---|
| 1390 | // Otherwise do coercion through memory. This is stupid, but simple. | 
|---|
| 1391 | RawAddress Tmp = | 
|---|
| 1392 | CreateTempAllocaForCoercion(CGF, Ty, MinAlign: Src.getAlignment(), Name: Src.getName()); | 
|---|
| 1393 | CGF.Builder.CreateMemCpy( | 
|---|
| 1394 | Dst: Tmp.getPointer(), DstAlign: Tmp.getAlignment().getAsAlign(), | 
|---|
| 1395 | Src: Src.emitRawPointer(CGF), SrcAlign: Src.getAlignment().getAsAlign(), | 
|---|
| 1396 | Size: llvm::ConstantInt::get(Ty: CGF.IntPtrTy, V: SrcSize.getKnownMinValue())); | 
|---|
| 1397 | return CGF.Builder.CreateLoad(Addr: Tmp); | 
|---|
| 1398 | } | 
|---|
| 1399 |  | 
|---|
| 1400 | void CodeGenFunction::CreateCoercedStore(llvm::Value *Src, Address Dst, | 
|---|
| 1401 | llvm::TypeSize DstSize, | 
|---|
| 1402 | bool DstIsVolatile) { | 
|---|
| 1403 | if (!DstSize) | 
|---|
| 1404 | return; | 
|---|
| 1405 |  | 
|---|
| 1406 | llvm::Type *SrcTy = Src->getType(); | 
|---|
| 1407 | llvm::TypeSize SrcSize = CGM.getDataLayout().getTypeAllocSize(Ty: SrcTy); | 
|---|
| 1408 |  | 
|---|
| 1409 | // GEP into structs to try to make types match. | 
|---|
| 1410 | // FIXME: This isn't really that useful with opaque types, but it impacts a | 
|---|
| 1411 | // lot of regression tests. | 
|---|
| 1412 | if (SrcTy != Dst.getElementType()) { | 
|---|
| 1413 | if (llvm::StructType *DstSTy = | 
|---|
| 1414 | dyn_cast<llvm::StructType>(Val: Dst.getElementType())) { | 
|---|
| 1415 | assert(!SrcSize.isScalable()); | 
|---|
| 1416 | Dst = EnterStructPointerForCoercedAccess(SrcPtr: Dst, SrcSTy: DstSTy, | 
|---|
| 1417 | DstSize: SrcSize.getFixedValue(), CGF&: *this); | 
|---|
| 1418 | } | 
|---|
| 1419 | } | 
|---|
| 1420 |  | 
|---|
| 1421 | if (SrcSize.isScalable() || SrcSize <= DstSize) { | 
|---|
| 1422 | if (SrcTy->isIntegerTy() && Dst.getElementType()->isPointerTy() && | 
|---|
| 1423 | SrcSize == CGM.getDataLayout().getTypeAllocSize(Ty: Dst.getElementType())) { | 
|---|
| 1424 | // If the value is supposed to be a pointer, convert it before storing it. | 
|---|
| 1425 | Src = CoerceIntOrPtrToIntOrPtr(Val: Src, Ty: Dst.getElementType(), CGF&: *this); | 
|---|
| 1426 | auto *I = Builder.CreateStore(Val: Src, Addr: Dst, IsVolatile: DstIsVolatile); | 
|---|
| 1427 | addInstToCurrentSourceAtom(KeyInstruction: I, Backup: Src); | 
|---|
| 1428 | } else if (llvm::StructType *STy = | 
|---|
| 1429 | dyn_cast<llvm::StructType>(Val: Src->getType())) { | 
|---|
| 1430 | // Prefer scalar stores to first-class aggregate stores. | 
|---|
| 1431 | Dst = Dst.withElementType(ElemTy: SrcTy); | 
|---|
| 1432 | for (unsigned i = 0, e = STy->getNumElements(); i != e; ++i) { | 
|---|
| 1433 | Address EltPtr = Builder.CreateStructGEP(Addr: Dst, Index: i); | 
|---|
| 1434 | llvm::Value *Elt = Builder.CreateExtractValue(Agg: Src, Idxs: i); | 
|---|
| 1435 | auto *I = Builder.CreateStore(Val: Elt, Addr: EltPtr, IsVolatile: DstIsVolatile); | 
|---|
| 1436 | addInstToCurrentSourceAtom(KeyInstruction: I, Backup: Elt); | 
|---|
| 1437 | } | 
|---|
| 1438 | } else { | 
|---|
| 1439 | auto *I = | 
|---|
| 1440 | Builder.CreateStore(Val: Src, Addr: Dst.withElementType(ElemTy: SrcTy), IsVolatile: DstIsVolatile); | 
|---|
| 1441 | addInstToCurrentSourceAtom(KeyInstruction: I, Backup: Src); | 
|---|
| 1442 | } | 
|---|
| 1443 | } else if (SrcTy->isIntegerTy()) { | 
|---|
| 1444 | // If the source is a simple integer, coerce it directly. | 
|---|
| 1445 | llvm::Type *DstIntTy = Builder.getIntNTy(N: DstSize.getFixedValue() * 8); | 
|---|
| 1446 | Src = CoerceIntOrPtrToIntOrPtr(Val: Src, Ty: DstIntTy, CGF&: *this); | 
|---|
| 1447 | auto *I = | 
|---|
| 1448 | Builder.CreateStore(Val: Src, Addr: Dst.withElementType(ElemTy: DstIntTy), IsVolatile: DstIsVolatile); | 
|---|
| 1449 | addInstToCurrentSourceAtom(KeyInstruction: I, Backup: Src); | 
|---|
| 1450 | } else { | 
|---|
| 1451 | // Otherwise do coercion through memory. This is stupid, but | 
|---|
| 1452 | // simple. | 
|---|
| 1453 |  | 
|---|
| 1454 | // Generally SrcSize is never greater than DstSize, since this means we are | 
|---|
| 1455 | // losing bits. However, this can happen in cases where the structure has | 
|---|
| 1456 | // additional padding, for example due to a user specified alignment. | 
|---|
| 1457 | // | 
|---|
| 1458 | // FIXME: Assert that we aren't truncating non-padding bits when have access | 
|---|
| 1459 | // to that information. | 
|---|
| 1460 | RawAddress Tmp = | 
|---|
| 1461 | CreateTempAllocaForCoercion(CGF&: *this, Ty: SrcTy, MinAlign: Dst.getAlignment()); | 
|---|
| 1462 | Builder.CreateStore(Val: Src, Addr: Tmp); | 
|---|
| 1463 | auto *I = Builder.CreateMemCpy( | 
|---|
| 1464 | Dst: Dst.emitRawPointer(CGF&: *this), DstAlign: Dst.getAlignment().getAsAlign(), | 
|---|
| 1465 | Src: Tmp.getPointer(), SrcAlign: Tmp.getAlignment().getAsAlign(), | 
|---|
| 1466 | Size: Builder.CreateTypeSize(Ty: IntPtrTy, Size: DstSize)); | 
|---|
| 1467 | addInstToCurrentSourceAtom(KeyInstruction: I, Backup: Src); | 
|---|
| 1468 | } | 
|---|
| 1469 | } | 
|---|
| 1470 |  | 
|---|
| 1471 | static Address emitAddressAtOffset(CodeGenFunction &CGF, Address addr, | 
|---|
| 1472 | const ABIArgInfo &info) { | 
|---|
| 1473 | if (unsigned offset = info.getDirectOffset()) { | 
|---|
| 1474 | addr = addr.withElementType(ElemTy: CGF.Int8Ty); | 
|---|
| 1475 | addr = CGF.Builder.CreateConstInBoundsByteGEP( | 
|---|
| 1476 | Addr: addr, Offset: CharUnits::fromQuantity(Quantity: offset)); | 
|---|
| 1477 | addr = addr.withElementType(ElemTy: info.getCoerceToType()); | 
|---|
| 1478 | } | 
|---|
| 1479 | return addr; | 
|---|
| 1480 | } | 
|---|
| 1481 |  | 
|---|
| 1482 | static std::pair<llvm::Value *, bool> | 
|---|
| 1483 | CoerceScalableToFixed(CodeGenFunction &CGF, llvm::FixedVectorType *ToTy, | 
|---|
| 1484 | llvm::ScalableVectorType *FromTy, llvm::Value *V, | 
|---|
| 1485 | StringRef Name = "") { | 
|---|
| 1486 | // If we are casting a scalable i1 predicate vector to a fixed i8 | 
|---|
| 1487 | // vector, first bitcast the source. | 
|---|
| 1488 | if (FromTy->getElementType()->isIntegerTy(Bitwidth: 1) && | 
|---|
| 1489 | ToTy->getElementType() == CGF.Builder.getInt8Ty()) { | 
|---|
| 1490 | if (!FromTy->getElementCount().isKnownMultipleOf(RHS: 8)) { | 
|---|
| 1491 | FromTy = llvm::ScalableVectorType::get( | 
|---|
| 1492 | ElementType: FromTy->getElementType(), | 
|---|
| 1493 | MinNumElts: llvm::alignTo<8>(Value: FromTy->getElementCount().getKnownMinValue())); | 
|---|
| 1494 | llvm::Value *ZeroVec = llvm::Constant::getNullValue(Ty: FromTy); | 
|---|
| 1495 | V = CGF.Builder.CreateInsertVector(DstType: FromTy, SrcVec: ZeroVec, SubVec: V, Idx: uint64_t(0)); | 
|---|
| 1496 | } | 
|---|
| 1497 | FromTy = llvm::ScalableVectorType::get( | 
|---|
| 1498 | ElementType: ToTy->getElementType(), | 
|---|
| 1499 | MinNumElts: FromTy->getElementCount().getKnownMinValue() / 8); | 
|---|
| 1500 | V = CGF.Builder.CreateBitCast(V, DestTy: FromTy); | 
|---|
| 1501 | } | 
|---|
| 1502 | if (FromTy->getElementType() == ToTy->getElementType()) { | 
|---|
| 1503 | V->setName(Name + ".coerce"); | 
|---|
| 1504 | V = CGF.Builder.CreateExtractVector(DstType: ToTy, SrcVec: V, Idx: uint64_t(0), Name: "cast.fixed"); | 
|---|
| 1505 | return {V, true}; | 
|---|
| 1506 | } | 
|---|
| 1507 | return {V, false}; | 
|---|
| 1508 | } | 
|---|
| 1509 |  | 
|---|
| 1510 | namespace { | 
|---|
| 1511 |  | 
|---|
| 1512 | /// Encapsulates information about the way function arguments from | 
|---|
| 1513 | /// CGFunctionInfo should be passed to actual LLVM IR function. | 
|---|
| 1514 | class ClangToLLVMArgMapping { | 
|---|
| 1515 | static const unsigned InvalidIndex = ~0U; | 
|---|
| 1516 | unsigned InallocaArgNo; | 
|---|
| 1517 | unsigned SRetArgNo; | 
|---|
| 1518 | unsigned TotalIRArgs; | 
|---|
| 1519 |  | 
|---|
| 1520 | /// Arguments of LLVM IR function corresponding to single Clang argument. | 
|---|
| 1521 | struct IRArgs { | 
|---|
| 1522 | unsigned PaddingArgIndex; | 
|---|
| 1523 | // Argument is expanded to IR arguments at positions | 
|---|
| 1524 | // [FirstArgIndex, FirstArgIndex + NumberOfArgs). | 
|---|
| 1525 | unsigned FirstArgIndex; | 
|---|
| 1526 | unsigned NumberOfArgs; | 
|---|
| 1527 |  | 
|---|
| 1528 | IRArgs() | 
|---|
| 1529 | : PaddingArgIndex(InvalidIndex), FirstArgIndex(InvalidIndex), | 
|---|
| 1530 | NumberOfArgs(0) {} | 
|---|
| 1531 | }; | 
|---|
| 1532 |  | 
|---|
| 1533 | SmallVector<IRArgs, 8> ArgInfo; | 
|---|
| 1534 |  | 
|---|
| 1535 | public: | 
|---|
| 1536 | ClangToLLVMArgMapping(const ASTContext &Context, const CGFunctionInfo &FI, | 
|---|
| 1537 | bool OnlyRequiredArgs = false) | 
|---|
| 1538 | : InallocaArgNo(InvalidIndex), SRetArgNo(InvalidIndex), TotalIRArgs(0), | 
|---|
| 1539 | ArgInfo(OnlyRequiredArgs ? FI.getNumRequiredArgs() : FI.arg_size()) { | 
|---|
| 1540 | construct(Context, FI, OnlyRequiredArgs); | 
|---|
| 1541 | } | 
|---|
| 1542 |  | 
|---|
| 1543 | bool hasInallocaArg() const { return InallocaArgNo != InvalidIndex; } | 
|---|
| 1544 | unsigned getInallocaArgNo() const { | 
|---|
| 1545 | assert(hasInallocaArg()); | 
|---|
| 1546 | return InallocaArgNo; | 
|---|
| 1547 | } | 
|---|
| 1548 |  | 
|---|
| 1549 | bool hasSRetArg() const { return SRetArgNo != InvalidIndex; } | 
|---|
| 1550 | unsigned getSRetArgNo() const { | 
|---|
| 1551 | assert(hasSRetArg()); | 
|---|
| 1552 | return SRetArgNo; | 
|---|
| 1553 | } | 
|---|
| 1554 |  | 
|---|
| 1555 | unsigned totalIRArgs() const { return TotalIRArgs; } | 
|---|
| 1556 |  | 
|---|
| 1557 | bool hasPaddingArg(unsigned ArgNo) const { | 
|---|
| 1558 | assert(ArgNo < ArgInfo.size()); | 
|---|
| 1559 | return ArgInfo[ArgNo].PaddingArgIndex != InvalidIndex; | 
|---|
| 1560 | } | 
|---|
| 1561 | unsigned getPaddingArgNo(unsigned ArgNo) const { | 
|---|
| 1562 | assert(hasPaddingArg(ArgNo)); | 
|---|
| 1563 | return ArgInfo[ArgNo].PaddingArgIndex; | 
|---|
| 1564 | } | 
|---|
| 1565 |  | 
|---|
| 1566 | /// Returns index of first IR argument corresponding to ArgNo, and their | 
|---|
| 1567 | /// quantity. | 
|---|
| 1568 | std::pair<unsigned, unsigned> getIRArgs(unsigned ArgNo) const { | 
|---|
| 1569 | assert(ArgNo < ArgInfo.size()); | 
|---|
| 1570 | return std::make_pair(x: ArgInfo[ArgNo].FirstArgIndex, | 
|---|
| 1571 | y: ArgInfo[ArgNo].NumberOfArgs); | 
|---|
| 1572 | } | 
|---|
| 1573 |  | 
|---|
| 1574 | private: | 
|---|
| 1575 | void construct(const ASTContext &Context, const CGFunctionInfo &FI, | 
|---|
| 1576 | bool OnlyRequiredArgs); | 
|---|
| 1577 | }; | 
|---|
| 1578 |  | 
|---|
| 1579 | void ClangToLLVMArgMapping::construct(const ASTContext &Context, | 
|---|
| 1580 | const CGFunctionInfo &FI, | 
|---|
| 1581 | bool OnlyRequiredArgs) { | 
|---|
| 1582 | unsigned IRArgNo = 0; | 
|---|
| 1583 | bool SwapThisWithSRet = false; | 
|---|
| 1584 | const ABIArgInfo &RetAI = FI.getReturnInfo(); | 
|---|
| 1585 |  | 
|---|
| 1586 | if (RetAI.getKind() == ABIArgInfo::Indirect) { | 
|---|
| 1587 | SwapThisWithSRet = RetAI.isSRetAfterThis(); | 
|---|
| 1588 | SRetArgNo = SwapThisWithSRet ? 1 : IRArgNo++; | 
|---|
| 1589 | } | 
|---|
| 1590 |  | 
|---|
| 1591 | unsigned ArgNo = 0; | 
|---|
| 1592 | unsigned NumArgs = OnlyRequiredArgs ? FI.getNumRequiredArgs() : FI.arg_size(); | 
|---|
| 1593 | for (CGFunctionInfo::const_arg_iterator I = FI.arg_begin(); ArgNo < NumArgs; | 
|---|
| 1594 | ++I, ++ArgNo) { | 
|---|
| 1595 | assert(I != FI.arg_end()); | 
|---|
| 1596 | QualType ArgType = I->type; | 
|---|
| 1597 | const ABIArgInfo &AI = I->info; | 
|---|
| 1598 | // Collect data about IR arguments corresponding to Clang argument ArgNo. | 
|---|
| 1599 | auto &IRArgs = ArgInfo[ArgNo]; | 
|---|
| 1600 |  | 
|---|
| 1601 | if (AI.getPaddingType()) | 
|---|
| 1602 | IRArgs.PaddingArgIndex = IRArgNo++; | 
|---|
| 1603 |  | 
|---|
| 1604 | switch (AI.getKind()) { | 
|---|
| 1605 | case ABIArgInfo::Extend: | 
|---|
| 1606 | case ABIArgInfo::Direct: { | 
|---|
| 1607 | // FIXME: handle sseregparm someday... | 
|---|
| 1608 | llvm::StructType *STy = dyn_cast<llvm::StructType>(Val: AI.getCoerceToType()); | 
|---|
| 1609 | if (AI.isDirect() && AI.getCanBeFlattened() && STy) { | 
|---|
| 1610 | IRArgs.NumberOfArgs = STy->getNumElements(); | 
|---|
| 1611 | } else { | 
|---|
| 1612 | IRArgs.NumberOfArgs = 1; | 
|---|
| 1613 | } | 
|---|
| 1614 | break; | 
|---|
| 1615 | } | 
|---|
| 1616 | case ABIArgInfo::Indirect: | 
|---|
| 1617 | case ABIArgInfo::IndirectAliased: | 
|---|
| 1618 | IRArgs.NumberOfArgs = 1; | 
|---|
| 1619 | break; | 
|---|
| 1620 | case ABIArgInfo::Ignore: | 
|---|
| 1621 | case ABIArgInfo::InAlloca: | 
|---|
| 1622 | // ignore and inalloca doesn't have matching LLVM parameters. | 
|---|
| 1623 | IRArgs.NumberOfArgs = 0; | 
|---|
| 1624 | break; | 
|---|
| 1625 | case ABIArgInfo::CoerceAndExpand: | 
|---|
| 1626 | IRArgs.NumberOfArgs = AI.getCoerceAndExpandTypeSequence().size(); | 
|---|
| 1627 | break; | 
|---|
| 1628 | case ABIArgInfo::Expand: | 
|---|
| 1629 | IRArgs.NumberOfArgs = getExpansionSize(Ty: ArgType, Context); | 
|---|
| 1630 | break; | 
|---|
| 1631 | } | 
|---|
| 1632 |  | 
|---|
| 1633 | if (IRArgs.NumberOfArgs > 0) { | 
|---|
| 1634 | IRArgs.FirstArgIndex = IRArgNo; | 
|---|
| 1635 | IRArgNo += IRArgs.NumberOfArgs; | 
|---|
| 1636 | } | 
|---|
| 1637 |  | 
|---|
| 1638 | // Skip over the sret parameter when it comes second.  We already handled it | 
|---|
| 1639 | // above. | 
|---|
| 1640 | if (IRArgNo == 1 && SwapThisWithSRet) | 
|---|
| 1641 | IRArgNo++; | 
|---|
| 1642 | } | 
|---|
| 1643 | assert(ArgNo == ArgInfo.size()); | 
|---|
| 1644 |  | 
|---|
| 1645 | if (FI.usesInAlloca()) | 
|---|
| 1646 | InallocaArgNo = IRArgNo++; | 
|---|
| 1647 |  | 
|---|
| 1648 | TotalIRArgs = IRArgNo; | 
|---|
| 1649 | } | 
|---|
| 1650 | } // namespace | 
|---|
| 1651 |  | 
|---|
| 1652 | /***/ | 
|---|
| 1653 |  | 
|---|
| 1654 | bool CodeGenModule::ReturnTypeUsesSRet(const CGFunctionInfo &FI) { | 
|---|
| 1655 | const auto &RI = FI.getReturnInfo(); | 
|---|
| 1656 | return RI.isIndirect() || (RI.isInAlloca() && RI.getInAllocaSRet()); | 
|---|
| 1657 | } | 
|---|
| 1658 |  | 
|---|
| 1659 | bool CodeGenModule::ReturnTypeHasInReg(const CGFunctionInfo &FI) { | 
|---|
| 1660 | const auto &RI = FI.getReturnInfo(); | 
|---|
| 1661 | return RI.getInReg(); | 
|---|
| 1662 | } | 
|---|
| 1663 |  | 
|---|
| 1664 | bool CodeGenModule::ReturnSlotInterferesWithArgs(const CGFunctionInfo &FI) { | 
|---|
| 1665 | return ReturnTypeUsesSRet(FI) && | 
|---|
| 1666 | getTargetCodeGenInfo().doesReturnSlotInterfereWithArgs(); | 
|---|
| 1667 | } | 
|---|
| 1668 |  | 
|---|
| 1669 | bool CodeGenModule::ReturnTypeUsesFPRet(QualType ResultType) { | 
|---|
| 1670 | if (const BuiltinType *BT = ResultType->getAs<BuiltinType>()) { | 
|---|
| 1671 | switch (BT->getKind()) { | 
|---|
| 1672 | default: | 
|---|
| 1673 | return false; | 
|---|
| 1674 | case BuiltinType::Float: | 
|---|
| 1675 | return getTarget().useObjCFPRetForRealType(T: FloatModeKind::Float); | 
|---|
| 1676 | case BuiltinType::Double: | 
|---|
| 1677 | return getTarget().useObjCFPRetForRealType(T: FloatModeKind::Double); | 
|---|
| 1678 | case BuiltinType::LongDouble: | 
|---|
| 1679 | return getTarget().useObjCFPRetForRealType(T: FloatModeKind::LongDouble); | 
|---|
| 1680 | } | 
|---|
| 1681 | } | 
|---|
| 1682 |  | 
|---|
| 1683 | return false; | 
|---|
| 1684 | } | 
|---|
| 1685 |  | 
|---|
| 1686 | bool CodeGenModule::ReturnTypeUsesFP2Ret(QualType ResultType) { | 
|---|
| 1687 | if (const ComplexType *CT = ResultType->getAs<ComplexType>()) { | 
|---|
| 1688 | if (const BuiltinType *BT = CT->getElementType()->getAs<BuiltinType>()) { | 
|---|
| 1689 | if (BT->getKind() == BuiltinType::LongDouble) | 
|---|
| 1690 | return getTarget().useObjCFP2RetForComplexLongDouble(); | 
|---|
| 1691 | } | 
|---|
| 1692 | } | 
|---|
| 1693 |  | 
|---|
| 1694 | return false; | 
|---|
| 1695 | } | 
|---|
| 1696 |  | 
|---|
| 1697 | llvm::FunctionType *CodeGenTypes::GetFunctionType(GlobalDecl GD) { | 
|---|
| 1698 | const CGFunctionInfo &FI = arrangeGlobalDeclaration(GD); | 
|---|
| 1699 | return GetFunctionType(Info: FI); | 
|---|
| 1700 | } | 
|---|
| 1701 |  | 
|---|
| 1702 | llvm::FunctionType *CodeGenTypes::GetFunctionType(const CGFunctionInfo &FI) { | 
|---|
| 1703 |  | 
|---|
| 1704 | bool Inserted = FunctionsBeingProcessed.insert(Ptr: &FI).second; | 
|---|
| 1705 | (void)Inserted; | 
|---|
| 1706 | assert(Inserted && "Recursively being processed?"); | 
|---|
| 1707 |  | 
|---|
| 1708 | llvm::Type *resultType = nullptr; | 
|---|
| 1709 | const ABIArgInfo &retAI = FI.getReturnInfo(); | 
|---|
| 1710 | switch (retAI.getKind()) { | 
|---|
| 1711 | case ABIArgInfo::Expand: | 
|---|
| 1712 | case ABIArgInfo::IndirectAliased: | 
|---|
| 1713 | llvm_unreachable( "Invalid ABI kind for return argument"); | 
|---|
| 1714 |  | 
|---|
| 1715 | case ABIArgInfo::Extend: | 
|---|
| 1716 | case ABIArgInfo::Direct: | 
|---|
| 1717 | resultType = retAI.getCoerceToType(); | 
|---|
| 1718 | break; | 
|---|
| 1719 |  | 
|---|
| 1720 | case ABIArgInfo::InAlloca: | 
|---|
| 1721 | if (retAI.getInAllocaSRet()) { | 
|---|
| 1722 | // sret things on win32 aren't void, they return the sret pointer. | 
|---|
| 1723 | QualType ret = FI.getReturnType(); | 
|---|
| 1724 | unsigned addressSpace = CGM.getTypes().getTargetAddressSpace(T: ret); | 
|---|
| 1725 | resultType = llvm::PointerType::get(C&: getLLVMContext(), AddressSpace: addressSpace); | 
|---|
| 1726 | } else { | 
|---|
| 1727 | resultType = llvm::Type::getVoidTy(C&: getLLVMContext()); | 
|---|
| 1728 | } | 
|---|
| 1729 | break; | 
|---|
| 1730 |  | 
|---|
| 1731 | case ABIArgInfo::Indirect: | 
|---|
| 1732 | case ABIArgInfo::Ignore: | 
|---|
| 1733 | resultType = llvm::Type::getVoidTy(C&: getLLVMContext()); | 
|---|
| 1734 | break; | 
|---|
| 1735 |  | 
|---|
| 1736 | case ABIArgInfo::CoerceAndExpand: | 
|---|
| 1737 | resultType = retAI.getUnpaddedCoerceAndExpandType(); | 
|---|
| 1738 | break; | 
|---|
| 1739 | } | 
|---|
| 1740 |  | 
|---|
| 1741 | ClangToLLVMArgMapping IRFunctionArgs(getContext(), FI, true); | 
|---|
| 1742 | SmallVector<llvm::Type *, 8> ArgTypes(IRFunctionArgs.totalIRArgs()); | 
|---|
| 1743 |  | 
|---|
| 1744 | // Add type for sret argument. | 
|---|
| 1745 | if (IRFunctionArgs.hasSRetArg()) { | 
|---|
| 1746 | ArgTypes[IRFunctionArgs.getSRetArgNo()] = llvm::PointerType::get( | 
|---|
| 1747 | C&: getLLVMContext(), AddressSpace: FI.getReturnInfo().getIndirectAddrSpace()); | 
|---|
| 1748 | } | 
|---|
| 1749 |  | 
|---|
| 1750 | // Add type for inalloca argument. | 
|---|
| 1751 | if (IRFunctionArgs.hasInallocaArg()) | 
|---|
| 1752 | ArgTypes[IRFunctionArgs.getInallocaArgNo()] = | 
|---|
| 1753 | llvm::PointerType::getUnqual(C&: getLLVMContext()); | 
|---|
| 1754 |  | 
|---|
| 1755 | // Add in all of the required arguments. | 
|---|
| 1756 | unsigned ArgNo = 0; | 
|---|
| 1757 | CGFunctionInfo::const_arg_iterator it = FI.arg_begin(), | 
|---|
| 1758 | ie = it + FI.getNumRequiredArgs(); | 
|---|
| 1759 | for (; it != ie; ++it, ++ArgNo) { | 
|---|
| 1760 | const ABIArgInfo &ArgInfo = it->info; | 
|---|
| 1761 |  | 
|---|
| 1762 | // Insert a padding type to ensure proper alignment. | 
|---|
| 1763 | if (IRFunctionArgs.hasPaddingArg(ArgNo)) | 
|---|
| 1764 | ArgTypes[IRFunctionArgs.getPaddingArgNo(ArgNo)] = | 
|---|
| 1765 | ArgInfo.getPaddingType(); | 
|---|
| 1766 |  | 
|---|
| 1767 | unsigned FirstIRArg, NumIRArgs; | 
|---|
| 1768 | std::tie(args&: FirstIRArg, args&: NumIRArgs) = IRFunctionArgs.getIRArgs(ArgNo); | 
|---|
| 1769 |  | 
|---|
| 1770 | switch (ArgInfo.getKind()) { | 
|---|
| 1771 | case ABIArgInfo::Ignore: | 
|---|
| 1772 | case ABIArgInfo::InAlloca: | 
|---|
| 1773 | assert(NumIRArgs == 0); | 
|---|
| 1774 | break; | 
|---|
| 1775 |  | 
|---|
| 1776 | case ABIArgInfo::Indirect: | 
|---|
| 1777 | assert(NumIRArgs == 1); | 
|---|
| 1778 | // indirect arguments are always on the stack, which is alloca addr space. | 
|---|
| 1779 | ArgTypes[FirstIRArg] = llvm::PointerType::get( | 
|---|
| 1780 | C&: getLLVMContext(), AddressSpace: CGM.getDataLayout().getAllocaAddrSpace()); | 
|---|
| 1781 | break; | 
|---|
| 1782 | case ABIArgInfo::IndirectAliased: | 
|---|
| 1783 | assert(NumIRArgs == 1); | 
|---|
| 1784 | ArgTypes[FirstIRArg] = llvm::PointerType::get( | 
|---|
| 1785 | C&: getLLVMContext(), AddressSpace: ArgInfo.getIndirectAddrSpace()); | 
|---|
| 1786 | break; | 
|---|
| 1787 | case ABIArgInfo::Extend: | 
|---|
| 1788 | case ABIArgInfo::Direct: { | 
|---|
| 1789 | // Fast-isel and the optimizer generally like scalar values better than | 
|---|
| 1790 | // FCAs, so we flatten them if this is safe to do for this argument. | 
|---|
| 1791 | llvm::Type *argType = ArgInfo.getCoerceToType(); | 
|---|
| 1792 | llvm::StructType *st = dyn_cast<llvm::StructType>(Val: argType); | 
|---|
| 1793 | if (st && ArgInfo.isDirect() && ArgInfo.getCanBeFlattened()) { | 
|---|
| 1794 | assert(NumIRArgs == st->getNumElements()); | 
|---|
| 1795 | for (unsigned i = 0, e = st->getNumElements(); i != e; ++i) | 
|---|
| 1796 | ArgTypes[FirstIRArg + i] = st->getElementType(N: i); | 
|---|
| 1797 | } else { | 
|---|
| 1798 | assert(NumIRArgs == 1); | 
|---|
| 1799 | ArgTypes[FirstIRArg] = argType; | 
|---|
| 1800 | } | 
|---|
| 1801 | break; | 
|---|
| 1802 | } | 
|---|
| 1803 |  | 
|---|
| 1804 | case ABIArgInfo::CoerceAndExpand: { | 
|---|
| 1805 | auto ArgTypesIter = ArgTypes.begin() + FirstIRArg; | 
|---|
| 1806 | for (auto *EltTy : ArgInfo.getCoerceAndExpandTypeSequence()) { | 
|---|
| 1807 | *ArgTypesIter++ = EltTy; | 
|---|
| 1808 | } | 
|---|
| 1809 | assert(ArgTypesIter == ArgTypes.begin() + FirstIRArg + NumIRArgs); | 
|---|
| 1810 | break; | 
|---|
| 1811 | } | 
|---|
| 1812 |  | 
|---|
| 1813 | case ABIArgInfo::Expand: | 
|---|
| 1814 | auto ArgTypesIter = ArgTypes.begin() + FirstIRArg; | 
|---|
| 1815 | getExpandedTypes(Ty: it->type, TI&: ArgTypesIter); | 
|---|
| 1816 | assert(ArgTypesIter == ArgTypes.begin() + FirstIRArg + NumIRArgs); | 
|---|
| 1817 | break; | 
|---|
| 1818 | } | 
|---|
| 1819 | } | 
|---|
| 1820 |  | 
|---|
| 1821 | bool Erased = FunctionsBeingProcessed.erase(Ptr: &FI); | 
|---|
| 1822 | (void)Erased; | 
|---|
| 1823 | assert(Erased && "Not in set?"); | 
|---|
| 1824 |  | 
|---|
| 1825 | return llvm::FunctionType::get(Result: resultType, Params: ArgTypes, isVarArg: FI.isVariadic()); | 
|---|
| 1826 | } | 
|---|
| 1827 |  | 
|---|
| 1828 | llvm::Type *CodeGenTypes::GetFunctionTypeForVTable(GlobalDecl GD) { | 
|---|
| 1829 | const CXXMethodDecl *MD = cast<CXXMethodDecl>(Val: GD.getDecl()); | 
|---|
| 1830 | const FunctionProtoType *FPT = MD->getType()->castAs<FunctionProtoType>(); | 
|---|
| 1831 |  | 
|---|
| 1832 | if (!isFuncTypeConvertible(FT: FPT)) | 
|---|
| 1833 | return llvm::StructType::get(Context&: getLLVMContext()); | 
|---|
| 1834 |  | 
|---|
| 1835 | return GetFunctionType(GD); | 
|---|
| 1836 | } | 
|---|
| 1837 |  | 
|---|
| 1838 | static void AddAttributesFromFunctionProtoType(ASTContext &Ctx, | 
|---|
| 1839 | llvm::AttrBuilder &FuncAttrs, | 
|---|
| 1840 | const FunctionProtoType *FPT) { | 
|---|
| 1841 | if (!FPT) | 
|---|
| 1842 | return; | 
|---|
| 1843 |  | 
|---|
| 1844 | if (!isUnresolvedExceptionSpec(ESpecType: FPT->getExceptionSpecType()) && | 
|---|
| 1845 | FPT->isNothrow()) | 
|---|
| 1846 | FuncAttrs.addAttribute(Val: llvm::Attribute::NoUnwind); | 
|---|
| 1847 |  | 
|---|
| 1848 | unsigned SMEBits = FPT->getAArch64SMEAttributes(); | 
|---|
| 1849 | if (SMEBits & FunctionType::SME_PStateSMEnabledMask) | 
|---|
| 1850 | FuncAttrs.addAttribute(A: "aarch64_pstate_sm_enabled"); | 
|---|
| 1851 | if (SMEBits & FunctionType::SME_PStateSMCompatibleMask) | 
|---|
| 1852 | FuncAttrs.addAttribute(A: "aarch64_pstate_sm_compatible"); | 
|---|
| 1853 | if (SMEBits & FunctionType::SME_AgnosticZAStateMask) | 
|---|
| 1854 | FuncAttrs.addAttribute(A: "aarch64_za_state_agnostic"); | 
|---|
| 1855 |  | 
|---|
| 1856 | // ZA | 
|---|
| 1857 | if (FunctionType::getArmZAState(AttrBits: SMEBits) == FunctionType::ARM_Preserves) | 
|---|
| 1858 | FuncAttrs.addAttribute(A: "aarch64_preserves_za"); | 
|---|
| 1859 | if (FunctionType::getArmZAState(AttrBits: SMEBits) == FunctionType::ARM_In) | 
|---|
| 1860 | FuncAttrs.addAttribute(A: "aarch64_in_za"); | 
|---|
| 1861 | if (FunctionType::getArmZAState(AttrBits: SMEBits) == FunctionType::ARM_Out) | 
|---|
| 1862 | FuncAttrs.addAttribute(A: "aarch64_out_za"); | 
|---|
| 1863 | if (FunctionType::getArmZAState(AttrBits: SMEBits) == FunctionType::ARM_InOut) | 
|---|
| 1864 | FuncAttrs.addAttribute(A: "aarch64_inout_za"); | 
|---|
| 1865 |  | 
|---|
| 1866 | // ZT0 | 
|---|
| 1867 | if (FunctionType::getArmZT0State(AttrBits: SMEBits) == FunctionType::ARM_Preserves) | 
|---|
| 1868 | FuncAttrs.addAttribute(A: "aarch64_preserves_zt0"); | 
|---|
| 1869 | if (FunctionType::getArmZT0State(AttrBits: SMEBits) == FunctionType::ARM_In) | 
|---|
| 1870 | FuncAttrs.addAttribute(A: "aarch64_in_zt0"); | 
|---|
| 1871 | if (FunctionType::getArmZT0State(AttrBits: SMEBits) == FunctionType::ARM_Out) | 
|---|
| 1872 | FuncAttrs.addAttribute(A: "aarch64_out_zt0"); | 
|---|
| 1873 | if (FunctionType::getArmZT0State(AttrBits: SMEBits) == FunctionType::ARM_InOut) | 
|---|
| 1874 | FuncAttrs.addAttribute(A: "aarch64_inout_zt0"); | 
|---|
| 1875 | } | 
|---|
| 1876 |  | 
|---|
| 1877 | static void AddAttributesFromOMPAssumes(llvm::AttrBuilder &FuncAttrs, | 
|---|
| 1878 | const Decl *Callee) { | 
|---|
| 1879 | if (!Callee) | 
|---|
| 1880 | return; | 
|---|
| 1881 |  | 
|---|
| 1882 | SmallVector<StringRef, 4> Attrs; | 
|---|
| 1883 |  | 
|---|
| 1884 | for (const OMPAssumeAttr *AA : Callee->specific_attrs<OMPAssumeAttr>()) | 
|---|
| 1885 | AA->getAssumption().split(A&: Attrs, Separator: ","); | 
|---|
| 1886 |  | 
|---|
| 1887 | if (!Attrs.empty()) | 
|---|
| 1888 | FuncAttrs.addAttribute(A: llvm::AssumptionAttrKey, | 
|---|
| 1889 | V: llvm::join(Begin: Attrs.begin(), End: Attrs.end(), Separator: ",")); | 
|---|
| 1890 | } | 
|---|
| 1891 |  | 
|---|
| 1892 | bool CodeGenModule::MayDropFunctionReturn(const ASTContext &Context, | 
|---|
| 1893 | QualType ReturnType) const { | 
|---|
| 1894 | // We can't just discard the return value for a record type with a | 
|---|
| 1895 | // complex destructor or a non-trivially copyable type. | 
|---|
| 1896 | if (const RecordType *RT = | 
|---|
| 1897 | ReturnType.getCanonicalType()->getAs<RecordType>()) { | 
|---|
| 1898 | if (const auto *ClassDecl = dyn_cast<CXXRecordDecl>(Val: RT->getDecl())) | 
|---|
| 1899 | return ClassDecl->hasTrivialDestructor(); | 
|---|
| 1900 | } | 
|---|
| 1901 | return ReturnType.isTriviallyCopyableType(Context); | 
|---|
| 1902 | } | 
|---|
| 1903 |  | 
|---|
| 1904 | static bool HasStrictReturn(const CodeGenModule &Module, QualType RetTy, | 
|---|
| 1905 | const Decl *TargetDecl) { | 
|---|
| 1906 | // As-is msan can not tolerate noundef mismatch between caller and | 
|---|
| 1907 | // implementation. Mismatch is possible for e.g. indirect calls from C-caller | 
|---|
| 1908 | // into C++. Such mismatches lead to confusing false reports. To avoid | 
|---|
| 1909 | // expensive workaround on msan we enforce initialization event in uncommon | 
|---|
| 1910 | // cases where it's allowed. | 
|---|
| 1911 | if (Module.getLangOpts().Sanitize.has(K: SanitizerKind::Memory)) | 
|---|
| 1912 | return true; | 
|---|
| 1913 | // C++ explicitly makes returning undefined values UB. C's rule only applies | 
|---|
| 1914 | // to used values, so we never mark them noundef for now. | 
|---|
| 1915 | if (!Module.getLangOpts().CPlusPlus) | 
|---|
| 1916 | return false; | 
|---|
| 1917 | if (TargetDecl) { | 
|---|
| 1918 | if (const FunctionDecl *FDecl = dyn_cast<FunctionDecl>(Val: TargetDecl)) { | 
|---|
| 1919 | if (FDecl->isExternC()) | 
|---|
| 1920 | return false; | 
|---|
| 1921 | } else if (const VarDecl *VDecl = dyn_cast<VarDecl>(Val: TargetDecl)) { | 
|---|
| 1922 | // Function pointer. | 
|---|
| 1923 | if (VDecl->isExternC()) | 
|---|
| 1924 | return false; | 
|---|
| 1925 | } | 
|---|
| 1926 | } | 
|---|
| 1927 |  | 
|---|
| 1928 | // We don't want to be too aggressive with the return checking, unless | 
|---|
| 1929 | // it's explicit in the code opts or we're using an appropriate sanitizer. | 
|---|
| 1930 | // Try to respect what the programmer intended. | 
|---|
| 1931 | return Module.getCodeGenOpts().StrictReturn || | 
|---|
| 1932 | !Module.MayDropFunctionReturn(Context: Module.getContext(), ReturnType: RetTy) || | 
|---|
| 1933 | Module.getLangOpts().Sanitize.has(K: SanitizerKind::Return); | 
|---|
| 1934 | } | 
|---|
| 1935 |  | 
|---|
| 1936 | /// Add denormal-fp-math and denormal-fp-math-f32 as appropriate for the | 
|---|
| 1937 | /// requested denormal behavior, accounting for the overriding behavior of the | 
|---|
| 1938 | /// -f32 case. | 
|---|
| 1939 | static void addDenormalModeAttrs(llvm::DenormalMode FPDenormalMode, | 
|---|
| 1940 | llvm::DenormalMode FP32DenormalMode, | 
|---|
| 1941 | llvm::AttrBuilder &FuncAttrs) { | 
|---|
| 1942 | if (FPDenormalMode != llvm::DenormalMode::getDefault()) | 
|---|
| 1943 | FuncAttrs.addAttribute(A: "denormal-fp-math", V: FPDenormalMode.str()); | 
|---|
| 1944 |  | 
|---|
| 1945 | if (FP32DenormalMode != FPDenormalMode && FP32DenormalMode.isValid()) | 
|---|
| 1946 | FuncAttrs.addAttribute(A: "denormal-fp-math-f32", V: FP32DenormalMode.str()); | 
|---|
| 1947 | } | 
|---|
| 1948 |  | 
|---|
| 1949 | /// Add default attributes to a function, which have merge semantics under | 
|---|
| 1950 | /// -mlink-builtin-bitcode and should not simply overwrite any existing | 
|---|
| 1951 | /// attributes in the linked library. | 
|---|
| 1952 | static void | 
|---|
| 1953 | addMergableDefaultFunctionAttributes(const CodeGenOptions &CodeGenOpts, | 
|---|
| 1954 | llvm::AttrBuilder &FuncAttrs) { | 
|---|
| 1955 | addDenormalModeAttrs(FPDenormalMode: CodeGenOpts.FPDenormalMode, FP32DenormalMode: CodeGenOpts.FP32DenormalMode, | 
|---|
| 1956 | FuncAttrs); | 
|---|
| 1957 | } | 
|---|
| 1958 |  | 
|---|
| 1959 | static void getTrivialDefaultFunctionAttributes( | 
|---|
| 1960 | StringRef Name, bool HasOptnone, const CodeGenOptions &CodeGenOpts, | 
|---|
| 1961 | const LangOptions &LangOpts, bool AttrOnCallSite, | 
|---|
| 1962 | llvm::AttrBuilder &FuncAttrs) { | 
|---|
| 1963 | // OptimizeNoneAttr takes precedence over -Os or -Oz. No warning needed. | 
|---|
| 1964 | if (!HasOptnone) { | 
|---|
| 1965 | if (CodeGenOpts.OptimizeSize) | 
|---|
| 1966 | FuncAttrs.addAttribute(Val: llvm::Attribute::OptimizeForSize); | 
|---|
| 1967 | if (CodeGenOpts.OptimizeSize == 2) | 
|---|
| 1968 | FuncAttrs.addAttribute(Val: llvm::Attribute::MinSize); | 
|---|
| 1969 | } | 
|---|
| 1970 |  | 
|---|
| 1971 | if (CodeGenOpts.DisableRedZone) | 
|---|
| 1972 | FuncAttrs.addAttribute(Val: llvm::Attribute::NoRedZone); | 
|---|
| 1973 | if (CodeGenOpts.IndirectTlsSegRefs) | 
|---|
| 1974 | FuncAttrs.addAttribute(A: "indirect-tls-seg-refs"); | 
|---|
| 1975 | if (CodeGenOpts.NoImplicitFloat) | 
|---|
| 1976 | FuncAttrs.addAttribute(Val: llvm::Attribute::NoImplicitFloat); | 
|---|
| 1977 |  | 
|---|
| 1978 | if (AttrOnCallSite) { | 
|---|
| 1979 | // Attributes that should go on the call site only. | 
|---|
| 1980 | // FIXME: Look for 'BuiltinAttr' on the function rather than re-checking | 
|---|
| 1981 | // the -fno-builtin-foo list. | 
|---|
| 1982 | if (!CodeGenOpts.SimplifyLibCalls || LangOpts.isNoBuiltinFunc(Name)) | 
|---|
| 1983 | FuncAttrs.addAttribute(Val: llvm::Attribute::NoBuiltin); | 
|---|
| 1984 | if (!CodeGenOpts.TrapFuncName.empty()) | 
|---|
| 1985 | FuncAttrs.addAttribute(A: "trap-func-name", V: CodeGenOpts.TrapFuncName); | 
|---|
| 1986 | } else { | 
|---|
| 1987 | switch (CodeGenOpts.getFramePointer()) { | 
|---|
| 1988 | case CodeGenOptions::FramePointerKind::None: | 
|---|
| 1989 | // This is the default behavior. | 
|---|
| 1990 | break; | 
|---|
| 1991 | case CodeGenOptions::FramePointerKind::Reserved: | 
|---|
| 1992 | case CodeGenOptions::FramePointerKind::NonLeaf: | 
|---|
| 1993 | case CodeGenOptions::FramePointerKind::All: | 
|---|
| 1994 | FuncAttrs.addAttribute(A: "frame-pointer", | 
|---|
| 1995 | V: CodeGenOptions::getFramePointerKindName( | 
|---|
| 1996 | Kind: CodeGenOpts.getFramePointer())); | 
|---|
| 1997 | } | 
|---|
| 1998 |  | 
|---|
| 1999 | if (CodeGenOpts.LessPreciseFPMAD) | 
|---|
| 2000 | FuncAttrs.addAttribute(A: "less-precise-fpmad", V: "true"); | 
|---|
| 2001 |  | 
|---|
| 2002 | if (CodeGenOpts.NullPointerIsValid) | 
|---|
| 2003 | FuncAttrs.addAttribute(Val: llvm::Attribute::NullPointerIsValid); | 
|---|
| 2004 |  | 
|---|
| 2005 | if (LangOpts.getDefaultExceptionMode() == LangOptions::FPE_Ignore) | 
|---|
| 2006 | FuncAttrs.addAttribute(A: "no-trapping-math", V: "true"); | 
|---|
| 2007 |  | 
|---|
| 2008 | // TODO: Are these all needed? | 
|---|
| 2009 | // unsafe/inf/nan/nsz are handled by instruction-level FastMathFlags. | 
|---|
| 2010 | if (LangOpts.NoHonorInfs) | 
|---|
| 2011 | FuncAttrs.addAttribute(A: "no-infs-fp-math", V: "true"); | 
|---|
| 2012 | if (LangOpts.NoHonorNaNs) | 
|---|
| 2013 | FuncAttrs.addAttribute(A: "no-nans-fp-math", V: "true"); | 
|---|
| 2014 | if (LangOpts.ApproxFunc) | 
|---|
| 2015 | FuncAttrs.addAttribute(A: "approx-func-fp-math", V: "true"); | 
|---|
| 2016 | if (LangOpts.AllowFPReassoc && LangOpts.AllowRecip && | 
|---|
| 2017 | LangOpts.NoSignedZero && LangOpts.ApproxFunc && | 
|---|
| 2018 | (LangOpts.getDefaultFPContractMode() == | 
|---|
| 2019 | LangOptions::FPModeKind::FPM_Fast || | 
|---|
| 2020 | LangOpts.getDefaultFPContractMode() == | 
|---|
| 2021 | LangOptions::FPModeKind::FPM_FastHonorPragmas)) | 
|---|
| 2022 | FuncAttrs.addAttribute(A: "unsafe-fp-math", V: "true"); | 
|---|
| 2023 | if (CodeGenOpts.SoftFloat) | 
|---|
| 2024 | FuncAttrs.addAttribute(A: "use-soft-float", V: "true"); | 
|---|
| 2025 | FuncAttrs.addAttribute(A: "stack-protector-buffer-size", | 
|---|
| 2026 | V: llvm::utostr(X: CodeGenOpts.SSPBufferSize)); | 
|---|
| 2027 | if (LangOpts.NoSignedZero) | 
|---|
| 2028 | FuncAttrs.addAttribute(A: "no-signed-zeros-fp-math", V: "true"); | 
|---|
| 2029 |  | 
|---|
| 2030 | // TODO: Reciprocal estimate codegen options should apply to instructions? | 
|---|
| 2031 | const std::vector<std::string> &Recips = CodeGenOpts.Reciprocals; | 
|---|
| 2032 | if (!Recips.empty()) | 
|---|
| 2033 | FuncAttrs.addAttribute(A: "reciprocal-estimates", V: llvm::join(R: Recips, Separator: ",")); | 
|---|
| 2034 |  | 
|---|
| 2035 | if (!CodeGenOpts.PreferVectorWidth.empty() && | 
|---|
| 2036 | CodeGenOpts.PreferVectorWidth != "none") | 
|---|
| 2037 | FuncAttrs.addAttribute(A: "prefer-vector-width", | 
|---|
| 2038 | V: CodeGenOpts.PreferVectorWidth); | 
|---|
| 2039 |  | 
|---|
| 2040 | if (CodeGenOpts.StackRealignment) | 
|---|
| 2041 | FuncAttrs.addAttribute(A: "stackrealign"); | 
|---|
| 2042 | if (CodeGenOpts.Backchain) | 
|---|
| 2043 | FuncAttrs.addAttribute(A: "backchain"); | 
|---|
| 2044 | if (CodeGenOpts.EnableSegmentedStacks) | 
|---|
| 2045 | FuncAttrs.addAttribute(A: "split-stack"); | 
|---|
| 2046 |  | 
|---|
| 2047 | if (CodeGenOpts.SpeculativeLoadHardening) | 
|---|
| 2048 | FuncAttrs.addAttribute(Val: llvm::Attribute::SpeculativeLoadHardening); | 
|---|
| 2049 |  | 
|---|
| 2050 | // Add zero-call-used-regs attribute. | 
|---|
| 2051 | switch (CodeGenOpts.getZeroCallUsedRegs()) { | 
|---|
| 2052 | case llvm::ZeroCallUsedRegs::ZeroCallUsedRegsKind::Skip: | 
|---|
| 2053 | FuncAttrs.removeAttribute(A: "zero-call-used-regs"); | 
|---|
| 2054 | break; | 
|---|
| 2055 | case llvm::ZeroCallUsedRegs::ZeroCallUsedRegsKind::UsedGPRArg: | 
|---|
| 2056 | FuncAttrs.addAttribute(A: "zero-call-used-regs", V: "used-gpr-arg"); | 
|---|
| 2057 | break; | 
|---|
| 2058 | case llvm::ZeroCallUsedRegs::ZeroCallUsedRegsKind::UsedGPR: | 
|---|
| 2059 | FuncAttrs.addAttribute(A: "zero-call-used-regs", V: "used-gpr"); | 
|---|
| 2060 | break; | 
|---|
| 2061 | case llvm::ZeroCallUsedRegs::ZeroCallUsedRegsKind::UsedArg: | 
|---|
| 2062 | FuncAttrs.addAttribute(A: "zero-call-used-regs", V: "used-arg"); | 
|---|
| 2063 | break; | 
|---|
| 2064 | case llvm::ZeroCallUsedRegs::ZeroCallUsedRegsKind::Used: | 
|---|
| 2065 | FuncAttrs.addAttribute(A: "zero-call-used-regs", V: "used"); | 
|---|
| 2066 | break; | 
|---|
| 2067 | case llvm::ZeroCallUsedRegs::ZeroCallUsedRegsKind::AllGPRArg: | 
|---|
| 2068 | FuncAttrs.addAttribute(A: "zero-call-used-regs", V: "all-gpr-arg"); | 
|---|
| 2069 | break; | 
|---|
| 2070 | case llvm::ZeroCallUsedRegs::ZeroCallUsedRegsKind::AllGPR: | 
|---|
| 2071 | FuncAttrs.addAttribute(A: "zero-call-used-regs", V: "all-gpr"); | 
|---|
| 2072 | break; | 
|---|
| 2073 | case llvm::ZeroCallUsedRegs::ZeroCallUsedRegsKind::AllArg: | 
|---|
| 2074 | FuncAttrs.addAttribute(A: "zero-call-used-regs", V: "all-arg"); | 
|---|
| 2075 | break; | 
|---|
| 2076 | case llvm::ZeroCallUsedRegs::ZeroCallUsedRegsKind::All: | 
|---|
| 2077 | FuncAttrs.addAttribute(A: "zero-call-used-regs", V: "all"); | 
|---|
| 2078 | break; | 
|---|
| 2079 | } | 
|---|
| 2080 | } | 
|---|
| 2081 |  | 
|---|
| 2082 | if (LangOpts.assumeFunctionsAreConvergent()) { | 
|---|
| 2083 | // Conservatively, mark all functions and calls in CUDA and OpenCL as | 
|---|
| 2084 | // convergent (meaning, they may call an intrinsically convergent op, such | 
|---|
| 2085 | // as __syncthreads() / barrier(), and so can't have certain optimizations | 
|---|
| 2086 | // applied around them).  LLVM will remove this attribute where it safely | 
|---|
| 2087 | // can. | 
|---|
| 2088 | FuncAttrs.addAttribute(Val: llvm::Attribute::Convergent); | 
|---|
| 2089 | } | 
|---|
| 2090 |  | 
|---|
| 2091 | // TODO: NoUnwind attribute should be added for other GPU modes HIP, | 
|---|
| 2092 | // OpenMP offload. AFAIK, neither of them support exceptions in device code. | 
|---|
| 2093 | if ((LangOpts.CUDA && LangOpts.CUDAIsDevice) || LangOpts.OpenCL || | 
|---|
| 2094 | LangOpts.SYCLIsDevice) { | 
|---|
| 2095 | FuncAttrs.addAttribute(Val: llvm::Attribute::NoUnwind); | 
|---|
| 2096 | } | 
|---|
| 2097 |  | 
|---|
| 2098 | if (CodeGenOpts.SaveRegParams && !AttrOnCallSite) | 
|---|
| 2099 | FuncAttrs.addAttribute(A: "save-reg-params"); | 
|---|
| 2100 |  | 
|---|
| 2101 | for (StringRef Attr : CodeGenOpts.DefaultFunctionAttrs) { | 
|---|
| 2102 | StringRef Var, Value; | 
|---|
| 2103 | std::tie(args&: Var, args&: Value) = Attr.split(Separator: '='); | 
|---|
| 2104 | FuncAttrs.addAttribute(A: Var, V: Value); | 
|---|
| 2105 | } | 
|---|
| 2106 |  | 
|---|
| 2107 | TargetInfo::BranchProtectionInfo BPI(LangOpts); | 
|---|
| 2108 | TargetCodeGenInfo::initBranchProtectionFnAttributes(BPI, FuncAttrs); | 
|---|
| 2109 | } | 
|---|
| 2110 |  | 
|---|
| 2111 | /// Merges `target-features` from \TargetOpts and \F, and sets the result in | 
|---|
| 2112 | /// \FuncAttr | 
|---|
| 2113 | /// * features from \F are always kept | 
|---|
| 2114 | /// * a feature from \TargetOpts is kept if itself and its opposite are absent | 
|---|
| 2115 | /// from \F | 
|---|
| 2116 | static void | 
|---|
| 2117 | overrideFunctionFeaturesWithTargetFeatures(llvm::AttrBuilder &FuncAttr, | 
|---|
| 2118 | const llvm::Function &F, | 
|---|
| 2119 | const TargetOptions &TargetOpts) { | 
|---|
| 2120 | auto FFeatures = F.getFnAttribute(Kind: "target-features"); | 
|---|
| 2121 |  | 
|---|
| 2122 | llvm::StringSet<> MergedNames; | 
|---|
| 2123 | SmallVector<StringRef> MergedFeatures; | 
|---|
| 2124 | MergedFeatures.reserve(N: TargetOpts.Features.size()); | 
|---|
| 2125 |  | 
|---|
| 2126 | auto AddUnmergedFeatures = [&](auto &&FeatureRange) { | 
|---|
| 2127 | for (StringRef Feature : FeatureRange) { | 
|---|
| 2128 | if (Feature.empty()) | 
|---|
| 2129 | continue; | 
|---|
| 2130 | assert(Feature[0] == '+' || Feature[0] == '-'); | 
|---|
| 2131 | StringRef Name = Feature.drop_front(N: 1); | 
|---|
| 2132 | bool Merged = !MergedNames.insert(key: Name).second; | 
|---|
| 2133 | if (!Merged) | 
|---|
| 2134 | MergedFeatures.push_back(Elt: Feature); | 
|---|
| 2135 | } | 
|---|
| 2136 | }; | 
|---|
| 2137 |  | 
|---|
| 2138 | if (FFeatures.isValid()) | 
|---|
| 2139 | AddUnmergedFeatures(llvm::split(Str: FFeatures.getValueAsString(), Separator: ',')); | 
|---|
| 2140 | AddUnmergedFeatures(TargetOpts.Features); | 
|---|
| 2141 |  | 
|---|
| 2142 | if (!MergedFeatures.empty()) { | 
|---|
| 2143 | llvm::sort(C&: MergedFeatures); | 
|---|
| 2144 | FuncAttr.addAttribute(A: "target-features", V: llvm::join(R&: MergedFeatures, Separator: ",")); | 
|---|
| 2145 | } | 
|---|
| 2146 | } | 
|---|
| 2147 |  | 
|---|
| 2148 | void CodeGen::mergeDefaultFunctionDefinitionAttributes( | 
|---|
| 2149 | llvm::Function &F, const CodeGenOptions &CodeGenOpts, | 
|---|
| 2150 | const LangOptions &LangOpts, const TargetOptions &TargetOpts, | 
|---|
| 2151 | bool WillInternalize) { | 
|---|
| 2152 |  | 
|---|
| 2153 | llvm::AttrBuilder FuncAttrs(F.getContext()); | 
|---|
| 2154 | // Here we only extract the options that are relevant compared to the version | 
|---|
| 2155 | // from GetCPUAndFeaturesAttributes. | 
|---|
| 2156 | if (!TargetOpts.CPU.empty()) | 
|---|
| 2157 | FuncAttrs.addAttribute(A: "target-cpu", V: TargetOpts.CPU); | 
|---|
| 2158 | if (!TargetOpts.TuneCPU.empty()) | 
|---|
| 2159 | FuncAttrs.addAttribute(A: "tune-cpu", V: TargetOpts.TuneCPU); | 
|---|
| 2160 |  | 
|---|
| 2161 | ::getTrivialDefaultFunctionAttributes(Name: F.getName(), HasOptnone: F.hasOptNone(), | 
|---|
| 2162 | CodeGenOpts, LangOpts, | 
|---|
| 2163 | /*AttrOnCallSite=*/false, FuncAttrs); | 
|---|
| 2164 |  | 
|---|
| 2165 | if (!WillInternalize && F.isInterposable()) { | 
|---|
| 2166 | // Do not promote "dynamic" denormal-fp-math to this translation unit's | 
|---|
| 2167 | // setting for weak functions that won't be internalized. The user has no | 
|---|
| 2168 | // real control for how builtin bitcode is linked, so we shouldn't assume | 
|---|
| 2169 | // later copies will use a consistent mode. | 
|---|
| 2170 | F.addFnAttrs(Attrs: FuncAttrs); | 
|---|
| 2171 | return; | 
|---|
| 2172 | } | 
|---|
| 2173 |  | 
|---|
| 2174 | llvm::AttributeMask AttrsToRemove; | 
|---|
| 2175 |  | 
|---|
| 2176 | llvm::DenormalMode DenormModeToMerge = F.getDenormalModeRaw(); | 
|---|
| 2177 | llvm::DenormalMode DenormModeToMergeF32 = F.getDenormalModeF32Raw(); | 
|---|
| 2178 | llvm::DenormalMode Merged = | 
|---|
| 2179 | CodeGenOpts.FPDenormalMode.mergeCalleeMode(Callee: DenormModeToMerge); | 
|---|
| 2180 | llvm::DenormalMode MergedF32 = CodeGenOpts.FP32DenormalMode; | 
|---|
| 2181 |  | 
|---|
| 2182 | if (DenormModeToMergeF32.isValid()) { | 
|---|
| 2183 | MergedF32 = | 
|---|
| 2184 | CodeGenOpts.FP32DenormalMode.mergeCalleeMode(Callee: DenormModeToMergeF32); | 
|---|
| 2185 | } | 
|---|
| 2186 |  | 
|---|
| 2187 | if (Merged == llvm::DenormalMode::getDefault()) { | 
|---|
| 2188 | AttrsToRemove.addAttribute(A: "denormal-fp-math"); | 
|---|
| 2189 | } else if (Merged != DenormModeToMerge) { | 
|---|
| 2190 | // Overwrite existing attribute | 
|---|
| 2191 | FuncAttrs.addAttribute(A: "denormal-fp-math", | 
|---|
| 2192 | V: CodeGenOpts.FPDenormalMode.str()); | 
|---|
| 2193 | } | 
|---|
| 2194 |  | 
|---|
| 2195 | if (MergedF32 == llvm::DenormalMode::getDefault()) { | 
|---|
| 2196 | AttrsToRemove.addAttribute(A: "denormal-fp-math-f32"); | 
|---|
| 2197 | } else if (MergedF32 != DenormModeToMergeF32) { | 
|---|
| 2198 | // Overwrite existing attribute | 
|---|
| 2199 | FuncAttrs.addAttribute(A: "denormal-fp-math-f32", | 
|---|
| 2200 | V: CodeGenOpts.FP32DenormalMode.str()); | 
|---|
| 2201 | } | 
|---|
| 2202 |  | 
|---|
| 2203 | F.removeFnAttrs(Attrs: AttrsToRemove); | 
|---|
| 2204 | addDenormalModeAttrs(FPDenormalMode: Merged, FP32DenormalMode: MergedF32, FuncAttrs); | 
|---|
| 2205 |  | 
|---|
| 2206 | overrideFunctionFeaturesWithTargetFeatures(FuncAttr&: FuncAttrs, F, TargetOpts); | 
|---|
| 2207 |  | 
|---|
| 2208 | F.addFnAttrs(Attrs: FuncAttrs); | 
|---|
| 2209 | } | 
|---|
| 2210 |  | 
|---|
| 2211 | void CodeGenModule::getTrivialDefaultFunctionAttributes( | 
|---|
| 2212 | StringRef Name, bool HasOptnone, bool AttrOnCallSite, | 
|---|
| 2213 | llvm::AttrBuilder &FuncAttrs) { | 
|---|
| 2214 | ::getTrivialDefaultFunctionAttributes(Name, HasOptnone, CodeGenOpts: getCodeGenOpts(), | 
|---|
| 2215 | LangOpts: getLangOpts(), AttrOnCallSite, | 
|---|
| 2216 | FuncAttrs); | 
|---|
| 2217 | } | 
|---|
| 2218 |  | 
|---|
| 2219 | void CodeGenModule::getDefaultFunctionAttributes(StringRef Name, | 
|---|
| 2220 | bool HasOptnone, | 
|---|
| 2221 | bool AttrOnCallSite, | 
|---|
| 2222 | llvm::AttrBuilder &FuncAttrs) { | 
|---|
| 2223 | getTrivialDefaultFunctionAttributes(Name, HasOptnone, AttrOnCallSite, | 
|---|
| 2224 | FuncAttrs); | 
|---|
| 2225 |  | 
|---|
| 2226 | if (!AttrOnCallSite) | 
|---|
| 2227 | TargetCodeGenInfo::initPointerAuthFnAttributes(Opts: CodeGenOpts.PointerAuth, | 
|---|
| 2228 | FuncAttrs); | 
|---|
| 2229 |  | 
|---|
| 2230 | // If we're just getting the default, get the default values for mergeable | 
|---|
| 2231 | // attributes. | 
|---|
| 2232 | if (!AttrOnCallSite) | 
|---|
| 2233 | addMergableDefaultFunctionAttributes(CodeGenOpts, FuncAttrs); | 
|---|
| 2234 | } | 
|---|
| 2235 |  | 
|---|
| 2236 | void CodeGenModule::addDefaultFunctionDefinitionAttributes( | 
|---|
| 2237 | llvm::AttrBuilder &attrs) { | 
|---|
| 2238 | getDefaultFunctionAttributes(/*function name*/ Name: "", /*optnone*/ HasOptnone: false, | 
|---|
| 2239 | /*for call*/ AttrOnCallSite: false, FuncAttrs&: attrs); | 
|---|
| 2240 | GetCPUAndFeaturesAttributes(GD: GlobalDecl(), AttrBuilder&: attrs); | 
|---|
| 2241 | } | 
|---|
| 2242 |  | 
|---|
| 2243 | static void addNoBuiltinAttributes(llvm::AttrBuilder &FuncAttrs, | 
|---|
| 2244 | const LangOptions &LangOpts, | 
|---|
| 2245 | const NoBuiltinAttr *NBA = nullptr) { | 
|---|
| 2246 | auto AddNoBuiltinAttr = [&FuncAttrs](StringRef BuiltinName) { | 
|---|
| 2247 | SmallString<32> AttributeName; | 
|---|
| 2248 | AttributeName += "no-builtin-"; | 
|---|
| 2249 | AttributeName += BuiltinName; | 
|---|
| 2250 | FuncAttrs.addAttribute(A: AttributeName); | 
|---|
| 2251 | }; | 
|---|
| 2252 |  | 
|---|
| 2253 | // First, handle the language options passed through -fno-builtin. | 
|---|
| 2254 | if (LangOpts.NoBuiltin) { | 
|---|
| 2255 | // -fno-builtin disables them all. | 
|---|
| 2256 | FuncAttrs.addAttribute(A: "no-builtins"); | 
|---|
| 2257 | return; | 
|---|
| 2258 | } | 
|---|
| 2259 |  | 
|---|
| 2260 | // Then, add attributes for builtins specified through -fno-builtin-<name>. | 
|---|
| 2261 | llvm::for_each(Range: LangOpts.NoBuiltinFuncs, F: AddNoBuiltinAttr); | 
|---|
| 2262 |  | 
|---|
| 2263 | // Now, let's check the __attribute__((no_builtin("...")) attribute added to | 
|---|
| 2264 | // the source. | 
|---|
| 2265 | if (!NBA) | 
|---|
| 2266 | return; | 
|---|
| 2267 |  | 
|---|
| 2268 | // If there is a wildcard in the builtin names specified through the | 
|---|
| 2269 | // attribute, disable them all. | 
|---|
| 2270 | if (llvm::is_contained(Range: NBA->builtinNames(), Element: "*")) { | 
|---|
| 2271 | FuncAttrs.addAttribute(A: "no-builtins"); | 
|---|
| 2272 | return; | 
|---|
| 2273 | } | 
|---|
| 2274 |  | 
|---|
| 2275 | // And last, add the rest of the builtin names. | 
|---|
| 2276 | llvm::for_each(Range: NBA->builtinNames(), F: AddNoBuiltinAttr); | 
|---|
| 2277 | } | 
|---|
| 2278 |  | 
|---|
| 2279 | static bool DetermineNoUndef(QualType QTy, CodeGenTypes &Types, | 
|---|
| 2280 | const llvm::DataLayout &DL, const ABIArgInfo &AI, | 
|---|
| 2281 | bool CheckCoerce = true) { | 
|---|
| 2282 | llvm::Type *Ty = Types.ConvertTypeForMem(T: QTy); | 
|---|
| 2283 | if (AI.getKind() == ABIArgInfo::Indirect || | 
|---|
| 2284 | AI.getKind() == ABIArgInfo::IndirectAliased) | 
|---|
| 2285 | return true; | 
|---|
| 2286 | if (AI.getKind() == ABIArgInfo::Extend && !AI.isNoExt()) | 
|---|
| 2287 | return true; | 
|---|
| 2288 | if (!DL.typeSizeEqualsStoreSize(Ty)) | 
|---|
| 2289 | // TODO: This will result in a modest amount of values not marked noundef | 
|---|
| 2290 | // when they could be. We care about values that *invisibly* contain undef | 
|---|
| 2291 | // bits from the perspective of LLVM IR. | 
|---|
| 2292 | return false; | 
|---|
| 2293 | if (CheckCoerce && AI.canHaveCoerceToType()) { | 
|---|
| 2294 | llvm::Type *CoerceTy = AI.getCoerceToType(); | 
|---|
| 2295 | if (llvm::TypeSize::isKnownGT(LHS: DL.getTypeSizeInBits(Ty: CoerceTy), | 
|---|
| 2296 | RHS: DL.getTypeSizeInBits(Ty))) | 
|---|
| 2297 | // If we're coercing to a type with a greater size than the canonical one, | 
|---|
| 2298 | // we're introducing new undef bits. | 
|---|
| 2299 | // Coercing to a type of smaller or equal size is ok, as we know that | 
|---|
| 2300 | // there's no internal padding (typeSizeEqualsStoreSize). | 
|---|
| 2301 | return false; | 
|---|
| 2302 | } | 
|---|
| 2303 | if (QTy->isBitIntType()) | 
|---|
| 2304 | return true; | 
|---|
| 2305 | if (QTy->isReferenceType()) | 
|---|
| 2306 | return true; | 
|---|
| 2307 | if (QTy->isNullPtrType()) | 
|---|
| 2308 | return false; | 
|---|
| 2309 | if (QTy->isMemberPointerType()) | 
|---|
| 2310 | // TODO: Some member pointers are `noundef`, but it depends on the ABI. For | 
|---|
| 2311 | // now, never mark them. | 
|---|
| 2312 | return false; | 
|---|
| 2313 | if (QTy->isScalarType()) { | 
|---|
| 2314 | if (const ComplexType *Complex = dyn_cast<ComplexType>(Val&: QTy)) | 
|---|
| 2315 | return DetermineNoUndef(QTy: Complex->getElementType(), Types, DL, AI, CheckCoerce: false); | 
|---|
| 2316 | return true; | 
|---|
| 2317 | } | 
|---|
| 2318 | if (const VectorType *Vector = dyn_cast<VectorType>(Val&: QTy)) | 
|---|
| 2319 | return DetermineNoUndef(QTy: Vector->getElementType(), Types, DL, AI, CheckCoerce: false); | 
|---|
| 2320 | if (const MatrixType *Matrix = dyn_cast<MatrixType>(Val&: QTy)) | 
|---|
| 2321 | return DetermineNoUndef(QTy: Matrix->getElementType(), Types, DL, AI, CheckCoerce: false); | 
|---|
| 2322 | if (const ArrayType *Array = dyn_cast<ArrayType>(Val&: QTy)) | 
|---|
| 2323 | return DetermineNoUndef(QTy: Array->getElementType(), Types, DL, AI, CheckCoerce: false); | 
|---|
| 2324 |  | 
|---|
| 2325 | // TODO: Some structs may be `noundef`, in specific situations. | 
|---|
| 2326 | return false; | 
|---|
| 2327 | } | 
|---|
| 2328 |  | 
|---|
| 2329 | /// Check if the argument of a function has maybe_undef attribute. | 
|---|
| 2330 | static bool IsArgumentMaybeUndef(const Decl *TargetDecl, | 
|---|
| 2331 | unsigned NumRequiredArgs, unsigned ArgNo) { | 
|---|
| 2332 | const auto *FD = dyn_cast_or_null<FunctionDecl>(Val: TargetDecl); | 
|---|
| 2333 | if (!FD) | 
|---|
| 2334 | return false; | 
|---|
| 2335 |  | 
|---|
| 2336 | // Assume variadic arguments do not have maybe_undef attribute. | 
|---|
| 2337 | if (ArgNo >= NumRequiredArgs) | 
|---|
| 2338 | return false; | 
|---|
| 2339 |  | 
|---|
| 2340 | // Check if argument has maybe_undef attribute. | 
|---|
| 2341 | if (ArgNo < FD->getNumParams()) { | 
|---|
| 2342 | const ParmVarDecl *Param = FD->getParamDecl(i: ArgNo); | 
|---|
| 2343 | if (Param && Param->hasAttr<MaybeUndefAttr>()) | 
|---|
| 2344 | return true; | 
|---|
| 2345 | } | 
|---|
| 2346 |  | 
|---|
| 2347 | return false; | 
|---|
| 2348 | } | 
|---|
| 2349 |  | 
|---|
| 2350 | /// Test if it's legal to apply nofpclass for the given parameter type and it's | 
|---|
| 2351 | /// lowered IR type. | 
|---|
| 2352 | static bool canApplyNoFPClass(const ABIArgInfo &AI, QualType ParamType, | 
|---|
| 2353 | bool IsReturn) { | 
|---|
| 2354 | // Should only apply to FP types in the source, not ABI promoted. | 
|---|
| 2355 | if (!ParamType->hasFloatingRepresentation()) | 
|---|
| 2356 | return false; | 
|---|
| 2357 |  | 
|---|
| 2358 | // The promoted-to IR type also needs to support nofpclass. | 
|---|
| 2359 | llvm::Type *IRTy = AI.getCoerceToType(); | 
|---|
| 2360 | if (llvm::AttributeFuncs::isNoFPClassCompatibleType(Ty: IRTy)) | 
|---|
| 2361 | return true; | 
|---|
| 2362 |  | 
|---|
| 2363 | if (llvm::StructType *ST = dyn_cast<llvm::StructType>(Val: IRTy)) { | 
|---|
| 2364 | return !IsReturn && AI.getCanBeFlattened() && | 
|---|
| 2365 | llvm::all_of(Range: ST->elements(), | 
|---|
| 2366 | P: llvm::AttributeFuncs::isNoFPClassCompatibleType); | 
|---|
| 2367 | } | 
|---|
| 2368 |  | 
|---|
| 2369 | return false; | 
|---|
| 2370 | } | 
|---|
| 2371 |  | 
|---|
| 2372 | /// Return the nofpclass mask that can be applied to floating-point parameters. | 
|---|
| 2373 | static llvm::FPClassTest getNoFPClassTestMask(const LangOptions &LangOpts) { | 
|---|
| 2374 | llvm::FPClassTest Mask = llvm::fcNone; | 
|---|
| 2375 | if (LangOpts.NoHonorInfs) | 
|---|
| 2376 | Mask |= llvm::fcInf; | 
|---|
| 2377 | if (LangOpts.NoHonorNaNs) | 
|---|
| 2378 | Mask |= llvm::fcNan; | 
|---|
| 2379 | return Mask; | 
|---|
| 2380 | } | 
|---|
| 2381 |  | 
|---|
| 2382 | void CodeGenModule::AdjustMemoryAttribute(StringRef Name, | 
|---|
| 2383 | CGCalleeInfo CalleeInfo, | 
|---|
| 2384 | llvm::AttributeList &Attrs) { | 
|---|
| 2385 | if (Attrs.getMemoryEffects().getModRef() == llvm::ModRefInfo::NoModRef) { | 
|---|
| 2386 | Attrs = Attrs.removeFnAttribute(C&: getLLVMContext(), Kind: llvm::Attribute::Memory); | 
|---|
| 2387 | llvm::Attribute MemoryAttr = llvm::Attribute::getWithMemoryEffects( | 
|---|
| 2388 | Context&: getLLVMContext(), ME: llvm::MemoryEffects::writeOnly()); | 
|---|
| 2389 | Attrs = Attrs.addFnAttribute(C&: getLLVMContext(), Attr: MemoryAttr); | 
|---|
| 2390 | } | 
|---|
| 2391 | } | 
|---|
| 2392 |  | 
|---|
| 2393 | /// Construct the IR attribute list of a function or call. | 
|---|
| 2394 | /// | 
|---|
| 2395 | /// When adding an attribute, please consider where it should be handled: | 
|---|
| 2396 | /// | 
|---|
| 2397 | ///   - getDefaultFunctionAttributes is for attributes that are essentially | 
|---|
| 2398 | ///     part of the global target configuration (but perhaps can be | 
|---|
| 2399 | ///     overridden on a per-function basis).  Adding attributes there | 
|---|
| 2400 | ///     will cause them to also be set in frontends that build on Clang's | 
|---|
| 2401 | ///     target-configuration logic, as well as for code defined in library | 
|---|
| 2402 | ///     modules such as CUDA's libdevice. | 
|---|
| 2403 | /// | 
|---|
| 2404 | ///   - ConstructAttributeList builds on top of getDefaultFunctionAttributes | 
|---|
| 2405 | ///     and adds declaration-specific, convention-specific, and | 
|---|
| 2406 | ///     frontend-specific logic.  The last is of particular importance: | 
|---|
| 2407 | ///     attributes that restrict how the frontend generates code must be | 
|---|
| 2408 | ///     added here rather than getDefaultFunctionAttributes. | 
|---|
| 2409 | /// | 
|---|
| 2410 | void CodeGenModule::ConstructAttributeList(StringRef Name, | 
|---|
| 2411 | const CGFunctionInfo &FI, | 
|---|
| 2412 | CGCalleeInfo CalleeInfo, | 
|---|
| 2413 | llvm::AttributeList &AttrList, | 
|---|
| 2414 | unsigned &CallingConv, | 
|---|
| 2415 | bool AttrOnCallSite, bool IsThunk) { | 
|---|
| 2416 | llvm::AttrBuilder FuncAttrs(getLLVMContext()); | 
|---|
| 2417 | llvm::AttrBuilder RetAttrs(getLLVMContext()); | 
|---|
| 2418 |  | 
|---|
| 2419 | // Collect function IR attributes from the CC lowering. | 
|---|
| 2420 | // We'll collect the parameter and result attributes later. | 
|---|
| 2421 | CallingConv = FI.getEffectiveCallingConvention(); | 
|---|
| 2422 | if (FI.isNoReturn()) | 
|---|
| 2423 | FuncAttrs.addAttribute(Val: llvm::Attribute::NoReturn); | 
|---|
| 2424 | if (FI.isCmseNSCall()) | 
|---|
| 2425 | FuncAttrs.addAttribute(A: "cmse_nonsecure_call"); | 
|---|
| 2426 |  | 
|---|
| 2427 | // Collect function IR attributes from the callee prototype if we have one. | 
|---|
| 2428 | AddAttributesFromFunctionProtoType(Ctx&: getContext(), FuncAttrs, | 
|---|
| 2429 | FPT: CalleeInfo.getCalleeFunctionProtoType()); | 
|---|
| 2430 | const Decl *TargetDecl = CalleeInfo.getCalleeDecl().getDecl(); | 
|---|
| 2431 |  | 
|---|
| 2432 | // Attach assumption attributes to the declaration. If this is a call | 
|---|
| 2433 | // site, attach assumptions from the caller to the call as well. | 
|---|
| 2434 | AddAttributesFromOMPAssumes(FuncAttrs, Callee: TargetDecl); | 
|---|
| 2435 |  | 
|---|
| 2436 | bool HasOptnone = false; | 
|---|
| 2437 | // The NoBuiltinAttr attached to the target FunctionDecl. | 
|---|
| 2438 | const NoBuiltinAttr *NBA = nullptr; | 
|---|
| 2439 |  | 
|---|
| 2440 | // Some ABIs may result in additional accesses to arguments that may | 
|---|
| 2441 | // otherwise not be present. | 
|---|
| 2442 | auto AddPotentialArgAccess = [&]() { | 
|---|
| 2443 | llvm::Attribute A = FuncAttrs.getAttribute(Kind: llvm::Attribute::Memory); | 
|---|
| 2444 | if (A.isValid()) | 
|---|
| 2445 | FuncAttrs.addMemoryAttr(ME: A.getMemoryEffects() | | 
|---|
| 2446 | llvm::MemoryEffects::argMemOnly()); | 
|---|
| 2447 | }; | 
|---|
| 2448 |  | 
|---|
| 2449 | // Collect function IR attributes based on declaration-specific | 
|---|
| 2450 | // information. | 
|---|
| 2451 | // FIXME: handle sseregparm someday... | 
|---|
| 2452 | if (TargetDecl) { | 
|---|
| 2453 | if (TargetDecl->hasAttr<ReturnsTwiceAttr>()) | 
|---|
| 2454 | FuncAttrs.addAttribute(Val: llvm::Attribute::ReturnsTwice); | 
|---|
| 2455 | if (TargetDecl->hasAttr<NoThrowAttr>()) | 
|---|
| 2456 | FuncAttrs.addAttribute(Val: llvm::Attribute::NoUnwind); | 
|---|
| 2457 | if (TargetDecl->hasAttr<NoReturnAttr>()) | 
|---|
| 2458 | FuncAttrs.addAttribute(Val: llvm::Attribute::NoReturn); | 
|---|
| 2459 | if (TargetDecl->hasAttr<ColdAttr>()) | 
|---|
| 2460 | FuncAttrs.addAttribute(Val: llvm::Attribute::Cold); | 
|---|
| 2461 | if (TargetDecl->hasAttr<HotAttr>()) | 
|---|
| 2462 | FuncAttrs.addAttribute(Val: llvm::Attribute::Hot); | 
|---|
| 2463 | if (TargetDecl->hasAttr<NoDuplicateAttr>()) | 
|---|
| 2464 | FuncAttrs.addAttribute(Val: llvm::Attribute::NoDuplicate); | 
|---|
| 2465 | if (TargetDecl->hasAttr<ConvergentAttr>()) | 
|---|
| 2466 | FuncAttrs.addAttribute(Val: llvm::Attribute::Convergent); | 
|---|
| 2467 |  | 
|---|
| 2468 | if (const FunctionDecl *Fn = dyn_cast<FunctionDecl>(Val: TargetDecl)) { | 
|---|
| 2469 | AddAttributesFromFunctionProtoType( | 
|---|
| 2470 | Ctx&: getContext(), FuncAttrs, FPT: Fn->getType()->getAs<FunctionProtoType>()); | 
|---|
| 2471 | if (AttrOnCallSite && Fn->isReplaceableGlobalAllocationFunction()) { | 
|---|
| 2472 | // A sane operator new returns a non-aliasing pointer. | 
|---|
| 2473 | auto Kind = Fn->getDeclName().getCXXOverloadedOperator(); | 
|---|
| 2474 | if (getCodeGenOpts().AssumeSaneOperatorNew && | 
|---|
| 2475 | (Kind == OO_New || Kind == OO_Array_New)) | 
|---|
| 2476 | RetAttrs.addAttribute(Val: llvm::Attribute::NoAlias); | 
|---|
| 2477 | } | 
|---|
| 2478 | const CXXMethodDecl *MD = dyn_cast<CXXMethodDecl>(Val: Fn); | 
|---|
| 2479 | const bool IsVirtualCall = MD && MD->isVirtual(); | 
|---|
| 2480 | // Don't use [[noreturn]], _Noreturn or [[no_builtin]] for a call to a | 
|---|
| 2481 | // virtual function. These attributes are not inherited by overriders. | 
|---|
| 2482 | if (!(AttrOnCallSite && IsVirtualCall)) { | 
|---|
| 2483 | if (Fn->isNoReturn()) | 
|---|
| 2484 | FuncAttrs.addAttribute(Val: llvm::Attribute::NoReturn); | 
|---|
| 2485 | NBA = Fn->getAttr<NoBuiltinAttr>(); | 
|---|
| 2486 | } | 
|---|
| 2487 | } | 
|---|
| 2488 |  | 
|---|
| 2489 | if (isa<FunctionDecl>(Val: TargetDecl) || isa<VarDecl>(Val: TargetDecl)) { | 
|---|
| 2490 | // Only place nomerge attribute on call sites, never functions. This | 
|---|
| 2491 | // allows it to work on indirect virtual function calls. | 
|---|
| 2492 | if (AttrOnCallSite && TargetDecl->hasAttr<NoMergeAttr>()) | 
|---|
| 2493 | FuncAttrs.addAttribute(Val: llvm::Attribute::NoMerge); | 
|---|
| 2494 | } | 
|---|
| 2495 |  | 
|---|
| 2496 | // 'const', 'pure' and 'noalias' attributed functions are also nounwind. | 
|---|
| 2497 | if (TargetDecl->hasAttr<ConstAttr>()) { | 
|---|
| 2498 | FuncAttrs.addMemoryAttr(ME: llvm::MemoryEffects::none()); | 
|---|
| 2499 | FuncAttrs.addAttribute(Val: llvm::Attribute::NoUnwind); | 
|---|
| 2500 | // gcc specifies that 'const' functions have greater restrictions than | 
|---|
| 2501 | // 'pure' functions, so they also cannot have infinite loops. | 
|---|
| 2502 | FuncAttrs.addAttribute(Val: llvm::Attribute::WillReturn); | 
|---|
| 2503 | } else if (TargetDecl->hasAttr<PureAttr>()) { | 
|---|
| 2504 | FuncAttrs.addMemoryAttr(ME: llvm::MemoryEffects::readOnly()); | 
|---|
| 2505 | FuncAttrs.addAttribute(Val: llvm::Attribute::NoUnwind); | 
|---|
| 2506 | // gcc specifies that 'pure' functions cannot have infinite loops. | 
|---|
| 2507 | FuncAttrs.addAttribute(Val: llvm::Attribute::WillReturn); | 
|---|
| 2508 | } else if (TargetDecl->hasAttr<NoAliasAttr>()) { | 
|---|
| 2509 | FuncAttrs.addMemoryAttr(ME: llvm::MemoryEffects::inaccessibleOrArgMemOnly()); | 
|---|
| 2510 | FuncAttrs.addAttribute(Val: llvm::Attribute::NoUnwind); | 
|---|
| 2511 | } | 
|---|
| 2512 | if (const auto *RA = TargetDecl->getAttr<RestrictAttr>(); | 
|---|
| 2513 | RA && RA->getDeallocator() == nullptr) | 
|---|
| 2514 | RetAttrs.addAttribute(Val: llvm::Attribute::NoAlias); | 
|---|
| 2515 | if (TargetDecl->hasAttr<ReturnsNonNullAttr>() && | 
|---|
| 2516 | !CodeGenOpts.NullPointerIsValid) | 
|---|
| 2517 | RetAttrs.addAttribute(Val: llvm::Attribute::NonNull); | 
|---|
| 2518 | if (TargetDecl->hasAttr<AnyX86NoCallerSavedRegistersAttr>()) | 
|---|
| 2519 | FuncAttrs.addAttribute(A: "no_caller_saved_registers"); | 
|---|
| 2520 | if (TargetDecl->hasAttr<AnyX86NoCfCheckAttr>()) | 
|---|
| 2521 | FuncAttrs.addAttribute(Val: llvm::Attribute::NoCfCheck); | 
|---|
| 2522 | if (TargetDecl->hasAttr<LeafAttr>()) | 
|---|
| 2523 | FuncAttrs.addAttribute(Val: llvm::Attribute::NoCallback); | 
|---|
| 2524 | if (TargetDecl->hasAttr<BPFFastCallAttr>()) | 
|---|
| 2525 | FuncAttrs.addAttribute(A: "bpf_fastcall"); | 
|---|
| 2526 |  | 
|---|
| 2527 | HasOptnone = TargetDecl->hasAttr<OptimizeNoneAttr>(); | 
|---|
| 2528 | if (auto *AllocSize = TargetDecl->getAttr<AllocSizeAttr>()) { | 
|---|
| 2529 | std::optional<unsigned> NumElemsParam; | 
|---|
| 2530 | if (AllocSize->getNumElemsParam().isValid()) | 
|---|
| 2531 | NumElemsParam = AllocSize->getNumElemsParam().getLLVMIndex(); | 
|---|
| 2532 | FuncAttrs.addAllocSizeAttr(ElemSizeArg: AllocSize->getElemSizeParam().getLLVMIndex(), | 
|---|
| 2533 | NumElemsArg: NumElemsParam); | 
|---|
| 2534 | } | 
|---|
| 2535 |  | 
|---|
| 2536 | if (DeviceKernelAttr::isOpenCLSpelling( | 
|---|
| 2537 | A: TargetDecl->getAttr<DeviceKernelAttr>()) && | 
|---|
| 2538 | CallingConv != CallingConv::CC_C && | 
|---|
| 2539 | CallingConv != CallingConv::CC_SpirFunction) { | 
|---|
| 2540 | // Check CallingConv to avoid adding uniform-work-group-size attribute to | 
|---|
| 2541 | // OpenCL Kernel Stub | 
|---|
| 2542 | if (getLangOpts().OpenCLVersion <= 120) { | 
|---|
| 2543 | // OpenCL v1.2 Work groups are always uniform | 
|---|
| 2544 | FuncAttrs.addAttribute(A: "uniform-work-group-size", V: "true"); | 
|---|
| 2545 | } else { | 
|---|
| 2546 | // OpenCL v2.0 Work groups may or may not be uniform. | 
|---|
| 2547 | // '-cl-uniform-work-group-size' compile option gets a hint | 
|---|
| 2548 | // to the compiler that the global work-size be a multiple of | 
|---|
| 2549 | // the work-group size specified to clEnqueueNDRangeKernel | 
|---|
| 2550 | // (i.e. work groups are uniform). | 
|---|
| 2551 | FuncAttrs.addAttribute( | 
|---|
| 2552 | A: "uniform-work-group-size", | 
|---|
| 2553 | V: llvm::toStringRef(B: getLangOpts().OffloadUniformBlock)); | 
|---|
| 2554 | } | 
|---|
| 2555 | } | 
|---|
| 2556 |  | 
|---|
| 2557 | if (TargetDecl->hasAttr<CUDAGlobalAttr>() && | 
|---|
| 2558 | getLangOpts().OffloadUniformBlock) | 
|---|
| 2559 | FuncAttrs.addAttribute(A: "uniform-work-group-size", V: "true"); | 
|---|
| 2560 |  | 
|---|
| 2561 | if (TargetDecl->hasAttr<ArmLocallyStreamingAttr>()) | 
|---|
| 2562 | FuncAttrs.addAttribute(A: "aarch64_pstate_sm_body"); | 
|---|
| 2563 | } | 
|---|
| 2564 |  | 
|---|
| 2565 | // Attach "no-builtins" attributes to: | 
|---|
| 2566 | // * call sites: both `nobuiltin` and "no-builtins" or "no-builtin-<name>". | 
|---|
| 2567 | // * definitions: "no-builtins" or "no-builtin-<name>" only. | 
|---|
| 2568 | // The attributes can come from: | 
|---|
| 2569 | // * LangOpts: -ffreestanding, -fno-builtin, -fno-builtin-<name> | 
|---|
| 2570 | // * FunctionDecl attributes: __attribute__((no_builtin(...))) | 
|---|
| 2571 | addNoBuiltinAttributes(FuncAttrs, LangOpts: getLangOpts(), NBA); | 
|---|
| 2572 |  | 
|---|
| 2573 | // Collect function IR attributes based on global settings. | 
|---|
| 2574 | getDefaultFunctionAttributes(Name, HasOptnone, AttrOnCallSite, FuncAttrs); | 
|---|
| 2575 |  | 
|---|
| 2576 | // Override some default IR attributes based on declaration-specific | 
|---|
| 2577 | // information. | 
|---|
| 2578 | if (TargetDecl) { | 
|---|
| 2579 | if (TargetDecl->hasAttr<NoSpeculativeLoadHardeningAttr>()) | 
|---|
| 2580 | FuncAttrs.removeAttribute(Val: llvm::Attribute::SpeculativeLoadHardening); | 
|---|
| 2581 | if (TargetDecl->hasAttr<SpeculativeLoadHardeningAttr>()) | 
|---|
| 2582 | FuncAttrs.addAttribute(Val: llvm::Attribute::SpeculativeLoadHardening); | 
|---|
| 2583 | if (TargetDecl->hasAttr<NoSplitStackAttr>()) | 
|---|
| 2584 | FuncAttrs.removeAttribute(A: "split-stack"); | 
|---|
| 2585 | if (TargetDecl->hasAttr<ZeroCallUsedRegsAttr>()) { | 
|---|
| 2586 | // A function "__attribute__((...))" overrides the command-line flag. | 
|---|
| 2587 | auto Kind = | 
|---|
| 2588 | TargetDecl->getAttr<ZeroCallUsedRegsAttr>()->getZeroCallUsedRegs(); | 
|---|
| 2589 | FuncAttrs.removeAttribute(A: "zero-call-used-regs"); | 
|---|
| 2590 | FuncAttrs.addAttribute( | 
|---|
| 2591 | A: "zero-call-used-regs", | 
|---|
| 2592 | V: ZeroCallUsedRegsAttr::ConvertZeroCallUsedRegsKindToStr(Val: Kind)); | 
|---|
| 2593 | } | 
|---|
| 2594 |  | 
|---|
| 2595 | // Add NonLazyBind attribute to function declarations when -fno-plt | 
|---|
| 2596 | // is used. | 
|---|
| 2597 | // FIXME: what if we just haven't processed the function definition | 
|---|
| 2598 | // yet, or if it's an external definition like C99 inline? | 
|---|
| 2599 | if (CodeGenOpts.NoPLT) { | 
|---|
| 2600 | if (auto *Fn = dyn_cast<FunctionDecl>(Val: TargetDecl)) { | 
|---|
| 2601 | if (!Fn->isDefined() && !AttrOnCallSite) { | 
|---|
| 2602 | FuncAttrs.addAttribute(Val: llvm::Attribute::NonLazyBind); | 
|---|
| 2603 | } | 
|---|
| 2604 | } | 
|---|
| 2605 | } | 
|---|
| 2606 | // Remove 'convergent' if requested. | 
|---|
| 2607 | if (TargetDecl->hasAttr<NoConvergentAttr>()) | 
|---|
| 2608 | FuncAttrs.removeAttribute(Val: llvm::Attribute::Convergent); | 
|---|
| 2609 | } | 
|---|
| 2610 |  | 
|---|
| 2611 | // Add "sample-profile-suffix-elision-policy" attribute for internal linkage | 
|---|
| 2612 | // functions with -funique-internal-linkage-names. | 
|---|
| 2613 | if (TargetDecl && CodeGenOpts.UniqueInternalLinkageNames) { | 
|---|
| 2614 | if (const auto *FD = dyn_cast_or_null<FunctionDecl>(Val: TargetDecl)) { | 
|---|
| 2615 | if (!FD->isExternallyVisible()) | 
|---|
| 2616 | FuncAttrs.addAttribute(A: "sample-profile-suffix-elision-policy", | 
|---|
| 2617 | V: "selected"); | 
|---|
| 2618 | } | 
|---|
| 2619 | } | 
|---|
| 2620 |  | 
|---|
| 2621 | // Collect non-call-site function IR attributes from declaration-specific | 
|---|
| 2622 | // information. | 
|---|
| 2623 | if (!AttrOnCallSite) { | 
|---|
| 2624 | if (TargetDecl && TargetDecl->hasAttr<CmseNSEntryAttr>()) | 
|---|
| 2625 | FuncAttrs.addAttribute(A: "cmse_nonsecure_entry"); | 
|---|
| 2626 |  | 
|---|
| 2627 | // Whether tail calls are enabled. | 
|---|
| 2628 | auto shouldDisableTailCalls = [&] { | 
|---|
| 2629 | // Should this be honored in getDefaultFunctionAttributes? | 
|---|
| 2630 | if (CodeGenOpts.DisableTailCalls) | 
|---|
| 2631 | return true; | 
|---|
| 2632 |  | 
|---|
| 2633 | if (!TargetDecl) | 
|---|
| 2634 | return false; | 
|---|
| 2635 |  | 
|---|
| 2636 | if (TargetDecl->hasAttr<DisableTailCallsAttr>() || | 
|---|
| 2637 | TargetDecl->hasAttr<AnyX86InterruptAttr>()) | 
|---|
| 2638 | return true; | 
|---|
| 2639 |  | 
|---|
| 2640 | if (CodeGenOpts.NoEscapingBlockTailCalls) { | 
|---|
| 2641 | if (const auto *BD = dyn_cast<BlockDecl>(Val: TargetDecl)) | 
|---|
| 2642 | if (!BD->doesNotEscape()) | 
|---|
| 2643 | return true; | 
|---|
| 2644 | } | 
|---|
| 2645 |  | 
|---|
| 2646 | return false; | 
|---|
| 2647 | }; | 
|---|
| 2648 | if (shouldDisableTailCalls()) | 
|---|
| 2649 | FuncAttrs.addAttribute(A: "disable-tail-calls", V: "true"); | 
|---|
| 2650 |  | 
|---|
| 2651 | // These functions require the returns_twice attribute for correct codegen, | 
|---|
| 2652 | // but the attribute may not be added if -fno-builtin is specified. We | 
|---|
| 2653 | // explicitly add that attribute here. | 
|---|
| 2654 | static const llvm::StringSet<> ReturnsTwiceFn{ | 
|---|
| 2655 | "_setjmpex", "setjmp", "_setjmp", "vfork", | 
|---|
| 2656 | "sigsetjmp", "__sigsetjmp", "savectx", "getcontext"}; | 
|---|
| 2657 | if (ReturnsTwiceFn.contains(key: Name)) | 
|---|
| 2658 | FuncAttrs.addAttribute(Val: llvm::Attribute::ReturnsTwice); | 
|---|
| 2659 |  | 
|---|
| 2660 | // CPU/feature overrides.  addDefaultFunctionDefinitionAttributes | 
|---|
| 2661 | // handles these separately to set them based on the global defaults. | 
|---|
| 2662 | GetCPUAndFeaturesAttributes(GD: CalleeInfo.getCalleeDecl(), AttrBuilder&: FuncAttrs); | 
|---|
| 2663 |  | 
|---|
| 2664 | // Windows hotpatching support | 
|---|
| 2665 | if (!MSHotPatchFunctions.empty()) { | 
|---|
| 2666 | bool IsHotPatched = llvm::binary_search(Range&: MSHotPatchFunctions, Value&: Name); | 
|---|
| 2667 | if (IsHotPatched) | 
|---|
| 2668 | FuncAttrs.addAttribute(A: "marked_for_windows_hot_patching"); | 
|---|
| 2669 | } | 
|---|
| 2670 | } | 
|---|
| 2671 |  | 
|---|
| 2672 | // Mark functions that are replaceable by the loader. | 
|---|
| 2673 | if (CodeGenOpts.isLoaderReplaceableFunctionName(FuncName: Name)) | 
|---|
| 2674 | FuncAttrs.addAttribute(A: "loader-replaceable"); | 
|---|
| 2675 |  | 
|---|
| 2676 | // Collect attributes from arguments and return values. | 
|---|
| 2677 | ClangToLLVMArgMapping IRFunctionArgs(getContext(), FI); | 
|---|
| 2678 |  | 
|---|
| 2679 | QualType RetTy = FI.getReturnType(); | 
|---|
| 2680 | const ABIArgInfo &RetAI = FI.getReturnInfo(); | 
|---|
| 2681 | const llvm::DataLayout &DL = getDataLayout(); | 
|---|
| 2682 |  | 
|---|
| 2683 | // Determine if the return type could be partially undef | 
|---|
| 2684 | if (CodeGenOpts.EnableNoundefAttrs && | 
|---|
| 2685 | HasStrictReturn(Module: *this, RetTy, TargetDecl)) { | 
|---|
| 2686 | if (!RetTy->isVoidType() && RetAI.getKind() != ABIArgInfo::Indirect && | 
|---|
| 2687 | DetermineNoUndef(QTy: RetTy, Types&: getTypes(), DL, AI: RetAI)) | 
|---|
| 2688 | RetAttrs.addAttribute(Val: llvm::Attribute::NoUndef); | 
|---|
| 2689 | } | 
|---|
| 2690 |  | 
|---|
| 2691 | switch (RetAI.getKind()) { | 
|---|
| 2692 | case ABIArgInfo::Extend: | 
|---|
| 2693 | if (RetAI.isSignExt()) | 
|---|
| 2694 | RetAttrs.addAttribute(Val: llvm::Attribute::SExt); | 
|---|
| 2695 | else if (RetAI.isZeroExt()) | 
|---|
| 2696 | RetAttrs.addAttribute(Val: llvm::Attribute::ZExt); | 
|---|
| 2697 | else | 
|---|
| 2698 | RetAttrs.addAttribute(Val: llvm::Attribute::NoExt); | 
|---|
| 2699 | [[fallthrough]]; | 
|---|
| 2700 | case ABIArgInfo::Direct: | 
|---|
| 2701 | if (RetAI.getInReg()) | 
|---|
| 2702 | RetAttrs.addAttribute(Val: llvm::Attribute::InReg); | 
|---|
| 2703 |  | 
|---|
| 2704 | if (canApplyNoFPClass(AI: RetAI, ParamType: RetTy, IsReturn: true)) | 
|---|
| 2705 | RetAttrs.addNoFPClassAttr(NoFPClassMask: getNoFPClassTestMask(LangOpts: getLangOpts())); | 
|---|
| 2706 |  | 
|---|
| 2707 | break; | 
|---|
| 2708 | case ABIArgInfo::Ignore: | 
|---|
| 2709 | break; | 
|---|
| 2710 |  | 
|---|
| 2711 | case ABIArgInfo::InAlloca: | 
|---|
| 2712 | case ABIArgInfo::Indirect: { | 
|---|
| 2713 | // inalloca and sret disable readnone and readonly | 
|---|
| 2714 | AddPotentialArgAccess(); | 
|---|
| 2715 | break; | 
|---|
| 2716 | } | 
|---|
| 2717 |  | 
|---|
| 2718 | case ABIArgInfo::CoerceAndExpand: | 
|---|
| 2719 | break; | 
|---|
| 2720 |  | 
|---|
| 2721 | case ABIArgInfo::Expand: | 
|---|
| 2722 | case ABIArgInfo::IndirectAliased: | 
|---|
| 2723 | llvm_unreachable( "Invalid ABI kind for return argument"); | 
|---|
| 2724 | } | 
|---|
| 2725 |  | 
|---|
| 2726 | if (!IsThunk) { | 
|---|
| 2727 | // FIXME: fix this properly, https://reviews.llvm.org/D100388 | 
|---|
| 2728 | if (const auto *RefTy = RetTy->getAs<ReferenceType>()) { | 
|---|
| 2729 | QualType PTy = RefTy->getPointeeType(); | 
|---|
| 2730 | if (!PTy->isIncompleteType() && PTy->isConstantSizeType()) | 
|---|
| 2731 | RetAttrs.addDereferenceableAttr( | 
|---|
| 2732 | Bytes: getMinimumObjectSize(Ty: PTy).getQuantity()); | 
|---|
| 2733 | if (getTypes().getTargetAddressSpace(T: PTy) == 0 && | 
|---|
| 2734 | !CodeGenOpts.NullPointerIsValid) | 
|---|
| 2735 | RetAttrs.addAttribute(Val: llvm::Attribute::NonNull); | 
|---|
| 2736 | if (PTy->isObjectType()) { | 
|---|
| 2737 | llvm::Align Alignment = | 
|---|
| 2738 | getNaturalPointeeTypeAlignment(T: RetTy).getAsAlign(); | 
|---|
| 2739 | RetAttrs.addAlignmentAttr(Align: Alignment); | 
|---|
| 2740 | } | 
|---|
| 2741 | } | 
|---|
| 2742 | } | 
|---|
| 2743 |  | 
|---|
| 2744 | bool hasUsedSRet = false; | 
|---|
| 2745 | SmallVector<llvm::AttributeSet, 4> ArgAttrs(IRFunctionArgs.totalIRArgs()); | 
|---|
| 2746 |  | 
|---|
| 2747 | // Attach attributes to sret. | 
|---|
| 2748 | if (IRFunctionArgs.hasSRetArg()) { | 
|---|
| 2749 | llvm::AttrBuilder SRETAttrs(getLLVMContext()); | 
|---|
| 2750 | SRETAttrs.addStructRetAttr(Ty: getTypes().ConvertTypeForMem(T: RetTy)); | 
|---|
| 2751 | SRETAttrs.addAttribute(Val: llvm::Attribute::Writable); | 
|---|
| 2752 | SRETAttrs.addAttribute(Val: llvm::Attribute::DeadOnUnwind); | 
|---|
| 2753 | hasUsedSRet = true; | 
|---|
| 2754 | if (RetAI.getInReg()) | 
|---|
| 2755 | SRETAttrs.addAttribute(Val: llvm::Attribute::InReg); | 
|---|
| 2756 | SRETAttrs.addAlignmentAttr(Align: RetAI.getIndirectAlign().getQuantity()); | 
|---|
| 2757 | ArgAttrs[IRFunctionArgs.getSRetArgNo()] = | 
|---|
| 2758 | llvm::AttributeSet::get(C&: getLLVMContext(), B: SRETAttrs); | 
|---|
| 2759 | } | 
|---|
| 2760 |  | 
|---|
| 2761 | // Attach attributes to inalloca argument. | 
|---|
| 2762 | if (IRFunctionArgs.hasInallocaArg()) { | 
|---|
| 2763 | llvm::AttrBuilder Attrs(getLLVMContext()); | 
|---|
| 2764 | Attrs.addInAllocaAttr(Ty: FI.getArgStruct()); | 
|---|
| 2765 | ArgAttrs[IRFunctionArgs.getInallocaArgNo()] = | 
|---|
| 2766 | llvm::AttributeSet::get(C&: getLLVMContext(), B: Attrs); | 
|---|
| 2767 | } | 
|---|
| 2768 |  | 
|---|
| 2769 | // Apply `nonnull`, `dereferenceable(N)` and `align N` to the `this` argument, | 
|---|
| 2770 | // unless this is a thunk function. | 
|---|
| 2771 | // FIXME: fix this properly, https://reviews.llvm.org/D100388 | 
|---|
| 2772 | if (FI.isInstanceMethod() && !IRFunctionArgs.hasInallocaArg() && | 
|---|
| 2773 | !FI.arg_begin()->type->isVoidPointerType() && !IsThunk) { | 
|---|
| 2774 | auto IRArgs = IRFunctionArgs.getIRArgs(ArgNo: 0); | 
|---|
| 2775 |  | 
|---|
| 2776 | assert(IRArgs.second == 1 && "Expected only a single `this` pointer."); | 
|---|
| 2777 |  | 
|---|
| 2778 | llvm::AttrBuilder Attrs(getLLVMContext()); | 
|---|
| 2779 |  | 
|---|
| 2780 | QualType ThisTy = FI.arg_begin()->type.getTypePtr()->getPointeeType(); | 
|---|
| 2781 |  | 
|---|
| 2782 | if (!CodeGenOpts.NullPointerIsValid && | 
|---|
| 2783 | getTypes().getTargetAddressSpace(T: FI.arg_begin()->type) == 0) { | 
|---|
| 2784 | Attrs.addAttribute(Val: llvm::Attribute::NonNull); | 
|---|
| 2785 | Attrs.addDereferenceableAttr(Bytes: getMinimumObjectSize(Ty: ThisTy).getQuantity()); | 
|---|
| 2786 | } else { | 
|---|
| 2787 | // FIXME dereferenceable should be correct here, regardless of | 
|---|
| 2788 | // NullPointerIsValid. However, dereferenceable currently does not always | 
|---|
| 2789 | // respect NullPointerIsValid and may imply nonnull and break the program. | 
|---|
| 2790 | // See https://reviews.llvm.org/D66618 for discussions. | 
|---|
| 2791 | Attrs.addDereferenceableOrNullAttr( | 
|---|
| 2792 | Bytes: getMinimumObjectSize( | 
|---|
| 2793 | Ty: FI.arg_begin()->type.castAs<PointerType>()->getPointeeType()) | 
|---|
| 2794 | .getQuantity()); | 
|---|
| 2795 | } | 
|---|
| 2796 |  | 
|---|
| 2797 | llvm::Align Alignment = | 
|---|
| 2798 | getNaturalTypeAlignment(T: ThisTy, /*BaseInfo=*/nullptr, | 
|---|
| 2799 | /*TBAAInfo=*/nullptr, /*forPointeeType=*/true) | 
|---|
| 2800 | .getAsAlign(); | 
|---|
| 2801 | Attrs.addAlignmentAttr(Align: Alignment); | 
|---|
| 2802 |  | 
|---|
| 2803 | ArgAttrs[IRArgs.first] = llvm::AttributeSet::get(C&: getLLVMContext(), B: Attrs); | 
|---|
| 2804 | } | 
|---|
| 2805 |  | 
|---|
| 2806 | unsigned ArgNo = 0; | 
|---|
| 2807 | for (CGFunctionInfo::const_arg_iterator I = FI.arg_begin(), E = FI.arg_end(); | 
|---|
| 2808 | I != E; ++I, ++ArgNo) { | 
|---|
| 2809 | QualType ParamType = I->type; | 
|---|
| 2810 | const ABIArgInfo &AI = I->info; | 
|---|
| 2811 | llvm::AttrBuilder Attrs(getLLVMContext()); | 
|---|
| 2812 |  | 
|---|
| 2813 | // Add attribute for padding argument, if necessary. | 
|---|
| 2814 | if (IRFunctionArgs.hasPaddingArg(ArgNo)) { | 
|---|
| 2815 | if (AI.getPaddingInReg()) { | 
|---|
| 2816 | ArgAttrs[IRFunctionArgs.getPaddingArgNo(ArgNo)] = | 
|---|
| 2817 | llvm::AttributeSet::get(C&: getLLVMContext(), | 
|---|
| 2818 | B: llvm::AttrBuilder(getLLVMContext()) | 
|---|
| 2819 | .addAttribute(Val: llvm::Attribute::InReg)); | 
|---|
| 2820 | } | 
|---|
| 2821 | } | 
|---|
| 2822 |  | 
|---|
| 2823 | // Decide whether the argument we're handling could be partially undef | 
|---|
| 2824 | if (CodeGenOpts.EnableNoundefAttrs && | 
|---|
| 2825 | DetermineNoUndef(QTy: ParamType, Types&: getTypes(), DL, AI)) { | 
|---|
| 2826 | Attrs.addAttribute(Val: llvm::Attribute::NoUndef); | 
|---|
| 2827 | } | 
|---|
| 2828 |  | 
|---|
| 2829 | // 'restrict' -> 'noalias' is done in EmitFunctionProlog when we | 
|---|
| 2830 | // have the corresponding parameter variable.  It doesn't make | 
|---|
| 2831 | // sense to do it here because parameters are so messed up. | 
|---|
| 2832 | switch (AI.getKind()) { | 
|---|
| 2833 | case ABIArgInfo::Extend: | 
|---|
| 2834 | if (AI.isSignExt()) | 
|---|
| 2835 | Attrs.addAttribute(Val: llvm::Attribute::SExt); | 
|---|
| 2836 | else if (AI.isZeroExt()) | 
|---|
| 2837 | Attrs.addAttribute(Val: llvm::Attribute::ZExt); | 
|---|
| 2838 | else | 
|---|
| 2839 | Attrs.addAttribute(Val: llvm::Attribute::NoExt); | 
|---|
| 2840 | [[fallthrough]]; | 
|---|
| 2841 | case ABIArgInfo::Direct: | 
|---|
| 2842 | if (ArgNo == 0 && FI.isChainCall()) | 
|---|
| 2843 | Attrs.addAttribute(Val: llvm::Attribute::Nest); | 
|---|
| 2844 | else if (AI.getInReg()) | 
|---|
| 2845 | Attrs.addAttribute(Val: llvm::Attribute::InReg); | 
|---|
| 2846 | Attrs.addStackAlignmentAttr(Align: llvm::MaybeAlign(AI.getDirectAlign())); | 
|---|
| 2847 |  | 
|---|
| 2848 | if (canApplyNoFPClass(AI, ParamType, IsReturn: false)) | 
|---|
| 2849 | Attrs.addNoFPClassAttr(NoFPClassMask: getNoFPClassTestMask(LangOpts: getLangOpts())); | 
|---|
| 2850 | break; | 
|---|
| 2851 | case ABIArgInfo::Indirect: { | 
|---|
| 2852 | if (AI.getInReg()) | 
|---|
| 2853 | Attrs.addAttribute(Val: llvm::Attribute::InReg); | 
|---|
| 2854 |  | 
|---|
| 2855 | if (AI.getIndirectByVal()) | 
|---|
| 2856 | Attrs.addByValAttr(Ty: getTypes().ConvertTypeForMem(T: ParamType)); | 
|---|
| 2857 |  | 
|---|
| 2858 | auto *Decl = ParamType->getAsRecordDecl(); | 
|---|
| 2859 | if (CodeGenOpts.PassByValueIsNoAlias && Decl && | 
|---|
| 2860 | Decl->getArgPassingRestrictions() == | 
|---|
| 2861 | RecordArgPassingKind::CanPassInRegs) | 
|---|
| 2862 | // When calling the function, the pointer passed in will be the only | 
|---|
| 2863 | // reference to the underlying object. Mark it accordingly. | 
|---|
| 2864 | Attrs.addAttribute(Val: llvm::Attribute::NoAlias); | 
|---|
| 2865 |  | 
|---|
| 2866 | // TODO: We could add the byref attribute if not byval, but it would | 
|---|
| 2867 | // require updating many testcases. | 
|---|
| 2868 |  | 
|---|
| 2869 | CharUnits Align = AI.getIndirectAlign(); | 
|---|
| 2870 |  | 
|---|
| 2871 | // In a byval argument, it is important that the required | 
|---|
| 2872 | // alignment of the type is honored, as LLVM might be creating a | 
|---|
| 2873 | // *new* stack object, and needs to know what alignment to give | 
|---|
| 2874 | // it. (Sometimes it can deduce a sensible alignment on its own, | 
|---|
| 2875 | // but not if clang decides it must emit a packed struct, or the | 
|---|
| 2876 | // user specifies increased alignment requirements.) | 
|---|
| 2877 | // | 
|---|
| 2878 | // This is different from indirect *not* byval, where the object | 
|---|
| 2879 | // exists already, and the align attribute is purely | 
|---|
| 2880 | // informative. | 
|---|
| 2881 | assert(!Align.isZero()); | 
|---|
| 2882 |  | 
|---|
| 2883 | // For now, only add this when we have a byval argument. | 
|---|
| 2884 | // TODO: be less lazy about updating test cases. | 
|---|
| 2885 | if (AI.getIndirectByVal()) | 
|---|
| 2886 | Attrs.addAlignmentAttr(Align: Align.getQuantity()); | 
|---|
| 2887 |  | 
|---|
| 2888 | // byval disables readnone and readonly. | 
|---|
| 2889 | AddPotentialArgAccess(); | 
|---|
| 2890 | break; | 
|---|
| 2891 | } | 
|---|
| 2892 | case ABIArgInfo::IndirectAliased: { | 
|---|
| 2893 | CharUnits Align = AI.getIndirectAlign(); | 
|---|
| 2894 | Attrs.addByRefAttr(Ty: getTypes().ConvertTypeForMem(T: ParamType)); | 
|---|
| 2895 | Attrs.addAlignmentAttr(Align: Align.getQuantity()); | 
|---|
| 2896 | break; | 
|---|
| 2897 | } | 
|---|
| 2898 | case ABIArgInfo::Ignore: | 
|---|
| 2899 | case ABIArgInfo::Expand: | 
|---|
| 2900 | case ABIArgInfo::CoerceAndExpand: | 
|---|
| 2901 | break; | 
|---|
| 2902 |  | 
|---|
| 2903 | case ABIArgInfo::InAlloca: | 
|---|
| 2904 | // inalloca disables readnone and readonly. | 
|---|
| 2905 | AddPotentialArgAccess(); | 
|---|
| 2906 | continue; | 
|---|
| 2907 | } | 
|---|
| 2908 |  | 
|---|
| 2909 | if (const auto *RefTy = ParamType->getAs<ReferenceType>()) { | 
|---|
| 2910 | QualType PTy = RefTy->getPointeeType(); | 
|---|
| 2911 | if (!PTy->isIncompleteType() && PTy->isConstantSizeType()) | 
|---|
| 2912 | Attrs.addDereferenceableAttr(Bytes: getMinimumObjectSize(Ty: PTy).getQuantity()); | 
|---|
| 2913 | if (getTypes().getTargetAddressSpace(T: PTy) == 0 && | 
|---|
| 2914 | !CodeGenOpts.NullPointerIsValid) | 
|---|
| 2915 | Attrs.addAttribute(Val: llvm::Attribute::NonNull); | 
|---|
| 2916 | if (PTy->isObjectType()) { | 
|---|
| 2917 | llvm::Align Alignment = | 
|---|
| 2918 | getNaturalPointeeTypeAlignment(T: ParamType).getAsAlign(); | 
|---|
| 2919 | Attrs.addAlignmentAttr(Align: Alignment); | 
|---|
| 2920 | } | 
|---|
| 2921 | } | 
|---|
| 2922 |  | 
|---|
| 2923 | // From OpenCL spec v3.0.10 section 6.3.5 Alignment of Types: | 
|---|
| 2924 | // > For arguments to a __kernel function declared to be a pointer to a | 
|---|
| 2925 | // > data type, the OpenCL compiler can assume that the pointee is always | 
|---|
| 2926 | // > appropriately aligned as required by the data type. | 
|---|
| 2927 | if (TargetDecl && | 
|---|
| 2928 | DeviceKernelAttr::isOpenCLSpelling( | 
|---|
| 2929 | A: TargetDecl->getAttr<DeviceKernelAttr>()) && | 
|---|
| 2930 | ParamType->isPointerType()) { | 
|---|
| 2931 | QualType PTy = ParamType->getPointeeType(); | 
|---|
| 2932 | if (!PTy->isIncompleteType() && PTy->isConstantSizeType()) { | 
|---|
| 2933 | llvm::Align Alignment = | 
|---|
| 2934 | getNaturalPointeeTypeAlignment(T: ParamType).getAsAlign(); | 
|---|
| 2935 | Attrs.addAlignmentAttr(Align: Alignment); | 
|---|
| 2936 | } | 
|---|
| 2937 | } | 
|---|
| 2938 |  | 
|---|
| 2939 | switch (FI.getExtParameterInfo(argIndex: ArgNo).getABI()) { | 
|---|
| 2940 | case ParameterABI::HLSLOut: | 
|---|
| 2941 | case ParameterABI::HLSLInOut: | 
|---|
| 2942 | Attrs.addAttribute(Val: llvm::Attribute::NoAlias); | 
|---|
| 2943 | break; | 
|---|
| 2944 | case ParameterABI::Ordinary: | 
|---|
| 2945 | break; | 
|---|
| 2946 |  | 
|---|
| 2947 | case ParameterABI::SwiftIndirectResult: { | 
|---|
| 2948 | // Add 'sret' if we haven't already used it for something, but | 
|---|
| 2949 | // only if the result is void. | 
|---|
| 2950 | if (!hasUsedSRet && RetTy->isVoidType()) { | 
|---|
| 2951 | Attrs.addStructRetAttr(Ty: getTypes().ConvertTypeForMem(T: ParamType)); | 
|---|
| 2952 | hasUsedSRet = true; | 
|---|
| 2953 | } | 
|---|
| 2954 |  | 
|---|
| 2955 | // Add 'noalias' in either case. | 
|---|
| 2956 | Attrs.addAttribute(Val: llvm::Attribute::NoAlias); | 
|---|
| 2957 |  | 
|---|
| 2958 | // Add 'dereferenceable' and 'alignment'. | 
|---|
| 2959 | auto PTy = ParamType->getPointeeType(); | 
|---|
| 2960 | if (!PTy->isIncompleteType() && PTy->isConstantSizeType()) { | 
|---|
| 2961 | auto info = getContext().getTypeInfoInChars(T: PTy); | 
|---|
| 2962 | Attrs.addDereferenceableAttr(Bytes: info.Width.getQuantity()); | 
|---|
| 2963 | Attrs.addAlignmentAttr(Align: info.Align.getAsAlign()); | 
|---|
| 2964 | } | 
|---|
| 2965 | break; | 
|---|
| 2966 | } | 
|---|
| 2967 |  | 
|---|
| 2968 | case ParameterABI::SwiftErrorResult: | 
|---|
| 2969 | Attrs.addAttribute(Val: llvm::Attribute::SwiftError); | 
|---|
| 2970 | break; | 
|---|
| 2971 |  | 
|---|
| 2972 | case ParameterABI::SwiftContext: | 
|---|
| 2973 | Attrs.addAttribute(Val: llvm::Attribute::SwiftSelf); | 
|---|
| 2974 | break; | 
|---|
| 2975 |  | 
|---|
| 2976 | case ParameterABI::SwiftAsyncContext: | 
|---|
| 2977 | Attrs.addAttribute(Val: llvm::Attribute::SwiftAsync); | 
|---|
| 2978 | break; | 
|---|
| 2979 | } | 
|---|
| 2980 |  | 
|---|
| 2981 | if (FI.getExtParameterInfo(argIndex: ArgNo).isNoEscape()) | 
|---|
| 2982 | Attrs.addCapturesAttr(CI: llvm::CaptureInfo::none()); | 
|---|
| 2983 |  | 
|---|
| 2984 | if (Attrs.hasAttributes()) { | 
|---|
| 2985 | unsigned FirstIRArg, NumIRArgs; | 
|---|
| 2986 | std::tie(args&: FirstIRArg, args&: NumIRArgs) = IRFunctionArgs.getIRArgs(ArgNo); | 
|---|
| 2987 | for (unsigned i = 0; i < NumIRArgs; i++) | 
|---|
| 2988 | ArgAttrs[FirstIRArg + i] = ArgAttrs[FirstIRArg + i].addAttributes( | 
|---|
| 2989 | C&: getLLVMContext(), AS: llvm::AttributeSet::get(C&: getLLVMContext(), B: Attrs)); | 
|---|
| 2990 | } | 
|---|
| 2991 | } | 
|---|
| 2992 | assert(ArgNo == FI.arg_size()); | 
|---|
| 2993 |  | 
|---|
| 2994 | AttrList = llvm::AttributeList::get( | 
|---|
| 2995 | C&: getLLVMContext(), FnAttrs: llvm::AttributeSet::get(C&: getLLVMContext(), B: FuncAttrs), | 
|---|
| 2996 | RetAttrs: llvm::AttributeSet::get(C&: getLLVMContext(), B: RetAttrs), ArgAttrs); | 
|---|
| 2997 | } | 
|---|
| 2998 |  | 
|---|
| 2999 | /// An argument came in as a promoted argument; demote it back to its | 
|---|
| 3000 | /// declared type. | 
|---|
| 3001 | static llvm::Value *emitArgumentDemotion(CodeGenFunction &CGF, | 
|---|
| 3002 | const VarDecl *var, | 
|---|
| 3003 | llvm::Value *value) { | 
|---|
| 3004 | llvm::Type *varType = CGF.ConvertType(T: var->getType()); | 
|---|
| 3005 |  | 
|---|
| 3006 | // This can happen with promotions that actually don't change the | 
|---|
| 3007 | // underlying type, like the enum promotions. | 
|---|
| 3008 | if (value->getType() == varType) | 
|---|
| 3009 | return value; | 
|---|
| 3010 |  | 
|---|
| 3011 | assert((varType->isIntegerTy() || varType->isFloatingPointTy()) && | 
|---|
| 3012 | "unexpected promotion type"); | 
|---|
| 3013 |  | 
|---|
| 3014 | if (isa<llvm::IntegerType>(Val: varType)) | 
|---|
| 3015 | return CGF.Builder.CreateTrunc(V: value, DestTy: varType, Name: "arg.unpromote"); | 
|---|
| 3016 |  | 
|---|
| 3017 | return CGF.Builder.CreateFPCast(V: value, DestTy: varType, Name: "arg.unpromote"); | 
|---|
| 3018 | } | 
|---|
| 3019 |  | 
|---|
| 3020 | /// Returns the attribute (either parameter attribute, or function | 
|---|
| 3021 | /// attribute), which declares argument ArgNo to be non-null. | 
|---|
| 3022 | static const NonNullAttr *getNonNullAttr(const Decl *FD, const ParmVarDecl *PVD, | 
|---|
| 3023 | QualType ArgType, unsigned ArgNo) { | 
|---|
| 3024 | // FIXME: __attribute__((nonnull)) can also be applied to: | 
|---|
| 3025 | //   - references to pointers, where the pointee is known to be | 
|---|
| 3026 | //     nonnull (apparently a Clang extension) | 
|---|
| 3027 | //   - transparent unions containing pointers | 
|---|
| 3028 | // In the former case, LLVM IR cannot represent the constraint. In | 
|---|
| 3029 | // the latter case, we have no guarantee that the transparent union | 
|---|
| 3030 | // is in fact passed as a pointer. | 
|---|
| 3031 | if (!ArgType->isAnyPointerType() && !ArgType->isBlockPointerType()) | 
|---|
| 3032 | return nullptr; | 
|---|
| 3033 | // First, check attribute on parameter itself. | 
|---|
| 3034 | if (PVD) { | 
|---|
| 3035 | if (auto ParmNNAttr = PVD->getAttr<NonNullAttr>()) | 
|---|
| 3036 | return ParmNNAttr; | 
|---|
| 3037 | } | 
|---|
| 3038 | // Check function attributes. | 
|---|
| 3039 | if (!FD) | 
|---|
| 3040 | return nullptr; | 
|---|
| 3041 | for (const auto *NNAttr : FD->specific_attrs<NonNullAttr>()) { | 
|---|
| 3042 | if (NNAttr->isNonNull(IdxAST: ArgNo)) | 
|---|
| 3043 | return NNAttr; | 
|---|
| 3044 | } | 
|---|
| 3045 | return nullptr; | 
|---|
| 3046 | } | 
|---|
| 3047 |  | 
|---|
| 3048 | namespace { | 
|---|
| 3049 | struct CopyBackSwiftError final : EHScopeStack::Cleanup { | 
|---|
| 3050 | Address Temp; | 
|---|
| 3051 | Address Arg; | 
|---|
| 3052 | CopyBackSwiftError(Address temp, Address arg) : Temp(temp), Arg(arg) {} | 
|---|
| 3053 | void Emit(CodeGenFunction &CGF, Flags flags) override { | 
|---|
| 3054 | llvm::Value *errorValue = CGF.Builder.CreateLoad(Addr: Temp); | 
|---|
| 3055 | CGF.Builder.CreateStore(Val: errorValue, Addr: Arg); | 
|---|
| 3056 | } | 
|---|
| 3057 | }; | 
|---|
| 3058 | } // namespace | 
|---|
| 3059 |  | 
|---|
| 3060 | void CodeGenFunction::EmitFunctionProlog(const CGFunctionInfo &FI, | 
|---|
| 3061 | llvm::Function *Fn, | 
|---|
| 3062 | const FunctionArgList &Args) { | 
|---|
| 3063 | if (CurCodeDecl && CurCodeDecl->hasAttr<NakedAttr>()) | 
|---|
| 3064 | // Naked functions don't have prologues. | 
|---|
| 3065 | return; | 
|---|
| 3066 |  | 
|---|
| 3067 | // If this is an implicit-return-zero function, go ahead and | 
|---|
| 3068 | // initialize the return value.  TODO: it might be nice to have | 
|---|
| 3069 | // a more general mechanism for this that didn't require synthesized | 
|---|
| 3070 | // return statements. | 
|---|
| 3071 | if (const FunctionDecl *FD = dyn_cast_or_null<FunctionDecl>(Val: CurCodeDecl)) { | 
|---|
| 3072 | if (FD->hasImplicitReturnZero()) { | 
|---|
| 3073 | QualType RetTy = FD->getReturnType().getUnqualifiedType(); | 
|---|
| 3074 | llvm::Type *LLVMTy = CGM.getTypes().ConvertType(T: RetTy); | 
|---|
| 3075 | llvm::Constant *Zero = llvm::Constant::getNullValue(Ty: LLVMTy); | 
|---|
| 3076 | Builder.CreateStore(Val: Zero, Addr: ReturnValue); | 
|---|
| 3077 | } | 
|---|
| 3078 | } | 
|---|
| 3079 |  | 
|---|
| 3080 | // FIXME: We no longer need the types from FunctionArgList; lift up and | 
|---|
| 3081 | // simplify. | 
|---|
| 3082 |  | 
|---|
| 3083 | ClangToLLVMArgMapping IRFunctionArgs(CGM.getContext(), FI); | 
|---|
| 3084 | assert(Fn->arg_size() == IRFunctionArgs.totalIRArgs()); | 
|---|
| 3085 |  | 
|---|
| 3086 | // If we're using inalloca, all the memory arguments are GEPs off of the last | 
|---|
| 3087 | // parameter, which is a pointer to the complete memory area. | 
|---|
| 3088 | Address ArgStruct = Address::invalid(); | 
|---|
| 3089 | if (IRFunctionArgs.hasInallocaArg()) | 
|---|
| 3090 | ArgStruct = Address(Fn->getArg(i: IRFunctionArgs.getInallocaArgNo()), | 
|---|
| 3091 | FI.getArgStruct(), FI.getArgStructAlignment()); | 
|---|
| 3092 |  | 
|---|
| 3093 | // Name the struct return parameter. | 
|---|
| 3094 | if (IRFunctionArgs.hasSRetArg()) { | 
|---|
| 3095 | auto AI = Fn->getArg(i: IRFunctionArgs.getSRetArgNo()); | 
|---|
| 3096 | AI->setName( "agg.result"); | 
|---|
| 3097 | AI->addAttr(Kind: llvm::Attribute::NoAlias); | 
|---|
| 3098 | } | 
|---|
| 3099 |  | 
|---|
| 3100 | // Track if we received the parameter as a pointer (indirect, byval, or | 
|---|
| 3101 | // inalloca).  If already have a pointer, EmitParmDecl doesn't need to copy it | 
|---|
| 3102 | // into a local alloca for us. | 
|---|
| 3103 | SmallVector<ParamValue, 16> ArgVals; | 
|---|
| 3104 | ArgVals.reserve(N: Args.size()); | 
|---|
| 3105 |  | 
|---|
| 3106 | // Create a pointer value for every parameter declaration.  This usually | 
|---|
| 3107 | // entails copying one or more LLVM IR arguments into an alloca.  Don't push | 
|---|
| 3108 | // any cleanups or do anything that might unwind.  We do that separately, so | 
|---|
| 3109 | // we can push the cleanups in the correct order for the ABI. | 
|---|
| 3110 | assert(FI.arg_size() == Args.size() && | 
|---|
| 3111 | "Mismatch between function signature & arguments."); | 
|---|
| 3112 | unsigned ArgNo = 0; | 
|---|
| 3113 | CGFunctionInfo::const_arg_iterator info_it = FI.arg_begin(); | 
|---|
| 3114 | for (FunctionArgList::const_iterator i = Args.begin(), e = Args.end(); i != e; | 
|---|
| 3115 | ++i, ++info_it, ++ArgNo) { | 
|---|
| 3116 | const VarDecl *Arg = *i; | 
|---|
| 3117 | const ABIArgInfo &ArgI = info_it->info; | 
|---|
| 3118 |  | 
|---|
| 3119 | bool isPromoted = | 
|---|
| 3120 | isa<ParmVarDecl>(Val: Arg) && cast<ParmVarDecl>(Val: Arg)->isKNRPromoted(); | 
|---|
| 3121 | // We are converting from ABIArgInfo type to VarDecl type directly, unless | 
|---|
| 3122 | // the parameter is promoted. In this case we convert to | 
|---|
| 3123 | // CGFunctionInfo::ArgInfo type with subsequent argument demotion. | 
|---|
| 3124 | QualType Ty = isPromoted ? info_it->type : Arg->getType(); | 
|---|
| 3125 | assert(hasScalarEvaluationKind(Ty) == | 
|---|
| 3126 | hasScalarEvaluationKind(Arg->getType())); | 
|---|
| 3127 |  | 
|---|
| 3128 | unsigned FirstIRArg, NumIRArgs; | 
|---|
| 3129 | std::tie(args&: FirstIRArg, args&: NumIRArgs) = IRFunctionArgs.getIRArgs(ArgNo); | 
|---|
| 3130 |  | 
|---|
| 3131 | switch (ArgI.getKind()) { | 
|---|
| 3132 | case ABIArgInfo::InAlloca: { | 
|---|
| 3133 | assert(NumIRArgs == 0); | 
|---|
| 3134 | auto FieldIndex = ArgI.getInAllocaFieldIndex(); | 
|---|
| 3135 | Address V = | 
|---|
| 3136 | Builder.CreateStructGEP(Addr: ArgStruct, Index: FieldIndex, Name: Arg->getName()); | 
|---|
| 3137 | if (ArgI.getInAllocaIndirect()) | 
|---|
| 3138 | V = Address(Builder.CreateLoad(Addr: V), ConvertTypeForMem(T: Ty), | 
|---|
| 3139 | getContext().getTypeAlignInChars(T: Ty)); | 
|---|
| 3140 | ArgVals.push_back(Elt: ParamValue::forIndirect(addr: V)); | 
|---|
| 3141 | break; | 
|---|
| 3142 | } | 
|---|
| 3143 |  | 
|---|
| 3144 | case ABIArgInfo::Indirect: | 
|---|
| 3145 | case ABIArgInfo::IndirectAliased: { | 
|---|
| 3146 | assert(NumIRArgs == 1); | 
|---|
| 3147 | Address ParamAddr = makeNaturalAddressForPointer( | 
|---|
| 3148 | Ptr: Fn->getArg(i: FirstIRArg), T: Ty, Alignment: ArgI.getIndirectAlign(), ForPointeeType: false, BaseInfo: nullptr, | 
|---|
| 3149 | TBAAInfo: nullptr, IsKnownNonNull: KnownNonNull); | 
|---|
| 3150 |  | 
|---|
| 3151 | if (!hasScalarEvaluationKind(T: Ty)) { | 
|---|
| 3152 | // Aggregates and complex variables are accessed by reference. All we | 
|---|
| 3153 | // need to do is realign the value, if requested. Also, if the address | 
|---|
| 3154 | // may be aliased, copy it to ensure that the parameter variable is | 
|---|
| 3155 | // mutable and has a unique adress, as C requires. | 
|---|
| 3156 | if (ArgI.getIndirectRealign() || ArgI.isIndirectAliased()) { | 
|---|
| 3157 | RawAddress AlignedTemp = CreateMemTemp(T: Ty, Name: "coerce"); | 
|---|
| 3158 |  | 
|---|
| 3159 | // Copy from the incoming argument pointer to the temporary with the | 
|---|
| 3160 | // appropriate alignment. | 
|---|
| 3161 | // | 
|---|
| 3162 | // FIXME: We should have a common utility for generating an aggregate | 
|---|
| 3163 | // copy. | 
|---|
| 3164 | CharUnits Size = getContext().getTypeSizeInChars(T: Ty); | 
|---|
| 3165 | Builder.CreateMemCpy( | 
|---|
| 3166 | Dst: AlignedTemp.getPointer(), DstAlign: AlignedTemp.getAlignment().getAsAlign(), | 
|---|
| 3167 | Src: ParamAddr.emitRawPointer(CGF&: *this), | 
|---|
| 3168 | SrcAlign: ParamAddr.getAlignment().getAsAlign(), | 
|---|
| 3169 | Size: llvm::ConstantInt::get(Ty: IntPtrTy, V: Size.getQuantity())); | 
|---|
| 3170 | ParamAddr = AlignedTemp; | 
|---|
| 3171 | } | 
|---|
| 3172 | ArgVals.push_back(Elt: ParamValue::forIndirect(addr: ParamAddr)); | 
|---|
| 3173 | } else { | 
|---|
| 3174 | // Load scalar value from indirect argument. | 
|---|
| 3175 | llvm::Value *V = | 
|---|
| 3176 | EmitLoadOfScalar(Addr: ParamAddr, Volatile: false, Ty, Loc: Arg->getBeginLoc()); | 
|---|
| 3177 |  | 
|---|
| 3178 | if (isPromoted) | 
|---|
| 3179 | V = emitArgumentDemotion(CGF&: *this, var: Arg, value: V); | 
|---|
| 3180 | ArgVals.push_back(Elt: ParamValue::forDirect(value: V)); | 
|---|
| 3181 | } | 
|---|
| 3182 | break; | 
|---|
| 3183 | } | 
|---|
| 3184 |  | 
|---|
| 3185 | case ABIArgInfo::Extend: | 
|---|
| 3186 | case ABIArgInfo::Direct: { | 
|---|
| 3187 | auto AI = Fn->getArg(i: FirstIRArg); | 
|---|
| 3188 | llvm::Type *LTy = ConvertType(T: Arg->getType()); | 
|---|
| 3189 |  | 
|---|
| 3190 | // Prepare parameter attributes. So far, only attributes for pointer | 
|---|
| 3191 | // parameters are prepared. See | 
|---|
| 3192 | // http://llvm.org/docs/LangRef.html#paramattrs. | 
|---|
| 3193 | if (ArgI.getDirectOffset() == 0 && LTy->isPointerTy() && | 
|---|
| 3194 | ArgI.getCoerceToType()->isPointerTy()) { | 
|---|
| 3195 | assert(NumIRArgs == 1); | 
|---|
| 3196 |  | 
|---|
| 3197 | if (const ParmVarDecl *PVD = dyn_cast<ParmVarDecl>(Val: Arg)) { | 
|---|
| 3198 | // Set `nonnull` attribute if any. | 
|---|
| 3199 | if (getNonNullAttr(FD: CurCodeDecl, PVD, ArgType: PVD->getType(), | 
|---|
| 3200 | ArgNo: PVD->getFunctionScopeIndex()) && | 
|---|
| 3201 | !CGM.getCodeGenOpts().NullPointerIsValid) | 
|---|
| 3202 | AI->addAttr(Kind: llvm::Attribute::NonNull); | 
|---|
| 3203 |  | 
|---|
| 3204 | QualType OTy = PVD->getOriginalType(); | 
|---|
| 3205 | if (const auto *ArrTy = getContext().getAsConstantArrayType(T: OTy)) { | 
|---|
| 3206 | // A C99 array parameter declaration with the static keyword also | 
|---|
| 3207 | // indicates dereferenceability, and if the size is constant we can | 
|---|
| 3208 | // use the dereferenceable attribute (which requires the size in | 
|---|
| 3209 | // bytes). | 
|---|
| 3210 | if (ArrTy->getSizeModifier() == ArraySizeModifier::Static) { | 
|---|
| 3211 | QualType ETy = ArrTy->getElementType(); | 
|---|
| 3212 | llvm::Align Alignment = | 
|---|
| 3213 | CGM.getNaturalTypeAlignment(T: ETy).getAsAlign(); | 
|---|
| 3214 | AI->addAttrs(B&: llvm::AttrBuilder(getLLVMContext()) | 
|---|
| 3215 | .addAlignmentAttr(Align: Alignment)); | 
|---|
| 3216 | uint64_t ArrSize = ArrTy->getZExtSize(); | 
|---|
| 3217 | if (!ETy->isIncompleteType() && ETy->isConstantSizeType() && | 
|---|
| 3218 | ArrSize) { | 
|---|
| 3219 | llvm::AttrBuilder Attrs(getLLVMContext()); | 
|---|
| 3220 | Attrs.addDereferenceableAttr( | 
|---|
| 3221 | Bytes: getContext().getTypeSizeInChars(T: ETy).getQuantity() * | 
|---|
| 3222 | ArrSize); | 
|---|
| 3223 | AI->addAttrs(B&: Attrs); | 
|---|
| 3224 | } else if (getContext().getTargetInfo().getNullPointerValue( | 
|---|
| 3225 | AddrSpace: ETy.getAddressSpace()) == 0 && | 
|---|
| 3226 | !CGM.getCodeGenOpts().NullPointerIsValid) { | 
|---|
| 3227 | AI->addAttr(Kind: llvm::Attribute::NonNull); | 
|---|
| 3228 | } | 
|---|
| 3229 | } | 
|---|
| 3230 | } else if (const auto *ArrTy = | 
|---|
| 3231 | getContext().getAsVariableArrayType(T: OTy)) { | 
|---|
| 3232 | // For C99 VLAs with the static keyword, we don't know the size so | 
|---|
| 3233 | // we can't use the dereferenceable attribute, but in addrspace(0) | 
|---|
| 3234 | // we know that it must be nonnull. | 
|---|
| 3235 | if (ArrTy->getSizeModifier() == ArraySizeModifier::Static) { | 
|---|
| 3236 | QualType ETy = ArrTy->getElementType(); | 
|---|
| 3237 | llvm::Align Alignment = | 
|---|
| 3238 | CGM.getNaturalTypeAlignment(T: ETy).getAsAlign(); | 
|---|
| 3239 | AI->addAttrs(B&: llvm::AttrBuilder(getLLVMContext()) | 
|---|
| 3240 | .addAlignmentAttr(Align: Alignment)); | 
|---|
| 3241 | if (!getTypes().getTargetAddressSpace(T: ETy) && | 
|---|
| 3242 | !CGM.getCodeGenOpts().NullPointerIsValid) | 
|---|
| 3243 | AI->addAttr(Kind: llvm::Attribute::NonNull); | 
|---|
| 3244 | } | 
|---|
| 3245 | } | 
|---|
| 3246 |  | 
|---|
| 3247 | // Set `align` attribute if any. | 
|---|
| 3248 | const auto *AVAttr = PVD->getAttr<AlignValueAttr>(); | 
|---|
| 3249 | if (!AVAttr) | 
|---|
| 3250 | if (const auto *TOTy = OTy->getAs<TypedefType>()) | 
|---|
| 3251 | AVAttr = TOTy->getDecl()->getAttr<AlignValueAttr>(); | 
|---|
| 3252 | if (AVAttr && !SanOpts.has(K: SanitizerKind::Alignment)) { | 
|---|
| 3253 | // If alignment-assumption sanitizer is enabled, we do *not* add | 
|---|
| 3254 | // alignment attribute here, but emit normal alignment assumption, | 
|---|
| 3255 | // so the UBSAN check could function. | 
|---|
| 3256 | llvm::ConstantInt *AlignmentCI = | 
|---|
| 3257 | cast<llvm::ConstantInt>(Val: EmitScalarExpr(E: AVAttr->getAlignment())); | 
|---|
| 3258 | uint64_t AlignmentInt = | 
|---|
| 3259 | AlignmentCI->getLimitedValue(Limit: llvm::Value::MaximumAlignment); | 
|---|
| 3260 | if (AI->getParamAlign().valueOrOne() < AlignmentInt) { | 
|---|
| 3261 | AI->removeAttr(Kind: llvm::Attribute::AttrKind::Alignment); | 
|---|
| 3262 | AI->addAttrs(B&: llvm::AttrBuilder(getLLVMContext()) | 
|---|
| 3263 | .addAlignmentAttr(Align: llvm::Align(AlignmentInt))); | 
|---|
| 3264 | } | 
|---|
| 3265 | } | 
|---|
| 3266 | } | 
|---|
| 3267 |  | 
|---|
| 3268 | // Set 'noalias' if an argument type has the `restrict` qualifier. | 
|---|
| 3269 | if (Arg->getType().isRestrictQualified()) | 
|---|
| 3270 | AI->addAttr(Kind: llvm::Attribute::NoAlias); | 
|---|
| 3271 | } | 
|---|
| 3272 |  | 
|---|
| 3273 | // Prepare the argument value. If we have the trivial case, handle it | 
|---|
| 3274 | // with no muss and fuss. | 
|---|
| 3275 | if (!isa<llvm::StructType>(Val: ArgI.getCoerceToType()) && | 
|---|
| 3276 | ArgI.getCoerceToType() == ConvertType(T: Ty) && | 
|---|
| 3277 | ArgI.getDirectOffset() == 0) { | 
|---|
| 3278 | assert(NumIRArgs == 1); | 
|---|
| 3279 |  | 
|---|
| 3280 | // LLVM expects swifterror parameters to be used in very restricted | 
|---|
| 3281 | // ways.  Copy the value into a less-restricted temporary. | 
|---|
| 3282 | llvm::Value *V = AI; | 
|---|
| 3283 | if (FI.getExtParameterInfo(argIndex: ArgNo).getABI() == | 
|---|
| 3284 | ParameterABI::SwiftErrorResult) { | 
|---|
| 3285 | QualType pointeeTy = Ty->getPointeeType(); | 
|---|
| 3286 | assert(pointeeTy->isPointerType()); | 
|---|
| 3287 | RawAddress temp = | 
|---|
| 3288 | CreateMemTemp(T: pointeeTy, Align: getPointerAlign(), Name: "swifterror.temp"); | 
|---|
| 3289 | Address arg = makeNaturalAddressForPointer( | 
|---|
| 3290 | Ptr: V, T: pointeeTy, Alignment: getContext().getTypeAlignInChars(T: pointeeTy)); | 
|---|
| 3291 | llvm::Value *incomingErrorValue = Builder.CreateLoad(Addr: arg); | 
|---|
| 3292 | Builder.CreateStore(Val: incomingErrorValue, Addr: temp); | 
|---|
| 3293 | V = temp.getPointer(); | 
|---|
| 3294 |  | 
|---|
| 3295 | // Push a cleanup to copy the value back at the end of the function. | 
|---|
| 3296 | // The convention does not guarantee that the value will be written | 
|---|
| 3297 | // back if the function exits with an unwind exception. | 
|---|
| 3298 | EHStack.pushCleanup<CopyBackSwiftError>(Kind: NormalCleanup, A: temp, A: arg); | 
|---|
| 3299 | } | 
|---|
| 3300 |  | 
|---|
| 3301 | // Ensure the argument is the correct type. | 
|---|
| 3302 | if (V->getType() != ArgI.getCoerceToType()) | 
|---|
| 3303 | V = Builder.CreateBitCast(V, DestTy: ArgI.getCoerceToType()); | 
|---|
| 3304 |  | 
|---|
| 3305 | if (isPromoted) | 
|---|
| 3306 | V = emitArgumentDemotion(CGF&: *this, var: Arg, value: V); | 
|---|
| 3307 |  | 
|---|
| 3308 | // Because of merging of function types from multiple decls it is | 
|---|
| 3309 | // possible for the type of an argument to not match the corresponding | 
|---|
| 3310 | // type in the function type. Since we are codegening the callee | 
|---|
| 3311 | // in here, add a cast to the argument type. | 
|---|
| 3312 | llvm::Type *LTy = ConvertType(T: Arg->getType()); | 
|---|
| 3313 | if (V->getType() != LTy) | 
|---|
| 3314 | V = Builder.CreateBitCast(V, DestTy: LTy); | 
|---|
| 3315 |  | 
|---|
| 3316 | ArgVals.push_back(Elt: ParamValue::forDirect(value: V)); | 
|---|
| 3317 | break; | 
|---|
| 3318 | } | 
|---|
| 3319 |  | 
|---|
| 3320 | // VLST arguments are coerced to VLATs at the function boundary for | 
|---|
| 3321 | // ABI consistency. If this is a VLST that was coerced to | 
|---|
| 3322 | // a VLAT at the function boundary and the types match up, use | 
|---|
| 3323 | // llvm.vector.extract to convert back to the original VLST. | 
|---|
| 3324 | if (auto *VecTyTo = dyn_cast<llvm::FixedVectorType>(Val: ConvertType(T: Ty))) { | 
|---|
| 3325 | llvm::Value *ArgVal = Fn->getArg(i: FirstIRArg); | 
|---|
| 3326 | if (auto *VecTyFrom = | 
|---|
| 3327 | dyn_cast<llvm::ScalableVectorType>(Val: ArgVal->getType())) { | 
|---|
| 3328 | auto [Coerced, Extracted] = CoerceScalableToFixed( | 
|---|
| 3329 | CGF&: *this, ToTy: VecTyTo, FromTy: VecTyFrom, V: ArgVal, Name: Arg->getName()); | 
|---|
| 3330 | if (Extracted) { | 
|---|
| 3331 | assert(NumIRArgs == 1); | 
|---|
| 3332 | ArgVals.push_back(Elt: ParamValue::forDirect(value: Coerced)); | 
|---|
| 3333 | break; | 
|---|
| 3334 | } | 
|---|
| 3335 | } | 
|---|
| 3336 | } | 
|---|
| 3337 |  | 
|---|
| 3338 | // Struct of fixed-length vectors and struct of array of fixed-length | 
|---|
| 3339 | // vector in VLS calling convention are coerced to vector tuple | 
|---|
| 3340 | // type(represented as TargetExtType) and scalable vector type | 
|---|
| 3341 | // respectively, they're no longer handled as struct. | 
|---|
| 3342 | if (ArgI.isDirect() && isa<llvm::StructType>(Val: ConvertType(T: Ty)) && | 
|---|
| 3343 | (isa<llvm::TargetExtType>(Val: ArgI.getCoerceToType()) || | 
|---|
| 3344 | isa<llvm::ScalableVectorType>(Val: ArgI.getCoerceToType()))) { | 
|---|
| 3345 | ArgVals.push_back(Elt: ParamValue::forDirect(value: AI)); | 
|---|
| 3346 | break; | 
|---|
| 3347 | } | 
|---|
| 3348 |  | 
|---|
| 3349 | llvm::StructType *STy = | 
|---|
| 3350 | dyn_cast<llvm::StructType>(Val: ArgI.getCoerceToType()); | 
|---|
| 3351 | Address Alloca = | 
|---|
| 3352 | CreateMemTemp(T: Ty, Align: getContext().getDeclAlign(D: Arg), Name: Arg->getName()); | 
|---|
| 3353 |  | 
|---|
| 3354 | // Pointer to store into. | 
|---|
| 3355 | Address Ptr = emitAddressAtOffset(CGF&: *this, addr: Alloca, info: ArgI); | 
|---|
| 3356 |  | 
|---|
| 3357 | // Fast-isel and the optimizer generally like scalar values better than | 
|---|
| 3358 | // FCAs, so we flatten them if this is safe to do for this argument. | 
|---|
| 3359 | if (ArgI.isDirect() && ArgI.getCanBeFlattened() && STy && | 
|---|
| 3360 | STy->getNumElements() > 1) { | 
|---|
| 3361 | llvm::TypeSize StructSize = CGM.getDataLayout().getTypeAllocSize(Ty: STy); | 
|---|
| 3362 | llvm::TypeSize PtrElementSize = | 
|---|
| 3363 | CGM.getDataLayout().getTypeAllocSize(Ty: Ptr.getElementType()); | 
|---|
| 3364 | if (StructSize.isScalable()) { | 
|---|
| 3365 | assert(STy->containsHomogeneousScalableVectorTypes() && | 
|---|
| 3366 | "ABI only supports structure with homogeneous scalable vector " | 
|---|
| 3367 | "type"); | 
|---|
| 3368 | assert(StructSize == PtrElementSize && | 
|---|
| 3369 | "Only allow non-fractional movement of structure with" | 
|---|
| 3370 | "homogeneous scalable vector type"); | 
|---|
| 3371 | assert(STy->getNumElements() == NumIRArgs); | 
|---|
| 3372 |  | 
|---|
| 3373 | llvm::Value *LoadedStructValue = llvm::PoisonValue::get(T: STy); | 
|---|
| 3374 | for (unsigned i = 0, e = STy->getNumElements(); i != e; ++i) { | 
|---|
| 3375 | auto *AI = Fn->getArg(i: FirstIRArg + i); | 
|---|
| 3376 | AI->setName(Arg->getName() + ".coerce"+ Twine(i)); | 
|---|
| 3377 | LoadedStructValue = | 
|---|
| 3378 | Builder.CreateInsertValue(Agg: LoadedStructValue, Val: AI, Idxs: i); | 
|---|
| 3379 | } | 
|---|
| 3380 |  | 
|---|
| 3381 | Builder.CreateStore(Val: LoadedStructValue, Addr: Ptr); | 
|---|
| 3382 | } else { | 
|---|
| 3383 | uint64_t SrcSize = StructSize.getFixedValue(); | 
|---|
| 3384 | uint64_t DstSize = PtrElementSize.getFixedValue(); | 
|---|
| 3385 |  | 
|---|
| 3386 | Address AddrToStoreInto = Address::invalid(); | 
|---|
| 3387 | if (SrcSize <= DstSize) { | 
|---|
| 3388 | AddrToStoreInto = Ptr.withElementType(ElemTy: STy); | 
|---|
| 3389 | } else { | 
|---|
| 3390 | AddrToStoreInto = | 
|---|
| 3391 | CreateTempAlloca(Ty: STy, align: Alloca.getAlignment(), Name: "coerce"); | 
|---|
| 3392 | } | 
|---|
| 3393 |  | 
|---|
| 3394 | assert(STy->getNumElements() == NumIRArgs); | 
|---|
| 3395 | for (unsigned i = 0, e = STy->getNumElements(); i != e; ++i) { | 
|---|
| 3396 | auto AI = Fn->getArg(i: FirstIRArg + i); | 
|---|
| 3397 | AI->setName(Arg->getName() + ".coerce"+ Twine(i)); | 
|---|
| 3398 | Address EltPtr = Builder.CreateStructGEP(Addr: AddrToStoreInto, Index: i); | 
|---|
| 3399 | Builder.CreateStore(Val: AI, Addr: EltPtr); | 
|---|
| 3400 | } | 
|---|
| 3401 |  | 
|---|
| 3402 | if (SrcSize > DstSize) { | 
|---|
| 3403 | Builder.CreateMemCpy(Dest: Ptr, Src: AddrToStoreInto, Size: DstSize); | 
|---|
| 3404 | } | 
|---|
| 3405 | } | 
|---|
| 3406 | } else { | 
|---|
| 3407 | // Simple case, just do a coerced store of the argument into the alloca. | 
|---|
| 3408 | assert(NumIRArgs == 1); | 
|---|
| 3409 | auto AI = Fn->getArg(i: FirstIRArg); | 
|---|
| 3410 | AI->setName(Arg->getName() + ".coerce"); | 
|---|
| 3411 | CreateCoercedStore( | 
|---|
| 3412 | Src: AI, Dst: Ptr, | 
|---|
| 3413 | DstSize: llvm::TypeSize::getFixed( | 
|---|
| 3414 | ExactSize: getContext().getTypeSizeInChars(T: Ty).getQuantity() - | 
|---|
| 3415 | ArgI.getDirectOffset()), | 
|---|
| 3416 | /*DstIsVolatile=*/false); | 
|---|
| 3417 | } | 
|---|
| 3418 |  | 
|---|
| 3419 | // Match to what EmitParmDecl is expecting for this type. | 
|---|
| 3420 | if (CodeGenFunction::hasScalarEvaluationKind(T: Ty)) { | 
|---|
| 3421 | llvm::Value *V = | 
|---|
| 3422 | EmitLoadOfScalar(Addr: Alloca, Volatile: false, Ty, Loc: Arg->getBeginLoc()); | 
|---|
| 3423 | if (isPromoted) | 
|---|
| 3424 | V = emitArgumentDemotion(CGF&: *this, var: Arg, value: V); | 
|---|
| 3425 | ArgVals.push_back(Elt: ParamValue::forDirect(value: V)); | 
|---|
| 3426 | } else { | 
|---|
| 3427 | ArgVals.push_back(Elt: ParamValue::forIndirect(addr: Alloca)); | 
|---|
| 3428 | } | 
|---|
| 3429 | break; | 
|---|
| 3430 | } | 
|---|
| 3431 |  | 
|---|
| 3432 | case ABIArgInfo::CoerceAndExpand: { | 
|---|
| 3433 | // Reconstruct into a temporary. | 
|---|
| 3434 | Address alloca = CreateMemTemp(T: Ty, Align: getContext().getDeclAlign(D: Arg)); | 
|---|
| 3435 | ArgVals.push_back(Elt: ParamValue::forIndirect(addr: alloca)); | 
|---|
| 3436 |  | 
|---|
| 3437 | auto coercionType = ArgI.getCoerceAndExpandType(); | 
|---|
| 3438 | auto unpaddedCoercionType = ArgI.getUnpaddedCoerceAndExpandType(); | 
|---|
| 3439 | auto *unpaddedStruct = dyn_cast<llvm::StructType>(Val: unpaddedCoercionType); | 
|---|
| 3440 |  | 
|---|
| 3441 | alloca = alloca.withElementType(ElemTy: coercionType); | 
|---|
| 3442 |  | 
|---|
| 3443 | unsigned argIndex = FirstIRArg; | 
|---|
| 3444 | unsigned unpaddedIndex = 0; | 
|---|
| 3445 | for (unsigned i = 0, e = coercionType->getNumElements(); i != e; ++i) { | 
|---|
| 3446 | llvm::Type *eltType = coercionType->getElementType(N: i); | 
|---|
| 3447 | if (ABIArgInfo::isPaddingForCoerceAndExpand(eltType)) | 
|---|
| 3448 | continue; | 
|---|
| 3449 |  | 
|---|
| 3450 | auto eltAddr = Builder.CreateStructGEP(Addr: alloca, Index: i); | 
|---|
| 3451 | llvm::Value *elt = Fn->getArg(i: argIndex++); | 
|---|
| 3452 |  | 
|---|
| 3453 | auto paramType = unpaddedStruct | 
|---|
| 3454 | ? unpaddedStruct->getElementType(N: unpaddedIndex++) | 
|---|
| 3455 | : unpaddedCoercionType; | 
|---|
| 3456 |  | 
|---|
| 3457 | if (auto *VecTyTo = dyn_cast<llvm::FixedVectorType>(Val: eltType)) { | 
|---|
| 3458 | if (auto *VecTyFrom = dyn_cast<llvm::ScalableVectorType>(Val: paramType)) { | 
|---|
| 3459 | bool ; | 
|---|
| 3460 | std::tie(args&: elt, args&: Extracted) = CoerceScalableToFixed( | 
|---|
| 3461 | CGF&: *this, ToTy: VecTyTo, FromTy: VecTyFrom, V: elt, Name: elt->getName()); | 
|---|
| 3462 | assert(Extracted && "Unexpected scalable to fixed vector coercion"); | 
|---|
| 3463 | } | 
|---|
| 3464 | } | 
|---|
| 3465 | Builder.CreateStore(Val: elt, Addr: eltAddr); | 
|---|
| 3466 | } | 
|---|
| 3467 | assert(argIndex == FirstIRArg + NumIRArgs); | 
|---|
| 3468 | break; | 
|---|
| 3469 | } | 
|---|
| 3470 |  | 
|---|
| 3471 | case ABIArgInfo::Expand: { | 
|---|
| 3472 | // If this structure was expanded into multiple arguments then | 
|---|
| 3473 | // we need to create a temporary and reconstruct it from the | 
|---|
| 3474 | // arguments. | 
|---|
| 3475 | Address Alloca = CreateMemTemp(T: Ty, Align: getContext().getDeclAlign(D: Arg)); | 
|---|
| 3476 | LValue LV = MakeAddrLValue(Addr: Alloca, T: Ty); | 
|---|
| 3477 | ArgVals.push_back(Elt: ParamValue::forIndirect(addr: Alloca)); | 
|---|
| 3478 |  | 
|---|
| 3479 | auto FnArgIter = Fn->arg_begin() + FirstIRArg; | 
|---|
| 3480 | ExpandTypeFromArgs(Ty, LV, AI&: FnArgIter); | 
|---|
| 3481 | assert(FnArgIter == Fn->arg_begin() + FirstIRArg + NumIRArgs); | 
|---|
| 3482 | for (unsigned i = 0, e = NumIRArgs; i != e; ++i) { | 
|---|
| 3483 | auto AI = Fn->getArg(i: FirstIRArg + i); | 
|---|
| 3484 | AI->setName(Arg->getName() + "."+ Twine(i)); | 
|---|
| 3485 | } | 
|---|
| 3486 | break; | 
|---|
| 3487 | } | 
|---|
| 3488 |  | 
|---|
| 3489 | case ABIArgInfo::Ignore: | 
|---|
| 3490 | assert(NumIRArgs == 0); | 
|---|
| 3491 | // Initialize the local variable appropriately. | 
|---|
| 3492 | if (!hasScalarEvaluationKind(T: Ty)) { | 
|---|
| 3493 | ArgVals.push_back(Elt: ParamValue::forIndirect(addr: CreateMemTemp(T: Ty))); | 
|---|
| 3494 | } else { | 
|---|
| 3495 | llvm::Value *U = llvm::UndefValue::get(T: ConvertType(T: Arg->getType())); | 
|---|
| 3496 | ArgVals.push_back(Elt: ParamValue::forDirect(value: U)); | 
|---|
| 3497 | } | 
|---|
| 3498 | break; | 
|---|
| 3499 | } | 
|---|
| 3500 | } | 
|---|
| 3501 |  | 
|---|
| 3502 | if (getTarget().getCXXABI().areArgsDestroyedLeftToRightInCallee()) { | 
|---|
| 3503 | for (int I = Args.size() - 1; I >= 0; --I) | 
|---|
| 3504 | EmitParmDecl(D: *Args[I], Arg: ArgVals[I], ArgNo: I + 1); | 
|---|
| 3505 | } else { | 
|---|
| 3506 | for (unsigned I = 0, E = Args.size(); I != E; ++I) | 
|---|
| 3507 | EmitParmDecl(D: *Args[I], Arg: ArgVals[I], ArgNo: I + 1); | 
|---|
| 3508 | } | 
|---|
| 3509 | } | 
|---|
| 3510 |  | 
|---|
| 3511 | static void eraseUnusedBitCasts(llvm::Instruction *insn) { | 
|---|
| 3512 | while (insn->use_empty()) { | 
|---|
| 3513 | llvm::BitCastInst *bitcast = dyn_cast<llvm::BitCastInst>(Val: insn); | 
|---|
| 3514 | if (!bitcast) | 
|---|
| 3515 | return; | 
|---|
| 3516 |  | 
|---|
| 3517 | // This is "safe" because we would have used a ConstantExpr otherwise. | 
|---|
| 3518 | insn = cast<llvm::Instruction>(Val: bitcast->getOperand(i_nocapture: 0)); | 
|---|
| 3519 | bitcast->eraseFromParent(); | 
|---|
| 3520 | } | 
|---|
| 3521 | } | 
|---|
| 3522 |  | 
|---|
| 3523 | /// Try to emit a fused autorelease of a return result. | 
|---|
| 3524 | static llvm::Value *tryEmitFusedAutoreleaseOfResult(CodeGenFunction &CGF, | 
|---|
| 3525 | llvm::Value *result) { | 
|---|
| 3526 | // We must be immediately followed the cast. | 
|---|
| 3527 | llvm::BasicBlock *BB = CGF.Builder.GetInsertBlock(); | 
|---|
| 3528 | if (BB->empty()) | 
|---|
| 3529 | return nullptr; | 
|---|
| 3530 | if (&BB->back() != result) | 
|---|
| 3531 | return nullptr; | 
|---|
| 3532 |  | 
|---|
| 3533 | llvm::Type *resultType = result->getType(); | 
|---|
| 3534 |  | 
|---|
| 3535 | // result is in a BasicBlock and is therefore an Instruction. | 
|---|
| 3536 | llvm::Instruction *generator = cast<llvm::Instruction>(Val: result); | 
|---|
| 3537 |  | 
|---|
| 3538 | SmallVector<llvm::Instruction *, 4> InstsToKill; | 
|---|
| 3539 |  | 
|---|
| 3540 | // Look for: | 
|---|
| 3541 | //  %generator = bitcast %type1* %generator2 to %type2* | 
|---|
| 3542 | while (llvm::BitCastInst *bitcast = dyn_cast<llvm::BitCastInst>(Val: generator)) { | 
|---|
| 3543 | // We would have emitted this as a constant if the operand weren't | 
|---|
| 3544 | // an Instruction. | 
|---|
| 3545 | generator = cast<llvm::Instruction>(Val: bitcast->getOperand(i_nocapture: 0)); | 
|---|
| 3546 |  | 
|---|
| 3547 | // Require the generator to be immediately followed by the cast. | 
|---|
| 3548 | if (generator->getNextNode() != bitcast) | 
|---|
| 3549 | return nullptr; | 
|---|
| 3550 |  | 
|---|
| 3551 | InstsToKill.push_back(Elt: bitcast); | 
|---|
| 3552 | } | 
|---|
| 3553 |  | 
|---|
| 3554 | // Look for: | 
|---|
| 3555 | //   %generator = call i8* @objc_retain(i8* %originalResult) | 
|---|
| 3556 | // or | 
|---|
| 3557 | //   %generator = call i8* @objc_retainAutoreleasedReturnValue(i8* %originalResult) | 
|---|
| 3558 | llvm::CallInst *call = dyn_cast<llvm::CallInst>(Val: generator); | 
|---|
| 3559 | if (!call) | 
|---|
| 3560 | return nullptr; | 
|---|
| 3561 |  | 
|---|
| 3562 | bool doRetainAutorelease; | 
|---|
| 3563 |  | 
|---|
| 3564 | if (call->getCalledOperand() == CGF.CGM.getObjCEntrypoints().objc_retain) { | 
|---|
| 3565 | doRetainAutorelease = true; | 
|---|
| 3566 | } else if (call->getCalledOperand() == | 
|---|
| 3567 | CGF.CGM.getObjCEntrypoints().objc_retainAutoreleasedReturnValue) { | 
|---|
| 3568 | doRetainAutorelease = false; | 
|---|
| 3569 |  | 
|---|
| 3570 | // If we emitted an assembly marker for this call (and the | 
|---|
| 3571 | // ARCEntrypoints field should have been set if so), go looking | 
|---|
| 3572 | // for that call.  If we can't find it, we can't do this | 
|---|
| 3573 | // optimization.  But it should always be the immediately previous | 
|---|
| 3574 | // instruction, unless we needed bitcasts around the call. | 
|---|
| 3575 | if (CGF.CGM.getObjCEntrypoints().retainAutoreleasedReturnValueMarker) { | 
|---|
| 3576 | llvm::Instruction *prev = call->getPrevNode(); | 
|---|
| 3577 | assert(prev); | 
|---|
| 3578 | if (isa<llvm::BitCastInst>(Val: prev)) { | 
|---|
| 3579 | prev = prev->getPrevNode(); | 
|---|
| 3580 | assert(prev); | 
|---|
| 3581 | } | 
|---|
| 3582 | assert(isa<llvm::CallInst>(prev)); | 
|---|
| 3583 | assert(cast<llvm::CallInst>(prev)->getCalledOperand() == | 
|---|
| 3584 | CGF.CGM.getObjCEntrypoints().retainAutoreleasedReturnValueMarker); | 
|---|
| 3585 | InstsToKill.push_back(Elt: prev); | 
|---|
| 3586 | } | 
|---|
| 3587 | } else { | 
|---|
| 3588 | return nullptr; | 
|---|
| 3589 | } | 
|---|
| 3590 |  | 
|---|
| 3591 | result = call->getArgOperand(i: 0); | 
|---|
| 3592 | InstsToKill.push_back(Elt: call); | 
|---|
| 3593 |  | 
|---|
| 3594 | // Keep killing bitcasts, for sanity.  Note that we no longer care | 
|---|
| 3595 | // about precise ordering as long as there's exactly one use. | 
|---|
| 3596 | while (llvm::BitCastInst *bitcast = dyn_cast<llvm::BitCastInst>(Val: result)) { | 
|---|
| 3597 | if (!bitcast->hasOneUse()) | 
|---|
| 3598 | break; | 
|---|
| 3599 | InstsToKill.push_back(Elt: bitcast); | 
|---|
| 3600 | result = bitcast->getOperand(i_nocapture: 0); | 
|---|
| 3601 | } | 
|---|
| 3602 |  | 
|---|
| 3603 | // Delete all the unnecessary instructions, from latest to earliest. | 
|---|
| 3604 | for (auto *I : InstsToKill) | 
|---|
| 3605 | I->eraseFromParent(); | 
|---|
| 3606 |  | 
|---|
| 3607 | // Do the fused retain/autorelease if we were asked to. | 
|---|
| 3608 | if (doRetainAutorelease) | 
|---|
| 3609 | result = CGF.EmitARCRetainAutoreleaseReturnValue(value: result); | 
|---|
| 3610 |  | 
|---|
| 3611 | // Cast back to the result type. | 
|---|
| 3612 | return CGF.Builder.CreateBitCast(V: result, DestTy: resultType); | 
|---|
| 3613 | } | 
|---|
| 3614 |  | 
|---|
| 3615 | /// If this is a +1 of the value of an immutable 'self', remove it. | 
|---|
| 3616 | static llvm::Value *tryRemoveRetainOfSelf(CodeGenFunction &CGF, | 
|---|
| 3617 | llvm::Value *result) { | 
|---|
| 3618 | // This is only applicable to a method with an immutable 'self'. | 
|---|
| 3619 | const ObjCMethodDecl *method = | 
|---|
| 3620 | dyn_cast_or_null<ObjCMethodDecl>(Val: CGF.CurCodeDecl); | 
|---|
| 3621 | if (!method) | 
|---|
| 3622 | return nullptr; | 
|---|
| 3623 | const VarDecl *self = method->getSelfDecl(); | 
|---|
| 3624 | if (!self->getType().isConstQualified()) | 
|---|
| 3625 | return nullptr; | 
|---|
| 3626 |  | 
|---|
| 3627 | // Look for a retain call. Note: stripPointerCasts looks through returned arg | 
|---|
| 3628 | // functions, which would cause us to miss the retain. | 
|---|
| 3629 | llvm::CallInst *retainCall = dyn_cast<llvm::CallInst>(Val: result); | 
|---|
| 3630 | if (!retainCall || retainCall->getCalledOperand() != | 
|---|
| 3631 | CGF.CGM.getObjCEntrypoints().objc_retain) | 
|---|
| 3632 | return nullptr; | 
|---|
| 3633 |  | 
|---|
| 3634 | // Look for an ordinary load of 'self'. | 
|---|
| 3635 | llvm::Value *retainedValue = retainCall->getArgOperand(i: 0); | 
|---|
| 3636 | llvm::LoadInst *load = | 
|---|
| 3637 | dyn_cast<llvm::LoadInst>(Val: retainedValue->stripPointerCasts()); | 
|---|
| 3638 | if (!load || load->isAtomic() || load->isVolatile() || | 
|---|
| 3639 | load->getPointerOperand() != CGF.GetAddrOfLocalVar(VD: self).getBasePointer()) | 
|---|
| 3640 | return nullptr; | 
|---|
| 3641 |  | 
|---|
| 3642 | // Okay!  Burn it all down.  This relies for correctness on the | 
|---|
| 3643 | // assumption that the retain is emitted as part of the return and | 
|---|
| 3644 | // that thereafter everything is used "linearly". | 
|---|
| 3645 | llvm::Type *resultType = result->getType(); | 
|---|
| 3646 | eraseUnusedBitCasts(insn: cast<llvm::Instruction>(Val: result)); | 
|---|
| 3647 | assert(retainCall->use_empty()); | 
|---|
| 3648 | retainCall->eraseFromParent(); | 
|---|
| 3649 | eraseUnusedBitCasts(insn: cast<llvm::Instruction>(Val: retainedValue)); | 
|---|
| 3650 |  | 
|---|
| 3651 | return CGF.Builder.CreateBitCast(V: load, DestTy: resultType); | 
|---|
| 3652 | } | 
|---|
| 3653 |  | 
|---|
| 3654 | /// Emit an ARC autorelease of the result of a function. | 
|---|
| 3655 | /// | 
|---|
| 3656 | /// \return the value to actually return from the function | 
|---|
| 3657 | static llvm::Value *emitAutoreleaseOfResult(CodeGenFunction &CGF, | 
|---|
| 3658 | llvm::Value *result) { | 
|---|
| 3659 | // If we're returning 'self', kill the initial retain.  This is a | 
|---|
| 3660 | // heuristic attempt to "encourage correctness" in the really unfortunate | 
|---|
| 3661 | // case where we have a return of self during a dealloc and we desperately | 
|---|
| 3662 | // need to avoid the possible autorelease. | 
|---|
| 3663 | if (llvm::Value *self = tryRemoveRetainOfSelf(CGF, result)) | 
|---|
| 3664 | return self; | 
|---|
| 3665 |  | 
|---|
| 3666 | // At -O0, try to emit a fused retain/autorelease. | 
|---|
| 3667 | if (CGF.shouldUseFusedARCCalls()) | 
|---|
| 3668 | if (llvm::Value *fused = tryEmitFusedAutoreleaseOfResult(CGF, result)) | 
|---|
| 3669 | return fused; | 
|---|
| 3670 |  | 
|---|
| 3671 | return CGF.EmitARCAutoreleaseReturnValue(value: result); | 
|---|
| 3672 | } | 
|---|
| 3673 |  | 
|---|
| 3674 | /// Heuristically search for a dominating store to the return-value slot. | 
|---|
| 3675 | static llvm::StoreInst *findDominatingStoreToReturnValue(CodeGenFunction &CGF) { | 
|---|
| 3676 | llvm::Value *ReturnValuePtr = CGF.ReturnValue.getBasePointer(); | 
|---|
| 3677 |  | 
|---|
| 3678 | // Check if a User is a store which pointerOperand is the ReturnValue. | 
|---|
| 3679 | // We are looking for stores to the ReturnValue, not for stores of the | 
|---|
| 3680 | // ReturnValue to some other location. | 
|---|
| 3681 | auto GetStoreIfValid = [&CGF, | 
|---|
| 3682 | ReturnValuePtr](llvm::User *U) -> llvm::StoreInst * { | 
|---|
| 3683 | auto *SI = dyn_cast<llvm::StoreInst>(Val: U); | 
|---|
| 3684 | if (!SI || SI->getPointerOperand() != ReturnValuePtr || | 
|---|
| 3685 | SI->getValueOperand()->getType() != CGF.ReturnValue.getElementType()) | 
|---|
| 3686 | return nullptr; | 
|---|
| 3687 | // These aren't actually possible for non-coerced returns, and we | 
|---|
| 3688 | // only care about non-coerced returns on this code path. | 
|---|
| 3689 | // All memory instructions inside __try block are volatile. | 
|---|
| 3690 | assert(!SI->isAtomic() && | 
|---|
| 3691 | (!SI->isVolatile() || CGF.currentFunctionUsesSEHTry())); | 
|---|
| 3692 | return SI; | 
|---|
| 3693 | }; | 
|---|
| 3694 | // If there are multiple uses of the return-value slot, just check | 
|---|
| 3695 | // for something immediately preceding the IP.  Sometimes this can | 
|---|
| 3696 | // happen with how we generate implicit-returns; it can also happen | 
|---|
| 3697 | // with noreturn cleanups. | 
|---|
| 3698 | if (!ReturnValuePtr->hasOneUse()) { | 
|---|
| 3699 | llvm::BasicBlock *IP = CGF.Builder.GetInsertBlock(); | 
|---|
| 3700 | if (IP->empty()) | 
|---|
| 3701 | return nullptr; | 
|---|
| 3702 |  | 
|---|
| 3703 | // Look at directly preceding instruction, skipping bitcasts, lifetime | 
|---|
| 3704 | // markers, and fake uses and their operands. | 
|---|
| 3705 | const llvm::Instruction *LoadIntoFakeUse = nullptr; | 
|---|
| 3706 | for (llvm::Instruction &I : llvm::reverse(C&: *IP)) { | 
|---|
| 3707 | // Ignore instructions that are just loads for fake uses; the load should | 
|---|
| 3708 | // immediately precede the fake use, so we only need to remember the | 
|---|
| 3709 | // operand for the last fake use seen. | 
|---|
| 3710 | if (LoadIntoFakeUse == &I) | 
|---|
| 3711 | continue; | 
|---|
| 3712 | if (isa<llvm::BitCastInst>(Val: &I)) | 
|---|
| 3713 | continue; | 
|---|
| 3714 | if (auto *II = dyn_cast<llvm::IntrinsicInst>(Val: &I)) { | 
|---|
| 3715 | if (II->getIntrinsicID() == llvm::Intrinsic::lifetime_end) | 
|---|
| 3716 | continue; | 
|---|
| 3717 |  | 
|---|
| 3718 | if (II->getIntrinsicID() == llvm::Intrinsic::fake_use) { | 
|---|
| 3719 | LoadIntoFakeUse = dyn_cast<llvm::Instruction>(Val: II->getArgOperand(i: 0)); | 
|---|
| 3720 | continue; | 
|---|
| 3721 | } | 
|---|
| 3722 | } | 
|---|
| 3723 | return GetStoreIfValid(&I); | 
|---|
| 3724 | } | 
|---|
| 3725 | return nullptr; | 
|---|
| 3726 | } | 
|---|
| 3727 |  | 
|---|
| 3728 | llvm::StoreInst *store = GetStoreIfValid(ReturnValuePtr->user_back()); | 
|---|
| 3729 | if (!store) | 
|---|
| 3730 | return nullptr; | 
|---|
| 3731 |  | 
|---|
| 3732 | // Now do a first-and-dirty dominance check: just walk up the | 
|---|
| 3733 | // single-predecessors chain from the current insertion point. | 
|---|
| 3734 | llvm::BasicBlock *StoreBB = store->getParent(); | 
|---|
| 3735 | llvm::BasicBlock *IP = CGF.Builder.GetInsertBlock(); | 
|---|
| 3736 | llvm::SmallPtrSet<llvm::BasicBlock *, 4> SeenBBs; | 
|---|
| 3737 | while (IP != StoreBB) { | 
|---|
| 3738 | if (!SeenBBs.insert(Ptr: IP).second || !(IP = IP->getSinglePredecessor())) | 
|---|
| 3739 | return nullptr; | 
|---|
| 3740 | } | 
|---|
| 3741 |  | 
|---|
| 3742 | // Okay, the store's basic block dominates the insertion point; we | 
|---|
| 3743 | // can do our thing. | 
|---|
| 3744 | return store; | 
|---|
| 3745 | } | 
|---|
| 3746 |  | 
|---|
| 3747 | // Helper functions for EmitCMSEClearRecord | 
|---|
| 3748 |  | 
|---|
| 3749 | // Set the bits corresponding to a field having width `BitWidth` and located at | 
|---|
| 3750 | // offset `BitOffset` (from the least significant bit) within a storage unit of | 
|---|
| 3751 | // `Bits.size()` bytes. Each element of `Bits` corresponds to one target byte. | 
|---|
| 3752 | // Use little-endian layout, i.e.`Bits[0]` is the LSB. | 
|---|
| 3753 | static void setBitRange(SmallVectorImpl<uint64_t> &Bits, int BitOffset, | 
|---|
| 3754 | int BitWidth, int CharWidth) { | 
|---|
| 3755 | assert(CharWidth <= 64); | 
|---|
| 3756 | assert(static_cast<unsigned>(BitWidth) <= Bits.size() * CharWidth); | 
|---|
| 3757 |  | 
|---|
| 3758 | int Pos = 0; | 
|---|
| 3759 | if (BitOffset >= CharWidth) { | 
|---|
| 3760 | Pos += BitOffset / CharWidth; | 
|---|
| 3761 | BitOffset = BitOffset % CharWidth; | 
|---|
| 3762 | } | 
|---|
| 3763 |  | 
|---|
| 3764 | const uint64_t Used = (uint64_t(1) << CharWidth) - 1; | 
|---|
| 3765 | if (BitOffset + BitWidth >= CharWidth) { | 
|---|
| 3766 | Bits[Pos++] |= (Used << BitOffset) & Used; | 
|---|
| 3767 | BitWidth -= CharWidth - BitOffset; | 
|---|
| 3768 | BitOffset = 0; | 
|---|
| 3769 | } | 
|---|
| 3770 |  | 
|---|
| 3771 | while (BitWidth >= CharWidth) { | 
|---|
| 3772 | Bits[Pos++] = Used; | 
|---|
| 3773 | BitWidth -= CharWidth; | 
|---|
| 3774 | } | 
|---|
| 3775 |  | 
|---|
| 3776 | if (BitWidth > 0) | 
|---|
| 3777 | Bits[Pos++] |= (Used >> (CharWidth - BitWidth)) << BitOffset; | 
|---|
| 3778 | } | 
|---|
| 3779 |  | 
|---|
| 3780 | // Set the bits corresponding to a field having width `BitWidth` and located at | 
|---|
| 3781 | // offset `BitOffset` (from the least significant bit) within a storage unit of | 
|---|
| 3782 | // `StorageSize` bytes, located at `StorageOffset` in `Bits`. Each element of | 
|---|
| 3783 | // `Bits` corresponds to one target byte. Use target endian layout. | 
|---|
| 3784 | static void setBitRange(SmallVectorImpl<uint64_t> &Bits, int StorageOffset, | 
|---|
| 3785 | int StorageSize, int BitOffset, int BitWidth, | 
|---|
| 3786 | int CharWidth, bool BigEndian) { | 
|---|
| 3787 |  | 
|---|
| 3788 | SmallVector<uint64_t, 8> TmpBits(StorageSize); | 
|---|
| 3789 | setBitRange(Bits&: TmpBits, BitOffset, BitWidth, CharWidth); | 
|---|
| 3790 |  | 
|---|
| 3791 | if (BigEndian) | 
|---|
| 3792 | std::reverse(first: TmpBits.begin(), last: TmpBits.end()); | 
|---|
| 3793 |  | 
|---|
| 3794 | for (uint64_t V : TmpBits) | 
|---|
| 3795 | Bits[StorageOffset++] |= V; | 
|---|
| 3796 | } | 
|---|
| 3797 |  | 
|---|
| 3798 | static void setUsedBits(CodeGenModule &, QualType, int, | 
|---|
| 3799 | SmallVectorImpl<uint64_t> &); | 
|---|
| 3800 |  | 
|---|
| 3801 | // Set the bits in `Bits`, which correspond to the value representations of | 
|---|
| 3802 | // the actual members of the record type `RTy`. Note that this function does | 
|---|
| 3803 | // not handle base classes, virtual tables, etc, since they cannot happen in | 
|---|
| 3804 | // CMSE function arguments or return. The bit mask corresponds to the target | 
|---|
| 3805 | // memory layout, i.e. it's endian dependent. | 
|---|
| 3806 | static void setUsedBits(CodeGenModule &CGM, const RecordType *RTy, int Offset, | 
|---|
| 3807 | SmallVectorImpl<uint64_t> &Bits) { | 
|---|
| 3808 | ASTContext &Context = CGM.getContext(); | 
|---|
| 3809 | int CharWidth = Context.getCharWidth(); | 
|---|
| 3810 | const RecordDecl *RD = RTy->getDecl()->getDefinition(); | 
|---|
| 3811 | const ASTRecordLayout &ASTLayout = Context.getASTRecordLayout(D: RD); | 
|---|
| 3812 | const CGRecordLayout &Layout = CGM.getTypes().getCGRecordLayout(RD); | 
|---|
| 3813 |  | 
|---|
| 3814 | int Idx = 0; | 
|---|
| 3815 | for (auto I = RD->field_begin(), E = RD->field_end(); I != E; ++I, ++Idx) { | 
|---|
| 3816 | const FieldDecl *F = *I; | 
|---|
| 3817 |  | 
|---|
| 3818 | if (F->isUnnamedBitField() || F->isZeroLengthBitField() || | 
|---|
| 3819 | F->getType()->isIncompleteArrayType()) | 
|---|
| 3820 | continue; | 
|---|
| 3821 |  | 
|---|
| 3822 | if (F->isBitField()) { | 
|---|
| 3823 | const CGBitFieldInfo &BFI = Layout.getBitFieldInfo(FD: F); | 
|---|
| 3824 | setBitRange(Bits, StorageOffset: Offset + BFI.StorageOffset.getQuantity(), | 
|---|
| 3825 | StorageSize: BFI.StorageSize / CharWidth, BitOffset: BFI.Offset, BitWidth: BFI.Size, CharWidth, | 
|---|
| 3826 | BigEndian: CGM.getDataLayout().isBigEndian()); | 
|---|
| 3827 | continue; | 
|---|
| 3828 | } | 
|---|
| 3829 |  | 
|---|
| 3830 | setUsedBits(CGM, F->getType(), | 
|---|
| 3831 | Offset + ASTLayout.getFieldOffset(FieldNo: Idx) / CharWidth, Bits); | 
|---|
| 3832 | } | 
|---|
| 3833 | } | 
|---|
| 3834 |  | 
|---|
| 3835 | // Set the bits in `Bits`, which correspond to the value representations of | 
|---|
| 3836 | // the elements of an array type `ATy`. | 
|---|
| 3837 | static void setUsedBits(CodeGenModule &CGM, const ConstantArrayType *ATy, | 
|---|
| 3838 | int Offset, SmallVectorImpl<uint64_t> &Bits) { | 
|---|
| 3839 | const ASTContext &Context = CGM.getContext(); | 
|---|
| 3840 |  | 
|---|
| 3841 | QualType ETy = Context.getBaseElementType(VAT: ATy); | 
|---|
| 3842 | int Size = Context.getTypeSizeInChars(T: ETy).getQuantity(); | 
|---|
| 3843 | SmallVector<uint64_t, 4> TmpBits(Size); | 
|---|
| 3844 | setUsedBits(CGM, ETy, 0, TmpBits); | 
|---|
| 3845 |  | 
|---|
| 3846 | for (int I = 0, N = Context.getConstantArrayElementCount(CA: ATy); I < N; ++I) { | 
|---|
| 3847 | auto Src = TmpBits.begin(); | 
|---|
| 3848 | auto Dst = Bits.begin() + Offset + I * Size; | 
|---|
| 3849 | for (int J = 0; J < Size; ++J) | 
|---|
| 3850 | *Dst++ |= *Src++; | 
|---|
| 3851 | } | 
|---|
| 3852 | } | 
|---|
| 3853 |  | 
|---|
| 3854 | // Set the bits in `Bits`, which correspond to the value representations of | 
|---|
| 3855 | // the type `QTy`. | 
|---|
| 3856 | static void setUsedBits(CodeGenModule &CGM, QualType QTy, int Offset, | 
|---|
| 3857 | SmallVectorImpl<uint64_t> &Bits) { | 
|---|
| 3858 | if (const auto *RTy = QTy->getAs<RecordType>()) | 
|---|
| 3859 | return setUsedBits(CGM, RTy, Offset, Bits); | 
|---|
| 3860 |  | 
|---|
| 3861 | ASTContext &Context = CGM.getContext(); | 
|---|
| 3862 | if (const auto *ATy = Context.getAsConstantArrayType(T: QTy)) | 
|---|
| 3863 | return setUsedBits(CGM, ATy, Offset, Bits); | 
|---|
| 3864 |  | 
|---|
| 3865 | int Size = Context.getTypeSizeInChars(T: QTy).getQuantity(); | 
|---|
| 3866 | if (Size <= 0) | 
|---|
| 3867 | return; | 
|---|
| 3868 |  | 
|---|
| 3869 | std::fill_n(first: Bits.begin() + Offset, n: Size, | 
|---|
| 3870 | value: (uint64_t(1) << Context.getCharWidth()) - 1); | 
|---|
| 3871 | } | 
|---|
| 3872 |  | 
|---|
| 3873 | static uint64_t buildMultiCharMask(const SmallVectorImpl<uint64_t> &Bits, | 
|---|
| 3874 | int Pos, int Size, int CharWidth, | 
|---|
| 3875 | bool BigEndian) { | 
|---|
| 3876 | assert(Size > 0); | 
|---|
| 3877 | uint64_t Mask = 0; | 
|---|
| 3878 | if (BigEndian) { | 
|---|
| 3879 | for (auto P = Bits.begin() + Pos, E = Bits.begin() + Pos + Size; P != E; | 
|---|
| 3880 | ++P) | 
|---|
| 3881 | Mask = (Mask << CharWidth) | *P; | 
|---|
| 3882 | } else { | 
|---|
| 3883 | auto P = Bits.begin() + Pos + Size, End = Bits.begin() + Pos; | 
|---|
| 3884 | do | 
|---|
| 3885 | Mask = (Mask << CharWidth) | *--P; | 
|---|
| 3886 | while (P != End); | 
|---|
| 3887 | } | 
|---|
| 3888 | return Mask; | 
|---|
| 3889 | } | 
|---|
| 3890 |  | 
|---|
| 3891 | // Emit code to clear the bits in a record, which aren't a part of any user | 
|---|
| 3892 | // declared member, when the record is a function return. | 
|---|
| 3893 | llvm::Value *CodeGenFunction::EmitCMSEClearRecord(llvm::Value *Src, | 
|---|
| 3894 | llvm::IntegerType *ITy, | 
|---|
| 3895 | QualType QTy) { | 
|---|
| 3896 | assert(Src->getType() == ITy); | 
|---|
| 3897 | assert(ITy->getScalarSizeInBits() <= 64); | 
|---|
| 3898 |  | 
|---|
| 3899 | const llvm::DataLayout &DataLayout = CGM.getDataLayout(); | 
|---|
| 3900 | int Size = DataLayout.getTypeStoreSize(Ty: ITy); | 
|---|
| 3901 | SmallVector<uint64_t, 4> Bits(Size); | 
|---|
| 3902 | setUsedBits(CGM, RTy: QTy->castAs<RecordType>(), Offset: 0, Bits); | 
|---|
| 3903 |  | 
|---|
| 3904 | int CharWidth = CGM.getContext().getCharWidth(); | 
|---|
| 3905 | uint64_t Mask = | 
|---|
| 3906 | buildMultiCharMask(Bits, Pos: 0, Size, CharWidth, BigEndian: DataLayout.isBigEndian()); | 
|---|
| 3907 |  | 
|---|
| 3908 | return Builder.CreateAnd(LHS: Src, RHS: Mask, Name: "cmse.clear"); | 
|---|
| 3909 | } | 
|---|
| 3910 |  | 
|---|
| 3911 | // Emit code to clear the bits in a record, which aren't a part of any user | 
|---|
| 3912 | // declared member, when the record is a function argument. | 
|---|
| 3913 | llvm::Value *CodeGenFunction::EmitCMSEClearRecord(llvm::Value *Src, | 
|---|
| 3914 | llvm::ArrayType *ATy, | 
|---|
| 3915 | QualType QTy) { | 
|---|
| 3916 | const llvm::DataLayout &DataLayout = CGM.getDataLayout(); | 
|---|
| 3917 | int Size = DataLayout.getTypeStoreSize(Ty: ATy); | 
|---|
| 3918 | SmallVector<uint64_t, 16> Bits(Size); | 
|---|
| 3919 | setUsedBits(CGM, RTy: QTy->castAs<RecordType>(), Offset: 0, Bits); | 
|---|
| 3920 |  | 
|---|
| 3921 | // Clear each element of the LLVM array. | 
|---|
| 3922 | int CharWidth = CGM.getContext().getCharWidth(); | 
|---|
| 3923 | int CharsPerElt = | 
|---|
| 3924 | ATy->getArrayElementType()->getScalarSizeInBits() / CharWidth; | 
|---|
| 3925 | int MaskIndex = 0; | 
|---|
| 3926 | llvm::Value *R = llvm::PoisonValue::get(T: ATy); | 
|---|
| 3927 | for (int I = 0, N = ATy->getArrayNumElements(); I != N; ++I) { | 
|---|
| 3928 | uint64_t Mask = buildMultiCharMask(Bits, Pos: MaskIndex, Size: CharsPerElt, CharWidth, | 
|---|
| 3929 | BigEndian: DataLayout.isBigEndian()); | 
|---|
| 3930 | MaskIndex += CharsPerElt; | 
|---|
| 3931 | llvm::Value *T0 = Builder.CreateExtractValue(Agg: Src, Idxs: I); | 
|---|
| 3932 | llvm::Value *T1 = Builder.CreateAnd(LHS: T0, RHS: Mask, Name: "cmse.clear"); | 
|---|
| 3933 | R = Builder.CreateInsertValue(Agg: R, Val: T1, Idxs: I); | 
|---|
| 3934 | } | 
|---|
| 3935 |  | 
|---|
| 3936 | return R; | 
|---|
| 3937 | } | 
|---|
| 3938 |  | 
|---|
| 3939 | void CodeGenFunction::EmitFunctionEpilog( | 
|---|
| 3940 | const CGFunctionInfo &FI, bool EmitRetDbgLoc, SourceLocation EndLoc, | 
|---|
| 3941 | uint64_t RetKeyInstructionsSourceAtom) { | 
|---|
| 3942 | if (FI.isNoReturn()) { | 
|---|
| 3943 | // Noreturn functions don't return. | 
|---|
| 3944 | EmitUnreachable(Loc: EndLoc); | 
|---|
| 3945 | return; | 
|---|
| 3946 | } | 
|---|
| 3947 |  | 
|---|
| 3948 | if (CurCodeDecl && CurCodeDecl->hasAttr<NakedAttr>()) { | 
|---|
| 3949 | // Naked functions don't have epilogues. | 
|---|
| 3950 | Builder.CreateUnreachable(); | 
|---|
| 3951 | return; | 
|---|
| 3952 | } | 
|---|
| 3953 |  | 
|---|
| 3954 | // Functions with no result always return void. | 
|---|
| 3955 | if (!ReturnValue.isValid()) { | 
|---|
| 3956 | auto *I = Builder.CreateRetVoid(); | 
|---|
| 3957 | if (RetKeyInstructionsSourceAtom) | 
|---|
| 3958 | addInstToSpecificSourceAtom(KeyInstruction: I, Backup: nullptr, Atom: RetKeyInstructionsSourceAtom); | 
|---|
| 3959 | else | 
|---|
| 3960 | addInstToNewSourceAtom(KeyInstruction: I, Backup: nullptr); | 
|---|
| 3961 | return; | 
|---|
| 3962 | } | 
|---|
| 3963 |  | 
|---|
| 3964 | llvm::DebugLoc RetDbgLoc; | 
|---|
| 3965 | llvm::Value *RV = nullptr; | 
|---|
| 3966 | QualType RetTy = FI.getReturnType(); | 
|---|
| 3967 | const ABIArgInfo &RetAI = FI.getReturnInfo(); | 
|---|
| 3968 |  | 
|---|
| 3969 | switch (RetAI.getKind()) { | 
|---|
| 3970 | case ABIArgInfo::InAlloca: | 
|---|
| 3971 | // Aggregates get evaluated directly into the destination.  Sometimes we | 
|---|
| 3972 | // need to return the sret value in a register, though. | 
|---|
| 3973 | assert(hasAggregateEvaluationKind(RetTy)); | 
|---|
| 3974 | if (RetAI.getInAllocaSRet()) { | 
|---|
| 3975 | llvm::Function::arg_iterator EI = CurFn->arg_end(); | 
|---|
| 3976 | --EI; | 
|---|
| 3977 | llvm::Value *ArgStruct = &*EI; | 
|---|
| 3978 | llvm::Value *SRet = Builder.CreateStructGEP( | 
|---|
| 3979 | Ty: FI.getArgStruct(), Ptr: ArgStruct, Idx: RetAI.getInAllocaFieldIndex()); | 
|---|
| 3980 | llvm::Type *Ty = | 
|---|
| 3981 | cast<llvm::GetElementPtrInst>(Val: SRet)->getResultElementType(); | 
|---|
| 3982 | RV = Builder.CreateAlignedLoad(Ty, Addr: SRet, Align: getPointerAlign(), Name: "sret"); | 
|---|
| 3983 | } | 
|---|
| 3984 | break; | 
|---|
| 3985 |  | 
|---|
| 3986 | case ABIArgInfo::Indirect: { | 
|---|
| 3987 | auto AI = CurFn->arg_begin(); | 
|---|
| 3988 | if (RetAI.isSRetAfterThis()) | 
|---|
| 3989 | ++AI; | 
|---|
| 3990 | switch (getEvaluationKind(T: RetTy)) { | 
|---|
| 3991 | case TEK_Complex: { | 
|---|
| 3992 | ComplexPairTy RT = | 
|---|
| 3993 | EmitLoadOfComplex(src: MakeAddrLValue(Addr: ReturnValue, T: RetTy), loc: EndLoc); | 
|---|
| 3994 | EmitStoreOfComplex(V: RT, dest: MakeNaturalAlignAddrLValue(V: &*AI, T: RetTy), | 
|---|
| 3995 | /*isInit*/ true); | 
|---|
| 3996 | break; | 
|---|
| 3997 | } | 
|---|
| 3998 | case TEK_Aggregate: | 
|---|
| 3999 | // Do nothing; aggregates get evaluated directly into the destination. | 
|---|
| 4000 | break; | 
|---|
| 4001 | case TEK_Scalar: { | 
|---|
| 4002 | LValueBaseInfo BaseInfo; | 
|---|
| 4003 | TBAAAccessInfo TBAAInfo; | 
|---|
| 4004 | CharUnits Alignment = | 
|---|
| 4005 | CGM.getNaturalTypeAlignment(T: RetTy, BaseInfo: &BaseInfo, TBAAInfo: &TBAAInfo); | 
|---|
| 4006 | Address ArgAddr(&*AI, ConvertType(T: RetTy), Alignment); | 
|---|
| 4007 | LValue ArgVal = | 
|---|
| 4008 | LValue::MakeAddr(Addr: ArgAddr, type: RetTy, Context&: getContext(), BaseInfo, TBAAInfo); | 
|---|
| 4009 | EmitStoreOfScalar( | 
|---|
| 4010 | value: EmitLoadOfScalar(lvalue: MakeAddrLValue(Addr: ReturnValue, T: RetTy), Loc: EndLoc), lvalue: ArgVal, | 
|---|
| 4011 | /*isInit*/ true); | 
|---|
| 4012 | break; | 
|---|
| 4013 | } | 
|---|
| 4014 | } | 
|---|
| 4015 | break; | 
|---|
| 4016 | } | 
|---|
| 4017 |  | 
|---|
| 4018 | case ABIArgInfo::Extend: | 
|---|
| 4019 | case ABIArgInfo::Direct: | 
|---|
| 4020 | if (RetAI.getCoerceToType() == ConvertType(T: RetTy) && | 
|---|
| 4021 | RetAI.getDirectOffset() == 0) { | 
|---|
| 4022 | // The internal return value temp always will have pointer-to-return-type | 
|---|
| 4023 | // type, just do a load. | 
|---|
| 4024 |  | 
|---|
| 4025 | // If there is a dominating store to ReturnValue, we can elide | 
|---|
| 4026 | // the load, zap the store, and usually zap the alloca. | 
|---|
| 4027 | if (llvm::StoreInst *SI = findDominatingStoreToReturnValue(CGF&: *this)) { | 
|---|
| 4028 | // Reuse the debug location from the store unless there is | 
|---|
| 4029 | // cleanup code to be emitted between the store and return | 
|---|
| 4030 | // instruction. | 
|---|
| 4031 | if (EmitRetDbgLoc && !AutoreleaseResult) | 
|---|
| 4032 | RetDbgLoc = SI->getDebugLoc(); | 
|---|
| 4033 | // Get the stored value and nuke the now-dead store. | 
|---|
| 4034 | RV = SI->getValueOperand(); | 
|---|
| 4035 | SI->eraseFromParent(); | 
|---|
| 4036 |  | 
|---|
| 4037 | // Otherwise, we have to do a simple load. | 
|---|
| 4038 | } else { | 
|---|
| 4039 | RV = Builder.CreateLoad(Addr: ReturnValue); | 
|---|
| 4040 | } | 
|---|
| 4041 | } else { | 
|---|
| 4042 | // If the value is offset in memory, apply the offset now. | 
|---|
| 4043 | Address V = emitAddressAtOffset(CGF&: *this, addr: ReturnValue, info: RetAI); | 
|---|
| 4044 |  | 
|---|
| 4045 | RV = CreateCoercedLoad(Src: V, Ty: RetAI.getCoerceToType(), CGF&: *this); | 
|---|
| 4046 | } | 
|---|
| 4047 |  | 
|---|
| 4048 | // In ARC, end functions that return a retainable type with a call | 
|---|
| 4049 | // to objc_autoreleaseReturnValue. | 
|---|
| 4050 | if (AutoreleaseResult) { | 
|---|
| 4051 | #ifndef NDEBUG | 
|---|
| 4052 | // Type::isObjCRetainabletype has to be called on a QualType that hasn't | 
|---|
| 4053 | // been stripped of the typedefs, so we cannot use RetTy here. Get the | 
|---|
| 4054 | // original return type of FunctionDecl, CurCodeDecl, and BlockDecl from | 
|---|
| 4055 | // CurCodeDecl or BlockInfo. | 
|---|
| 4056 | QualType RT; | 
|---|
| 4057 |  | 
|---|
| 4058 | if (auto *FD = dyn_cast<FunctionDecl>(CurCodeDecl)) | 
|---|
| 4059 | RT = FD->getReturnType(); | 
|---|
| 4060 | else if (auto *MD = dyn_cast<ObjCMethodDecl>(CurCodeDecl)) | 
|---|
| 4061 | RT = MD->getReturnType(); | 
|---|
| 4062 | else if (isa<BlockDecl>(CurCodeDecl)) | 
|---|
| 4063 | RT = BlockInfo->BlockExpression->getFunctionType()->getReturnType(); | 
|---|
| 4064 | else | 
|---|
| 4065 | llvm_unreachable( "Unexpected function/method type"); | 
|---|
| 4066 |  | 
|---|
| 4067 | assert(getLangOpts().ObjCAutoRefCount && !FI.isReturnsRetained() && | 
|---|
| 4068 | RT->isObjCRetainableType()); | 
|---|
| 4069 | #endif | 
|---|
| 4070 | RV = emitAutoreleaseOfResult(CGF&: *this, result: RV); | 
|---|
| 4071 | } | 
|---|
| 4072 |  | 
|---|
| 4073 | break; | 
|---|
| 4074 |  | 
|---|
| 4075 | case ABIArgInfo::Ignore: | 
|---|
| 4076 | break; | 
|---|
| 4077 |  | 
|---|
| 4078 | case ABIArgInfo::CoerceAndExpand: { | 
|---|
| 4079 | auto coercionType = RetAI.getCoerceAndExpandType(); | 
|---|
| 4080 | auto unpaddedCoercionType = RetAI.getUnpaddedCoerceAndExpandType(); | 
|---|
| 4081 | auto *unpaddedStruct = dyn_cast<llvm::StructType>(Val: unpaddedCoercionType); | 
|---|
| 4082 |  | 
|---|
| 4083 | // Load all of the coerced elements out into results. | 
|---|
| 4084 | llvm::SmallVector<llvm::Value *, 4> results; | 
|---|
| 4085 | Address addr = ReturnValue.withElementType(ElemTy: coercionType); | 
|---|
| 4086 | unsigned unpaddedIndex = 0; | 
|---|
| 4087 | for (unsigned i = 0, e = coercionType->getNumElements(); i != e; ++i) { | 
|---|
| 4088 | auto coercedEltType = coercionType->getElementType(N: i); | 
|---|
| 4089 | if (ABIArgInfo::isPaddingForCoerceAndExpand(eltType: coercedEltType)) | 
|---|
| 4090 | continue; | 
|---|
| 4091 |  | 
|---|
| 4092 | auto eltAddr = Builder.CreateStructGEP(Addr: addr, Index: i); | 
|---|
| 4093 | llvm::Value *elt = CreateCoercedLoad( | 
|---|
| 4094 | Src: eltAddr, | 
|---|
| 4095 | Ty: unpaddedStruct ? unpaddedStruct->getElementType(N: unpaddedIndex++) | 
|---|
| 4096 | : unpaddedCoercionType, | 
|---|
| 4097 | CGF&: *this); | 
|---|
| 4098 | results.push_back(Elt: elt); | 
|---|
| 4099 | } | 
|---|
| 4100 |  | 
|---|
| 4101 | // If we have one result, it's the single direct result type. | 
|---|
| 4102 | if (results.size() == 1) { | 
|---|
| 4103 | RV = results[0]; | 
|---|
| 4104 |  | 
|---|
| 4105 | // Otherwise, we need to make a first-class aggregate. | 
|---|
| 4106 | } else { | 
|---|
| 4107 | // Construct a return type that lacks padding elements. | 
|---|
| 4108 | llvm::Type *returnType = RetAI.getUnpaddedCoerceAndExpandType(); | 
|---|
| 4109 |  | 
|---|
| 4110 | RV = llvm::PoisonValue::get(T: returnType); | 
|---|
| 4111 | for (unsigned i = 0, e = results.size(); i != e; ++i) { | 
|---|
| 4112 | RV = Builder.CreateInsertValue(Agg: RV, Val: results[i], Idxs: i); | 
|---|
| 4113 | } | 
|---|
| 4114 | } | 
|---|
| 4115 | break; | 
|---|
| 4116 | } | 
|---|
| 4117 | case ABIArgInfo::Expand: | 
|---|
| 4118 | case ABIArgInfo::IndirectAliased: | 
|---|
| 4119 | llvm_unreachable( "Invalid ABI kind for return argument"); | 
|---|
| 4120 | } | 
|---|
| 4121 |  | 
|---|
| 4122 | llvm::Instruction *Ret; | 
|---|
| 4123 | if (RV) { | 
|---|
| 4124 | if (CurFuncDecl && CurFuncDecl->hasAttr<CmseNSEntryAttr>()) { | 
|---|
| 4125 | // For certain return types, clear padding bits, as they may reveal | 
|---|
| 4126 | // sensitive information. | 
|---|
| 4127 | // Small struct/union types are passed as integers. | 
|---|
| 4128 | auto *ITy = dyn_cast<llvm::IntegerType>(Val: RV->getType()); | 
|---|
| 4129 | if (ITy != nullptr && isa<RecordType>(Val: RetTy.getCanonicalType())) | 
|---|
| 4130 | RV = EmitCMSEClearRecord(Src: RV, ITy, QTy: RetTy); | 
|---|
| 4131 | } | 
|---|
| 4132 | EmitReturnValueCheck(RV); | 
|---|
| 4133 | Ret = Builder.CreateRet(V: RV); | 
|---|
| 4134 | } else { | 
|---|
| 4135 | Ret = Builder.CreateRetVoid(); | 
|---|
| 4136 | } | 
|---|
| 4137 |  | 
|---|
| 4138 | if (RetDbgLoc) | 
|---|
| 4139 | Ret->setDebugLoc(std::move(RetDbgLoc)); | 
|---|
| 4140 |  | 
|---|
| 4141 | llvm::Value *Backup = RV ? Ret->getOperand(i: 0) : nullptr; | 
|---|
| 4142 | if (RetKeyInstructionsSourceAtom) | 
|---|
| 4143 | addInstToSpecificSourceAtom(KeyInstruction: Ret, Backup, Atom: RetKeyInstructionsSourceAtom); | 
|---|
| 4144 | else | 
|---|
| 4145 | addInstToNewSourceAtom(KeyInstruction: Ret, Backup); | 
|---|
| 4146 | } | 
|---|
| 4147 |  | 
|---|
| 4148 | void CodeGenFunction::EmitReturnValueCheck(llvm::Value *RV) { | 
|---|
| 4149 | // A current decl may not be available when emitting vtable thunks. | 
|---|
| 4150 | if (!CurCodeDecl) | 
|---|
| 4151 | return; | 
|---|
| 4152 |  | 
|---|
| 4153 | // If the return block isn't reachable, neither is this check, so don't emit | 
|---|
| 4154 | // it. | 
|---|
| 4155 | if (ReturnBlock.isValid() && ReturnBlock.getBlock()->use_empty()) | 
|---|
| 4156 | return; | 
|---|
| 4157 |  | 
|---|
| 4158 | ReturnsNonNullAttr *RetNNAttr = nullptr; | 
|---|
| 4159 | if (SanOpts.has(K: SanitizerKind::ReturnsNonnullAttribute)) | 
|---|
| 4160 | RetNNAttr = CurCodeDecl->getAttr<ReturnsNonNullAttr>(); | 
|---|
| 4161 |  | 
|---|
| 4162 | if (!RetNNAttr && !requiresReturnValueNullabilityCheck()) | 
|---|
| 4163 | return; | 
|---|
| 4164 |  | 
|---|
| 4165 | // Prefer the returns_nonnull attribute if it's present. | 
|---|
| 4166 | SourceLocation AttrLoc; | 
|---|
| 4167 | SanitizerKind::SanitizerOrdinal CheckKind; | 
|---|
| 4168 | SanitizerHandler Handler; | 
|---|
| 4169 | if (RetNNAttr) { | 
|---|
| 4170 | assert(!requiresReturnValueNullabilityCheck() && | 
|---|
| 4171 | "Cannot check nullability and the nonnull attribute"); | 
|---|
| 4172 | AttrLoc = RetNNAttr->getLocation(); | 
|---|
| 4173 | CheckKind = SanitizerKind::SO_ReturnsNonnullAttribute; | 
|---|
| 4174 | Handler = SanitizerHandler::NonnullReturn; | 
|---|
| 4175 | } else { | 
|---|
| 4176 | if (auto *DD = dyn_cast<DeclaratorDecl>(Val: CurCodeDecl)) | 
|---|
| 4177 | if (auto *TSI = DD->getTypeSourceInfo()) | 
|---|
| 4178 | if (auto FTL = TSI->getTypeLoc().getAsAdjusted<FunctionTypeLoc>()) | 
|---|
| 4179 | AttrLoc = FTL.getReturnLoc().findNullabilityLoc(); | 
|---|
| 4180 | CheckKind = SanitizerKind::SO_NullabilityReturn; | 
|---|
| 4181 | Handler = SanitizerHandler::NullabilityReturn; | 
|---|
| 4182 | } | 
|---|
| 4183 |  | 
|---|
| 4184 | SanitizerDebugLocation SanScope(this, {CheckKind}, Handler); | 
|---|
| 4185 |  | 
|---|
| 4186 | // Make sure the "return" source location is valid. If we're checking a | 
|---|
| 4187 | // nullability annotation, make sure the preconditions for the check are met. | 
|---|
| 4188 | llvm::BasicBlock *Check = createBasicBlock(name: "nullcheck"); | 
|---|
| 4189 | llvm::BasicBlock *NoCheck = createBasicBlock(name: "no.nullcheck"); | 
|---|
| 4190 | llvm::Value *SLocPtr = Builder.CreateLoad(Addr: ReturnLocation, Name: "return.sloc.load"); | 
|---|
| 4191 | llvm::Value *CanNullCheck = Builder.CreateIsNotNull(Arg: SLocPtr); | 
|---|
| 4192 | if (requiresReturnValueNullabilityCheck()) | 
|---|
| 4193 | CanNullCheck = | 
|---|
| 4194 | Builder.CreateAnd(LHS: CanNullCheck, RHS: RetValNullabilityPrecondition); | 
|---|
| 4195 | Builder.CreateCondBr(Cond: CanNullCheck, True: Check, False: NoCheck); | 
|---|
| 4196 | EmitBlock(BB: Check); | 
|---|
| 4197 |  | 
|---|
| 4198 | // Now do the null check. | 
|---|
| 4199 | llvm::Value *Cond = Builder.CreateIsNotNull(Arg: RV); | 
|---|
| 4200 | llvm::Constant *StaticData[] = {EmitCheckSourceLocation(Loc: AttrLoc)}; | 
|---|
| 4201 | llvm::Value *DynamicData[] = {SLocPtr}; | 
|---|
| 4202 | EmitCheck(Checked: std::make_pair(x&: Cond, y&: CheckKind), Check: Handler, StaticArgs: StaticData, DynamicArgs: DynamicData); | 
|---|
| 4203 |  | 
|---|
| 4204 | EmitBlock(BB: NoCheck); | 
|---|
| 4205 |  | 
|---|
| 4206 | #ifndef NDEBUG | 
|---|
| 4207 | // The return location should not be used after the check has been emitted. | 
|---|
| 4208 | ReturnLocation = Address::invalid(); | 
|---|
| 4209 | #endif | 
|---|
| 4210 | } | 
|---|
| 4211 |  | 
|---|
| 4212 | static bool isInAllocaArgument(CGCXXABI &ABI, QualType type) { | 
|---|
| 4213 | const CXXRecordDecl *RD = type->getAsCXXRecordDecl(); | 
|---|
| 4214 | return RD && ABI.getRecordArgABI(RD) == CGCXXABI::RAA_DirectInMemory; | 
|---|
| 4215 | } | 
|---|
| 4216 |  | 
|---|
| 4217 | static AggValueSlot createPlaceholderSlot(CodeGenFunction &CGF, QualType Ty) { | 
|---|
| 4218 | // FIXME: Generate IR in one pass, rather than going back and fixing up these | 
|---|
| 4219 | // placeholders. | 
|---|
| 4220 | llvm::Type *IRTy = CGF.ConvertTypeForMem(T: Ty); | 
|---|
| 4221 | llvm::Type *IRPtrTy = llvm::PointerType::getUnqual(C&: CGF.getLLVMContext()); | 
|---|
| 4222 | llvm::Value *Placeholder = llvm::PoisonValue::get(T: IRPtrTy); | 
|---|
| 4223 |  | 
|---|
| 4224 | // FIXME: When we generate this IR in one pass, we shouldn't need | 
|---|
| 4225 | // this win32-specific alignment hack. | 
|---|
| 4226 | CharUnits Align = CharUnits::fromQuantity(Quantity: 4); | 
|---|
| 4227 | Placeholder = CGF.Builder.CreateAlignedLoad(Ty: IRPtrTy, Addr: Placeholder, Align); | 
|---|
| 4228 |  | 
|---|
| 4229 | return AggValueSlot::forAddr( | 
|---|
| 4230 | addr: Address(Placeholder, IRTy, Align), quals: Ty.getQualifiers(), | 
|---|
| 4231 | isDestructed: AggValueSlot::IsNotDestructed, needsGC: AggValueSlot::DoesNotNeedGCBarriers, | 
|---|
| 4232 | isAliased: AggValueSlot::IsNotAliased, mayOverlap: AggValueSlot::DoesNotOverlap); | 
|---|
| 4233 | } | 
|---|
| 4234 |  | 
|---|
| 4235 | void CodeGenFunction::EmitDelegateCallArg(CallArgList &args, | 
|---|
| 4236 | const VarDecl *param, | 
|---|
| 4237 | SourceLocation loc) { | 
|---|
| 4238 | // StartFunction converted the ABI-lowered parameter(s) into a | 
|---|
| 4239 | // local alloca.  We need to turn that into an r-value suitable | 
|---|
| 4240 | // for EmitCall. | 
|---|
| 4241 | Address local = GetAddrOfLocalVar(VD: param); | 
|---|
| 4242 |  | 
|---|
| 4243 | QualType type = param->getType(); | 
|---|
| 4244 |  | 
|---|
| 4245 | // GetAddrOfLocalVar returns a pointer-to-pointer for references, | 
|---|
| 4246 | // but the argument needs to be the original pointer. | 
|---|
| 4247 | if (type->isReferenceType()) { | 
|---|
| 4248 | args.add(rvalue: RValue::get(V: Builder.CreateLoad(Addr: local)), type); | 
|---|
| 4249 |  | 
|---|
| 4250 | // In ARC, move out of consumed arguments so that the release cleanup | 
|---|
| 4251 | // entered by StartFunction doesn't cause an over-release.  This isn't | 
|---|
| 4252 | // optimal -O0 code generation, but it should get cleaned up when | 
|---|
| 4253 | // optimization is enabled.  This also assumes that delegate calls are | 
|---|
| 4254 | // performed exactly once for a set of arguments, but that should be safe. | 
|---|
| 4255 | } else if (getLangOpts().ObjCAutoRefCount && | 
|---|
| 4256 | param->hasAttr<NSConsumedAttr>() && type->isObjCRetainableType()) { | 
|---|
| 4257 | llvm::Value *ptr = Builder.CreateLoad(Addr: local); | 
|---|
| 4258 | auto null = | 
|---|
| 4259 | llvm::ConstantPointerNull::get(T: cast<llvm::PointerType>(Val: ptr->getType())); | 
|---|
| 4260 | Builder.CreateStore(Val: null, Addr: local); | 
|---|
| 4261 | args.add(rvalue: RValue::get(V: ptr), type); | 
|---|
| 4262 |  | 
|---|
| 4263 | // For the most part, we just need to load the alloca, except that | 
|---|
| 4264 | // aggregate r-values are actually pointers to temporaries. | 
|---|
| 4265 | } else { | 
|---|
| 4266 | args.add(rvalue: convertTempToRValue(addr: local, type, Loc: loc), type); | 
|---|
| 4267 | } | 
|---|
| 4268 |  | 
|---|
| 4269 | // Deactivate the cleanup for the callee-destructed param that was pushed. | 
|---|
| 4270 | if (type->isRecordType() && !CurFuncIsThunk && | 
|---|
| 4271 | type->castAs<RecordType>()->getDecl()->isParamDestroyedInCallee() && | 
|---|
| 4272 | param->needsDestruction(Ctx: getContext())) { | 
|---|
| 4273 | EHScopeStack::stable_iterator cleanup = | 
|---|
| 4274 | CalleeDestructedParamCleanups.lookup(Val: cast<ParmVarDecl>(Val: param)); | 
|---|
| 4275 | assert(cleanup.isValid() && | 
|---|
| 4276 | "cleanup for callee-destructed param not recorded"); | 
|---|
| 4277 | // This unreachable is a temporary marker which will be removed later. | 
|---|
| 4278 | llvm::Instruction *isActive = Builder.CreateUnreachable(); | 
|---|
| 4279 | args.addArgCleanupDeactivation(Cleanup: cleanup, IsActiveIP: isActive); | 
|---|
| 4280 | } | 
|---|
| 4281 | } | 
|---|
| 4282 |  | 
|---|
| 4283 | static bool isProvablyNull(llvm::Value *addr) { | 
|---|
| 4284 | return llvm::isa_and_nonnull<llvm::ConstantPointerNull>(Val: addr); | 
|---|
| 4285 | } | 
|---|
| 4286 |  | 
|---|
| 4287 | static bool isProvablyNonNull(Address Addr, CodeGenFunction &CGF) { | 
|---|
| 4288 | return llvm::isKnownNonZero(V: Addr.getBasePointer(), Q: CGF.CGM.getDataLayout()); | 
|---|
| 4289 | } | 
|---|
| 4290 |  | 
|---|
| 4291 | /// Emit the actual writing-back of a writeback. | 
|---|
| 4292 | static void emitWriteback(CodeGenFunction &CGF, | 
|---|
| 4293 | const CallArgList::Writeback &writeback) { | 
|---|
| 4294 | const LValue &srcLV = writeback.Source; | 
|---|
| 4295 | Address srcAddr = srcLV.getAddress(); | 
|---|
| 4296 | assert(!isProvablyNull(srcAddr.getBasePointer()) && | 
|---|
| 4297 | "shouldn't have writeback for provably null argument"); | 
|---|
| 4298 |  | 
|---|
| 4299 | if (writeback.WritebackExpr) { | 
|---|
| 4300 | CGF.EmitIgnoredExpr(E: writeback.WritebackExpr); | 
|---|
| 4301 |  | 
|---|
| 4302 | if (writeback.LifetimeSz) | 
|---|
| 4303 | CGF.EmitLifetimeEnd(Size: writeback.LifetimeSz, | 
|---|
| 4304 | Addr: writeback.Temporary.getBasePointer()); | 
|---|
| 4305 | return; | 
|---|
| 4306 | } | 
|---|
| 4307 |  | 
|---|
| 4308 | llvm::BasicBlock *contBB = nullptr; | 
|---|
| 4309 |  | 
|---|
| 4310 | // If the argument wasn't provably non-null, we need to null check | 
|---|
| 4311 | // before doing the store. | 
|---|
| 4312 | bool provablyNonNull = isProvablyNonNull(Addr: srcAddr, CGF); | 
|---|
| 4313 |  | 
|---|
| 4314 | if (!provablyNonNull) { | 
|---|
| 4315 | llvm::BasicBlock *writebackBB = CGF.createBasicBlock(name: "icr.writeback"); | 
|---|
| 4316 | contBB = CGF.createBasicBlock(name: "icr.done"); | 
|---|
| 4317 |  | 
|---|
| 4318 | llvm::Value *isNull = CGF.Builder.CreateIsNull(Addr: srcAddr, Name: "icr.isnull"); | 
|---|
| 4319 | CGF.Builder.CreateCondBr(Cond: isNull, True: contBB, False: writebackBB); | 
|---|
| 4320 | CGF.EmitBlock(BB: writebackBB); | 
|---|
| 4321 | } | 
|---|
| 4322 |  | 
|---|
| 4323 | // Load the value to writeback. | 
|---|
| 4324 | llvm::Value *value = CGF.Builder.CreateLoad(Addr: writeback.Temporary); | 
|---|
| 4325 |  | 
|---|
| 4326 | // Cast it back, in case we're writing an id to a Foo* or something. | 
|---|
| 4327 | value = CGF.Builder.CreateBitCast(V: value, DestTy: srcAddr.getElementType(), | 
|---|
| 4328 | Name: "icr.writeback-cast"); | 
|---|
| 4329 |  | 
|---|
| 4330 | // Perform the writeback. | 
|---|
| 4331 |  | 
|---|
| 4332 | // If we have a "to use" value, it's something we need to emit a use | 
|---|
| 4333 | // of.  This has to be carefully threaded in: if it's done after the | 
|---|
| 4334 | // release it's potentially undefined behavior (and the optimizer | 
|---|
| 4335 | // will ignore it), and if it happens before the retain then the | 
|---|
| 4336 | // optimizer could move the release there. | 
|---|
| 4337 | if (writeback.ToUse) { | 
|---|
| 4338 | assert(srcLV.getObjCLifetime() == Qualifiers::OCL_Strong); | 
|---|
| 4339 |  | 
|---|
| 4340 | // Retain the new value.  No need to block-copy here:  the block's | 
|---|
| 4341 | // being passed up the stack. | 
|---|
| 4342 | value = CGF.EmitARCRetainNonBlock(value); | 
|---|
| 4343 |  | 
|---|
| 4344 | // Emit the intrinsic use here. | 
|---|
| 4345 | CGF.EmitARCIntrinsicUse(values: writeback.ToUse); | 
|---|
| 4346 |  | 
|---|
| 4347 | // Load the old value (primitively). | 
|---|
| 4348 | llvm::Value *oldValue = CGF.EmitLoadOfScalar(lvalue: srcLV, Loc: SourceLocation()); | 
|---|
| 4349 |  | 
|---|
| 4350 | // Put the new value in place (primitively). | 
|---|
| 4351 | CGF.EmitStoreOfScalar(value, lvalue: srcLV, /*init*/ isInit: false); | 
|---|
| 4352 |  | 
|---|
| 4353 | // Release the old value. | 
|---|
| 4354 | CGF.EmitARCRelease(value: oldValue, precise: srcLV.isARCPreciseLifetime()); | 
|---|
| 4355 |  | 
|---|
| 4356 | // Otherwise, we can just do a normal lvalue store. | 
|---|
| 4357 | } else { | 
|---|
| 4358 | CGF.EmitStoreThroughLValue(Src: RValue::get(V: value), Dst: srcLV); | 
|---|
| 4359 | } | 
|---|
| 4360 |  | 
|---|
| 4361 | // Jump to the continuation block. | 
|---|
| 4362 | if (!provablyNonNull) | 
|---|
| 4363 | CGF.EmitBlock(BB: contBB); | 
|---|
| 4364 | } | 
|---|
| 4365 |  | 
|---|
| 4366 | static void deactivateArgCleanupsBeforeCall(CodeGenFunction &CGF, | 
|---|
| 4367 | const CallArgList &CallArgs) { | 
|---|
| 4368 | ArrayRef<CallArgList::CallArgCleanup> Cleanups = | 
|---|
| 4369 | CallArgs.getCleanupsToDeactivate(); | 
|---|
| 4370 | // Iterate in reverse to increase the likelihood of popping the cleanup. | 
|---|
| 4371 | for (const auto &I : llvm::reverse(C&: Cleanups)) { | 
|---|
| 4372 | CGF.DeactivateCleanupBlock(Cleanup: I.Cleanup, DominatingIP: I.IsActiveIP); | 
|---|
| 4373 | I.IsActiveIP->eraseFromParent(); | 
|---|
| 4374 | } | 
|---|
| 4375 | } | 
|---|
| 4376 |  | 
|---|
| 4377 | static const Expr *maybeGetUnaryAddrOfOperand(const Expr *E) { | 
|---|
| 4378 | if (const UnaryOperator *uop = dyn_cast<UnaryOperator>(Val: E->IgnoreParens())) | 
|---|
| 4379 | if (uop->getOpcode() == UO_AddrOf) | 
|---|
| 4380 | return uop->getSubExpr(); | 
|---|
| 4381 | return nullptr; | 
|---|
| 4382 | } | 
|---|
| 4383 |  | 
|---|
| 4384 | /// Emit an argument that's being passed call-by-writeback.  That is, | 
|---|
| 4385 | /// we are passing the address of an __autoreleased temporary; it | 
|---|
| 4386 | /// might be copy-initialized with the current value of the given | 
|---|
| 4387 | /// address, but it will definitely be copied out of after the call. | 
|---|
| 4388 | static void emitWritebackArg(CodeGenFunction &CGF, CallArgList &args, | 
|---|
| 4389 | const ObjCIndirectCopyRestoreExpr *CRE) { | 
|---|
| 4390 | LValue srcLV; | 
|---|
| 4391 |  | 
|---|
| 4392 | // Make an optimistic effort to emit the address as an l-value. | 
|---|
| 4393 | // This can fail if the argument expression is more complicated. | 
|---|
| 4394 | if (const Expr *lvExpr = maybeGetUnaryAddrOfOperand(E: CRE->getSubExpr())) { | 
|---|
| 4395 | srcLV = CGF.EmitLValue(E: lvExpr); | 
|---|
| 4396 |  | 
|---|
| 4397 | // Otherwise, just emit it as a scalar. | 
|---|
| 4398 | } else { | 
|---|
| 4399 | Address srcAddr = CGF.EmitPointerWithAlignment(Addr: CRE->getSubExpr()); | 
|---|
| 4400 |  | 
|---|
| 4401 | QualType srcAddrType = | 
|---|
| 4402 | CRE->getSubExpr()->getType()->castAs<PointerType>()->getPointeeType(); | 
|---|
| 4403 | srcLV = CGF.MakeAddrLValue(Addr: srcAddr, T: srcAddrType); | 
|---|
| 4404 | } | 
|---|
| 4405 | Address srcAddr = srcLV.getAddress(); | 
|---|
| 4406 |  | 
|---|
| 4407 | // The dest and src types don't necessarily match in LLVM terms | 
|---|
| 4408 | // because of the crazy ObjC compatibility rules. | 
|---|
| 4409 |  | 
|---|
| 4410 | llvm::PointerType *destType = | 
|---|
| 4411 | cast<llvm::PointerType>(Val: CGF.ConvertType(T: CRE->getType())); | 
|---|
| 4412 | llvm::Type *destElemType = | 
|---|
| 4413 | CGF.ConvertTypeForMem(T: CRE->getType()->getPointeeType()); | 
|---|
| 4414 |  | 
|---|
| 4415 | // If the address is a constant null, just pass the appropriate null. | 
|---|
| 4416 | if (isProvablyNull(addr: srcAddr.getBasePointer())) { | 
|---|
| 4417 | args.add(rvalue: RValue::get(V: llvm::ConstantPointerNull::get(T: destType)), | 
|---|
| 4418 | type: CRE->getType()); | 
|---|
| 4419 | return; | 
|---|
| 4420 | } | 
|---|
| 4421 |  | 
|---|
| 4422 | // Create the temporary. | 
|---|
| 4423 | Address temp = | 
|---|
| 4424 | CGF.CreateTempAlloca(Ty: destElemType, align: CGF.getPointerAlign(), Name: "icr.temp"); | 
|---|
| 4425 | // Loading an l-value can introduce a cleanup if the l-value is __weak, | 
|---|
| 4426 | // and that cleanup will be conditional if we can't prove that the l-value | 
|---|
| 4427 | // isn't null, so we need to register a dominating point so that the cleanups | 
|---|
| 4428 | // system will make valid IR. | 
|---|
| 4429 | CodeGenFunction::ConditionalEvaluation condEval(CGF); | 
|---|
| 4430 |  | 
|---|
| 4431 | // Zero-initialize it if we're not doing a copy-initialization. | 
|---|
| 4432 | bool shouldCopy = CRE->shouldCopy(); | 
|---|
| 4433 | if (!shouldCopy) { | 
|---|
| 4434 | llvm::Value *null = | 
|---|
| 4435 | llvm::ConstantPointerNull::get(T: cast<llvm::PointerType>(Val: destElemType)); | 
|---|
| 4436 | CGF.Builder.CreateStore(Val: null, Addr: temp); | 
|---|
| 4437 | } | 
|---|
| 4438 |  | 
|---|
| 4439 | llvm::BasicBlock *contBB = nullptr; | 
|---|
| 4440 | llvm::BasicBlock *originBB = nullptr; | 
|---|
| 4441 |  | 
|---|
| 4442 | // If the address is *not* known to be non-null, we need to switch. | 
|---|
| 4443 | llvm::Value *finalArgument; | 
|---|
| 4444 |  | 
|---|
| 4445 | bool provablyNonNull = isProvablyNonNull(Addr: srcAddr, CGF); | 
|---|
| 4446 |  | 
|---|
| 4447 | if (provablyNonNull) { | 
|---|
| 4448 | finalArgument = temp.emitRawPointer(CGF); | 
|---|
| 4449 | } else { | 
|---|
| 4450 | llvm::Value *isNull = CGF.Builder.CreateIsNull(Addr: srcAddr, Name: "icr.isnull"); | 
|---|
| 4451 |  | 
|---|
| 4452 | finalArgument = CGF.Builder.CreateSelect( | 
|---|
| 4453 | C: isNull, True: llvm::ConstantPointerNull::get(T: destType), | 
|---|
| 4454 | False: temp.emitRawPointer(CGF), Name: "icr.argument"); | 
|---|
| 4455 |  | 
|---|
| 4456 | // If we need to copy, then the load has to be conditional, which | 
|---|
| 4457 | // means we need control flow. | 
|---|
| 4458 | if (shouldCopy) { | 
|---|
| 4459 | originBB = CGF.Builder.GetInsertBlock(); | 
|---|
| 4460 | contBB = CGF.createBasicBlock(name: "icr.cont"); | 
|---|
| 4461 | llvm::BasicBlock *copyBB = CGF.createBasicBlock(name: "icr.copy"); | 
|---|
| 4462 | CGF.Builder.CreateCondBr(Cond: isNull, True: contBB, False: copyBB); | 
|---|
| 4463 | CGF.EmitBlock(BB: copyBB); | 
|---|
| 4464 | condEval.begin(CGF); | 
|---|
| 4465 | } | 
|---|
| 4466 | } | 
|---|
| 4467 |  | 
|---|
| 4468 | llvm::Value *valueToUse = nullptr; | 
|---|
| 4469 |  | 
|---|
| 4470 | // Perform a copy if necessary. | 
|---|
| 4471 | if (shouldCopy) { | 
|---|
| 4472 | RValue srcRV = CGF.EmitLoadOfLValue(V: srcLV, Loc: SourceLocation()); | 
|---|
| 4473 | assert(srcRV.isScalar()); | 
|---|
| 4474 |  | 
|---|
| 4475 | llvm::Value *src = srcRV.getScalarVal(); | 
|---|
| 4476 | src = CGF.Builder.CreateBitCast(V: src, DestTy: destElemType, Name: "icr.cast"); | 
|---|
| 4477 |  | 
|---|
| 4478 | // Use an ordinary store, not a store-to-lvalue. | 
|---|
| 4479 | CGF.Builder.CreateStore(Val: src, Addr: temp); | 
|---|
| 4480 |  | 
|---|
| 4481 | // If optimization is enabled, and the value was held in a | 
|---|
| 4482 | // __strong variable, we need to tell the optimizer that this | 
|---|
| 4483 | // value has to stay alive until we're doing the store back. | 
|---|
| 4484 | // This is because the temporary is effectively unretained, | 
|---|
| 4485 | // and so otherwise we can violate the high-level semantics. | 
|---|
| 4486 | if (CGF.CGM.getCodeGenOpts().OptimizationLevel != 0 && | 
|---|
| 4487 | srcLV.getObjCLifetime() == Qualifiers::OCL_Strong) { | 
|---|
| 4488 | valueToUse = src; | 
|---|
| 4489 | } | 
|---|
| 4490 | } | 
|---|
| 4491 |  | 
|---|
| 4492 | // Finish the control flow if we needed it. | 
|---|
| 4493 | if (shouldCopy && !provablyNonNull) { | 
|---|
| 4494 | llvm::BasicBlock *copyBB = CGF.Builder.GetInsertBlock(); | 
|---|
| 4495 | CGF.EmitBlock(BB: contBB); | 
|---|
| 4496 |  | 
|---|
| 4497 | // Make a phi for the value to intrinsically use. | 
|---|
| 4498 | if (valueToUse) { | 
|---|
| 4499 | llvm::PHINode *phiToUse = | 
|---|
| 4500 | CGF.Builder.CreatePHI(Ty: valueToUse->getType(), NumReservedValues: 2, Name: "icr.to-use"); | 
|---|
| 4501 | phiToUse->addIncoming(V: valueToUse, BB: copyBB); | 
|---|
| 4502 | phiToUse->addIncoming(V: llvm::PoisonValue::get(T: valueToUse->getType()), | 
|---|
| 4503 | BB: originBB); | 
|---|
| 4504 | valueToUse = phiToUse; | 
|---|
| 4505 | } | 
|---|
| 4506 |  | 
|---|
| 4507 | condEval.end(CGF); | 
|---|
| 4508 | } | 
|---|
| 4509 |  | 
|---|
| 4510 | args.addWriteback(srcLV, temporary: temp, toUse: valueToUse); | 
|---|
| 4511 | args.add(rvalue: RValue::get(V: finalArgument), type: CRE->getType()); | 
|---|
| 4512 | } | 
|---|
| 4513 |  | 
|---|
| 4514 | void CallArgList::allocateArgumentMemory(CodeGenFunction &CGF) { | 
|---|
| 4515 | assert(!StackBase); | 
|---|
| 4516 |  | 
|---|
| 4517 | // Save the stack. | 
|---|
| 4518 | StackBase = CGF.Builder.CreateStackSave(Name: "inalloca.save"); | 
|---|
| 4519 | } | 
|---|
| 4520 |  | 
|---|
| 4521 | void CallArgList::freeArgumentMemory(CodeGenFunction &CGF) const { | 
|---|
| 4522 | if (StackBase) { | 
|---|
| 4523 | // Restore the stack after the call. | 
|---|
| 4524 | CGF.Builder.CreateStackRestore(Ptr: StackBase); | 
|---|
| 4525 | } | 
|---|
| 4526 | } | 
|---|
| 4527 |  | 
|---|
| 4528 | void CodeGenFunction::EmitNonNullArgCheck(RValue RV, QualType ArgType, | 
|---|
| 4529 | SourceLocation ArgLoc, | 
|---|
| 4530 | AbstractCallee AC, unsigned ParmNum) { | 
|---|
| 4531 | if (!AC.getDecl() || !(SanOpts.has(K: SanitizerKind::NonnullAttribute) || | 
|---|
| 4532 | SanOpts.has(K: SanitizerKind::NullabilityArg))) | 
|---|
| 4533 | return; | 
|---|
| 4534 |  | 
|---|
| 4535 | // The param decl may be missing in a variadic function. | 
|---|
| 4536 | auto PVD = ParmNum < AC.getNumParams() ? AC.getParamDecl(I: ParmNum) : nullptr; | 
|---|
| 4537 | unsigned ArgNo = PVD ? PVD->getFunctionScopeIndex() : ParmNum; | 
|---|
| 4538 |  | 
|---|
| 4539 | // Prefer the nonnull attribute if it's present. | 
|---|
| 4540 | const NonNullAttr *NNAttr = nullptr; | 
|---|
| 4541 | if (SanOpts.has(K: SanitizerKind::NonnullAttribute)) | 
|---|
| 4542 | NNAttr = getNonNullAttr(FD: AC.getDecl(), PVD, ArgType, ArgNo); | 
|---|
| 4543 |  | 
|---|
| 4544 | bool CanCheckNullability = false; | 
|---|
| 4545 | if (SanOpts.has(K: SanitizerKind::NullabilityArg) && !NNAttr && PVD && | 
|---|
| 4546 | !PVD->getType()->isRecordType()) { | 
|---|
| 4547 | auto Nullability = PVD->getType()->getNullability(); | 
|---|
| 4548 | CanCheckNullability = Nullability && | 
|---|
| 4549 | *Nullability == NullabilityKind::NonNull && | 
|---|
| 4550 | PVD->getTypeSourceInfo(); | 
|---|
| 4551 | } | 
|---|
| 4552 |  | 
|---|
| 4553 | if (!NNAttr && !CanCheckNullability) | 
|---|
| 4554 | return; | 
|---|
| 4555 |  | 
|---|
| 4556 | SourceLocation AttrLoc; | 
|---|
| 4557 | SanitizerKind::SanitizerOrdinal CheckKind; | 
|---|
| 4558 | SanitizerHandler Handler; | 
|---|
| 4559 | if (NNAttr) { | 
|---|
| 4560 | AttrLoc = NNAttr->getLocation(); | 
|---|
| 4561 | CheckKind = SanitizerKind::SO_NonnullAttribute; | 
|---|
| 4562 | Handler = SanitizerHandler::NonnullArg; | 
|---|
| 4563 | } else { | 
|---|
| 4564 | AttrLoc = PVD->getTypeSourceInfo()->getTypeLoc().findNullabilityLoc(); | 
|---|
| 4565 | CheckKind = SanitizerKind::SO_NullabilityArg; | 
|---|
| 4566 | Handler = SanitizerHandler::NullabilityArg; | 
|---|
| 4567 | } | 
|---|
| 4568 |  | 
|---|
| 4569 | SanitizerDebugLocation SanScope(this, {CheckKind}, Handler); | 
|---|
| 4570 | llvm::Value *Cond = EmitNonNullRValueCheck(RV, T: ArgType); | 
|---|
| 4571 | llvm::Constant *StaticData[] = { | 
|---|
| 4572 | EmitCheckSourceLocation(Loc: ArgLoc), | 
|---|
| 4573 | EmitCheckSourceLocation(Loc: AttrLoc), | 
|---|
| 4574 | llvm::ConstantInt::get(Ty: Int32Ty, V: ArgNo + 1), | 
|---|
| 4575 | }; | 
|---|
| 4576 | EmitCheck(Checked: std::make_pair(x&: Cond, y&: CheckKind), Check: Handler, StaticArgs: StaticData, DynamicArgs: {}); | 
|---|
| 4577 | } | 
|---|
| 4578 |  | 
|---|
| 4579 | void CodeGenFunction::EmitNonNullArgCheck(Address Addr, QualType ArgType, | 
|---|
| 4580 | SourceLocation ArgLoc, | 
|---|
| 4581 | AbstractCallee AC, unsigned ParmNum) { | 
|---|
| 4582 | if (!AC.getDecl() || !(SanOpts.has(K: SanitizerKind::NonnullAttribute) || | 
|---|
| 4583 | SanOpts.has(K: SanitizerKind::NullabilityArg))) | 
|---|
| 4584 | return; | 
|---|
| 4585 |  | 
|---|
| 4586 | EmitNonNullArgCheck(RV: RValue::get(Addr, CGF&: *this), ArgType, ArgLoc, AC, ParmNum); | 
|---|
| 4587 | } | 
|---|
| 4588 |  | 
|---|
| 4589 | // Check if the call is going to use the inalloca convention. This needs to | 
|---|
| 4590 | // agree with CGFunctionInfo::usesInAlloca. The CGFunctionInfo is arranged | 
|---|
| 4591 | // later, so we can't check it directly. | 
|---|
| 4592 | static bool hasInAllocaArgs(CodeGenModule &CGM, CallingConv ExplicitCC, | 
|---|
| 4593 | ArrayRef<QualType> ArgTypes) { | 
|---|
| 4594 | // The Swift calling conventions don't go through the target-specific | 
|---|
| 4595 | // argument classification, they never use inalloca. | 
|---|
| 4596 | // TODO: Consider limiting inalloca use to only calling conventions supported | 
|---|
| 4597 | // by MSVC. | 
|---|
| 4598 | if (ExplicitCC == CC_Swift || ExplicitCC == CC_SwiftAsync) | 
|---|
| 4599 | return false; | 
|---|
| 4600 | if (!CGM.getTarget().getCXXABI().isMicrosoft()) | 
|---|
| 4601 | return false; | 
|---|
| 4602 | return llvm::any_of(Range&: ArgTypes, P: [&](QualType Ty) { | 
|---|
| 4603 | return isInAllocaArgument(ABI&: CGM.getCXXABI(), type: Ty); | 
|---|
| 4604 | }); | 
|---|
| 4605 | } | 
|---|
| 4606 |  | 
|---|
| 4607 | #ifndef NDEBUG | 
|---|
| 4608 | // Determine whether the given argument is an Objective-C method | 
|---|
| 4609 | // that may have type parameters in its signature. | 
|---|
| 4610 | static bool isObjCMethodWithTypeParams(const ObjCMethodDecl *method) { | 
|---|
| 4611 | const DeclContext *dc = method->getDeclContext(); | 
|---|
| 4612 | if (const ObjCInterfaceDecl *classDecl = dyn_cast<ObjCInterfaceDecl>(dc)) { | 
|---|
| 4613 | return classDecl->getTypeParamListAsWritten(); | 
|---|
| 4614 | } | 
|---|
| 4615 |  | 
|---|
| 4616 | if (const ObjCCategoryDecl *catDecl = dyn_cast<ObjCCategoryDecl>(dc)) { | 
|---|
| 4617 | return catDecl->getTypeParamList(); | 
|---|
| 4618 | } | 
|---|
| 4619 |  | 
|---|
| 4620 | return false; | 
|---|
| 4621 | } | 
|---|
| 4622 | #endif | 
|---|
| 4623 |  | 
|---|
| 4624 | /// EmitCallArgs - Emit call arguments for a function. | 
|---|
| 4625 | void CodeGenFunction::EmitCallArgs( | 
|---|
| 4626 | CallArgList &Args, PrototypeWrapper Prototype, | 
|---|
| 4627 | llvm::iterator_range<CallExpr::const_arg_iterator> ArgRange, | 
|---|
| 4628 | AbstractCallee AC, unsigned ParamsToSkip, EvaluationOrder Order) { | 
|---|
| 4629 | SmallVector<QualType, 16> ArgTypes; | 
|---|
| 4630 |  | 
|---|
| 4631 | assert((ParamsToSkip == 0 || Prototype.P) && | 
|---|
| 4632 | "Can't skip parameters if type info is not provided"); | 
|---|
| 4633 |  | 
|---|
| 4634 | // This variable only captures *explicitly* written conventions, not those | 
|---|
| 4635 | // applied by default via command line flags or target defaults, such as | 
|---|
| 4636 | // thiscall, aapcs, stdcall via -mrtd, etc. Computing that correctly would | 
|---|
| 4637 | // require knowing if this is a C++ instance method or being able to see | 
|---|
| 4638 | // unprototyped FunctionTypes. | 
|---|
| 4639 | CallingConv ExplicitCC = CC_C; | 
|---|
| 4640 |  | 
|---|
| 4641 | // First, if a prototype was provided, use those argument types. | 
|---|
| 4642 | bool IsVariadic = false; | 
|---|
| 4643 | if (Prototype.P) { | 
|---|
| 4644 | const auto *MD = dyn_cast<const ObjCMethodDecl *>(Val&: Prototype.P); | 
|---|
| 4645 | if (MD) { | 
|---|
| 4646 | IsVariadic = MD->isVariadic(); | 
|---|
| 4647 | ExplicitCC = getCallingConventionForDecl( | 
|---|
| 4648 | D: MD, IsTargetDefaultMSABI: CGM.getTarget().getTriple().isOSWindows()); | 
|---|
| 4649 | ArgTypes.assign(in_start: MD->param_type_begin() + ParamsToSkip, | 
|---|
| 4650 | in_end: MD->param_type_end()); | 
|---|
| 4651 | } else { | 
|---|
| 4652 | const auto *FPT = cast<const FunctionProtoType *>(Val&: Prototype.P); | 
|---|
| 4653 | IsVariadic = FPT->isVariadic(); | 
|---|
| 4654 | ExplicitCC = FPT->getExtInfo().getCC(); | 
|---|
| 4655 | ArgTypes.assign(in_start: FPT->param_type_begin() + ParamsToSkip, | 
|---|
| 4656 | in_end: FPT->param_type_end()); | 
|---|
| 4657 | } | 
|---|
| 4658 |  | 
|---|
| 4659 | #ifndef NDEBUG | 
|---|
| 4660 | // Check that the prototyped types match the argument expression types. | 
|---|
| 4661 | bool isGenericMethod = MD && isObjCMethodWithTypeParams(MD); | 
|---|
| 4662 | CallExpr::const_arg_iterator Arg = ArgRange.begin(); | 
|---|
| 4663 | for (QualType Ty : ArgTypes) { | 
|---|
| 4664 | assert(Arg != ArgRange.end() && "Running over edge of argument list!"); | 
|---|
| 4665 | assert( | 
|---|
| 4666 | (isGenericMethod || Ty->isVariablyModifiedType() || | 
|---|
| 4667 | Ty.getNonReferenceType()->isObjCRetainableType() || | 
|---|
| 4668 | getContext() | 
|---|
| 4669 | .getCanonicalType(Ty.getNonReferenceType()) | 
|---|
| 4670 | .getTypePtr() == | 
|---|
| 4671 | getContext().getCanonicalType((*Arg)->getType()).getTypePtr()) && | 
|---|
| 4672 | "type mismatch in call argument!"); | 
|---|
| 4673 | ++Arg; | 
|---|
| 4674 | } | 
|---|
| 4675 |  | 
|---|
| 4676 | // Either we've emitted all the call args, or we have a call to variadic | 
|---|
| 4677 | // function. | 
|---|
| 4678 | assert((Arg == ArgRange.end() || IsVariadic) && | 
|---|
| 4679 | "Extra arguments in non-variadic function!"); | 
|---|
| 4680 | #endif | 
|---|
| 4681 | } | 
|---|
| 4682 |  | 
|---|
| 4683 | // If we still have any arguments, emit them using the type of the argument. | 
|---|
| 4684 | for (auto *A : llvm::drop_begin(RangeOrContainer&: ArgRange, N: ArgTypes.size())) | 
|---|
| 4685 | ArgTypes.push_back(Elt: IsVariadic ? getVarArgType(Arg: A) : A->getType()); | 
|---|
| 4686 | assert((int)ArgTypes.size() == (ArgRange.end() - ArgRange.begin())); | 
|---|
| 4687 |  | 
|---|
| 4688 | // We must evaluate arguments from right to left in the MS C++ ABI, | 
|---|
| 4689 | // because arguments are destroyed left to right in the callee. As a special | 
|---|
| 4690 | // case, there are certain language constructs that require left-to-right | 
|---|
| 4691 | // evaluation, and in those cases we consider the evaluation order requirement | 
|---|
| 4692 | // to trump the "destruction order is reverse construction order" guarantee. | 
|---|
| 4693 | bool LeftToRight = | 
|---|
| 4694 | CGM.getTarget().getCXXABI().areArgsDestroyedLeftToRightInCallee() | 
|---|
| 4695 | ? Order == EvaluationOrder::ForceLeftToRight | 
|---|
| 4696 | : Order != EvaluationOrder::ForceRightToLeft; | 
|---|
| 4697 |  | 
|---|
| 4698 | auto MaybeEmitImplicitObjectSize = [&](unsigned I, const Expr *Arg, | 
|---|
| 4699 | RValue EmittedArg) { | 
|---|
| 4700 | if (!AC.hasFunctionDecl() || I >= AC.getNumParams()) | 
|---|
| 4701 | return; | 
|---|
| 4702 | auto *PS = AC.getParamDecl(I)->getAttr<PassObjectSizeAttr>(); | 
|---|
| 4703 | if (PS == nullptr) | 
|---|
| 4704 | return; | 
|---|
| 4705 |  | 
|---|
| 4706 | const auto &Context = getContext(); | 
|---|
| 4707 | auto SizeTy = Context.getSizeType(); | 
|---|
| 4708 | auto T = Builder.getIntNTy(N: Context.getTypeSize(T: SizeTy)); | 
|---|
| 4709 | assert(EmittedArg.getScalarVal() && "We emitted nothing for the arg?"); | 
|---|
| 4710 | llvm::Value *V = evaluateOrEmitBuiltinObjectSize( | 
|---|
| 4711 | E: Arg, Type: PS->getType(), ResType: T, EmittedE: EmittedArg.getScalarVal(), IsDynamic: PS->isDynamic()); | 
|---|
| 4712 | Args.add(rvalue: RValue::get(V), type: SizeTy); | 
|---|
| 4713 | // If we're emitting args in reverse, be sure to do so with | 
|---|
| 4714 | // pass_object_size, as well. | 
|---|
| 4715 | if (!LeftToRight) | 
|---|
| 4716 | std::swap(a&: Args.back(), b&: *(&Args.back() - 1)); | 
|---|
| 4717 | }; | 
|---|
| 4718 |  | 
|---|
| 4719 | // Insert a stack save if we're going to need any inalloca args. | 
|---|
| 4720 | if (hasInAllocaArgs(CGM, ExplicitCC, ArgTypes)) { | 
|---|
| 4721 | assert(getTarget().getTriple().getArch() == llvm::Triple::x86 && | 
|---|
| 4722 | "inalloca only supported on x86"); | 
|---|
| 4723 | Args.allocateArgumentMemory(CGF&: *this); | 
|---|
| 4724 | } | 
|---|
| 4725 |  | 
|---|
| 4726 | // Evaluate each argument in the appropriate order. | 
|---|
| 4727 | size_t CallArgsStart = Args.size(); | 
|---|
| 4728 | for (unsigned I = 0, E = ArgTypes.size(); I != E; ++I) { | 
|---|
| 4729 | unsigned Idx = LeftToRight ? I : E - I - 1; | 
|---|
| 4730 | CallExpr::const_arg_iterator Arg = ArgRange.begin() + Idx; | 
|---|
| 4731 | unsigned InitialArgSize = Args.size(); | 
|---|
| 4732 | // If *Arg is an ObjCIndirectCopyRestoreExpr, check that either the types of | 
|---|
| 4733 | // the argument and parameter match or the objc method is parameterized. | 
|---|
| 4734 | assert((!isa<ObjCIndirectCopyRestoreExpr>(*Arg) || | 
|---|
| 4735 | getContext().hasSameUnqualifiedType((*Arg)->getType(), | 
|---|
| 4736 | ArgTypes[Idx]) || | 
|---|
| 4737 | (isa<ObjCMethodDecl>(AC.getDecl()) && | 
|---|
| 4738 | isObjCMethodWithTypeParams(cast<ObjCMethodDecl>(AC.getDecl())))) && | 
|---|
| 4739 | "Argument and parameter types don't match"); | 
|---|
| 4740 | EmitCallArg(args&: Args, E: *Arg, ArgType: ArgTypes[Idx]); | 
|---|
| 4741 | // In particular, we depend on it being the last arg in Args, and the | 
|---|
| 4742 | // objectsize bits depend on there only being one arg if !LeftToRight. | 
|---|
| 4743 | assert(InitialArgSize + 1 == Args.size() && | 
|---|
| 4744 | "The code below depends on only adding one arg per EmitCallArg"); | 
|---|
| 4745 | (void)InitialArgSize; | 
|---|
| 4746 | // Since pointer argument are never emitted as LValue, it is safe to emit | 
|---|
| 4747 | // non-null argument check for r-value only. | 
|---|
| 4748 | if (!Args.back().hasLValue()) { | 
|---|
| 4749 | RValue RVArg = Args.back().getKnownRValue(); | 
|---|
| 4750 | EmitNonNullArgCheck(RV: RVArg, ArgType: ArgTypes[Idx], ArgLoc: (*Arg)->getExprLoc(), AC, | 
|---|
| 4751 | ParmNum: ParamsToSkip + Idx); | 
|---|
| 4752 | // @llvm.objectsize should never have side-effects and shouldn't need | 
|---|
| 4753 | // destruction/cleanups, so we can safely "emit" it after its arg, | 
|---|
| 4754 | // regardless of right-to-leftness | 
|---|
| 4755 | MaybeEmitImplicitObjectSize(Idx, *Arg, RVArg); | 
|---|
| 4756 | } | 
|---|
| 4757 | } | 
|---|
| 4758 |  | 
|---|
| 4759 | if (!LeftToRight) { | 
|---|
| 4760 | // Un-reverse the arguments we just evaluated so they match up with the LLVM | 
|---|
| 4761 | // IR function. | 
|---|
| 4762 | std::reverse(first: Args.begin() + CallArgsStart, last: Args.end()); | 
|---|
| 4763 |  | 
|---|
| 4764 | // Reverse the writebacks to match the MSVC ABI. | 
|---|
| 4765 | Args.reverseWritebacks(); | 
|---|
| 4766 | } | 
|---|
| 4767 | } | 
|---|
| 4768 |  | 
|---|
| 4769 | namespace { | 
|---|
| 4770 |  | 
|---|
| 4771 | struct DestroyUnpassedArg final : EHScopeStack::Cleanup { | 
|---|
| 4772 | DestroyUnpassedArg(Address Addr, QualType Ty) : Addr(Addr), Ty(Ty) {} | 
|---|
| 4773 |  | 
|---|
| 4774 | Address Addr; | 
|---|
| 4775 | QualType Ty; | 
|---|
| 4776 |  | 
|---|
| 4777 | void Emit(CodeGenFunction &CGF, Flags flags) override { | 
|---|
| 4778 | QualType::DestructionKind DtorKind = Ty.isDestructedType(); | 
|---|
| 4779 | if (DtorKind == QualType::DK_cxx_destructor) { | 
|---|
| 4780 | const CXXDestructorDecl *Dtor = Ty->getAsCXXRecordDecl()->getDestructor(); | 
|---|
| 4781 | assert(!Dtor->isTrivial()); | 
|---|
| 4782 | CGF.EmitCXXDestructorCall(D: Dtor, Type: Dtor_Complete, /*for vbase*/ ForVirtualBase: false, | 
|---|
| 4783 | /*Delegating=*/false, This: Addr, ThisTy: Ty); | 
|---|
| 4784 | } else { | 
|---|
| 4785 | CGF.callCStructDestructor(Dst: CGF.MakeAddrLValue(Addr, T: Ty)); | 
|---|
| 4786 | } | 
|---|
| 4787 | } | 
|---|
| 4788 | }; | 
|---|
| 4789 |  | 
|---|
| 4790 | struct DisableDebugLocationUpdates { | 
|---|
| 4791 | CodeGenFunction &CGF; | 
|---|
| 4792 | bool disabledDebugInfo; | 
|---|
| 4793 | DisableDebugLocationUpdates(CodeGenFunction &CGF, const Expr *E) : CGF(CGF) { | 
|---|
| 4794 | if ((disabledDebugInfo = isa<CXXDefaultArgExpr>(Val: E) && CGF.getDebugInfo())) | 
|---|
| 4795 | CGF.disableDebugInfo(); | 
|---|
| 4796 | } | 
|---|
| 4797 | ~DisableDebugLocationUpdates() { | 
|---|
| 4798 | if (disabledDebugInfo) | 
|---|
| 4799 | CGF.enableDebugInfo(); | 
|---|
| 4800 | } | 
|---|
| 4801 | }; | 
|---|
| 4802 |  | 
|---|
| 4803 | } // end anonymous namespace | 
|---|
| 4804 |  | 
|---|
| 4805 | RValue CallArg::getRValue(CodeGenFunction &CGF) const { | 
|---|
| 4806 | if (!HasLV) | 
|---|
| 4807 | return RV; | 
|---|
| 4808 | LValue Copy = CGF.MakeAddrLValue(Addr: CGF.CreateMemTemp(T: Ty), T: Ty); | 
|---|
| 4809 | CGF.EmitAggregateCopy(Dest: Copy, Src: LV, EltTy: Ty, MayOverlap: AggValueSlot::DoesNotOverlap, | 
|---|
| 4810 | isVolatile: LV.isVolatile()); | 
|---|
| 4811 | IsUsed = true; | 
|---|
| 4812 | return RValue::getAggregate(addr: Copy.getAddress()); | 
|---|
| 4813 | } | 
|---|
| 4814 |  | 
|---|
| 4815 | void CallArg::copyInto(CodeGenFunction &CGF, Address Addr) const { | 
|---|
| 4816 | LValue Dst = CGF.MakeAddrLValue(Addr, T: Ty); | 
|---|
| 4817 | if (!HasLV && RV.isScalar()) | 
|---|
| 4818 | CGF.EmitStoreOfScalar(value: RV.getScalarVal(), lvalue: Dst, /*isInit=*/true); | 
|---|
| 4819 | else if (!HasLV && RV.isComplex()) | 
|---|
| 4820 | CGF.EmitStoreOfComplex(V: RV.getComplexVal(), dest: Dst, /*init=*/isInit: true); | 
|---|
| 4821 | else { | 
|---|
| 4822 | auto Addr = HasLV ? LV.getAddress() : RV.getAggregateAddress(); | 
|---|
| 4823 | LValue SrcLV = CGF.MakeAddrLValue(Addr, T: Ty); | 
|---|
| 4824 | // We assume that call args are never copied into subobjects. | 
|---|
| 4825 | CGF.EmitAggregateCopy(Dest: Dst, Src: SrcLV, EltTy: Ty, MayOverlap: AggValueSlot::DoesNotOverlap, | 
|---|
| 4826 | isVolatile: HasLV ? LV.isVolatileQualified() | 
|---|
| 4827 | : RV.isVolatileQualified()); | 
|---|
| 4828 | } | 
|---|
| 4829 | IsUsed = true; | 
|---|
| 4830 | } | 
|---|
| 4831 |  | 
|---|
| 4832 | void CodeGenFunction::EmitWritebacks(const CallArgList &args) { | 
|---|
| 4833 | for (const auto &I : args.writebacks()) | 
|---|
| 4834 | emitWriteback(CGF&: *this, writeback: I); | 
|---|
| 4835 | } | 
|---|
| 4836 |  | 
|---|
| 4837 | void CodeGenFunction::EmitCallArg(CallArgList &args, const Expr *E, | 
|---|
| 4838 | QualType type) { | 
|---|
| 4839 | DisableDebugLocationUpdates Dis(*this, E); | 
|---|
| 4840 | if (const ObjCIndirectCopyRestoreExpr *CRE = | 
|---|
| 4841 | dyn_cast<ObjCIndirectCopyRestoreExpr>(Val: E)) { | 
|---|
| 4842 | assert(getLangOpts().ObjCAutoRefCount); | 
|---|
| 4843 | return emitWritebackArg(CGF&: *this, args, CRE); | 
|---|
| 4844 | } | 
|---|
| 4845 |  | 
|---|
| 4846 | // Add writeback for HLSLOutParamExpr. | 
|---|
| 4847 | // Needs to be before the assert below because HLSLOutArgExpr is an LValue | 
|---|
| 4848 | // and is not a reference. | 
|---|
| 4849 | if (const HLSLOutArgExpr *OE = dyn_cast<HLSLOutArgExpr>(Val: E)) { | 
|---|
| 4850 | EmitHLSLOutArgExpr(E: OE, Args&: args, Ty: type); | 
|---|
| 4851 | return; | 
|---|
| 4852 | } | 
|---|
| 4853 |  | 
|---|
| 4854 | assert(type->isReferenceType() == E->isGLValue() && | 
|---|
| 4855 | "reference binding to unmaterialized r-value!"); | 
|---|
| 4856 |  | 
|---|
| 4857 | if (E->isGLValue()) { | 
|---|
| 4858 | assert(E->getObjectKind() == OK_Ordinary); | 
|---|
| 4859 | return args.add(rvalue: EmitReferenceBindingToExpr(E), type); | 
|---|
| 4860 | } | 
|---|
| 4861 |  | 
|---|
| 4862 | bool HasAggregateEvalKind = hasAggregateEvaluationKind(T: type); | 
|---|
| 4863 |  | 
|---|
| 4864 | // In the Microsoft C++ ABI, aggregate arguments are destructed by the callee. | 
|---|
| 4865 | // However, we still have to push an EH-only cleanup in case we unwind before | 
|---|
| 4866 | // we make it to the call. | 
|---|
| 4867 | if (type->isRecordType() && | 
|---|
| 4868 | type->castAs<RecordType>()->getDecl()->isParamDestroyedInCallee()) { | 
|---|
| 4869 | // If we're using inalloca, use the argument memory.  Otherwise, use a | 
|---|
| 4870 | // temporary. | 
|---|
| 4871 | AggValueSlot Slot = args.isUsingInAlloca() | 
|---|
| 4872 | ? createPlaceholderSlot(CGF&: *this, Ty: type) | 
|---|
| 4873 | : CreateAggTemp(T: type, Name: "agg.tmp"); | 
|---|
| 4874 |  | 
|---|
| 4875 | bool DestroyedInCallee = true, NeedsCleanup = true; | 
|---|
| 4876 | if (const auto *RD = type->getAsCXXRecordDecl()) | 
|---|
| 4877 | DestroyedInCallee = RD->hasNonTrivialDestructor(); | 
|---|
| 4878 | else | 
|---|
| 4879 | NeedsCleanup = type.isDestructedType(); | 
|---|
| 4880 |  | 
|---|
| 4881 | if (DestroyedInCallee) | 
|---|
| 4882 | Slot.setExternallyDestructed(); | 
|---|
| 4883 |  | 
|---|
| 4884 | EmitAggExpr(E, AS: Slot); | 
|---|
| 4885 | RValue RV = Slot.asRValue(); | 
|---|
| 4886 | args.add(rvalue: RV, type); | 
|---|
| 4887 |  | 
|---|
| 4888 | if (DestroyedInCallee && NeedsCleanup) { | 
|---|
| 4889 | // Create a no-op GEP between the placeholder and the cleanup so we can | 
|---|
| 4890 | // RAUW it successfully.  It also serves as a marker of the first | 
|---|
| 4891 | // instruction where the cleanup is active. | 
|---|
| 4892 | pushFullExprCleanup<DestroyUnpassedArg>(kind: NormalAndEHCleanup, | 
|---|
| 4893 | A: Slot.getAddress(), A: type); | 
|---|
| 4894 | // This unreachable is a temporary marker which will be removed later. | 
|---|
| 4895 | llvm::Instruction *IsActive = | 
|---|
| 4896 | Builder.CreateFlagLoad(Addr: llvm::Constant::getNullValue(Ty: Int8PtrTy)); | 
|---|
| 4897 | args.addArgCleanupDeactivation(Cleanup: EHStack.stable_begin(), IsActiveIP: IsActive); | 
|---|
| 4898 | } | 
|---|
| 4899 | return; | 
|---|
| 4900 | } | 
|---|
| 4901 |  | 
|---|
| 4902 | if (HasAggregateEvalKind && isa<ImplicitCastExpr>(Val: E) && | 
|---|
| 4903 | cast<CastExpr>(Val: E)->getCastKind() == CK_LValueToRValue && | 
|---|
| 4904 | !type->isArrayParameterType() && !type.isNonTrivialToPrimitiveCopy()) { | 
|---|
| 4905 | LValue L = EmitLValue(E: cast<CastExpr>(Val: E)->getSubExpr()); | 
|---|
| 4906 | assert(L.isSimple()); | 
|---|
| 4907 | args.addUncopiedAggregate(LV: L, type); | 
|---|
| 4908 | return; | 
|---|
| 4909 | } | 
|---|
| 4910 |  | 
|---|
| 4911 | args.add(rvalue: EmitAnyExprToTemp(E), type); | 
|---|
| 4912 | } | 
|---|
| 4913 |  | 
|---|
| 4914 | QualType CodeGenFunction::getVarArgType(const Expr *Arg) { | 
|---|
| 4915 | // System headers on Windows define NULL to 0 instead of 0LL on Win64. MSVC | 
|---|
| 4916 | // implicitly widens null pointer constants that are arguments to varargs | 
|---|
| 4917 | // functions to pointer-sized ints. | 
|---|
| 4918 | if (!getTarget().getTriple().isOSWindows()) | 
|---|
| 4919 | return Arg->getType(); | 
|---|
| 4920 |  | 
|---|
| 4921 | if (Arg->getType()->isIntegerType() && | 
|---|
| 4922 | getContext().getTypeSize(T: Arg->getType()) < | 
|---|
| 4923 | getContext().getTargetInfo().getPointerWidth(AddrSpace: LangAS::Default) && | 
|---|
| 4924 | Arg->isNullPointerConstant(Ctx&: getContext(), | 
|---|
| 4925 | NPC: Expr::NPC_ValueDependentIsNotNull)) { | 
|---|
| 4926 | return getContext().getIntPtrType(); | 
|---|
| 4927 | } | 
|---|
| 4928 |  | 
|---|
| 4929 | return Arg->getType(); | 
|---|
| 4930 | } | 
|---|
| 4931 |  | 
|---|
| 4932 | // In ObjC ARC mode with no ObjC ARC exception safety, tell the ARC | 
|---|
| 4933 | // optimizer it can aggressively ignore unwind edges. | 
|---|
| 4934 | void CodeGenFunction::AddObjCARCExceptionMetadata(llvm::Instruction *Inst) { | 
|---|
| 4935 | if (CGM.getCodeGenOpts().OptimizationLevel != 0 && | 
|---|
| 4936 | !CGM.getCodeGenOpts().ObjCAutoRefCountExceptions) | 
|---|
| 4937 | Inst->setMetadata(Kind: "clang.arc.no_objc_arc_exceptions", | 
|---|
| 4938 | Node: CGM.getNoObjCARCExceptionsMetadata()); | 
|---|
| 4939 | } | 
|---|
| 4940 |  | 
|---|
| 4941 | /// Emits a call to the given no-arguments nounwind runtime function. | 
|---|
| 4942 | llvm::CallInst * | 
|---|
| 4943 | CodeGenFunction::EmitNounwindRuntimeCall(llvm::FunctionCallee callee, | 
|---|
| 4944 | const llvm::Twine &name) { | 
|---|
| 4945 | return EmitNounwindRuntimeCall(callee, args: ArrayRef<llvm::Value *>(), name); | 
|---|
| 4946 | } | 
|---|
| 4947 |  | 
|---|
| 4948 | /// Emits a call to the given nounwind runtime function. | 
|---|
| 4949 | llvm::CallInst * | 
|---|
| 4950 | CodeGenFunction::EmitNounwindRuntimeCall(llvm::FunctionCallee callee, | 
|---|
| 4951 | ArrayRef<Address> args, | 
|---|
| 4952 | const llvm::Twine &name) { | 
|---|
| 4953 | SmallVector<llvm::Value *, 3> values; | 
|---|
| 4954 | for (auto arg : args) | 
|---|
| 4955 | values.push_back(Elt: arg.emitRawPointer(CGF&: *this)); | 
|---|
| 4956 | return EmitNounwindRuntimeCall(callee, args: values, name); | 
|---|
| 4957 | } | 
|---|
| 4958 |  | 
|---|
| 4959 | llvm::CallInst * | 
|---|
| 4960 | CodeGenFunction::EmitNounwindRuntimeCall(llvm::FunctionCallee callee, | 
|---|
| 4961 | ArrayRef<llvm::Value *> args, | 
|---|
| 4962 | const llvm::Twine &name) { | 
|---|
| 4963 | llvm::CallInst *call = EmitRuntimeCall(callee, args, name); | 
|---|
| 4964 | call->setDoesNotThrow(); | 
|---|
| 4965 | return call; | 
|---|
| 4966 | } | 
|---|
| 4967 |  | 
|---|
| 4968 | /// Emits a simple call (never an invoke) to the given no-arguments | 
|---|
| 4969 | /// runtime function. | 
|---|
| 4970 | llvm::CallInst *CodeGenFunction::EmitRuntimeCall(llvm::FunctionCallee callee, | 
|---|
| 4971 | const llvm::Twine &name) { | 
|---|
| 4972 | return EmitRuntimeCall(callee, args: {}, name); | 
|---|
| 4973 | } | 
|---|
| 4974 |  | 
|---|
| 4975 | // Calls which may throw must have operand bundles indicating which funclet | 
|---|
| 4976 | // they are nested within. | 
|---|
| 4977 | SmallVector<llvm::OperandBundleDef, 1> | 
|---|
| 4978 | CodeGenFunction::getBundlesForFunclet(llvm::Value *Callee) { | 
|---|
| 4979 | // There is no need for a funclet operand bundle if we aren't inside a | 
|---|
| 4980 | // funclet. | 
|---|
| 4981 | if (!CurrentFuncletPad) | 
|---|
| 4982 | return (SmallVector<llvm::OperandBundleDef, 1>()); | 
|---|
| 4983 |  | 
|---|
| 4984 | // Skip intrinsics which cannot throw (as long as they don't lower into | 
|---|
| 4985 | // regular function calls in the course of IR transformations). | 
|---|
| 4986 | if (auto *CalleeFn = dyn_cast<llvm::Function>(Val: Callee->stripPointerCasts())) { | 
|---|
| 4987 | if (CalleeFn->isIntrinsic() && CalleeFn->doesNotThrow()) { | 
|---|
| 4988 | auto IID = CalleeFn->getIntrinsicID(); | 
|---|
| 4989 | if (!llvm::IntrinsicInst::mayLowerToFunctionCall(IID)) | 
|---|
| 4990 | return (SmallVector<llvm::OperandBundleDef, 1>()); | 
|---|
| 4991 | } | 
|---|
| 4992 | } | 
|---|
| 4993 |  | 
|---|
| 4994 | SmallVector<llvm::OperandBundleDef, 1> BundleList; | 
|---|
| 4995 | BundleList.emplace_back(Args: "funclet", Args&: CurrentFuncletPad); | 
|---|
| 4996 | return BundleList; | 
|---|
| 4997 | } | 
|---|
| 4998 |  | 
|---|
| 4999 | /// Emits a simple call (never an invoke) to the given runtime function. | 
|---|
| 5000 | llvm::CallInst *CodeGenFunction::EmitRuntimeCall(llvm::FunctionCallee callee, | 
|---|
| 5001 | ArrayRef<llvm::Value *> args, | 
|---|
| 5002 | const llvm::Twine &name) { | 
|---|
| 5003 | llvm::CallInst *call = Builder.CreateCall( | 
|---|
| 5004 | Callee: callee, Args: args, OpBundles: getBundlesForFunclet(Callee: callee.getCallee()), Name: name); | 
|---|
| 5005 | call->setCallingConv(getRuntimeCC()); | 
|---|
| 5006 |  | 
|---|
| 5007 | if (CGM.shouldEmitConvergenceTokens() && call->isConvergent()) | 
|---|
| 5008 | return cast<llvm::CallInst>(Val: addConvergenceControlToken(Input: call)); | 
|---|
| 5009 | return call; | 
|---|
| 5010 | } | 
|---|
| 5011 |  | 
|---|
| 5012 | /// Emits a call or invoke to the given noreturn runtime function. | 
|---|
| 5013 | void CodeGenFunction::EmitNoreturnRuntimeCallOrInvoke( | 
|---|
| 5014 | llvm::FunctionCallee callee, ArrayRef<llvm::Value *> args) { | 
|---|
| 5015 | SmallVector<llvm::OperandBundleDef, 1> BundleList = | 
|---|
| 5016 | getBundlesForFunclet(Callee: callee.getCallee()); | 
|---|
| 5017 |  | 
|---|
| 5018 | if (getInvokeDest()) { | 
|---|
| 5019 | llvm::InvokeInst *invoke = Builder.CreateInvoke( | 
|---|
| 5020 | Callee: callee, NormalDest: getUnreachableBlock(), UnwindDest: getInvokeDest(), Args: args, OpBundles: BundleList); | 
|---|
| 5021 | invoke->setDoesNotReturn(); | 
|---|
| 5022 | invoke->setCallingConv(getRuntimeCC()); | 
|---|
| 5023 | } else { | 
|---|
| 5024 | llvm::CallInst *call = Builder.CreateCall(Callee: callee, Args: args, OpBundles: BundleList); | 
|---|
| 5025 | call->setDoesNotReturn(); | 
|---|
| 5026 | call->setCallingConv(getRuntimeCC()); | 
|---|
| 5027 | Builder.CreateUnreachable(); | 
|---|
| 5028 | } | 
|---|
| 5029 | } | 
|---|
| 5030 |  | 
|---|
| 5031 | /// Emits a call or invoke instruction to the given nullary runtime function. | 
|---|
| 5032 | llvm::CallBase * | 
|---|
| 5033 | CodeGenFunction::EmitRuntimeCallOrInvoke(llvm::FunctionCallee callee, | 
|---|
| 5034 | const Twine &name) { | 
|---|
| 5035 | return EmitRuntimeCallOrInvoke(callee, args: {}, name); | 
|---|
| 5036 | } | 
|---|
| 5037 |  | 
|---|
| 5038 | /// Emits a call or invoke instruction to the given runtime function. | 
|---|
| 5039 | llvm::CallBase * | 
|---|
| 5040 | CodeGenFunction::EmitRuntimeCallOrInvoke(llvm::FunctionCallee callee, | 
|---|
| 5041 | ArrayRef<llvm::Value *> args, | 
|---|
| 5042 | const Twine &name) { | 
|---|
| 5043 | llvm::CallBase *call = EmitCallOrInvoke(Callee: callee, Args: args, Name: name); | 
|---|
| 5044 | call->setCallingConv(getRuntimeCC()); | 
|---|
| 5045 | return call; | 
|---|
| 5046 | } | 
|---|
| 5047 |  | 
|---|
| 5048 | /// Emits a call or invoke instruction to the given function, depending | 
|---|
| 5049 | /// on the current state of the EH stack. | 
|---|
| 5050 | llvm::CallBase *CodeGenFunction::EmitCallOrInvoke(llvm::FunctionCallee Callee, | 
|---|
| 5051 | ArrayRef<llvm::Value *> Args, | 
|---|
| 5052 | const Twine &Name) { | 
|---|
| 5053 | llvm::BasicBlock *InvokeDest = getInvokeDest(); | 
|---|
| 5054 | SmallVector<llvm::OperandBundleDef, 1> BundleList = | 
|---|
| 5055 | getBundlesForFunclet(Callee: Callee.getCallee()); | 
|---|
| 5056 |  | 
|---|
| 5057 | llvm::CallBase *Inst; | 
|---|
| 5058 | if (!InvokeDest) | 
|---|
| 5059 | Inst = Builder.CreateCall(Callee, Args, OpBundles: BundleList, Name); | 
|---|
| 5060 | else { | 
|---|
| 5061 | llvm::BasicBlock *ContBB = createBasicBlock(name: "invoke.cont"); | 
|---|
| 5062 | Inst = Builder.CreateInvoke(Callee, NormalDest: ContBB, UnwindDest: InvokeDest, Args, OpBundles: BundleList, | 
|---|
| 5063 | Name); | 
|---|
| 5064 | EmitBlock(BB: ContBB); | 
|---|
| 5065 | } | 
|---|
| 5066 |  | 
|---|
| 5067 | // In ObjC ARC mode with no ObjC ARC exception safety, tell the ARC | 
|---|
| 5068 | // optimizer it can aggressively ignore unwind edges. | 
|---|
| 5069 | if (CGM.getLangOpts().ObjCAutoRefCount) | 
|---|
| 5070 | AddObjCARCExceptionMetadata(Inst); | 
|---|
| 5071 |  | 
|---|
| 5072 | return Inst; | 
|---|
| 5073 | } | 
|---|
| 5074 |  | 
|---|
| 5075 | void CodeGenFunction::deferPlaceholderReplacement(llvm::Instruction *Old, | 
|---|
| 5076 | llvm::Value *New) { | 
|---|
| 5077 | DeferredReplacements.push_back( | 
|---|
| 5078 | Elt: std::make_pair(x: llvm::WeakTrackingVH(Old), y&: New)); | 
|---|
| 5079 | } | 
|---|
| 5080 |  | 
|---|
| 5081 | namespace { | 
|---|
| 5082 |  | 
|---|
| 5083 | /// Specify given \p NewAlign as the alignment of return value attribute. If | 
|---|
| 5084 | /// such attribute already exists, re-set it to the maximal one of two options. | 
|---|
| 5085 | [[nodiscard]] llvm::AttributeList | 
|---|
| 5086 | maybeRaiseRetAlignmentAttribute(llvm::LLVMContext &Ctx, | 
|---|
| 5087 | const llvm::AttributeList &Attrs, | 
|---|
| 5088 | llvm::Align NewAlign) { | 
|---|
| 5089 | llvm::Align CurAlign = Attrs.getRetAlignment().valueOrOne(); | 
|---|
| 5090 | if (CurAlign >= NewAlign) | 
|---|
| 5091 | return Attrs; | 
|---|
| 5092 | llvm::Attribute AlignAttr = llvm::Attribute::getWithAlignment(Context&: Ctx, Alignment: NewAlign); | 
|---|
| 5093 | return Attrs.removeRetAttribute(C&: Ctx, Kind: llvm::Attribute::AttrKind::Alignment) | 
|---|
| 5094 | .addRetAttribute(C&: Ctx, Attr: AlignAttr); | 
|---|
| 5095 | } | 
|---|
| 5096 |  | 
|---|
| 5097 | template <typename AlignedAttrTy> class AbstractAssumeAlignedAttrEmitter { | 
|---|
| 5098 | protected: | 
|---|
| 5099 | CodeGenFunction &CGF; | 
|---|
| 5100 |  | 
|---|
| 5101 | /// We do nothing if this is, or becomes, nullptr. | 
|---|
| 5102 | const AlignedAttrTy *AA = nullptr; | 
|---|
| 5103 |  | 
|---|
| 5104 | llvm::Value *Alignment = nullptr;      // May or may not be a constant. | 
|---|
| 5105 | llvm::ConstantInt *OffsetCI = nullptr; // Constant, hopefully zero. | 
|---|
| 5106 |  | 
|---|
| 5107 | AbstractAssumeAlignedAttrEmitter(CodeGenFunction &CGF_, const Decl *FuncDecl) | 
|---|
| 5108 | : CGF(CGF_) { | 
|---|
| 5109 | if (!FuncDecl) | 
|---|
| 5110 | return; | 
|---|
| 5111 | AA = FuncDecl->getAttr<AlignedAttrTy>(); | 
|---|
| 5112 | } | 
|---|
| 5113 |  | 
|---|
| 5114 | public: | 
|---|
| 5115 | /// If we can, materialize the alignment as an attribute on return value. | 
|---|
| 5116 | [[nodiscard]] llvm::AttributeList | 
|---|
| 5117 | TryEmitAsCallSiteAttribute(const llvm::AttributeList &Attrs) { | 
|---|
| 5118 | if (!AA || OffsetCI || CGF.SanOpts.has(K: SanitizerKind::Alignment)) | 
|---|
| 5119 | return Attrs; | 
|---|
| 5120 | const auto *AlignmentCI = dyn_cast<llvm::ConstantInt>(Val: Alignment); | 
|---|
| 5121 | if (!AlignmentCI) | 
|---|
| 5122 | return Attrs; | 
|---|
| 5123 | // We may legitimately have non-power-of-2 alignment here. | 
|---|
| 5124 | // If so, this is UB land, emit it via `@llvm.assume` instead. | 
|---|
| 5125 | if (!AlignmentCI->getValue().isPowerOf2()) | 
|---|
| 5126 | return Attrs; | 
|---|
| 5127 | llvm::AttributeList NewAttrs = maybeRaiseRetAlignmentAttribute( | 
|---|
| 5128 | Ctx&: CGF.getLLVMContext(), Attrs, | 
|---|
| 5129 | NewAlign: llvm::Align( | 
|---|
| 5130 | AlignmentCI->getLimitedValue(Limit: llvm::Value::MaximumAlignment))); | 
|---|
| 5131 | AA = nullptr; // We're done. Disallow doing anything else. | 
|---|
| 5132 | return NewAttrs; | 
|---|
| 5133 | } | 
|---|
| 5134 |  | 
|---|
| 5135 | /// Emit alignment assumption. | 
|---|
| 5136 | /// This is a general fallback that we take if either there is an offset, | 
|---|
| 5137 | /// or the alignment is variable or we are sanitizing for alignment. | 
|---|
| 5138 | void EmitAsAnAssumption(SourceLocation Loc, QualType RetTy, RValue &Ret) { | 
|---|
| 5139 | if (!AA) | 
|---|
| 5140 | return; | 
|---|
| 5141 | CGF.emitAlignmentAssumption(Ret.getScalarVal(), RetTy, Loc, | 
|---|
| 5142 | AA->getLocation(), Alignment, OffsetCI); | 
|---|
| 5143 | AA = nullptr; // We're done. Disallow doing anything else. | 
|---|
| 5144 | } | 
|---|
| 5145 | }; | 
|---|
| 5146 |  | 
|---|
| 5147 | /// Helper data structure to emit `AssumeAlignedAttr`. | 
|---|
| 5148 | class AssumeAlignedAttrEmitter final | 
|---|
| 5149 | : public AbstractAssumeAlignedAttrEmitter<AssumeAlignedAttr> { | 
|---|
| 5150 | public: | 
|---|
| 5151 | AssumeAlignedAttrEmitter(CodeGenFunction &CGF_, const Decl *FuncDecl) | 
|---|
| 5152 | : AbstractAssumeAlignedAttrEmitter(CGF_, FuncDecl) { | 
|---|
| 5153 | if (!AA) | 
|---|
| 5154 | return; | 
|---|
| 5155 | // It is guaranteed that the alignment/offset are constants. | 
|---|
| 5156 | Alignment = cast<llvm::ConstantInt>(Val: CGF.EmitScalarExpr(E: AA->getAlignment())); | 
|---|
| 5157 | if (Expr *Offset = AA->getOffset()) { | 
|---|
| 5158 | OffsetCI = cast<llvm::ConstantInt>(Val: CGF.EmitScalarExpr(E: Offset)); | 
|---|
| 5159 | if (OffsetCI->isNullValue()) // Canonicalize zero offset to no offset. | 
|---|
| 5160 | OffsetCI = nullptr; | 
|---|
| 5161 | } | 
|---|
| 5162 | } | 
|---|
| 5163 | }; | 
|---|
| 5164 |  | 
|---|
| 5165 | /// Helper data structure to emit `AllocAlignAttr`. | 
|---|
| 5166 | class AllocAlignAttrEmitter final | 
|---|
| 5167 | : public AbstractAssumeAlignedAttrEmitter<AllocAlignAttr> { | 
|---|
| 5168 | public: | 
|---|
| 5169 | AllocAlignAttrEmitter(CodeGenFunction &CGF_, const Decl *FuncDecl, | 
|---|
| 5170 | const CallArgList &CallArgs) | 
|---|
| 5171 | : AbstractAssumeAlignedAttrEmitter(CGF_, FuncDecl) { | 
|---|
| 5172 | if (!AA) | 
|---|
| 5173 | return; | 
|---|
| 5174 | // Alignment may or may not be a constant, and that is okay. | 
|---|
| 5175 | Alignment = CallArgs[AA->getParamIndex().getLLVMIndex()] | 
|---|
| 5176 | .getRValue(CGF) | 
|---|
| 5177 | .getScalarVal(); | 
|---|
| 5178 | } | 
|---|
| 5179 | }; | 
|---|
| 5180 |  | 
|---|
| 5181 | } // namespace | 
|---|
| 5182 |  | 
|---|
| 5183 | static unsigned getMaxVectorWidth(const llvm::Type *Ty) { | 
|---|
| 5184 | if (auto *VT = dyn_cast<llvm::VectorType>(Val: Ty)) | 
|---|
| 5185 | return VT->getPrimitiveSizeInBits().getKnownMinValue(); | 
|---|
| 5186 | if (auto *AT = dyn_cast<llvm::ArrayType>(Val: Ty)) | 
|---|
| 5187 | return getMaxVectorWidth(Ty: AT->getElementType()); | 
|---|
| 5188 |  | 
|---|
| 5189 | unsigned MaxVectorWidth = 0; | 
|---|
| 5190 | if (auto *ST = dyn_cast<llvm::StructType>(Val: Ty)) | 
|---|
| 5191 | for (auto *I : ST->elements()) | 
|---|
| 5192 | MaxVectorWidth = std::max(a: MaxVectorWidth, b: getMaxVectorWidth(Ty: I)); | 
|---|
| 5193 | return MaxVectorWidth; | 
|---|
| 5194 | } | 
|---|
| 5195 |  | 
|---|
| 5196 | RValue CodeGenFunction::EmitCall(const CGFunctionInfo &CallInfo, | 
|---|
| 5197 | const CGCallee &Callee, | 
|---|
| 5198 | ReturnValueSlot ReturnValue, | 
|---|
| 5199 | const CallArgList &CallArgs, | 
|---|
| 5200 | llvm::CallBase **callOrInvoke, bool IsMustTail, | 
|---|
| 5201 | SourceLocation Loc, | 
|---|
| 5202 | bool IsVirtualFunctionPointerThunk) { | 
|---|
| 5203 | // FIXME: We no longer need the types from CallArgs; lift up and simplify. | 
|---|
| 5204 |  | 
|---|
| 5205 | assert(Callee.isOrdinary() || Callee.isVirtual()); | 
|---|
| 5206 |  | 
|---|
| 5207 | // Handle struct-return functions by passing a pointer to the | 
|---|
| 5208 | // location that we would like to return into. | 
|---|
| 5209 | QualType RetTy = CallInfo.getReturnType(); | 
|---|
| 5210 | const ABIArgInfo &RetAI = CallInfo.getReturnInfo(); | 
|---|
| 5211 |  | 
|---|
| 5212 | llvm::FunctionType *IRFuncTy = getTypes().GetFunctionType(FI: CallInfo); | 
|---|
| 5213 |  | 
|---|
| 5214 | const Decl *TargetDecl = Callee.getAbstractInfo().getCalleeDecl().getDecl(); | 
|---|
| 5215 | if (const FunctionDecl *FD = dyn_cast_or_null<FunctionDecl>(Val: TargetDecl)) { | 
|---|
| 5216 | // We can only guarantee that a function is called from the correct | 
|---|
| 5217 | // context/function based on the appropriate target attributes, | 
|---|
| 5218 | // so only check in the case where we have both always_inline and target | 
|---|
| 5219 | // since otherwise we could be making a conditional call after a check for | 
|---|
| 5220 | // the proper cpu features (and it won't cause code generation issues due to | 
|---|
| 5221 | // function based code generation). | 
|---|
| 5222 | if (TargetDecl->hasAttr<AlwaysInlineAttr>() && | 
|---|
| 5223 | (TargetDecl->hasAttr<TargetAttr>() || | 
|---|
| 5224 | (CurFuncDecl && CurFuncDecl->hasAttr<TargetAttr>()))) | 
|---|
| 5225 | checkTargetFeatures(Loc, TargetDecl: FD); | 
|---|
| 5226 | } | 
|---|
| 5227 |  | 
|---|
| 5228 | // Some architectures (such as x86-64) have the ABI changed based on | 
|---|
| 5229 | // attribute-target/features. Give them a chance to diagnose. | 
|---|
| 5230 | const FunctionDecl *CallerDecl = dyn_cast_or_null<FunctionDecl>(Val: CurCodeDecl); | 
|---|
| 5231 | const FunctionDecl *CalleeDecl = dyn_cast_or_null<FunctionDecl>(Val: TargetDecl); | 
|---|
| 5232 | CGM.getTargetCodeGenInfo().checkFunctionCallABI(CGM, CallLoc: Loc, Caller: CallerDecl, | 
|---|
| 5233 | Callee: CalleeDecl, Args: CallArgs, ReturnType: RetTy); | 
|---|
| 5234 |  | 
|---|
| 5235 | // 1. Set up the arguments. | 
|---|
| 5236 |  | 
|---|
| 5237 | // If we're using inalloca, insert the allocation after the stack save. | 
|---|
| 5238 | // FIXME: Do this earlier rather than hacking it in here! | 
|---|
| 5239 | RawAddress ArgMemory = RawAddress::invalid(); | 
|---|
| 5240 | if (llvm::StructType *ArgStruct = CallInfo.getArgStruct()) { | 
|---|
| 5241 | const llvm::DataLayout &DL = CGM.getDataLayout(); | 
|---|
| 5242 | llvm::Instruction *IP = CallArgs.getStackBase(); | 
|---|
| 5243 | llvm::AllocaInst *AI; | 
|---|
| 5244 | if (IP) { | 
|---|
| 5245 | IP = IP->getNextNode(); | 
|---|
| 5246 | AI = new llvm::AllocaInst(ArgStruct, DL.getAllocaAddrSpace(), "argmem", | 
|---|
| 5247 | IP->getIterator()); | 
|---|
| 5248 | } else { | 
|---|
| 5249 | AI = CreateTempAlloca(Ty: ArgStruct, Name: "argmem"); | 
|---|
| 5250 | } | 
|---|
| 5251 | auto Align = CallInfo.getArgStructAlignment(); | 
|---|
| 5252 | AI->setAlignment(Align.getAsAlign()); | 
|---|
| 5253 | AI->setUsedWithInAlloca(true); | 
|---|
| 5254 | assert(AI->isUsedWithInAlloca() && !AI->isStaticAlloca()); | 
|---|
| 5255 | ArgMemory = RawAddress(AI, ArgStruct, Align); | 
|---|
| 5256 | } | 
|---|
| 5257 |  | 
|---|
| 5258 | ClangToLLVMArgMapping IRFunctionArgs(CGM.getContext(), CallInfo); | 
|---|
| 5259 | SmallVector<llvm::Value *, 16> IRCallArgs(IRFunctionArgs.totalIRArgs()); | 
|---|
| 5260 |  | 
|---|
| 5261 | // If the call returns a temporary with struct return, create a temporary | 
|---|
| 5262 | // alloca to hold the result, unless one is given to us. | 
|---|
| 5263 | Address SRetPtr = Address::invalid(); | 
|---|
| 5264 | llvm::Value *UnusedReturnSizePtr = nullptr; | 
|---|
| 5265 | if (RetAI.isIndirect() || RetAI.isInAlloca() || RetAI.isCoerceAndExpand()) { | 
|---|
| 5266 | // For virtual function pointer thunks and musttail calls, we must always | 
|---|
| 5267 | // forward an incoming SRet pointer to the callee, because a local alloca | 
|---|
| 5268 | // would be de-allocated before the call. These cases both guarantee that | 
|---|
| 5269 | // there will be an incoming SRet argument of the correct type. | 
|---|
| 5270 | if ((IsVirtualFunctionPointerThunk || IsMustTail) && RetAI.isIndirect()) { | 
|---|
| 5271 | SRetPtr = makeNaturalAddressForPointer(Ptr: CurFn->arg_begin() + | 
|---|
| 5272 | IRFunctionArgs.getSRetArgNo(), | 
|---|
| 5273 | T: RetTy, Alignment: CharUnits::fromQuantity(Quantity: 1)); | 
|---|
| 5274 | } else if (!ReturnValue.isNull()) { | 
|---|
| 5275 | SRetPtr = ReturnValue.getAddress(); | 
|---|
| 5276 | } else { | 
|---|
| 5277 | SRetPtr = CreateMemTempWithoutCast(T: RetTy, Name: "tmp"); | 
|---|
| 5278 | if (HaveInsertPoint() && ReturnValue.isUnused()) { | 
|---|
| 5279 | llvm::TypeSize size = | 
|---|
| 5280 | CGM.getDataLayout().getTypeAllocSize(Ty: ConvertTypeForMem(T: RetTy)); | 
|---|
| 5281 | UnusedReturnSizePtr = EmitLifetimeStart(Size: size, Addr: SRetPtr.getBasePointer()); | 
|---|
| 5282 | } | 
|---|
| 5283 | } | 
|---|
| 5284 | if (IRFunctionArgs.hasSRetArg()) { | 
|---|
| 5285 | // A mismatch between the allocated return value's AS and the target's | 
|---|
| 5286 | // chosen IndirectAS can happen e.g. when passing the this pointer through | 
|---|
| 5287 | // a chain involving stores to / loads from the DefaultAS; we address this | 
|---|
| 5288 | // here, symmetrically with the handling we have for normal pointer args. | 
|---|
| 5289 | if (SRetPtr.getAddressSpace() != RetAI.getIndirectAddrSpace()) { | 
|---|
| 5290 | llvm::Value *V = SRetPtr.getBasePointer(); | 
|---|
| 5291 | LangAS SAS = getLangASFromTargetAS(TargetAS: SRetPtr.getAddressSpace()); | 
|---|
| 5292 | llvm::Type *Ty = llvm::PointerType::get(C&: getLLVMContext(), | 
|---|
| 5293 | AddressSpace: RetAI.getIndirectAddrSpace()); | 
|---|
| 5294 |  | 
|---|
| 5295 | SRetPtr = SRetPtr.withPointer( | 
|---|
| 5296 | NewPointer: getTargetHooks().performAddrSpaceCast(CGF&: *this, V, SrcAddr: SAS, DestTy: Ty, IsNonNull: true), | 
|---|
| 5297 | IsKnownNonNull: SRetPtr.isKnownNonNull()); | 
|---|
| 5298 | } | 
|---|
| 5299 | IRCallArgs[IRFunctionArgs.getSRetArgNo()] = | 
|---|
| 5300 | getAsNaturalPointerTo(Addr: SRetPtr, PointeeType: RetTy); | 
|---|
| 5301 | } else if (RetAI.isInAlloca()) { | 
|---|
| 5302 | Address Addr = | 
|---|
| 5303 | Builder.CreateStructGEP(Addr: ArgMemory, Index: RetAI.getInAllocaFieldIndex()); | 
|---|
| 5304 | Builder.CreateStore(Val: getAsNaturalPointerTo(Addr: SRetPtr, PointeeType: RetTy), Addr); | 
|---|
| 5305 | } | 
|---|
| 5306 | } | 
|---|
| 5307 |  | 
|---|
| 5308 | RawAddress swiftErrorTemp = RawAddress::invalid(); | 
|---|
| 5309 | Address swiftErrorArg = Address::invalid(); | 
|---|
| 5310 |  | 
|---|
| 5311 | // When passing arguments using temporary allocas, we need to add the | 
|---|
| 5312 | // appropriate lifetime markers. This vector keeps track of all the lifetime | 
|---|
| 5313 | // markers that need to be ended right after the call. | 
|---|
| 5314 | SmallVector<CallLifetimeEnd, 2> CallLifetimeEndAfterCall; | 
|---|
| 5315 |  | 
|---|
| 5316 | // Translate all of the arguments as necessary to match the IR lowering. | 
|---|
| 5317 | assert(CallInfo.arg_size() == CallArgs.size() && | 
|---|
| 5318 | "Mismatch between function signature & arguments."); | 
|---|
| 5319 | unsigned ArgNo = 0; | 
|---|
| 5320 | CGFunctionInfo::const_arg_iterator info_it = CallInfo.arg_begin(); | 
|---|
| 5321 | for (CallArgList::const_iterator I = CallArgs.begin(), E = CallArgs.end(); | 
|---|
| 5322 | I != E; ++I, ++info_it, ++ArgNo) { | 
|---|
| 5323 | const ABIArgInfo &ArgInfo = info_it->info; | 
|---|
| 5324 |  | 
|---|
| 5325 | // Insert a padding argument to ensure proper alignment. | 
|---|
| 5326 | if (IRFunctionArgs.hasPaddingArg(ArgNo)) | 
|---|
| 5327 | IRCallArgs[IRFunctionArgs.getPaddingArgNo(ArgNo)] = | 
|---|
| 5328 | llvm::UndefValue::get(T: ArgInfo.getPaddingType()); | 
|---|
| 5329 |  | 
|---|
| 5330 | unsigned FirstIRArg, NumIRArgs; | 
|---|
| 5331 | std::tie(args&: FirstIRArg, args&: NumIRArgs) = IRFunctionArgs.getIRArgs(ArgNo); | 
|---|
| 5332 |  | 
|---|
| 5333 | bool ArgHasMaybeUndefAttr = | 
|---|
| 5334 | IsArgumentMaybeUndef(TargetDecl, NumRequiredArgs: CallInfo.getNumRequiredArgs(), ArgNo); | 
|---|
| 5335 |  | 
|---|
| 5336 | switch (ArgInfo.getKind()) { | 
|---|
| 5337 | case ABIArgInfo::InAlloca: { | 
|---|
| 5338 | assert(NumIRArgs == 0); | 
|---|
| 5339 | assert(getTarget().getTriple().getArch() == llvm::Triple::x86); | 
|---|
| 5340 | if (I->isAggregate()) { | 
|---|
| 5341 | RawAddress Addr = I->hasLValue() | 
|---|
| 5342 | ? I->getKnownLValue().getAddress() | 
|---|
| 5343 | : I->getKnownRValue().getAggregateAddress(); | 
|---|
| 5344 | llvm::Instruction *Placeholder = | 
|---|
| 5345 | cast<llvm::Instruction>(Val: Addr.getPointer()); | 
|---|
| 5346 |  | 
|---|
| 5347 | if (!ArgInfo.getInAllocaIndirect()) { | 
|---|
| 5348 | // Replace the placeholder with the appropriate argument slot GEP. | 
|---|
| 5349 | CGBuilderTy::InsertPoint IP = Builder.saveIP(); | 
|---|
| 5350 | Builder.SetInsertPoint(Placeholder); | 
|---|
| 5351 | Addr = Builder.CreateStructGEP(Addr: ArgMemory, | 
|---|
| 5352 | Index: ArgInfo.getInAllocaFieldIndex()); | 
|---|
| 5353 | Builder.restoreIP(IP); | 
|---|
| 5354 | } else { | 
|---|
| 5355 | // For indirect things such as overaligned structs, replace the | 
|---|
| 5356 | // placeholder with a regular aggregate temporary alloca. Store the | 
|---|
| 5357 | // address of this alloca into the struct. | 
|---|
| 5358 | Addr = CreateMemTemp(T: info_it->type, Name: "inalloca.indirect.tmp"); | 
|---|
| 5359 | Address ArgSlot = Builder.CreateStructGEP( | 
|---|
| 5360 | Addr: ArgMemory, Index: ArgInfo.getInAllocaFieldIndex()); | 
|---|
| 5361 | Builder.CreateStore(Val: Addr.getPointer(), Addr: ArgSlot); | 
|---|
| 5362 | } | 
|---|
| 5363 | deferPlaceholderReplacement(Old: Placeholder, New: Addr.getPointer()); | 
|---|
| 5364 | } else if (ArgInfo.getInAllocaIndirect()) { | 
|---|
| 5365 | // Make a temporary alloca and store the address of it into the argument | 
|---|
| 5366 | // struct. | 
|---|
| 5367 | RawAddress Addr = CreateMemTempWithoutCast( | 
|---|
| 5368 | T: I->Ty, Align: getContext().getTypeAlignInChars(T: I->Ty), | 
|---|
| 5369 | Name: "indirect-arg-temp"); | 
|---|
| 5370 | I->copyInto(CGF&: *this, Addr); | 
|---|
| 5371 | Address ArgSlot = | 
|---|
| 5372 | Builder.CreateStructGEP(Addr: ArgMemory, Index: ArgInfo.getInAllocaFieldIndex()); | 
|---|
| 5373 | Builder.CreateStore(Val: Addr.getPointer(), Addr: ArgSlot); | 
|---|
| 5374 | } else { | 
|---|
| 5375 | // Store the RValue into the argument struct. | 
|---|
| 5376 | Address Addr = | 
|---|
| 5377 | Builder.CreateStructGEP(Addr: ArgMemory, Index: ArgInfo.getInAllocaFieldIndex()); | 
|---|
| 5378 | Addr = Addr.withElementType(ElemTy: ConvertTypeForMem(T: I->Ty)); | 
|---|
| 5379 | I->copyInto(CGF&: *this, Addr); | 
|---|
| 5380 | } | 
|---|
| 5381 | break; | 
|---|
| 5382 | } | 
|---|
| 5383 |  | 
|---|
| 5384 | case ABIArgInfo::Indirect: | 
|---|
| 5385 | case ABIArgInfo::IndirectAliased: { | 
|---|
| 5386 | assert(NumIRArgs == 1); | 
|---|
| 5387 | if (I->isAggregate()) { | 
|---|
| 5388 | // We want to avoid creating an unnecessary temporary+copy here; | 
|---|
| 5389 | // however, we need one in three cases: | 
|---|
| 5390 | // 1. If the argument is not byval, and we are required to copy the | 
|---|
| 5391 | //    source.  (This case doesn't occur on any common architecture.) | 
|---|
| 5392 | // 2. If the argument is byval, RV is not sufficiently aligned, and | 
|---|
| 5393 | //    we cannot force it to be sufficiently aligned. | 
|---|
| 5394 | // 3. If the argument is byval, but RV is not located in default | 
|---|
| 5395 | //    or alloca address space. | 
|---|
| 5396 | Address Addr = I->hasLValue() | 
|---|
| 5397 | ? I->getKnownLValue().getAddress() | 
|---|
| 5398 | : I->getKnownRValue().getAggregateAddress(); | 
|---|
| 5399 | CharUnits Align = ArgInfo.getIndirectAlign(); | 
|---|
| 5400 | const llvm::DataLayout *TD = &CGM.getDataLayout(); | 
|---|
| 5401 |  | 
|---|
| 5402 | assert((FirstIRArg >= IRFuncTy->getNumParams() || | 
|---|
| 5403 | IRFuncTy->getParamType(FirstIRArg)->getPointerAddressSpace() == | 
|---|
| 5404 | TD->getAllocaAddrSpace()) && | 
|---|
| 5405 | "indirect argument must be in alloca address space"); | 
|---|
| 5406 |  | 
|---|
| 5407 | bool NeedCopy = false; | 
|---|
| 5408 | if (Addr.getAlignment() < Align && | 
|---|
| 5409 | llvm::getOrEnforceKnownAlignment(V: Addr.emitRawPointer(CGF&: *this), | 
|---|
| 5410 | PrefAlign: Align.getAsAlign(), | 
|---|
| 5411 | DL: *TD) < Align.getAsAlign()) { | 
|---|
| 5412 | NeedCopy = true; | 
|---|
| 5413 | } else if (I->hasLValue()) { | 
|---|
| 5414 | auto LV = I->getKnownLValue(); | 
|---|
| 5415 |  | 
|---|
| 5416 | bool isByValOrRef = | 
|---|
| 5417 | ArgInfo.isIndirectAliased() || ArgInfo.getIndirectByVal(); | 
|---|
| 5418 |  | 
|---|
| 5419 | if (!isByValOrRef || | 
|---|
| 5420 | (LV.getAlignment() < getContext().getTypeAlignInChars(T: I->Ty))) { | 
|---|
| 5421 | NeedCopy = true; | 
|---|
| 5422 | } | 
|---|
| 5423 |  | 
|---|
| 5424 | if (isByValOrRef && Addr.getType()->getAddressSpace() != | 
|---|
| 5425 | ArgInfo.getIndirectAddrSpace()) { | 
|---|
| 5426 | NeedCopy = true; | 
|---|
| 5427 | } | 
|---|
| 5428 | } | 
|---|
| 5429 |  | 
|---|
| 5430 | if (!NeedCopy) { | 
|---|
| 5431 | // Skip the extra memcpy call. | 
|---|
| 5432 | llvm::Value *V = getAsNaturalPointerTo(Addr, PointeeType: I->Ty); | 
|---|
| 5433 | auto *T = llvm::PointerType::get(C&: CGM.getLLVMContext(), | 
|---|
| 5434 | AddressSpace: ArgInfo.getIndirectAddrSpace()); | 
|---|
| 5435 |  | 
|---|
| 5436 | // FIXME: This should not depend on the language address spaces, and | 
|---|
| 5437 | // only the contextual values. If the address space mismatches, see if | 
|---|
| 5438 | // we can look through a cast to a compatible address space value, | 
|---|
| 5439 | // otherwise emit a copy. | 
|---|
| 5440 | llvm::Value *Val = getTargetHooks().performAddrSpaceCast( | 
|---|
| 5441 | CGF&: *this, V, SrcAddr: I->Ty.getAddressSpace(), DestTy: T, IsNonNull: true); | 
|---|
| 5442 | if (ArgHasMaybeUndefAttr) | 
|---|
| 5443 | Val = Builder.CreateFreeze(V: Val); | 
|---|
| 5444 | IRCallArgs[FirstIRArg] = Val; | 
|---|
| 5445 | break; | 
|---|
| 5446 | } | 
|---|
| 5447 | } else if (I->getType()->isArrayParameterType()) { | 
|---|
| 5448 | // Don't produce a temporary for ArrayParameterType arguments. | 
|---|
| 5449 | // ArrayParameterType arguments are only created from | 
|---|
| 5450 | // HLSL_ArrayRValue casts and HLSLOutArgExpr expressions, both | 
|---|
| 5451 | // of which create temporaries already. This allows us to just use the | 
|---|
| 5452 | // scalar for the decayed array pointer as the argument directly. | 
|---|
| 5453 | IRCallArgs[FirstIRArg] = I->getKnownRValue().getScalarVal(); | 
|---|
| 5454 | break; | 
|---|
| 5455 | } | 
|---|
| 5456 |  | 
|---|
| 5457 | // For non-aggregate args and aggregate args meeting conditions above | 
|---|
| 5458 | // we need to create an aligned temporary, and copy to it. | 
|---|
| 5459 | RawAddress AI = CreateMemTempWithoutCast( | 
|---|
| 5460 | T: I->Ty, Align: ArgInfo.getIndirectAlign(), Name: "byval-temp"); | 
|---|
| 5461 | llvm::Value *Val = getAsNaturalPointerTo(Addr: AI, PointeeType: I->Ty); | 
|---|
| 5462 | if (ArgHasMaybeUndefAttr) | 
|---|
| 5463 | Val = Builder.CreateFreeze(V: Val); | 
|---|
| 5464 | IRCallArgs[FirstIRArg] = Val; | 
|---|
| 5465 |  | 
|---|
| 5466 | // Emit lifetime markers for the temporary alloca. | 
|---|
| 5467 | llvm::TypeSize ByvalTempElementSize = | 
|---|
| 5468 | CGM.getDataLayout().getTypeAllocSize(Ty: AI.getElementType()); | 
|---|
| 5469 | llvm::Value *LifetimeSize = | 
|---|
| 5470 | EmitLifetimeStart(Size: ByvalTempElementSize, Addr: AI.getPointer()); | 
|---|
| 5471 |  | 
|---|
| 5472 | // Add cleanup code to emit the end lifetime marker after the call. | 
|---|
| 5473 | if (LifetimeSize) // In case we disabled lifetime markers. | 
|---|
| 5474 | CallLifetimeEndAfterCall.emplace_back(Args&: AI, Args&: LifetimeSize); | 
|---|
| 5475 |  | 
|---|
| 5476 | // Generate the copy. | 
|---|
| 5477 | I->copyInto(CGF&: *this, Addr: AI); | 
|---|
| 5478 | break; | 
|---|
| 5479 | } | 
|---|
| 5480 |  | 
|---|
| 5481 | case ABIArgInfo::Ignore: | 
|---|
| 5482 | assert(NumIRArgs == 0); | 
|---|
| 5483 | break; | 
|---|
| 5484 |  | 
|---|
| 5485 | case ABIArgInfo::Extend: | 
|---|
| 5486 | case ABIArgInfo::Direct: { | 
|---|
| 5487 | if (!isa<llvm::StructType>(Val: ArgInfo.getCoerceToType()) && | 
|---|
| 5488 | ArgInfo.getCoerceToType() == ConvertType(T: info_it->type) && | 
|---|
| 5489 | ArgInfo.getDirectOffset() == 0) { | 
|---|
| 5490 | assert(NumIRArgs == 1); | 
|---|
| 5491 | llvm::Value *V; | 
|---|
| 5492 | if (!I->isAggregate()) | 
|---|
| 5493 | V = I->getKnownRValue().getScalarVal(); | 
|---|
| 5494 | else | 
|---|
| 5495 | V = Builder.CreateLoad( | 
|---|
| 5496 | Addr: I->hasLValue() ? I->getKnownLValue().getAddress() | 
|---|
| 5497 | : I->getKnownRValue().getAggregateAddress()); | 
|---|
| 5498 |  | 
|---|
| 5499 | // Implement swifterror by copying into a new swifterror argument. | 
|---|
| 5500 | // We'll write back in the normal path out of the call. | 
|---|
| 5501 | if (CallInfo.getExtParameterInfo(argIndex: ArgNo).getABI() == | 
|---|
| 5502 | ParameterABI::SwiftErrorResult) { | 
|---|
| 5503 | assert(!swiftErrorTemp.isValid() && "multiple swifterror args"); | 
|---|
| 5504 |  | 
|---|
| 5505 | QualType pointeeTy = I->Ty->getPointeeType(); | 
|---|
| 5506 | swiftErrorArg = makeNaturalAddressForPointer( | 
|---|
| 5507 | Ptr: V, T: pointeeTy, Alignment: getContext().getTypeAlignInChars(T: pointeeTy)); | 
|---|
| 5508 |  | 
|---|
| 5509 | swiftErrorTemp = | 
|---|
| 5510 | CreateMemTemp(T: pointeeTy, Align: getPointerAlign(), Name: "swifterror.temp"); | 
|---|
| 5511 | V = swiftErrorTemp.getPointer(); | 
|---|
| 5512 | cast<llvm::AllocaInst>(Val: V)->setSwiftError(true); | 
|---|
| 5513 |  | 
|---|
| 5514 | llvm::Value *errorValue = Builder.CreateLoad(Addr: swiftErrorArg); | 
|---|
| 5515 | Builder.CreateStore(Val: errorValue, Addr: swiftErrorTemp); | 
|---|
| 5516 | } | 
|---|
| 5517 |  | 
|---|
| 5518 | // We might have to widen integers, but we should never truncate. | 
|---|
| 5519 | if (ArgInfo.getCoerceToType() != V->getType() && | 
|---|
| 5520 | V->getType()->isIntegerTy()) | 
|---|
| 5521 | V = Builder.CreateZExt(V, DestTy: ArgInfo.getCoerceToType()); | 
|---|
| 5522 |  | 
|---|
| 5523 | // The only plausible mismatch here would be for pointer address spaces. | 
|---|
| 5524 | // We assume that the target has a reasonable mapping for the DefaultAS | 
|---|
| 5525 | // (it can be cast to from incoming specific ASes), and insert an AS | 
|---|
| 5526 | // cast to address the mismatch. | 
|---|
| 5527 | if (FirstIRArg < IRFuncTy->getNumParams() && | 
|---|
| 5528 | V->getType() != IRFuncTy->getParamType(i: FirstIRArg)) { | 
|---|
| 5529 | assert(V->getType()->isPointerTy() && "Only pointers can mismatch!"); | 
|---|
| 5530 | auto ActualAS = I->Ty.getAddressSpace(); | 
|---|
| 5531 | V = getTargetHooks().performAddrSpaceCast( | 
|---|
| 5532 | CGF&: *this, V, SrcAddr: ActualAS, DestTy: IRFuncTy->getParamType(i: FirstIRArg)); | 
|---|
| 5533 | } | 
|---|
| 5534 |  | 
|---|
| 5535 | if (ArgHasMaybeUndefAttr) | 
|---|
| 5536 | V = Builder.CreateFreeze(V); | 
|---|
| 5537 | IRCallArgs[FirstIRArg] = V; | 
|---|
| 5538 | break; | 
|---|
| 5539 | } | 
|---|
| 5540 |  | 
|---|
| 5541 | llvm::StructType *STy = | 
|---|
| 5542 | dyn_cast<llvm::StructType>(Val: ArgInfo.getCoerceToType()); | 
|---|
| 5543 |  | 
|---|
| 5544 | // FIXME: Avoid the conversion through memory if possible. | 
|---|
| 5545 | Address Src = Address::invalid(); | 
|---|
| 5546 | if (!I->isAggregate()) { | 
|---|
| 5547 | Src = CreateMemTemp(T: I->Ty, Name: "coerce"); | 
|---|
| 5548 | I->copyInto(CGF&: *this, Addr: Src); | 
|---|
| 5549 | } else { | 
|---|
| 5550 | Src = I->hasLValue() ? I->getKnownLValue().getAddress() | 
|---|
| 5551 | : I->getKnownRValue().getAggregateAddress(); | 
|---|
| 5552 | } | 
|---|
| 5553 |  | 
|---|
| 5554 | // If the value is offset in memory, apply the offset now. | 
|---|
| 5555 | Src = emitAddressAtOffset(CGF&: *this, addr: Src, info: ArgInfo); | 
|---|
| 5556 |  | 
|---|
| 5557 | // Fast-isel and the optimizer generally like scalar values better than | 
|---|
| 5558 | // FCAs, so we flatten them if this is safe to do for this argument. | 
|---|
| 5559 | if (STy && ArgInfo.isDirect() && ArgInfo.getCanBeFlattened()) { | 
|---|
| 5560 | llvm::Type *SrcTy = Src.getElementType(); | 
|---|
| 5561 | llvm::TypeSize SrcTypeSize = | 
|---|
| 5562 | CGM.getDataLayout().getTypeAllocSize(Ty: SrcTy); | 
|---|
| 5563 | llvm::TypeSize DstTypeSize = CGM.getDataLayout().getTypeAllocSize(Ty: STy); | 
|---|
| 5564 | if (SrcTypeSize.isScalable()) { | 
|---|
| 5565 | assert(STy->containsHomogeneousScalableVectorTypes() && | 
|---|
| 5566 | "ABI only supports structure with homogeneous scalable vector " | 
|---|
| 5567 | "type"); | 
|---|
| 5568 | assert(SrcTypeSize == DstTypeSize && | 
|---|
| 5569 | "Only allow non-fractional movement of structure with " | 
|---|
| 5570 | "homogeneous scalable vector type"); | 
|---|
| 5571 | assert(NumIRArgs == STy->getNumElements()); | 
|---|
| 5572 |  | 
|---|
| 5573 | llvm::Value *StoredStructValue = | 
|---|
| 5574 | Builder.CreateLoad(Addr: Src, Name: Src.getName() + ".tuple"); | 
|---|
| 5575 | for (unsigned i = 0, e = STy->getNumElements(); i != e; ++i) { | 
|---|
| 5576 | llvm::Value *Extract = Builder.CreateExtractValue( | 
|---|
| 5577 | Agg: StoredStructValue, Idxs: i, Name: Src.getName() + ".extract"+ Twine(i)); | 
|---|
| 5578 | IRCallArgs[FirstIRArg + i] = Extract; | 
|---|
| 5579 | } | 
|---|
| 5580 | } else { | 
|---|
| 5581 | uint64_t SrcSize = SrcTypeSize.getFixedValue(); | 
|---|
| 5582 | uint64_t DstSize = DstTypeSize.getFixedValue(); | 
|---|
| 5583 |  | 
|---|
| 5584 | // If the source type is smaller than the destination type of the | 
|---|
| 5585 | // coerce-to logic, copy the source value into a temp alloca the size | 
|---|
| 5586 | // of the destination type to allow loading all of it. The bits past | 
|---|
| 5587 | // the source value are left undef. | 
|---|
| 5588 | if (SrcSize < DstSize) { | 
|---|
| 5589 | Address TempAlloca = CreateTempAlloca(Ty: STy, align: Src.getAlignment(), | 
|---|
| 5590 | Name: Src.getName() + ".coerce"); | 
|---|
| 5591 | Builder.CreateMemCpy(Dest: TempAlloca, Src, Size: SrcSize); | 
|---|
| 5592 | Src = TempAlloca; | 
|---|
| 5593 | } else { | 
|---|
| 5594 | Src = Src.withElementType(ElemTy: STy); | 
|---|
| 5595 | } | 
|---|
| 5596 |  | 
|---|
| 5597 | assert(NumIRArgs == STy->getNumElements()); | 
|---|
| 5598 | for (unsigned i = 0, e = STy->getNumElements(); i != e; ++i) { | 
|---|
| 5599 | Address EltPtr = Builder.CreateStructGEP(Addr: Src, Index: i); | 
|---|
| 5600 | llvm::Value *LI = Builder.CreateLoad(Addr: EltPtr); | 
|---|
| 5601 | if (ArgHasMaybeUndefAttr) | 
|---|
| 5602 | LI = Builder.CreateFreeze(V: LI); | 
|---|
| 5603 | IRCallArgs[FirstIRArg + i] = LI; | 
|---|
| 5604 | } | 
|---|
| 5605 | } | 
|---|
| 5606 | } else { | 
|---|
| 5607 | // In the simple case, just pass the coerced loaded value. | 
|---|
| 5608 | assert(NumIRArgs == 1); | 
|---|
| 5609 | llvm::Value *Load = | 
|---|
| 5610 | CreateCoercedLoad(Src, Ty: ArgInfo.getCoerceToType(), CGF&: *this); | 
|---|
| 5611 |  | 
|---|
| 5612 | if (CallInfo.isCmseNSCall()) { | 
|---|
| 5613 | // For certain parameter types, clear padding bits, as they may reveal | 
|---|
| 5614 | // sensitive information. | 
|---|
| 5615 | // Small struct/union types are passed as integer arrays. | 
|---|
| 5616 | auto *ATy = dyn_cast<llvm::ArrayType>(Val: Load->getType()); | 
|---|
| 5617 | if (ATy != nullptr && isa<RecordType>(Val: I->Ty.getCanonicalType())) | 
|---|
| 5618 | Load = EmitCMSEClearRecord(Src: Load, ATy, QTy: I->Ty); | 
|---|
| 5619 | } | 
|---|
| 5620 |  | 
|---|
| 5621 | if (ArgHasMaybeUndefAttr) | 
|---|
| 5622 | Load = Builder.CreateFreeze(V: Load); | 
|---|
| 5623 | IRCallArgs[FirstIRArg] = Load; | 
|---|
| 5624 | } | 
|---|
| 5625 |  | 
|---|
| 5626 | break; | 
|---|
| 5627 | } | 
|---|
| 5628 |  | 
|---|
| 5629 | case ABIArgInfo::CoerceAndExpand: { | 
|---|
| 5630 | auto coercionType = ArgInfo.getCoerceAndExpandType(); | 
|---|
| 5631 | auto layout = CGM.getDataLayout().getStructLayout(Ty: coercionType); | 
|---|
| 5632 | auto unpaddedCoercionType = ArgInfo.getUnpaddedCoerceAndExpandType(); | 
|---|
| 5633 | auto *unpaddedStruct = dyn_cast<llvm::StructType>(Val: unpaddedCoercionType); | 
|---|
| 5634 |  | 
|---|
| 5635 | llvm::Value *tempSize = nullptr; | 
|---|
| 5636 | Address addr = Address::invalid(); | 
|---|
| 5637 | RawAddress AllocaAddr = RawAddress::invalid(); | 
|---|
| 5638 | if (I->isAggregate()) { | 
|---|
| 5639 | addr = I->hasLValue() ? I->getKnownLValue().getAddress() | 
|---|
| 5640 | : I->getKnownRValue().getAggregateAddress(); | 
|---|
| 5641 |  | 
|---|
| 5642 | } else { | 
|---|
| 5643 | RValue RV = I->getKnownRValue(); | 
|---|
| 5644 | assert(RV.isScalar()); // complex should always just be direct | 
|---|
| 5645 |  | 
|---|
| 5646 | llvm::Type *scalarType = RV.getScalarVal()->getType(); | 
|---|
| 5647 | auto scalarSize = CGM.getDataLayout().getTypeAllocSize(Ty: scalarType); | 
|---|
| 5648 | auto scalarAlign = CGM.getDataLayout().getPrefTypeAlign(Ty: scalarType); | 
|---|
| 5649 |  | 
|---|
| 5650 | // Materialize to a temporary. | 
|---|
| 5651 | addr = CreateTempAlloca(Ty: RV.getScalarVal()->getType(), | 
|---|
| 5652 | align: CharUnits::fromQuantity(Quantity: std::max( | 
|---|
| 5653 | a: layout->getAlignment(), b: scalarAlign)), | 
|---|
| 5654 | Name: "tmp", | 
|---|
| 5655 | /*ArraySize=*/nullptr, Alloca: &AllocaAddr); | 
|---|
| 5656 | tempSize = EmitLifetimeStart(Size: scalarSize, Addr: AllocaAddr.getPointer()); | 
|---|
| 5657 |  | 
|---|
| 5658 | Builder.CreateStore(Val: RV.getScalarVal(), Addr: addr); | 
|---|
| 5659 | } | 
|---|
| 5660 |  | 
|---|
| 5661 | addr = addr.withElementType(ElemTy: coercionType); | 
|---|
| 5662 |  | 
|---|
| 5663 | unsigned IRArgPos = FirstIRArg; | 
|---|
| 5664 | unsigned unpaddedIndex = 0; | 
|---|
| 5665 | for (unsigned i = 0, e = coercionType->getNumElements(); i != e; ++i) { | 
|---|
| 5666 | llvm::Type *eltType = coercionType->getElementType(N: i); | 
|---|
| 5667 | if (ABIArgInfo::isPaddingForCoerceAndExpand(eltType)) | 
|---|
| 5668 | continue; | 
|---|
| 5669 | Address eltAddr = Builder.CreateStructGEP(Addr: addr, Index: i); | 
|---|
| 5670 | llvm::Value *elt = CreateCoercedLoad( | 
|---|
| 5671 | Src: eltAddr, | 
|---|
| 5672 | Ty: unpaddedStruct ? unpaddedStruct->getElementType(N: unpaddedIndex++) | 
|---|
| 5673 | : unpaddedCoercionType, | 
|---|
| 5674 | CGF&: *this); | 
|---|
| 5675 | if (ArgHasMaybeUndefAttr) | 
|---|
| 5676 | elt = Builder.CreateFreeze(V: elt); | 
|---|
| 5677 | IRCallArgs[IRArgPos++] = elt; | 
|---|
| 5678 | } | 
|---|
| 5679 | assert(IRArgPos == FirstIRArg + NumIRArgs); | 
|---|
| 5680 |  | 
|---|
| 5681 | if (tempSize) { | 
|---|
| 5682 | EmitLifetimeEnd(Size: tempSize, Addr: AllocaAddr.getPointer()); | 
|---|
| 5683 | } | 
|---|
| 5684 |  | 
|---|
| 5685 | break; | 
|---|
| 5686 | } | 
|---|
| 5687 |  | 
|---|
| 5688 | case ABIArgInfo::Expand: { | 
|---|
| 5689 | unsigned IRArgPos = FirstIRArg; | 
|---|
| 5690 | ExpandTypeToArgs(Ty: I->Ty, Arg: *I, IRFuncTy, IRCallArgs, IRCallArgPos&: IRArgPos); | 
|---|
| 5691 | assert(IRArgPos == FirstIRArg + NumIRArgs); | 
|---|
| 5692 | break; | 
|---|
| 5693 | } | 
|---|
| 5694 | } | 
|---|
| 5695 | } | 
|---|
| 5696 |  | 
|---|
| 5697 | const CGCallee &ConcreteCallee = Callee.prepareConcreteCallee(CGF&: *this); | 
|---|
| 5698 | llvm::Value *CalleePtr = ConcreteCallee.getFunctionPointer(); | 
|---|
| 5699 |  | 
|---|
| 5700 | // If we're using inalloca, set up that argument. | 
|---|
| 5701 | if (ArgMemory.isValid()) { | 
|---|
| 5702 | llvm::Value *Arg = ArgMemory.getPointer(); | 
|---|
| 5703 | assert(IRFunctionArgs.hasInallocaArg()); | 
|---|
| 5704 | IRCallArgs[IRFunctionArgs.getInallocaArgNo()] = Arg; | 
|---|
| 5705 | } | 
|---|
| 5706 |  | 
|---|
| 5707 | // 2. Prepare the function pointer. | 
|---|
| 5708 |  | 
|---|
| 5709 | // If the callee is a bitcast of a non-variadic function to have a | 
|---|
| 5710 | // variadic function pointer type, check to see if we can remove the | 
|---|
| 5711 | // bitcast.  This comes up with unprototyped functions. | 
|---|
| 5712 | // | 
|---|
| 5713 | // This makes the IR nicer, but more importantly it ensures that we | 
|---|
| 5714 | // can inline the function at -O0 if it is marked always_inline. | 
|---|
| 5715 | auto simplifyVariadicCallee = [](llvm::FunctionType *CalleeFT, | 
|---|
| 5716 | llvm::Value *Ptr) -> llvm::Function * { | 
|---|
| 5717 | if (!CalleeFT->isVarArg()) | 
|---|
| 5718 | return nullptr; | 
|---|
| 5719 |  | 
|---|
| 5720 | // Get underlying value if it's a bitcast | 
|---|
| 5721 | if (llvm::ConstantExpr *CE = dyn_cast<llvm::ConstantExpr>(Val: Ptr)) { | 
|---|
| 5722 | if (CE->getOpcode() == llvm::Instruction::BitCast) | 
|---|
| 5723 | Ptr = CE->getOperand(i_nocapture: 0); | 
|---|
| 5724 | } | 
|---|
| 5725 |  | 
|---|
| 5726 | llvm::Function *OrigFn = dyn_cast<llvm::Function>(Val: Ptr); | 
|---|
| 5727 | if (!OrigFn) | 
|---|
| 5728 | return nullptr; | 
|---|
| 5729 |  | 
|---|
| 5730 | llvm::FunctionType *OrigFT = OrigFn->getFunctionType(); | 
|---|
| 5731 |  | 
|---|
| 5732 | // If the original type is variadic, or if any of the component types | 
|---|
| 5733 | // disagree, we cannot remove the cast. | 
|---|
| 5734 | if (OrigFT->isVarArg() || | 
|---|
| 5735 | OrigFT->getNumParams() != CalleeFT->getNumParams() || | 
|---|
| 5736 | OrigFT->getReturnType() != CalleeFT->getReturnType()) | 
|---|
| 5737 | return nullptr; | 
|---|
| 5738 |  | 
|---|
| 5739 | for (unsigned i = 0, e = OrigFT->getNumParams(); i != e; ++i) | 
|---|
| 5740 | if (OrigFT->getParamType(i) != CalleeFT->getParamType(i)) | 
|---|
| 5741 | return nullptr; | 
|---|
| 5742 |  | 
|---|
| 5743 | return OrigFn; | 
|---|
| 5744 | }; | 
|---|
| 5745 |  | 
|---|
| 5746 | if (llvm::Function *OrigFn = simplifyVariadicCallee(IRFuncTy, CalleePtr)) { | 
|---|
| 5747 | CalleePtr = OrigFn; | 
|---|
| 5748 | IRFuncTy = OrigFn->getFunctionType(); | 
|---|
| 5749 | } | 
|---|
| 5750 |  | 
|---|
| 5751 | // 3. Perform the actual call. | 
|---|
| 5752 |  | 
|---|
| 5753 | // Deactivate any cleanups that we're supposed to do immediately before | 
|---|
| 5754 | // the call. | 
|---|
| 5755 | if (!CallArgs.getCleanupsToDeactivate().empty()) | 
|---|
| 5756 | deactivateArgCleanupsBeforeCall(CGF&: *this, CallArgs); | 
|---|
| 5757 |  | 
|---|
| 5758 | // Update the largest vector width if any arguments have vector types. | 
|---|
| 5759 | for (unsigned i = 0; i < IRCallArgs.size(); ++i) | 
|---|
| 5760 | LargestVectorWidth = std::max(a: LargestVectorWidth, | 
|---|
| 5761 | b: getMaxVectorWidth(Ty: IRCallArgs[i]->getType())); | 
|---|
| 5762 |  | 
|---|
| 5763 | // Compute the calling convention and attributes. | 
|---|
| 5764 | unsigned CallingConv; | 
|---|
| 5765 | llvm::AttributeList Attrs; | 
|---|
| 5766 | CGM.ConstructAttributeList(Name: CalleePtr->getName(), FI: CallInfo, | 
|---|
| 5767 | CalleeInfo: Callee.getAbstractInfo(), AttrList&: Attrs, CallingConv, | 
|---|
| 5768 | /*AttrOnCallSite=*/true, | 
|---|
| 5769 | /*IsThunk=*/false); | 
|---|
| 5770 |  | 
|---|
| 5771 | if (CallingConv == llvm::CallingConv::X86_VectorCall && | 
|---|
| 5772 | getTarget().getTriple().isWindowsArm64EC()) { | 
|---|
| 5773 | CGM.Error(loc: Loc, error: "__vectorcall calling convention is not currently " | 
|---|
| 5774 | "supported"); | 
|---|
| 5775 | } | 
|---|
| 5776 |  | 
|---|
| 5777 | if (const FunctionDecl *FD = dyn_cast_or_null<FunctionDecl>(Val: CurFuncDecl)) { | 
|---|
| 5778 | if (FD->hasAttr<StrictFPAttr>()) | 
|---|
| 5779 | // All calls within a strictfp function are marked strictfp | 
|---|
| 5780 | Attrs = Attrs.addFnAttribute(C&: getLLVMContext(), Kind: llvm::Attribute::StrictFP); | 
|---|
| 5781 |  | 
|---|
| 5782 | // If -ffast-math is enabled and the function is guarded by an | 
|---|
| 5783 | // '__attribute__((optnone))', adjust the memory attribute so the BE emits the | 
|---|
| 5784 | // library call instead of the intrinsic. | 
|---|
| 5785 | if (FD->hasAttr<OptimizeNoneAttr>() && getLangOpts().FastMath) | 
|---|
| 5786 | CGM.AdjustMemoryAttribute(Name: CalleePtr->getName(), CalleeInfo: Callee.getAbstractInfo(), | 
|---|
| 5787 | Attrs); | 
|---|
| 5788 | } | 
|---|
| 5789 | // Add call-site nomerge attribute if exists. | 
|---|
| 5790 | if (InNoMergeAttributedStmt) | 
|---|
| 5791 | Attrs = Attrs.addFnAttribute(C&: getLLVMContext(), Kind: llvm::Attribute::NoMerge); | 
|---|
| 5792 |  | 
|---|
| 5793 | // Add call-site noinline attribute if exists. | 
|---|
| 5794 | if (InNoInlineAttributedStmt) | 
|---|
| 5795 | Attrs = Attrs.addFnAttribute(C&: getLLVMContext(), Kind: llvm::Attribute::NoInline); | 
|---|
| 5796 |  | 
|---|
| 5797 | // Add call-site always_inline attribute if exists. | 
|---|
| 5798 | // Note: This corresponds to the [[clang::always_inline]] statement attribute. | 
|---|
| 5799 | if (InAlwaysInlineAttributedStmt && | 
|---|
| 5800 | !CGM.getTargetCodeGenInfo().wouldInliningViolateFunctionCallABI( | 
|---|
| 5801 | Caller: CallerDecl, Callee: CalleeDecl)) | 
|---|
| 5802 | Attrs = | 
|---|
| 5803 | Attrs.addFnAttribute(C&: getLLVMContext(), Kind: llvm::Attribute::AlwaysInline); | 
|---|
| 5804 |  | 
|---|
| 5805 | // Remove call-site convergent attribute if requested. | 
|---|
| 5806 | if (InNoConvergentAttributedStmt) | 
|---|
| 5807 | Attrs = | 
|---|
| 5808 | Attrs.removeFnAttribute(C&: getLLVMContext(), Kind: llvm::Attribute::Convergent); | 
|---|
| 5809 |  | 
|---|
| 5810 | // Apply some call-site-specific attributes. | 
|---|
| 5811 | // TODO: work this into building the attribute set. | 
|---|
| 5812 |  | 
|---|
| 5813 | // Apply always_inline to all calls within flatten functions. | 
|---|
| 5814 | // FIXME: should this really take priority over __try, below? | 
|---|
| 5815 | if (CurCodeDecl && CurCodeDecl->hasAttr<FlattenAttr>() && | 
|---|
| 5816 | !InNoInlineAttributedStmt && | 
|---|
| 5817 | !(TargetDecl && TargetDecl->hasAttr<NoInlineAttr>()) && | 
|---|
| 5818 | !CGM.getTargetCodeGenInfo().wouldInliningViolateFunctionCallABI( | 
|---|
| 5819 | Caller: CallerDecl, Callee: CalleeDecl)) { | 
|---|
| 5820 | Attrs = | 
|---|
| 5821 | Attrs.addFnAttribute(C&: getLLVMContext(), Kind: llvm::Attribute::AlwaysInline); | 
|---|
| 5822 | } | 
|---|
| 5823 |  | 
|---|
| 5824 | // Disable inlining inside SEH __try blocks. | 
|---|
| 5825 | if (isSEHTryScope()) { | 
|---|
| 5826 | Attrs = Attrs.addFnAttribute(C&: getLLVMContext(), Kind: llvm::Attribute::NoInline); | 
|---|
| 5827 | } | 
|---|
| 5828 |  | 
|---|
| 5829 | // Decide whether to use a call or an invoke. | 
|---|
| 5830 | bool CannotThrow; | 
|---|
| 5831 | if (currentFunctionUsesSEHTry()) { | 
|---|
| 5832 | // SEH cares about asynchronous exceptions, so everything can "throw." | 
|---|
| 5833 | CannotThrow = false; | 
|---|
| 5834 | } else if (isCleanupPadScope() && | 
|---|
| 5835 | EHPersonality::get(CGF&: *this).isMSVCXXPersonality()) { | 
|---|
| 5836 | // The MSVC++ personality will implicitly terminate the program if an | 
|---|
| 5837 | // exception is thrown during a cleanup outside of a try/catch. | 
|---|
| 5838 | // We don't need to model anything in IR to get this behavior. | 
|---|
| 5839 | CannotThrow = true; | 
|---|
| 5840 | } else { | 
|---|
| 5841 | // Otherwise, nounwind call sites will never throw. | 
|---|
| 5842 | CannotThrow = Attrs.hasFnAttr(Kind: llvm::Attribute::NoUnwind); | 
|---|
| 5843 |  | 
|---|
| 5844 | if (auto *FPtr = dyn_cast<llvm::Function>(Val: CalleePtr)) | 
|---|
| 5845 | if (FPtr->hasFnAttribute(Kind: llvm::Attribute::NoUnwind)) | 
|---|
| 5846 | CannotThrow = true; | 
|---|
| 5847 | } | 
|---|
| 5848 |  | 
|---|
| 5849 | // If we made a temporary, be sure to clean up after ourselves. Note that we | 
|---|
| 5850 | // can't depend on being inside of an ExprWithCleanups, so we need to manually | 
|---|
| 5851 | // pop this cleanup later on. Being eager about this is OK, since this | 
|---|
| 5852 | // temporary is 'invisible' outside of the callee. | 
|---|
| 5853 | if (UnusedReturnSizePtr) | 
|---|
| 5854 | pushFullExprCleanup<CallLifetimeEnd>(kind: NormalEHLifetimeMarker, A: SRetPtr, | 
|---|
| 5855 | A: UnusedReturnSizePtr); | 
|---|
| 5856 |  | 
|---|
| 5857 | llvm::BasicBlock *InvokeDest = CannotThrow ? nullptr : getInvokeDest(); | 
|---|
| 5858 |  | 
|---|
| 5859 | SmallVector<llvm::OperandBundleDef, 1> BundleList = | 
|---|
| 5860 | getBundlesForFunclet(Callee: CalleePtr); | 
|---|
| 5861 |  | 
|---|
| 5862 | if (SanOpts.has(K: SanitizerKind::KCFI) && | 
|---|
| 5863 | !isa_and_nonnull<FunctionDecl>(Val: TargetDecl)) | 
|---|
| 5864 | EmitKCFIOperandBundle(Callee: ConcreteCallee, Bundles&: BundleList); | 
|---|
| 5865 |  | 
|---|
| 5866 | // Add the pointer-authentication bundle. | 
|---|
| 5867 | EmitPointerAuthOperandBundle(Info: ConcreteCallee.getPointerAuthInfo(), Bundles&: BundleList); | 
|---|
| 5868 |  | 
|---|
| 5869 | if (const FunctionDecl *FD = dyn_cast_or_null<FunctionDecl>(Val: CurFuncDecl)) | 
|---|
| 5870 | if (FD->hasAttr<StrictFPAttr>()) | 
|---|
| 5871 | // All calls within a strictfp function are marked strictfp | 
|---|
| 5872 | Attrs = Attrs.addFnAttribute(C&: getLLVMContext(), Kind: llvm::Attribute::StrictFP); | 
|---|
| 5873 |  | 
|---|
| 5874 | AssumeAlignedAttrEmitter AssumeAlignedAttrEmitter(*this, TargetDecl); | 
|---|
| 5875 | Attrs = AssumeAlignedAttrEmitter.TryEmitAsCallSiteAttribute(Attrs); | 
|---|
| 5876 |  | 
|---|
| 5877 | AllocAlignAttrEmitter AllocAlignAttrEmitter(*this, TargetDecl, CallArgs); | 
|---|
| 5878 | Attrs = AllocAlignAttrEmitter.TryEmitAsCallSiteAttribute(Attrs); | 
|---|
| 5879 |  | 
|---|
| 5880 | // Emit the actual call/invoke instruction. | 
|---|
| 5881 | llvm::CallBase *CI; | 
|---|
| 5882 | if (!InvokeDest) { | 
|---|
| 5883 | CI = Builder.CreateCall(FTy: IRFuncTy, Callee: CalleePtr, Args: IRCallArgs, OpBundles: BundleList); | 
|---|
| 5884 | } else { | 
|---|
| 5885 | llvm::BasicBlock *Cont = createBasicBlock(name: "invoke.cont"); | 
|---|
| 5886 | CI = Builder.CreateInvoke(Ty: IRFuncTy, Callee: CalleePtr, NormalDest: Cont, UnwindDest: InvokeDest, Args: IRCallArgs, | 
|---|
| 5887 | OpBundles: BundleList); | 
|---|
| 5888 | EmitBlock(BB: Cont); | 
|---|
| 5889 | } | 
|---|
| 5890 | if (CI->getCalledFunction() && CI->getCalledFunction()->hasName() && | 
|---|
| 5891 | CI->getCalledFunction()->getName().starts_with(Prefix: "_Z4sqrt")) { | 
|---|
| 5892 | SetSqrtFPAccuracy(CI); | 
|---|
| 5893 | } | 
|---|
| 5894 | if (callOrInvoke) | 
|---|
| 5895 | *callOrInvoke = CI; | 
|---|
| 5896 |  | 
|---|
| 5897 | // If this is within a function that has the guard(nocf) attribute and is an | 
|---|
| 5898 | // indirect call, add the "guard_nocf" attribute to this call to indicate that | 
|---|
| 5899 | // Control Flow Guard checks should not be added, even if the call is inlined. | 
|---|
| 5900 | if (const auto *FD = dyn_cast_or_null<FunctionDecl>(Val: CurFuncDecl)) { | 
|---|
| 5901 | if (const auto *A = FD->getAttr<CFGuardAttr>()) { | 
|---|
| 5902 | if (A->getGuard() == CFGuardAttr::GuardArg::nocf && | 
|---|
| 5903 | !CI->getCalledFunction()) | 
|---|
| 5904 | Attrs = Attrs.addFnAttribute(C&: getLLVMContext(), Kind: "guard_nocf"); | 
|---|
| 5905 | } | 
|---|
| 5906 | } | 
|---|
| 5907 |  | 
|---|
| 5908 | // Apply the attributes and calling convention. | 
|---|
| 5909 | CI->setAttributes(Attrs); | 
|---|
| 5910 | CI->setCallingConv(static_cast<llvm::CallingConv::ID>(CallingConv)); | 
|---|
| 5911 |  | 
|---|
| 5912 | // Apply various metadata. | 
|---|
| 5913 |  | 
|---|
| 5914 | if (!CI->getType()->isVoidTy()) | 
|---|
| 5915 | CI->setName( "call"); | 
|---|
| 5916 |  | 
|---|
| 5917 | if (CGM.shouldEmitConvergenceTokens() && CI->isConvergent()) | 
|---|
| 5918 | CI = addConvergenceControlToken(Input: CI); | 
|---|
| 5919 |  | 
|---|
| 5920 | // Update largest vector width from the return type. | 
|---|
| 5921 | LargestVectorWidth = | 
|---|
| 5922 | std::max(a: LargestVectorWidth, b: getMaxVectorWidth(Ty: CI->getType())); | 
|---|
| 5923 |  | 
|---|
| 5924 | // Insert instrumentation or attach profile metadata at indirect call sites. | 
|---|
| 5925 | // For more details, see the comment before the definition of | 
|---|
| 5926 | // IPVK_IndirectCallTarget in InstrProfData.inc. | 
|---|
| 5927 | if (!CI->getCalledFunction()) | 
|---|
| 5928 | PGO->valueProfile(Builder, ValueKind: llvm::IPVK_IndirectCallTarget, ValueSite: CI, ValuePtr: CalleePtr); | 
|---|
| 5929 |  | 
|---|
| 5930 | // In ObjC ARC mode with no ObjC ARC exception safety, tell the ARC | 
|---|
| 5931 | // optimizer it can aggressively ignore unwind edges. | 
|---|
| 5932 | if (CGM.getLangOpts().ObjCAutoRefCount) | 
|---|
| 5933 | AddObjCARCExceptionMetadata(Inst: CI); | 
|---|
| 5934 |  | 
|---|
| 5935 | // Set tail call kind if necessary. | 
|---|
| 5936 | if (llvm::CallInst *Call = dyn_cast<llvm::CallInst>(Val: CI)) { | 
|---|
| 5937 | if (TargetDecl && TargetDecl->hasAttr<NotTailCalledAttr>()) | 
|---|
| 5938 | Call->setTailCallKind(llvm::CallInst::TCK_NoTail); | 
|---|
| 5939 | else if (IsMustTail) { | 
|---|
| 5940 | if (getTarget().getTriple().isPPC()) { | 
|---|
| 5941 | if (getTarget().getTriple().isOSAIX()) | 
|---|
| 5942 | CGM.getDiags().Report(Loc, DiagID: diag::err_aix_musttail_unsupported); | 
|---|
| 5943 | else if (!getTarget().hasFeature(Feature: "pcrelative-memops")) { | 
|---|
| 5944 | if (getTarget().hasFeature(Feature: "longcall")) | 
|---|
| 5945 | CGM.getDiags().Report(Loc, DiagID: diag::err_ppc_impossible_musttail) << 0; | 
|---|
| 5946 | else if (Call->isIndirectCall()) | 
|---|
| 5947 | CGM.getDiags().Report(Loc, DiagID: diag::err_ppc_impossible_musttail) << 1; | 
|---|
| 5948 | else if (isa_and_nonnull<FunctionDecl>(Val: TargetDecl)) { | 
|---|
| 5949 | if (!cast<FunctionDecl>(Val: TargetDecl)->isDefined()) | 
|---|
| 5950 | // The undefined callee may be a forward declaration. Without | 
|---|
| 5951 | // knowing all symbols in the module, we won't know the symbol is | 
|---|
| 5952 | // defined or not. Collect all these symbols for later diagnosing. | 
|---|
| 5953 | CGM.addUndefinedGlobalForTailCall( | 
|---|
| 5954 | Global: {cast<FunctionDecl>(Val: TargetDecl), Loc}); | 
|---|
| 5955 | else { | 
|---|
| 5956 | llvm::GlobalValue::LinkageTypes Linkage = CGM.getFunctionLinkage( | 
|---|
| 5957 | GD: GlobalDecl(cast<FunctionDecl>(Val: TargetDecl))); | 
|---|
| 5958 | if (llvm::GlobalValue::isWeakForLinker(Linkage) || | 
|---|
| 5959 | llvm::GlobalValue::isDiscardableIfUnused(Linkage)) | 
|---|
| 5960 | CGM.getDiags().Report(Loc, DiagID: diag::err_ppc_impossible_musttail) | 
|---|
| 5961 | << 2; | 
|---|
| 5962 | } | 
|---|
| 5963 | } | 
|---|
| 5964 | } | 
|---|
| 5965 | } | 
|---|
| 5966 | Call->setTailCallKind(llvm::CallInst::TCK_MustTail); | 
|---|
| 5967 | } | 
|---|
| 5968 | } | 
|---|
| 5969 |  | 
|---|
| 5970 | // Add metadata for calls to MSAllocator functions | 
|---|
| 5971 | if (getDebugInfo() && TargetDecl && TargetDecl->hasAttr<MSAllocatorAttr>()) | 
|---|
| 5972 | getDebugInfo()->addHeapAllocSiteMetadata(CallSite: CI, AllocatedTy: RetTy->getPointeeType(), Loc); | 
|---|
| 5973 |  | 
|---|
| 5974 | // Add metadata if calling an __attribute__((error(""))) or warning fn. | 
|---|
| 5975 | if (TargetDecl && TargetDecl->hasAttr<ErrorAttr>()) { | 
|---|
| 5976 | llvm::ConstantInt *Line = | 
|---|
| 5977 | llvm::ConstantInt::get(Ty: Int64Ty, V: Loc.getRawEncoding()); | 
|---|
| 5978 | llvm::ConstantAsMetadata *MD = llvm::ConstantAsMetadata::get(C: Line); | 
|---|
| 5979 | llvm::MDTuple *MDT = llvm::MDNode::get(Context&: getLLVMContext(), MDs: {MD}); | 
|---|
| 5980 | CI->setMetadata(Kind: "srcloc", Node: MDT); | 
|---|
| 5981 | } | 
|---|
| 5982 |  | 
|---|
| 5983 | // 4. Finish the call. | 
|---|
| 5984 |  | 
|---|
| 5985 | // If the call doesn't return, finish the basic block and clear the | 
|---|
| 5986 | // insertion point; this allows the rest of IRGen to discard | 
|---|
| 5987 | // unreachable code. | 
|---|
| 5988 | if (CI->doesNotReturn()) { | 
|---|
| 5989 | if (UnusedReturnSizePtr) | 
|---|
| 5990 | PopCleanupBlock(); | 
|---|
| 5991 |  | 
|---|
| 5992 | // Strip away the noreturn attribute to better diagnose unreachable UB. | 
|---|
| 5993 | if (SanOpts.has(K: SanitizerKind::Unreachable)) { | 
|---|
| 5994 | // Also remove from function since CallBase::hasFnAttr additionally checks | 
|---|
| 5995 | // attributes of the called function. | 
|---|
| 5996 | if (auto *F = CI->getCalledFunction()) | 
|---|
| 5997 | F->removeFnAttr(Kind: llvm::Attribute::NoReturn); | 
|---|
| 5998 | CI->removeFnAttr(Kind: llvm::Attribute::NoReturn); | 
|---|
| 5999 |  | 
|---|
| 6000 | // Avoid incompatibility with ASan which relies on the `noreturn` | 
|---|
| 6001 | // attribute to insert handler calls. | 
|---|
| 6002 | if (SanOpts.hasOneOf(K: SanitizerKind::Address | | 
|---|
| 6003 | SanitizerKind::KernelAddress)) { | 
|---|
| 6004 | SanitizerScope SanScope(this); | 
|---|
| 6005 | llvm::IRBuilder<>::InsertPointGuard IPGuard(Builder); | 
|---|
| 6006 | Builder.SetInsertPoint(CI); | 
|---|
| 6007 | auto *FnType = llvm::FunctionType::get(Result: CGM.VoidTy, /*isVarArg=*/false); | 
|---|
| 6008 | llvm::FunctionCallee Fn = | 
|---|
| 6009 | CGM.CreateRuntimeFunction(Ty: FnType, Name: "__asan_handle_no_return"); | 
|---|
| 6010 | EmitNounwindRuntimeCall(callee: Fn); | 
|---|
| 6011 | } | 
|---|
| 6012 | } | 
|---|
| 6013 |  | 
|---|
| 6014 | EmitUnreachable(Loc); | 
|---|
| 6015 | Builder.ClearInsertionPoint(); | 
|---|
| 6016 |  | 
|---|
| 6017 | // FIXME: For now, emit a dummy basic block because expr emitters in | 
|---|
| 6018 | // general are not ready to handle emitting expressions at unreachable | 
|---|
| 6019 | // points. | 
|---|
| 6020 | EnsureInsertPoint(); | 
|---|
| 6021 |  | 
|---|
| 6022 | // Return a reasonable RValue. | 
|---|
| 6023 | return GetUndefRValue(Ty: RetTy); | 
|---|
| 6024 | } | 
|---|
| 6025 |  | 
|---|
| 6026 | // If this is a musttail call, return immediately. We do not branch to the | 
|---|
| 6027 | // epilogue in this case. | 
|---|
| 6028 | if (IsMustTail) { | 
|---|
| 6029 | for (auto it = EHStack.find(sp: CurrentCleanupScopeDepth); it != EHStack.end(); | 
|---|
| 6030 | ++it) { | 
|---|
| 6031 | EHCleanupScope *Cleanup = dyn_cast<EHCleanupScope>(Val: &*it); | 
|---|
| 6032 | // Fake uses can be safely emitted immediately prior to the tail call, so | 
|---|
| 6033 | // we choose to emit them just before the call here. | 
|---|
| 6034 | if (Cleanup && Cleanup->isFakeUse()) { | 
|---|
| 6035 | CGBuilderTy::InsertPointGuard IPG(Builder); | 
|---|
| 6036 | Builder.SetInsertPoint(CI); | 
|---|
| 6037 | Cleanup->getCleanup()->Emit(CGF&: *this, flags: EHScopeStack::Cleanup::Flags()); | 
|---|
| 6038 | } else if (!(Cleanup && | 
|---|
| 6039 | Cleanup->getCleanup()->isRedundantBeforeReturn())) { | 
|---|
| 6040 | CGM.ErrorUnsupported(S: MustTailCall, Type: "tail call skipping over cleanups"); | 
|---|
| 6041 | } | 
|---|
| 6042 | } | 
|---|
| 6043 | if (CI->getType()->isVoidTy()) | 
|---|
| 6044 | Builder.CreateRetVoid(); | 
|---|
| 6045 | else | 
|---|
| 6046 | Builder.CreateRet(V: CI); | 
|---|
| 6047 | Builder.ClearInsertionPoint(); | 
|---|
| 6048 | EnsureInsertPoint(); | 
|---|
| 6049 | return GetUndefRValue(Ty: RetTy); | 
|---|
| 6050 | } | 
|---|
| 6051 |  | 
|---|
| 6052 | // Perform the swifterror writeback. | 
|---|
| 6053 | if (swiftErrorTemp.isValid()) { | 
|---|
| 6054 | llvm::Value *errorResult = Builder.CreateLoad(Addr: swiftErrorTemp); | 
|---|
| 6055 | Builder.CreateStore(Val: errorResult, Addr: swiftErrorArg); | 
|---|
| 6056 | } | 
|---|
| 6057 |  | 
|---|
| 6058 | // Emit any call-associated writebacks immediately.  Arguably this | 
|---|
| 6059 | // should happen after any return-value munging. | 
|---|
| 6060 | if (CallArgs.hasWritebacks()) | 
|---|
| 6061 | EmitWritebacks(args: CallArgs); | 
|---|
| 6062 |  | 
|---|
| 6063 | // The stack cleanup for inalloca arguments has to run out of the normal | 
|---|
| 6064 | // lexical order, so deactivate it and run it manually here. | 
|---|
| 6065 | CallArgs.freeArgumentMemory(CGF&: *this); | 
|---|
| 6066 |  | 
|---|
| 6067 | // Extract the return value. | 
|---|
| 6068 | RValue Ret; | 
|---|
| 6069 |  | 
|---|
| 6070 | // If the current function is a virtual function pointer thunk, avoid copying | 
|---|
| 6071 | // the return value of the musttail call to a temporary. | 
|---|
| 6072 | if (IsVirtualFunctionPointerThunk) { | 
|---|
| 6073 | Ret = RValue::get(V: CI); | 
|---|
| 6074 | } else { | 
|---|
| 6075 | Ret = [&] { | 
|---|
| 6076 | switch (RetAI.getKind()) { | 
|---|
| 6077 | case ABIArgInfo::CoerceAndExpand: { | 
|---|
| 6078 | auto coercionType = RetAI.getCoerceAndExpandType(); | 
|---|
| 6079 |  | 
|---|
| 6080 | Address addr = SRetPtr.withElementType(ElemTy: coercionType); | 
|---|
| 6081 |  | 
|---|
| 6082 | assert(CI->getType() == RetAI.getUnpaddedCoerceAndExpandType()); | 
|---|
| 6083 | bool  = isa<llvm::StructType>(Val: CI->getType()); | 
|---|
| 6084 |  | 
|---|
| 6085 | unsigned unpaddedIndex = 0; | 
|---|
| 6086 | for (unsigned i = 0, e = coercionType->getNumElements(); i != e; ++i) { | 
|---|
| 6087 | llvm::Type *eltType = coercionType->getElementType(N: i); | 
|---|
| 6088 | if (ABIArgInfo::isPaddingForCoerceAndExpand(eltType)) | 
|---|
| 6089 | continue; | 
|---|
| 6090 | Address eltAddr = Builder.CreateStructGEP(Addr: addr, Index: i); | 
|---|
| 6091 | llvm::Value *elt = CI; | 
|---|
| 6092 | if (requiresExtract) | 
|---|
| 6093 | elt = Builder.CreateExtractValue(Agg: elt, Idxs: unpaddedIndex++); | 
|---|
| 6094 | else | 
|---|
| 6095 | assert(unpaddedIndex == 0); | 
|---|
| 6096 | Builder.CreateStore(Val: elt, Addr: eltAddr); | 
|---|
| 6097 | } | 
|---|
| 6098 | [[fallthrough]]; | 
|---|
| 6099 | } | 
|---|
| 6100 |  | 
|---|
| 6101 | case ABIArgInfo::InAlloca: | 
|---|
| 6102 | case ABIArgInfo::Indirect: { | 
|---|
| 6103 | RValue ret = convertTempToRValue(addr: SRetPtr, type: RetTy, Loc: SourceLocation()); | 
|---|
| 6104 | if (UnusedReturnSizePtr) | 
|---|
| 6105 | PopCleanupBlock(); | 
|---|
| 6106 | return ret; | 
|---|
| 6107 | } | 
|---|
| 6108 |  | 
|---|
| 6109 | case ABIArgInfo::Ignore: | 
|---|
| 6110 | // If we are ignoring an argument that had a result, make sure to | 
|---|
| 6111 | // construct the appropriate return value for our caller. | 
|---|
| 6112 | return GetUndefRValue(Ty: RetTy); | 
|---|
| 6113 |  | 
|---|
| 6114 | case ABIArgInfo::Extend: | 
|---|
| 6115 | case ABIArgInfo::Direct: { | 
|---|
| 6116 | llvm::Type *RetIRTy = ConvertType(T: RetTy); | 
|---|
| 6117 | if (RetAI.getCoerceToType() == RetIRTy && | 
|---|
| 6118 | RetAI.getDirectOffset() == 0) { | 
|---|
| 6119 | switch (getEvaluationKind(T: RetTy)) { | 
|---|
| 6120 | case TEK_Complex: { | 
|---|
| 6121 | llvm::Value *Real = Builder.CreateExtractValue(Agg: CI, Idxs: 0); | 
|---|
| 6122 | llvm::Value *Imag = Builder.CreateExtractValue(Agg: CI, Idxs: 1); | 
|---|
| 6123 | return RValue::getComplex(C: std::make_pair(x&: Real, y&: Imag)); | 
|---|
| 6124 | } | 
|---|
| 6125 | case TEK_Aggregate: | 
|---|
| 6126 | break; | 
|---|
| 6127 | case TEK_Scalar: { | 
|---|
| 6128 | // If the argument doesn't match, perform a bitcast to coerce it. | 
|---|
| 6129 | // This can happen due to trivial type mismatches. | 
|---|
| 6130 | llvm::Value *V = CI; | 
|---|
| 6131 | if (V->getType() != RetIRTy) | 
|---|
| 6132 | V = Builder.CreateBitCast(V, DestTy: RetIRTy); | 
|---|
| 6133 | return RValue::get(V); | 
|---|
| 6134 | } | 
|---|
| 6135 | } | 
|---|
| 6136 | } | 
|---|
| 6137 |  | 
|---|
| 6138 | // If coercing a fixed vector from a scalable vector for ABI | 
|---|
| 6139 | // compatibility, and the types match, use the llvm.vector.extract | 
|---|
| 6140 | // intrinsic to perform the conversion. | 
|---|
| 6141 | if (auto *FixedDstTy = dyn_cast<llvm::FixedVectorType>(Val: RetIRTy)) { | 
|---|
| 6142 | llvm::Value *V = CI; | 
|---|
| 6143 | if (auto *ScalableSrcTy = | 
|---|
| 6144 | dyn_cast<llvm::ScalableVectorType>(Val: V->getType())) { | 
|---|
| 6145 | if (FixedDstTy->getElementType() == | 
|---|
| 6146 | ScalableSrcTy->getElementType()) { | 
|---|
| 6147 | V = Builder.CreateExtractVector(DstType: FixedDstTy, SrcVec: V, Idx: uint64_t(0), | 
|---|
| 6148 | Name: "cast.fixed"); | 
|---|
| 6149 | return RValue::get(V); | 
|---|
| 6150 | } | 
|---|
| 6151 | } | 
|---|
| 6152 | } | 
|---|
| 6153 |  | 
|---|
| 6154 | Address DestPtr = ReturnValue.getValue(); | 
|---|
| 6155 | bool DestIsVolatile = ReturnValue.isVolatile(); | 
|---|
| 6156 | uint64_t DestSize = | 
|---|
| 6157 | getContext().getTypeInfoDataSizeInChars(T: RetTy).Width.getQuantity(); | 
|---|
| 6158 |  | 
|---|
| 6159 | if (!DestPtr.isValid()) { | 
|---|
| 6160 | DestPtr = CreateMemTemp(T: RetTy, Name: "coerce"); | 
|---|
| 6161 | DestIsVolatile = false; | 
|---|
| 6162 | DestSize = getContext().getTypeSizeInChars(T: RetTy).getQuantity(); | 
|---|
| 6163 | } | 
|---|
| 6164 |  | 
|---|
| 6165 | // An empty record can overlap other data (if declared with | 
|---|
| 6166 | // no_unique_address); omit the store for such types - as there is no | 
|---|
| 6167 | // actual data to store. | 
|---|
| 6168 | if (!isEmptyRecord(Context&: getContext(), T: RetTy, AllowArrays: true)) { | 
|---|
| 6169 | // If the value is offset in memory, apply the offset now. | 
|---|
| 6170 | Address StorePtr = emitAddressAtOffset(CGF&: *this, addr: DestPtr, info: RetAI); | 
|---|
| 6171 | CreateCoercedStore( | 
|---|
| 6172 | Src: CI, Dst: StorePtr, | 
|---|
| 6173 | DstSize: llvm::TypeSize::getFixed(ExactSize: DestSize - RetAI.getDirectOffset()), | 
|---|
| 6174 | DstIsVolatile: DestIsVolatile); | 
|---|
| 6175 | } | 
|---|
| 6176 |  | 
|---|
| 6177 | return convertTempToRValue(addr: DestPtr, type: RetTy, Loc: SourceLocation()); | 
|---|
| 6178 | } | 
|---|
| 6179 |  | 
|---|
| 6180 | case ABIArgInfo::Expand: | 
|---|
| 6181 | case ABIArgInfo::IndirectAliased: | 
|---|
| 6182 | llvm_unreachable( "Invalid ABI kind for return argument"); | 
|---|
| 6183 | } | 
|---|
| 6184 |  | 
|---|
| 6185 | llvm_unreachable( "Unhandled ABIArgInfo::Kind"); | 
|---|
| 6186 | }(); | 
|---|
| 6187 | } | 
|---|
| 6188 |  | 
|---|
| 6189 | // Emit the assume_aligned check on the return value. | 
|---|
| 6190 | if (Ret.isScalar() && TargetDecl) { | 
|---|
| 6191 | AssumeAlignedAttrEmitter.EmitAsAnAssumption(Loc, RetTy, Ret); | 
|---|
| 6192 | AllocAlignAttrEmitter.EmitAsAnAssumption(Loc, RetTy, Ret); | 
|---|
| 6193 | } | 
|---|
| 6194 |  | 
|---|
| 6195 | // Explicitly call CallLifetimeEnd::Emit just to re-use the code even though | 
|---|
| 6196 | // we can't use the full cleanup mechanism. | 
|---|
| 6197 | for (CallLifetimeEnd &LifetimeEnd : CallLifetimeEndAfterCall) | 
|---|
| 6198 | LifetimeEnd.Emit(CGF&: *this, /*Flags=*/flags: {}); | 
|---|
| 6199 |  | 
|---|
| 6200 | if (!ReturnValue.isExternallyDestructed() && | 
|---|
| 6201 | RetTy.isDestructedType() == QualType::DK_nontrivial_c_struct) | 
|---|
| 6202 | pushDestroy(dtorKind: QualType::DK_nontrivial_c_struct, addr: Ret.getAggregateAddress(), | 
|---|
| 6203 | type: RetTy); | 
|---|
| 6204 |  | 
|---|
| 6205 | return Ret; | 
|---|
| 6206 | } | 
|---|
| 6207 |  | 
|---|
| 6208 | CGCallee CGCallee::prepareConcreteCallee(CodeGenFunction &CGF) const { | 
|---|
| 6209 | if (isVirtual()) { | 
|---|
| 6210 | const CallExpr *CE = getVirtualCallExpr(); | 
|---|
| 6211 | return CGF.CGM.getCXXABI().getVirtualFunctionPointer( | 
|---|
| 6212 | CGF, GD: getVirtualMethodDecl(), This: getThisAddress(), Ty: getVirtualFunctionType(), | 
|---|
| 6213 | Loc: CE ? CE->getBeginLoc() : SourceLocation()); | 
|---|
| 6214 | } | 
|---|
| 6215 |  | 
|---|
| 6216 | return *this; | 
|---|
| 6217 | } | 
|---|
| 6218 |  | 
|---|
| 6219 | /* VarArg handling */ | 
|---|
| 6220 |  | 
|---|
| 6221 | RValue CodeGenFunction::EmitVAArg(VAArgExpr *VE, Address &VAListAddr, | 
|---|
| 6222 | AggValueSlot Slot) { | 
|---|
| 6223 | VAListAddr = VE->isMicrosoftABI() ? EmitMSVAListRef(E: VE->getSubExpr()) | 
|---|
| 6224 | : EmitVAListRef(E: VE->getSubExpr()); | 
|---|
| 6225 | QualType Ty = VE->getType(); | 
|---|
| 6226 | if (Ty->isVariablyModifiedType()) | 
|---|
| 6227 | EmitVariablyModifiedType(Ty); | 
|---|
| 6228 | if (VE->isMicrosoftABI()) | 
|---|
| 6229 | return CGM.getABIInfo().EmitMSVAArg(CGF&: *this, VAListAddr, Ty, Slot); | 
|---|
| 6230 | return CGM.getABIInfo().EmitVAArg(CGF&: *this, VAListAddr, Ty, Slot); | 
|---|
| 6231 | } | 
|---|
| 6232 |  | 
|---|