| 1 | //===- AArch64.cpp --------------------------------------------------------===// | 
|---|
| 2 | // | 
|---|
| 3 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. | 
|---|
| 4 | // See https://llvm.org/LICENSE.txt for license information. | 
|---|
| 5 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception | 
|---|
| 6 | // | 
|---|
| 7 | //===----------------------------------------------------------------------===// | 
|---|
| 8 |  | 
|---|
| 9 | #include "ABIInfoImpl.h" | 
|---|
| 10 | #include "TargetInfo.h" | 
|---|
| 11 | #include "clang/AST/Decl.h" | 
|---|
| 12 | #include "clang/Basic/DiagnosticFrontend.h" | 
|---|
| 13 | #include "llvm/TargetParser/AArch64TargetParser.h" | 
|---|
| 14 |  | 
|---|
| 15 | using namespace clang; | 
|---|
| 16 | using namespace clang::CodeGen; | 
|---|
| 17 |  | 
|---|
| 18 | //===----------------------------------------------------------------------===// | 
|---|
| 19 | // AArch64 ABI Implementation | 
|---|
| 20 | //===----------------------------------------------------------------------===// | 
|---|
| 21 |  | 
|---|
| 22 | namespace { | 
|---|
| 23 |  | 
|---|
| 24 | class AArch64ABIInfo : public ABIInfo { | 
|---|
| 25 | AArch64ABIKind Kind; | 
|---|
| 26 |  | 
|---|
| 27 | public: | 
|---|
| 28 | AArch64ABIInfo(CodeGenTypes &CGT, AArch64ABIKind Kind) | 
|---|
| 29 | : ABIInfo(CGT), Kind(Kind) {} | 
|---|
| 30 |  | 
|---|
| 31 | bool isSoftFloat() const { return Kind == AArch64ABIKind::AAPCSSoft; } | 
|---|
| 32 |  | 
|---|
| 33 | private: | 
|---|
| 34 | AArch64ABIKind getABIKind() const { return Kind; } | 
|---|
| 35 | bool isDarwinPCS() const { return Kind == AArch64ABIKind::DarwinPCS; } | 
|---|
| 36 |  | 
|---|
| 37 | ABIArgInfo classifyReturnType(QualType RetTy, bool IsVariadicFn) const; | 
|---|
| 38 | ABIArgInfo classifyArgumentType(QualType RetTy, bool IsVariadicFn, | 
|---|
| 39 | bool IsNamedArg, unsigned CallingConvention, | 
|---|
| 40 | unsigned &NSRN, unsigned &NPRN) const; | 
|---|
| 41 | llvm::Type *convertFixedToScalableVectorType(const VectorType *VT) const; | 
|---|
| 42 | ABIArgInfo coerceIllegalVector(QualType Ty, unsigned &NSRN, | 
|---|
| 43 | unsigned &NPRN) const; | 
|---|
| 44 | ABIArgInfo coerceAndExpandPureScalableAggregate( | 
|---|
| 45 | QualType Ty, bool IsNamedArg, unsigned NVec, unsigned NPred, | 
|---|
| 46 | const SmallVectorImpl<llvm::Type *> &UnpaddedCoerceToSeq, unsigned &NSRN, | 
|---|
| 47 | unsigned &NPRN) const; | 
|---|
| 48 | bool isHomogeneousAggregateBaseType(QualType Ty) const override; | 
|---|
| 49 | bool isHomogeneousAggregateSmallEnough(const Type *Ty, | 
|---|
| 50 | uint64_t Members) const override; | 
|---|
| 51 | bool isZeroLengthBitfieldPermittedInHomogeneousAggregate() const override; | 
|---|
| 52 |  | 
|---|
| 53 | bool isIllegalVectorType(QualType Ty) const; | 
|---|
| 54 |  | 
|---|
| 55 | bool passAsAggregateType(QualType Ty) const; | 
|---|
| 56 | bool passAsPureScalableType(QualType Ty, unsigned &NV, unsigned &NP, | 
|---|
| 57 | SmallVectorImpl<llvm::Type *> &CoerceToSeq) const; | 
|---|
| 58 |  | 
|---|
| 59 | void flattenType(llvm::Type *Ty, | 
|---|
| 60 | SmallVectorImpl<llvm::Type *> &Flattened) const; | 
|---|
| 61 |  | 
|---|
| 62 | void computeInfo(CGFunctionInfo &FI) const override { | 
|---|
| 63 | if (!::classifyReturnType(CXXABI: getCXXABI(), FI, Info: *this)) | 
|---|
| 64 | FI.getReturnInfo() = | 
|---|
| 65 | classifyReturnType(RetTy: FI.getReturnType(), IsVariadicFn: FI.isVariadic()); | 
|---|
| 66 |  | 
|---|
| 67 | unsigned ArgNo = 0; | 
|---|
| 68 | unsigned NSRN = 0, NPRN = 0; | 
|---|
| 69 | for (auto &it : FI.arguments()) { | 
|---|
| 70 | const bool IsNamedArg = | 
|---|
| 71 | !FI.isVariadic() || ArgNo < FI.getRequiredArgs().getNumRequiredArgs(); | 
|---|
| 72 | ++ArgNo; | 
|---|
| 73 | it.info = classifyArgumentType(RetTy: it.type, IsVariadicFn: FI.isVariadic(), IsNamedArg, | 
|---|
| 74 | CallingConvention: FI.getCallingConvention(), NSRN, NPRN); | 
|---|
| 75 | } | 
|---|
| 76 | } | 
|---|
| 77 |  | 
|---|
| 78 | RValue EmitDarwinVAArg(Address VAListAddr, QualType Ty, CodeGenFunction &CGF, | 
|---|
| 79 | AggValueSlot Slot) const; | 
|---|
| 80 |  | 
|---|
| 81 | RValue EmitAAPCSVAArg(Address VAListAddr, QualType Ty, CodeGenFunction &CGF, | 
|---|
| 82 | AArch64ABIKind Kind, AggValueSlot Slot) const; | 
|---|
| 83 |  | 
|---|
| 84 | RValue EmitVAArg(CodeGenFunction &CGF, Address VAListAddr, QualType Ty, | 
|---|
| 85 | AggValueSlot Slot) const override { | 
|---|
| 86 | llvm::Type *BaseTy = CGF.ConvertType(T: Ty); | 
|---|
| 87 | if (isa<llvm::ScalableVectorType>(Val: BaseTy)) | 
|---|
| 88 | llvm::report_fatal_error(reason: "Passing SVE types to variadic functions is " | 
|---|
| 89 | "currently not supported"); | 
|---|
| 90 |  | 
|---|
| 91 | return Kind == AArch64ABIKind::Win64 | 
|---|
| 92 | ? EmitMSVAArg(CGF, VAListAddr, Ty, Slot) | 
|---|
| 93 | : isDarwinPCS() ? EmitDarwinVAArg(VAListAddr, Ty, CGF, Slot) | 
|---|
| 94 | : EmitAAPCSVAArg(VAListAddr, Ty, CGF, Kind, Slot); | 
|---|
| 95 | } | 
|---|
| 96 |  | 
|---|
| 97 | RValue EmitMSVAArg(CodeGenFunction &CGF, Address VAListAddr, QualType Ty, | 
|---|
| 98 | AggValueSlot Slot) const override; | 
|---|
| 99 |  | 
|---|
| 100 | bool allowBFloatArgsAndRet() const override { | 
|---|
| 101 | return getTarget().hasBFloat16Type(); | 
|---|
| 102 | } | 
|---|
| 103 |  | 
|---|
| 104 | using ABIInfo::appendAttributeMangling; | 
|---|
| 105 | void appendAttributeMangling(TargetClonesAttr *Attr, unsigned Index, | 
|---|
| 106 | raw_ostream &Out) const override; | 
|---|
| 107 | void appendAttributeMangling(StringRef AttrStr, | 
|---|
| 108 | raw_ostream &Out) const override; | 
|---|
| 109 | }; | 
|---|
| 110 |  | 
|---|
| 111 | class AArch64SwiftABIInfo : public SwiftABIInfo { | 
|---|
| 112 | public: | 
|---|
| 113 | explicit AArch64SwiftABIInfo(CodeGenTypes &CGT) | 
|---|
| 114 | : SwiftABIInfo(CGT, /*SwiftErrorInRegister=*/true) {} | 
|---|
| 115 |  | 
|---|
| 116 | bool isLegalVectorType(CharUnits VectorSize, llvm::Type *EltTy, | 
|---|
| 117 | unsigned NumElts) const override; | 
|---|
| 118 | }; | 
|---|
| 119 |  | 
|---|
| 120 | class AArch64TargetCodeGenInfo : public TargetCodeGenInfo { | 
|---|
| 121 | public: | 
|---|
| 122 | AArch64TargetCodeGenInfo(CodeGenTypes &CGT, AArch64ABIKind Kind) | 
|---|
| 123 | : TargetCodeGenInfo(std::make_unique<AArch64ABIInfo>(args&: CGT, args&: Kind)) { | 
|---|
| 124 | SwiftInfo = std::make_unique<AArch64SwiftABIInfo>(args&: CGT); | 
|---|
| 125 | } | 
|---|
| 126 |  | 
|---|
| 127 | StringRef getARCRetainAutoreleasedReturnValueMarker() const override { | 
|---|
| 128 | return "mov\tfp, fp\t\t// marker for objc_retainAutoreleaseReturnValue"; | 
|---|
| 129 | } | 
|---|
| 130 |  | 
|---|
| 131 | int getDwarfEHStackPointer(CodeGen::CodeGenModule &M) const override { | 
|---|
| 132 | return 31; | 
|---|
| 133 | } | 
|---|
| 134 |  | 
|---|
| 135 | bool doesReturnSlotInterfereWithArgs() const override { return false; } | 
|---|
| 136 |  | 
|---|
| 137 | void setTargetAttributes(const Decl *D, llvm::GlobalValue *GV, | 
|---|
| 138 | CodeGen::CodeGenModule &CGM) const override { | 
|---|
| 139 | auto *Fn = dyn_cast<llvm::Function>(Val: GV); | 
|---|
| 140 | if (!Fn) | 
|---|
| 141 | return; | 
|---|
| 142 |  | 
|---|
| 143 | const auto *FD = dyn_cast_or_null<FunctionDecl>(Val: D); | 
|---|
| 144 | TargetInfo::BranchProtectionInfo BPI(CGM.getLangOpts()); | 
|---|
| 145 |  | 
|---|
| 146 | if (FD && FD->hasAttr<TargetAttr>()) { | 
|---|
| 147 | const auto *TA = FD->getAttr<TargetAttr>(); | 
|---|
| 148 | ParsedTargetAttr Attr = | 
|---|
| 149 | CGM.getTarget().parseTargetAttr(Str: TA->getFeaturesStr()); | 
|---|
| 150 | if (!Attr.BranchProtection.empty()) { | 
|---|
| 151 | StringRef Error; | 
|---|
| 152 | (void)CGM.getTarget().validateBranchProtection( | 
|---|
| 153 | Spec: Attr.BranchProtection, Arch: Attr.CPU, BPI, LO: CGM.getLangOpts(), Err&: Error); | 
|---|
| 154 | assert(Error.empty()); | 
|---|
| 155 | } | 
|---|
| 156 | } | 
|---|
| 157 | setBranchProtectionFnAttributes(BPI, F&: *Fn); | 
|---|
| 158 | setPointerAuthFnAttributes(Opts: CGM.getCodeGenOpts().PointerAuth, F&: *Fn); | 
|---|
| 159 | } | 
|---|
| 160 |  | 
|---|
| 161 | bool isScalarizableAsmOperand(CodeGen::CodeGenFunction &CGF, | 
|---|
| 162 | llvm::Type *Ty) const override { | 
|---|
| 163 | if (CGF.getTarget().hasFeature(Feature: "ls64")) { | 
|---|
| 164 | auto *ST = dyn_cast<llvm::StructType>(Val: Ty); | 
|---|
| 165 | if (ST && ST->getNumElements() == 1) { | 
|---|
| 166 | auto *AT = dyn_cast<llvm::ArrayType>(Val: ST->getElementType(N: 0)); | 
|---|
| 167 | if (AT && AT->getNumElements() == 8 && | 
|---|
| 168 | AT->getElementType()->isIntegerTy(Bitwidth: 64)) | 
|---|
| 169 | return true; | 
|---|
| 170 | } | 
|---|
| 171 | } | 
|---|
| 172 | return TargetCodeGenInfo::isScalarizableAsmOperand(CGF, Ty); | 
|---|
| 173 | } | 
|---|
| 174 |  | 
|---|
| 175 | void checkFunctionABI(CodeGenModule &CGM, | 
|---|
| 176 | const FunctionDecl *Decl) const override; | 
|---|
| 177 |  | 
|---|
| 178 | void checkFunctionCallABI(CodeGenModule &CGM, SourceLocation CallLoc, | 
|---|
| 179 | const FunctionDecl *Caller, | 
|---|
| 180 | const FunctionDecl *Callee, const CallArgList &Args, | 
|---|
| 181 | QualType ReturnType) const override; | 
|---|
| 182 |  | 
|---|
| 183 | bool wouldInliningViolateFunctionCallABI( | 
|---|
| 184 | const FunctionDecl *Caller, const FunctionDecl *Callee) const override; | 
|---|
| 185 |  | 
|---|
| 186 | private: | 
|---|
| 187 | // Diagnose calls between functions with incompatible Streaming SVE | 
|---|
| 188 | // attributes. | 
|---|
| 189 | void checkFunctionCallABIStreaming(CodeGenModule &CGM, SourceLocation CallLoc, | 
|---|
| 190 | const FunctionDecl *Caller, | 
|---|
| 191 | const FunctionDecl *Callee) const; | 
|---|
| 192 | // Diagnose calls which must pass arguments in floating-point registers when | 
|---|
| 193 | // the selected target does not have floating-point registers. | 
|---|
| 194 | void checkFunctionCallABISoftFloat(CodeGenModule &CGM, SourceLocation CallLoc, | 
|---|
| 195 | const FunctionDecl *Caller, | 
|---|
| 196 | const FunctionDecl *Callee, | 
|---|
| 197 | const CallArgList &Args, | 
|---|
| 198 | QualType ReturnType) const; | 
|---|
| 199 | }; | 
|---|
| 200 |  | 
|---|
| 201 | class WindowsAArch64TargetCodeGenInfo : public AArch64TargetCodeGenInfo { | 
|---|
| 202 | public: | 
|---|
| 203 | WindowsAArch64TargetCodeGenInfo(CodeGenTypes &CGT, AArch64ABIKind K) | 
|---|
| 204 | : AArch64TargetCodeGenInfo(CGT, K) {} | 
|---|
| 205 |  | 
|---|
| 206 | void setTargetAttributes(const Decl *D, llvm::GlobalValue *GV, | 
|---|
| 207 | CodeGen::CodeGenModule &CGM) const override; | 
|---|
| 208 |  | 
|---|
| 209 | void getDependentLibraryOption(llvm::StringRef Lib, | 
|---|
| 210 | llvm::SmallString<24> &Opt) const override { | 
|---|
| 211 | Opt = "/DEFAULTLIB:"+ qualifyWindowsLibrary(Lib); | 
|---|
| 212 | } | 
|---|
| 213 |  | 
|---|
| 214 | void getDetectMismatchOption(llvm::StringRef Name, llvm::StringRef Value, | 
|---|
| 215 | llvm::SmallString<32> &Opt) const override { | 
|---|
| 216 | Opt = "/FAILIFMISMATCH:\""+ Name.str() + "="+ Value.str() + "\""; | 
|---|
| 217 | } | 
|---|
| 218 | }; | 
|---|
| 219 |  | 
|---|
| 220 | void WindowsAArch64TargetCodeGenInfo::setTargetAttributes( | 
|---|
| 221 | const Decl *D, llvm::GlobalValue *GV, CodeGen::CodeGenModule &CGM) const { | 
|---|
| 222 | AArch64TargetCodeGenInfo::setTargetAttributes(D, GV, CGM); | 
|---|
| 223 | if (GV->isDeclaration()) | 
|---|
| 224 | return; | 
|---|
| 225 | addStackProbeTargetAttributes(D, GV, CGM); | 
|---|
| 226 | } | 
|---|
| 227 | } | 
|---|
| 228 |  | 
|---|
| 229 | llvm::Type * | 
|---|
| 230 | AArch64ABIInfo::convertFixedToScalableVectorType(const VectorType *VT) const { | 
|---|
| 231 | assert(VT->getElementType()->isBuiltinType() && "expected builtin type!"); | 
|---|
| 232 |  | 
|---|
| 233 | if (VT->getVectorKind() == VectorKind::SveFixedLengthPredicate) { | 
|---|
| 234 | assert(VT->getElementType()->castAs<BuiltinType>()->getKind() == | 
|---|
| 235 | BuiltinType::UChar && | 
|---|
| 236 | "unexpected builtin type for SVE predicate!"); | 
|---|
| 237 | return llvm::ScalableVectorType::get(ElementType: llvm::Type::getInt1Ty(C&: getVMContext()), | 
|---|
| 238 | MinNumElts: 16); | 
|---|
| 239 | } | 
|---|
| 240 |  | 
|---|
| 241 | if (VT->getVectorKind() == VectorKind::SveFixedLengthData) { | 
|---|
| 242 | const auto *BT = VT->getElementType()->castAs<BuiltinType>(); | 
|---|
| 243 | switch (BT->getKind()) { | 
|---|
| 244 | default: | 
|---|
| 245 | llvm_unreachable( "unexpected builtin type for SVE vector!"); | 
|---|
| 246 |  | 
|---|
| 247 | case BuiltinType::SChar: | 
|---|
| 248 | case BuiltinType::UChar: | 
|---|
| 249 | case BuiltinType::MFloat8: | 
|---|
| 250 | return llvm::ScalableVectorType::get( | 
|---|
| 251 | ElementType: llvm::Type::getInt8Ty(C&: getVMContext()), MinNumElts: 16); | 
|---|
| 252 |  | 
|---|
| 253 | case BuiltinType::Short: | 
|---|
| 254 | case BuiltinType::UShort: | 
|---|
| 255 | return llvm::ScalableVectorType::get( | 
|---|
| 256 | ElementType: llvm::Type::getInt16Ty(C&: getVMContext()), MinNumElts: 8); | 
|---|
| 257 |  | 
|---|
| 258 | case BuiltinType::Int: | 
|---|
| 259 | case BuiltinType::UInt: | 
|---|
| 260 | return llvm::ScalableVectorType::get( | 
|---|
| 261 | ElementType: llvm::Type::getInt32Ty(C&: getVMContext()), MinNumElts: 4); | 
|---|
| 262 |  | 
|---|
| 263 | case BuiltinType::Long: | 
|---|
| 264 | case BuiltinType::ULong: | 
|---|
| 265 | return llvm::ScalableVectorType::get( | 
|---|
| 266 | ElementType: llvm::Type::getInt64Ty(C&: getVMContext()), MinNumElts: 2); | 
|---|
| 267 |  | 
|---|
| 268 | case BuiltinType::Half: | 
|---|
| 269 | return llvm::ScalableVectorType::get( | 
|---|
| 270 | ElementType: llvm::Type::getHalfTy(C&: getVMContext()), MinNumElts: 8); | 
|---|
| 271 |  | 
|---|
| 272 | case BuiltinType::Float: | 
|---|
| 273 | return llvm::ScalableVectorType::get( | 
|---|
| 274 | ElementType: llvm::Type::getFloatTy(C&: getVMContext()), MinNumElts: 4); | 
|---|
| 275 |  | 
|---|
| 276 | case BuiltinType::Double: | 
|---|
| 277 | return llvm::ScalableVectorType::get( | 
|---|
| 278 | ElementType: llvm::Type::getDoubleTy(C&: getVMContext()), MinNumElts: 2); | 
|---|
| 279 |  | 
|---|
| 280 | case BuiltinType::BFloat16: | 
|---|
| 281 | return llvm::ScalableVectorType::get( | 
|---|
| 282 | ElementType: llvm::Type::getBFloatTy(C&: getVMContext()), MinNumElts: 8); | 
|---|
| 283 | } | 
|---|
| 284 | } | 
|---|
| 285 |  | 
|---|
| 286 | llvm_unreachable( "expected fixed-length SVE vector"); | 
|---|
| 287 | } | 
|---|
| 288 |  | 
|---|
| 289 | ABIArgInfo AArch64ABIInfo::coerceIllegalVector(QualType Ty, unsigned &NSRN, | 
|---|
| 290 | unsigned &NPRN) const { | 
|---|
| 291 | assert(Ty->isVectorType() && "expected vector type!"); | 
|---|
| 292 |  | 
|---|
| 293 | const auto *VT = Ty->castAs<VectorType>(); | 
|---|
| 294 | if (VT->getVectorKind() == VectorKind::SveFixedLengthPredicate) { | 
|---|
| 295 | assert(VT->getElementType()->isBuiltinType() && "expected builtin type!"); | 
|---|
| 296 | assert(VT->getElementType()->castAs<BuiltinType>()->getKind() == | 
|---|
| 297 | BuiltinType::UChar && | 
|---|
| 298 | "unexpected builtin type for SVE predicate!"); | 
|---|
| 299 | NPRN = std::min(a: NPRN + 1, b: 4u); | 
|---|
| 300 | return ABIArgInfo::getDirect(T: llvm::ScalableVectorType::get( | 
|---|
| 301 | ElementType: llvm::Type::getInt1Ty(C&: getVMContext()), MinNumElts: 16)); | 
|---|
| 302 | } | 
|---|
| 303 |  | 
|---|
| 304 | if (VT->getVectorKind() == VectorKind::SveFixedLengthData) { | 
|---|
| 305 | NSRN = std::min(a: NSRN + 1, b: 8u); | 
|---|
| 306 | return ABIArgInfo::getDirect(T: convertFixedToScalableVectorType(VT)); | 
|---|
| 307 | } | 
|---|
| 308 |  | 
|---|
| 309 | uint64_t Size = getContext().getTypeSize(T: Ty); | 
|---|
| 310 | // Android promotes <2 x i8> to i16, not i32 | 
|---|
| 311 | if ((isAndroid() || isOHOSFamily()) && (Size <= 16)) { | 
|---|
| 312 | llvm::Type *ResType = llvm::Type::getInt16Ty(C&: getVMContext()); | 
|---|
| 313 | return ABIArgInfo::getDirect(T: ResType); | 
|---|
| 314 | } | 
|---|
| 315 | if (Size <= 32) { | 
|---|
| 316 | llvm::Type *ResType = llvm::Type::getInt32Ty(C&: getVMContext()); | 
|---|
| 317 | return ABIArgInfo::getDirect(T: ResType); | 
|---|
| 318 | } | 
|---|
| 319 | if (Size == 64) { | 
|---|
| 320 | NSRN = std::min(a: NSRN + 1, b: 8u); | 
|---|
| 321 | auto *ResType = | 
|---|
| 322 | llvm::FixedVectorType::get(ElementType: llvm::Type::getInt32Ty(C&: getVMContext()), NumElts: 2); | 
|---|
| 323 | return ABIArgInfo::getDirect(T: ResType); | 
|---|
| 324 | } | 
|---|
| 325 | if (Size == 128) { | 
|---|
| 326 | NSRN = std::min(a: NSRN + 1, b: 8u); | 
|---|
| 327 | auto *ResType = | 
|---|
| 328 | llvm::FixedVectorType::get(ElementType: llvm::Type::getInt32Ty(C&: getVMContext()), NumElts: 4); | 
|---|
| 329 | return ABIArgInfo::getDirect(T: ResType); | 
|---|
| 330 | } | 
|---|
| 331 |  | 
|---|
| 332 | return getNaturalAlignIndirect(Ty, AddrSpace: getDataLayout().getAllocaAddrSpace(), | 
|---|
| 333 | /*ByVal=*/false); | 
|---|
| 334 | } | 
|---|
| 335 |  | 
|---|
| 336 | ABIArgInfo AArch64ABIInfo::coerceAndExpandPureScalableAggregate( | 
|---|
| 337 | QualType Ty, bool IsNamedArg, unsigned NVec, unsigned NPred, | 
|---|
| 338 | const SmallVectorImpl<llvm::Type *> &UnpaddedCoerceToSeq, unsigned &NSRN, | 
|---|
| 339 | unsigned &NPRN) const { | 
|---|
| 340 | if (!IsNamedArg || NSRN + NVec > 8 || NPRN + NPred > 4) | 
|---|
| 341 | return getNaturalAlignIndirect(Ty, AddrSpace: getDataLayout().getAllocaAddrSpace(), | 
|---|
| 342 | /*ByVal=*/false); | 
|---|
| 343 | NSRN += NVec; | 
|---|
| 344 | NPRN += NPred; | 
|---|
| 345 |  | 
|---|
| 346 | // Handle SVE vector tuples. | 
|---|
| 347 | if (Ty->isSVESizelessBuiltinType()) | 
|---|
| 348 | return ABIArgInfo::getDirect(); | 
|---|
| 349 |  | 
|---|
| 350 | llvm::Type *UnpaddedCoerceToType = | 
|---|
| 351 | UnpaddedCoerceToSeq.size() == 1 | 
|---|
| 352 | ? UnpaddedCoerceToSeq[0] | 
|---|
| 353 | : llvm::StructType::get(Context&: CGT.getLLVMContext(), Elements: UnpaddedCoerceToSeq, | 
|---|
| 354 | isPacked: true); | 
|---|
| 355 |  | 
|---|
| 356 | SmallVector<llvm::Type *> CoerceToSeq; | 
|---|
| 357 | flattenType(Ty: CGT.ConvertType(T: Ty), Flattened&: CoerceToSeq); | 
|---|
| 358 | auto *CoerceToType = | 
|---|
| 359 | llvm::StructType::get(Context&: CGT.getLLVMContext(), Elements: CoerceToSeq, isPacked: false); | 
|---|
| 360 |  | 
|---|
| 361 | return ABIArgInfo::getCoerceAndExpand(coerceToType: CoerceToType, unpaddedCoerceToType: UnpaddedCoerceToType); | 
|---|
| 362 | } | 
|---|
| 363 |  | 
|---|
| 364 | ABIArgInfo AArch64ABIInfo::classifyArgumentType(QualType Ty, bool IsVariadicFn, | 
|---|
| 365 | bool IsNamedArg, | 
|---|
| 366 | unsigned CallingConvention, | 
|---|
| 367 | unsigned &NSRN, | 
|---|
| 368 | unsigned &NPRN) const { | 
|---|
| 369 | Ty = useFirstFieldIfTransparentUnion(Ty); | 
|---|
| 370 |  | 
|---|
| 371 | // Handle illegal vector types here. | 
|---|
| 372 | if (isIllegalVectorType(Ty)) | 
|---|
| 373 | return coerceIllegalVector(Ty, NSRN, NPRN); | 
|---|
| 374 |  | 
|---|
| 375 | if (!passAsAggregateType(Ty)) { | 
|---|
| 376 | // Treat an enum type as its underlying type. | 
|---|
| 377 | if (const EnumType *EnumTy = Ty->getAs<EnumType>()) | 
|---|
| 378 | Ty = EnumTy->getDecl()->getIntegerType(); | 
|---|
| 379 |  | 
|---|
| 380 | if (const auto *EIT = Ty->getAs<BitIntType>()) | 
|---|
| 381 | if (EIT->getNumBits() > 128) | 
|---|
| 382 | return getNaturalAlignIndirect(Ty, AddrSpace: getDataLayout().getAllocaAddrSpace(), | 
|---|
| 383 | ByVal: false); | 
|---|
| 384 |  | 
|---|
| 385 | if (Ty->isVectorType()) | 
|---|
| 386 | NSRN = std::min(a: NSRN + 1, b: 8u); | 
|---|
| 387 | else if (const auto *BT = Ty->getAs<BuiltinType>()) { | 
|---|
| 388 | if (BT->isFloatingPoint()) | 
|---|
| 389 | NSRN = std::min(a: NSRN + 1, b: 8u); | 
|---|
| 390 | else { | 
|---|
| 391 | switch (BT->getKind()) { | 
|---|
| 392 | case BuiltinType::SveBool: | 
|---|
| 393 | case BuiltinType::SveCount: | 
|---|
| 394 | NPRN = std::min(a: NPRN + 1, b: 4u); | 
|---|
| 395 | break; | 
|---|
| 396 | case BuiltinType::SveBoolx2: | 
|---|
| 397 | NPRN = std::min(a: NPRN + 2, b: 4u); | 
|---|
| 398 | break; | 
|---|
| 399 | case BuiltinType::SveBoolx4: | 
|---|
| 400 | NPRN = std::min(a: NPRN + 4, b: 4u); | 
|---|
| 401 | break; | 
|---|
| 402 | default: | 
|---|
| 403 | if (BT->isSVESizelessBuiltinType()) | 
|---|
| 404 | NSRN = std::min( | 
|---|
| 405 | a: NSRN + getContext().getBuiltinVectorTypeInfo(VecTy: BT).NumVectors, | 
|---|
| 406 | b: 8u); | 
|---|
| 407 | } | 
|---|
| 408 | } | 
|---|
| 409 | } | 
|---|
| 410 |  | 
|---|
| 411 | return (isPromotableIntegerTypeForABI(Ty) && isDarwinPCS() | 
|---|
| 412 | ? ABIArgInfo::getExtend(Ty, T: CGT.ConvertType(T: Ty)) | 
|---|
| 413 | : ABIArgInfo::getDirect()); | 
|---|
| 414 | } | 
|---|
| 415 |  | 
|---|
| 416 | // Structures with either a non-trivial destructor or a non-trivial | 
|---|
| 417 | // copy constructor are always indirect. | 
|---|
| 418 | if (CGCXXABI::RecordArgABI RAA = getRecordArgABI(T: Ty, CXXABI&: getCXXABI())) { | 
|---|
| 419 | return getNaturalAlignIndirect( | 
|---|
| 420 | Ty, /*AddrSpace=*/getDataLayout().getAllocaAddrSpace(), | 
|---|
| 421 | /*ByVal=*/RAA == CGCXXABI::RAA_DirectInMemory); | 
|---|
| 422 | } | 
|---|
| 423 |  | 
|---|
| 424 | // Empty records: | 
|---|
| 425 | uint64_t Size = getContext().getTypeSize(T: Ty); | 
|---|
| 426 | bool IsEmpty = isEmptyRecord(Context&: getContext(), T: Ty, AllowArrays: true); | 
|---|
| 427 | if (!Ty->isSVESizelessBuiltinType() && (IsEmpty || Size == 0)) { | 
|---|
| 428 | // Empty records are ignored in C mode, and in C++ on Darwin. | 
|---|
| 429 | if (!getContext().getLangOpts().CPlusPlus || isDarwinPCS()) | 
|---|
| 430 | return ABIArgInfo::getIgnore(); | 
|---|
| 431 |  | 
|---|
| 432 | // In C++ mode, arguments which have sizeof() == 0 (which are non-standard | 
|---|
| 433 | // C++) are ignored. This isn't defined by any standard, so we copy GCC's | 
|---|
| 434 | // behaviour here. | 
|---|
| 435 | if (Size == 0) | 
|---|
| 436 | return ABIArgInfo::getIgnore(); | 
|---|
| 437 |  | 
|---|
| 438 | // Otherwise, they are passed as if they have a size of 1 byte. | 
|---|
| 439 | return ABIArgInfo::getDirect(T: llvm::Type::getInt8Ty(C&: getVMContext())); | 
|---|
| 440 | } | 
|---|
| 441 |  | 
|---|
| 442 | // Homogeneous Floating-point Aggregates (HFAs) need to be expanded. | 
|---|
| 443 | const Type *Base = nullptr; | 
|---|
| 444 | uint64_t Members = 0; | 
|---|
| 445 | bool IsWin64 = Kind == AArch64ABIKind::Win64 || | 
|---|
| 446 | CallingConvention == llvm::CallingConv::Win64; | 
|---|
| 447 | bool IsWinVariadic = IsWin64 && IsVariadicFn; | 
|---|
| 448 | // In variadic functions on Windows, all composite types are treated alike, | 
|---|
| 449 | // no special handling of HFAs/HVAs. | 
|---|
| 450 | if (!IsWinVariadic && isHomogeneousAggregate(Ty, Base, Members)) { | 
|---|
| 451 | NSRN = std::min(a: NSRN + Members, b: uint64_t(8)); | 
|---|
| 452 | if (Kind != AArch64ABIKind::AAPCS) | 
|---|
| 453 | return ABIArgInfo::getDirect( | 
|---|
| 454 | T: llvm::ArrayType::get(ElementType: CGT.ConvertType(T: QualType(Base, 0)), NumElements: Members)); | 
|---|
| 455 |  | 
|---|
| 456 | // For HFAs/HVAs, cap the argument alignment to 16, otherwise | 
|---|
| 457 | // set it to 8 according to the AAPCS64 document. | 
|---|
| 458 | unsigned Align = | 
|---|
| 459 | getContext().getTypeUnadjustedAlignInChars(T: Ty).getQuantity(); | 
|---|
| 460 | Align = (Align >= 16) ? 16 : 8; | 
|---|
| 461 | return ABIArgInfo::getDirect( | 
|---|
| 462 | T: llvm::ArrayType::get(ElementType: CGT.ConvertType(T: QualType(Base, 0)), NumElements: Members), Offset: 0, | 
|---|
| 463 | Padding: nullptr, CanBeFlattened: true, Align); | 
|---|
| 464 | } | 
|---|
| 465 |  | 
|---|
| 466 | // In AAPCS named arguments of a Pure Scalable Type are passed expanded in | 
|---|
| 467 | // registers, or indirectly if there are not enough registers. | 
|---|
| 468 | if (Kind == AArch64ABIKind::AAPCS) { | 
|---|
| 469 | unsigned NVec = 0, NPred = 0; | 
|---|
| 470 | SmallVector<llvm::Type *> UnpaddedCoerceToSeq; | 
|---|
| 471 | if (passAsPureScalableType(Ty, NV&: NVec, NP&: NPred, CoerceToSeq&: UnpaddedCoerceToSeq) && | 
|---|
| 472 | (NVec + NPred) > 0) | 
|---|
| 473 | return coerceAndExpandPureScalableAggregate( | 
|---|
| 474 | Ty, IsNamedArg, NVec, NPred, UnpaddedCoerceToSeq, NSRN, NPRN); | 
|---|
| 475 | } | 
|---|
| 476 |  | 
|---|
| 477 | // Aggregates <= 16 bytes are passed directly in registers or on the stack. | 
|---|
| 478 | if (Size <= 128) { | 
|---|
| 479 | unsigned Alignment; | 
|---|
| 480 | if (Kind == AArch64ABIKind::AAPCS) { | 
|---|
| 481 | Alignment = getContext().getTypeUnadjustedAlign(T: Ty); | 
|---|
| 482 | Alignment = Alignment < 128 ? 64 : 128; | 
|---|
| 483 | } else { | 
|---|
| 484 | Alignment = | 
|---|
| 485 | std::max(a: getContext().getTypeAlign(T: Ty), | 
|---|
| 486 | b: (unsigned)getTarget().getPointerWidth(AddrSpace: LangAS::Default)); | 
|---|
| 487 | } | 
|---|
| 488 | Size = llvm::alignTo(Value: Size, Align: Alignment); | 
|---|
| 489 |  | 
|---|
| 490 | // If the Aggregate is made up of pointers, use an array of pointers for the | 
|---|
| 491 | // coerced type. This prevents having to convert ptr2int->int2ptr through | 
|---|
| 492 | // the call, allowing alias analysis to produce better code. | 
|---|
| 493 | auto ContainsOnlyPointers = [&](const auto &Self, QualType Ty) { | 
|---|
| 494 | if (isEmptyRecord(Context&: getContext(), T: Ty, AllowArrays: true)) | 
|---|
| 495 | return false; | 
|---|
| 496 | const RecordType *RT = Ty->getAs<RecordType>(); | 
|---|
| 497 | if (!RT) | 
|---|
| 498 | return false; | 
|---|
| 499 | const RecordDecl *RD = RT->getDecl(); | 
|---|
| 500 | if (const CXXRecordDecl *CXXRD = dyn_cast<CXXRecordDecl>(Val: RD)) { | 
|---|
| 501 | for (const auto &I : CXXRD->bases()) | 
|---|
| 502 | if (!Self(Self, I.getType())) | 
|---|
| 503 | return false; | 
|---|
| 504 | } | 
|---|
| 505 | return all_of(RD->fields(), [&](FieldDecl *FD) { | 
|---|
| 506 | QualType FDTy = FD->getType(); | 
|---|
| 507 | if (FDTy->isArrayType()) | 
|---|
| 508 | FDTy = getContext().getBaseElementType(QT: FDTy); | 
|---|
| 509 | return (FDTy->isPointerOrReferenceType() && | 
|---|
| 510 | getContext().getTypeSize(T: FDTy) == 64 && | 
|---|
| 511 | !FDTy->getPointeeType().hasAddressSpace()) || | 
|---|
| 512 | Self(Self, FDTy); | 
|---|
| 513 | }); | 
|---|
| 514 | }; | 
|---|
| 515 |  | 
|---|
| 516 | // We use a pair of i64 for 16-byte aggregate with 8-byte alignment. | 
|---|
| 517 | // For aggregates with 16-byte alignment, we use i128. | 
|---|
| 518 | llvm::Type *BaseTy = llvm::Type::getIntNTy(C&: getVMContext(), N: Alignment); | 
|---|
| 519 | if ((Size == 64 || Size == 128) && Alignment == 64 && | 
|---|
| 520 | ContainsOnlyPointers(ContainsOnlyPointers, Ty)) | 
|---|
| 521 | BaseTy = llvm::PointerType::getUnqual(C&: getVMContext()); | 
|---|
| 522 | return ABIArgInfo::getDirect( | 
|---|
| 523 | T: Size == Alignment ? BaseTy | 
|---|
| 524 | : llvm::ArrayType::get(ElementType: BaseTy, NumElements: Size / Alignment)); | 
|---|
| 525 | } | 
|---|
| 526 |  | 
|---|
| 527 | return getNaturalAlignIndirect(Ty, AddrSpace: getDataLayout().getAllocaAddrSpace(), | 
|---|
| 528 | /*ByVal=*/false); | 
|---|
| 529 | } | 
|---|
| 530 |  | 
|---|
| 531 | ABIArgInfo AArch64ABIInfo::classifyReturnType(QualType RetTy, | 
|---|
| 532 | bool IsVariadicFn) const { | 
|---|
| 533 | if (RetTy->isVoidType()) | 
|---|
| 534 | return ABIArgInfo::getIgnore(); | 
|---|
| 535 |  | 
|---|
| 536 | if (const auto *VT = RetTy->getAs<VectorType>()) { | 
|---|
| 537 | if (VT->getVectorKind() == VectorKind::SveFixedLengthData || | 
|---|
| 538 | VT->getVectorKind() == VectorKind::SveFixedLengthPredicate) { | 
|---|
| 539 | unsigned NSRN = 0, NPRN = 0; | 
|---|
| 540 | return coerceIllegalVector(Ty: RetTy, NSRN, NPRN); | 
|---|
| 541 | } | 
|---|
| 542 | } | 
|---|
| 543 |  | 
|---|
| 544 | // Large vector types should be returned via memory. | 
|---|
| 545 | if (RetTy->isVectorType() && getContext().getTypeSize(T: RetTy) > 128) | 
|---|
| 546 | return getNaturalAlignIndirect(Ty: RetTy, AddrSpace: getDataLayout().getAllocaAddrSpace()); | 
|---|
| 547 |  | 
|---|
| 548 | if (!passAsAggregateType(Ty: RetTy)) { | 
|---|
| 549 | // Treat an enum type as its underlying type. | 
|---|
| 550 | if (const EnumType *EnumTy = RetTy->getAs<EnumType>()) | 
|---|
| 551 | RetTy = EnumTy->getDecl()->getIntegerType(); | 
|---|
| 552 |  | 
|---|
| 553 | if (const auto *EIT = RetTy->getAs<BitIntType>()) | 
|---|
| 554 | if (EIT->getNumBits() > 128) | 
|---|
| 555 | return getNaturalAlignIndirect(Ty: RetTy, | 
|---|
| 556 | AddrSpace: getDataLayout().getAllocaAddrSpace()); | 
|---|
| 557 |  | 
|---|
| 558 | return (isPromotableIntegerTypeForABI(Ty: RetTy) && isDarwinPCS() | 
|---|
| 559 | ? ABIArgInfo::getExtend(Ty: RetTy) | 
|---|
| 560 | : ABIArgInfo::getDirect()); | 
|---|
| 561 | } | 
|---|
| 562 |  | 
|---|
| 563 | uint64_t Size = getContext().getTypeSize(T: RetTy); | 
|---|
| 564 | if (!RetTy->isSVESizelessBuiltinType() && | 
|---|
| 565 | (isEmptyRecord(Context&: getContext(), T: RetTy, AllowArrays: true) || Size == 0)) | 
|---|
| 566 | return ABIArgInfo::getIgnore(); | 
|---|
| 567 |  | 
|---|
| 568 | const Type *Base = nullptr; | 
|---|
| 569 | uint64_t Members = 0; | 
|---|
| 570 | if (isHomogeneousAggregate(Ty: RetTy, Base, Members) && | 
|---|
| 571 | !(getTarget().getTriple().getArch() == llvm::Triple::aarch64_32 && | 
|---|
| 572 | IsVariadicFn)) | 
|---|
| 573 | // Homogeneous Floating-point Aggregates (HFAs) are returned directly. | 
|---|
| 574 | return ABIArgInfo::getDirect(); | 
|---|
| 575 |  | 
|---|
| 576 | // In AAPCS return values of a Pure Scalable type are treated as a single | 
|---|
| 577 | // named argument and passed expanded in registers, or indirectly if there are | 
|---|
| 578 | // not enough registers. | 
|---|
| 579 | if (Kind == AArch64ABIKind::AAPCS) { | 
|---|
| 580 | unsigned NSRN = 0, NPRN = 0; | 
|---|
| 581 | unsigned NVec = 0, NPred = 0; | 
|---|
| 582 | SmallVector<llvm::Type *> UnpaddedCoerceToSeq; | 
|---|
| 583 | if (passAsPureScalableType(Ty: RetTy, NV&: NVec, NP&: NPred, CoerceToSeq&: UnpaddedCoerceToSeq) && | 
|---|
| 584 | (NVec + NPred) > 0) | 
|---|
| 585 | return coerceAndExpandPureScalableAggregate( | 
|---|
| 586 | Ty: RetTy, /* IsNamedArg */ true, NVec, NPred, UnpaddedCoerceToSeq, NSRN, | 
|---|
| 587 | NPRN); | 
|---|
| 588 | } | 
|---|
| 589 |  | 
|---|
| 590 | // Aggregates <= 16 bytes are returned directly in registers or on the stack. | 
|---|
| 591 | if (Size <= 128) { | 
|---|
| 592 | if (Size <= 64 && getDataLayout().isLittleEndian()) { | 
|---|
| 593 | // Composite types are returned in lower bits of a 64-bit register for LE, | 
|---|
| 594 | // and in higher bits for BE. However, integer types are always returned | 
|---|
| 595 | // in lower bits for both LE and BE, and they are not rounded up to | 
|---|
| 596 | // 64-bits. We can skip rounding up of composite types for LE, but not for | 
|---|
| 597 | // BE, otherwise composite types will be indistinguishable from integer | 
|---|
| 598 | // types. | 
|---|
| 599 | return ABIArgInfo::getDirect( | 
|---|
| 600 | T: llvm::IntegerType::get(C&: getVMContext(), NumBits: Size)); | 
|---|
| 601 | } | 
|---|
| 602 |  | 
|---|
| 603 | unsigned Alignment = getContext().getTypeAlign(T: RetTy); | 
|---|
| 604 | Size = llvm::alignTo(Value: Size, Align: 64); // round up to multiple of 8 bytes | 
|---|
| 605 |  | 
|---|
| 606 | // We use a pair of i64 for 16-byte aggregate with 8-byte alignment. | 
|---|
| 607 | // For aggregates with 16-byte alignment, we use i128. | 
|---|
| 608 | if (Alignment < 128 && Size == 128) { | 
|---|
| 609 | llvm::Type *BaseTy = llvm::Type::getInt64Ty(C&: getVMContext()); | 
|---|
| 610 | return ABIArgInfo::getDirect(T: llvm::ArrayType::get(ElementType: BaseTy, NumElements: Size / 64)); | 
|---|
| 611 | } | 
|---|
| 612 | return ABIArgInfo::getDirect(T: llvm::IntegerType::get(C&: getVMContext(), NumBits: Size)); | 
|---|
| 613 | } | 
|---|
| 614 |  | 
|---|
| 615 | return getNaturalAlignIndirect(Ty: RetTy, AddrSpace: getDataLayout().getAllocaAddrSpace()); | 
|---|
| 616 | } | 
|---|
| 617 |  | 
|---|
| 618 | /// isIllegalVectorType - check whether the vector type is legal for AArch64. | 
|---|
| 619 | bool AArch64ABIInfo::isIllegalVectorType(QualType Ty) const { | 
|---|
| 620 | if (const VectorType *VT = Ty->getAs<VectorType>()) { | 
|---|
| 621 | // Check whether VT is a fixed-length SVE vector. These types are | 
|---|
| 622 | // represented as scalable vectors in function args/return and must be | 
|---|
| 623 | // coerced from fixed vectors. | 
|---|
| 624 | if (VT->getVectorKind() == VectorKind::SveFixedLengthData || | 
|---|
| 625 | VT->getVectorKind() == VectorKind::SveFixedLengthPredicate) | 
|---|
| 626 | return true; | 
|---|
| 627 |  | 
|---|
| 628 | // Check whether VT is legal. | 
|---|
| 629 | unsigned NumElements = VT->getNumElements(); | 
|---|
| 630 | uint64_t Size = getContext().getTypeSize(T: VT); | 
|---|
| 631 | // NumElements should be power of 2. | 
|---|
| 632 | if (!llvm::isPowerOf2_32(Value: NumElements)) | 
|---|
| 633 | return true; | 
|---|
| 634 |  | 
|---|
| 635 | // arm64_32 has to be compatible with the ARM logic here, which allows huge | 
|---|
| 636 | // vectors for some reason. | 
|---|
| 637 | llvm::Triple Triple = getTarget().getTriple(); | 
|---|
| 638 | if (Triple.getArch() == llvm::Triple::aarch64_32 && | 
|---|
| 639 | Triple.isOSBinFormatMachO()) | 
|---|
| 640 | return Size <= 32; | 
|---|
| 641 |  | 
|---|
| 642 | return Size != 64 && (Size != 128 || NumElements == 1); | 
|---|
| 643 | } | 
|---|
| 644 | return false; | 
|---|
| 645 | } | 
|---|
| 646 |  | 
|---|
| 647 | bool AArch64SwiftABIInfo::isLegalVectorType(CharUnits VectorSize, | 
|---|
| 648 | llvm::Type *EltTy, | 
|---|
| 649 | unsigned NumElts) const { | 
|---|
| 650 | if (!llvm::isPowerOf2_32(Value: NumElts)) | 
|---|
| 651 | return false; | 
|---|
| 652 | if (VectorSize.getQuantity() != 8 && | 
|---|
| 653 | (VectorSize.getQuantity() != 16 || NumElts == 1)) | 
|---|
| 654 | return false; | 
|---|
| 655 | return true; | 
|---|
| 656 | } | 
|---|
| 657 |  | 
|---|
| 658 | bool AArch64ABIInfo::isHomogeneousAggregateBaseType(QualType Ty) const { | 
|---|
| 659 | // For the soft-float ABI variant, no types are considered to be homogeneous | 
|---|
| 660 | // aggregates. | 
|---|
| 661 | if (isSoftFloat()) | 
|---|
| 662 | return false; | 
|---|
| 663 |  | 
|---|
| 664 | // Homogeneous aggregates for AAPCS64 must have base types of a floating | 
|---|
| 665 | // point type or a short-vector type. This is the same as the 32-bit ABI, | 
|---|
| 666 | // but with the difference that any floating-point type is allowed, | 
|---|
| 667 | // including __fp16. | 
|---|
| 668 | if (const BuiltinType *BT = Ty->getAs<BuiltinType>()) { | 
|---|
| 669 | if (BT->isFloatingPoint()) | 
|---|
| 670 | return true; | 
|---|
| 671 | } else if (const VectorType *VT = Ty->getAs<VectorType>()) { | 
|---|
| 672 | if (auto Kind = VT->getVectorKind(); | 
|---|
| 673 | Kind == VectorKind::SveFixedLengthData || | 
|---|
| 674 | Kind == VectorKind::SveFixedLengthPredicate) | 
|---|
| 675 | return false; | 
|---|
| 676 |  | 
|---|
| 677 | unsigned VecSize = getContext().getTypeSize(T: VT); | 
|---|
| 678 | if (VecSize == 64 || VecSize == 128) | 
|---|
| 679 | return true; | 
|---|
| 680 | } | 
|---|
| 681 | return false; | 
|---|
| 682 | } | 
|---|
| 683 |  | 
|---|
| 684 | bool AArch64ABIInfo::isHomogeneousAggregateSmallEnough(const Type *Base, | 
|---|
| 685 | uint64_t Members) const { | 
|---|
| 686 | return Members <= 4; | 
|---|
| 687 | } | 
|---|
| 688 |  | 
|---|
| 689 | bool AArch64ABIInfo::isZeroLengthBitfieldPermittedInHomogeneousAggregate() | 
|---|
| 690 | const { | 
|---|
| 691 | // AAPCS64 says that the rule for whether something is a homogeneous | 
|---|
| 692 | // aggregate is applied to the output of the data layout decision. So | 
|---|
| 693 | // anything that doesn't affect the data layout also does not affect | 
|---|
| 694 | // homogeneity. In particular, zero-length bitfields don't stop a struct | 
|---|
| 695 | // being homogeneous. | 
|---|
| 696 | return true; | 
|---|
| 697 | } | 
|---|
| 698 |  | 
|---|
| 699 | bool AArch64ABIInfo::passAsAggregateType(QualType Ty) const { | 
|---|
| 700 | if (Kind == AArch64ABIKind::AAPCS && Ty->isSVESizelessBuiltinType()) { | 
|---|
| 701 | const auto *BT = Ty->castAs<BuiltinType>(); | 
|---|
| 702 | return !BT->isSVECount() && | 
|---|
| 703 | getContext().getBuiltinVectorTypeInfo(VecTy: BT).NumVectors > 1; | 
|---|
| 704 | } | 
|---|
| 705 | return isAggregateTypeForABI(T: Ty); | 
|---|
| 706 | } | 
|---|
| 707 |  | 
|---|
| 708 | // Check if a type needs to be passed in registers as a Pure Scalable Type (as | 
|---|
| 709 | // defined by AAPCS64). Return the number of data vectors and the number of | 
|---|
| 710 | // predicate vectors in the type, into `NVec` and `NPred`, respectively. Upon | 
|---|
| 711 | // return `CoerceToSeq` contains an expanded sequence of LLVM IR types, one | 
|---|
| 712 | // element for each non-composite member. For practical purposes, limit the | 
|---|
| 713 | // length of `CoerceToSeq` to about 12 (the maximum that could possibly fit | 
|---|
| 714 | // in registers) and return false, the effect of which will be to  pass the | 
|---|
| 715 | // argument under the rules for a large (> 128 bytes) composite. | 
|---|
| 716 | bool AArch64ABIInfo::passAsPureScalableType( | 
|---|
| 717 | QualType Ty, unsigned &NVec, unsigned &NPred, | 
|---|
| 718 | SmallVectorImpl<llvm::Type *> &CoerceToSeq) const { | 
|---|
| 719 | if (const ConstantArrayType *AT = getContext().getAsConstantArrayType(T: Ty)) { | 
|---|
| 720 | uint64_t NElt = AT->getZExtSize(); | 
|---|
| 721 | if (NElt == 0) | 
|---|
| 722 | return false; | 
|---|
| 723 |  | 
|---|
| 724 | unsigned NV = 0, NP = 0; | 
|---|
| 725 | SmallVector<llvm::Type *> EltCoerceToSeq; | 
|---|
| 726 | if (!passAsPureScalableType(Ty: AT->getElementType(), NVec&: NV, NPred&: NP, CoerceToSeq&: EltCoerceToSeq)) | 
|---|
| 727 | return false; | 
|---|
| 728 |  | 
|---|
| 729 | if (CoerceToSeq.size() + NElt * EltCoerceToSeq.size() > 12) | 
|---|
| 730 | return false; | 
|---|
| 731 |  | 
|---|
| 732 | for (uint64_t I = 0; I < NElt; ++I) | 
|---|
| 733 | llvm::append_range(C&: CoerceToSeq, R&: EltCoerceToSeq); | 
|---|
| 734 |  | 
|---|
| 735 | NVec += NElt * NV; | 
|---|
| 736 | NPred += NElt * NP; | 
|---|
| 737 | return true; | 
|---|
| 738 | } | 
|---|
| 739 |  | 
|---|
| 740 | if (const RecordType *RT = Ty->getAs<RecordType>()) { | 
|---|
| 741 | // If the record cannot be passed in registers, then it's not a PST. | 
|---|
| 742 | if (CGCXXABI::RecordArgABI RAA = getRecordArgABI(RT, CXXABI&: getCXXABI()); | 
|---|
| 743 | RAA != CGCXXABI::RAA_Default) | 
|---|
| 744 | return false; | 
|---|
| 745 |  | 
|---|
| 746 | // Pure scalable types are never unions and never contain unions. | 
|---|
| 747 | const RecordDecl *RD = RT->getDecl(); | 
|---|
| 748 | if (RD->isUnion()) | 
|---|
| 749 | return false; | 
|---|
| 750 |  | 
|---|
| 751 | // If this is a C++ record, check the bases. | 
|---|
| 752 | if (const CXXRecordDecl *CXXRD = dyn_cast<CXXRecordDecl>(Val: RD)) { | 
|---|
| 753 | for (const auto &I : CXXRD->bases()) { | 
|---|
| 754 | if (isEmptyRecord(Context&: getContext(), T: I.getType(), AllowArrays: true)) | 
|---|
| 755 | continue; | 
|---|
| 756 | if (!passAsPureScalableType(Ty: I.getType(), NVec, NPred, CoerceToSeq)) | 
|---|
| 757 | return false; | 
|---|
| 758 | } | 
|---|
| 759 | } | 
|---|
| 760 |  | 
|---|
| 761 | // Check members. | 
|---|
| 762 | for (const auto *FD : RD->fields()) { | 
|---|
| 763 | QualType FT = FD->getType(); | 
|---|
| 764 | if (isEmptyField(Context&: getContext(), FD, /* AllowArrays */ true)) | 
|---|
| 765 | continue; | 
|---|
| 766 | if (!passAsPureScalableType(Ty: FT, NVec, NPred, CoerceToSeq)) | 
|---|
| 767 | return false; | 
|---|
| 768 | } | 
|---|
| 769 |  | 
|---|
| 770 | return true; | 
|---|
| 771 | } | 
|---|
| 772 |  | 
|---|
| 773 | if (const auto *VT = Ty->getAs<VectorType>()) { | 
|---|
| 774 | if (VT->getVectorKind() == VectorKind::SveFixedLengthPredicate) { | 
|---|
| 775 | ++NPred; | 
|---|
| 776 | if (CoerceToSeq.size() + 1 > 12) | 
|---|
| 777 | return false; | 
|---|
| 778 | CoerceToSeq.push_back(Elt: convertFixedToScalableVectorType(VT)); | 
|---|
| 779 | return true; | 
|---|
| 780 | } | 
|---|
| 781 |  | 
|---|
| 782 | if (VT->getVectorKind() == VectorKind::SveFixedLengthData) { | 
|---|
| 783 | ++NVec; | 
|---|
| 784 | if (CoerceToSeq.size() + 1 > 12) | 
|---|
| 785 | return false; | 
|---|
| 786 | CoerceToSeq.push_back(Elt: convertFixedToScalableVectorType(VT)); | 
|---|
| 787 | return true; | 
|---|
| 788 | } | 
|---|
| 789 |  | 
|---|
| 790 | return false; | 
|---|
| 791 | } | 
|---|
| 792 |  | 
|---|
| 793 | if (!Ty->isBuiltinType()) | 
|---|
| 794 | return false; | 
|---|
| 795 |  | 
|---|
| 796 | bool isPredicate; | 
|---|
| 797 | switch (Ty->castAs<BuiltinType>()->getKind()) { | 
|---|
| 798 | #define SVE_VECTOR_TYPE(Name, MangledName, Id, SingletonId)                    \ | 
|---|
| 799 | case BuiltinType::Id:                                                        \ | 
|---|
| 800 | isPredicate = false;                                                       \ | 
|---|
| 801 | break; | 
|---|
| 802 | #define SVE_PREDICATE_TYPE(Name, MangledName, Id, SingletonId)                 \ | 
|---|
| 803 | case BuiltinType::Id:                                                        \ | 
|---|
| 804 | isPredicate = true;                                                        \ | 
|---|
| 805 | break; | 
|---|
| 806 | #include "clang/Basic/AArch64ACLETypes.def" | 
|---|
| 807 | default: | 
|---|
| 808 | return false; | 
|---|
| 809 | } | 
|---|
| 810 |  | 
|---|
| 811 | ASTContext::BuiltinVectorTypeInfo Info = | 
|---|
| 812 | getContext().getBuiltinVectorTypeInfo(VecTy: cast<BuiltinType>(Val&: Ty)); | 
|---|
| 813 | assert(Info.NumVectors > 0 && Info.NumVectors <= 4 && | 
|---|
| 814 | "Expected 1, 2, 3 or 4 vectors!"); | 
|---|
| 815 | if (isPredicate) | 
|---|
| 816 | NPred += Info.NumVectors; | 
|---|
| 817 | else | 
|---|
| 818 | NVec += Info.NumVectors; | 
|---|
| 819 | llvm::Type *EltTy = Info.ElementType->isMFloat8Type() | 
|---|
| 820 | ? llvm::Type::getInt8Ty(C&: getVMContext()) | 
|---|
| 821 | : CGT.ConvertType(T: Info.ElementType); | 
|---|
| 822 | auto *VTy = llvm::ScalableVectorType::get(ElementType: EltTy, MinNumElts: Info.EC.getKnownMinValue()); | 
|---|
| 823 |  | 
|---|
| 824 | if (CoerceToSeq.size() + Info.NumVectors > 12) | 
|---|
| 825 | return false; | 
|---|
| 826 | std::fill_n(first: std::back_inserter(x&: CoerceToSeq), n: Info.NumVectors, value: VTy); | 
|---|
| 827 |  | 
|---|
| 828 | return true; | 
|---|
| 829 | } | 
|---|
| 830 |  | 
|---|
| 831 | // Expand an LLVM IR type into a sequence with a element for each non-struct, | 
|---|
| 832 | // non-array member of the type, with the exception of the padding types, which | 
|---|
| 833 | // are retained. | 
|---|
| 834 | void AArch64ABIInfo::flattenType( | 
|---|
| 835 | llvm::Type *Ty, SmallVectorImpl<llvm::Type *> &Flattened) const { | 
|---|
| 836 |  | 
|---|
| 837 | if (ABIArgInfo::isPaddingForCoerceAndExpand(eltType: Ty)) { | 
|---|
| 838 | Flattened.push_back(Elt: Ty); | 
|---|
| 839 | return; | 
|---|
| 840 | } | 
|---|
| 841 |  | 
|---|
| 842 | if (const auto *AT = dyn_cast<llvm::ArrayType>(Val: Ty)) { | 
|---|
| 843 | uint64_t NElt = AT->getNumElements(); | 
|---|
| 844 | if (NElt == 0) | 
|---|
| 845 | return; | 
|---|
| 846 |  | 
|---|
| 847 | SmallVector<llvm::Type *> EltFlattened; | 
|---|
| 848 | flattenType(Ty: AT->getElementType(), Flattened&: EltFlattened); | 
|---|
| 849 |  | 
|---|
| 850 | for (uint64_t I = 0; I < NElt; ++I) | 
|---|
| 851 | llvm::append_range(C&: Flattened, R&: EltFlattened); | 
|---|
| 852 | return; | 
|---|
| 853 | } | 
|---|
| 854 |  | 
|---|
| 855 | if (const auto *ST = dyn_cast<llvm::StructType>(Val: Ty)) { | 
|---|
| 856 | for (auto *ET : ST->elements()) | 
|---|
| 857 | flattenType(Ty: ET, Flattened); | 
|---|
| 858 | return; | 
|---|
| 859 | } | 
|---|
| 860 |  | 
|---|
| 861 | Flattened.push_back(Elt: Ty); | 
|---|
| 862 | } | 
|---|
| 863 |  | 
|---|
| 864 | RValue AArch64ABIInfo::EmitAAPCSVAArg(Address VAListAddr, QualType Ty, | 
|---|
| 865 | CodeGenFunction &CGF, AArch64ABIKind Kind, | 
|---|
| 866 | AggValueSlot Slot) const { | 
|---|
| 867 | // These numbers are not used for variadic arguments, hence it doesn't matter | 
|---|
| 868 | // they don't retain their values across multiple calls to | 
|---|
| 869 | // `classifyArgumentType` here. | 
|---|
| 870 | unsigned NSRN = 0, NPRN = 0; | 
|---|
| 871 | ABIArgInfo AI = | 
|---|
| 872 | classifyArgumentType(Ty, /*IsVariadicFn=*/true, /* IsNamedArg */ false, | 
|---|
| 873 | CallingConvention: CGF.CurFnInfo->getCallingConvention(), NSRN, NPRN); | 
|---|
| 874 | // Empty records are ignored for parameter passing purposes. | 
|---|
| 875 | if (AI.isIgnore()) | 
|---|
| 876 | return Slot.asRValue(); | 
|---|
| 877 |  | 
|---|
| 878 | bool IsIndirect = AI.isIndirect(); | 
|---|
| 879 |  | 
|---|
| 880 | llvm::Type *BaseTy = CGF.ConvertType(T: Ty); | 
|---|
| 881 | if (IsIndirect) | 
|---|
| 882 | BaseTy = llvm::PointerType::getUnqual(C&: BaseTy->getContext()); | 
|---|
| 883 | else if (AI.getCoerceToType()) | 
|---|
| 884 | BaseTy = AI.getCoerceToType(); | 
|---|
| 885 |  | 
|---|
| 886 | unsigned NumRegs = 1; | 
|---|
| 887 | if (llvm::ArrayType *ArrTy = dyn_cast<llvm::ArrayType>(Val: BaseTy)) { | 
|---|
| 888 | BaseTy = ArrTy->getElementType(); | 
|---|
| 889 | NumRegs = ArrTy->getNumElements(); | 
|---|
| 890 | } | 
|---|
| 891 | bool IsFPR = | 
|---|
| 892 | !isSoftFloat() && (BaseTy->isFloatingPointTy() || BaseTy->isVectorTy()); | 
|---|
| 893 |  | 
|---|
| 894 | // The AArch64 va_list type and handling is specified in the Procedure Call | 
|---|
| 895 | // Standard, section B.4: | 
|---|
| 896 | // | 
|---|
| 897 | // struct { | 
|---|
| 898 | //   void *__stack; | 
|---|
| 899 | //   void *__gr_top; | 
|---|
| 900 | //   void *__vr_top; | 
|---|
| 901 | //   int __gr_offs; | 
|---|
| 902 | //   int __vr_offs; | 
|---|
| 903 | // }; | 
|---|
| 904 |  | 
|---|
| 905 | llvm::BasicBlock *MaybeRegBlock = CGF.createBasicBlock(name: "vaarg.maybe_reg"); | 
|---|
| 906 | llvm::BasicBlock *InRegBlock = CGF.createBasicBlock(name: "vaarg.in_reg"); | 
|---|
| 907 | llvm::BasicBlock *OnStackBlock = CGF.createBasicBlock(name: "vaarg.on_stack"); | 
|---|
| 908 | llvm::BasicBlock *ContBlock = CGF.createBasicBlock(name: "vaarg.end"); | 
|---|
| 909 |  | 
|---|
| 910 | CharUnits TySize = getContext().getTypeSizeInChars(T: Ty); | 
|---|
| 911 | CharUnits TyAlign = getContext().getTypeUnadjustedAlignInChars(T: Ty); | 
|---|
| 912 |  | 
|---|
| 913 | Address reg_offs_p = Address::invalid(); | 
|---|
| 914 | llvm::Value *reg_offs = nullptr; | 
|---|
| 915 | int reg_top_index; | 
|---|
| 916 | int RegSize = IsIndirect ? 8 : TySize.getQuantity(); | 
|---|
| 917 | if (!IsFPR) { | 
|---|
| 918 | // 3 is the field number of __gr_offs | 
|---|
| 919 | reg_offs_p = CGF.Builder.CreateStructGEP(Addr: VAListAddr, Index: 3, Name: "gr_offs_p"); | 
|---|
| 920 | reg_offs = CGF.Builder.CreateLoad(Addr: reg_offs_p, Name: "gr_offs"); | 
|---|
| 921 | reg_top_index = 1; // field number for __gr_top | 
|---|
| 922 | RegSize = llvm::alignTo(Value: RegSize, Align: 8); | 
|---|
| 923 | } else { | 
|---|
| 924 | // 4 is the field number of __vr_offs. | 
|---|
| 925 | reg_offs_p = CGF.Builder.CreateStructGEP(Addr: VAListAddr, Index: 4, Name: "vr_offs_p"); | 
|---|
| 926 | reg_offs = CGF.Builder.CreateLoad(Addr: reg_offs_p, Name: "vr_offs"); | 
|---|
| 927 | reg_top_index = 2; // field number for __vr_top | 
|---|
| 928 | RegSize = 16 * NumRegs; | 
|---|
| 929 | } | 
|---|
| 930 |  | 
|---|
| 931 | //======================================= | 
|---|
| 932 | // Find out where argument was passed | 
|---|
| 933 | //======================================= | 
|---|
| 934 |  | 
|---|
| 935 | // If reg_offs >= 0 we're already using the stack for this type of | 
|---|
| 936 | // argument. We don't want to keep updating reg_offs (in case it overflows, | 
|---|
| 937 | // though anyone passing 2GB of arguments, each at most 16 bytes, deserves | 
|---|
| 938 | // whatever they get). | 
|---|
| 939 | llvm::Value *UsingStack = nullptr; | 
|---|
| 940 | UsingStack = CGF.Builder.CreateICmpSGE( | 
|---|
| 941 | LHS: reg_offs, RHS: llvm::ConstantInt::get(Ty: CGF.Int32Ty, V: 0)); | 
|---|
| 942 |  | 
|---|
| 943 | CGF.Builder.CreateCondBr(Cond: UsingStack, True: OnStackBlock, False: MaybeRegBlock); | 
|---|
| 944 |  | 
|---|
| 945 | // Otherwise, at least some kind of argument could go in these registers, the | 
|---|
| 946 | // question is whether this particular type is too big. | 
|---|
| 947 | CGF.EmitBlock(BB: MaybeRegBlock); | 
|---|
| 948 |  | 
|---|
| 949 | // Integer arguments may need to correct register alignment (for example a | 
|---|
| 950 | // "struct { __int128 a; };" gets passed in x_2N, x_{2N+1}). In this case we | 
|---|
| 951 | // align __gr_offs to calculate the potential address. | 
|---|
| 952 | if (!IsFPR && !IsIndirect && TyAlign.getQuantity() > 8) { | 
|---|
| 953 | int Align = TyAlign.getQuantity(); | 
|---|
| 954 |  | 
|---|
| 955 | reg_offs = CGF.Builder.CreateAdd( | 
|---|
| 956 | LHS: reg_offs, RHS: llvm::ConstantInt::get(Ty: CGF.Int32Ty, V: Align - 1), | 
|---|
| 957 | Name: "align_regoffs"); | 
|---|
| 958 | reg_offs = CGF.Builder.CreateAnd( | 
|---|
| 959 | LHS: reg_offs, RHS: llvm::ConstantInt::get(Ty: CGF.Int32Ty, V: -Align), | 
|---|
| 960 | Name: "aligned_regoffs"); | 
|---|
| 961 | } | 
|---|
| 962 |  | 
|---|
| 963 | // Update the gr_offs/vr_offs pointer for next call to va_arg on this va_list. | 
|---|
| 964 | // The fact that this is done unconditionally reflects the fact that | 
|---|
| 965 | // allocating an argument to the stack also uses up all the remaining | 
|---|
| 966 | // registers of the appropriate kind. | 
|---|
| 967 | llvm::Value *NewOffset = nullptr; | 
|---|
| 968 | NewOffset = CGF.Builder.CreateAdd( | 
|---|
| 969 | LHS: reg_offs, RHS: llvm::ConstantInt::get(Ty: CGF.Int32Ty, V: RegSize), Name: "new_reg_offs"); | 
|---|
| 970 | CGF.Builder.CreateStore(Val: NewOffset, Addr: reg_offs_p); | 
|---|
| 971 |  | 
|---|
| 972 | // Now we're in a position to decide whether this argument really was in | 
|---|
| 973 | // registers or not. | 
|---|
| 974 | llvm::Value *InRegs = nullptr; | 
|---|
| 975 | InRegs = CGF.Builder.CreateICmpSLE( | 
|---|
| 976 | LHS: NewOffset, RHS: llvm::ConstantInt::get(Ty: CGF.Int32Ty, V: 0), Name: "inreg"); | 
|---|
| 977 |  | 
|---|
| 978 | CGF.Builder.CreateCondBr(Cond: InRegs, True: InRegBlock, False: OnStackBlock); | 
|---|
| 979 |  | 
|---|
| 980 | //======================================= | 
|---|
| 981 | // Argument was in registers | 
|---|
| 982 | //======================================= | 
|---|
| 983 |  | 
|---|
| 984 | // Now we emit the code for if the argument was originally passed in | 
|---|
| 985 | // registers. First start the appropriate block: | 
|---|
| 986 | CGF.EmitBlock(BB: InRegBlock); | 
|---|
| 987 |  | 
|---|
| 988 | llvm::Value *reg_top = nullptr; | 
|---|
| 989 | Address reg_top_p = | 
|---|
| 990 | CGF.Builder.CreateStructGEP(Addr: VAListAddr, Index: reg_top_index, Name: "reg_top_p"); | 
|---|
| 991 | reg_top = CGF.Builder.CreateLoad(Addr: reg_top_p, Name: "reg_top"); | 
|---|
| 992 | Address BaseAddr(CGF.Builder.CreateInBoundsGEP(Ty: CGF.Int8Ty, Ptr: reg_top, IdxList: reg_offs), | 
|---|
| 993 | CGF.Int8Ty, CharUnits::fromQuantity(Quantity: IsFPR ? 16 : 8)); | 
|---|
| 994 | Address RegAddr = Address::invalid(); | 
|---|
| 995 | llvm::Type *MemTy = CGF.ConvertTypeForMem(T: Ty), *ElementTy = MemTy; | 
|---|
| 996 |  | 
|---|
| 997 | if (IsIndirect) { | 
|---|
| 998 | // If it's been passed indirectly (actually a struct), whatever we find from | 
|---|
| 999 | // stored registers or on the stack will actually be a struct **. | 
|---|
| 1000 | MemTy = llvm::PointerType::getUnqual(C&: MemTy->getContext()); | 
|---|
| 1001 | } | 
|---|
| 1002 |  | 
|---|
| 1003 | const Type *Base = nullptr; | 
|---|
| 1004 | uint64_t NumMembers = 0; | 
|---|
| 1005 | bool IsHFA = isHomogeneousAggregate(Ty, Base, Members&: NumMembers); | 
|---|
| 1006 | if (IsHFA && NumMembers > 1) { | 
|---|
| 1007 | // Homogeneous aggregates passed in registers will have their elements split | 
|---|
| 1008 | // and stored 16-bytes apart regardless of size (they're notionally in qN, | 
|---|
| 1009 | // qN+1, ...). We reload and store into a temporary local variable | 
|---|
| 1010 | // contiguously. | 
|---|
| 1011 | assert(!IsIndirect && "Homogeneous aggregates should be passed directly"); | 
|---|
| 1012 | auto BaseTyInfo = getContext().getTypeInfoInChars(T: QualType(Base, 0)); | 
|---|
| 1013 | llvm::Type *BaseTy = CGF.ConvertType(T: QualType(Base, 0)); | 
|---|
| 1014 | llvm::Type *HFATy = llvm::ArrayType::get(ElementType: BaseTy, NumElements: NumMembers); | 
|---|
| 1015 | Address Tmp = CGF.CreateTempAlloca(Ty: HFATy, | 
|---|
| 1016 | align: std::max(a: TyAlign, b: BaseTyInfo.Align)); | 
|---|
| 1017 |  | 
|---|
| 1018 | // On big-endian platforms, the value will be right-aligned in its slot. | 
|---|
| 1019 | int Offset = 0; | 
|---|
| 1020 | if (CGF.CGM.getDataLayout().isBigEndian() && | 
|---|
| 1021 | BaseTyInfo.Width.getQuantity() < 16) | 
|---|
| 1022 | Offset = 16 - BaseTyInfo.Width.getQuantity(); | 
|---|
| 1023 |  | 
|---|
| 1024 | for (unsigned i = 0; i < NumMembers; ++i) { | 
|---|
| 1025 | CharUnits BaseOffset = CharUnits::fromQuantity(Quantity: 16 * i + Offset); | 
|---|
| 1026 | Address LoadAddr = | 
|---|
| 1027 | CGF.Builder.CreateConstInBoundsByteGEP(Addr: BaseAddr, Offset: BaseOffset); | 
|---|
| 1028 | LoadAddr = LoadAddr.withElementType(ElemTy: BaseTy); | 
|---|
| 1029 |  | 
|---|
| 1030 | Address StoreAddr = CGF.Builder.CreateConstArrayGEP(Addr: Tmp, Index: i); | 
|---|
| 1031 |  | 
|---|
| 1032 | llvm::Value *Elem = CGF.Builder.CreateLoad(Addr: LoadAddr); | 
|---|
| 1033 | CGF.Builder.CreateStore(Val: Elem, Addr: StoreAddr); | 
|---|
| 1034 | } | 
|---|
| 1035 |  | 
|---|
| 1036 | RegAddr = Tmp.withElementType(ElemTy: MemTy); | 
|---|
| 1037 | } else { | 
|---|
| 1038 | // Otherwise the object is contiguous in memory. | 
|---|
| 1039 |  | 
|---|
| 1040 | // It might be right-aligned in its slot. | 
|---|
| 1041 | CharUnits SlotSize = BaseAddr.getAlignment(); | 
|---|
| 1042 | if (CGF.CGM.getDataLayout().isBigEndian() && !IsIndirect && | 
|---|
| 1043 | (IsHFA || !isAggregateTypeForABI(T: Ty)) && | 
|---|
| 1044 | TySize < SlotSize) { | 
|---|
| 1045 | CharUnits Offset = SlotSize - TySize; | 
|---|
| 1046 | BaseAddr = CGF.Builder.CreateConstInBoundsByteGEP(Addr: BaseAddr, Offset); | 
|---|
| 1047 | } | 
|---|
| 1048 |  | 
|---|
| 1049 | RegAddr = BaseAddr.withElementType(ElemTy: MemTy); | 
|---|
| 1050 | } | 
|---|
| 1051 |  | 
|---|
| 1052 | CGF.EmitBranch(Block: ContBlock); | 
|---|
| 1053 |  | 
|---|
| 1054 | //======================================= | 
|---|
| 1055 | // Argument was on the stack | 
|---|
| 1056 | //======================================= | 
|---|
| 1057 | CGF.EmitBlock(BB: OnStackBlock); | 
|---|
| 1058 |  | 
|---|
| 1059 | Address stack_p = CGF.Builder.CreateStructGEP(Addr: VAListAddr, Index: 0, Name: "stack_p"); | 
|---|
| 1060 | llvm::Value *OnStackPtr = CGF.Builder.CreateLoad(Addr: stack_p, Name: "stack"); | 
|---|
| 1061 |  | 
|---|
| 1062 | // Again, stack arguments may need realignment. In this case both integer and | 
|---|
| 1063 | // floating-point ones might be affected. | 
|---|
| 1064 | if (!IsIndirect && TyAlign.getQuantity() > 8) { | 
|---|
| 1065 | OnStackPtr = emitRoundPointerUpToAlignment(CGF, Ptr: OnStackPtr, Align: TyAlign); | 
|---|
| 1066 | } | 
|---|
| 1067 | Address OnStackAddr = Address(OnStackPtr, CGF.Int8Ty, | 
|---|
| 1068 | std::max(a: CharUnits::fromQuantity(Quantity: 8), b: TyAlign)); | 
|---|
| 1069 |  | 
|---|
| 1070 | // All stack slots are multiples of 8 bytes. | 
|---|
| 1071 | CharUnits StackSlotSize = CharUnits::fromQuantity(Quantity: 8); | 
|---|
| 1072 | CharUnits StackSize; | 
|---|
| 1073 | if (IsIndirect) | 
|---|
| 1074 | StackSize = StackSlotSize; | 
|---|
| 1075 | else | 
|---|
| 1076 | StackSize = TySize.alignTo(Align: StackSlotSize); | 
|---|
| 1077 |  | 
|---|
| 1078 | llvm::Value *StackSizeC = CGF.Builder.getSize(N: StackSize); | 
|---|
| 1079 | llvm::Value *NewStack = CGF.Builder.CreateInBoundsGEP( | 
|---|
| 1080 | Ty: CGF.Int8Ty, Ptr: OnStackPtr, IdxList: StackSizeC, Name: "new_stack"); | 
|---|
| 1081 |  | 
|---|
| 1082 | // Write the new value of __stack for the next call to va_arg | 
|---|
| 1083 | CGF.Builder.CreateStore(Val: NewStack, Addr: stack_p); | 
|---|
| 1084 |  | 
|---|
| 1085 | if (CGF.CGM.getDataLayout().isBigEndian() && !isAggregateTypeForABI(T: Ty) && | 
|---|
| 1086 | TySize < StackSlotSize) { | 
|---|
| 1087 | CharUnits Offset = StackSlotSize - TySize; | 
|---|
| 1088 | OnStackAddr = CGF.Builder.CreateConstInBoundsByteGEP(Addr: OnStackAddr, Offset); | 
|---|
| 1089 | } | 
|---|
| 1090 |  | 
|---|
| 1091 | OnStackAddr = OnStackAddr.withElementType(ElemTy: MemTy); | 
|---|
| 1092 |  | 
|---|
| 1093 | CGF.EmitBranch(Block: ContBlock); | 
|---|
| 1094 |  | 
|---|
| 1095 | //======================================= | 
|---|
| 1096 | // Tidy up | 
|---|
| 1097 | //======================================= | 
|---|
| 1098 | CGF.EmitBlock(BB: ContBlock); | 
|---|
| 1099 |  | 
|---|
| 1100 | Address ResAddr = emitMergePHI(CGF, Addr1: RegAddr, Block1: InRegBlock, Addr2: OnStackAddr, | 
|---|
| 1101 | Block2: OnStackBlock, Name: "vaargs.addr"); | 
|---|
| 1102 |  | 
|---|
| 1103 | if (IsIndirect) | 
|---|
| 1104 | return CGF.EmitLoadOfAnyValue( | 
|---|
| 1105 | V: CGF.MakeAddrLValue( | 
|---|
| 1106 | Addr: Address(CGF.Builder.CreateLoad(Addr: ResAddr, Name: "vaarg.addr"), ElementTy, | 
|---|
| 1107 | TyAlign), | 
|---|
| 1108 | T: Ty), | 
|---|
| 1109 | Slot); | 
|---|
| 1110 |  | 
|---|
| 1111 | return CGF.EmitLoadOfAnyValue(V: CGF.MakeAddrLValue(Addr: ResAddr, T: Ty), Slot); | 
|---|
| 1112 | } | 
|---|
| 1113 |  | 
|---|
| 1114 | RValue AArch64ABIInfo::EmitDarwinVAArg(Address VAListAddr, QualType Ty, | 
|---|
| 1115 | CodeGenFunction &CGF, | 
|---|
| 1116 | AggValueSlot Slot) const { | 
|---|
| 1117 | // The backend's lowering doesn't support va_arg for aggregates or | 
|---|
| 1118 | // illegal vector types.  Lower VAArg here for these cases and use | 
|---|
| 1119 | // the LLVM va_arg instruction for everything else. | 
|---|
| 1120 | if (!isAggregateTypeForABI(T: Ty) && !isIllegalVectorType(Ty)) | 
|---|
| 1121 | return CGF.EmitLoadOfAnyValue( | 
|---|
| 1122 | V: CGF.MakeAddrLValue( | 
|---|
| 1123 | Addr: EmitVAArgInstr(CGF, VAListAddr, Ty, AI: ABIArgInfo::getDirect()), T: Ty), | 
|---|
| 1124 | Slot); | 
|---|
| 1125 |  | 
|---|
| 1126 | uint64_t PointerSize = getTarget().getPointerWidth(AddrSpace: LangAS::Default) / 8; | 
|---|
| 1127 | CharUnits SlotSize = CharUnits::fromQuantity(Quantity: PointerSize); | 
|---|
| 1128 |  | 
|---|
| 1129 | // Empty records are ignored for parameter passing purposes. | 
|---|
| 1130 | if (isEmptyRecord(Context&: getContext(), T: Ty, AllowArrays: true)) | 
|---|
| 1131 | return Slot.asRValue(); | 
|---|
| 1132 |  | 
|---|
| 1133 | // The size of the actual thing passed, which might end up just | 
|---|
| 1134 | // being a pointer for indirect types. | 
|---|
| 1135 | auto TyInfo = getContext().getTypeInfoInChars(T: Ty); | 
|---|
| 1136 |  | 
|---|
| 1137 | // Arguments bigger than 16 bytes which aren't homogeneous | 
|---|
| 1138 | // aggregates should be passed indirectly. | 
|---|
| 1139 | bool IsIndirect = false; | 
|---|
| 1140 | if (TyInfo.Width.getQuantity() > 16) { | 
|---|
| 1141 | const Type *Base = nullptr; | 
|---|
| 1142 | uint64_t Members = 0; | 
|---|
| 1143 | IsIndirect = !isHomogeneousAggregate(Ty, Base, Members); | 
|---|
| 1144 | } | 
|---|
| 1145 |  | 
|---|
| 1146 | return emitVoidPtrVAArg(CGF, VAListAddr, ValueTy: Ty, IsIndirect, ValueInfo: TyInfo, SlotSizeAndAlign: SlotSize, | 
|---|
| 1147 | /*AllowHigherAlign*/ true, Slot); | 
|---|
| 1148 | } | 
|---|
| 1149 |  | 
|---|
| 1150 | RValue AArch64ABIInfo::EmitMSVAArg(CodeGenFunction &CGF, Address VAListAddr, | 
|---|
| 1151 | QualType Ty, AggValueSlot Slot) const { | 
|---|
| 1152 | bool IsIndirect = false; | 
|---|
| 1153 |  | 
|---|
| 1154 | // Composites larger than 16 bytes are passed by reference. | 
|---|
| 1155 | if (isAggregateTypeForABI(T: Ty) && getContext().getTypeSize(T: Ty) > 128) | 
|---|
| 1156 | IsIndirect = true; | 
|---|
| 1157 |  | 
|---|
| 1158 | return emitVoidPtrVAArg(CGF, VAListAddr, ValueTy: Ty, IsIndirect, | 
|---|
| 1159 | ValueInfo: CGF.getContext().getTypeInfoInChars(T: Ty), | 
|---|
| 1160 | SlotSizeAndAlign: CharUnits::fromQuantity(Quantity: 8), | 
|---|
| 1161 | /*allowHigherAlign*/ AllowHigherAlign: false, Slot); | 
|---|
| 1162 | } | 
|---|
| 1163 |  | 
|---|
| 1164 | static bool isStreamingCompatible(const FunctionDecl *F) { | 
|---|
| 1165 | if (const auto *T = F->getType()->getAs<FunctionProtoType>()) | 
|---|
| 1166 | return T->getAArch64SMEAttributes() & | 
|---|
| 1167 | FunctionType::SME_PStateSMCompatibleMask; | 
|---|
| 1168 | return false; | 
|---|
| 1169 | } | 
|---|
| 1170 |  | 
|---|
| 1171 | // Report an error if an argument or return value of type Ty would need to be | 
|---|
| 1172 | // passed in a floating-point register. | 
|---|
| 1173 | static void diagnoseIfNeedsFPReg(DiagnosticsEngine &Diags, | 
|---|
| 1174 | const StringRef ABIName, | 
|---|
| 1175 | const AArch64ABIInfo &ABIInfo, | 
|---|
| 1176 | const QualType &Ty, const NamedDecl *D, | 
|---|
| 1177 | SourceLocation loc) { | 
|---|
| 1178 | const Type *HABase = nullptr; | 
|---|
| 1179 | uint64_t HAMembers = 0; | 
|---|
| 1180 | if (Ty->isFloatingType() || Ty->isVectorType() || | 
|---|
| 1181 | ABIInfo.isHomogeneousAggregate(Ty, Base&: HABase, Members&: HAMembers)) { | 
|---|
| 1182 | Diags.Report(Loc: loc, DiagID: diag::err_target_unsupported_type_for_abi) | 
|---|
| 1183 | << D->getDeclName() << Ty << ABIName; | 
|---|
| 1184 | } | 
|---|
| 1185 | } | 
|---|
| 1186 |  | 
|---|
| 1187 | // If we are using a hard-float ABI, but do not have floating point registers, | 
|---|
| 1188 | // then report an error for any function arguments or returns which would be | 
|---|
| 1189 | // passed in floating-pint registers. | 
|---|
| 1190 | void AArch64TargetCodeGenInfo::checkFunctionABI( | 
|---|
| 1191 | CodeGenModule &CGM, const FunctionDecl *FuncDecl) const { | 
|---|
| 1192 | const AArch64ABIInfo &ABIInfo = getABIInfo<AArch64ABIInfo>(); | 
|---|
| 1193 | const TargetInfo &TI = ABIInfo.getContext().getTargetInfo(); | 
|---|
| 1194 |  | 
|---|
| 1195 | if (!TI.hasFeature(Feature: "fp") && !ABIInfo.isSoftFloat()) { | 
|---|
| 1196 | diagnoseIfNeedsFPReg(Diags&: CGM.getDiags(), ABIName: TI.getABI(), ABIInfo, | 
|---|
| 1197 | Ty: FuncDecl->getReturnType(), D: FuncDecl, | 
|---|
| 1198 | loc: FuncDecl->getLocation()); | 
|---|
| 1199 | for (ParmVarDecl *PVD : FuncDecl->parameters()) { | 
|---|
| 1200 | diagnoseIfNeedsFPReg(Diags&: CGM.getDiags(), ABIName: TI.getABI(), ABIInfo, Ty: PVD->getType(), | 
|---|
| 1201 | D: PVD, loc: FuncDecl->getLocation()); | 
|---|
| 1202 | } | 
|---|
| 1203 | } | 
|---|
| 1204 | } | 
|---|
| 1205 |  | 
|---|
| 1206 | enum class ArmSMEInlinability : uint8_t { | 
|---|
| 1207 | Ok = 0, | 
|---|
| 1208 | ErrorCalleeRequiresNewZA = 1 << 0, | 
|---|
| 1209 | ErrorCalleeRequiresNewZT0 = 1 << 1, | 
|---|
| 1210 | WarnIncompatibleStreamingModes = 1 << 2, | 
|---|
| 1211 | ErrorIncompatibleStreamingModes = 1 << 3, | 
|---|
| 1212 |  | 
|---|
| 1213 | IncompatibleStreamingModes = | 
|---|
| 1214 | WarnIncompatibleStreamingModes | ErrorIncompatibleStreamingModes, | 
|---|
| 1215 |  | 
|---|
| 1216 | LLVM_MARK_AS_BITMASK_ENUM(/*LargestValue=*/ErrorIncompatibleStreamingModes), | 
|---|
| 1217 | }; | 
|---|
| 1218 |  | 
|---|
| 1219 | /// Determines if there are any Arm SME ABI issues with inlining \p Callee into | 
|---|
| 1220 | /// \p Caller. Returns the issue (if any) in the ArmSMEInlinability bit enum. | 
|---|
| 1221 | static ArmSMEInlinability GetArmSMEInlinability(const FunctionDecl *Caller, | 
|---|
| 1222 | const FunctionDecl *Callee) { | 
|---|
| 1223 | bool CallerIsStreaming = | 
|---|
| 1224 | IsArmStreamingFunction(FD: Caller, /*IncludeLocallyStreaming=*/true); | 
|---|
| 1225 | bool CalleeIsStreaming = | 
|---|
| 1226 | IsArmStreamingFunction(FD: Callee, /*IncludeLocallyStreaming=*/true); | 
|---|
| 1227 | bool CallerIsStreamingCompatible = isStreamingCompatible(F: Caller); | 
|---|
| 1228 | bool CalleeIsStreamingCompatible = isStreamingCompatible(F: Callee); | 
|---|
| 1229 |  | 
|---|
| 1230 | ArmSMEInlinability Inlinability = ArmSMEInlinability::Ok; | 
|---|
| 1231 |  | 
|---|
| 1232 | if (!CalleeIsStreamingCompatible && | 
|---|
| 1233 | (CallerIsStreaming != CalleeIsStreaming || CallerIsStreamingCompatible)) { | 
|---|
| 1234 | if (CalleeIsStreaming) | 
|---|
| 1235 | Inlinability |= ArmSMEInlinability::ErrorIncompatibleStreamingModes; | 
|---|
| 1236 | else | 
|---|
| 1237 | Inlinability |= ArmSMEInlinability::WarnIncompatibleStreamingModes; | 
|---|
| 1238 | } | 
|---|
| 1239 | if (auto *NewAttr = Callee->getAttr<ArmNewAttr>()) { | 
|---|
| 1240 | if (NewAttr->isNewZA()) | 
|---|
| 1241 | Inlinability |= ArmSMEInlinability::ErrorCalleeRequiresNewZA; | 
|---|
| 1242 | if (NewAttr->isNewZT0()) | 
|---|
| 1243 | Inlinability |= ArmSMEInlinability::ErrorCalleeRequiresNewZT0; | 
|---|
| 1244 | } | 
|---|
| 1245 |  | 
|---|
| 1246 | return Inlinability; | 
|---|
| 1247 | } | 
|---|
| 1248 |  | 
|---|
| 1249 | void AArch64TargetCodeGenInfo::checkFunctionCallABIStreaming( | 
|---|
| 1250 | CodeGenModule &CGM, SourceLocation CallLoc, const FunctionDecl *Caller, | 
|---|
| 1251 | const FunctionDecl *Callee) const { | 
|---|
| 1252 | if (!Caller || !Callee || !Callee->hasAttr<AlwaysInlineAttr>()) | 
|---|
| 1253 | return; | 
|---|
| 1254 |  | 
|---|
| 1255 | ArmSMEInlinability Inlinability = GetArmSMEInlinability(Caller, Callee); | 
|---|
| 1256 |  | 
|---|
| 1257 | if ((Inlinability & ArmSMEInlinability::IncompatibleStreamingModes) != | 
|---|
| 1258 | ArmSMEInlinability::Ok) | 
|---|
| 1259 | CGM.getDiags().Report( | 
|---|
| 1260 | Loc: CallLoc, | 
|---|
| 1261 | DiagID: (Inlinability & ArmSMEInlinability::ErrorIncompatibleStreamingModes) == | 
|---|
| 1262 | ArmSMEInlinability::ErrorIncompatibleStreamingModes | 
|---|
| 1263 | ? diag::err_function_always_inline_attribute_mismatch | 
|---|
| 1264 | : diag::warn_function_always_inline_attribute_mismatch) | 
|---|
| 1265 | << Caller->getDeclName() << Callee->getDeclName() << "streaming"; | 
|---|
| 1266 |  | 
|---|
| 1267 | if ((Inlinability & ArmSMEInlinability::ErrorCalleeRequiresNewZA) == | 
|---|
| 1268 | ArmSMEInlinability::ErrorCalleeRequiresNewZA) | 
|---|
| 1269 | CGM.getDiags().Report(Loc: CallLoc, DiagID: diag::err_function_always_inline_new_za) | 
|---|
| 1270 | << Callee->getDeclName(); | 
|---|
| 1271 |  | 
|---|
| 1272 | if ((Inlinability & ArmSMEInlinability::ErrorCalleeRequiresNewZT0) == | 
|---|
| 1273 | ArmSMEInlinability::ErrorCalleeRequiresNewZT0) | 
|---|
| 1274 | CGM.getDiags().Report(Loc: CallLoc, DiagID: diag::err_function_always_inline_new_zt0) | 
|---|
| 1275 | << Callee->getDeclName(); | 
|---|
| 1276 | } | 
|---|
| 1277 |  | 
|---|
| 1278 | // If the target does not have floating-point registers, but we are using a | 
|---|
| 1279 | // hard-float ABI, there is no way to pass floating-point, vector or HFA values | 
|---|
| 1280 | // to functions, so we report an error. | 
|---|
| 1281 | void AArch64TargetCodeGenInfo::checkFunctionCallABISoftFloat( | 
|---|
| 1282 | CodeGenModule &CGM, SourceLocation CallLoc, const FunctionDecl *Caller, | 
|---|
| 1283 | const FunctionDecl *Callee, const CallArgList &Args, | 
|---|
| 1284 | QualType ReturnType) const { | 
|---|
| 1285 | const AArch64ABIInfo &ABIInfo = getABIInfo<AArch64ABIInfo>(); | 
|---|
| 1286 | const TargetInfo &TI = ABIInfo.getContext().getTargetInfo(); | 
|---|
| 1287 |  | 
|---|
| 1288 | if (!Caller || TI.hasFeature(Feature: "fp") || ABIInfo.isSoftFloat()) | 
|---|
| 1289 | return; | 
|---|
| 1290 |  | 
|---|
| 1291 | diagnoseIfNeedsFPReg(Diags&: CGM.getDiags(), ABIName: TI.getABI(), ABIInfo, Ty: ReturnType, | 
|---|
| 1292 | D: Callee ? Callee : Caller, loc: CallLoc); | 
|---|
| 1293 |  | 
|---|
| 1294 | for (const CallArg &Arg : Args) | 
|---|
| 1295 | diagnoseIfNeedsFPReg(Diags&: CGM.getDiags(), ABIName: TI.getABI(), ABIInfo, Ty: Arg.getType(), | 
|---|
| 1296 | D: Callee ? Callee : Caller, loc: CallLoc); | 
|---|
| 1297 | } | 
|---|
| 1298 |  | 
|---|
| 1299 | void AArch64TargetCodeGenInfo::checkFunctionCallABI(CodeGenModule &CGM, | 
|---|
| 1300 | SourceLocation CallLoc, | 
|---|
| 1301 | const FunctionDecl *Caller, | 
|---|
| 1302 | const FunctionDecl *Callee, | 
|---|
| 1303 | const CallArgList &Args, | 
|---|
| 1304 | QualType ReturnType) const { | 
|---|
| 1305 | checkFunctionCallABIStreaming(CGM, CallLoc, Caller, Callee); | 
|---|
| 1306 | checkFunctionCallABISoftFloat(CGM, CallLoc, Caller, Callee, Args, ReturnType); | 
|---|
| 1307 | } | 
|---|
| 1308 |  | 
|---|
| 1309 | bool AArch64TargetCodeGenInfo::wouldInliningViolateFunctionCallABI( | 
|---|
| 1310 | const FunctionDecl *Caller, const FunctionDecl *Callee) const { | 
|---|
| 1311 | return Caller && Callee && | 
|---|
| 1312 | GetArmSMEInlinability(Caller, Callee) != ArmSMEInlinability::Ok; | 
|---|
| 1313 | } | 
|---|
| 1314 |  | 
|---|
| 1315 | void AArch64ABIInfo::appendAttributeMangling(TargetClonesAttr *Attr, | 
|---|
| 1316 | unsigned Index, | 
|---|
| 1317 | raw_ostream &Out) const { | 
|---|
| 1318 | appendAttributeMangling(AttrStr: Attr->getFeatureStr(Index), Out); | 
|---|
| 1319 | } | 
|---|
| 1320 |  | 
|---|
| 1321 | void AArch64ABIInfo::appendAttributeMangling(StringRef AttrStr, | 
|---|
| 1322 | raw_ostream &Out) const { | 
|---|
| 1323 | if (AttrStr == "default") { | 
|---|
| 1324 | Out << ".default"; | 
|---|
| 1325 | return; | 
|---|
| 1326 | } | 
|---|
| 1327 |  | 
|---|
| 1328 | Out << "._"; | 
|---|
| 1329 | SmallVector<StringRef, 8> Features; | 
|---|
| 1330 | AttrStr.split(A&: Features, Separator: "+"); | 
|---|
| 1331 | for (auto &Feat : Features) | 
|---|
| 1332 | Feat = Feat.trim(); | 
|---|
| 1333 |  | 
|---|
| 1334 | llvm::sort(C&: Features, Comp: [](const StringRef LHS, const StringRef RHS) { | 
|---|
| 1335 | return LHS.compare(RHS) < 0; | 
|---|
| 1336 | }); | 
|---|
| 1337 |  | 
|---|
| 1338 | llvm::SmallDenseSet<StringRef, 8> UniqueFeats; | 
|---|
| 1339 | for (auto &Feat : Features) | 
|---|
| 1340 | if (auto Ext = llvm::AArch64::parseFMVExtension(Extension: Feat)) | 
|---|
| 1341 | if (UniqueFeats.insert(V: Ext->Name).second) | 
|---|
| 1342 | Out << 'M' << Ext->Name; | 
|---|
| 1343 | } | 
|---|
| 1344 |  | 
|---|
| 1345 | std::unique_ptr<TargetCodeGenInfo> | 
|---|
| 1346 | CodeGen::createAArch64TargetCodeGenInfo(CodeGenModule &CGM, | 
|---|
| 1347 | AArch64ABIKind Kind) { | 
|---|
| 1348 | return std::make_unique<AArch64TargetCodeGenInfo>(args&: CGM.getTypes(), args&: Kind); | 
|---|
| 1349 | } | 
|---|
| 1350 |  | 
|---|
| 1351 | std::unique_ptr<TargetCodeGenInfo> | 
|---|
| 1352 | CodeGen::createWindowsAArch64TargetCodeGenInfo(CodeGenModule &CGM, | 
|---|
| 1353 | AArch64ABIKind K) { | 
|---|
| 1354 | return std::make_unique<WindowsAArch64TargetCodeGenInfo>(args&: CGM.getTypes(), args&: K); | 
|---|
| 1355 | } | 
|---|
| 1356 |  | 
|---|