1//===---- CGBuiltin.cpp - Emit LLVM Code for builtins ---------------------===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8//
9// This contains code to emit Builtin calls as LLVM code.
10//
11//===----------------------------------------------------------------------===//
12
13#include "CGBuiltin.h"
14#include "ABIInfo.h"
15#include "CGCUDARuntime.h"
16#include "CGCXXABI.h"
17#include "CGDebugInfo.h"
18#include "CGObjCRuntime.h"
19#include "CGOpenCLRuntime.h"
20#include "CGRecordLayout.h"
21#include "CGValue.h"
22#include "CodeGenFunction.h"
23#include "CodeGenModule.h"
24#include "ConstantEmitter.h"
25#include "PatternInit.h"
26#include "TargetInfo.h"
27#include "clang/AST/OSLog.h"
28#include "clang/AST/StmtVisitor.h"
29#include "clang/Basic/DiagnosticFrontend.h"
30#include "clang/Basic/TargetInfo.h"
31#include "llvm/ADT/APFloat.h"
32#include "llvm/IR/InlineAsm.h"
33#include "llvm/IR/Instruction.h"
34#include "llvm/IR/Intrinsics.h"
35#include "llvm/IR/IntrinsicsX86.h"
36#include "llvm/IR/MatrixBuilder.h"
37#include "llvm/Support/ConvertUTF.h"
38#include "llvm/Support/ScopedPrinter.h"
39#include <algorithm>
40#include <optional>
41#include <utility>
42
43using namespace clang;
44using namespace CodeGen;
45using namespace llvm;
46
47/// Some builtins do not have library implementation on some targets and
48/// are instead emitted as LLVM IRs by some target builtin emitters.
49/// FIXME: Remove this when library support is added
50static bool shouldEmitBuiltinAsIR(unsigned BuiltinID,
51 const Builtin::Context &BI,
52 const CodeGenFunction &CGF) {
53 if (!CGF.CGM.getLangOpts().MathErrno &&
54 CGF.CurFPFeatures.getExceptionMode() ==
55 LangOptions::FPExceptionModeKind::FPE_Ignore &&
56 !CGF.CGM.getTargetCodeGenInfo().supportsLibCall()) {
57 switch (BuiltinID) {
58 default:
59 return false;
60 case Builtin::BIlogbf:
61 case Builtin::BI__builtin_logbf:
62 case Builtin::BIlogb:
63 case Builtin::BI__builtin_logb:
64 case Builtin::BIscalbnf:
65 case Builtin::BI__builtin_scalbnf:
66 case Builtin::BIscalbn:
67 case Builtin::BI__builtin_scalbn:
68 return true;
69 }
70 }
71 return false;
72}
73
74static Value *EmitTargetArchBuiltinExpr(CodeGenFunction *CGF,
75 unsigned BuiltinID, const CallExpr *E,
76 ReturnValueSlot ReturnValue,
77 llvm::Triple::ArchType Arch) {
78 // When compiling in HipStdPar mode we have to be conservative in rejecting
79 // target specific features in the FE, and defer the possible error to the
80 // AcceleratorCodeSelection pass, wherein iff an unsupported target builtin is
81 // referenced by an accelerator executable function, we emit an error.
82 // Returning nullptr here leads to the builtin being handled in
83 // EmitStdParUnsupportedBuiltin.
84 if (CGF->getLangOpts().HIPStdPar && CGF->getLangOpts().CUDAIsDevice &&
85 Arch != CGF->getTarget().getTriple().getArch())
86 return nullptr;
87
88 switch (Arch) {
89 case llvm::Triple::arm:
90 case llvm::Triple::armeb:
91 case llvm::Triple::thumb:
92 case llvm::Triple::thumbeb:
93 return CGF->EmitARMBuiltinExpr(BuiltinID, E, ReturnValue, Arch);
94 case llvm::Triple::aarch64:
95 case llvm::Triple::aarch64_32:
96 case llvm::Triple::aarch64_be:
97 return CGF->EmitAArch64BuiltinExpr(BuiltinID, E, Arch);
98 case llvm::Triple::bpfeb:
99 case llvm::Triple::bpfel:
100 return CGF->EmitBPFBuiltinExpr(BuiltinID, E);
101 case llvm::Triple::dxil:
102 return CGF->EmitDirectXBuiltinExpr(BuiltinID, E);
103 case llvm::Triple::x86:
104 case llvm::Triple::x86_64:
105 return CGF->EmitX86BuiltinExpr(BuiltinID, E);
106 case llvm::Triple::ppc:
107 case llvm::Triple::ppcle:
108 case llvm::Triple::ppc64:
109 case llvm::Triple::ppc64le:
110 return CGF->EmitPPCBuiltinExpr(BuiltinID, E);
111 case llvm::Triple::r600:
112 case llvm::Triple::amdgcn:
113 return CGF->EmitAMDGPUBuiltinExpr(BuiltinID, E);
114 case llvm::Triple::systemz:
115 return CGF->EmitSystemZBuiltinExpr(BuiltinID, E);
116 case llvm::Triple::nvptx:
117 case llvm::Triple::nvptx64:
118 return CGF->EmitNVPTXBuiltinExpr(BuiltinID, E);
119 case llvm::Triple::wasm32:
120 case llvm::Triple::wasm64:
121 return CGF->EmitWebAssemblyBuiltinExpr(BuiltinID, E);
122 case llvm::Triple::hexagon:
123 return CGF->EmitHexagonBuiltinExpr(BuiltinID, E);
124 case llvm::Triple::riscv32:
125 case llvm::Triple::riscv64:
126 case llvm::Triple::riscv32be:
127 case llvm::Triple::riscv64be:
128 return CGF->EmitRISCVBuiltinExpr(BuiltinID, E, ReturnValue);
129 case llvm::Triple::spirv32:
130 case llvm::Triple::spirv64:
131 if (CGF->getTarget().getTriple().getOS() == llvm::Triple::OSType::AMDHSA)
132 return CGF->EmitAMDGPUBuiltinExpr(BuiltinID, E);
133 [[fallthrough]];
134 case llvm::Triple::spirv:
135 return CGF->EmitSPIRVBuiltinExpr(BuiltinID, E);
136 case llvm::Triple::avr:
137 return CGF->EmitAVRBuiltinExpr(BuiltinID, E);
138 default:
139 return nullptr;
140 }
141}
142
143Value *CodeGenFunction::EmitTargetBuiltinExpr(unsigned BuiltinID,
144 const CallExpr *E,
145 ReturnValueSlot ReturnValue) {
146 if (getContext().BuiltinInfo.isAuxBuiltinID(ID: BuiltinID)) {
147 assert(getContext().getAuxTargetInfo() && "Missing aux target info");
148 return EmitTargetArchBuiltinExpr(
149 CGF: this, BuiltinID: getContext().BuiltinInfo.getAuxBuiltinID(ID: BuiltinID), E,
150 ReturnValue, Arch: getContext().getAuxTargetInfo()->getTriple().getArch());
151 }
152
153 return EmitTargetArchBuiltinExpr(CGF: this, BuiltinID, E, ReturnValue,
154 Arch: getTarget().getTriple().getArch());
155}
156
157static void initializeAlloca(CodeGenFunction &CGF, AllocaInst *AI, Value *Size,
158 Align AlignmentInBytes) {
159 ConstantInt *Byte;
160 switch (CGF.getLangOpts().getTrivialAutoVarInit()) {
161 case LangOptions::TrivialAutoVarInitKind::Uninitialized:
162 // Nothing to initialize.
163 return;
164 case LangOptions::TrivialAutoVarInitKind::Zero:
165 Byte = CGF.Builder.getInt8(C: 0x00);
166 break;
167 case LangOptions::TrivialAutoVarInitKind::Pattern: {
168 llvm::Type *Int8 = llvm::IntegerType::getInt8Ty(C&: CGF.CGM.getLLVMContext());
169 Byte = llvm::dyn_cast<llvm::ConstantInt>(
170 Val: initializationPatternFor(CGF.CGM, Int8));
171 break;
172 }
173 }
174 if (CGF.CGM.stopAutoInit())
175 return;
176 auto *I = CGF.Builder.CreateMemSet(Ptr: AI, Val: Byte, Size, Align: AlignmentInBytes);
177 I->addAnnotationMetadata(Annotation: "auto-init");
178}
179
180/// getBuiltinLibFunction - Given a builtin id for a function like
181/// "__builtin_fabsf", return a Function* for "fabsf".
182llvm::Constant *CodeGenModule::getBuiltinLibFunction(const FunctionDecl *FD,
183 unsigned BuiltinID) {
184 assert(Context.BuiltinInfo.isLibFunction(BuiltinID));
185
186 // Get the name, skip over the __builtin_ prefix (if necessary). We may have
187 // to build this up so provide a small stack buffer to handle the vast
188 // majority of names.
189 llvm::SmallString<64> Name;
190 GlobalDecl D(FD);
191
192 // TODO: This list should be expanded or refactored after all GCC-compatible
193 // std libcall builtins are implemented.
194 static const SmallDenseMap<unsigned, StringRef, 64> F128Builtins{
195 {Builtin::BI__builtin___fprintf_chk, "__fprintf_chkieee128"},
196 {Builtin::BI__builtin___printf_chk, "__printf_chkieee128"},
197 {Builtin::BI__builtin___snprintf_chk, "__snprintf_chkieee128"},
198 {Builtin::BI__builtin___sprintf_chk, "__sprintf_chkieee128"},
199 {Builtin::BI__builtin___vfprintf_chk, "__vfprintf_chkieee128"},
200 {Builtin::BI__builtin___vprintf_chk, "__vprintf_chkieee128"},
201 {Builtin::BI__builtin___vsnprintf_chk, "__vsnprintf_chkieee128"},
202 {Builtin::BI__builtin___vsprintf_chk, "__vsprintf_chkieee128"},
203 {Builtin::BI__builtin_fprintf, "__fprintfieee128"},
204 {Builtin::BI__builtin_printf, "__printfieee128"},
205 {Builtin::BI__builtin_snprintf, "__snprintfieee128"},
206 {Builtin::BI__builtin_sprintf, "__sprintfieee128"},
207 {Builtin::BI__builtin_vfprintf, "__vfprintfieee128"},
208 {Builtin::BI__builtin_vprintf, "__vprintfieee128"},
209 {Builtin::BI__builtin_vsnprintf, "__vsnprintfieee128"},
210 {Builtin::BI__builtin_vsprintf, "__vsprintfieee128"},
211 {Builtin::BI__builtin_fscanf, "__fscanfieee128"},
212 {Builtin::BI__builtin_scanf, "__scanfieee128"},
213 {Builtin::BI__builtin_sscanf, "__sscanfieee128"},
214 {Builtin::BI__builtin_vfscanf, "__vfscanfieee128"},
215 {Builtin::BI__builtin_vscanf, "__vscanfieee128"},
216 {Builtin::BI__builtin_vsscanf, "__vsscanfieee128"},
217 {Builtin::BI__builtin_nexttowardf128, "__nexttowardieee128"},
218 };
219
220 // The AIX library functions frexpl, ldexpl, and modfl are for 128-bit
221 // IBM 'long double' (i.e. __ibm128). Map to the 'double' versions
222 // if it is 64-bit 'long double' mode.
223 static const SmallDenseMap<unsigned, StringRef, 4> AIXLongDouble64Builtins{
224 {Builtin::BI__builtin_frexpl, "frexp"},
225 {Builtin::BI__builtin_ldexpl, "ldexp"},
226 {Builtin::BI__builtin_modfl, "modf"},
227 };
228
229 // If the builtin has been declared explicitly with an assembler label,
230 // use the mangled name. This differs from the plain label on platforms
231 // that prefix labels.
232 if (FD->hasAttr<AsmLabelAttr>())
233 Name = getMangledName(GD: D);
234 else {
235 // TODO: This mutation should also be applied to other targets other than
236 // PPC, after backend supports IEEE 128-bit style libcalls.
237 if (getTriple().isPPC64() &&
238 &getTarget().getLongDoubleFormat() == &llvm::APFloat::IEEEquad() &&
239 F128Builtins.contains(Val: BuiltinID))
240 Name = F128Builtins.lookup(Val: BuiltinID);
241 else if (getTriple().isOSAIX() &&
242 &getTarget().getLongDoubleFormat() ==
243 &llvm::APFloat::IEEEdouble() &&
244 AIXLongDouble64Builtins.contains(Val: BuiltinID))
245 Name = AIXLongDouble64Builtins.lookup(Val: BuiltinID);
246 else
247 Name = Context.BuiltinInfo.getName(ID: BuiltinID).substr(pos: 10);
248 }
249
250 llvm::FunctionType *Ty =
251 cast<llvm::FunctionType>(Val: getTypes().ConvertType(T: FD->getType()));
252
253 return GetOrCreateLLVMFunction(MangledName: Name, Ty, D, /*ForVTable=*/false);
254}
255
256/// Emit the conversions required to turn the given value into an
257/// integer of the given size.
258Value *EmitToInt(CodeGenFunction &CGF, llvm::Value *V,
259 QualType T, llvm::IntegerType *IntType) {
260 V = CGF.EmitToMemory(Value: V, Ty: T);
261
262 if (V->getType()->isPointerTy())
263 return CGF.Builder.CreatePtrToInt(V, DestTy: IntType);
264
265 assert(V->getType() == IntType);
266 return V;
267}
268
269Value *EmitFromInt(CodeGenFunction &CGF, llvm::Value *V,
270 QualType T, llvm::Type *ResultType) {
271 V = CGF.EmitFromMemory(Value: V, Ty: T);
272
273 if (ResultType->isPointerTy())
274 return CGF.Builder.CreateIntToPtr(V, DestTy: ResultType);
275
276 assert(V->getType() == ResultType);
277 return V;
278}
279
280Address CheckAtomicAlignment(CodeGenFunction &CGF, const CallExpr *E) {
281 ASTContext &Ctx = CGF.getContext();
282 Address Ptr = CGF.EmitPointerWithAlignment(Addr: E->getArg(Arg: 0));
283 const llvm::DataLayout &DL = CGF.CGM.getDataLayout();
284 unsigned Bytes = Ptr.getElementType()->isPointerTy()
285 ? Ctx.getTypeSizeInChars(T: Ctx.VoidPtrTy).getQuantity()
286 : DL.getTypeStoreSize(Ty: Ptr.getElementType());
287 unsigned Align = Ptr.getAlignment().getQuantity();
288 if (Align % Bytes != 0) {
289 DiagnosticsEngine &Diags = CGF.CGM.getDiags();
290 Diags.Report(Loc: E->getBeginLoc(), DiagID: diag::warn_sync_op_misaligned);
291 // Force address to be at least naturally-aligned.
292 return Ptr.withAlignment(NewAlignment: CharUnits::fromQuantity(Quantity: Bytes));
293 }
294 return Ptr;
295}
296
297/// Utility to insert an atomic instruction based on Intrinsic::ID
298/// and the expression node.
299Value *MakeBinaryAtomicValue(
300 CodeGenFunction &CGF, llvm::AtomicRMWInst::BinOp Kind, const CallExpr *E,
301 AtomicOrdering Ordering) {
302
303 QualType T = E->getType();
304 assert(E->getArg(0)->getType()->isPointerType());
305 assert(CGF.getContext().hasSameUnqualifiedType(T,
306 E->getArg(0)->getType()->getPointeeType()));
307 assert(CGF.getContext().hasSameUnqualifiedType(T, E->getArg(1)->getType()));
308
309 Address DestAddr = CheckAtomicAlignment(CGF, E);
310
311 llvm::IntegerType *IntType = llvm::IntegerType::get(
312 C&: CGF.getLLVMContext(), NumBits: CGF.getContext().getTypeSize(T));
313
314 llvm::Value *Val = CGF.EmitScalarExpr(E: E->getArg(Arg: 1));
315 llvm::Type *ValueType = Val->getType();
316 Val = EmitToInt(CGF, V: Val, T, IntType);
317
318 llvm::Value *Result =
319 CGF.Builder.CreateAtomicRMW(Op: Kind, Addr: DestAddr, Val, Ordering);
320 // Consider atomics to be volatile in MS kernel mode.
321 if (CGF.CGM.getLangOpts().Kernel)
322 cast<llvm::AtomicRMWInst>(Val: Result)->setVolatile(true);
323 return EmitFromInt(CGF, V: Result, T, ResultType: ValueType);
324}
325
326static Value *EmitNontemporalStore(CodeGenFunction &CGF, const CallExpr *E) {
327 Value *Val = CGF.EmitScalarExpr(E: E->getArg(Arg: 0));
328 Address Addr = CGF.EmitPointerWithAlignment(Addr: E->getArg(Arg: 1));
329
330 Val = CGF.EmitToMemory(Value: Val, Ty: E->getArg(Arg: 0)->getType());
331 LValue LV = CGF.MakeAddrLValue(Addr, T: E->getArg(Arg: 0)->getType());
332 LV.setNontemporal(true);
333 CGF.EmitStoreOfScalar(value: Val, lvalue: LV, isInit: false);
334 return nullptr;
335}
336
337static Value *EmitNontemporalLoad(CodeGenFunction &CGF, const CallExpr *E) {
338 Address Addr = CGF.EmitPointerWithAlignment(Addr: E->getArg(Arg: 0));
339
340 LValue LV = CGF.MakeAddrLValue(Addr, T: E->getType());
341 LV.setNontemporal(true);
342 return CGF.EmitLoadOfScalar(lvalue: LV, Loc: E->getExprLoc());
343}
344
345static RValue EmitBinaryAtomic(CodeGenFunction &CGF,
346 llvm::AtomicRMWInst::BinOp Kind,
347 const CallExpr *E) {
348 return RValue::get(V: MakeBinaryAtomicValue(CGF, Kind, E));
349}
350
351/// Utility to insert an atomic instruction based Intrinsic::ID and
352/// the expression node, where the return value is the result of the
353/// operation.
354static RValue EmitBinaryAtomicPost(CodeGenFunction &CGF,
355 llvm::AtomicRMWInst::BinOp Kind,
356 const CallExpr *E,
357 Instruction::BinaryOps Op,
358 bool Invert = false) {
359 QualType T = E->getType();
360 assert(E->getArg(0)->getType()->isPointerType());
361 assert(CGF.getContext().hasSameUnqualifiedType(T,
362 E->getArg(0)->getType()->getPointeeType()));
363 assert(CGF.getContext().hasSameUnqualifiedType(T, E->getArg(1)->getType()));
364
365 Address DestAddr = CheckAtomicAlignment(CGF, E);
366
367 llvm::IntegerType *IntType = llvm::IntegerType::get(
368 C&: CGF.getLLVMContext(), NumBits: CGF.getContext().getTypeSize(T));
369
370 llvm::Value *Val = CGF.EmitScalarExpr(E: E->getArg(Arg: 1));
371 llvm::Type *ValueType = Val->getType();
372 Val = EmitToInt(CGF, V: Val, T, IntType);
373
374 llvm::Value *Result = CGF.Builder.CreateAtomicRMW(
375 Op: Kind, Addr: DestAddr, Val, Ordering: llvm::AtomicOrdering::SequentiallyConsistent);
376 Result = CGF.Builder.CreateBinOp(Opc: Op, LHS: Result, RHS: Val);
377 if (Invert)
378 Result =
379 CGF.Builder.CreateBinOp(Opc: llvm::Instruction::Xor, LHS: Result,
380 RHS: llvm::ConstantInt::getAllOnesValue(Ty: IntType));
381 Result = EmitFromInt(CGF, V: Result, T, ResultType: ValueType);
382 return RValue::get(V: Result);
383}
384
385/// Utility to insert an atomic cmpxchg instruction.
386///
387/// @param CGF The current codegen function.
388/// @param E Builtin call expression to convert to cmpxchg.
389/// arg0 - address to operate on
390/// arg1 - value to compare with
391/// arg2 - new value
392/// @param ReturnBool Specifies whether to return success flag of
393/// cmpxchg result or the old value.
394///
395/// @returns result of cmpxchg, according to ReturnBool
396///
397/// Note: In order to lower Microsoft's _InterlockedCompareExchange* intrinsics
398/// invoke the function EmitAtomicCmpXchgForMSIntrin.
399Value *MakeAtomicCmpXchgValue(CodeGenFunction &CGF, const CallExpr *E,
400 bool ReturnBool,
401 llvm::AtomicOrdering SuccessOrdering,
402 llvm::AtomicOrdering FailureOrdering) {
403 QualType T = ReturnBool ? E->getArg(Arg: 1)->getType() : E->getType();
404 Address DestAddr = CheckAtomicAlignment(CGF, E);
405
406 llvm::IntegerType *IntType = llvm::IntegerType::get(
407 C&: CGF.getLLVMContext(), NumBits: CGF.getContext().getTypeSize(T));
408
409 Value *Cmp = CGF.EmitScalarExpr(E: E->getArg(Arg: 1));
410 llvm::Type *ValueType = Cmp->getType();
411 Cmp = EmitToInt(CGF, V: Cmp, T, IntType);
412 Value *New = EmitToInt(CGF, V: CGF.EmitScalarExpr(E: E->getArg(Arg: 2)), T, IntType);
413
414 Value *Pair = CGF.Builder.CreateAtomicCmpXchg(
415 Addr: DestAddr, Cmp, New, SuccessOrdering, FailureOrdering);
416 if (ReturnBool)
417 // Extract boolean success flag and zext it to int.
418 return CGF.Builder.CreateZExt(V: CGF.Builder.CreateExtractValue(Agg: Pair, Idxs: 1),
419 DestTy: CGF.ConvertType(T: E->getType()));
420 else
421 // Extract old value and emit it using the same type as compare value.
422 return EmitFromInt(CGF, V: CGF.Builder.CreateExtractValue(Agg: Pair, Idxs: 0), T,
423 ResultType: ValueType);
424}
425
426/// This function should be invoked to emit atomic cmpxchg for Microsoft's
427/// _InterlockedCompareExchange* intrinsics which have the following signature:
428/// T _InterlockedCompareExchange(T volatile *Destination,
429/// T Exchange,
430/// T Comparand);
431///
432/// Whereas the llvm 'cmpxchg' instruction has the following syntax:
433/// cmpxchg *Destination, Comparand, Exchange.
434/// So we need to swap Comparand and Exchange when invoking
435/// CreateAtomicCmpXchg. That is the reason we could not use the above utility
436/// function MakeAtomicCmpXchgValue since it expects the arguments to be
437/// already swapped.
438
439static
440Value *EmitAtomicCmpXchgForMSIntrin(CodeGenFunction &CGF, const CallExpr *E,
441 AtomicOrdering SuccessOrdering = AtomicOrdering::SequentiallyConsistent) {
442 assert(E->getArg(0)->getType()->isPointerType());
443 assert(CGF.getContext().hasSameUnqualifiedType(
444 E->getType(), E->getArg(0)->getType()->getPointeeType()));
445 assert(CGF.getContext().hasSameUnqualifiedType(E->getType(),
446 E->getArg(1)->getType()));
447 assert(CGF.getContext().hasSameUnqualifiedType(E->getType(),
448 E->getArg(2)->getType()));
449
450 Address DestAddr = CheckAtomicAlignment(CGF, E);
451
452 auto *Exchange = CGF.EmitScalarExpr(E: E->getArg(Arg: 1));
453 auto *RTy = Exchange->getType();
454
455 auto *Comparand = CGF.EmitScalarExpr(E: E->getArg(Arg: 2));
456
457 if (RTy->isPointerTy()) {
458 Exchange = CGF.Builder.CreatePtrToInt(V: Exchange, DestTy: CGF.IntPtrTy);
459 Comparand = CGF.Builder.CreatePtrToInt(V: Comparand, DestTy: CGF.IntPtrTy);
460 }
461
462 // For Release ordering, the failure ordering should be Monotonic.
463 auto FailureOrdering = SuccessOrdering == AtomicOrdering::Release ?
464 AtomicOrdering::Monotonic :
465 SuccessOrdering;
466
467 // The atomic instruction is marked volatile for consistency with MSVC. This
468 // blocks the few atomics optimizations that LLVM has. If we want to optimize
469 // _Interlocked* operations in the future, we will have to remove the volatile
470 // marker.
471 auto *CmpXchg = CGF.Builder.CreateAtomicCmpXchg(
472 Addr: DestAddr, Cmp: Comparand, New: Exchange, SuccessOrdering, FailureOrdering);
473 CmpXchg->setVolatile(true);
474
475 auto *Result = CGF.Builder.CreateExtractValue(Agg: CmpXchg, Idxs: 0);
476 if (RTy->isPointerTy()) {
477 Result = CGF.Builder.CreateIntToPtr(V: Result, DestTy: RTy);
478 }
479
480 return Result;
481}
482
483// 64-bit Microsoft platforms support 128 bit cmpxchg operations. They are
484// prototyped like this:
485//
486// unsigned char _InterlockedCompareExchange128...(
487// __int64 volatile * _Destination,
488// __int64 _ExchangeHigh,
489// __int64 _ExchangeLow,
490// __int64 * _ComparandResult);
491//
492// Note that Destination is assumed to be at least 16-byte aligned, despite
493// being typed int64.
494
495static Value *EmitAtomicCmpXchg128ForMSIntrin(CodeGenFunction &CGF,
496 const CallExpr *E,
497 AtomicOrdering SuccessOrdering) {
498 assert(E->getNumArgs() == 4);
499 llvm::Value *DestPtr = CGF.EmitScalarExpr(E: E->getArg(Arg: 0));
500 llvm::Value *ExchangeHigh = CGF.EmitScalarExpr(E: E->getArg(Arg: 1));
501 llvm::Value *ExchangeLow = CGF.EmitScalarExpr(E: E->getArg(Arg: 2));
502 Address ComparandAddr = CGF.EmitPointerWithAlignment(Addr: E->getArg(Arg: 3));
503
504 assert(DestPtr->getType()->isPointerTy());
505 assert(!ExchangeHigh->getType()->isPointerTy());
506 assert(!ExchangeLow->getType()->isPointerTy());
507
508 // For Release ordering, the failure ordering should be Monotonic.
509 auto FailureOrdering = SuccessOrdering == AtomicOrdering::Release
510 ? AtomicOrdering::Monotonic
511 : SuccessOrdering;
512
513 // Convert to i128 pointers and values. Alignment is also overridden for
514 // destination pointer.
515 llvm::Type *Int128Ty = llvm::IntegerType::get(C&: CGF.getLLVMContext(), NumBits: 128);
516 Address DestAddr(DestPtr, Int128Ty,
517 CGF.getContext().toCharUnitsFromBits(BitSize: 128));
518 ComparandAddr = ComparandAddr.withElementType(ElemTy: Int128Ty);
519
520 // (((i128)hi) << 64) | ((i128)lo)
521 ExchangeHigh = CGF.Builder.CreateZExt(V: ExchangeHigh, DestTy: Int128Ty);
522 ExchangeLow = CGF.Builder.CreateZExt(V: ExchangeLow, DestTy: Int128Ty);
523 ExchangeHigh =
524 CGF.Builder.CreateShl(LHS: ExchangeHigh, RHS: llvm::ConstantInt::get(Ty: Int128Ty, V: 64));
525 llvm::Value *Exchange = CGF.Builder.CreateOr(LHS: ExchangeHigh, RHS: ExchangeLow);
526
527 // Load the comparand for the instruction.
528 llvm::Value *Comparand = CGF.Builder.CreateLoad(Addr: ComparandAddr);
529
530 auto *CXI = CGF.Builder.CreateAtomicCmpXchg(Addr: DestAddr, Cmp: Comparand, New: Exchange,
531 SuccessOrdering, FailureOrdering);
532
533 // The atomic instruction is marked volatile for consistency with MSVC. This
534 // blocks the few atomics optimizations that LLVM has. If we want to optimize
535 // _Interlocked* operations in the future, we will have to remove the volatile
536 // marker.
537 CXI->setVolatile(true);
538
539 // Store the result as an outparameter.
540 CGF.Builder.CreateStore(Val: CGF.Builder.CreateExtractValue(Agg: CXI, Idxs: 0),
541 Addr: ComparandAddr);
542
543 // Get the success boolean and zero extend it to i8.
544 Value *Success = CGF.Builder.CreateExtractValue(Agg: CXI, Idxs: 1);
545 return CGF.Builder.CreateZExt(V: Success, DestTy: CGF.Int8Ty);
546}
547
548static Value *EmitAtomicIncrementValue(CodeGenFunction &CGF, const CallExpr *E,
549 AtomicOrdering Ordering = AtomicOrdering::SequentiallyConsistent) {
550 assert(E->getArg(0)->getType()->isPointerType());
551
552 auto *IntTy = CGF.ConvertType(T: E->getType());
553 Address DestAddr = CheckAtomicAlignment(CGF, E);
554 auto *Result = CGF.Builder.CreateAtomicRMW(
555 Op: AtomicRMWInst::Add, Addr: DestAddr, Val: ConstantInt::get(Ty: IntTy, V: 1), Ordering);
556 return CGF.Builder.CreateAdd(LHS: Result, RHS: ConstantInt::get(Ty: IntTy, V: 1));
557}
558
559static Value *EmitAtomicDecrementValue(
560 CodeGenFunction &CGF, const CallExpr *E,
561 AtomicOrdering Ordering = AtomicOrdering::SequentiallyConsistent) {
562 assert(E->getArg(0)->getType()->isPointerType());
563
564 auto *IntTy = CGF.ConvertType(T: E->getType());
565 Address DestAddr = CheckAtomicAlignment(CGF, E);
566 auto *Result = CGF.Builder.CreateAtomicRMW(
567 Op: AtomicRMWInst::Sub, Addr: DestAddr, Val: ConstantInt::get(Ty: IntTy, V: 1), Ordering);
568 return CGF.Builder.CreateSub(LHS: Result, RHS: ConstantInt::get(Ty: IntTy, V: 1));
569}
570
571// Build a plain volatile load.
572static Value *EmitISOVolatileLoad(CodeGenFunction &CGF, const CallExpr *E) {
573 Value *Ptr = CGF.EmitScalarExpr(E: E->getArg(Arg: 0));
574 QualType ElTy = E->getArg(Arg: 0)->getType()->getPointeeType();
575 CharUnits LoadSize = CGF.getContext().getTypeSizeInChars(T: ElTy);
576 llvm::Type *ITy =
577 llvm::IntegerType::get(C&: CGF.getLLVMContext(), NumBits: LoadSize.getQuantity() * 8);
578 llvm::LoadInst *Load = CGF.Builder.CreateAlignedLoad(Ty: ITy, Addr: Ptr, Align: LoadSize);
579 Load->setAtomic(Ordering: llvm::AtomicOrdering::Monotonic);
580 Load->setVolatile(true);
581 return Load;
582}
583
584// Build a plain volatile store.
585static Value *EmitISOVolatileStore(CodeGenFunction &CGF, const CallExpr *E) {
586 Value *Ptr = CGF.EmitScalarExpr(E: E->getArg(Arg: 0));
587 Value *Value = CGF.EmitScalarExpr(E: E->getArg(Arg: 1));
588 QualType ElTy = E->getArg(Arg: 0)->getType()->getPointeeType();
589 CharUnits StoreSize = CGF.getContext().getTypeSizeInChars(T: ElTy);
590 llvm::StoreInst *Store =
591 CGF.Builder.CreateAlignedStore(Val: Value, Addr: Ptr, Align: StoreSize);
592 Store->setAtomic(Ordering: llvm::AtomicOrdering::Monotonic);
593 Store->setVolatile(true);
594 return Store;
595}
596
597// Emit a simple mangled intrinsic that has 1 argument and a return type
598// matching the argument type. Depending on mode, this may be a constrained
599// floating-point intrinsic.
600Value *emitUnaryMaybeConstrainedFPBuiltin(CodeGenFunction &CGF,
601 const CallExpr *E, unsigned IntrinsicID,
602 unsigned ConstrainedIntrinsicID) {
603 llvm::Value *Src0 = CGF.EmitScalarExpr(E: E->getArg(Arg: 0));
604
605 CodeGenFunction::CGFPOptionsRAII FPOptsRAII(CGF, E);
606 if (CGF.Builder.getIsFPConstrained()) {
607 Function *F = CGF.CGM.getIntrinsic(IID: ConstrainedIntrinsicID, Tys: Src0->getType());
608 return CGF.Builder.CreateConstrainedFPCall(Callee: F, Args: { Src0 });
609 } else {
610 Function *F = CGF.CGM.getIntrinsic(IID: IntrinsicID, Tys: Src0->getType());
611 return CGF.Builder.CreateCall(Callee: F, Args: Src0);
612 }
613}
614
615// Emit an intrinsic that has 2 operands of the same type as its result.
616// Depending on mode, this may be a constrained floating-point intrinsic.
617static Value *emitBinaryMaybeConstrainedFPBuiltin(CodeGenFunction &CGF,
618 const CallExpr *E, unsigned IntrinsicID,
619 unsigned ConstrainedIntrinsicID) {
620 llvm::Value *Src0 = CGF.EmitScalarExpr(E: E->getArg(Arg: 0));
621 llvm::Value *Src1 = CGF.EmitScalarExpr(E: E->getArg(Arg: 1));
622
623 CodeGenFunction::CGFPOptionsRAII FPOptsRAII(CGF, E);
624 if (CGF.Builder.getIsFPConstrained()) {
625 Function *F = CGF.CGM.getIntrinsic(IID: ConstrainedIntrinsicID, Tys: Src0->getType());
626 return CGF.Builder.CreateConstrainedFPCall(Callee: F, Args: { Src0, Src1 });
627 } else {
628 Function *F = CGF.CGM.getIntrinsic(IID: IntrinsicID, Tys: Src0->getType());
629 return CGF.Builder.CreateCall(Callee: F, Args: { Src0, Src1 });
630 }
631}
632
633// Has second type mangled argument.
634static Value *
635emitBinaryExpMaybeConstrainedFPBuiltin(CodeGenFunction &CGF, const CallExpr *E,
636 Intrinsic::ID IntrinsicID,
637 Intrinsic::ID ConstrainedIntrinsicID) {
638 llvm::Value *Src0 = CGF.EmitScalarExpr(E: E->getArg(Arg: 0));
639 llvm::Value *Src1 = CGF.EmitScalarExpr(E: E->getArg(Arg: 1));
640
641 CodeGenFunction::CGFPOptionsRAII FPOptsRAII(CGF, E);
642 if (CGF.Builder.getIsFPConstrained()) {
643 Function *F = CGF.CGM.getIntrinsic(IID: ConstrainedIntrinsicID,
644 Tys: {Src0->getType(), Src1->getType()});
645 return CGF.Builder.CreateConstrainedFPCall(Callee: F, Args: {Src0, Src1});
646 }
647
648 Function *F =
649 CGF.CGM.getIntrinsic(IID: IntrinsicID, Tys: {Src0->getType(), Src1->getType()});
650 return CGF.Builder.CreateCall(Callee: F, Args: {Src0, Src1});
651}
652
653// Emit an intrinsic that has 3 operands of the same type as its result.
654// Depending on mode, this may be a constrained floating-point intrinsic.
655static Value *emitTernaryMaybeConstrainedFPBuiltin(CodeGenFunction &CGF,
656 const CallExpr *E, unsigned IntrinsicID,
657 unsigned ConstrainedIntrinsicID) {
658 llvm::Value *Src0 = CGF.EmitScalarExpr(E: E->getArg(Arg: 0));
659 llvm::Value *Src1 = CGF.EmitScalarExpr(E: E->getArg(Arg: 1));
660 llvm::Value *Src2 = CGF.EmitScalarExpr(E: E->getArg(Arg: 2));
661
662 CodeGenFunction::CGFPOptionsRAII FPOptsRAII(CGF, E);
663 if (CGF.Builder.getIsFPConstrained()) {
664 Function *F = CGF.CGM.getIntrinsic(IID: ConstrainedIntrinsicID, Tys: Src0->getType());
665 return CGF.Builder.CreateConstrainedFPCall(Callee: F, Args: { Src0, Src1, Src2 });
666 } else {
667 Function *F = CGF.CGM.getIntrinsic(IID: IntrinsicID, Tys: Src0->getType());
668 return CGF.Builder.CreateCall(Callee: F, Args: { Src0, Src1, Src2 });
669 }
670}
671
672// Emit an intrinsic that has overloaded integer result and fp operand.
673static Value *
674emitMaybeConstrainedFPToIntRoundBuiltin(CodeGenFunction &CGF, const CallExpr *E,
675 unsigned IntrinsicID,
676 unsigned ConstrainedIntrinsicID) {
677 llvm::Type *ResultType = CGF.ConvertType(T: E->getType());
678 llvm::Value *Src0 = CGF.EmitScalarExpr(E: E->getArg(Arg: 0));
679
680 if (CGF.Builder.getIsFPConstrained()) {
681 CodeGenFunction::CGFPOptionsRAII FPOptsRAII(CGF, E);
682 Function *F = CGF.CGM.getIntrinsic(IID: ConstrainedIntrinsicID,
683 Tys: {ResultType, Src0->getType()});
684 return CGF.Builder.CreateConstrainedFPCall(Callee: F, Args: {Src0});
685 } else {
686 Function *F =
687 CGF.CGM.getIntrinsic(IID: IntrinsicID, Tys: {ResultType, Src0->getType()});
688 return CGF.Builder.CreateCall(Callee: F, Args: Src0);
689 }
690}
691
692static Value *emitFrexpBuiltin(CodeGenFunction &CGF, const CallExpr *E,
693 Intrinsic::ID IntrinsicID) {
694 llvm::Value *Src0 = CGF.EmitScalarExpr(E: E->getArg(Arg: 0));
695 llvm::Value *Src1 = CGF.EmitScalarExpr(E: E->getArg(Arg: 1));
696
697 QualType IntPtrTy = E->getArg(Arg: 1)->getType()->getPointeeType();
698 llvm::Type *IntTy = CGF.ConvertType(T: IntPtrTy);
699 llvm::Function *F =
700 CGF.CGM.getIntrinsic(IID: IntrinsicID, Tys: {Src0->getType(), IntTy});
701 llvm::Value *Call = CGF.Builder.CreateCall(Callee: F, Args: Src0);
702
703 llvm::Value *Exp = CGF.Builder.CreateExtractValue(Agg: Call, Idxs: 1);
704 LValue LV = CGF.MakeNaturalAlignAddrLValue(V: Src1, T: IntPtrTy);
705 CGF.EmitStoreOfScalar(value: Exp, lvalue: LV);
706
707 return CGF.Builder.CreateExtractValue(Agg: Call, Idxs: 0);
708}
709
710static void emitSincosBuiltin(CodeGenFunction &CGF, const CallExpr *E,
711 Intrinsic::ID IntrinsicID) {
712 llvm::Value *Val = CGF.EmitScalarExpr(E: E->getArg(Arg: 0));
713 llvm::Value *Dest0 = CGF.EmitScalarExpr(E: E->getArg(Arg: 1));
714 llvm::Value *Dest1 = CGF.EmitScalarExpr(E: E->getArg(Arg: 2));
715
716 llvm::Function *F = CGF.CGM.getIntrinsic(IID: IntrinsicID, Tys: {Val->getType()});
717 llvm::Value *Call = CGF.Builder.CreateCall(Callee: F, Args: Val);
718
719 llvm::Value *SinResult = CGF.Builder.CreateExtractValue(Agg: Call, Idxs: 0);
720 llvm::Value *CosResult = CGF.Builder.CreateExtractValue(Agg: Call, Idxs: 1);
721
722 QualType DestPtrType = E->getArg(Arg: 1)->getType()->getPointeeType();
723 LValue SinLV = CGF.MakeNaturalAlignAddrLValue(V: Dest0, T: DestPtrType);
724 LValue CosLV = CGF.MakeNaturalAlignAddrLValue(V: Dest1, T: DestPtrType);
725
726 llvm::StoreInst *StoreSin =
727 CGF.Builder.CreateStore(Val: SinResult, Addr: SinLV.getAddress());
728 llvm::StoreInst *StoreCos =
729 CGF.Builder.CreateStore(Val: CosResult, Addr: CosLV.getAddress());
730
731 // Mark the two stores as non-aliasing with each other. The order of stores
732 // emitted by this builtin is arbitrary, enforcing a particular order will
733 // prevent optimizations later on.
734 llvm::MDBuilder MDHelper(CGF.getLLVMContext());
735 MDNode *Domain = MDHelper.createAnonymousAliasScopeDomain();
736 MDNode *AliasScope = MDHelper.createAnonymousAliasScope(Domain);
737 MDNode *AliasScopeList = MDNode::get(Context&: Call->getContext(), MDs: AliasScope);
738 StoreSin->setMetadata(KindID: LLVMContext::MD_alias_scope, Node: AliasScopeList);
739 StoreCos->setMetadata(KindID: LLVMContext::MD_noalias, Node: AliasScopeList);
740}
741
742static llvm::Value *emitModfBuiltin(CodeGenFunction &CGF, const CallExpr *E,
743 Intrinsic::ID IntrinsicID) {
744 llvm::Value *Val = CGF.EmitScalarExpr(E: E->getArg(Arg: 0));
745 llvm::Value *IntPartDest = CGF.EmitScalarExpr(E: E->getArg(Arg: 1));
746
747 llvm::Value *Call =
748 CGF.Builder.CreateIntrinsic(ID: IntrinsicID, OverloadTypes: {Val->getType()}, Args: Val);
749
750 llvm::Value *FractionalResult = CGF.Builder.CreateExtractValue(Agg: Call, Idxs: 0);
751 llvm::Value *IntegralResult = CGF.Builder.CreateExtractValue(Agg: Call, Idxs: 1);
752
753 QualType DestPtrType = E->getArg(Arg: 1)->getType()->getPointeeType();
754 LValue IntegralLV = CGF.MakeNaturalAlignAddrLValue(V: IntPartDest, T: DestPtrType);
755 CGF.EmitStoreOfScalar(value: IntegralResult, lvalue: IntegralLV);
756
757 return FractionalResult;
758}
759
760/// EmitFAbs - Emit a call to @llvm.fabs().
761static Value *EmitFAbs(CodeGenFunction &CGF, Value *V) {
762 llvm::Value *Call = CGF.Builder.CreateFAbs(V);
763 if (auto *CallI = dyn_cast<llvm::CallInst>(Val: Call))
764 CallI->setDoesNotAccessMemory();
765 return Call;
766}
767
768/// Emit the computation of the sign bit for a floating point value. Returns
769/// the i1 sign bit value.
770static Value *EmitSignBit(CodeGenFunction &CGF, Value *V) {
771 LLVMContext &C = CGF.CGM.getLLVMContext();
772
773 llvm::Type *Ty = V->getType();
774 int Width = Ty->getPrimitiveSizeInBits();
775 llvm::Type *IntTy = llvm::IntegerType::get(C, NumBits: Width);
776 V = CGF.Builder.CreateBitCast(V, DestTy: IntTy);
777 if (Ty->isPPC_FP128Ty()) {
778 // We want the sign bit of the higher-order double. The bitcast we just
779 // did works as if the double-double was stored to memory and then
780 // read as an i128. The "store" will put the higher-order double in the
781 // lower address in both little- and big-Endian modes, but the "load"
782 // will treat those bits as a different part of the i128: the low bits in
783 // little-Endian, the high bits in big-Endian. Therefore, on big-Endian
784 // we need to shift the high bits down to the low before truncating.
785 Width >>= 1;
786 if (CGF.getTarget().isBigEndian()) {
787 Value *ShiftCst = llvm::ConstantInt::get(Ty: IntTy, V: Width);
788 V = CGF.Builder.CreateLShr(LHS: V, RHS: ShiftCst);
789 }
790 // We are truncating value in order to extract the higher-order
791 // double, which we will be using to extract the sign from.
792 IntTy = llvm::IntegerType::get(C, NumBits: Width);
793 V = CGF.Builder.CreateTrunc(V, DestTy: IntTy);
794 }
795 Value *Zero = llvm::Constant::getNullValue(Ty: IntTy);
796 return CGF.Builder.CreateICmpSLT(LHS: V, RHS: Zero);
797}
798
799static RValue emitLibraryCall(CodeGenFunction &CGF, const FunctionDecl *FD,
800 const CallExpr *E, llvm::Constant *calleeValue) {
801 CodeGenFunction::CGFPOptionsRAII FPOptsRAII(CGF, E);
802 CGCallee callee = CGCallee::forDirect(functionPtr: calleeValue, abstractInfo: GlobalDecl(FD));
803 llvm::CallBase *callOrInvoke = nullptr;
804 CGFunctionInfo const *FnInfo = nullptr;
805 return CGF.EmitCall(FnType: E->getCallee()->getType(), Callee: callee, E, ReturnValue: ReturnValueSlot(),
806 /*Chain=*/nullptr, CallOrInvoke: &callOrInvoke, ResolvedFnInfo: &FnInfo);
807}
808
809/// Emit a call to llvm.{sadd,uadd,ssub,usub,smul,umul}.with.overflow.*
810/// depending on IntrinsicID.
811///
812/// \arg CGF The current codegen function.
813/// \arg IntrinsicID The ID for the Intrinsic we wish to generate.
814/// \arg X The first argument to the llvm.*.with.overflow.*.
815/// \arg Y The second argument to the llvm.*.with.overflow.*.
816/// \arg Carry The carry returned by the llvm.*.with.overflow.*.
817/// \returns The result (i.e. sum/product) returned by the intrinsic.
818llvm::Value *EmitOverflowIntrinsic(CodeGenFunction &CGF,
819 const Intrinsic::ID IntrinsicID,
820 llvm::Value *X, llvm::Value *Y,
821 llvm::Value *&Carry) {
822 // Make sure we have integers of the same width.
823 assert(X->getType() == Y->getType() &&
824 "Arguments must be the same type. (Did you forget to make sure both "
825 "arguments have the same integer width?)");
826
827 Function *Callee = CGF.CGM.getIntrinsic(IID: IntrinsicID, Tys: X->getType());
828 llvm::Value *Tmp = CGF.Builder.CreateCall(Callee, Args: {X, Y});
829 Carry = CGF.Builder.CreateExtractValue(Agg: Tmp, Idxs: 1);
830 return CGF.Builder.CreateExtractValue(Agg: Tmp, Idxs: 0);
831}
832
833namespace {
834 struct WidthAndSignedness {
835 unsigned Width;
836 bool Signed;
837 };
838}
839
840static WidthAndSignedness
841getIntegerWidthAndSignedness(const clang::ASTContext &context,
842 const clang::QualType Type) {
843 assert(Type->isIntegerType() && "Given type is not an integer.");
844 unsigned Width = context.getIntWidth(T: Type);
845 bool Signed = Type->isSignedIntegerType();
846 return {.Width: Width, .Signed: Signed};
847}
848
849// Given one or more integer types, this function produces an integer type that
850// encompasses them: any value in one of the given types could be expressed in
851// the encompassing type.
852static struct WidthAndSignedness
853EncompassingIntegerType(ArrayRef<struct WidthAndSignedness> Types) {
854 assert(Types.size() > 0 && "Empty list of types.");
855
856 // If any of the given types is signed, we must return a signed type.
857 bool Signed = false;
858 for (const auto &Type : Types) {
859 Signed |= Type.Signed;
860 }
861
862 // The encompassing type must have a width greater than or equal to the width
863 // of the specified types. Additionally, if the encompassing type is signed,
864 // its width must be strictly greater than the width of any unsigned types
865 // given.
866 unsigned Width = 0;
867 for (const auto &Type : Types) {
868 unsigned MinWidth = Type.Width + (Signed && !Type.Signed);
869 if (Width < MinWidth) {
870 Width = MinWidth;
871 }
872 }
873
874 return {.Width: Width, .Signed: Signed};
875}
876
877Value *CodeGenFunction::EmitVAStartEnd(Value *ArgValue, bool IsStart) {
878 Intrinsic::ID inst = IsStart ? Intrinsic::vastart : Intrinsic::vaend;
879 return Builder.CreateCall(Callee: CGM.getIntrinsic(IID: inst, Tys: {ArgValue->getType()}),
880 Args: ArgValue);
881}
882
883/// Checks if using the result of __builtin_object_size(p, @p From) in place of
884/// __builtin_object_size(p, @p To) is correct
885static bool areBOSTypesCompatible(int From, int To) {
886 // Note: Our __builtin_object_size implementation currently treats Type=0 and
887 // Type=2 identically. Encoding this implementation detail here may make
888 // improving __builtin_object_size difficult in the future, so it's omitted.
889 return From == To || (From == 0 && To == 1) || (From == 3 && To == 2);
890}
891
892static llvm::Value *
893getDefaultBuiltinObjectSizeResult(unsigned Type, llvm::IntegerType *ResType) {
894 return ConstantInt::get(Ty: ResType, V: (Type & 2) ? 0 : -1, /*isSigned=*/IsSigned: true);
895}
896
897llvm::Value *
898CodeGenFunction::evaluateOrEmitBuiltinObjectSize(const Expr *E, unsigned Type,
899 llvm::IntegerType *ResType,
900 llvm::Value *EmittedE,
901 bool IsDynamic) {
902 if (std::optional<uint64_t> ObjectSize =
903 E->tryEvaluateObjectSize(Ctx: getContext(), Type))
904 return ConstantInt::get(Ty: ResType, V: *ObjectSize, /*isSigned=*/IsSigned: true);
905 return emitBuiltinObjectSize(E, Type, ResType, EmittedE, IsDynamic);
906}
907
908/// Find a struct's flexible array member. It may be embedded inside multiple
909/// sub-structs, but must still be the last field.
910static const FieldDecl *FindFlexibleArrayMemberField(CodeGenFunction &CGF,
911 ASTContext &Ctx,
912 const RecordDecl *RD) {
913 const LangOptions::StrictFlexArraysLevelKind StrictFlexArraysLevel =
914 CGF.getLangOpts().getStrictFlexArraysLevel();
915
916 if (RD->isImplicit())
917 return nullptr;
918
919 for (const FieldDecl *FD : RD->fields()) {
920 if (Decl::isFlexibleArrayMemberLike(
921 Context: Ctx, D: FD, Ty: FD->getType(), StrictFlexArraysLevel,
922 /*IgnoreTemplateOrMacroSubstitution=*/true))
923 return FD;
924
925 if (const auto *RD = FD->getType()->getAsRecordDecl())
926 if (const FieldDecl *FD = FindFlexibleArrayMemberField(CGF, Ctx, RD))
927 return FD;
928 }
929
930 return nullptr;
931}
932
933/// Calculate the offset of a struct field. It may be embedded inside multiple
934/// sub-structs.
935static bool GetFieldOffset(ASTContext &Ctx, const RecordDecl *RD,
936 const FieldDecl *FD, int64_t &Offset) {
937 if (RD->isImplicit())
938 return false;
939
940 // Keep track of the field number ourselves, because the other methods
941 // (CGRecordLayout::getLLVMFieldNo) aren't always equivalent to how the AST
942 // is laid out.
943 uint32_t FieldNo = 0;
944 const ASTRecordLayout &Layout = Ctx.getASTRecordLayout(D: RD);
945
946 for (const FieldDecl *Field : RD->fields()) {
947 if (Field == FD) {
948 Offset += Layout.getFieldOffset(FieldNo);
949 return true;
950 }
951
952 if (const auto *RD = Field->getType()->getAsRecordDecl()) {
953 if (GetFieldOffset(Ctx, RD, FD, Offset)) {
954 Offset += Layout.getFieldOffset(FieldNo);
955 return true;
956 }
957 }
958
959 if (!RD->isUnion())
960 ++FieldNo;
961 }
962
963 return false;
964}
965
966static std::optional<int64_t>
967GetFieldOffset(ASTContext &Ctx, const RecordDecl *RD, const FieldDecl *FD) {
968 int64_t Offset = 0;
969
970 if (GetFieldOffset(Ctx, RD, FD, Offset))
971 return std::optional<int64_t>(Offset);
972
973 return std::nullopt;
974}
975
976llvm::Value *CodeGenFunction::emitCountedBySize(const Expr *E,
977 llvm::Value *EmittedE,
978 unsigned Type,
979 llvm::IntegerType *ResType) {
980 // Note: If the whole struct is specificed in the __bdos (i.e. Visitor
981 // returns a DeclRefExpr). The calculation of the whole size of the structure
982 // with a flexible array member can be done in two ways:
983 //
984 // 1) sizeof(struct S) + count * sizeof(typeof(fam))
985 // 2) offsetof(struct S, fam) + count * sizeof(typeof(fam))
986 //
987 // The first will add additional padding after the end of the array
988 // allocation while the second method is more precise, but not quite expected
989 // from programmers. See
990 // https://lore.kernel.org/lkml/ZvV6X5FPBBW7CO1f@archlinux/ for a discussion
991 // of the topic.
992 //
993 // GCC isn't (currently) able to calculate __bdos on a pointer to the whole
994 // structure. Therefore, because of the above issue, we choose to match what
995 // GCC does for consistency's sake.
996
997 const Expr *Idx = nullptr;
998 QualType ArrayElementTy;
999 E = findStructFieldAccess(E, OutArrayIndex: &Idx, OutArrayElementTy: &ArrayElementTy);
1000 if (!E)
1001 return nullptr;
1002
1003 if (Idx) {
1004 if (Idx->HasSideEffects(Ctx: getContext()))
1005 // We can't have side-effects.
1006 return getDefaultBuiltinObjectSizeResult(Type, ResType);
1007
1008 if (const auto *IL = dyn_cast<IntegerLiteral>(Val: Idx)) {
1009 int64_t Val = IL->getValue().getSExtValue();
1010 if (Val < 0)
1011 return getDefaultBuiltinObjectSizeResult(Type, ResType);
1012
1013 // The index is 0, so we don't need to take it into account.
1014 if (Val == 0)
1015 Idx = nullptr;
1016 }
1017 }
1018
1019 // __counted_by on either a flexible array member or a pointer into a struct
1020 // with a flexible array member.
1021 if (const auto *ME = dyn_cast<MemberExpr>(Val: E))
1022 return emitCountedByMemberSize(E: ME, Idx, EmittedE, CastedArrayElementTy: ArrayElementTy, Type,
1023 ResType);
1024
1025 // __counted_by on a pointer in a struct.
1026 if (const auto *ICE = dyn_cast<ImplicitCastExpr>(Val: E);
1027 ICE && ICE->getCastKind() == CK_LValueToRValue)
1028 return emitCountedByPointerSize(E: ICE, Idx, EmittedE, CastedArrayElementTy: ArrayElementTy, Type,
1029 ResType);
1030
1031 return nullptr;
1032}
1033
1034static llvm::Value *EmitPositiveResultOrZero(CodeGenFunction &CGF,
1035 llvm::Value *Res,
1036 llvm::Value *Index,
1037 llvm::IntegerType *ResType,
1038 bool IsSigned) {
1039 // cmp = (array_size >= 0)
1040 Value *Cmp = CGF.Builder.CreateIsNotNeg(Arg: Res);
1041 if (Index)
1042 // cmp = (cmp && index >= 0)
1043 Cmp = CGF.Builder.CreateAnd(LHS: CGF.Builder.CreateIsNotNeg(Arg: Index), RHS: Cmp);
1044
1045 // return cmp ? result : 0
1046 return CGF.Builder.CreateSelect(C: Cmp, True: Res,
1047 False: ConstantInt::get(Ty: ResType, V: 0, IsSigned));
1048}
1049
1050static std::pair<llvm::Value *, llvm::Value *>
1051GetCountFieldAndIndex(CodeGenFunction &CGF, const MemberExpr *ME,
1052 const FieldDecl *ArrayFD, const FieldDecl *CountFD,
1053 const Expr *Idx, llvm::IntegerType *ResType,
1054 bool IsSigned) {
1055 // count = ptr->count;
1056 Value *Count = CGF.EmitLoadOfCountedByField(Base: ME, FD: ArrayFD, CountDecl: CountFD);
1057 if (!Count)
1058 return std::make_pair<Value *>(x: nullptr, y: nullptr);
1059 Count = CGF.Builder.CreateIntCast(V: Count, DestTy: ResType, isSigned: IsSigned, Name: "count");
1060
1061 // index = ptr->index;
1062 Value *Index = nullptr;
1063 if (Idx) {
1064 bool IdxSigned = Idx->getType()->isSignedIntegerType();
1065 Index = CGF.EmitScalarExpr(E: Idx);
1066 Index = CGF.Builder.CreateIntCast(V: Index, DestTy: ResType, isSigned: IdxSigned, Name: "index");
1067 }
1068
1069 return std::make_pair(x&: Count, y&: Index);
1070}
1071
1072llvm::Value *CodeGenFunction::emitCountedByPointerSize(
1073 const ImplicitCastExpr *E, const Expr *Idx, llvm::Value *EmittedE,
1074 QualType CastedArrayElementTy, unsigned Type, llvm::IntegerType *ResType) {
1075 assert(E->getCastKind() == CK_LValueToRValue &&
1076 "must be an LValue to RValue cast");
1077
1078 const MemberExpr *ME =
1079 dyn_cast<MemberExpr>(Val: E->getSubExpr()->IgnoreParenNoopCasts(Ctx: getContext()));
1080 if (!ME)
1081 return nullptr;
1082
1083 const auto *ArrayBaseFD = dyn_cast<FieldDecl>(Val: ME->getMemberDecl());
1084 if (!ArrayBaseFD || !ArrayBaseFD->getType()->isPointerType() ||
1085 !ArrayBaseFD->getType()->isCountAttributedType())
1086 return nullptr;
1087
1088 // Get the 'count' FieldDecl.
1089 const FieldDecl *CountFD = ArrayBaseFD->findCountedByField();
1090 if (!CountFD)
1091 // Can't find the field referenced by the "counted_by" attribute.
1092 return nullptr;
1093
1094 // Calculate the array's object size using these formulae. (Note: if the
1095 // calculation is negative, we return 0.):
1096 //
1097 // struct p;
1098 // struct s {
1099 // /* ... */
1100 // struct p **array __attribute__((counted_by(count)));
1101 // int count;
1102 // };
1103 //
1104 // 1) 'ptr->array':
1105 //
1106 // count = ptr->count;
1107 //
1108 // array_element_size = sizeof (*ptr->array);
1109 // array_size = count * array_element_size;
1110 //
1111 // result = array_size;
1112 //
1113 // cmp = (result >= 0)
1114 // return cmp ? result : 0;
1115 //
1116 // 2) '&((cast) ptr->array)[idx]':
1117 //
1118 // count = ptr->count;
1119 // index = idx;
1120 //
1121 // array_element_size = sizeof (*ptr->array);
1122 // array_size = count * array_element_size;
1123 //
1124 // casted_array_element_size = sizeof (*((cast) ptr->array));
1125 //
1126 // index_size = index * casted_array_element_size;
1127 // result = array_size - index_size;
1128 //
1129 // cmp = (result >= 0)
1130 // if (index)
1131 // cmp = (cmp && index > 0)
1132 // return cmp ? result : 0;
1133
1134 auto GetElementBaseSize = [&](QualType ElementTy) {
1135 CharUnits ElementSize =
1136 getContext().getTypeSizeInChars(T: ElementTy->getPointeeType());
1137
1138 if (ElementSize.isZero()) {
1139 // This might be a __sized_by (or __counted_by) on a
1140 // 'void *', which counts bytes, not elements.
1141 [[maybe_unused]] auto *CAT = ElementTy->getAs<CountAttributedType>();
1142 assert(CAT && "must have an CountAttributedType");
1143
1144 ElementSize = CharUnits::One();
1145 }
1146
1147 return std::optional<CharUnits>(ElementSize);
1148 };
1149
1150 // Get the sizes of the original array element and the casted array element,
1151 // if different.
1152 std::optional<CharUnits> ArrayElementBaseSize =
1153 GetElementBaseSize(ArrayBaseFD->getType());
1154 if (!ArrayElementBaseSize)
1155 return nullptr;
1156
1157 std::optional<CharUnits> CastedArrayElementBaseSize = ArrayElementBaseSize;
1158 if (!CastedArrayElementTy.isNull() && CastedArrayElementTy->isPointerType()) {
1159 CastedArrayElementBaseSize = GetElementBaseSize(CastedArrayElementTy);
1160 if (!CastedArrayElementBaseSize)
1161 return nullptr;
1162 }
1163
1164 bool IsSigned = CountFD->getType()->isSignedIntegerType();
1165
1166 // count = ptr->count;
1167 // index = ptr->index;
1168 Value *Count, *Index;
1169 std::tie(args&: Count, args&: Index) = GetCountFieldAndIndex(
1170 CGF&: *this, ME, ArrayFD: ArrayBaseFD, CountFD, Idx, ResType, IsSigned);
1171 if (!Count)
1172 return nullptr;
1173
1174 // array_element_size = sizeof (*ptr->array)
1175 auto *ArrayElementSize = llvm::ConstantInt::get(
1176 Ty: ResType, V: ArrayElementBaseSize->getQuantity(), IsSigned);
1177
1178 // casted_array_element_size = sizeof (*((cast) ptr->array));
1179 auto *CastedArrayElementSize = llvm::ConstantInt::get(
1180 Ty: ResType, V: CastedArrayElementBaseSize->getQuantity(), IsSigned);
1181
1182 // array_size = count * array_element_size;
1183 Value *ArraySize = Builder.CreateMul(LHS: Count, RHS: ArrayElementSize, Name: "array_size",
1184 HasNUW: !IsSigned, HasNSW: IsSigned);
1185
1186 // Option (1) 'ptr->array'
1187 // result = array_size
1188 Value *Result = ArraySize;
1189
1190 if (Idx) { // Option (2) '&((cast) ptr->array)[idx]'
1191 // index_size = index * casted_array_element_size;
1192 Value *IndexSize = Builder.CreateMul(LHS: Index, RHS: CastedArrayElementSize,
1193 Name: "index_size", HasNUW: !IsSigned, HasNSW: IsSigned);
1194
1195 // result = result - index_size;
1196 Result =
1197 Builder.CreateSub(LHS: Result, RHS: IndexSize, Name: "result", HasNUW: !IsSigned, HasNSW: IsSigned);
1198 }
1199
1200 return EmitPositiveResultOrZero(CGF&: *this, Res: Result, Index, ResType, IsSigned);
1201}
1202
1203llvm::Value *CodeGenFunction::emitCountedByMemberSize(
1204 const MemberExpr *ME, const Expr *Idx, llvm::Value *EmittedE,
1205 QualType CastedArrayElementTy, unsigned Type, llvm::IntegerType *ResType) {
1206 const auto *FD = dyn_cast<FieldDecl>(Val: ME->getMemberDecl());
1207 if (!FD)
1208 return nullptr;
1209
1210 // Find the flexible array member and check that it has the __counted_by
1211 // attribute.
1212 ASTContext &Ctx = getContext();
1213 const RecordDecl *RD = FD->getDeclContext()->getOuterLexicalRecordContext();
1214 const FieldDecl *FlexibleArrayMemberFD = nullptr;
1215
1216 if (Decl::isFlexibleArrayMemberLike(
1217 Context: Ctx, D: FD, Ty: FD->getType(), StrictFlexArraysLevel: getLangOpts().getStrictFlexArraysLevel(),
1218 /*IgnoreTemplateOrMacroSubstitution=*/true))
1219 FlexibleArrayMemberFD = FD;
1220 else
1221 FlexibleArrayMemberFD = FindFlexibleArrayMemberField(CGF&: *this, Ctx, RD);
1222
1223 if (!FlexibleArrayMemberFD ||
1224 !FlexibleArrayMemberFD->getType()->isCountAttributedType())
1225 return nullptr;
1226
1227 // Get the 'count' FieldDecl.
1228 const FieldDecl *CountFD = FlexibleArrayMemberFD->findCountedByField();
1229 if (!CountFD)
1230 // Can't find the field referenced by the "counted_by" attribute.
1231 return nullptr;
1232
1233 // Calculate the flexible array member's object size using these formulae.
1234 // (Note: if the calculation is negative, we return 0.):
1235 //
1236 // struct p;
1237 // struct s {
1238 // /* ... */
1239 // int count;
1240 // struct p *array[] __attribute__((counted_by(count)));
1241 // };
1242 //
1243 // 1) 'ptr->array':
1244 //
1245 // count = ptr->count;
1246 //
1247 // flexible_array_member_element_size = sizeof (*ptr->array);
1248 // flexible_array_member_size =
1249 // count * flexible_array_member_element_size;
1250 //
1251 // result = flexible_array_member_size;
1252 //
1253 // cmp = (result >= 0)
1254 // return cmp ? result : 0;
1255 //
1256 // 2) '&((cast) ptr->array)[idx]':
1257 //
1258 // count = ptr->count;
1259 // index = idx;
1260 //
1261 // flexible_array_member_element_size = sizeof (*ptr->array);
1262 // flexible_array_member_size =
1263 // count * flexible_array_member_element_size;
1264 //
1265 // casted_flexible_array_member_element_size =
1266 // sizeof (*((cast) ptr->array));
1267 // index_size = index * casted_flexible_array_member_element_size;
1268 //
1269 // result = flexible_array_member_size - index_size;
1270 //
1271 // cmp = (result >= 0)
1272 // if (index != 0)
1273 // cmp = (cmp && index >= 0)
1274 // return cmp ? result : 0;
1275 //
1276 // 3) '&ptr->field':
1277 //
1278 // count = ptr->count;
1279 // sizeof_struct = sizeof (struct s);
1280 //
1281 // flexible_array_member_element_size = sizeof (*ptr->array);
1282 // flexible_array_member_size =
1283 // count * flexible_array_member_element_size;
1284 //
1285 // field_offset = offsetof (struct s, field);
1286 // offset_diff = sizeof_struct - field_offset;
1287 //
1288 // result = offset_diff + flexible_array_member_size;
1289 //
1290 // cmp = (result >= 0)
1291 // return cmp ? result : 0;
1292 //
1293 // 4) '&((cast) ptr->field_array)[idx]':
1294 //
1295 // count = ptr->count;
1296 // index = idx;
1297 // sizeof_struct = sizeof (struct s);
1298 //
1299 // flexible_array_member_element_size = sizeof (*ptr->array);
1300 // flexible_array_member_size =
1301 // count * flexible_array_member_element_size;
1302 //
1303 // casted_field_element_size = sizeof (*((cast) ptr->field_array));
1304 // field_offset = offsetof (struct s, field)
1305 // field_offset += index * casted_field_element_size;
1306 //
1307 // offset_diff = sizeof_struct - field_offset;
1308 //
1309 // result = offset_diff + flexible_array_member_size;
1310 //
1311 // cmp = (result >= 0)
1312 // if (index != 0)
1313 // cmp = (cmp && index >= 0)
1314 // return cmp ? result : 0;
1315
1316 bool IsSigned = CountFD->getType()->isSignedIntegerType();
1317
1318 QualType FlexibleArrayMemberTy = FlexibleArrayMemberFD->getType();
1319
1320 // Explicit cast because otherwise the CharWidth will promote an i32's into
1321 // u64's leading to overflows.
1322 int64_t CharWidth = static_cast<int64_t>(CGM.getContext().getCharWidth());
1323
1324 // field_offset = offsetof (struct s, field);
1325 Value *FieldOffset = nullptr;
1326 if (FlexibleArrayMemberFD != FD) {
1327 std::optional<int64_t> Offset = GetFieldOffset(Ctx, RD, FD);
1328 if (!Offset)
1329 return nullptr;
1330 FieldOffset =
1331 llvm::ConstantInt::get(Ty: ResType, V: *Offset / CharWidth, IsSigned);
1332 }
1333
1334 // count = ptr->count;
1335 // index = ptr->index;
1336 Value *Count, *Index;
1337 std::tie(args&: Count, args&: Index) = GetCountFieldAndIndex(
1338 CGF&: *this, ME, ArrayFD: FlexibleArrayMemberFD, CountFD, Idx, ResType, IsSigned);
1339 if (!Count)
1340 return nullptr;
1341
1342 // flexible_array_member_element_size = sizeof (*ptr->array);
1343 const ArrayType *ArrayTy = Ctx.getAsArrayType(T: FlexibleArrayMemberTy);
1344 CharUnits BaseSize = Ctx.getTypeSizeInChars(T: ArrayTy->getElementType());
1345 auto *FlexibleArrayMemberElementSize =
1346 llvm::ConstantInt::get(Ty: ResType, V: BaseSize.getQuantity(), IsSigned);
1347
1348 // flexible_array_member_size = count * flexible_array_member_element_size;
1349 Value *FlexibleArrayMemberSize =
1350 Builder.CreateMul(LHS: Count, RHS: FlexibleArrayMemberElementSize,
1351 Name: "flexible_array_member_size", HasNUW: !IsSigned, HasNSW: IsSigned);
1352
1353 Value *Result = nullptr;
1354 if (FlexibleArrayMemberFD == FD) {
1355 if (Idx) { // Option (2) '&((cast) ptr->array)[idx]'
1356 // casted_flexible_array_member_element_size =
1357 // sizeof (*((cast) ptr->array));
1358 llvm::ConstantInt *CastedFlexibleArrayMemberElementSize =
1359 FlexibleArrayMemberElementSize;
1360 if (!CastedArrayElementTy.isNull() &&
1361 CastedArrayElementTy->isPointerType()) {
1362 CharUnits BaseSize =
1363 Ctx.getTypeSizeInChars(T: CastedArrayElementTy->getPointeeType());
1364 CastedFlexibleArrayMemberElementSize =
1365 llvm::ConstantInt::get(Ty: ResType, V: BaseSize.getQuantity(), IsSigned);
1366 }
1367
1368 // index_size = index * casted_flexible_array_member_element_size;
1369 Value *IndexSize =
1370 Builder.CreateMul(LHS: Index, RHS: CastedFlexibleArrayMemberElementSize,
1371 Name: "index_size", HasNUW: !IsSigned, HasNSW: IsSigned);
1372
1373 // result = flexible_array_member_size - index_size;
1374 Result = Builder.CreateSub(LHS: FlexibleArrayMemberSize, RHS: IndexSize, Name: "result",
1375 HasNUW: !IsSigned, HasNSW: IsSigned);
1376 } else { // Option (1) 'ptr->array'
1377 // result = flexible_array_member_size;
1378 Result = FlexibleArrayMemberSize;
1379 }
1380 } else {
1381 // sizeof_struct = sizeof (struct s);
1382 llvm::StructType *StructTy = getTypes().getCGRecordLayout(RD).getLLVMType();
1383 const llvm::DataLayout &Layout = CGM.getDataLayout();
1384 TypeSize Size = Layout.getTypeSizeInBits(Ty: StructTy);
1385 Value *SizeofStruct =
1386 llvm::ConstantInt::get(Ty: ResType, V: Size.getKnownMinValue() / CharWidth);
1387
1388 if (Idx) { // Option (4) '&((cast) ptr->field_array)[idx]'
1389 // casted_field_element_size = sizeof (*((cast) ptr->field_array));
1390 CharUnits BaseSize;
1391 if (!CastedArrayElementTy.isNull() &&
1392 CastedArrayElementTy->isPointerType()) {
1393 BaseSize =
1394 Ctx.getTypeSizeInChars(T: CastedArrayElementTy->getPointeeType());
1395 } else {
1396 const ArrayType *ArrayTy = Ctx.getAsArrayType(T: FD->getType());
1397 BaseSize = Ctx.getTypeSizeInChars(T: ArrayTy->getElementType());
1398 }
1399
1400 llvm::ConstantInt *CastedFieldElementSize =
1401 llvm::ConstantInt::get(Ty: ResType, V: BaseSize.getQuantity(), IsSigned);
1402
1403 // field_offset += index * casted_field_element_size;
1404 Value *Mul = Builder.CreateMul(LHS: Index, RHS: CastedFieldElementSize,
1405 Name: "field_offset", HasNUW: !IsSigned, HasNSW: IsSigned);
1406 FieldOffset = Builder.CreateAdd(LHS: FieldOffset, RHS: Mul);
1407 }
1408 // Option (3) '&ptr->field', and Option (4) continuation.
1409 // offset_diff = flexible_array_member_offset - field_offset;
1410 Value *OffsetDiff = Builder.CreateSub(LHS: SizeofStruct, RHS: FieldOffset,
1411 Name: "offset_diff", HasNUW: !IsSigned, HasNSW: IsSigned);
1412
1413 // result = offset_diff + flexible_array_member_size;
1414 Result = Builder.CreateAdd(LHS: FlexibleArrayMemberSize, RHS: OffsetDiff, Name: "result");
1415 }
1416
1417 return EmitPositiveResultOrZero(CGF&: *this, Res: Result, Index, ResType, IsSigned);
1418}
1419
1420/// Returns a Value corresponding to the size of the given expression.
1421/// This Value may be either of the following:
1422/// - A llvm::Argument (if E is a param with the pass_object_size attribute on
1423/// it)
1424/// - A call to the @llvm.objectsize intrinsic
1425///
1426/// EmittedE is the result of emitting `E` as a scalar expr. If it's non-null
1427/// and we wouldn't otherwise try to reference a pass_object_size parameter,
1428/// we'll call @llvm.objectsize on EmittedE, rather than emitting E.
1429llvm::Value *
1430CodeGenFunction::emitBuiltinObjectSize(const Expr *E, unsigned Type,
1431 llvm::IntegerType *ResType,
1432 llvm::Value *EmittedE, bool IsDynamic) {
1433 // We need to reference an argument if the pointer is a parameter with the
1434 // pass_object_size attribute.
1435 if (auto *D = dyn_cast<DeclRefExpr>(Val: E->IgnoreParenImpCasts())) {
1436 auto *Param = dyn_cast<ParmVarDecl>(Val: D->getDecl());
1437 auto *PS = D->getDecl()->getAttr<PassObjectSizeAttr>();
1438 if (Param != nullptr && PS != nullptr &&
1439 areBOSTypesCompatible(From: PS->getType(), To: Type)) {
1440 auto Iter = SizeArguments.find(Val: Param);
1441 assert(Iter != SizeArguments.end());
1442
1443 const ImplicitParamDecl *D = Iter->second;
1444 auto DIter = LocalDeclMap.find(Val: D);
1445 assert(DIter != LocalDeclMap.end());
1446
1447 return EmitLoadOfScalar(Addr: DIter->second, /*Volatile=*/false,
1448 Ty: getContext().getSizeType(), Loc: E->getBeginLoc());
1449 }
1450 }
1451
1452 // LLVM can't handle Type=3 appropriately, and __builtin_object_size shouldn't
1453 // evaluate E for side-effects. In either case, we shouldn't lower to
1454 // @llvm.objectsize.
1455 if (Type == 3 || (!EmittedE && E->HasSideEffects(Ctx: getContext())))
1456 return getDefaultBuiltinObjectSizeResult(Type, ResType);
1457
1458 Value *Ptr = EmittedE ? EmittedE : EmitScalarExpr(E);
1459 assert(Ptr->getType()->isPointerTy() &&
1460 "Non-pointer passed to __builtin_object_size?");
1461
1462 if (IsDynamic)
1463 // Emit special code for a flexible array member with the "counted_by"
1464 // attribute.
1465 if (Value *V = emitCountedBySize(E, EmittedE: Ptr, Type, ResType))
1466 return V;
1467
1468 Function *F =
1469 CGM.getIntrinsic(IID: Intrinsic::objectsize, Tys: {ResType, Ptr->getType()});
1470
1471 // LLVM only supports 0 and 2, make sure that we pass along that as a boolean.
1472 Value *Min = Builder.getInt1(V: (Type & 2) != 0);
1473 // For GCC compatibility, __builtin_object_size treat NULL as unknown size.
1474 Value *NullIsUnknown = Builder.getTrue();
1475 Value *Dynamic = Builder.getInt1(V: IsDynamic);
1476 return Builder.CreateCall(Callee: F, Args: {Ptr, Min, NullIsUnknown, Dynamic});
1477}
1478
1479namespace {
1480/// A struct to generically describe a bit test intrinsic.
1481struct BitTest {
1482 enum ActionKind : uint8_t { TestOnly, Complement, Reset, Set };
1483 enum InterlockingKind : uint8_t {
1484 Unlocked,
1485 Sequential,
1486 Acquire,
1487 Release,
1488 NoFence
1489 };
1490
1491 ActionKind Action;
1492 InterlockingKind Interlocking;
1493 bool Is64Bit;
1494
1495 static BitTest decodeBitTestBuiltin(unsigned BuiltinID);
1496};
1497
1498} // namespace
1499
1500BitTest BitTest::decodeBitTestBuiltin(unsigned BuiltinID) {
1501 switch (BuiltinID) {
1502 // Main portable variants.
1503 case Builtin::BI_bittest:
1504 return {.Action: TestOnly, .Interlocking: Unlocked, .Is64Bit: false};
1505 case Builtin::BI_bittestandcomplement:
1506 return {.Action: Complement, .Interlocking: Unlocked, .Is64Bit: false};
1507 case Builtin::BI_bittestandreset:
1508 return {.Action: Reset, .Interlocking: Unlocked, .Is64Bit: false};
1509 case Builtin::BI_bittestandset:
1510 return {.Action: Set, .Interlocking: Unlocked, .Is64Bit: false};
1511 case Builtin::BI_interlockedbittestandreset:
1512 return {.Action: Reset, .Interlocking: Sequential, .Is64Bit: false};
1513 case Builtin::BI_interlockedbittestandset:
1514 return {.Action: Set, .Interlocking: Sequential, .Is64Bit: false};
1515
1516 // 64-bit variants.
1517 case Builtin::BI_bittest64:
1518 return {.Action: TestOnly, .Interlocking: Unlocked, .Is64Bit: true};
1519 case Builtin::BI_bittestandcomplement64:
1520 return {.Action: Complement, .Interlocking: Unlocked, .Is64Bit: true};
1521 case Builtin::BI_bittestandreset64:
1522 return {.Action: Reset, .Interlocking: Unlocked, .Is64Bit: true};
1523 case Builtin::BI_bittestandset64:
1524 return {.Action: Set, .Interlocking: Unlocked, .Is64Bit: true};
1525 case Builtin::BI_interlockedbittestandreset64:
1526 return {.Action: Reset, .Interlocking: Sequential, .Is64Bit: true};
1527 case Builtin::BI_interlockedbittestandset64:
1528 return {.Action: Set, .Interlocking: Sequential, .Is64Bit: true};
1529
1530 // ARM/AArch64-specific ordering variants.
1531 case Builtin::BI_interlockedbittestandset_acq:
1532 return {.Action: Set, .Interlocking: Acquire, .Is64Bit: false};
1533 case Builtin::BI_interlockedbittestandset_rel:
1534 return {.Action: Set, .Interlocking: Release, .Is64Bit: false};
1535 case Builtin::BI_interlockedbittestandset_nf:
1536 return {.Action: Set, .Interlocking: NoFence, .Is64Bit: false};
1537 case Builtin::BI_interlockedbittestandreset_acq:
1538 return {.Action: Reset, .Interlocking: Acquire, .Is64Bit: false};
1539 case Builtin::BI_interlockedbittestandreset_rel:
1540 return {.Action: Reset, .Interlocking: Release, .Is64Bit: false};
1541 case Builtin::BI_interlockedbittestandreset_nf:
1542 return {.Action: Reset, .Interlocking: NoFence, .Is64Bit: false};
1543 case Builtin::BI_interlockedbittestandreset64_acq:
1544 return {.Action: Reset, .Interlocking: Acquire, .Is64Bit: false};
1545 case Builtin::BI_interlockedbittestandreset64_rel:
1546 return {.Action: Reset, .Interlocking: Release, .Is64Bit: false};
1547 case Builtin::BI_interlockedbittestandreset64_nf:
1548 return {.Action: Reset, .Interlocking: NoFence, .Is64Bit: false};
1549 case Builtin::BI_interlockedbittestandset64_acq:
1550 return {.Action: Set, .Interlocking: Acquire, .Is64Bit: false};
1551 case Builtin::BI_interlockedbittestandset64_rel:
1552 return {.Action: Set, .Interlocking: Release, .Is64Bit: false};
1553 case Builtin::BI_interlockedbittestandset64_nf:
1554 return {.Action: Set, .Interlocking: NoFence, .Is64Bit: false};
1555 }
1556 llvm_unreachable("expected only bittest intrinsics");
1557}
1558
1559static char bitActionToX86BTCode(BitTest::ActionKind A) {
1560 switch (A) {
1561 case BitTest::TestOnly: return '\0';
1562 case BitTest::Complement: return 'c';
1563 case BitTest::Reset: return 'r';
1564 case BitTest::Set: return 's';
1565 }
1566 llvm_unreachable("invalid action");
1567}
1568
1569static llvm::Value *EmitX86BitTestIntrinsic(CodeGenFunction &CGF,
1570 BitTest BT,
1571 const CallExpr *E, Value *BitBase,
1572 Value *BitPos) {
1573 char Action = bitActionToX86BTCode(A: BT.Action);
1574 char SizeSuffix = BT.Is64Bit ? 'q' : 'l';
1575
1576 // Build the assembly.
1577 SmallString<64> Asm;
1578 raw_svector_ostream AsmOS(Asm);
1579 if (BT.Interlocking != BitTest::Unlocked)
1580 AsmOS << "lock ";
1581 AsmOS << "bt";
1582 if (Action)
1583 AsmOS << Action;
1584 AsmOS << SizeSuffix << " $2, ($1)";
1585
1586 // Build the constraints. FIXME: We should support immediates when possible.
1587 std::string Constraints = "={@ccc},r,r,~{cc},~{memory}";
1588 std::string_view MachineClobbers = CGF.getTarget().getClobbers();
1589 if (!MachineClobbers.empty()) {
1590 Constraints += ',';
1591 Constraints += MachineClobbers;
1592 }
1593 llvm::IntegerType *IntType = llvm::IntegerType::get(
1594 C&: CGF.getLLVMContext(),
1595 NumBits: CGF.getContext().getTypeSize(T: E->getArg(Arg: 1)->getType()));
1596 llvm::FunctionType *FTy =
1597 llvm::FunctionType::get(Result: CGF.Int8Ty, Params: {CGF.DefaultPtrTy, IntType}, isVarArg: false);
1598
1599 llvm::InlineAsm *IA =
1600 llvm::InlineAsm::get(Ty: FTy, AsmString: Asm, Constraints, /*hasSideEffects=*/true);
1601 return CGF.Builder.CreateCall(Callee: IA, Args: {BitBase, BitPos});
1602}
1603
1604static llvm::AtomicOrdering
1605getBitTestAtomicOrdering(BitTest::InterlockingKind I) {
1606 switch (I) {
1607 case BitTest::Unlocked: return llvm::AtomicOrdering::NotAtomic;
1608 case BitTest::Sequential: return llvm::AtomicOrdering::SequentiallyConsistent;
1609 case BitTest::Acquire: return llvm::AtomicOrdering::Acquire;
1610 case BitTest::Release: return llvm::AtomicOrdering::Release;
1611 case BitTest::NoFence: return llvm::AtomicOrdering::Monotonic;
1612 }
1613 llvm_unreachable("invalid interlocking");
1614}
1615
1616static llvm::Value *EmitBitCountExpr(CodeGenFunction &CGF, const Expr *E) {
1617 llvm::Value *ArgValue = CGF.EmitScalarExpr(E);
1618 llvm::Type *ArgType = ArgValue->getType();
1619
1620 // Boolean vectors can be casted directly to its bitfield representation. We
1621 // intentionally do not round up to the next power of two size and let LLVM
1622 // handle the trailing bits.
1623 if (auto *VT = dyn_cast<llvm::FixedVectorType>(Val: ArgType);
1624 VT && VT->getElementType()->isIntegerTy(BitWidth: 1)) {
1625 llvm::Type *StorageType =
1626 llvm::Type::getIntNTy(C&: CGF.getLLVMContext(), N: VT->getNumElements());
1627 ArgValue = CGF.Builder.CreateBitCast(V: ArgValue, DestTy: StorageType);
1628 }
1629
1630 return ArgValue;
1631}
1632
1633/// Emit a _bittest* intrinsic. These intrinsics take a pointer to an array of
1634/// bits and a bit position and read and optionally modify the bit at that
1635/// position. The position index can be arbitrarily large, i.e. it can be larger
1636/// than 31 or 63, so we need an indexed load in the general case.
1637static llvm::Value *EmitBitTestIntrinsic(CodeGenFunction &CGF,
1638 unsigned BuiltinID,
1639 const CallExpr *E) {
1640 Value *BitBase = CGF.EmitScalarExpr(E: E->getArg(Arg: 0));
1641 Value *BitPos = CGF.EmitScalarExpr(E: E->getArg(Arg: 1));
1642
1643 BitTest BT = BitTest::decodeBitTestBuiltin(BuiltinID);
1644
1645 // X86 has special BT, BTC, BTR, and BTS instructions that handle the array
1646 // indexing operation internally. Use them if possible.
1647 if (CGF.getTarget().getTriple().isX86())
1648 return EmitX86BitTestIntrinsic(CGF, BT, E, BitBase, BitPos);
1649
1650 // Otherwise, use generic code to load one byte and test the bit. Use all but
1651 // the bottom three bits as the array index, and the bottom three bits to form
1652 // a mask.
1653 // Bit = BitBaseI8[BitPos >> 3] & (1 << (BitPos & 0x7)) != 0;
1654 Value *ByteIndex = CGF.Builder.CreateAShr(
1655 LHS: BitPos, RHS: llvm::ConstantInt::get(Ty: BitPos->getType(), V: 3), Name: "bittest.byteidx");
1656 Address ByteAddr(CGF.Builder.CreateInBoundsGEP(Ty: CGF.Int8Ty, Ptr: BitBase, IdxList: ByteIndex,
1657 Name: "bittest.byteaddr"),
1658 CGF.Int8Ty, CharUnits::One());
1659 Value *PosLow =
1660 CGF.Builder.CreateAnd(LHS: CGF.Builder.CreateTrunc(V: BitPos, DestTy: CGF.Int8Ty),
1661 RHS: llvm::ConstantInt::get(Ty: CGF.Int8Ty, V: 0x7));
1662
1663 // The updating instructions will need a mask.
1664 Value *Mask = nullptr;
1665 if (BT.Action != BitTest::TestOnly) {
1666 Mask = CGF.Builder.CreateShl(LHS: llvm::ConstantInt::get(Ty: CGF.Int8Ty, V: 1), RHS: PosLow,
1667 Name: "bittest.mask");
1668 }
1669
1670 // Check the action and ordering of the interlocked intrinsics.
1671 llvm::AtomicOrdering Ordering = getBitTestAtomicOrdering(I: BT.Interlocking);
1672
1673 Value *OldByte = nullptr;
1674 if (Ordering != llvm::AtomicOrdering::NotAtomic) {
1675 // Emit a combined atomicrmw load/store operation for the interlocked
1676 // intrinsics.
1677 llvm::AtomicRMWInst::BinOp RMWOp = llvm::AtomicRMWInst::Or;
1678 if (BT.Action == BitTest::Reset) {
1679 Mask = CGF.Builder.CreateNot(V: Mask);
1680 RMWOp = llvm::AtomicRMWInst::And;
1681 }
1682 OldByte = CGF.Builder.CreateAtomicRMW(Op: RMWOp, Addr: ByteAddr, Val: Mask, Ordering);
1683 } else {
1684 // Emit a plain load for the non-interlocked intrinsics.
1685 OldByte = CGF.Builder.CreateLoad(Addr: ByteAddr, Name: "bittest.byte");
1686 Value *NewByte = nullptr;
1687 switch (BT.Action) {
1688 case BitTest::TestOnly:
1689 // Don't store anything.
1690 break;
1691 case BitTest::Complement:
1692 NewByte = CGF.Builder.CreateXor(LHS: OldByte, RHS: Mask);
1693 break;
1694 case BitTest::Reset:
1695 NewByte = CGF.Builder.CreateAnd(LHS: OldByte, RHS: CGF.Builder.CreateNot(V: Mask));
1696 break;
1697 case BitTest::Set:
1698 NewByte = CGF.Builder.CreateOr(LHS: OldByte, RHS: Mask);
1699 break;
1700 }
1701 if (NewByte)
1702 CGF.Builder.CreateStore(Val: NewByte, Addr: ByteAddr);
1703 }
1704
1705 // However we loaded the old byte, either by plain load or atomicrmw, shift
1706 // the bit into the low position and mask it to 0 or 1.
1707 Value *ShiftedByte = CGF.Builder.CreateLShr(LHS: OldByte, RHS: PosLow, Name: "bittest.shr");
1708 return CGF.Builder.CreateAnd(
1709 LHS: ShiftedByte, RHS: llvm::ConstantInt::get(Ty: CGF.Int8Ty, V: 1), Name: "bittest.res");
1710}
1711
1712namespace {
1713enum class MSVCSetJmpKind {
1714 _setjmpex,
1715 _setjmp3,
1716 _setjmp
1717};
1718}
1719
1720/// MSVC handles setjmp a bit differently on different platforms. On every
1721/// architecture except 32-bit x86, the frame address is passed. On x86, extra
1722/// parameters can be passed as variadic arguments, but we always pass none.
1723static RValue EmitMSVCRTSetJmp(CodeGenFunction &CGF, MSVCSetJmpKind SJKind,
1724 const CallExpr *E) {
1725 llvm::Value *Arg1 = nullptr;
1726 llvm::Type *Arg1Ty = nullptr;
1727 StringRef Name;
1728 bool IsVarArg = false;
1729 if (SJKind == MSVCSetJmpKind::_setjmp3) {
1730 Name = "_setjmp3";
1731 Arg1Ty = CGF.Int32Ty;
1732 Arg1 = llvm::ConstantInt::get(Ty: CGF.IntTy, V: 0);
1733 IsVarArg = true;
1734 } else {
1735 Name = SJKind == MSVCSetJmpKind::_setjmp ? "_setjmp" : "_setjmpex";
1736 Arg1Ty = CGF.Int8PtrTy;
1737 if (CGF.getTarget().getTriple().getArch() == llvm::Triple::aarch64) {
1738 Arg1 = CGF.Builder.CreateCall(
1739 Callee: CGF.CGM.getIntrinsic(IID: Intrinsic::sponentry, Tys: CGF.AllocaInt8PtrTy));
1740 } else
1741 Arg1 = CGF.Builder.CreateCall(
1742 Callee: CGF.CGM.getIntrinsic(IID: Intrinsic::frameaddress, Tys: CGF.AllocaInt8PtrTy),
1743 Args: llvm::ConstantInt::get(Ty: CGF.Int32Ty, V: 0));
1744 }
1745
1746 // Mark the call site and declaration with ReturnsTwice.
1747 llvm::Type *ArgTypes[2] = {CGF.Int8PtrTy, Arg1Ty};
1748 llvm::AttributeList ReturnsTwiceAttr = llvm::AttributeList::get(
1749 C&: CGF.getLLVMContext(), Index: llvm::AttributeList::FunctionIndex,
1750 Kinds: llvm::Attribute::ReturnsTwice);
1751 llvm::FunctionCallee SetJmpFn = CGF.CGM.CreateRuntimeFunction(
1752 Ty: llvm::FunctionType::get(Result: CGF.IntTy, Params: ArgTypes, isVarArg: IsVarArg), Name,
1753 ExtraAttrs: ReturnsTwiceAttr, /*Local=*/true);
1754
1755 llvm::Value *Buf = CGF.Builder.CreateBitOrPointerCast(
1756 V: CGF.EmitScalarExpr(E: E->getArg(Arg: 0)), DestTy: CGF.Int8PtrTy);
1757 llvm::Value *Args[] = {Buf, Arg1};
1758 llvm::CallBase *CB = CGF.EmitRuntimeCallOrInvoke(callee: SetJmpFn, args: Args);
1759 CB->setAttributes(ReturnsTwiceAttr);
1760 return RValue::get(V: CB);
1761}
1762
1763// Emit an MSVC intrinsic. Assumes that arguments have *not* been evaluated.
1764Value *CodeGenFunction::EmitMSVCBuiltinExpr(MSVCIntrin BuiltinID,
1765 const CallExpr *E) {
1766 switch (BuiltinID) {
1767 case MSVCIntrin::_BitScanForward:
1768 case MSVCIntrin::_BitScanReverse: {
1769 Address IndexAddress(EmitPointerWithAlignment(Addr: E->getArg(Arg: 0)));
1770 Value *ArgValue = EmitScalarExpr(E: E->getArg(Arg: 1));
1771
1772 llvm::Type *ArgType = ArgValue->getType();
1773 llvm::Type *IndexType = IndexAddress.getElementType();
1774 llvm::Type *ResultType = ConvertType(T: E->getType());
1775
1776 Value *ArgZero = llvm::Constant::getNullValue(Ty: ArgType);
1777 Value *ResZero = llvm::Constant::getNullValue(Ty: ResultType);
1778 Value *ResOne = llvm::ConstantInt::get(Ty: ResultType, V: 1);
1779
1780 BasicBlock *Begin = Builder.GetInsertBlock();
1781 BasicBlock *End = createBasicBlock(name: "bitscan_end", parent: this->CurFn);
1782 Builder.SetInsertPoint(End);
1783 PHINode *Result = Builder.CreatePHI(Ty: ResultType, NumReservedValues: 2, Name: "bitscan_result");
1784
1785 Builder.SetInsertPoint(Begin);
1786 Value *IsZero = Builder.CreateICmpEQ(LHS: ArgValue, RHS: ArgZero);
1787 BasicBlock *NotZero = createBasicBlock(name: "bitscan_not_zero", parent: this->CurFn);
1788 Builder.CreateCondBr(Cond: IsZero, True: End, False: NotZero);
1789 Result->addIncoming(V: ResZero, BB: Begin);
1790
1791 Builder.SetInsertPoint(NotZero);
1792
1793 if (BuiltinID == MSVCIntrin::_BitScanForward) {
1794 Function *F = CGM.getIntrinsic(IID: Intrinsic::cttz, Tys: ArgType);
1795 Value *ZeroCount = Builder.CreateCall(Callee: F, Args: {ArgValue, Builder.getTrue()});
1796 ZeroCount = Builder.CreateIntCast(V: ZeroCount, DestTy: IndexType, isSigned: false);
1797 Builder.CreateStore(Val: ZeroCount, Addr: IndexAddress, IsVolatile: false);
1798 } else {
1799 unsigned ArgWidth = cast<llvm::IntegerType>(Val: ArgType)->getBitWidth();
1800 Value *ArgTypeLastIndex = llvm::ConstantInt::get(Ty: IndexType, V: ArgWidth - 1);
1801
1802 Function *F = CGM.getIntrinsic(IID: Intrinsic::ctlz, Tys: ArgType);
1803 Value *ZeroCount = Builder.CreateCall(Callee: F, Args: {ArgValue, Builder.getTrue()});
1804 ZeroCount = Builder.CreateIntCast(V: ZeroCount, DestTy: IndexType, isSigned: false);
1805 Value *Index = Builder.CreateNSWSub(LHS: ArgTypeLastIndex, RHS: ZeroCount);
1806 Builder.CreateStore(Val: Index, Addr: IndexAddress, IsVolatile: false);
1807 }
1808 Builder.CreateBr(Dest: End);
1809 Result->addIncoming(V: ResOne, BB: NotZero);
1810
1811 Builder.SetInsertPoint(End);
1812 return Result;
1813 }
1814 case MSVCIntrin::_InterlockedAnd:
1815 return MakeBinaryAtomicValue(CGF&: *this, Kind: AtomicRMWInst::And, E);
1816 case MSVCIntrin::_InterlockedExchange:
1817 return MakeBinaryAtomicValue(CGF&: *this, Kind: AtomicRMWInst::Xchg, E);
1818 case MSVCIntrin::_InterlockedExchangeAdd:
1819 return MakeBinaryAtomicValue(CGF&: *this, Kind: AtomicRMWInst::Add, E);
1820 case MSVCIntrin::_InterlockedExchangeSub:
1821 return MakeBinaryAtomicValue(CGF&: *this, Kind: AtomicRMWInst::Sub, E);
1822 case MSVCIntrin::_InterlockedOr:
1823 return MakeBinaryAtomicValue(CGF&: *this, Kind: AtomicRMWInst::Or, E);
1824 case MSVCIntrin::_InterlockedXor:
1825 return MakeBinaryAtomicValue(CGF&: *this, Kind: AtomicRMWInst::Xor, E);
1826 case MSVCIntrin::_InterlockedExchangeAdd_acq:
1827 return MakeBinaryAtomicValue(CGF&: *this, Kind: AtomicRMWInst::Add, E,
1828 Ordering: AtomicOrdering::Acquire);
1829 case MSVCIntrin::_InterlockedExchangeAdd_rel:
1830 return MakeBinaryAtomicValue(CGF&: *this, Kind: AtomicRMWInst::Add, E,
1831 Ordering: AtomicOrdering::Release);
1832 case MSVCIntrin::_InterlockedExchangeAdd_nf:
1833 return MakeBinaryAtomicValue(CGF&: *this, Kind: AtomicRMWInst::Add, E,
1834 Ordering: AtomicOrdering::Monotonic);
1835 case MSVCIntrin::_InterlockedExchange_acq:
1836 return MakeBinaryAtomicValue(CGF&: *this, Kind: AtomicRMWInst::Xchg, E,
1837 Ordering: AtomicOrdering::Acquire);
1838 case MSVCIntrin::_InterlockedExchange_rel:
1839 return MakeBinaryAtomicValue(CGF&: *this, Kind: AtomicRMWInst::Xchg, E,
1840 Ordering: AtomicOrdering::Release);
1841 case MSVCIntrin::_InterlockedExchange_nf:
1842 return MakeBinaryAtomicValue(CGF&: *this, Kind: AtomicRMWInst::Xchg, E,
1843 Ordering: AtomicOrdering::Monotonic);
1844 case MSVCIntrin::_InterlockedCompareExchange:
1845 return EmitAtomicCmpXchgForMSIntrin(CGF&: *this, E);
1846 case MSVCIntrin::_InterlockedCompareExchange_acq:
1847 return EmitAtomicCmpXchgForMSIntrin(CGF&: *this, E, SuccessOrdering: AtomicOrdering::Acquire);
1848 case MSVCIntrin::_InterlockedCompareExchange_rel:
1849 return EmitAtomicCmpXchgForMSIntrin(CGF&: *this, E, SuccessOrdering: AtomicOrdering::Release);
1850 case MSVCIntrin::_InterlockedCompareExchange_nf:
1851 return EmitAtomicCmpXchgForMSIntrin(CGF&: *this, E, SuccessOrdering: AtomicOrdering::Monotonic);
1852 case MSVCIntrin::_InterlockedCompareExchange128:
1853 return EmitAtomicCmpXchg128ForMSIntrin(
1854 CGF&: *this, E, SuccessOrdering: AtomicOrdering::SequentiallyConsistent);
1855 case MSVCIntrin::_InterlockedCompareExchange128_acq:
1856 return EmitAtomicCmpXchg128ForMSIntrin(CGF&: *this, E, SuccessOrdering: AtomicOrdering::Acquire);
1857 case MSVCIntrin::_InterlockedCompareExchange128_rel:
1858 return EmitAtomicCmpXchg128ForMSIntrin(CGF&: *this, E, SuccessOrdering: AtomicOrdering::Release);
1859 case MSVCIntrin::_InterlockedCompareExchange128_nf:
1860 return EmitAtomicCmpXchg128ForMSIntrin(CGF&: *this, E, SuccessOrdering: AtomicOrdering::Monotonic);
1861 case MSVCIntrin::_InterlockedOr_acq:
1862 return MakeBinaryAtomicValue(CGF&: *this, Kind: AtomicRMWInst::Or, E,
1863 Ordering: AtomicOrdering::Acquire);
1864 case MSVCIntrin::_InterlockedOr_rel:
1865 return MakeBinaryAtomicValue(CGF&: *this, Kind: AtomicRMWInst::Or, E,
1866 Ordering: AtomicOrdering::Release);
1867 case MSVCIntrin::_InterlockedOr_nf:
1868 return MakeBinaryAtomicValue(CGF&: *this, Kind: AtomicRMWInst::Or, E,
1869 Ordering: AtomicOrdering::Monotonic);
1870 case MSVCIntrin::_InterlockedXor_acq:
1871 return MakeBinaryAtomicValue(CGF&: *this, Kind: AtomicRMWInst::Xor, E,
1872 Ordering: AtomicOrdering::Acquire);
1873 case MSVCIntrin::_InterlockedXor_rel:
1874 return MakeBinaryAtomicValue(CGF&: *this, Kind: AtomicRMWInst::Xor, E,
1875 Ordering: AtomicOrdering::Release);
1876 case MSVCIntrin::_InterlockedXor_nf:
1877 return MakeBinaryAtomicValue(CGF&: *this, Kind: AtomicRMWInst::Xor, E,
1878 Ordering: AtomicOrdering::Monotonic);
1879 case MSVCIntrin::_InterlockedAnd_acq:
1880 return MakeBinaryAtomicValue(CGF&: *this, Kind: AtomicRMWInst::And, E,
1881 Ordering: AtomicOrdering::Acquire);
1882 case MSVCIntrin::_InterlockedAnd_rel:
1883 return MakeBinaryAtomicValue(CGF&: *this, Kind: AtomicRMWInst::And, E,
1884 Ordering: AtomicOrdering::Release);
1885 case MSVCIntrin::_InterlockedAnd_nf:
1886 return MakeBinaryAtomicValue(CGF&: *this, Kind: AtomicRMWInst::And, E,
1887 Ordering: AtomicOrdering::Monotonic);
1888 case MSVCIntrin::_InterlockedIncrement_acq:
1889 return EmitAtomicIncrementValue(CGF&: *this, E, Ordering: AtomicOrdering::Acquire);
1890 case MSVCIntrin::_InterlockedIncrement_rel:
1891 return EmitAtomicIncrementValue(CGF&: *this, E, Ordering: AtomicOrdering::Release);
1892 case MSVCIntrin::_InterlockedIncrement_nf:
1893 return EmitAtomicIncrementValue(CGF&: *this, E, Ordering: AtomicOrdering::Monotonic);
1894 case MSVCIntrin::_InterlockedDecrement_acq:
1895 return EmitAtomicDecrementValue(CGF&: *this, E, Ordering: AtomicOrdering::Acquire);
1896 case MSVCIntrin::_InterlockedDecrement_rel:
1897 return EmitAtomicDecrementValue(CGF&: *this, E, Ordering: AtomicOrdering::Release);
1898 case MSVCIntrin::_InterlockedDecrement_nf:
1899 return EmitAtomicDecrementValue(CGF&: *this, E, Ordering: AtomicOrdering::Monotonic);
1900
1901 case MSVCIntrin::_InterlockedDecrement:
1902 return EmitAtomicDecrementValue(CGF&: *this, E);
1903 case MSVCIntrin::_InterlockedIncrement:
1904 return EmitAtomicIncrementValue(CGF&: *this, E);
1905
1906 case MSVCIntrin::__fastfail: {
1907 // Request immediate process termination from the kernel. The instruction
1908 // sequences to do this are documented on MSDN:
1909 // https://msdn.microsoft.com/en-us/library/dn774154.aspx
1910 llvm::Triple::ArchType ISA = getTarget().getTriple().getArch();
1911 StringRef Asm, Constraints;
1912 switch (ISA) {
1913 default:
1914 ErrorUnsupported(S: E, Type: "__fastfail call for this architecture");
1915 break;
1916 case llvm::Triple::x86:
1917 case llvm::Triple::x86_64:
1918 Asm = "int $$0x29";
1919 Constraints = "{cx}";
1920 break;
1921 case llvm::Triple::thumb:
1922 Asm = "udf #251";
1923 Constraints = "{r0}";
1924 break;
1925 case llvm::Triple::aarch64:
1926 Asm = "brk #0xF003";
1927 Constraints = "{w0}";
1928 }
1929 llvm::FunctionType *FTy = llvm::FunctionType::get(Result: VoidTy, Params: {Int32Ty}, isVarArg: false);
1930 llvm::InlineAsm *IA =
1931 llvm::InlineAsm::get(Ty: FTy, AsmString: Asm, Constraints, /*hasSideEffects=*/true);
1932 llvm::AttributeList NoReturnAttr = llvm::AttributeList::get(
1933 C&: getLLVMContext(), Index: llvm::AttributeList::FunctionIndex,
1934 Kinds: llvm::Attribute::NoReturn);
1935 llvm::CallInst *CI = Builder.CreateCall(Callee: IA, Args: EmitScalarExpr(E: E->getArg(Arg: 0)));
1936 CI->setAttributes(NoReturnAttr);
1937 return CI;
1938 }
1939 }
1940 llvm_unreachable("Incorrect MSVC intrinsic!");
1941}
1942
1943namespace {
1944// ARC cleanup for __builtin_os_log_format
1945struct CallObjCArcUse final : EHScopeStack::Cleanup {
1946 CallObjCArcUse(llvm::Value *object) : object(object) {}
1947 llvm::Value *object;
1948
1949 void Emit(CodeGenFunction &CGF, Flags flags) override {
1950 CGF.EmitARCIntrinsicUse(values: object);
1951 }
1952};
1953}
1954
1955Value *CodeGenFunction::EmitCheckedArgForBuiltin(const Expr *E,
1956 BuiltinCheckKind Kind) {
1957 assert((Kind == BCK_CLZPassedZero || Kind == BCK_CTZPassedZero) &&
1958 "Unsupported builtin check kind");
1959
1960 Value *ArgValue = EmitBitCountExpr(CGF&: *this, E);
1961 if (!SanOpts.has(K: SanitizerKind::Builtin))
1962 return ArgValue;
1963
1964 auto CheckOrdinal = SanitizerKind::SO_Builtin;
1965 auto CheckHandler = SanitizerHandler::InvalidBuiltin;
1966 SanitizerDebugLocation SanScope(this, {CheckOrdinal}, CheckHandler);
1967 Value *Cond = Builder.CreateICmpNE(
1968 LHS: ArgValue, RHS: llvm::Constant::getNullValue(Ty: ArgValue->getType()));
1969 EmitCheck(Checked: std::make_pair(x&: Cond, y&: CheckOrdinal), Check: CheckHandler,
1970 StaticArgs: {EmitCheckSourceLocation(Loc: E->getExprLoc()),
1971 llvm::ConstantInt::get(Ty: Builder.getInt8Ty(), V: Kind)},
1972 DynamicArgs: {});
1973 return ArgValue;
1974}
1975
1976Value *CodeGenFunction::EmitCheckedArgForAssume(const Expr *E) {
1977 Value *ArgValue = EvaluateExprAsBool(E);
1978 if (!SanOpts.has(K: SanitizerKind::Builtin))
1979 return ArgValue;
1980
1981 auto CheckOrdinal = SanitizerKind::SO_Builtin;
1982 auto CheckHandler = SanitizerHandler::InvalidBuiltin;
1983 SanitizerDebugLocation SanScope(this, {CheckOrdinal}, CheckHandler);
1984 EmitCheck(
1985 Checked: std::make_pair(x&: ArgValue, y&: CheckOrdinal), Check: CheckHandler,
1986 StaticArgs: {EmitCheckSourceLocation(Loc: E->getExprLoc()),
1987 llvm::ConstantInt::get(Ty: Builder.getInt8Ty(), V: BCK_AssumePassedFalse)},
1988 DynamicArgs: {});
1989 return ArgValue;
1990}
1991
1992static Value *EmitAbs(CodeGenFunction &CGF, Value *ArgValue, bool HasNSW) {
1993 return CGF.Builder.CreateBinaryIntrinsic(
1994 ID: Intrinsic::abs, LHS: ArgValue,
1995 RHS: ConstantInt::get(Ty: CGF.Builder.getInt1Ty(), V: HasNSW));
1996}
1997
1998static Value *EmitOverflowCheckedAbs(CodeGenFunction &CGF, const CallExpr *E,
1999 bool SanitizeOverflow) {
2000 Value *ArgValue = CGF.EmitScalarExpr(E: E->getArg(Arg: 0));
2001
2002 // Try to eliminate overflow check.
2003 if (const auto *VCI = dyn_cast<llvm::ConstantInt>(Val: ArgValue)) {
2004 if (!VCI->isMinSignedValue())
2005 return EmitAbs(CGF, ArgValue, HasNSW: true);
2006 }
2007
2008 SmallVector<SanitizerKind::SanitizerOrdinal, 1> Ordinals;
2009 SanitizerHandler CheckHandler;
2010 if (SanitizeOverflow) {
2011 Ordinals.push_back(Elt: SanitizerKind::SO_SignedIntegerOverflow);
2012 CheckHandler = SanitizerHandler::NegateOverflow;
2013 } else
2014 CheckHandler = SanitizerHandler::SubOverflow;
2015
2016 SanitizerDebugLocation SanScope(&CGF, Ordinals, CheckHandler);
2017
2018 Constant *Zero = Constant::getNullValue(Ty: ArgValue->getType());
2019 Value *ResultAndOverflow = CGF.Builder.CreateBinaryIntrinsic(
2020 ID: Intrinsic::ssub_with_overflow, LHS: Zero, RHS: ArgValue);
2021 Value *Result = CGF.Builder.CreateExtractValue(Agg: ResultAndOverflow, Idxs: 0);
2022 Value *NotOverflow = CGF.Builder.CreateNot(
2023 V: CGF.Builder.CreateExtractValue(Agg: ResultAndOverflow, Idxs: 1));
2024
2025 // TODO: support -ftrapv-handler.
2026 if (SanitizeOverflow) {
2027 CGF.EmitCheck(Checked: {{NotOverflow, SanitizerKind::SO_SignedIntegerOverflow}},
2028 Check: CheckHandler,
2029 StaticArgs: {CGF.EmitCheckSourceLocation(Loc: E->getArg(Arg: 0)->getExprLoc()),
2030 CGF.EmitCheckTypeDescriptor(T: E->getType())},
2031 DynamicArgs: {ArgValue});
2032 } else
2033 CGF.EmitTrapCheck(Checked: NotOverflow, CheckHandlerID: CheckHandler);
2034
2035 Value *CmpResult = CGF.Builder.CreateICmpSLT(LHS: ArgValue, RHS: Zero, Name: "abscond");
2036 return CGF.Builder.CreateSelect(C: CmpResult, True: Result, False: ArgValue, Name: "abs");
2037}
2038
2039/// Get the argument type for arguments to os_log_helper.
2040static CanQualType getOSLogArgType(ASTContext &C, int Size) {
2041 QualType UnsignedTy = C.getIntTypeForBitwidth(DestWidth: Size * 8, /*Signed=*/false);
2042 return C.getCanonicalType(T: UnsignedTy);
2043}
2044
2045llvm::Function *CodeGenFunction::generateBuiltinOSLogHelperFunction(
2046 const analyze_os_log::OSLogBufferLayout &Layout,
2047 CharUnits BufferAlignment) {
2048 ASTContext &Ctx = getContext();
2049
2050 llvm::SmallString<64> Name;
2051 {
2052 raw_svector_ostream OS(Name);
2053 OS << "__os_log_helper";
2054 OS << "_" << BufferAlignment.getQuantity();
2055 OS << "_" << int(Layout.getSummaryByte());
2056 OS << "_" << int(Layout.getNumArgsByte());
2057 for (const auto &Item : Layout.Items)
2058 OS << "_" << int(Item.getSizeByte()) << "_"
2059 << int(Item.getDescriptorByte());
2060 }
2061
2062 if (llvm::Function *F = CGM.getModule().getFunction(Name))
2063 return F;
2064
2065 llvm::SmallVector<QualType, 4> ArgTys;
2066 FunctionArgList Args;
2067 Args.push_back(Elt: ImplicitParamDecl::Create(
2068 C&: Ctx, DC: nullptr, IdLoc: SourceLocation(), Id: &Ctx.Idents.get(Name: "buffer"), T: Ctx.VoidPtrTy,
2069 ParamKind: ImplicitParamKind::Other));
2070 ArgTys.emplace_back(Args&: Ctx.VoidPtrTy);
2071
2072 for (unsigned int I = 0, E = Layout.Items.size(); I < E; ++I) {
2073 char Size = Layout.Items[I].getSizeByte();
2074 if (!Size)
2075 continue;
2076
2077 QualType ArgTy = getOSLogArgType(C&: Ctx, Size);
2078 Args.push_back(Elt: ImplicitParamDecl::Create(
2079 C&: Ctx, DC: nullptr, IdLoc: SourceLocation(),
2080 Id: &Ctx.Idents.get(Name: std::string("arg") + llvm::to_string(Value: I)), T: ArgTy,
2081 ParamKind: ImplicitParamKind::Other));
2082 ArgTys.emplace_back(Args&: ArgTy);
2083 }
2084
2085 QualType ReturnTy = Ctx.VoidTy;
2086
2087 // The helper function has linkonce_odr linkage to enable the linker to merge
2088 // identical functions. To ensure the merging always happens, 'noinline' is
2089 // attached to the function when compiling with -Oz.
2090 const CGFunctionInfo &FI =
2091 CGM.getTypes().arrangeBuiltinFunctionDeclaration(resultType: ReturnTy, args: Args);
2092 llvm::FunctionType *FuncTy = CGM.getTypes().GetFunctionType(Info: FI);
2093 llvm::Function *Fn = llvm::Function::Create(
2094 Ty: FuncTy, Linkage: llvm::GlobalValue::LinkOnceODRLinkage, N: Name, M: &CGM.getModule());
2095 Fn->setVisibility(llvm::GlobalValue::HiddenVisibility);
2096 CGM.SetLLVMFunctionAttributes(GD: GlobalDecl(), Info: FI, F: Fn, /*IsThunk=*/false);
2097 CGM.SetLLVMFunctionAttributesForDefinition(D: nullptr, F: Fn);
2098 Fn->setDoesNotThrow();
2099
2100 // Attach 'noinline' at -Oz.
2101 if (CGM.getCodeGenOpts().OptimizeSize == 2)
2102 Fn->addFnAttr(Kind: llvm::Attribute::NoInline);
2103
2104 auto NL = ApplyDebugLocation::CreateEmpty(CGF&: *this);
2105 StartFunction(GD: GlobalDecl(), RetTy: ReturnTy, Fn, FnInfo: FI, Args);
2106
2107 // Create a scope with an artificial location for the body of this function.
2108 auto AL = ApplyDebugLocation::CreateArtificial(CGF&: *this);
2109
2110 CharUnits Offset;
2111 Address BufAddr = makeNaturalAddressForPointer(
2112 Ptr: Builder.CreateLoad(Addr: GetAddrOfLocalVar(VD: Args[0]), Name: "buf"), T: Ctx.VoidTy,
2113 Alignment: BufferAlignment);
2114 Builder.CreateStore(Val: Builder.getInt8(C: Layout.getSummaryByte()),
2115 Addr: Builder.CreateConstByteGEP(Addr: BufAddr, Offset: Offset++, Name: "summary"));
2116 Builder.CreateStore(Val: Builder.getInt8(C: Layout.getNumArgsByte()),
2117 Addr: Builder.CreateConstByteGEP(Addr: BufAddr, Offset: Offset++, Name: "numArgs"));
2118
2119 unsigned I = 1;
2120 for (const auto &Item : Layout.Items) {
2121 Builder.CreateStore(
2122 Val: Builder.getInt8(C: Item.getDescriptorByte()),
2123 Addr: Builder.CreateConstByteGEP(Addr: BufAddr, Offset: Offset++, Name: "argDescriptor"));
2124 Builder.CreateStore(
2125 Val: Builder.getInt8(C: Item.getSizeByte()),
2126 Addr: Builder.CreateConstByteGEP(Addr: BufAddr, Offset: Offset++, Name: "argSize"));
2127
2128 CharUnits Size = Item.size();
2129 if (!Size.getQuantity())
2130 continue;
2131
2132 Address Arg = GetAddrOfLocalVar(VD: Args[I]);
2133 Address Addr = Builder.CreateConstByteGEP(Addr: BufAddr, Offset, Name: "argData");
2134 Addr = Addr.withElementType(ElemTy: Arg.getElementType());
2135 Builder.CreateStore(Val: Builder.CreateLoad(Addr: Arg), Addr);
2136 Offset += Size;
2137 ++I;
2138 }
2139
2140 FinishFunction();
2141
2142 return Fn;
2143}
2144
2145RValue CodeGenFunction::emitBuiltinOSLogFormat(const CallExpr &E) {
2146 assert(E.getNumArgs() >= 2 &&
2147 "__builtin_os_log_format takes at least 2 arguments");
2148 ASTContext &Ctx = getContext();
2149 analyze_os_log::OSLogBufferLayout Layout;
2150 analyze_os_log::computeOSLogBufferLayout(Ctx, E: &E, layout&: Layout);
2151 Address BufAddr = EmitPointerWithAlignment(Addr: E.getArg(Arg: 0));
2152
2153 // Ignore argument 1, the format string. It is not currently used.
2154 CallArgList Args;
2155 Args.add(rvalue: RValue::get(V: BufAddr.emitRawPointer(CGF&: *this)), type: Ctx.VoidPtrTy);
2156
2157 for (const auto &Item : Layout.Items) {
2158 int Size = Item.getSizeByte();
2159 if (!Size)
2160 continue;
2161
2162 llvm::Value *ArgVal;
2163
2164 if (Item.getKind() == analyze_os_log::OSLogBufferItem::MaskKind) {
2165 uint64_t Val = 0;
2166 for (unsigned I = 0, E = Item.getMaskType().size(); I < E; ++I)
2167 Val |= ((uint64_t)Item.getMaskType()[I]) << I * 8;
2168 ArgVal = llvm::Constant::getIntegerValue(Ty: Int64Ty, V: llvm::APInt(64, Val));
2169 } else if (const Expr *TheExpr = Item.getExpr()) {
2170 ArgVal = EmitScalarExpr(E: TheExpr, /*Ignore*/ IgnoreResultAssign: false);
2171
2172 // If a temporary object that requires destruction after the full
2173 // expression is passed, push a lifetime-extended cleanup to extend its
2174 // lifetime to the end of the enclosing block scope.
2175 auto LifetimeExtendObject = [&](const Expr *E) {
2176 E = E->IgnoreParenCasts();
2177 // Extend lifetimes of objects returned by function calls and message
2178 // sends.
2179
2180 // FIXME: We should do this in other cases in which temporaries are
2181 // created including arguments of non-ARC types (e.g., C++
2182 // temporaries).
2183 if (isa<CallExpr>(Val: E) || isa<ObjCMessageExpr>(Val: E))
2184 return true;
2185 return false;
2186 };
2187
2188 if (TheExpr->getType()->isObjCRetainableType() &&
2189 getLangOpts().ObjCAutoRefCount && LifetimeExtendObject(TheExpr)) {
2190 assert(getEvaluationKind(TheExpr->getType()) == TEK_Scalar &&
2191 "Only scalar can be a ObjC retainable type");
2192 if (!isa<Constant>(Val: ArgVal)) {
2193 CleanupKind Cleanup = getARCCleanupKind();
2194 QualType Ty = TheExpr->getType();
2195 RawAddress Alloca = CreateMemTempWithoutCast(T: Ty, Name: "os.log.arg");
2196 ArgVal = EmitARCRetain(type: Ty, value: ArgVal);
2197 Builder.CreateStore(Val: ArgVal, Addr: Alloca);
2198 pushLifetimeExtendedDestroy(kind: Cleanup, addr: Alloca, type: Ty,
2199 destroyer: CodeGenFunction::destroyARCStrongPrecise,
2200 useEHCleanupForArray: Cleanup & EHCleanup);
2201
2202 // Push a clang.arc.use call to ensure ARC optimizer knows that the
2203 // argument has to be alive.
2204 if (CGM.getCodeGenOpts().OptimizationLevel != 0)
2205 pushCleanupAfterFullExpr<CallObjCArcUse>(Kind: Cleanup, A: ArgVal);
2206 }
2207 }
2208 } else {
2209 ArgVal = Builder.getInt32(C: Item.getConstValue().getQuantity());
2210 }
2211
2212 unsigned ArgValSize =
2213 CGM.getDataLayout().getTypeSizeInBits(Ty: ArgVal->getType());
2214 llvm::IntegerType *IntTy = llvm::Type::getIntNTy(C&: getLLVMContext(),
2215 N: ArgValSize);
2216 ArgVal = Builder.CreateBitOrPointerCast(V: ArgVal, DestTy: IntTy);
2217 CanQualType ArgTy = getOSLogArgType(C&: Ctx, Size);
2218 // If ArgVal has type x86_fp80, zero-extend ArgVal.
2219 ArgVal = Builder.CreateZExtOrBitCast(V: ArgVal, DestTy: ConvertType(T: ArgTy));
2220 Args.add(rvalue: RValue::get(V: ArgVal), type: ArgTy);
2221 }
2222
2223 const CGFunctionInfo &FI =
2224 CGM.getTypes().arrangeBuiltinFunctionCall(resultType: Ctx.VoidTy, args: Args);
2225 llvm::Function *F = CodeGenFunction(CGM).generateBuiltinOSLogHelperFunction(
2226 Layout, BufferAlignment: BufAddr.getAlignment());
2227 EmitCall(CallInfo: FI, Callee: CGCallee::forDirect(functionPtr: F), ReturnValue: ReturnValueSlot(), Args);
2228 return RValue::get(Addr: BufAddr, CGF&: *this);
2229}
2230
2231static bool isSpecialUnsignedMultiplySignedResult(
2232 unsigned BuiltinID, WidthAndSignedness Op1Info, WidthAndSignedness Op2Info,
2233 WidthAndSignedness ResultInfo) {
2234 return BuiltinID == Builtin::BI__builtin_mul_overflow &&
2235 Op1Info.Width == Op2Info.Width && Op2Info.Width == ResultInfo.Width &&
2236 !Op1Info.Signed && !Op2Info.Signed && ResultInfo.Signed;
2237}
2238
2239static RValue EmitCheckedUnsignedMultiplySignedResult(
2240 CodeGenFunction &CGF, const clang::Expr *Op1, WidthAndSignedness Op1Info,
2241 const clang::Expr *Op2, WidthAndSignedness Op2Info,
2242 const clang::Expr *ResultArg, QualType ResultQTy,
2243 WidthAndSignedness ResultInfo) {
2244 assert(isSpecialUnsignedMultiplySignedResult(
2245 Builtin::BI__builtin_mul_overflow, Op1Info, Op2Info, ResultInfo) &&
2246 "Cannot specialize this multiply");
2247
2248 llvm::Value *V1 = CGF.EmitScalarExpr(E: Op1);
2249 llvm::Value *V2 = CGF.EmitScalarExpr(E: Op2);
2250
2251 llvm::Value *HasOverflow;
2252 llvm::Value *Result = EmitOverflowIntrinsic(
2253 CGF, IntrinsicID: Intrinsic::umul_with_overflow, X: V1, Y: V2, Carry&: HasOverflow);
2254
2255 // The intrinsic call will detect overflow when the value is > UINT_MAX,
2256 // however, since the original builtin had a signed result, we need to report
2257 // an overflow when the result is greater than INT_MAX.
2258 auto IntMax = llvm::APInt::getSignedMaxValue(numBits: ResultInfo.Width);
2259 llvm::Value *IntMaxValue = llvm::ConstantInt::get(Ty: Result->getType(), V: IntMax);
2260
2261 llvm::Value *IntMaxOverflow = CGF.Builder.CreateICmpUGT(LHS: Result, RHS: IntMaxValue);
2262 HasOverflow = CGF.Builder.CreateOr(LHS: HasOverflow, RHS: IntMaxOverflow);
2263
2264 bool isVolatile =
2265 ResultArg->getType()->getPointeeType().isVolatileQualified();
2266 Address ResultPtr = CGF.EmitPointerWithAlignment(Addr: ResultArg);
2267 CGF.Builder.CreateStore(Val: CGF.EmitToMemory(Value: Result, Ty: ResultQTy), Addr: ResultPtr,
2268 IsVolatile: isVolatile);
2269 return RValue::get(V: HasOverflow);
2270}
2271
2272/// Determine if a binop is a checked mixed-sign multiply we can specialize.
2273static bool isSpecialMixedSignMultiply(unsigned BuiltinID,
2274 WidthAndSignedness Op1Info,
2275 WidthAndSignedness Op2Info,
2276 WidthAndSignedness ResultInfo) {
2277 return BuiltinID == Builtin::BI__builtin_mul_overflow &&
2278 std::max(a: Op1Info.Width, b: Op2Info.Width) >= ResultInfo.Width &&
2279 Op1Info.Signed != Op2Info.Signed;
2280}
2281
2282/// Emit a checked mixed-sign multiply. This is a cheaper specialization of
2283/// the generic checked-binop irgen.
2284static RValue
2285EmitCheckedMixedSignMultiply(CodeGenFunction &CGF, const clang::Expr *Op1,
2286 WidthAndSignedness Op1Info, const clang::Expr *Op2,
2287 WidthAndSignedness Op2Info,
2288 const clang::Expr *ResultArg, QualType ResultQTy,
2289 WidthAndSignedness ResultInfo) {
2290 assert(isSpecialMixedSignMultiply(Builtin::BI__builtin_mul_overflow, Op1Info,
2291 Op2Info, ResultInfo) &&
2292 "Not a mixed-sign multipliction we can specialize");
2293
2294 // Emit the signed and unsigned operands.
2295 const clang::Expr *SignedOp = Op1Info.Signed ? Op1 : Op2;
2296 const clang::Expr *UnsignedOp = Op1Info.Signed ? Op2 : Op1;
2297 llvm::Value *Signed = CGF.EmitScalarExpr(E: SignedOp);
2298 llvm::Value *Unsigned = CGF.EmitScalarExpr(E: UnsignedOp);
2299 unsigned SignedOpWidth = Op1Info.Signed ? Op1Info.Width : Op2Info.Width;
2300 unsigned UnsignedOpWidth = Op1Info.Signed ? Op2Info.Width : Op1Info.Width;
2301
2302 // One of the operands may be smaller than the other. If so, [s|z]ext it.
2303 if (SignedOpWidth < UnsignedOpWidth)
2304 Signed = CGF.Builder.CreateSExt(V: Signed, DestTy: Unsigned->getType(), Name: "op.sext");
2305 if (UnsignedOpWidth < SignedOpWidth)
2306 Unsigned = CGF.Builder.CreateZExt(V: Unsigned, DestTy: Signed->getType(), Name: "op.zext");
2307
2308 llvm::Type *OpTy = Signed->getType();
2309 llvm::Value *Zero = llvm::Constant::getNullValue(Ty: OpTy);
2310 Address ResultPtr = CGF.EmitPointerWithAlignment(Addr: ResultArg);
2311 llvm::Type *ResTy = CGF.getTypes().ConvertType(T: ResultQTy);
2312 unsigned OpWidth = std::max(a: Op1Info.Width, b: Op2Info.Width);
2313
2314 // Take the absolute value of the signed operand.
2315 llvm::Value *IsNegative = CGF.Builder.CreateICmpSLT(LHS: Signed, RHS: Zero);
2316 llvm::Value *AbsOfNegative = CGF.Builder.CreateSub(LHS: Zero, RHS: Signed);
2317 llvm::Value *AbsSigned =
2318 CGF.Builder.CreateSelect(C: IsNegative, True: AbsOfNegative, False: Signed);
2319
2320 // Perform a checked unsigned multiplication.
2321 llvm::Value *UnsignedOverflow;
2322 llvm::Value *UnsignedResult =
2323 EmitOverflowIntrinsic(CGF, IntrinsicID: Intrinsic::umul_with_overflow, X: AbsSigned,
2324 Y: Unsigned, Carry&: UnsignedOverflow);
2325
2326 llvm::Value *Overflow, *Result;
2327 if (ResultInfo.Signed) {
2328 // Signed overflow occurs if the result is greater than INT_MAX or lesser
2329 // than INT_MIN, i.e when |Result| > (INT_MAX + IsNegative).
2330 auto IntMax =
2331 llvm::APInt::getSignedMaxValue(numBits: ResultInfo.Width).zext(width: OpWidth);
2332 llvm::Value *MaxResult =
2333 CGF.Builder.CreateAdd(LHS: llvm::ConstantInt::get(Ty: OpTy, V: IntMax),
2334 RHS: CGF.Builder.CreateZExt(V: IsNegative, DestTy: OpTy));
2335 llvm::Value *SignedOverflow =
2336 CGF.Builder.CreateICmpUGT(LHS: UnsignedResult, RHS: MaxResult);
2337 Overflow = CGF.Builder.CreateOr(LHS: UnsignedOverflow, RHS: SignedOverflow);
2338
2339 // Prepare the signed result (possibly by negating it).
2340 llvm::Value *NegativeResult = CGF.Builder.CreateNeg(V: UnsignedResult);
2341 llvm::Value *SignedResult =
2342 CGF.Builder.CreateSelect(C: IsNegative, True: NegativeResult, False: UnsignedResult);
2343 Result = CGF.Builder.CreateTrunc(V: SignedResult, DestTy: ResTy);
2344 } else {
2345 // Unsigned overflow occurs if the result is < 0 or greater than UINT_MAX.
2346 llvm::Value *Underflow = CGF.Builder.CreateAnd(
2347 LHS: IsNegative, RHS: CGF.Builder.CreateIsNotNull(Arg: UnsignedResult));
2348 Overflow = CGF.Builder.CreateOr(LHS: UnsignedOverflow, RHS: Underflow);
2349 if (ResultInfo.Width < OpWidth) {
2350 auto IntMax =
2351 llvm::APInt::getMaxValue(numBits: ResultInfo.Width).zext(width: OpWidth);
2352 llvm::Value *TruncOverflow = CGF.Builder.CreateICmpUGT(
2353 LHS: UnsignedResult, RHS: llvm::ConstantInt::get(Ty: OpTy, V: IntMax));
2354 Overflow = CGF.Builder.CreateOr(LHS: Overflow, RHS: TruncOverflow);
2355 }
2356
2357 // Negate the product if it would be negative in infinite precision.
2358 Result = CGF.Builder.CreateSelect(
2359 C: IsNegative, True: CGF.Builder.CreateNeg(V: UnsignedResult), False: UnsignedResult);
2360
2361 Result = CGF.Builder.CreateTrunc(V: Result, DestTy: ResTy);
2362 }
2363 assert(Overflow && Result && "Missing overflow or result");
2364
2365 bool isVolatile =
2366 ResultArg->getType()->getPointeeType().isVolatileQualified();
2367 CGF.Builder.CreateStore(Val: CGF.EmitToMemory(Value: Result, Ty: ResultQTy), Addr: ResultPtr,
2368 IsVolatile: isVolatile);
2369 return RValue::get(V: Overflow);
2370}
2371
2372/// Determine if the specified type requires laundering by checking if it is a
2373/// dynamic class type or contains a subobject which is a dynamic class type.
2374static bool TypeRequiresBuiltinLaunder(CodeGenModule &CGM, QualType Ty) {
2375 if (!CGM.getCodeGenOpts().StrictVTablePointers)
2376 return false;
2377 return Ty.requiresBuiltinLaunder(Context: CGM.getContext());
2378}
2379
2380RValue CodeGenFunction::emitRotate(const CallExpr *E, bool IsRotateRight) {
2381 llvm::Value *Src = EmitScalarExpr(E: E->getArg(Arg: 0));
2382 llvm::Value *ShiftAmt = EmitScalarExpr(E: E->getArg(Arg: 1));
2383
2384 // The builtin's shift arg may have a different type than the source arg and
2385 // result, but the LLVM intrinsic uses the same type for all values.
2386 llvm::Type *Ty = Src->getType();
2387 llvm::Type *ShiftTy = ShiftAmt->getType();
2388
2389 unsigned BitWidth = Ty->getIntegerBitWidth();
2390
2391 // Normalize shift amount to [0, BitWidth) range to match runtime behavior.
2392 // This matches the algorithm in ExprConstant.cpp for constant evaluation.
2393 if (BitWidth == 1) {
2394 // Rotating a 1-bit value is always a no-op
2395 ShiftAmt = ConstantInt::get(Ty: ShiftTy, V: 0);
2396 } else if (BitWidth == 2) {
2397 // For 2-bit values: rotation amount is 0 or 1 based on
2398 // whether the amount is even or odd. We can't use srem here because
2399 // the divisor (2) would be misinterpreted as -2 in 2-bit signed arithmetic.
2400 llvm::Value *One = ConstantInt::get(Ty: ShiftTy, V: 1);
2401 ShiftAmt = Builder.CreateAnd(LHS: ShiftAmt, RHS: One);
2402 } else {
2403 unsigned ShiftAmtBitWidth = ShiftTy->getIntegerBitWidth();
2404 bool ShiftAmtIsSigned = E->getArg(Arg: 1)->getType()->isSignedIntegerType();
2405
2406 // Choose the wider type for the divisor to avoid truncation
2407 llvm::Type *DivisorTy = ShiftAmtBitWidth > BitWidth ? ShiftTy : Ty;
2408 llvm::Value *Divisor = ConstantInt::get(Ty: DivisorTy, V: BitWidth);
2409
2410 // Extend ShiftAmt to match Divisor width if needed
2411 if (ShiftAmtBitWidth < DivisorTy->getIntegerBitWidth()) {
2412 ShiftAmt = Builder.CreateIntCast(V: ShiftAmt, DestTy: DivisorTy, isSigned: ShiftAmtIsSigned);
2413 }
2414
2415 // Normalize to [0, BitWidth)
2416 llvm::Value *RemResult;
2417 if (ShiftAmtIsSigned) {
2418 RemResult = Builder.CreateSRem(LHS: ShiftAmt, RHS: Divisor);
2419 // Signed remainder can be negative, convert to positive equivalent
2420 llvm::Value *Zero = ConstantInt::get(Ty: DivisorTy, V: 0);
2421 llvm::Value *IsNegative = Builder.CreateICmpSLT(LHS: RemResult, RHS: Zero);
2422 llvm::Value *PositiveShift = Builder.CreateAdd(LHS: RemResult, RHS: Divisor);
2423 ShiftAmt = Builder.CreateSelect(C: IsNegative, True: PositiveShift, False: RemResult);
2424 } else {
2425 ShiftAmt = Builder.CreateURem(LHS: ShiftAmt, RHS: Divisor);
2426 }
2427 }
2428
2429 // Convert to the source type if needed
2430 if (ShiftAmt->getType() != Ty) {
2431 ShiftAmt = Builder.CreateIntCast(V: ShiftAmt, DestTy: Ty, isSigned: false);
2432 }
2433
2434 // Rotate is a special case of LLVM funnel shift - 1st 2 args are the same.
2435 unsigned IID = IsRotateRight ? Intrinsic::fshr : Intrinsic::fshl;
2436 Function *F = CGM.getIntrinsic(IID, Tys: Ty);
2437 return RValue::get(V: Builder.CreateCall(Callee: F, Args: {Src, Src, ShiftAmt}));
2438}
2439
2440// Map math builtins for long-double to f128 version.
2441static unsigned mutateLongDoubleBuiltin(unsigned BuiltinID) {
2442 switch (BuiltinID) {
2443#define MUTATE_LDBL(func) \
2444 case Builtin::BI__builtin_##func##l: \
2445 return Builtin::BI__builtin_##func##f128;
2446 MUTATE_LDBL(sqrt)
2447 MUTATE_LDBL(cbrt)
2448 MUTATE_LDBL(fabs)
2449 MUTATE_LDBL(log)
2450 MUTATE_LDBL(log2)
2451 MUTATE_LDBL(log10)
2452 MUTATE_LDBL(log1p)
2453 MUTATE_LDBL(logb)
2454 MUTATE_LDBL(exp)
2455 MUTATE_LDBL(exp2)
2456 MUTATE_LDBL(expm1)
2457 MUTATE_LDBL(fdim)
2458 MUTATE_LDBL(hypot)
2459 MUTATE_LDBL(ilogb)
2460 MUTATE_LDBL(pow)
2461 MUTATE_LDBL(fmin)
2462 MUTATE_LDBL(fmax)
2463 MUTATE_LDBL(ceil)
2464 MUTATE_LDBL(trunc)
2465 MUTATE_LDBL(rint)
2466 MUTATE_LDBL(nearbyint)
2467 MUTATE_LDBL(round)
2468 MUTATE_LDBL(floor)
2469 MUTATE_LDBL(lround)
2470 MUTATE_LDBL(llround)
2471 MUTATE_LDBL(lrint)
2472 MUTATE_LDBL(llrint)
2473 MUTATE_LDBL(fmod)
2474 MUTATE_LDBL(modf)
2475 MUTATE_LDBL(nan)
2476 MUTATE_LDBL(nans)
2477 MUTATE_LDBL(inf)
2478 MUTATE_LDBL(fma)
2479 MUTATE_LDBL(sin)
2480 MUTATE_LDBL(cos)
2481 MUTATE_LDBL(tan)
2482 MUTATE_LDBL(sinh)
2483 MUTATE_LDBL(cosh)
2484 MUTATE_LDBL(tanh)
2485 MUTATE_LDBL(asin)
2486 MUTATE_LDBL(acos)
2487 MUTATE_LDBL(atan)
2488 MUTATE_LDBL(asinh)
2489 MUTATE_LDBL(acosh)
2490 MUTATE_LDBL(atanh)
2491 MUTATE_LDBL(atan2)
2492 MUTATE_LDBL(erf)
2493 MUTATE_LDBL(erfc)
2494 MUTATE_LDBL(ldexp)
2495 MUTATE_LDBL(frexp)
2496 MUTATE_LDBL(huge_val)
2497 MUTATE_LDBL(copysign)
2498 MUTATE_LDBL(nextafter)
2499 MUTATE_LDBL(nexttoward)
2500 MUTATE_LDBL(remainder)
2501 MUTATE_LDBL(remquo)
2502 MUTATE_LDBL(scalbln)
2503 MUTATE_LDBL(scalbn)
2504 MUTATE_LDBL(tgamma)
2505 MUTATE_LDBL(lgamma)
2506#undef MUTATE_LDBL
2507 default:
2508 return BuiltinID;
2509 }
2510}
2511
2512static Value *tryUseTestFPKind(CodeGenFunction &CGF, unsigned BuiltinID,
2513 Value *V) {
2514 if (CGF.Builder.getIsFPConstrained() &&
2515 CGF.Builder.getDefaultConstrainedExcept() != fp::ebIgnore) {
2516 if (Value *Result =
2517 CGF.getTargetHooks().testFPKind(V, BuiltinID, Builder&: CGF.Builder, CGM&: CGF.CGM))
2518 return Result;
2519 }
2520 return nullptr;
2521}
2522
2523static RValue EmitHipStdParUnsupportedBuiltin(CodeGenFunction *CGF,
2524 const FunctionDecl *FD) {
2525 auto Name = FD->getNameAsString() + "__hipstdpar_unsupported";
2526 auto FnTy = CGF->CGM.getTypes().GetFunctionType(GD: FD);
2527 auto UBF = CGF->CGM.getModule().getOrInsertFunction(Name, T: FnTy);
2528
2529 SmallVector<Value *, 16> Args;
2530 for (auto &&FormalTy : FnTy->params())
2531 Args.push_back(Elt: llvm::PoisonValue::get(T: FormalTy));
2532
2533 return RValue::get(V: CGF->Builder.CreateCall(Callee: UBF, Args));
2534}
2535
2536// stdc_{leading,trailing}_{zeros,ones} and stdc_count_ones: counts bits using
2537// ctlz, cttz, or ctpop (IsPop). InvertArg flips the input to count the
2538// opposite bit value.
2539RValue CodeGenFunction::emitStdcCountIntrinsic(const CallExpr *E,
2540 Intrinsic::ID IntID,
2541 bool InvertArg, bool IsPop) {
2542 Value *ArgValue = EmitScalarExpr(E: E->getArg(Arg: 0));
2543 llvm::Type *ArgType = ArgValue->getType();
2544 llvm::Type *ResultType = ConvertType(T: E->getType());
2545 Value *ActualArg = InvertArg ? Builder.CreateNot(V: ArgValue) : ArgValue;
2546 Function *F = CGM.getIntrinsic(IID: IntID, Tys: ArgType);
2547 Value *Result = IsPop
2548 ? Builder.CreateCall(Callee: F, Args: ActualArg)
2549 : Builder.CreateCall(Callee: F, Args: {ActualArg, Builder.getFalse()});
2550 if (Result->getType() != ResultType)
2551 Result = Builder.CreateIntCast(V: Result, DestTy: ResultType, isSigned: false);
2552 return RValue::get(V: Result);
2553}
2554
2555// stdc_count_zeros (BitWidth - ctpop) and stdc_bit_width (BitWidth - ctlz).
2556// IsPop selects ctpop; otherwise ctlz is used.
2557RValue CodeGenFunction::emitStdcBitWidthMinus(const CallExpr *E,
2558 Intrinsic::ID IntID, bool IsPop) {
2559 Value *ArgValue = EmitScalarExpr(E: E->getArg(Arg: 0));
2560 llvm::Type *ArgType = ArgValue->getType();
2561 llvm::Type *ResultType = ConvertType(T: E->getType());
2562 unsigned BitWidth = ArgType->getIntegerBitWidth();
2563 Function *F = CGM.getIntrinsic(IID: IntID, Tys: ArgType);
2564 Value *Cnt = IsPop ? Builder.CreateCall(Callee: F, Args: ArgValue)
2565 : Builder.CreateCall(Callee: F, Args: {ArgValue, Builder.getFalse()});
2566 Value *Result = Builder.CreateSub(LHS: ConstantInt::get(Ty: ArgType, V: BitWidth), RHS: Cnt);
2567 if (Result->getType() != ResultType)
2568 Result = Builder.CreateIntCast(V: Result, DestTy: ResultType, isSigned: false);
2569 return RValue::get(V: Result);
2570}
2571
2572// stdc_first_{leading,trailing}_{zero,one}: returns the 1-based position of
2573// the first matching bit, or 0 if no such bit exists. InvertArg flips the
2574// input to search for zeros instead of ones.
2575RValue CodeGenFunction::emitStdcFirstBit(const CallExpr *E, Intrinsic::ID IntID,
2576 bool InvertArg) {
2577 Value *ArgValue = EmitScalarExpr(E: E->getArg(Arg: 0));
2578 llvm::Type *ArgType = ArgValue->getType();
2579 llvm::Type *ResultType = ConvertType(T: E->getType());
2580 Value *Zero = ConstantInt::get(Ty: ArgType, V: 0);
2581 Value *One = ConstantInt::get(Ty: ArgType, V: 1);
2582 Value *ActualArg = InvertArg ? Builder.CreateNot(V: ArgValue) : ArgValue;
2583 Function *F = CGM.getIntrinsic(IID: IntID, Tys: ArgType);
2584 Value *Cnt = Builder.CreateCall(Callee: F, Args: {ActualArg, Builder.getFalse()});
2585 Value *Tmp = Builder.CreateAdd(LHS: Cnt, RHS: One);
2586 Value *IsZero = Builder.CreateICmpEQ(LHS: ActualArg, RHS: Zero);
2587 Value *Result = Builder.CreateSelect(C: IsZero, True: Zero, False: Tmp);
2588 if (Result->getType() != ResultType)
2589 Result = Builder.CreateIntCast(V: Result, DestTy: ResultType, isSigned: false);
2590 return RValue::get(V: Result);
2591}
2592
2593namespace {
2594
2595// PaddingClearer is a utility class that clears padding bits in a
2596// c/c++ type. It traverses the type recursively, collecting occupied
2597// bit intervals, and then computes the padding intervals.
2598// In the end, it clears the padding bits by writing zeros
2599// to the padding intervals bytes-by-bytes. If a byte only contains
2600// some padding bits, it writes zeros to only those bits. This is
2601// the case for bit-fields.
2602struct PaddingClearer {
2603 PaddingClearer(CodeGenFunction &F)
2604 : CGF(F), CharWidth(CGF.getContext().getCharWidth()) {}
2605
2606 void run(Address Src, QualType Ty) {
2607 OccuppiedIntervals.clear();
2608 Stack.clear();
2609
2610 Stack.push_back(Elt: Data{.StartBitOffset: 0, .Ty: Ty, .VisitVirtualBase: true});
2611 while (!Stack.empty()) {
2612 auto Current = Stack.back();
2613 Stack.pop_back();
2614 Visit(D: Current);
2615 }
2616
2617 MergeOccuppiedIntervals();
2618 auto PaddingIntervals =
2619 GetPaddingIntervals(SizeInBits: CGF.getContext().getTypeSize(T: Ty));
2620 for (const auto &Interval : PaddingIntervals) {
2621 ClearPadding(Src, PaddingInterval: Interval);
2622 }
2623 }
2624
2625private:
2626 struct BitInterval {
2627 // [First, Last)
2628 uint64_t First;
2629 uint64_t Last;
2630 };
2631
2632 struct Data {
2633 uint64_t StartBitOffset;
2634 QualType Ty;
2635 bool VisitVirtualBase;
2636 };
2637
2638 // Return the number of non padding bits of a scalar type.
2639 //
2640 // The property that we specifically care about here is whether the scalar
2641 // type has padding bits, i.e. are there bits in the type which are not
2642 // specified by the ABI.
2643 //
2644 // We currently don't care about this anywhere else in clang: layout cares
2645 // about the ABI size, calling convention code cares about specific types, but
2646 // nothing cares about padding specifically. And it's not something we can
2647 // easily query from LLVM due to the type system mismatches.
2648 // DL.getTypeSizeInBits(convertTypeForLoadStore(T)) is probably close, but the
2649 // DataLayout methods aren't really designed for this usage.
2650 //
2651 // Therefore, it is better to explicitly list all the scalar types containing
2652 // padding bits that we know of, namely, _BitInt(N) and x87 long double.
2653 uint64_t getScalarOccupiedSizeInBits(QualType Ty) const {
2654 if (const auto *BIT = Ty->getAs<BitIntType>())
2655 return BIT->getNumBits();
2656
2657 if (const auto *BT = Ty->getAs<BuiltinType>()) {
2658 if (BT->getKind() == BuiltinType::LongDouble &&
2659 &CGF.getTarget().getLongDoubleFormat() ==
2660 &APFloat::x87DoubleExtended())
2661 return APFloat::getSizeInBits(Sem: CGF.getTarget().getLongDoubleFormat());
2662 }
2663
2664 return CGF.getContext().getTypeSize(T: Ty);
2665 }
2666
2667 void Visit(const Data &D) {
2668 if (auto *AT = dyn_cast<ConstantArrayType>(Val: D.Ty)) {
2669 VisitArray(AT, StartBitOffset: D.StartBitOffset);
2670 return;
2671 }
2672
2673 if (auto *Record = D.Ty->getAsRecordDecl()) {
2674 VisitStruct(R: Record, StartBitOffset: D.StartBitOffset, VisitVirtualBase: D.VisitVirtualBase);
2675 return;
2676 }
2677
2678 if (D.Ty->isAtomicType()) {
2679 auto Unwrapped = D;
2680 Unwrapped.Ty = D.Ty.getAtomicUnqualifiedType();
2681 Stack.push_back(Elt: Unwrapped);
2682 return;
2683 }
2684
2685 if (const auto *Complex = D.Ty->getAs<ComplexType>()) {
2686 VisitComplex(CT: Complex, StartBitOffset: D.StartBitOffset);
2687 return;
2688 }
2689
2690 if (const auto *VT = D.Ty->getAs<clang::VectorType>()) {
2691 VisitVector(VT, StartBitOffset: D.StartBitOffset);
2692 return;
2693 }
2694
2695 uint64_t SizeBit = getScalarOccupiedSizeInBits(Ty: D.Ty);
2696 OccuppiedIntervals.push_back(
2697 Elt: BitInterval{.First: D.StartBitOffset, .Last: D.StartBitOffset + SizeBit});
2698 }
2699
2700 void VisitArray(const ConstantArrayType *AT, uint64_t StartBitOffset) {
2701 for (uint64_t ArrIndex = 0; ArrIndex < AT->getSize().getLimitedValue();
2702 ++ArrIndex) {
2703
2704 QualType ElementQualType = AT->getElementType();
2705 auto ElementSize = CGF.getContext().getTypeSizeInChars(T: ElementQualType);
2706 auto ElementAlign = CGF.getContext().getTypeAlignInChars(T: ElementQualType);
2707 auto Offset = ElementSize.alignTo(Align: ElementAlign);
2708
2709 Stack.push_back(
2710 Elt: Data{.StartBitOffset: StartBitOffset + ArrIndex * Offset.getQuantity() * CharWidth,
2711 .Ty: ElementQualType, /*VisitVirtualBase*/ true});
2712 }
2713 }
2714
2715 void VisitStruct(const RecordDecl *R, uint64_t StartBitOffset,
2716 bool VisitVirtualBase) {
2717 const auto &DL = CGF.CGM.getModule().getDataLayout();
2718 const ASTRecordLayout &ASTLayout = CGF.getContext().getASTRecordLayout(D: R);
2719
2720 auto *CXXRecord = dyn_cast<CXXRecordDecl>(Val: R);
2721
2722 if (CXXRecord) {
2723 if (ASTLayout.hasOwnVFPtr()) {
2724 OccuppiedIntervals.push_back(Elt: BitInterval{
2725 .First: StartBitOffset, .Last: StartBitOffset + DL.getPointerSizeInBits()});
2726 }
2727
2728 const auto VisitBase = [&ASTLayout, StartBitOffset, this](
2729 const CXXBaseSpecifier &Base, auto GetOffset) {
2730 auto *BaseRecord = Base.getType()->getAsCXXRecordDecl();
2731 if (!BaseRecord) {
2732 return;
2733 }
2734 auto BaseOffset =
2735 std::invoke(GetOffset, ASTLayout, BaseRecord).getQuantity();
2736
2737 Stack.push_back(Elt: Data{StartBitOffset + BaseOffset * CharWidth,
2738 Base.getType(), /*VisitVirtualBase*/ false});
2739 };
2740
2741 for (auto Base : CXXRecord->bases()) {
2742 if (!Base.isVirtual()) {
2743 VisitBase(Base, &ASTRecordLayout::getBaseClassOffset);
2744 }
2745 }
2746
2747 if (VisitVirtualBase) {
2748 for (auto VBase : CXXRecord->vbases()) {
2749 VisitBase(VBase, &ASTRecordLayout::getVBaseClassOffset);
2750 }
2751 }
2752 }
2753
2754 for (auto *Field : R->fields()) {
2755 // Treat unnamed bitfields as padding.
2756 if (Field->isUnnamedBitField())
2757 continue;
2758
2759 auto FieldOffset = ASTLayout.getFieldOffset(FieldNo: Field->getFieldIndex());
2760 if (Field->isBitField()) {
2761 OccuppiedIntervals.push_back(Elt: BitInterval{
2762 .First: StartBitOffset + FieldOffset,
2763 .Last: StartBitOffset + FieldOffset + Field->getBitWidthValue()});
2764 } else {
2765 Stack.push_back(Elt: Data{.StartBitOffset: StartBitOffset + FieldOffset, .Ty: Field->getType(),
2766 /*VisitVirtualBase*/ true});
2767 }
2768 }
2769 }
2770
2771 void VisitComplex(const ComplexType *CT, uint64_t StartBitOffset) {
2772 QualType ElementQualType = CT->getElementType();
2773 auto ElementSize = CGF.getContext().getTypeSizeInChars(T: ElementQualType);
2774 auto ElementAlign = CGF.getContext().getTypeAlignInChars(T: ElementQualType);
2775 auto ImgOffset = ElementSize.alignTo(Align: ElementAlign);
2776
2777 Stack.push_back(
2778 Elt: Data{.StartBitOffset: StartBitOffset, .Ty: ElementQualType, /*VisitVirtualBase*/ true});
2779 Stack.push_back(Elt: Data{.StartBitOffset: StartBitOffset + ImgOffset.getQuantity() * CharWidth,
2780 .Ty: ElementQualType, /*VisitVirtualBase*/ true});
2781 }
2782
2783 void VisitVector(const clang::VectorType *VT, uint64_t StartBitOffset) {
2784 ASTContext &Ctx = CGF.getContext();
2785 uint64_t SizeBit = [&]() -> uint64_t {
2786 if (VT->isPackedVectorBoolType(ctx: Ctx))
2787 return VT->getNumElements();
2788 return getScalarOccupiedSizeInBits(Ty: VT->getElementType()) *
2789 VT->getNumElements();
2790 }();
2791 OccuppiedIntervals.push_back(
2792 Elt: BitInterval{.First: StartBitOffset, .Last: StartBitOffset + SizeBit});
2793 }
2794
2795 void MergeOccuppiedIntervals() {
2796 std::sort(first: OccuppiedIntervals.begin(), last: OccuppiedIntervals.end(),
2797 comp: [](const BitInterval &lhs, const BitInterval &rhs) {
2798 return std::tie(args: lhs.First, args: lhs.Last) <
2799 std::tie(args: rhs.First, args: rhs.Last);
2800 });
2801
2802 llvm::SmallVector<BitInterval> Merged;
2803 Merged.reserve(N: OccuppiedIntervals.size());
2804
2805 for (const BitInterval &NextInterval : OccuppiedIntervals) {
2806 if (Merged.empty()) {
2807 Merged.push_back(Elt: NextInterval);
2808 continue;
2809 }
2810 auto &LastInterval = Merged.back();
2811
2812 if (NextInterval.First > LastInterval.Last) {
2813 Merged.push_back(Elt: NextInterval);
2814 } else {
2815 LastInterval.Last = std::max(a: LastInterval.Last, b: NextInterval.Last);
2816 }
2817 }
2818
2819 OccuppiedIntervals = Merged;
2820 }
2821
2822 llvm::SmallVector<BitInterval>
2823 GetPaddingIntervals(uint64_t SizeInBits) const {
2824 llvm::SmallVector<BitInterval> Results;
2825 if (OccuppiedIntervals.size() == 1 &&
2826 OccuppiedIntervals.front().First == 0 &&
2827 OccuppiedIntervals.front().Last == SizeInBits) {
2828 return Results;
2829 }
2830 Results.reserve(N: OccuppiedIntervals.size() + 1);
2831 uint64_t CurrentPos = 0;
2832 for (const BitInterval &OccupiedInterval : OccuppiedIntervals) {
2833 if (OccupiedInterval.First > CurrentPos) {
2834 Results.push_back(Elt: BitInterval{.First: CurrentPos, .Last: OccupiedInterval.First});
2835 }
2836 CurrentPos = OccupiedInterval.Last;
2837 }
2838 if (SizeInBits > CurrentPos) {
2839 Results.push_back(Elt: BitInterval{.First: CurrentPos, .Last: SizeInBits});
2840 }
2841 return Results;
2842 }
2843
2844 void ClearPadding(Address Src, const BitInterval &PaddingInterval) {
2845 auto *I8Ptr =
2846 CGF.Builder.CreateBitCast(V: Src.getBasePointer(), DestTy: CGF.Int8PtrTy);
2847 auto *Zero = ConstantInt::get(Ty: CGF.Int8Ty, V: 0);
2848
2849 // Calculate byte indices and bit positions
2850 auto StartByte = PaddingInterval.First / CharWidth;
2851 auto StartBit = PaddingInterval.First % CharWidth;
2852 auto EndByte = PaddingInterval.Last / CharWidth;
2853 auto EndBit = PaddingInterval.Last % CharWidth;
2854
2855 if (StartByte == EndByte) {
2856 // Interval is within a single byte
2857 auto *Index = ConstantInt::get(Ty: CGF.IntTy, V: StartByte);
2858 auto *Element = CGF.Builder.CreateGEP(Ty: CGF.Int8Ty, Ptr: I8Ptr, IdxList: Index);
2859 Address ElementAddr(Element, CGF.Int8Ty,
2860 Src.getAlignment().alignmentAtOffset(
2861 offset: CharUnits::fromQuantity(Quantity: StartByte)));
2862
2863 auto *Value = CGF.Builder.CreateLoad(Addr: ElementAddr);
2864
2865 // Create mask to clear bits within the byte
2866 // We want to clear bits from StartBit to EndBit-1
2867 uint8_t bitsToClear = ((1 << EndBit) - 1) & ~((1 << StartBit) - 1);
2868 uint8_t bitsToKeep = ~bitsToClear;
2869 auto *MaskValue = ConstantInt::get(Ty: CGF.Int8Ty, V: bitsToKeep);
2870 auto *NewValue = CGF.Builder.CreateAnd(LHS: Value, RHS: MaskValue);
2871
2872 CGF.Builder.CreateStore(Val: NewValue, Addr: ElementAddr);
2873 } else {
2874 // Handle the start byte
2875 if (StartBit != 0) {
2876 auto *Index = ConstantInt::get(Ty: CGF.IntTy, V: StartByte);
2877 auto *Element = CGF.Builder.CreateGEP(Ty: CGF.Int8Ty, Ptr: I8Ptr, IdxList: Index);
2878 Address ElementAddr(Element, CGF.Int8Ty,
2879 Src.getAlignment().alignmentAtOffset(
2880 offset: CharUnits::fromQuantity(Quantity: StartByte)));
2881
2882 auto *Value = CGF.Builder.CreateLoad(Addr: ElementAddr);
2883
2884 uint8_t bitsToClear = ((1 << (CharWidth - StartBit)) - 1) << StartBit;
2885 uint8_t bitsToKeep = ~bitsToClear;
2886 auto *MaskValue = ConstantInt::get(Ty: CGF.Int8Ty, V: bitsToKeep);
2887 auto *NewValue = CGF.Builder.CreateAnd(LHS: Value, RHS: MaskValue);
2888
2889 CGF.Builder.CreateStore(Val: NewValue, Addr: ElementAddr);
2890 ++StartByte;
2891 }
2892
2893 // Handle full bytes in the middle
2894 for (auto Offset = StartByte; Offset < EndByte; ++Offset) {
2895 auto *Index = ConstantInt::get(Ty: CGF.IntTy, V: Offset);
2896 auto *Element = CGF.Builder.CreateGEP(Ty: CGF.Int8Ty, Ptr: I8Ptr, IdxList: Index);
2897 Address ElementAddr(Element, CGF.Int8Ty,
2898 Src.getAlignment().alignmentAtOffset(
2899 offset: CharUnits::fromQuantity(Quantity: Offset)));
2900
2901 CGF.Builder.CreateStore(Val: Zero, Addr: ElementAddr);
2902 }
2903
2904 // Handle the end byte
2905 if (EndBit != 0) {
2906 auto *Index = ConstantInt::get(Ty: CGF.IntTy, V: EndByte);
2907 auto *Element = CGF.Builder.CreateGEP(Ty: CGF.Int8Ty, Ptr: I8Ptr, IdxList: Index);
2908 Address ElementAddr(Element, CGF.Int8Ty,
2909 Src.getAlignment().alignmentAtOffset(
2910 offset: CharUnits::fromQuantity(Quantity: EndByte)));
2911
2912 auto *Value = CGF.Builder.CreateLoad(Addr: ElementAddr);
2913
2914 uint8_t bitsToClear = (1 << EndBit) - 1;
2915 uint8_t bitsToKeep = ~bitsToClear;
2916 auto *MaskValue = ConstantInt::get(Ty: CGF.Int8Ty, V: bitsToKeep);
2917 auto *NewValue = CGF.Builder.CreateAnd(LHS: Value, RHS: MaskValue);
2918
2919 CGF.Builder.CreateStore(Val: NewValue, Addr: ElementAddr);
2920 }
2921 }
2922 }
2923
2924 CodeGenFunction &CGF;
2925 const uint64_t CharWidth;
2926 llvm::SmallVector<Data> Stack;
2927 llvm::SmallVector<BitInterval> OccuppiedIntervals;
2928};
2929
2930} // namespace
2931
2932RValue CodeGenFunction::EmitBuiltinExpr(const GlobalDecl GD, unsigned BuiltinID,
2933 const CallExpr *E,
2934 ReturnValueSlot ReturnValue) {
2935 assert(!getContext().BuiltinInfo.isImmediate(BuiltinID) &&
2936 "Should not codegen for consteval builtins");
2937
2938 const FunctionDecl *FD = GD.getDecl()->getAsFunction();
2939 // See if we can constant fold this builtin. If so, don't emit it at all.
2940 // TODO: Extend this handling to all builtin calls that we can constant-fold.
2941 Expr::EvalResult Result;
2942 if (E->isPRValue() && E->EvaluateAsRValue(Result, Ctx: CGM.getContext()) &&
2943 !Result.hasSideEffects()) {
2944 if (Result.Val.isInt())
2945 return RValue::get(V: llvm::ConstantInt::get(Context&: getLLVMContext(),
2946 V: Result.Val.getInt()));
2947 if (Result.Val.isFloat())
2948 return RValue::get(V: llvm::ConstantFP::get(Context&: getLLVMContext(),
2949 V: Result.Val.getFloat()));
2950 }
2951
2952 // If current long-double semantics is IEEE 128-bit, replace math builtins
2953 // of long-double with f128 equivalent.
2954 // TODO: This mutation should also be applied to other targets other than PPC,
2955 // after backend supports IEEE 128-bit style libcalls.
2956 if (getTarget().getTriple().isPPC64() &&
2957 &getTarget().getLongDoubleFormat() == &llvm::APFloat::IEEEquad())
2958 BuiltinID = mutateLongDoubleBuiltin(BuiltinID);
2959
2960 // If the builtin has been declared explicitly with an assembler label,
2961 // disable the specialized emitting below. Ideally we should communicate the
2962 // rename in IR, or at least avoid generating the intrinsic calls that are
2963 // likely to get lowered to the renamed library functions.
2964 const unsigned BuiltinIDIfNoAsmLabel =
2965 FD->hasAttr<AsmLabelAttr>() ? 0 : BuiltinID;
2966
2967 std::optional<bool> ErrnoOverriden;
2968 // ErrnoOverriden is true if math-errno is overriden via the
2969 // '#pragma float_control(precise, on)'. This pragma disables fast-math,
2970 // which implies math-errno.
2971 if (E->hasStoredFPFeatures()) {
2972 FPOptionsOverride OP = E->getFPFeatures();
2973 if (OP.hasMathErrnoOverride())
2974 ErrnoOverriden = OP.getMathErrnoOverride();
2975 }
2976 // True if 'attribute__((optnone))' is used. This attribute overrides
2977 // fast-math which implies math-errno.
2978 bool OptNone = CurFuncDecl && CurFuncDecl->hasAttr<OptimizeNoneAttr>();
2979
2980 bool IsOptimizationEnabled = CGM.getCodeGenOpts().OptimizationLevel != 0;
2981
2982 bool GenerateFPMathIntrinsics =
2983 getContext().BuiltinInfo.shouldGenerateFPMathIntrinsic(
2984 BuiltinID, Trip: CGM.getTriple(), ErrnoOverwritten: ErrnoOverriden, MathErrnoEnabled: getLangOpts().MathErrno,
2985 HasOptNoneAttr: OptNone, IsOptimizationEnabled);
2986
2987 if (GenerateFPMathIntrinsics) {
2988 switch (BuiltinIDIfNoAsmLabel) {
2989 case Builtin::BIacos:
2990 case Builtin::BIacosf:
2991 case Builtin::BIacosl:
2992 case Builtin::BI__builtin_acos:
2993 case Builtin::BI__builtin_acosf:
2994 case Builtin::BI__builtin_acosf16:
2995 case Builtin::BI__builtin_acosl:
2996 case Builtin::BI__builtin_acosf128:
2997 case Builtin::BI__builtin_elementwise_acos:
2998 return RValue::get(V: emitUnaryMaybeConstrainedFPBuiltin(
2999 CGF&: *this, E, IntrinsicID: Intrinsic::acos, ConstrainedIntrinsicID: Intrinsic::experimental_constrained_acos));
3000
3001 case Builtin::BIasin:
3002 case Builtin::BIasinf:
3003 case Builtin::BIasinl:
3004 case Builtin::BI__builtin_asin:
3005 case Builtin::BI__builtin_asinf:
3006 case Builtin::BI__builtin_asinf16:
3007 case Builtin::BI__builtin_asinl:
3008 case Builtin::BI__builtin_asinf128:
3009 case Builtin::BI__builtin_elementwise_asin:
3010 return RValue::get(V: emitUnaryMaybeConstrainedFPBuiltin(
3011 CGF&: *this, E, IntrinsicID: Intrinsic::asin, ConstrainedIntrinsicID: Intrinsic::experimental_constrained_asin));
3012
3013 case Builtin::BIatan:
3014 case Builtin::BIatanf:
3015 case Builtin::BIatanl:
3016 case Builtin::BI__builtin_atan:
3017 case Builtin::BI__builtin_atanf:
3018 case Builtin::BI__builtin_atanf16:
3019 case Builtin::BI__builtin_atanl:
3020 case Builtin::BI__builtin_atanf128:
3021 case Builtin::BI__builtin_elementwise_atan:
3022 return RValue::get(V: emitUnaryMaybeConstrainedFPBuiltin(
3023 CGF&: *this, E, IntrinsicID: Intrinsic::atan, ConstrainedIntrinsicID: Intrinsic::experimental_constrained_atan));
3024
3025 case Builtin::BIatan2:
3026 case Builtin::BIatan2f:
3027 case Builtin::BIatan2l:
3028 case Builtin::BI__builtin_atan2:
3029 case Builtin::BI__builtin_atan2f:
3030 case Builtin::BI__builtin_atan2f16:
3031 case Builtin::BI__builtin_atan2l:
3032 case Builtin::BI__builtin_atan2f128:
3033 case Builtin::BI__builtin_elementwise_atan2:
3034 return RValue::get(V: emitBinaryMaybeConstrainedFPBuiltin(
3035 CGF&: *this, E, IntrinsicID: Intrinsic::atan2,
3036 ConstrainedIntrinsicID: Intrinsic::experimental_constrained_atan2));
3037
3038 case Builtin::BIceil:
3039 case Builtin::BIceilf:
3040 case Builtin::BIceill:
3041 case Builtin::BI__builtin_ceil:
3042 case Builtin::BI__builtin_ceilf:
3043 case Builtin::BI__builtin_ceilf16:
3044 case Builtin::BI__builtin_ceill:
3045 case Builtin::BI__builtin_ceilf128:
3046 case Builtin::BI__builtin_elementwise_ceil:
3047 return RValue::get(V: emitUnaryMaybeConstrainedFPBuiltin(CGF&: *this, E,
3048 IntrinsicID: Intrinsic::ceil,
3049 ConstrainedIntrinsicID: Intrinsic::experimental_constrained_ceil));
3050
3051 case Builtin::BIcopysign:
3052 case Builtin::BIcopysignf:
3053 case Builtin::BIcopysignl:
3054 case Builtin::BI__builtin_copysign:
3055 case Builtin::BI__builtin_copysignf:
3056 case Builtin::BI__builtin_copysignf16:
3057 case Builtin::BI__builtin_copysignl:
3058 case Builtin::BI__builtin_copysignf128:
3059 return RValue::get(
3060 V: emitBuiltinWithOneOverloadedType<2>(CGF&: *this, E, IntrinsicID: Intrinsic::copysign));
3061
3062 case Builtin::BIcos:
3063 case Builtin::BIcosf:
3064 case Builtin::BIcosl:
3065 case Builtin::BI__builtin_cos:
3066 case Builtin::BI__builtin_cosf:
3067 case Builtin::BI__builtin_cosf16:
3068 case Builtin::BI__builtin_cosl:
3069 case Builtin::BI__builtin_cosf128:
3070 case Builtin::BI__builtin_elementwise_cos:
3071 return RValue::get(V: emitUnaryMaybeConstrainedFPBuiltin(CGF&: *this, E,
3072 IntrinsicID: Intrinsic::cos,
3073 ConstrainedIntrinsicID: Intrinsic::experimental_constrained_cos));
3074
3075 case Builtin::BIcosh:
3076 case Builtin::BIcoshf:
3077 case Builtin::BIcoshl:
3078 case Builtin::BI__builtin_cosh:
3079 case Builtin::BI__builtin_coshf:
3080 case Builtin::BI__builtin_coshf16:
3081 case Builtin::BI__builtin_coshl:
3082 case Builtin::BI__builtin_coshf128:
3083 case Builtin::BI__builtin_elementwise_cosh:
3084 return RValue::get(V: emitUnaryMaybeConstrainedFPBuiltin(
3085 CGF&: *this, E, IntrinsicID: Intrinsic::cosh, ConstrainedIntrinsicID: Intrinsic::experimental_constrained_cosh));
3086
3087 case Builtin::BIexp:
3088 case Builtin::BIexpf:
3089 case Builtin::BIexpl:
3090 case Builtin::BI__builtin_exp:
3091 case Builtin::BI__builtin_expf:
3092 case Builtin::BI__builtin_expf16:
3093 case Builtin::BI__builtin_expl:
3094 case Builtin::BI__builtin_expf128:
3095 case Builtin::BI__builtin_elementwise_exp:
3096 return RValue::get(V: emitUnaryMaybeConstrainedFPBuiltin(CGF&: *this, E,
3097 IntrinsicID: Intrinsic::exp,
3098 ConstrainedIntrinsicID: Intrinsic::experimental_constrained_exp));
3099
3100 case Builtin::BIexp2:
3101 case Builtin::BIexp2f:
3102 case Builtin::BIexp2l:
3103 case Builtin::BI__builtin_exp2:
3104 case Builtin::BI__builtin_exp2f:
3105 case Builtin::BI__builtin_exp2f16:
3106 case Builtin::BI__builtin_exp2l:
3107 case Builtin::BI__builtin_exp2f128:
3108 case Builtin::BI__builtin_elementwise_exp2:
3109 return RValue::get(V: emitUnaryMaybeConstrainedFPBuiltin(CGF&: *this, E,
3110 IntrinsicID: Intrinsic::exp2,
3111 ConstrainedIntrinsicID: Intrinsic::experimental_constrained_exp2));
3112 case Builtin::BI__builtin_exp10:
3113 case Builtin::BI__builtin_exp10f:
3114 case Builtin::BI__builtin_exp10f16:
3115 case Builtin::BI__builtin_exp10l:
3116 case Builtin::BI__builtin_exp10f128:
3117 case Builtin::BI__builtin_elementwise_exp10: {
3118 // TODO: strictfp support
3119 if (Builder.getIsFPConstrained())
3120 break;
3121 return RValue::get(
3122 V: emitBuiltinWithOneOverloadedType<1>(CGF&: *this, E, IntrinsicID: Intrinsic::exp10));
3123 }
3124 case Builtin::BIfabs:
3125 case Builtin::BIfabsf:
3126 case Builtin::BIfabsl:
3127 case Builtin::BI__builtin_fabs:
3128 case Builtin::BI__builtin_fabsf:
3129 case Builtin::BI__builtin_fabsf16:
3130 case Builtin::BI__builtin_fabsl:
3131 case Builtin::BI__builtin_fabsf128:
3132 return RValue::get(
3133 V: emitBuiltinWithOneOverloadedType<1>(CGF&: *this, E, IntrinsicID: Intrinsic::fabs));
3134
3135 case Builtin::BIfloor:
3136 case Builtin::BIfloorf:
3137 case Builtin::BIfloorl:
3138 case Builtin::BI__builtin_floor:
3139 case Builtin::BI__builtin_floorf:
3140 case Builtin::BI__builtin_floorf16:
3141 case Builtin::BI__builtin_floorl:
3142 case Builtin::BI__builtin_floorf128:
3143 case Builtin::BI__builtin_elementwise_floor:
3144 return RValue::get(V: emitUnaryMaybeConstrainedFPBuiltin(CGF&: *this, E,
3145 IntrinsicID: Intrinsic::floor,
3146 ConstrainedIntrinsicID: Intrinsic::experimental_constrained_floor));
3147
3148 case Builtin::BIfma:
3149 case Builtin::BIfmaf:
3150 case Builtin::BIfmal:
3151 case Builtin::BI__builtin_fma:
3152 case Builtin::BI__builtin_fmaf:
3153 case Builtin::BI__builtin_fmaf16:
3154 case Builtin::BI__builtin_fmal:
3155 case Builtin::BI__builtin_fmaf128:
3156 case Builtin::BI__builtin_elementwise_fma:
3157 return RValue::get(V: emitTernaryMaybeConstrainedFPBuiltin(CGF&: *this, E,
3158 IntrinsicID: Intrinsic::fma,
3159 ConstrainedIntrinsicID: Intrinsic::experimental_constrained_fma));
3160
3161 case Builtin::BIfmax:
3162 case Builtin::BIfmaxf:
3163 case Builtin::BIfmaxl:
3164 case Builtin::BI__builtin_fmax:
3165 case Builtin::BI__builtin_fmaxf:
3166 case Builtin::BI__builtin_fmaxf16:
3167 case Builtin::BI__builtin_fmaxl:
3168 case Builtin::BI__builtin_fmaxf128: {
3169 IRBuilder<>::FastMathFlagGuard FMFGuard(Builder);
3170 Builder.getFastMathFlags().setNoSignedZeros();
3171 return RValue::get(V: emitBinaryMaybeConstrainedFPBuiltin(
3172 CGF&: *this, E, IntrinsicID: Intrinsic::maxnum,
3173 ConstrainedIntrinsicID: Intrinsic::experimental_constrained_maxnum));
3174 }
3175
3176 case Builtin::BIfmin:
3177 case Builtin::BIfminf:
3178 case Builtin::BIfminl:
3179 case Builtin::BI__builtin_fmin:
3180 case Builtin::BI__builtin_fminf:
3181 case Builtin::BI__builtin_fminf16:
3182 case Builtin::BI__builtin_fminl:
3183 case Builtin::BI__builtin_fminf128: {
3184 IRBuilder<>::FastMathFlagGuard FMFGuard(Builder);
3185 Builder.getFastMathFlags().setNoSignedZeros();
3186 return RValue::get(V: emitBinaryMaybeConstrainedFPBuiltin(
3187 CGF&: *this, E, IntrinsicID: Intrinsic::minnum,
3188 ConstrainedIntrinsicID: Intrinsic::experimental_constrained_minnum));
3189 }
3190
3191 case Builtin::BIfmaximum_num:
3192 case Builtin::BIfmaximum_numf:
3193 case Builtin::BIfmaximum_numl:
3194 case Builtin::BI__builtin_fmaximum_num:
3195 case Builtin::BI__builtin_fmaximum_numf:
3196 case Builtin::BI__builtin_fmaximum_numf16:
3197 case Builtin::BI__builtin_fmaximum_numl:
3198 case Builtin::BI__builtin_fmaximum_numf128:
3199 return RValue::get(
3200 V: emitBuiltinWithOneOverloadedType<2>(CGF&: *this, E, IntrinsicID: Intrinsic::maximumnum));
3201
3202 case Builtin::BIfminimum_num:
3203 case Builtin::BIfminimum_numf:
3204 case Builtin::BIfminimum_numl:
3205 case Builtin::BI__builtin_fminimum_num:
3206 case Builtin::BI__builtin_fminimum_numf:
3207 case Builtin::BI__builtin_fminimum_numf16:
3208 case Builtin::BI__builtin_fminimum_numl:
3209 case Builtin::BI__builtin_fminimum_numf128:
3210 return RValue::get(
3211 V: emitBuiltinWithOneOverloadedType<2>(CGF&: *this, E, IntrinsicID: Intrinsic::minimumnum));
3212
3213 // fmod() is a special-case. It maps to the frem instruction rather than an
3214 // LLVM intrinsic.
3215 case Builtin::BIfmod:
3216 case Builtin::BIfmodf:
3217 case Builtin::BIfmodl:
3218 case Builtin::BI__builtin_fmod:
3219 case Builtin::BI__builtin_fmodf:
3220 case Builtin::BI__builtin_fmodf16:
3221 case Builtin::BI__builtin_fmodl:
3222 case Builtin::BI__builtin_fmodf128:
3223 case Builtin::BI__builtin_elementwise_fmod: {
3224 CodeGenFunction::CGFPOptionsRAII FPOptsRAII(*this, E);
3225 Value *Arg1 = EmitScalarExpr(E: E->getArg(Arg: 0));
3226 Value *Arg2 = EmitScalarExpr(E: E->getArg(Arg: 1));
3227 if (Builder.getIsFPConstrained()) {
3228 Function *F = CGM.getIntrinsic(IID: Intrinsic::experimental_constrained_frem,
3229 Tys: Arg1->getType());
3230 return RValue::get(V: Builder.CreateConstrainedFPCall(Callee: F, Args: {Arg1, Arg2}));
3231 } else {
3232 return RValue::get(V: Builder.CreateFRem(L: Arg1, R: Arg2, Name: "fmod"));
3233 }
3234 }
3235
3236 case Builtin::BIlog:
3237 case Builtin::BIlogf:
3238 case Builtin::BIlogl:
3239 case Builtin::BI__builtin_log:
3240 case Builtin::BI__builtin_logf:
3241 case Builtin::BI__builtin_logf16:
3242 case Builtin::BI__builtin_logl:
3243 case Builtin::BI__builtin_logf128:
3244 case Builtin::BI__builtin_elementwise_log:
3245 return RValue::get(V: emitUnaryMaybeConstrainedFPBuiltin(CGF&: *this, E,
3246 IntrinsicID: Intrinsic::log,
3247 ConstrainedIntrinsicID: Intrinsic::experimental_constrained_log));
3248
3249 case Builtin::BIlog10:
3250 case Builtin::BIlog10f:
3251 case Builtin::BIlog10l:
3252 case Builtin::BI__builtin_log10:
3253 case Builtin::BI__builtin_log10f:
3254 case Builtin::BI__builtin_log10f16:
3255 case Builtin::BI__builtin_log10l:
3256 case Builtin::BI__builtin_log10f128:
3257 case Builtin::BI__builtin_elementwise_log10:
3258 return RValue::get(V: emitUnaryMaybeConstrainedFPBuiltin(CGF&: *this, E,
3259 IntrinsicID: Intrinsic::log10,
3260 ConstrainedIntrinsicID: Intrinsic::experimental_constrained_log10));
3261
3262 case Builtin::BIlog2:
3263 case Builtin::BIlog2f:
3264 case Builtin::BIlog2l:
3265 case Builtin::BI__builtin_log2:
3266 case Builtin::BI__builtin_log2f:
3267 case Builtin::BI__builtin_log2f16:
3268 case Builtin::BI__builtin_log2l:
3269 case Builtin::BI__builtin_log2f128:
3270 case Builtin::BI__builtin_elementwise_log2:
3271 return RValue::get(V: emitUnaryMaybeConstrainedFPBuiltin(CGF&: *this, E,
3272 IntrinsicID: Intrinsic::log2,
3273 ConstrainedIntrinsicID: Intrinsic::experimental_constrained_log2));
3274
3275 case Builtin::BInearbyint:
3276 case Builtin::BInearbyintf:
3277 case Builtin::BInearbyintl:
3278 case Builtin::BI__builtin_nearbyint:
3279 case Builtin::BI__builtin_nearbyintf:
3280 case Builtin::BI__builtin_nearbyintl:
3281 case Builtin::BI__builtin_nearbyintf128:
3282 case Builtin::BI__builtin_elementwise_nearbyint:
3283 return RValue::get(V: emitUnaryMaybeConstrainedFPBuiltin(CGF&: *this, E,
3284 IntrinsicID: Intrinsic::nearbyint,
3285 ConstrainedIntrinsicID: Intrinsic::experimental_constrained_nearbyint));
3286
3287 case Builtin::BIpow:
3288 case Builtin::BIpowf:
3289 case Builtin::BIpowl:
3290 case Builtin::BI__builtin_pow:
3291 case Builtin::BI__builtin_powf:
3292 case Builtin::BI__builtin_powf16:
3293 case Builtin::BI__builtin_powl:
3294 case Builtin::BI__builtin_powf128:
3295 case Builtin::BI__builtin_elementwise_pow:
3296 return RValue::get(V: emitBinaryMaybeConstrainedFPBuiltin(CGF&: *this, E,
3297 IntrinsicID: Intrinsic::pow,
3298 ConstrainedIntrinsicID: Intrinsic::experimental_constrained_pow));
3299
3300 case Builtin::BIrint:
3301 case Builtin::BIrintf:
3302 case Builtin::BIrintl:
3303 case Builtin::BI__builtin_rint:
3304 case Builtin::BI__builtin_rintf:
3305 case Builtin::BI__builtin_rintf16:
3306 case Builtin::BI__builtin_rintl:
3307 case Builtin::BI__builtin_rintf128:
3308 case Builtin::BI__builtin_elementwise_rint:
3309 return RValue::get(V: emitUnaryMaybeConstrainedFPBuiltin(CGF&: *this, E,
3310 IntrinsicID: Intrinsic::rint,
3311 ConstrainedIntrinsicID: Intrinsic::experimental_constrained_rint));
3312
3313 case Builtin::BIround:
3314 case Builtin::BIroundf:
3315 case Builtin::BIroundl:
3316 case Builtin::BI__builtin_round:
3317 case Builtin::BI__builtin_roundf:
3318 case Builtin::BI__builtin_roundf16:
3319 case Builtin::BI__builtin_roundl:
3320 case Builtin::BI__builtin_roundf128:
3321 case Builtin::BI__builtin_elementwise_round:
3322 return RValue::get(V: emitUnaryMaybeConstrainedFPBuiltin(CGF&: *this, E,
3323 IntrinsicID: Intrinsic::round,
3324 ConstrainedIntrinsicID: Intrinsic::experimental_constrained_round));
3325
3326 case Builtin::BIroundeven:
3327 case Builtin::BIroundevenf:
3328 case Builtin::BIroundevenl:
3329 case Builtin::BI__builtin_roundeven:
3330 case Builtin::BI__builtin_roundevenf:
3331 case Builtin::BI__builtin_roundevenf16:
3332 case Builtin::BI__builtin_roundevenl:
3333 case Builtin::BI__builtin_roundevenf128:
3334 case Builtin::BI__builtin_elementwise_roundeven:
3335 return RValue::get(V: emitUnaryMaybeConstrainedFPBuiltin(CGF&: *this, E,
3336 IntrinsicID: Intrinsic::roundeven,
3337 ConstrainedIntrinsicID: Intrinsic::experimental_constrained_roundeven));
3338
3339 case Builtin::BIsin:
3340 case Builtin::BIsinf:
3341 case Builtin::BIsinl:
3342 case Builtin::BI__builtin_sin:
3343 case Builtin::BI__builtin_sinf:
3344 case Builtin::BI__builtin_sinf16:
3345 case Builtin::BI__builtin_sinl:
3346 case Builtin::BI__builtin_sinf128:
3347 case Builtin::BI__builtin_elementwise_sin:
3348 return RValue::get(V: emitUnaryMaybeConstrainedFPBuiltin(CGF&: *this, E,
3349 IntrinsicID: Intrinsic::sin,
3350 ConstrainedIntrinsicID: Intrinsic::experimental_constrained_sin));
3351
3352 case Builtin::BIsinh:
3353 case Builtin::BIsinhf:
3354 case Builtin::BIsinhl:
3355 case Builtin::BI__builtin_sinh:
3356 case Builtin::BI__builtin_sinhf:
3357 case Builtin::BI__builtin_sinhf16:
3358 case Builtin::BI__builtin_sinhl:
3359 case Builtin::BI__builtin_sinhf128:
3360 case Builtin::BI__builtin_elementwise_sinh:
3361 return RValue::get(V: emitUnaryMaybeConstrainedFPBuiltin(
3362 CGF&: *this, E, IntrinsicID: Intrinsic::sinh, ConstrainedIntrinsicID: Intrinsic::experimental_constrained_sinh));
3363
3364 case Builtin::BI__builtin_sincospi:
3365 case Builtin::BI__builtin_sincospif:
3366 case Builtin::BI__builtin_sincospil:
3367 if (Builder.getIsFPConstrained())
3368 break; // TODO: Emit constrained sincospi intrinsic once one exists.
3369 emitSincosBuiltin(CGF&: *this, E, IntrinsicID: Intrinsic::sincospi);
3370 return RValue::get(V: nullptr);
3371
3372 case Builtin::BIsincos:
3373 case Builtin::BIsincosf:
3374 case Builtin::BIsincosl:
3375 case Builtin::BI__builtin_sincos:
3376 case Builtin::BI__builtin_sincosf:
3377 case Builtin::BI__builtin_sincosf16:
3378 case Builtin::BI__builtin_sincosl:
3379 case Builtin::BI__builtin_sincosf128:
3380 if (Builder.getIsFPConstrained())
3381 break; // TODO: Emit constrained sincos intrinsic once one exists.
3382 emitSincosBuiltin(CGF&: *this, E, IntrinsicID: Intrinsic::sincos);
3383 return RValue::get(V: nullptr);
3384
3385 case Builtin::BIsqrt:
3386 case Builtin::BIsqrtf:
3387 case Builtin::BIsqrtl:
3388 case Builtin::BI__builtin_sqrt:
3389 case Builtin::BI__builtin_sqrtf:
3390 case Builtin::BI__builtin_sqrtf16:
3391 case Builtin::BI__builtin_sqrtl:
3392 case Builtin::BI__builtin_sqrtf128:
3393 case Builtin::BI__builtin_elementwise_sqrt: {
3394 llvm::Value *Call = emitUnaryMaybeConstrainedFPBuiltin(
3395 CGF&: *this, E, IntrinsicID: Intrinsic::sqrt, ConstrainedIntrinsicID: Intrinsic::experimental_constrained_sqrt);
3396 SetSqrtFPAccuracy(Call);
3397 return RValue::get(V: Call);
3398 }
3399
3400 case Builtin::BItan:
3401 case Builtin::BItanf:
3402 case Builtin::BItanl:
3403 case Builtin::BI__builtin_tan:
3404 case Builtin::BI__builtin_tanf:
3405 case Builtin::BI__builtin_tanf16:
3406 case Builtin::BI__builtin_tanl:
3407 case Builtin::BI__builtin_tanf128:
3408 case Builtin::BI__builtin_elementwise_tan:
3409 return RValue::get(V: emitUnaryMaybeConstrainedFPBuiltin(
3410 CGF&: *this, E, IntrinsicID: Intrinsic::tan, ConstrainedIntrinsicID: Intrinsic::experimental_constrained_tan));
3411
3412 case Builtin::BItanh:
3413 case Builtin::BItanhf:
3414 case Builtin::BItanhl:
3415 case Builtin::BI__builtin_tanh:
3416 case Builtin::BI__builtin_tanhf:
3417 case Builtin::BI__builtin_tanhf16:
3418 case Builtin::BI__builtin_tanhl:
3419 case Builtin::BI__builtin_tanhf128:
3420 case Builtin::BI__builtin_elementwise_tanh:
3421 return RValue::get(V: emitUnaryMaybeConstrainedFPBuiltin(
3422 CGF&: *this, E, IntrinsicID: Intrinsic::tanh, ConstrainedIntrinsicID: Intrinsic::experimental_constrained_tanh));
3423
3424 case Builtin::BItrunc:
3425 case Builtin::BItruncf:
3426 case Builtin::BItruncl:
3427 case Builtin::BI__builtin_trunc:
3428 case Builtin::BI__builtin_truncf:
3429 case Builtin::BI__builtin_truncf16:
3430 case Builtin::BI__builtin_truncl:
3431 case Builtin::BI__builtin_truncf128:
3432 case Builtin::BI__builtin_elementwise_trunc:
3433 return RValue::get(V: emitUnaryMaybeConstrainedFPBuiltin(CGF&: *this, E,
3434 IntrinsicID: Intrinsic::trunc,
3435 ConstrainedIntrinsicID: Intrinsic::experimental_constrained_trunc));
3436
3437 case Builtin::BIlround:
3438 case Builtin::BIlroundf:
3439 case Builtin::BIlroundl:
3440 case Builtin::BI__builtin_lround:
3441 case Builtin::BI__builtin_lroundf:
3442 case Builtin::BI__builtin_lroundl:
3443 case Builtin::BI__builtin_lroundf128:
3444 return RValue::get(V: emitMaybeConstrainedFPToIntRoundBuiltin(
3445 CGF&: *this, E, IntrinsicID: Intrinsic::lround,
3446 ConstrainedIntrinsicID: Intrinsic::experimental_constrained_lround));
3447
3448 case Builtin::BIllround:
3449 case Builtin::BIllroundf:
3450 case Builtin::BIllroundl:
3451 case Builtin::BI__builtin_llround:
3452 case Builtin::BI__builtin_llroundf:
3453 case Builtin::BI__builtin_llroundl:
3454 case Builtin::BI__builtin_llroundf128:
3455 return RValue::get(V: emitMaybeConstrainedFPToIntRoundBuiltin(
3456 CGF&: *this, E, IntrinsicID: Intrinsic::llround,
3457 ConstrainedIntrinsicID: Intrinsic::experimental_constrained_llround));
3458
3459 case Builtin::BIlrint:
3460 case Builtin::BIlrintf:
3461 case Builtin::BIlrintl:
3462 case Builtin::BI__builtin_lrint:
3463 case Builtin::BI__builtin_lrintf:
3464 case Builtin::BI__builtin_lrintl:
3465 case Builtin::BI__builtin_lrintf128:
3466 return RValue::get(V: emitMaybeConstrainedFPToIntRoundBuiltin(
3467 CGF&: *this, E, IntrinsicID: Intrinsic::lrint,
3468 ConstrainedIntrinsicID: Intrinsic::experimental_constrained_lrint));
3469
3470 case Builtin::BIllrint:
3471 case Builtin::BIllrintf:
3472 case Builtin::BIllrintl:
3473 case Builtin::BI__builtin_llrint:
3474 case Builtin::BI__builtin_llrintf:
3475 case Builtin::BI__builtin_llrintl:
3476 case Builtin::BI__builtin_llrintf128:
3477 return RValue::get(V: emitMaybeConstrainedFPToIntRoundBuiltin(
3478 CGF&: *this, E, IntrinsicID: Intrinsic::llrint,
3479 ConstrainedIntrinsicID: Intrinsic::experimental_constrained_llrint));
3480 case Builtin::BI__builtin_ldexp:
3481 case Builtin::BI__builtin_ldexpf:
3482 case Builtin::BI__builtin_ldexpl:
3483 case Builtin::BI__builtin_ldexpf16:
3484 case Builtin::BI__builtin_ldexpf128:
3485 case Builtin::BI__builtin_elementwise_ldexp:
3486 return RValue::get(V: emitBinaryExpMaybeConstrainedFPBuiltin(
3487 CGF&: *this, E, IntrinsicID: Intrinsic::ldexp,
3488 ConstrainedIntrinsicID: Intrinsic::experimental_constrained_ldexp));
3489 default:
3490 break;
3491 }
3492 }
3493
3494 // Check NonnullAttribute/NullabilityArg and Alignment.
3495 auto EmitArgCheck = [&](TypeCheckKind Kind, Address A, const Expr *Arg,
3496 unsigned ParmNum) {
3497 Value *Val = A.emitRawPointer(CGF&: *this);
3498 EmitNonNullArgCheck(RV: RValue::get(V: Val), ArgType: Arg->getType(), ArgLoc: Arg->getExprLoc(), AC: FD,
3499 ParmNum);
3500
3501 if (SanOpts.has(K: SanitizerKind::Alignment)) {
3502 SanitizerSet SkippedChecks;
3503 SkippedChecks.set(SanitizerKind::All);
3504 SkippedChecks.clear(K: SanitizerKind::Alignment);
3505 SourceLocation Loc = Arg->getExprLoc();
3506 // Strip an implicit cast.
3507 if (auto *CE = dyn_cast<ImplicitCastExpr>(Val: Arg))
3508 if (CE->getCastKind() == CK_BitCast)
3509 Arg = CE->getSubExpr();
3510 EmitTypeCheck(TCK: Kind, Loc, V: Val, Type: Arg->getType(), Alignment: A.getAlignment(),
3511 SkippedChecks);
3512 }
3513 };
3514
3515 switch (BuiltinIDIfNoAsmLabel) {
3516 default: break;
3517 case Builtin::BI__builtin___CFStringMakeConstantString:
3518 case Builtin::BI__builtin___NSStringMakeConstantString:
3519 return RValue::get(V: ConstantEmitter(*this).emitAbstract(E, T: E->getType()));
3520 case Builtin::BI__builtin_stdarg_start:
3521 case Builtin::BI__builtin_va_start:
3522 case Builtin::BI__va_start:
3523 case Builtin::BI__builtin_c23_va_start:
3524 case Builtin::BI__builtin_va_end:
3525 EmitVAStartEnd(ArgValue: BuiltinID == Builtin::BI__va_start
3526 ? EmitScalarExpr(E: E->getArg(Arg: 0))
3527 : EmitVAListRef(E: E->getArg(Arg: 0)).emitRawPointer(CGF&: *this),
3528 IsStart: BuiltinID != Builtin::BI__builtin_va_end);
3529 return RValue::get(V: nullptr);
3530 case Builtin::BI__builtin_va_copy: {
3531 Value *DstPtr = EmitVAListRef(E: E->getArg(Arg: 0)).emitRawPointer(CGF&: *this);
3532 Value *SrcPtr = EmitVAListRef(E: E->getArg(Arg: 1)).emitRawPointer(CGF&: *this);
3533 Builder.CreateCall(Callee: CGM.getIntrinsic(IID: Intrinsic::vacopy, Tys: {DstPtr->getType()}),
3534 Args: {DstPtr, SrcPtr});
3535 return RValue::get(V: nullptr);
3536 }
3537 case Builtin::BIabs:
3538 case Builtin::BIlabs:
3539 case Builtin::BIllabs:
3540 case Builtin::BI__builtin_abs:
3541 case Builtin::BI__builtin_labs:
3542 case Builtin::BI__builtin_llabs: {
3543 bool SanitizeOverflow = SanOpts.has(K: SanitizerKind::SignedIntegerOverflow);
3544
3545 Value *Result;
3546 switch (getLangOpts().getSignedOverflowBehavior()) {
3547 case LangOptions::SOB_Defined:
3548 Result = EmitAbs(CGF&: *this, ArgValue: EmitScalarExpr(E: E->getArg(Arg: 0)), HasNSW: false);
3549 break;
3550 case LangOptions::SOB_Undefined:
3551 if (!SanitizeOverflow) {
3552 Result = EmitAbs(CGF&: *this, ArgValue: EmitScalarExpr(E: E->getArg(Arg: 0)), HasNSW: true);
3553 break;
3554 }
3555 [[fallthrough]];
3556 case LangOptions::SOB_Trapping:
3557 // TODO: Somehow handle the corner case when the address of abs is taken.
3558 Result = EmitOverflowCheckedAbs(CGF&: *this, E, SanitizeOverflow);
3559 break;
3560 }
3561 return RValue::get(V: Result);
3562 }
3563 case Builtin::BI__builtin_complex: {
3564 Value *Real = EmitScalarExpr(E: E->getArg(Arg: 0));
3565 Value *Imag = EmitScalarExpr(E: E->getArg(Arg: 1));
3566 return RValue::getComplex(C: {Real, Imag});
3567 }
3568 case Builtin::BI__builtin_conj:
3569 case Builtin::BI__builtin_conjf:
3570 case Builtin::BI__builtin_conjl:
3571 case Builtin::BIconj:
3572 case Builtin::BIconjf:
3573 case Builtin::BIconjl: {
3574 ComplexPairTy ComplexVal = EmitComplexExpr(E: E->getArg(Arg: 0));
3575 Value *Real = ComplexVal.first;
3576 Value *Imag = ComplexVal.second;
3577 Imag = Builder.CreateFNeg(V: Imag, Name: "neg");
3578 return RValue::getComplex(C: std::make_pair(x&: Real, y&: Imag));
3579 }
3580 case Builtin::BI__builtin_creal:
3581 case Builtin::BI__builtin_crealf:
3582 case Builtin::BI__builtin_creall:
3583 case Builtin::BIcreal:
3584 case Builtin::BIcrealf:
3585 case Builtin::BIcreall: {
3586 ComplexPairTy ComplexVal = EmitComplexExpr(E: E->getArg(Arg: 0));
3587 return RValue::get(V: ComplexVal.first);
3588 }
3589
3590 case Builtin::BI__builtin_preserve_access_index: {
3591 // Only enabled preserved access index region when debuginfo
3592 // is available as debuginfo is needed to preserve user-level
3593 // access pattern.
3594 if (!getDebugInfo()) {
3595 CGM.Error(loc: E->getExprLoc(), error: "using builtin_preserve_access_index() without -g");
3596 return RValue::get(V: EmitScalarExpr(E: E->getArg(Arg: 0)));
3597 }
3598
3599 // Nested builtin_preserve_access_index() not supported
3600 if (IsInPreservedAIRegion) {
3601 CGM.Error(loc: E->getExprLoc(), error: "nested builtin_preserve_access_index() not supported");
3602 return RValue::get(V: EmitScalarExpr(E: E->getArg(Arg: 0)));
3603 }
3604
3605 IsInPreservedAIRegion = true;
3606 Value *Res = EmitScalarExpr(E: E->getArg(Arg: 0));
3607 IsInPreservedAIRegion = false;
3608 return RValue::get(V: Res);
3609 }
3610
3611 case Builtin::BI__builtin_cimag:
3612 case Builtin::BI__builtin_cimagf:
3613 case Builtin::BI__builtin_cimagl:
3614 case Builtin::BIcimag:
3615 case Builtin::BIcimagf:
3616 case Builtin::BIcimagl: {
3617 ComplexPairTy ComplexVal = EmitComplexExpr(E: E->getArg(Arg: 0));
3618 return RValue::get(V: ComplexVal.second);
3619 }
3620
3621 case Builtin::BI__builtin_clrsb:
3622 case Builtin::BI__builtin_clrsbl:
3623 case Builtin::BI__builtin_clrsbll: {
3624 // clrsb(x) -> clz(x < 0 ? ~x : x) - 1 or
3625 Value *ArgValue = EmitScalarExpr(E: E->getArg(Arg: 0));
3626
3627 llvm::Type *ArgType = ArgValue->getType();
3628 Function *F = CGM.getIntrinsic(IID: Intrinsic::ctlz, Tys: ArgType);
3629
3630 llvm::Type *ResultType = ConvertType(T: E->getType());
3631 Value *Zero = llvm::Constant::getNullValue(Ty: ArgType);
3632 Value *IsNeg = Builder.CreateICmpSLT(LHS: ArgValue, RHS: Zero, Name: "isneg");
3633 Value *Inverse = Builder.CreateNot(V: ArgValue, Name: "not");
3634 Value *Tmp = Builder.CreateSelect(C: IsNeg, True: Inverse, False: ArgValue);
3635 Value *Ctlz = Builder.CreateCall(Callee: F, Args: {Tmp, Builder.getFalse()});
3636 Value *Result =
3637 Builder.CreateNUWSub(LHS: Ctlz, RHS: llvm::ConstantInt::get(Ty: ArgType, V: 1));
3638 Result = Builder.CreateIntCast(V: Result, DestTy: ResultType, /*isSigned*/true,
3639 Name: "cast");
3640 return RValue::get(V: Result);
3641 }
3642 case Builtin::BI__builtin_ctzs:
3643 case Builtin::BI__builtin_ctz:
3644 case Builtin::BI__builtin_ctzl:
3645 case Builtin::BI__builtin_ctzll:
3646 case Builtin::BI__builtin_ctzg:
3647 case Builtin::BI__builtin_elementwise_ctzg: {
3648 bool HasFallback =
3649 (BuiltinIDIfNoAsmLabel == Builtin::BI__builtin_ctzg ||
3650 BuiltinIDIfNoAsmLabel == Builtin::BI__builtin_elementwise_ctzg) &&
3651 E->getNumArgs() > 1;
3652
3653 Value *ArgValue =
3654 HasFallback ? EmitBitCountExpr(CGF&: *this, E: E->getArg(Arg: 0))
3655 : EmitCheckedArgForBuiltin(E: E->getArg(Arg: 0), Kind: BCK_CTZPassedZero);
3656
3657 llvm::Type *ArgType = ArgValue->getType();
3658 Function *F = CGM.getIntrinsic(IID: Intrinsic::cttz, Tys: ArgType);
3659
3660 llvm::Type *ResultType = ConvertType(T: E->getType());
3661 // The elementwise builtins always exhibit zero-is-undef behaviour
3662 Value *ZeroUndef = Builder.getInt1(
3663 V: HasFallback || getTarget().isCLZForZeroUndef() ||
3664 BuiltinIDIfNoAsmLabel == Builtin::BI__builtin_elementwise_ctzg);
3665 Value *Result = Builder.CreateCall(Callee: F, Args: {ArgValue, ZeroUndef});
3666 if (Result->getType() != ResultType)
3667 Result =
3668 Builder.CreateIntCast(V: Result, DestTy: ResultType, /*isSigned*/ false, Name: "cast");
3669 if (!HasFallback)
3670 return RValue::get(V: Result);
3671
3672 Value *Zero = Constant::getNullValue(Ty: ArgType);
3673 Value *IsZero = Builder.CreateICmpEQ(LHS: ArgValue, RHS: Zero, Name: "iszero");
3674 Value *FallbackValue = EmitScalarExpr(E: E->getArg(Arg: 1));
3675 Value *ResultOrFallback =
3676 Builder.CreateSelect(C: IsZero, True: FallbackValue, False: Result, Name: "ctzg");
3677 return RValue::get(V: ResultOrFallback);
3678 }
3679 case Builtin::BI__builtin_clzs:
3680 case Builtin::BI__builtin_clz:
3681 case Builtin::BI__builtin_clzl:
3682 case Builtin::BI__builtin_clzll:
3683 case Builtin::BI__builtin_clzg:
3684 case Builtin::BI__builtin_elementwise_clzg: {
3685 bool HasFallback =
3686 (BuiltinIDIfNoAsmLabel == Builtin::BI__builtin_clzg ||
3687 BuiltinIDIfNoAsmLabel == Builtin::BI__builtin_elementwise_clzg) &&
3688 E->getNumArgs() > 1;
3689
3690 Value *ArgValue =
3691 HasFallback ? EmitBitCountExpr(CGF&: *this, E: E->getArg(Arg: 0))
3692 : EmitCheckedArgForBuiltin(E: E->getArg(Arg: 0), Kind: BCK_CLZPassedZero);
3693
3694 llvm::Type *ArgType = ArgValue->getType();
3695 Function *F = CGM.getIntrinsic(IID: Intrinsic::ctlz, Tys: ArgType);
3696
3697 llvm::Type *ResultType = ConvertType(T: E->getType());
3698 // The elementwise builtins always exhibit zero-is-undef behaviour
3699 Value *ZeroUndef = Builder.getInt1(
3700 V: HasFallback || getTarget().isCLZForZeroUndef() ||
3701 BuiltinIDIfNoAsmLabel == Builtin::BI__builtin_elementwise_clzg);
3702 Value *Result = Builder.CreateCall(Callee: F, Args: {ArgValue, ZeroUndef});
3703 if (Result->getType() != ResultType)
3704 Result =
3705 Builder.CreateIntCast(V: Result, DestTy: ResultType, /*isSigned*/ false, Name: "cast");
3706 if (!HasFallback)
3707 return RValue::get(V: Result);
3708
3709 Value *Zero = Constant::getNullValue(Ty: ArgType);
3710 Value *IsZero = Builder.CreateICmpEQ(LHS: ArgValue, RHS: Zero, Name: "iszero");
3711 Value *FallbackValue = EmitScalarExpr(E: E->getArg(Arg: 1));
3712 Value *ResultOrFallback =
3713 Builder.CreateSelect(C: IsZero, True: FallbackValue, False: Result, Name: "clzg");
3714 return RValue::get(V: ResultOrFallback);
3715 }
3716 case Builtin::BI__builtin_ffs:
3717 case Builtin::BI__builtin_ffsl:
3718 case Builtin::BI__builtin_ffsll: {
3719 // ffs(x) -> x ? cttz(x) + 1 : 0
3720 Value *ArgValue = EmitScalarExpr(E: E->getArg(Arg: 0));
3721
3722 llvm::Type *ArgType = ArgValue->getType();
3723 Function *F = CGM.getIntrinsic(IID: Intrinsic::cttz, Tys: ArgType);
3724
3725 llvm::Type *ResultType = ConvertType(T: E->getType());
3726 Value *Tmp =
3727 Builder.CreateAdd(LHS: Builder.CreateCall(Callee: F, Args: {ArgValue, Builder.getTrue()}),
3728 RHS: llvm::ConstantInt::get(Ty: ArgType, V: 1));
3729 Value *Zero = llvm::Constant::getNullValue(Ty: ArgType);
3730 Value *IsZero = Builder.CreateICmpEQ(LHS: ArgValue, RHS: Zero, Name: "iszero");
3731 Value *Result = Builder.CreateSelect(C: IsZero, True: Zero, False: Tmp, Name: "ffs");
3732 if (Result->getType() != ResultType)
3733 Result = Builder.CreateIntCast(V: Result, DestTy: ResultType, /*isSigned*/true,
3734 Name: "cast");
3735 return RValue::get(V: Result);
3736 }
3737 case Builtin::BI__builtin_parity:
3738 case Builtin::BI__builtin_parityl:
3739 case Builtin::BI__builtin_parityll: {
3740 // parity(x) -> ctpop(x) & 1
3741 Value *ArgValue = EmitScalarExpr(E: E->getArg(Arg: 0));
3742
3743 llvm::Type *ArgType = ArgValue->getType();
3744 Function *F = CGM.getIntrinsic(IID: Intrinsic::ctpop, Tys: ArgType);
3745
3746 llvm::Type *ResultType = ConvertType(T: E->getType());
3747 Value *Tmp = Builder.CreateCall(Callee: F, Args: ArgValue);
3748 Value *Result = Builder.CreateAnd(LHS: Tmp, RHS: llvm::ConstantInt::get(Ty: ArgType, V: 1));
3749 if (Result->getType() != ResultType)
3750 Result = Builder.CreateIntCast(V: Result, DestTy: ResultType, /*isSigned*/true,
3751 Name: "cast");
3752 return RValue::get(V: Result);
3753 }
3754 case Builtin::BI__lzcnt16:
3755 case Builtin::BI__lzcnt:
3756 case Builtin::BI__lzcnt64: {
3757 Value *ArgValue = EmitScalarExpr(E: E->getArg(Arg: 0));
3758
3759 llvm::Type *ArgType = ArgValue->getType();
3760 Function *F = CGM.getIntrinsic(IID: Intrinsic::ctlz, Tys: ArgType);
3761
3762 llvm::Type *ResultType = ConvertType(T: E->getType());
3763 Value *Result = Builder.CreateCall(Callee: F, Args: {ArgValue, Builder.getFalse()});
3764 if (Result->getType() != ResultType)
3765 Result = Builder.CreateIntCast(V: Result, DestTy: ResultType, /*isSigned*/true,
3766 Name: "cast");
3767 return RValue::get(V: Result);
3768 }
3769 case Builtin::BI__popcnt16:
3770 case Builtin::BI__popcnt:
3771 case Builtin::BI__popcnt64:
3772 case Builtin::BI__builtin_popcount:
3773 case Builtin::BI__builtin_popcountl:
3774 case Builtin::BI__builtin_popcountll:
3775 case Builtin::BI__builtin_popcountg: {
3776 Value *ArgValue = EmitBitCountExpr(CGF&: *this, E: E->getArg(Arg: 0));
3777
3778 llvm::Type *ArgType = ArgValue->getType();
3779 Function *F = CGM.getIntrinsic(IID: Intrinsic::ctpop, Tys: ArgType);
3780
3781 llvm::Type *ResultType = ConvertType(T: E->getType());
3782 Value *Result = Builder.CreateCall(Callee: F, Args: ArgValue);
3783 if (Result->getType() != ResultType)
3784 Result =
3785 Builder.CreateIntCast(V: Result, DestTy: ResultType, /*isSigned*/ false, Name: "cast");
3786 return RValue::get(V: Result);
3787 }
3788 case Builtin::BI__builtin_unpredictable: {
3789 // Always return the argument of __builtin_unpredictable. LLVM does not
3790 // handle this builtin. Metadata for this builtin should be added directly
3791 // to instructions such as branches or switches that use it.
3792 return RValue::get(V: EmitScalarExpr(E: E->getArg(Arg: 0)));
3793 }
3794 case Builtin::BI__builtin_expect: {
3795 Value *ArgValue = EmitScalarExpr(E: E->getArg(Arg: 0));
3796 llvm::Type *ArgType = ArgValue->getType();
3797
3798 Value *ExpectedValue = EmitScalarExpr(E: E->getArg(Arg: 1));
3799 // Don't generate llvm.expect on -O0 as the backend won't use it for
3800 // anything.
3801 // Note, we still IRGen ExpectedValue because it could have side-effects.
3802 if (CGM.getCodeGenOpts().OptimizationLevel == 0)
3803 return RValue::get(V: ArgValue);
3804
3805 Function *FnExpect = CGM.getIntrinsic(IID: Intrinsic::expect, Tys: ArgType);
3806 Value *Result =
3807 Builder.CreateCall(Callee: FnExpect, Args: {ArgValue, ExpectedValue}, Name: "expval");
3808 return RValue::get(V: Result);
3809 }
3810 case Builtin::BI__builtin_expect_with_probability: {
3811 Value *ArgValue = EmitScalarExpr(E: E->getArg(Arg: 0));
3812 llvm::Type *ArgType = ArgValue->getType();
3813
3814 Value *ExpectedValue = EmitScalarExpr(E: E->getArg(Arg: 1));
3815 llvm::APFloat Probability(0.0);
3816 const Expr *ProbArg = E->getArg(Arg: 2);
3817 bool EvalSucceed = ProbArg->EvaluateAsFloat(Result&: Probability, Ctx: CGM.getContext());
3818 assert(EvalSucceed && "probability should be able to evaluate as float");
3819 (void)EvalSucceed;
3820 bool LoseInfo = false;
3821 Probability.convert(ToSemantics: llvm::APFloat::IEEEdouble(),
3822 RM: llvm::RoundingMode::Dynamic, losesInfo: &LoseInfo);
3823 llvm::Type *Ty = ConvertType(T: ProbArg->getType());
3824 Constant *Confidence = ConstantFP::get(Ty, V: Probability);
3825 // Don't generate llvm.expect.with.probability on -O0 as the backend
3826 // won't use it for anything.
3827 // Note, we still IRGen ExpectedValue because it could have side-effects.
3828 if (CGM.getCodeGenOpts().OptimizationLevel == 0)
3829 return RValue::get(V: ArgValue);
3830
3831 Function *FnExpect =
3832 CGM.getIntrinsic(IID: Intrinsic::expect_with_probability, Tys: ArgType);
3833 Value *Result = Builder.CreateCall(
3834 Callee: FnExpect, Args: {ArgValue, ExpectedValue, Confidence}, Name: "expval");
3835 return RValue::get(V: Result);
3836 }
3837 case Builtin::BI__builtin_assume_aligned: {
3838 const Expr *Ptr = E->getArg(Arg: 0);
3839 Value *PtrValue = EmitScalarExpr(E: Ptr);
3840 Value *OffsetValue =
3841 (E->getNumArgs() > 2) ? EmitScalarExpr(E: E->getArg(Arg: 2)) : nullptr;
3842
3843 Value *AlignmentValue = EmitScalarExpr(E: E->getArg(Arg: 1));
3844 ConstantInt *AlignmentCI = cast<ConstantInt>(Val: AlignmentValue);
3845 if (AlignmentCI->getValue().ugt(RHS: llvm::Value::MaximumAlignment))
3846 AlignmentCI = ConstantInt::get(Ty: AlignmentCI->getIntegerType(),
3847 V: llvm::Value::MaximumAlignment);
3848
3849 emitAlignmentAssumption(PtrValue, E: Ptr,
3850 /*The expr loc is sufficient.*/ AssumptionLoc: SourceLocation(),
3851 Alignment: AlignmentCI, OffsetValue);
3852 return RValue::get(V: PtrValue);
3853 }
3854 case Builtin::BI__builtin_assume_dereferenceable: {
3855 const Expr *Ptr = E->getArg(Arg: 0);
3856 const Expr *Size = E->getArg(Arg: 1);
3857 Value *PtrValue = EmitScalarExpr(E: Ptr);
3858 Value *SizeValue = EmitScalarExpr(E: Size);
3859 if (SizeValue->getType() != IntPtrTy)
3860 SizeValue =
3861 Builder.CreateIntCast(V: SizeValue, DestTy: IntPtrTy, isSigned: false, Name: "casted.size");
3862 Builder.CreateDereferenceableAssumption(PtrValue, SizeValue);
3863 return RValue::get(V: nullptr);
3864 }
3865 case Builtin::BI__assume:
3866 case Builtin::BI__builtin_assume: {
3867 if (E->getArg(Arg: 0)->HasSideEffects(Ctx: getContext()))
3868 return RValue::get(V: nullptr);
3869
3870 Value *ArgValue = EmitCheckedArgForAssume(E: E->getArg(Arg: 0));
3871 Function *FnAssume = CGM.getIntrinsic(IID: Intrinsic::assume);
3872 Builder.CreateCall(Callee: FnAssume, Args: ArgValue);
3873 return RValue::get(V: nullptr);
3874 }
3875 case Builtin::BI__builtin_assume_separate_storage: {
3876 const Expr *Arg0 = E->getArg(Arg: 0);
3877 const Expr *Arg1 = E->getArg(Arg: 1);
3878
3879 Value *Value0 = EmitScalarExpr(E: Arg0);
3880 Value *Value1 = EmitScalarExpr(E: Arg1);
3881
3882 Value *Values[] = {Value0, Value1};
3883 OperandBundleDefT<Value *> OBD("separate_storage", Values);
3884 Builder.CreateAssumption(OpBundles: {OBD});
3885 return RValue::get(V: nullptr);
3886 }
3887 case Builtin::BI__builtin_allow_runtime_check: {
3888 StringRef Kind =
3889 cast<StringLiteral>(Val: E->getArg(Arg: 0)->IgnoreParenCasts())->getString();
3890 LLVMContext &Ctx = CGM.getLLVMContext();
3891 llvm::Value *Allow = Builder.CreateCall(
3892 Callee: CGM.getIntrinsic(IID: Intrinsic::allow_runtime_check),
3893 Args: llvm::MetadataAsValue::get(Context&: Ctx, MD: llvm::MDString::get(Context&: Ctx, Str: Kind)));
3894 return RValue::get(V: Allow);
3895 }
3896 case Builtin::BI__builtin_allow_sanitize_check: {
3897 Intrinsic::ID IntrID = Intrinsic::not_intrinsic;
3898 StringRef Name =
3899 cast<StringLiteral>(Val: E->getArg(Arg: 0)->IgnoreParenCasts())->getString();
3900
3901 // We deliberately allow the use of kernel- and non-kernel names
3902 // interchangably, even when one or the other is enabled. This is consistent
3903 // with the no_sanitize-attribute, which allows either kernel- or non-kernel
3904 // name to disable instrumentation (see CodeGenFunction::StartFunction).
3905 if (getLangOpts().Sanitize.hasOneOf(K: SanitizerKind::Address |
3906 SanitizerKind::KernelAddress) &&
3907 (Name == "address" || Name == "kernel-address")) {
3908 IntrID = Intrinsic::allow_sanitize_address;
3909 } else if (getLangOpts().Sanitize.has(K: SanitizerKind::Thread) &&
3910 Name == "thread") {
3911 IntrID = Intrinsic::allow_sanitize_thread;
3912 } else if (getLangOpts().Sanitize.hasOneOf(K: SanitizerKind::Memory |
3913 SanitizerKind::KernelMemory) &&
3914 (Name == "memory" || Name == "kernel-memory")) {
3915 IntrID = Intrinsic::allow_sanitize_memory;
3916 } else if (getLangOpts().Sanitize.hasOneOf(
3917 K: SanitizerKind::HWAddress | SanitizerKind::KernelHWAddress) &&
3918 (Name == "hwaddress" || Name == "kernel-hwaddress")) {
3919 IntrID = Intrinsic::allow_sanitize_hwaddress;
3920 }
3921
3922 if (IntrID != Intrinsic::not_intrinsic) {
3923 llvm::Value *Allow = Builder.CreateCall(Callee: CGM.getIntrinsic(IID: IntrID));
3924 return RValue::get(V: Allow);
3925 }
3926 // If the checked sanitizer is not enabled, we can safely lower to false
3927 // right away. This is also more efficient, since the LowerAllowCheckPass
3928 // must not always be enabled if none of the above sanitizers are enabled.
3929 return RValue::get(V: Builder.getFalse());
3930 }
3931 case Builtin::BI__arithmetic_fence: {
3932 // Create the builtin call if FastMath is selected, and the target
3933 // supports the builtin, otherwise just return the argument.
3934 CodeGenFunction::CGFPOptionsRAII FPOptsRAII(*this, E);
3935 llvm::FastMathFlags FMF = Builder.getFastMathFlags();
3936 bool isArithmeticFenceEnabled =
3937 FMF.allowReassoc() &&
3938 getContext().getTargetInfo().checkArithmeticFenceSupported();
3939 QualType ArgType = E->getArg(Arg: 0)->getType();
3940 if (ArgType->isComplexType()) {
3941 if (isArithmeticFenceEnabled) {
3942 QualType ElementType = ArgType->castAs<ComplexType>()->getElementType();
3943 ComplexPairTy ComplexVal = EmitComplexExpr(E: E->getArg(Arg: 0));
3944 Value *Real = Builder.CreateArithmeticFence(Val: ComplexVal.first,
3945 DstType: ConvertType(T: ElementType));
3946 Value *Imag = Builder.CreateArithmeticFence(Val: ComplexVal.second,
3947 DstType: ConvertType(T: ElementType));
3948 return RValue::getComplex(C: std::make_pair(x&: Real, y&: Imag));
3949 }
3950 ComplexPairTy ComplexVal = EmitComplexExpr(E: E->getArg(Arg: 0));
3951 Value *Real = ComplexVal.first;
3952 Value *Imag = ComplexVal.second;
3953 return RValue::getComplex(C: std::make_pair(x&: Real, y&: Imag));
3954 }
3955 Value *ArgValue = EmitScalarExpr(E: E->getArg(Arg: 0));
3956 if (isArithmeticFenceEnabled)
3957 return RValue::get(
3958 V: Builder.CreateArithmeticFence(Val: ArgValue, DstType: ConvertType(T: ArgType)));
3959 return RValue::get(V: ArgValue);
3960 }
3961 case Builtin::BI__builtin_bswapg: {
3962 Value *ArgValue = EmitScalarExpr(E: E->getArg(Arg: 0));
3963 llvm::IntegerType *IntTy = cast<llvm::IntegerType>(Val: ArgValue->getType());
3964 assert(IntTy && "LLVM's __builtin_bswapg only supports integer variants");
3965 if (IntTy->getBitWidth() == 1 || IntTy->getBitWidth() == 8)
3966 return RValue::get(V: ArgValue);
3967 assert(((IntTy->getBitWidth() % 16 == 0 && IntTy->getBitWidth() != 0)) &&
3968 "LLVM's __builtin_bswapg only supports integer variants that has a "
3969 "multiple of 16 bits as well as a single byte");
3970 return RValue::get(
3971 V: emitBuiltinWithOneOverloadedType<1>(CGF&: *this, E, IntrinsicID: Intrinsic::bswap));
3972 }
3973 case Builtin::BI__builtin_bswap16:
3974 case Builtin::BI__builtin_bswap32:
3975 case Builtin::BI__builtin_bswap64:
3976 case Builtin::BI_byteswap_ushort:
3977 case Builtin::BI_byteswap_ulong:
3978 case Builtin::BI_byteswap_uint64: {
3979 return RValue::get(
3980 V: emitBuiltinWithOneOverloadedType<1>(CGF&: *this, E, IntrinsicID: Intrinsic::bswap));
3981 }
3982 case Builtin::BI__builtin_bitreverseg: {
3983 Value *ArgValue = EmitScalarExpr(E: E->getArg(Arg: 0));
3984 llvm::IntegerType *IntTy = cast<llvm::IntegerType>(Val: ArgValue->getType());
3985 assert(IntTy &&
3986 "LLVM's __builtin_bitreverseg only support integer variants");
3987 if (IntTy->getBitWidth() == 1)
3988 return RValue::get(V: ArgValue);
3989 return RValue::get(
3990 V: emitBuiltinWithOneOverloadedType<1>(CGF&: *this, E, IntrinsicID: Intrinsic::bitreverse));
3991 }
3992 case Builtin::BI__builtin_bitreverse8:
3993 case Builtin::BI__builtin_bitreverse16:
3994 case Builtin::BI__builtin_bitreverse32:
3995 case Builtin::BI__builtin_bitreverse64: {
3996 return RValue::get(
3997 V: emitBuiltinWithOneOverloadedType<1>(CGF&: *this, E, IntrinsicID: Intrinsic::bitreverse));
3998 }
3999 case Builtin::BI__builtin_rotateleft8:
4000 case Builtin::BI__builtin_rotateleft16:
4001 case Builtin::BI__builtin_rotateleft32:
4002 case Builtin::BI__builtin_rotateleft64:
4003 case Builtin::BI__builtin_stdc_rotate_left:
4004 case Builtin::BIstdc_rotate_left_uc:
4005 case Builtin::BIstdc_rotate_left_us:
4006 case Builtin::BIstdc_rotate_left_ui:
4007 case Builtin::BIstdc_rotate_left_ul:
4008 case Builtin::BIstdc_rotate_left_ull:
4009 case Builtin::BI_rotl8: // Microsoft variants of rotate left
4010 case Builtin::BI_rotl16:
4011 case Builtin::BI_rotl:
4012 case Builtin::BI_lrotl:
4013 case Builtin::BI_rotl64:
4014 return emitRotate(E, IsRotateRight: false);
4015
4016 case Builtin::BI__builtin_rotateright8:
4017 case Builtin::BI__builtin_rotateright16:
4018 case Builtin::BI__builtin_rotateright32:
4019 case Builtin::BI__builtin_rotateright64:
4020 case Builtin::BI__builtin_stdc_rotate_right:
4021 case Builtin::BIstdc_rotate_right_uc:
4022 case Builtin::BIstdc_rotate_right_us:
4023 case Builtin::BIstdc_rotate_right_ui:
4024 case Builtin::BIstdc_rotate_right_ul:
4025 case Builtin::BIstdc_rotate_right_ull:
4026 case Builtin::BI_rotr8: // Microsoft variants of rotate right
4027 case Builtin::BI_rotr16:
4028 case Builtin::BI_rotr:
4029 case Builtin::BI_lrotr:
4030 case Builtin::BI_rotr64:
4031 return emitRotate(E, IsRotateRight: true);
4032
4033 case Builtin::BIstdc_leading_zeros_uc:
4034 case Builtin::BIstdc_leading_zeros_us:
4035 case Builtin::BIstdc_leading_zeros_ui:
4036 case Builtin::BIstdc_leading_zeros_ul:
4037 case Builtin::BIstdc_leading_zeros_ull:
4038 case Builtin::BI__builtin_stdc_leading_zeros:
4039 return emitStdcCountIntrinsic(E, IntID: Intrinsic::ctlz, /*InvertArg=*/false);
4040 case Builtin::BIstdc_leading_ones_uc:
4041 case Builtin::BIstdc_leading_ones_us:
4042 case Builtin::BIstdc_leading_ones_ui:
4043 case Builtin::BIstdc_leading_ones_ul:
4044 case Builtin::BIstdc_leading_ones_ull:
4045 case Builtin::BI__builtin_stdc_leading_ones:
4046 return emitStdcCountIntrinsic(E, IntID: Intrinsic::ctlz, /*InvertArg=*/true);
4047 case Builtin::BIstdc_trailing_zeros_uc:
4048 case Builtin::BIstdc_trailing_zeros_us:
4049 case Builtin::BIstdc_trailing_zeros_ui:
4050 case Builtin::BIstdc_trailing_zeros_ul:
4051 case Builtin::BIstdc_trailing_zeros_ull:
4052 case Builtin::BI__builtin_stdc_trailing_zeros:
4053 return emitStdcCountIntrinsic(E, IntID: Intrinsic::cttz, /*InvertArg=*/false);
4054 case Builtin::BIstdc_trailing_ones_uc:
4055 case Builtin::BIstdc_trailing_ones_us:
4056 case Builtin::BIstdc_trailing_ones_ui:
4057 case Builtin::BIstdc_trailing_ones_ul:
4058 case Builtin::BIstdc_trailing_ones_ull:
4059 case Builtin::BI__builtin_stdc_trailing_ones:
4060 return emitStdcCountIntrinsic(E, IntID: Intrinsic::cttz, /*InvertArg=*/true);
4061 case Builtin::BIstdc_first_leading_zero_uc:
4062 case Builtin::BIstdc_first_leading_zero_us:
4063 case Builtin::BIstdc_first_leading_zero_ui:
4064 case Builtin::BIstdc_first_leading_zero_ul:
4065 case Builtin::BIstdc_first_leading_zero_ull:
4066 case Builtin::BI__builtin_stdc_first_leading_zero:
4067 return emitStdcFirstBit(E, IntID: Intrinsic::ctlz, /*InvertArg=*/true);
4068 case Builtin::BIstdc_first_leading_one_uc:
4069 case Builtin::BIstdc_first_leading_one_us:
4070 case Builtin::BIstdc_first_leading_one_ui:
4071 case Builtin::BIstdc_first_leading_one_ul:
4072 case Builtin::BIstdc_first_leading_one_ull:
4073 case Builtin::BI__builtin_stdc_first_leading_one:
4074 return emitStdcFirstBit(E, IntID: Intrinsic::ctlz, /*InvertArg=*/false);
4075 case Builtin::BIstdc_first_trailing_zero_uc:
4076 case Builtin::BIstdc_first_trailing_zero_us:
4077 case Builtin::BIstdc_first_trailing_zero_ui:
4078 case Builtin::BIstdc_first_trailing_zero_ul:
4079 case Builtin::BIstdc_first_trailing_zero_ull:
4080 case Builtin::BI__builtin_stdc_first_trailing_zero:
4081 return emitStdcFirstBit(E, IntID: Intrinsic::cttz, /*InvertArg=*/true);
4082 case Builtin::BIstdc_first_trailing_one_uc:
4083 case Builtin::BIstdc_first_trailing_one_us:
4084 case Builtin::BIstdc_first_trailing_one_ui:
4085 case Builtin::BIstdc_first_trailing_one_ul:
4086 case Builtin::BIstdc_first_trailing_one_ull:
4087 case Builtin::BI__builtin_stdc_first_trailing_one:
4088 return emitStdcFirstBit(E, IntID: Intrinsic::cttz, /*InvertArg=*/false);
4089 case Builtin::BIstdc_count_zeros_uc:
4090 case Builtin::BIstdc_count_zeros_us:
4091 case Builtin::BIstdc_count_zeros_ui:
4092 case Builtin::BIstdc_count_zeros_ul:
4093 case Builtin::BIstdc_count_zeros_ull:
4094 case Builtin::BI__builtin_stdc_count_zeros:
4095 return emitStdcBitWidthMinus(E, IntID: Intrinsic::ctpop, /*IsPop=*/true);
4096 case Builtin::BIstdc_count_ones_uc:
4097 case Builtin::BIstdc_count_ones_us:
4098 case Builtin::BIstdc_count_ones_ui:
4099 case Builtin::BIstdc_count_ones_ul:
4100 case Builtin::BIstdc_count_ones_ull:
4101 case Builtin::BI__builtin_stdc_count_ones:
4102 return emitStdcCountIntrinsic(E, IntID: Intrinsic::ctpop, /*InvertArg=*/false,
4103 /*IsPop=*/true);
4104 case Builtin::BIstdc_has_single_bit_uc:
4105 case Builtin::BIstdc_has_single_bit_us:
4106 case Builtin::BIstdc_has_single_bit_ui:
4107 case Builtin::BIstdc_has_single_bit_ul:
4108 case Builtin::BIstdc_has_single_bit_ull:
4109 case Builtin::BI__builtin_stdc_has_single_bit: {
4110 Value *ArgValue = EmitScalarExpr(E: E->getArg(Arg: 0));
4111 llvm::Type *ArgType = ArgValue->getType();
4112 Value *One = ConstantInt::get(Ty: ArgType, V: 1);
4113 Function *F = CGM.getIntrinsic(IID: Intrinsic::ctpop, Tys: ArgType);
4114 Value *PopCnt = Builder.CreateCall(Callee: F, Args: ArgValue);
4115 return RValue::get(V: Builder.CreateICmpEQ(LHS: PopCnt, RHS: One));
4116 }
4117 case Builtin::BIstdc_bit_width_uc:
4118 case Builtin::BIstdc_bit_width_us:
4119 case Builtin::BIstdc_bit_width_ui:
4120 case Builtin::BIstdc_bit_width_ul:
4121 case Builtin::BIstdc_bit_width_ull:
4122 case Builtin::BI__builtin_stdc_bit_width:
4123 return emitStdcBitWidthMinus(E, IntID: Intrinsic::ctlz, /*IsPop=*/false);
4124 case Builtin::BIstdc_bit_floor_uc:
4125 case Builtin::BIstdc_bit_floor_us:
4126 case Builtin::BIstdc_bit_floor_ui:
4127 case Builtin::BIstdc_bit_floor_ul:
4128 case Builtin::BIstdc_bit_floor_ull:
4129 case Builtin::BI__builtin_stdc_bit_floor: {
4130 Value *ArgValue = EmitScalarExpr(E: E->getArg(Arg: 0));
4131 llvm::Type *ArgType = ArgValue->getType();
4132 unsigned BitWidth = ArgType->getIntegerBitWidth();
4133 Value *Zero = ConstantInt::get(Ty: ArgType, V: 0);
4134 Value *One = ConstantInt::get(Ty: ArgType, V: 1);
4135 Function *F = CGM.getIntrinsic(IID: Intrinsic::ctlz, Tys: ArgType);
4136 Value *LZ = Builder.CreateCall(Callee: F, Args: {ArgValue, Builder.getTrue()});
4137 Value *ShiftAmt =
4138 Builder.CreateSub(LHS: ConstantInt::get(Ty: ArgType, V: BitWidth - 1), RHS: LZ);
4139 Value *Shifted = Builder.CreateShl(LHS: One, RHS: ShiftAmt);
4140 Value *IsZero = Builder.CreateICmpEQ(LHS: ArgValue, RHS: Zero);
4141 Value *Result = Builder.CreateSelect(C: IsZero, True: Zero, False: Shifted);
4142 return RValue::get(V: Result);
4143 }
4144 case Builtin::BIstdc_bit_ceil_uc:
4145 case Builtin::BIstdc_bit_ceil_us:
4146 case Builtin::BIstdc_bit_ceil_ui:
4147 case Builtin::BIstdc_bit_ceil_ul:
4148 case Builtin::BIstdc_bit_ceil_ull:
4149 case Builtin::BI__builtin_stdc_bit_ceil: {
4150 Value *ArgValue = EmitScalarExpr(E: E->getArg(Arg: 0));
4151 llvm::Type *ArgType = ArgValue->getType();
4152 unsigned BitWidth = ArgType->getIntegerBitWidth();
4153 Value *One = ConstantInt::get(Ty: ArgType, V: 1);
4154 Value *Two = ConstantInt::get(Ty: ArgType, V: 2);
4155
4156 Value *IsLEOne = Builder.CreateICmpULE(LHS: ArgValue, RHS: One, Name: "isleone");
4157
4158 BasicBlock *EntryBB = Builder.GetInsertBlock();
4159 BasicBlock *CalcBB = createBasicBlock(name: "bitceil.calc", parent: CurFn);
4160 BasicBlock *MergeBB = createBasicBlock(name: "bitceil.merge", parent: CurFn);
4161
4162 Builder.CreateCondBr(Cond: IsLEOne, True: MergeBB, False: CalcBB);
4163
4164 Builder.SetInsertPoint(CalcBB);
4165 Function *F = CGM.getIntrinsic(IID: Intrinsic::ctlz, Tys: ArgType);
4166 Value *ArgMinusOne = Builder.CreateSub(LHS: ArgValue, RHS: One);
4167 Value *LZ = Builder.CreateCall(Callee: F, Args: {ArgMinusOne, Builder.getFalse()});
4168 // 2<<(BitWidth-1-LZ) to get the next power of two. The shift
4169 // amount is always in [0, BitWidth-1], so when LZ==0 (argument has its MSB
4170 // set), the result wraps to 0
4171 Value *ShiftAmt =
4172 Builder.CreateSub(LHS: ConstantInt::get(Ty: ArgType, V: BitWidth - 1), RHS: LZ);
4173 Value *Tmp = Builder.CreateShl(LHS: Two, RHS: ShiftAmt);
4174 Builder.CreateBr(Dest: MergeBB);
4175
4176 Builder.SetInsertPoint(MergeBB);
4177 PHINode *Phi = Builder.CreatePHI(Ty: ArgType, NumReservedValues: 2);
4178 Phi->addIncoming(V: One, BB: EntryBB);
4179 Phi->addIncoming(V: Tmp, BB: CalcBB);
4180 return RValue::get(V: Phi);
4181 }
4182
4183 // stdc_memreverse8u8 is a no-op (single byte, nothing to swap).
4184 case Builtin::BIstdc_memreverse8u8:
4185 return RValue::get(V: EmitScalarExpr(E: E->getArg(Arg: 0)));
4186
4187 case Builtin::BIstdc_memreverse8u16:
4188 case Builtin::BIstdc_memreverse8u32:
4189 case Builtin::BIstdc_memreverse8u64:
4190 return RValue::get(
4191 V: emitBuiltinWithOneOverloadedType<1>(CGF&: *this, E, IntrinsicID: Intrinsic::bswap));
4192
4193 case Builtin::BIstdc_memreverse8:
4194 case Builtin::BI__builtin_stdc_memreverse8: {
4195 Expr::EvalResult R;
4196 if (E->getArg(Arg: 0)->EvaluateAsInt(Result&: R, Ctx: getContext())) {
4197 uint64_t Size = R.Val.getInt().getZExtValue();
4198 if (Size <= 1) {
4199 EmitIgnoredExpr(E: E->getArg(Arg: 1));
4200 return RValue::get(V: nullptr);
4201 }
4202 if (Size == 2 || Size == 4 || Size == 8) {
4203 llvm::Type *IntTy = Builder.getIntNTy(N: Size * 8);
4204 Address PtrAddr = EmitPointerWithAlignment(Addr: E->getArg(Arg: 1));
4205 Address Addr = PtrAddr.withElementType(ElemTy: IntTy);
4206 Value *Val = Builder.CreateLoad(Addr);
4207 Function *F = CGM.getIntrinsic(IID: Intrinsic::bswap, Tys: IntTy);
4208 Value *Swapped = Builder.CreateCall(Callee: F, Args: Val);
4209 Builder.CreateStore(Val: Swapped, Addr);
4210 return RValue::get(V: nullptr);
4211 }
4212 }
4213
4214 // General case: fall back to the library function stdc_memreverse8.
4215 break;
4216 }
4217
4218 case Builtin::BI__builtin_constant_p: {
4219 llvm::Type *ResultType = ConvertType(T: E->getType());
4220
4221 const Expr *Arg = E->getArg(Arg: 0);
4222 QualType ArgType = Arg->getType();
4223 // FIXME: The allowance for Obj-C pointers and block pointers is historical
4224 // and likely a mistake.
4225 if (!ArgType->isIntegralOrEnumerationType() && !ArgType->isFloatingType() &&
4226 !ArgType->isObjCObjectPointerType() && !ArgType->isBlockPointerType())
4227 // Per the GCC documentation, only numeric constants are recognized after
4228 // inlining.
4229 return RValue::get(V: ConstantInt::get(Ty: ResultType, V: 0));
4230
4231 if (Arg->HasSideEffects(Ctx: getContext()))
4232 // The argument is unevaluated, so be conservative if it might have
4233 // side-effects.
4234 return RValue::get(V: ConstantInt::get(Ty: ResultType, V: 0));
4235
4236 Value *ArgValue = EmitScalarExpr(E: Arg);
4237 if (ArgType->isObjCObjectPointerType()) {
4238 // Convert Objective-C objects to id because we cannot distinguish between
4239 // LLVM types for Obj-C classes as they are opaque.
4240 ArgType = CGM.getContext().getObjCIdType();
4241 ArgValue = Builder.CreateBitCast(V: ArgValue, DestTy: ConvertType(T: ArgType));
4242 }
4243 Function *F =
4244 CGM.getIntrinsic(IID: Intrinsic::is_constant, Tys: ConvertType(T: ArgType));
4245 Value *Result = Builder.CreateCall(Callee: F, Args: ArgValue);
4246 if (Result->getType() != ResultType)
4247 Result = Builder.CreateIntCast(V: Result, DestTy: ResultType, /*isSigned*/false);
4248 return RValue::get(V: Result);
4249 }
4250 case Builtin::BI__builtin_dynamic_object_size:
4251 case Builtin::BI__builtin_object_size: {
4252 unsigned Type =
4253 E->getArg(Arg: 1)->EvaluateKnownConstInt(Ctx: getContext()).getZExtValue();
4254 auto *ResType = cast<llvm::IntegerType>(Val: ConvertType(T: E->getType()));
4255
4256 // We pass this builtin onto the optimizer so that it can figure out the
4257 // object size in more complex cases.
4258 bool IsDynamic = BuiltinID == Builtin::BI__builtin_dynamic_object_size;
4259 return RValue::get(V: emitBuiltinObjectSize(E: E->getArg(Arg: 0), Type, ResType,
4260 /*EmittedE=*/nullptr, IsDynamic));
4261 }
4262 case Builtin::BI__builtin_counted_by_ref: {
4263 // Default to returning '(void *) 0'.
4264 llvm::Value *Result = llvm::ConstantPointerNull::get(
4265 T: llvm::PointerType::getUnqual(C&: getLLVMContext()));
4266
4267 const Expr *Arg = E->getArg(Arg: 0)->IgnoreParenImpCasts();
4268
4269 if (auto *UO = dyn_cast<UnaryOperator>(Val: Arg);
4270 UO && UO->getOpcode() == UO_AddrOf) {
4271 Arg = UO->getSubExpr()->IgnoreParenImpCasts();
4272
4273 if (auto *ASE = dyn_cast<ArraySubscriptExpr>(Val: Arg))
4274 Arg = ASE->getBase()->IgnoreParenImpCasts();
4275 }
4276
4277 if (const MemberExpr *ME = dyn_cast_if_present<MemberExpr>(Val: Arg)) {
4278 if (auto *CATy =
4279 ME->getMemberDecl()->getType()->getAs<CountAttributedType>();
4280 CATy && CATy->getKind() == CountAttributedType::CountedBy) {
4281 const auto *MemberDecl = cast<FieldDecl>(Val: ME->getMemberDecl());
4282 if (const FieldDecl *CountFD = MemberDecl->findCountedByField())
4283 Result = GetCountedByFieldExprGEP(Base: Arg, FD: MemberDecl, CountDecl: CountFD);
4284 else
4285 llvm::report_fatal_error(reason: "Cannot find the counted_by 'count' field");
4286 }
4287 }
4288
4289 return RValue::get(V: Result);
4290 }
4291 case Builtin::BI__builtin_prefetch: {
4292 Value *Locality, *RW, *Address = EmitScalarExpr(E: E->getArg(Arg: 0));
4293 unsigned ICEArguments = (1 << 1) | (1 << 2);
4294 // FIXME: Technically these constants should of type 'int', yes?
4295 RW = (E->getNumArgs() > 1) ? EmitScalarOrConstFoldImmArg(ICEArguments, Idx: 1, E)
4296 : llvm::ConstantInt::get(Ty: Int32Ty, V: 0);
4297 Locality = (E->getNumArgs() > 2)
4298 ? EmitScalarOrConstFoldImmArg(ICEArguments, Idx: 2, E)
4299 : llvm::ConstantInt::get(Ty: Int32Ty, V: 3);
4300 Value *Data = llvm::ConstantInt::get(Ty: Int32Ty, V: 1);
4301 Function *F = CGM.getIntrinsic(IID: Intrinsic::prefetch, Tys: Address->getType());
4302 Builder.CreateCall(Callee: F, Args: {Address, RW, Locality, Data});
4303 return RValue::get(V: nullptr);
4304 }
4305 case Builtin::BI__builtin_readcyclecounter: {
4306 Function *F = CGM.getIntrinsic(IID: Intrinsic::readcyclecounter);
4307 return RValue::get(V: Builder.CreateCall(Callee: F));
4308 }
4309 case Builtin::BI__builtin_readsteadycounter: {
4310 Function *F = CGM.getIntrinsic(IID: Intrinsic::readsteadycounter);
4311 return RValue::get(V: Builder.CreateCall(Callee: F));
4312 }
4313 case Builtin::BI__builtin___clear_cache: {
4314 Value *Begin = EmitScalarExpr(E: E->getArg(Arg: 0));
4315 Value *End = EmitScalarExpr(E: E->getArg(Arg: 1));
4316 Function *F = CGM.getIntrinsic(IID: Intrinsic::clear_cache, Tys: {CGM.DefaultPtrTy});
4317 return RValue::get(V: Builder.CreateCall(Callee: F, Args: {Begin, End}));
4318 }
4319 case Builtin::BI__builtin_trap:
4320 EmitTrapCall(IntrID: Intrinsic::trap);
4321 return RValue::get(V: nullptr);
4322 case Builtin::BI__builtin_verbose_trap: {
4323 llvm::DILocation *TrapLocation = Builder.getCurrentDebugLocation();
4324 if (getDebugInfo()) {
4325 TrapLocation = getDebugInfo()->CreateTrapFailureMessageFor(
4326 TrapLocation, Category: *E->getArg(Arg: 0)->tryEvaluateString(Ctx&: getContext()),
4327 FailureMsg: *E->getArg(Arg: 1)->tryEvaluateString(Ctx&: getContext()));
4328 }
4329 ApplyDebugLocation ApplyTrapDI(*this, TrapLocation);
4330 // Currently no attempt is made to prevent traps from being merged.
4331 EmitTrapCall(IntrID: Intrinsic::trap);
4332 return RValue::get(V: nullptr);
4333 }
4334 case Builtin::BI__debugbreak:
4335 EmitTrapCall(IntrID: Intrinsic::debugtrap);
4336 return RValue::get(V: nullptr);
4337 case Builtin::BI__builtin_unreachable: {
4338 EmitUnreachable(Loc: E->getExprLoc());
4339
4340 // We do need to preserve an insertion point.
4341 EmitBlock(BB: createBasicBlock(name: "unreachable.cont"));
4342
4343 return RValue::get(V: nullptr);
4344 }
4345
4346 case Builtin::BI__builtin_powi:
4347 case Builtin::BI__builtin_powif:
4348 case Builtin::BI__builtin_powil: {
4349 llvm::Value *Src0 = EmitScalarExpr(E: E->getArg(Arg: 0));
4350 llvm::Value *Src1 = EmitScalarExpr(E: E->getArg(Arg: 1));
4351
4352 if (Builder.getIsFPConstrained()) {
4353 // FIXME: llvm.powi has 2 mangling types,
4354 // llvm.experimental.constrained.powi has one.
4355 CodeGenFunction::CGFPOptionsRAII FPOptsRAII(*this, E);
4356 Function *F = CGM.getIntrinsic(IID: Intrinsic::experimental_constrained_powi,
4357 Tys: Src0->getType());
4358 return RValue::get(V: Builder.CreateConstrainedFPCall(Callee: F, Args: { Src0, Src1 }));
4359 }
4360
4361 Function *F = CGM.getIntrinsic(IID: Intrinsic::powi,
4362 Tys: { Src0->getType(), Src1->getType() });
4363 return RValue::get(V: Builder.CreateCall(Callee: F, Args: { Src0, Src1 }));
4364 }
4365 case Builtin::BI__builtin_frexpl: {
4366 // Linux PPC will not be adding additional PPCDoubleDouble support.
4367 // WIP to switch default to IEEE long double. Will emit libcall for
4368 // frexpl instead of legalizing this type in the BE.
4369 if (&getTarget().getLongDoubleFormat() == &llvm::APFloat::PPCDoubleDouble())
4370 break;
4371 [[fallthrough]];
4372 }
4373 case Builtin::BI__builtin_frexp:
4374 case Builtin::BI__builtin_frexpf:
4375 case Builtin::BI__builtin_frexpf128:
4376 case Builtin::BI__builtin_frexpf16:
4377 return RValue::get(V: emitFrexpBuiltin(CGF&: *this, E, IntrinsicID: Intrinsic::frexp));
4378 case Builtin::BImodf:
4379 case Builtin::BImodff:
4380 case Builtin::BImodfl:
4381 case Builtin::BI__builtin_modf:
4382 case Builtin::BI__builtin_modff:
4383 case Builtin::BI__builtin_modfl:
4384 if (Builder.getIsFPConstrained())
4385 break; // TODO: Emit constrained modf intrinsic once one exists.
4386 return RValue::get(V: emitModfBuiltin(CGF&: *this, E, IntrinsicID: Intrinsic::modf));
4387 case Builtin::BI__builtin_isgreater:
4388 case Builtin::BI__builtin_isgreaterequal:
4389 case Builtin::BI__builtin_isless:
4390 case Builtin::BI__builtin_islessequal:
4391 case Builtin::BI__builtin_islessgreater:
4392 case Builtin::BI__builtin_isunordered: {
4393 // Ordered comparisons: we know the arguments to these are matching scalar
4394 // floating point values.
4395 CodeGenFunction::CGFPOptionsRAII FPOptsRAII(*this, E);
4396 Value *LHS = EmitScalarExpr(E: E->getArg(Arg: 0));
4397 Value *RHS = EmitScalarExpr(E: E->getArg(Arg: 1));
4398
4399 switch (BuiltinID) {
4400 default: llvm_unreachable("Unknown ordered comparison");
4401 case Builtin::BI__builtin_isgreater:
4402 LHS = Builder.CreateFCmpOGT(LHS, RHS, Name: "cmp");
4403 break;
4404 case Builtin::BI__builtin_isgreaterequal:
4405 LHS = Builder.CreateFCmpOGE(LHS, RHS, Name: "cmp");
4406 break;
4407 case Builtin::BI__builtin_isless:
4408 LHS = Builder.CreateFCmpOLT(LHS, RHS, Name: "cmp");
4409 break;
4410 case Builtin::BI__builtin_islessequal:
4411 LHS = Builder.CreateFCmpOLE(LHS, RHS, Name: "cmp");
4412 break;
4413 case Builtin::BI__builtin_islessgreater:
4414 LHS = Builder.CreateFCmpONE(LHS, RHS, Name: "cmp");
4415 break;
4416 case Builtin::BI__builtin_isunordered:
4417 LHS = Builder.CreateFCmpUNO(LHS, RHS, Name: "cmp");
4418 break;
4419 }
4420 // ZExt bool to int type.
4421 return RValue::get(V: Builder.CreateZExt(V: LHS, DestTy: ConvertType(T: E->getType())));
4422 }
4423
4424 case Builtin::BI__builtin_isnan: {
4425 CodeGenFunction::CGFPOptionsRAII FPOptsRAII(*this, E);
4426 Value *V = EmitScalarExpr(E: E->getArg(Arg: 0));
4427 if (Value *Result = tryUseTestFPKind(CGF&: *this, BuiltinID, V))
4428 return RValue::get(V: Result);
4429 return RValue::get(
4430 V: Builder.CreateZExt(V: Builder.createIsFPClass(FPNum: V, Test: FPClassTest::fcNan),
4431 DestTy: ConvertType(T: E->getType())));
4432 }
4433
4434 case Builtin::BI__builtin_issignaling: {
4435 CodeGenFunction::CGFPOptionsRAII FPOptsRAII(*this, E);
4436 Value *V = EmitScalarExpr(E: E->getArg(Arg: 0));
4437 return RValue::get(
4438 V: Builder.CreateZExt(V: Builder.createIsFPClass(FPNum: V, Test: FPClassTest::fcSNan),
4439 DestTy: ConvertType(T: E->getType())));
4440 }
4441
4442 case Builtin::BI__builtin_isinf: {
4443 CodeGenFunction::CGFPOptionsRAII FPOptsRAII(*this, E);
4444 Value *V = EmitScalarExpr(E: E->getArg(Arg: 0));
4445 if (Value *Result = tryUseTestFPKind(CGF&: *this, BuiltinID, V))
4446 return RValue::get(V: Result);
4447 return RValue::get(
4448 V: Builder.CreateZExt(V: Builder.createIsFPClass(FPNum: V, Test: FPClassTest::fcInf),
4449 DestTy: ConvertType(T: E->getType())));
4450 }
4451
4452 case Builtin::BIfinite:
4453 case Builtin::BI__finite:
4454 case Builtin::BIfinitef:
4455 case Builtin::BI__finitef:
4456 case Builtin::BIfinitel:
4457 case Builtin::BI__finitel:
4458 case Builtin::BI__builtin_isfinite: {
4459 CodeGenFunction::CGFPOptionsRAII FPOptsRAII(*this, E);
4460 Value *V = EmitScalarExpr(E: E->getArg(Arg: 0));
4461 if (Value *Result = tryUseTestFPKind(CGF&: *this, BuiltinID, V))
4462 return RValue::get(V: Result);
4463 return RValue::get(
4464 V: Builder.CreateZExt(V: Builder.createIsFPClass(FPNum: V, Test: FPClassTest::fcFinite),
4465 DestTy: ConvertType(T: E->getType())));
4466 }
4467
4468 case Builtin::BI__builtin_isnormal: {
4469 CodeGenFunction::CGFPOptionsRAII FPOptsRAII(*this, E);
4470 Value *V = EmitScalarExpr(E: E->getArg(Arg: 0));
4471 return RValue::get(
4472 V: Builder.CreateZExt(V: Builder.createIsFPClass(FPNum: V, Test: FPClassTest::fcNormal),
4473 DestTy: ConvertType(T: E->getType())));
4474 }
4475
4476 case Builtin::BI__builtin_issubnormal: {
4477 CodeGenFunction::CGFPOptionsRAII FPOptsRAII(*this, E);
4478 Value *V = EmitScalarExpr(E: E->getArg(Arg: 0));
4479 return RValue::get(
4480 V: Builder.CreateZExt(V: Builder.createIsFPClass(FPNum: V, Test: FPClassTest::fcSubnormal),
4481 DestTy: ConvertType(T: E->getType())));
4482 }
4483
4484 case Builtin::BI__builtin_iszero: {
4485 CodeGenFunction::CGFPOptionsRAII FPOptsRAII(*this, E);
4486 Value *V = EmitScalarExpr(E: E->getArg(Arg: 0));
4487 return RValue::get(
4488 V: Builder.CreateZExt(V: Builder.createIsFPClass(FPNum: V, Test: FPClassTest::fcZero),
4489 DestTy: ConvertType(T: E->getType())));
4490 }
4491
4492 case Builtin::BI__builtin_isfpclass: {
4493 Expr::EvalResult Result;
4494 if (!E->getArg(Arg: 1)->EvaluateAsInt(Result, Ctx: CGM.getContext()))
4495 break;
4496 uint64_t Test = Result.Val.getInt().getLimitedValue();
4497 CodeGenFunction::CGFPOptionsRAII FPOptsRAII(*this, E);
4498 Value *V = EmitScalarExpr(E: E->getArg(Arg: 0));
4499 return RValue::get(V: Builder.CreateZExt(V: Builder.createIsFPClass(FPNum: V, Test),
4500 DestTy: ConvertType(T: E->getType())));
4501 }
4502
4503 case Builtin::BI__builtin_nondeterministic_value: {
4504 llvm::Type *Ty = ConvertType(T: E->getArg(Arg: 0)->getType());
4505
4506 Value *Result = PoisonValue::get(T: Ty);
4507 Result = Builder.CreateFreeze(V: Result);
4508
4509 return RValue::get(V: Result);
4510 }
4511
4512 case Builtin::BI__builtin_elementwise_abs: {
4513 Value *Result;
4514 QualType QT = E->getArg(Arg: 0)->getType();
4515
4516 if (auto *VecTy = QT->getAs<VectorType>())
4517 QT = VecTy->getElementType();
4518 if (QT->isIntegerType())
4519 Result = Builder.CreateBinaryIntrinsic(
4520 ID: Intrinsic::abs, LHS: EmitScalarExpr(E: E->getArg(Arg: 0)), RHS: Builder.getFalse(),
4521 FMFSource: nullptr, Name: "elt.abs");
4522 else
4523 Result = emitBuiltinWithOneOverloadedType<1>(CGF&: *this, E, IntrinsicID: Intrinsic::fabs,
4524 Name: "elt.abs");
4525
4526 return RValue::get(V: Result);
4527 }
4528 case Builtin::BI__builtin_elementwise_bitreverse:
4529 return RValue::get(V: emitBuiltinWithOneOverloadedType<1>(
4530 CGF&: *this, E, IntrinsicID: Intrinsic::bitreverse, Name: "elt.bitreverse"));
4531 case Builtin::BI__builtin_elementwise_popcount:
4532 return RValue::get(V: emitBuiltinWithOneOverloadedType<1>(
4533 CGF&: *this, E, IntrinsicID: Intrinsic::ctpop, Name: "elt.ctpop"));
4534 case Builtin::BI__builtin_elementwise_canonicalize:
4535 return RValue::get(V: emitBuiltinWithOneOverloadedType<1>(
4536 CGF&: *this, E, IntrinsicID: Intrinsic::canonicalize, Name: "elt.canonicalize"));
4537 case Builtin::BI__builtin_elementwise_copysign:
4538 return RValue::get(
4539 V: emitBuiltinWithOneOverloadedType<2>(CGF&: *this, E, IntrinsicID: Intrinsic::copysign));
4540 case Builtin::BI__builtin_elementwise_fshl:
4541 return RValue::get(
4542 V: emitBuiltinWithOneOverloadedType<3>(CGF&: *this, E, IntrinsicID: Intrinsic::fshl));
4543 case Builtin::BI__builtin_elementwise_fshr:
4544 return RValue::get(
4545 V: emitBuiltinWithOneOverloadedType<3>(CGF&: *this, E, IntrinsicID: Intrinsic::fshr));
4546 case Builtin::BI__builtin_elementwise_clmul:
4547 return RValue::get(
4548 V: emitBuiltinWithOneOverloadedType<2>(CGF&: *this, E, IntrinsicID: Intrinsic::clmul));
4549 case Builtin::BI__builtin_elementwise_pext:
4550 return RValue::get(
4551 V: emitBuiltinWithOneOverloadedType<2>(CGF&: *this, E, IntrinsicID: Intrinsic::pext));
4552 case Builtin::BI__builtin_elementwise_pdep:
4553 return RValue::get(
4554 V: emitBuiltinWithOneOverloadedType<2>(CGF&: *this, E, IntrinsicID: Intrinsic::pdep));
4555
4556 case Builtin::BI__builtin_elementwise_add_sat:
4557 case Builtin::BI__builtin_elementwise_sub_sat: {
4558 Value *Op0 = EmitScalarExpr(E: E->getArg(Arg: 0));
4559 Value *Op1 = EmitScalarExpr(E: E->getArg(Arg: 1));
4560 Value *Result;
4561 assert(Op0->getType()->isIntOrIntVectorTy() && "integer type expected");
4562 QualType Ty = E->getArg(Arg: 0)->getType();
4563 if (auto *VecTy = Ty->getAs<VectorType>())
4564 Ty = VecTy->getElementType();
4565 bool IsSigned = Ty->isSignedIntegerType();
4566 unsigned Opc;
4567 if (BuiltinIDIfNoAsmLabel == Builtin::BI__builtin_elementwise_add_sat)
4568 Opc = IsSigned ? Intrinsic::sadd_sat : Intrinsic::uadd_sat;
4569 else
4570 Opc = IsSigned ? Intrinsic::ssub_sat : Intrinsic::usub_sat;
4571 Result = Builder.CreateBinaryIntrinsic(ID: Opc, LHS: Op0, RHS: Op1, FMFSource: nullptr, Name: "elt.sat");
4572 return RValue::get(V: Result);
4573 }
4574
4575 case Builtin::BI__builtin_elementwise_max: {
4576 Value *Op0 = EmitScalarExpr(E: E->getArg(Arg: 0));
4577 Value *Op1 = EmitScalarExpr(E: E->getArg(Arg: 1));
4578 Value *Result;
4579 if (Op0->getType()->isIntOrIntVectorTy()) {
4580 QualType Ty = E->getArg(Arg: 0)->getType();
4581 if (auto *VecTy = Ty->getAs<VectorType>())
4582 Ty = VecTy->getElementType();
4583 Result = Builder.CreateBinaryIntrinsic(
4584 ID: Ty->isSignedIntegerType() ? Intrinsic::smax : Intrinsic::umax, LHS: Op0,
4585 RHS: Op1, FMFSource: nullptr, Name: "elt.max");
4586 } else
4587 Result = Builder.CreateMaxNum(LHS: Op0, RHS: Op1, /*FMFSource=*/nullptr, Name: "elt.max");
4588 return RValue::get(V: Result);
4589 }
4590 case Builtin::BI__builtin_elementwise_min: {
4591 Value *Op0 = EmitScalarExpr(E: E->getArg(Arg: 0));
4592 Value *Op1 = EmitScalarExpr(E: E->getArg(Arg: 1));
4593 Value *Result;
4594 if (Op0->getType()->isIntOrIntVectorTy()) {
4595 QualType Ty = E->getArg(Arg: 0)->getType();
4596 if (auto *VecTy = Ty->getAs<VectorType>())
4597 Ty = VecTy->getElementType();
4598 Result = Builder.CreateBinaryIntrinsic(
4599 ID: Ty->isSignedIntegerType() ? Intrinsic::smin : Intrinsic::umin, LHS: Op0,
4600 RHS: Op1, FMFSource: nullptr, Name: "elt.min");
4601 } else
4602 Result = Builder.CreateMinNum(LHS: Op0, RHS: Op1, /*FMFSource=*/nullptr, Name: "elt.min");
4603 return RValue::get(V: Result);
4604 }
4605
4606 case Builtin::BI__builtin_elementwise_maxnum: {
4607 Value *Op0 = EmitScalarExpr(E: E->getArg(Arg: 0));
4608 Value *Op1 = EmitScalarExpr(E: E->getArg(Arg: 1));
4609 Value *Result = Builder.CreateBinaryIntrinsic(ID: llvm::Intrinsic::maxnum, LHS: Op0,
4610 RHS: Op1, FMFSource: nullptr, Name: "elt.maxnum");
4611 return RValue::get(V: Result);
4612 }
4613
4614 case Builtin::BI__builtin_elementwise_minnum: {
4615 Value *Op0 = EmitScalarExpr(E: E->getArg(Arg: 0));
4616 Value *Op1 = EmitScalarExpr(E: E->getArg(Arg: 1));
4617 Value *Result = Builder.CreateBinaryIntrinsic(ID: llvm::Intrinsic::minnum, LHS: Op0,
4618 RHS: Op1, FMFSource: nullptr, Name: "elt.minnum");
4619 return RValue::get(V: Result);
4620 }
4621
4622 case Builtin::BI__builtin_elementwise_maximum: {
4623 Value *Op0 = EmitScalarExpr(E: E->getArg(Arg: 0));
4624 Value *Op1 = EmitScalarExpr(E: E->getArg(Arg: 1));
4625 Value *Result = Builder.CreateBinaryIntrinsic(ID: Intrinsic::maximum, LHS: Op0, RHS: Op1,
4626 FMFSource: nullptr, Name: "elt.maximum");
4627 return RValue::get(V: Result);
4628 }
4629
4630 case Builtin::BI__builtin_elementwise_minimum: {
4631 Value *Op0 = EmitScalarExpr(E: E->getArg(Arg: 0));
4632 Value *Op1 = EmitScalarExpr(E: E->getArg(Arg: 1));
4633 Value *Result = Builder.CreateBinaryIntrinsic(ID: Intrinsic::minimum, LHS: Op0, RHS: Op1,
4634 FMFSource: nullptr, Name: "elt.minimum");
4635 return RValue::get(V: Result);
4636 }
4637
4638 case Builtin::BI__builtin_elementwise_maximumnum: {
4639 Value *Op0 = EmitScalarExpr(E: E->getArg(Arg: 0));
4640 Value *Op1 = EmitScalarExpr(E: E->getArg(Arg: 1));
4641 Value *Result = Builder.CreateBinaryIntrinsic(
4642 ID: Intrinsic::maximumnum, LHS: Op0, RHS: Op1, FMFSource: nullptr, Name: "elt.maximumnum");
4643 return RValue::get(V: Result);
4644 }
4645
4646 case Builtin::BI__builtin_elementwise_minimumnum: {
4647 Value *Op0 = EmitScalarExpr(E: E->getArg(Arg: 0));
4648 Value *Op1 = EmitScalarExpr(E: E->getArg(Arg: 1));
4649 Value *Result = Builder.CreateBinaryIntrinsic(
4650 ID: Intrinsic::minimumnum, LHS: Op0, RHS: Op1, FMFSource: nullptr, Name: "elt.minimumnum");
4651 return RValue::get(V: Result);
4652 }
4653
4654 case Builtin::BI__builtin_reduce_max: {
4655 auto GetIntrinsicID = [this](QualType QT) {
4656 if (auto *VecTy = QT->getAs<VectorType>())
4657 QT = VecTy->getElementType();
4658 else if (QT->isSizelessVectorType())
4659 QT = QT->getSizelessVectorEltType(Ctx: CGM.getContext());
4660
4661 if (QT->isSignedIntegerType())
4662 return Intrinsic::vector_reduce_smax;
4663 if (QT->isUnsignedIntegerType())
4664 return Intrinsic::vector_reduce_umax;
4665 assert(QT->isFloatingType() && "must have a float here");
4666 return Intrinsic::vector_reduce_fmax;
4667 };
4668 return RValue::get(V: emitBuiltinWithOneOverloadedType<1>(
4669 CGF&: *this, E, IntrinsicID: GetIntrinsicID(E->getArg(Arg: 0)->getType()), Name: "rdx.min"));
4670 }
4671
4672 case Builtin::BI__builtin_reduce_min: {
4673 auto GetIntrinsicID = [this](QualType QT) {
4674 if (auto *VecTy = QT->getAs<VectorType>())
4675 QT = VecTy->getElementType();
4676 else if (QT->isSizelessVectorType())
4677 QT = QT->getSizelessVectorEltType(Ctx: CGM.getContext());
4678
4679 if (QT->isSignedIntegerType())
4680 return Intrinsic::vector_reduce_smin;
4681 if (QT->isUnsignedIntegerType())
4682 return Intrinsic::vector_reduce_umin;
4683 assert(QT->isFloatingType() && "must have a float here");
4684 return Intrinsic::vector_reduce_fmin;
4685 };
4686
4687 return RValue::get(V: emitBuiltinWithOneOverloadedType<1>(
4688 CGF&: *this, E, IntrinsicID: GetIntrinsicID(E->getArg(Arg: 0)->getType()), Name: "rdx.min"));
4689 }
4690
4691 case Builtin::BI__builtin_reduce_add:
4692 return RValue::get(V: emitBuiltinWithOneOverloadedType<1>(
4693 CGF&: *this, E, IntrinsicID: Intrinsic::vector_reduce_add, Name: "rdx.add"));
4694 case Builtin::BI__builtin_reduce_mul:
4695 return RValue::get(V: emitBuiltinWithOneOverloadedType<1>(
4696 CGF&: *this, E, IntrinsicID: Intrinsic::vector_reduce_mul, Name: "rdx.mul"));
4697 case Builtin::BI__builtin_reduce_xor:
4698 return RValue::get(V: emitBuiltinWithOneOverloadedType<1>(
4699 CGF&: *this, E, IntrinsicID: Intrinsic::vector_reduce_xor, Name: "rdx.xor"));
4700 case Builtin::BI__builtin_reduce_or:
4701 return RValue::get(V: emitBuiltinWithOneOverloadedType<1>(
4702 CGF&: *this, E, IntrinsicID: Intrinsic::vector_reduce_or, Name: "rdx.or"));
4703 case Builtin::BI__builtin_reduce_and:
4704 return RValue::get(V: emitBuiltinWithOneOverloadedType<1>(
4705 CGF&: *this, E, IntrinsicID: Intrinsic::vector_reduce_and, Name: "rdx.and"));
4706 case Builtin::BI__builtin_reduce_maximum:
4707 return RValue::get(V: emitBuiltinWithOneOverloadedType<1>(
4708 CGF&: *this, E, IntrinsicID: Intrinsic::vector_reduce_fmaximum, Name: "rdx.maximum"));
4709 case Builtin::BI__builtin_reduce_minimum:
4710 return RValue::get(V: emitBuiltinWithOneOverloadedType<1>(
4711 CGF&: *this, E, IntrinsicID: Intrinsic::vector_reduce_fminimum, Name: "rdx.minimum"));
4712 case Builtin::BI__builtin_reduce_assoc_fadd:
4713 case Builtin::BI__builtin_reduce_in_order_fadd: {
4714 llvm::Value *Vector = EmitScalarExpr(E: E->getArg(Arg: 0));
4715 llvm::Type *ScalarTy = Vector->getType()->getScalarType();
4716 llvm::Value *StartValue = nullptr;
4717 if (E->getNumArgs() == 2)
4718 StartValue = Builder.CreateFPCast(V: EmitScalarExpr(E: E->getArg(Arg: 1)), DestTy: ScalarTy);
4719 llvm::Value *Args[] = {/*start_value=*/StartValue
4720 ? StartValue
4721 : llvm::ConstantFP::get(Ty: ScalarTy, V: -0.0F),
4722 /*vector=*/Vector};
4723 llvm::Function *F =
4724 CGM.getIntrinsic(IID: Intrinsic::vector_reduce_fadd, Tys: Vector->getType());
4725 llvm::CallBase *Reduce = Builder.CreateCall(Callee: F, Args, Name: "rdx.addf");
4726 if (BuiltinIDIfNoAsmLabel == Builtin::BI__builtin_reduce_assoc_fadd) {
4727 // `__builtin_reduce_assoc_fadd` is an associative reduction which
4728 // requires the reassoc FMF flag.
4729 llvm::FastMathFlags FMF;
4730 FMF.setAllowReassoc();
4731 cast<llvm::CallBase>(Val: Reduce)->setFastMathFlags(FMF);
4732 }
4733 return RValue::get(V: Reduce);
4734 }
4735
4736 case Builtin::BI__builtin_matrix_transpose: {
4737 auto *MatrixTy = E->getArg(Arg: 0)->getType()->castAs<ConstantMatrixType>();
4738 Value *MatValue = EmitScalarExpr(E: E->getArg(Arg: 0));
4739 MatrixBuilder MB(Builder);
4740 Value *Result = MB.CreateMatrixTranspose(Matrix: MatValue, Rows: MatrixTy->getNumRows(),
4741 Columns: MatrixTy->getNumColumns());
4742 return RValue::get(V: Result);
4743 }
4744
4745 case Builtin::BI__builtin_matrix_column_major_load: {
4746 MatrixBuilder MB(Builder);
4747 // Emit everything that isn't dependent on the first parameter type
4748 Value *Stride = EmitScalarExpr(E: E->getArg(Arg: 3));
4749 const auto *ResultTy = E->getType()->getAs<ConstantMatrixType>();
4750 auto *PtrTy = E->getArg(Arg: 0)->getType()->getAs<PointerType>();
4751 assert(PtrTy && "arg0 must be of pointer type");
4752 bool IsVolatile = PtrTy->getPointeeType().isVolatileQualified();
4753
4754 Address Src = EmitPointerWithAlignment(Addr: E->getArg(Arg: 0));
4755 EmitNonNullArgCheck(RV: RValue::get(V: Src.emitRawPointer(CGF&: *this)),
4756 ArgType: E->getArg(Arg: 0)->getType(), ArgLoc: E->getArg(Arg: 0)->getExprLoc(), AC: FD,
4757 ParmNum: 0);
4758 Value *Result = MB.CreateColumnMajorLoad(
4759 EltTy: Src.getElementType(), DataPtr: Src.emitRawPointer(CGF&: *this),
4760 Alignment: Align(Src.getAlignment().getQuantity()), Stride, IsVolatile,
4761 Rows: ResultTy->getNumRows(), Columns: ResultTy->getNumColumns(), Name: "matrix");
4762 return RValue::get(V: Result);
4763 }
4764
4765 case Builtin::BI__builtin_matrix_column_major_store: {
4766 MatrixBuilder MB(Builder);
4767 Value *Matrix = EmitScalarExpr(E: E->getArg(Arg: 0));
4768 Address Dst = EmitPointerWithAlignment(Addr: E->getArg(Arg: 1));
4769 Value *Stride = EmitScalarExpr(E: E->getArg(Arg: 2));
4770
4771 const auto *MatrixTy = E->getArg(Arg: 0)->getType()->getAs<ConstantMatrixType>();
4772 auto *PtrTy = E->getArg(Arg: 1)->getType()->getAs<PointerType>();
4773 assert(PtrTy && "arg1 must be of pointer type");
4774 bool IsVolatile = PtrTy->getPointeeType().isVolatileQualified();
4775
4776 EmitNonNullArgCheck(RV: RValue::get(V: Dst.emitRawPointer(CGF&: *this)),
4777 ArgType: E->getArg(Arg: 1)->getType(), ArgLoc: E->getArg(Arg: 1)->getExprLoc(), AC: FD,
4778 ParmNum: 0);
4779 Value *Result = MB.CreateColumnMajorStore(
4780 Matrix, Ptr: Dst.emitRawPointer(CGF&: *this),
4781 Alignment: Align(Dst.getAlignment().getQuantity()), Stride, IsVolatile,
4782 Rows: MatrixTy->getNumRows(), Columns: MatrixTy->getNumColumns());
4783 addInstToNewSourceAtom(KeyInstruction: cast<Instruction>(Val: Result), Backup: Matrix);
4784 return RValue::get(V: Result);
4785 }
4786
4787 case Builtin::BI__builtin_masked_load:
4788 case Builtin::BI__builtin_masked_expand_load: {
4789 llvm::Value *Mask = EmitScalarExpr(E: E->getArg(Arg: 0));
4790 llvm::Value *Ptr = EmitScalarExpr(E: E->getArg(Arg: 1));
4791
4792 llvm::Type *RetTy = CGM.getTypes().ConvertType(T: E->getType());
4793 llvm::Value *PassThru = llvm::PoisonValue::get(T: RetTy);
4794 if (E->getNumArgs() > 2)
4795 PassThru = EmitScalarExpr(E: E->getArg(Arg: 2));
4796
4797 CharUnits Align = CGM.getNaturalTypeAlignment(
4798 T: E->getType()->getAs<VectorType>()->getElementType(), BaseInfo: nullptr);
4799
4800 llvm::Value *Result;
4801 if (BuiltinID == Builtin::BI__builtin_masked_load)
4802 Result = Builder.CreateMaskedLoad(Ty: RetTy, Ptr, Alignment: Align.getAsAlign(), Mask,
4803 PassThru, Name: "masked_load");
4804 else
4805 Result = Builder.CreateMaskedExpandLoad(Ty: RetTy, Ptr, Align: MaybeAlign(), Mask,
4806 PassThru, Name: "masked_expand_load");
4807
4808 return RValue::get(V: Result);
4809 };
4810 case Builtin::BI__builtin_masked_gather: {
4811 llvm::Value *Mask = EmitScalarExpr(E: E->getArg(Arg: 0));
4812 llvm::Value *Idx = EmitScalarExpr(E: E->getArg(Arg: 1));
4813 llvm::Value *Ptr = EmitScalarExpr(E: E->getArg(Arg: 2));
4814
4815 llvm::Type *RetTy = CGM.getTypes().ConvertType(T: E->getType());
4816 CharUnits Align = CGM.getNaturalTypeAlignment(
4817 T: E->getType()->getAs<VectorType>()->getElementType(), BaseInfo: nullptr);
4818
4819 llvm::Value *PassThru = llvm::PoisonValue::get(T: RetTy);
4820 if (E->getNumArgs() > 3)
4821 PassThru = EmitScalarExpr(E: E->getArg(Arg: 3));
4822
4823 llvm::Type *ElemTy = CGM.getTypes().ConvertType(
4824 T: E->getType()->getAs<VectorType>()->getElementType());
4825 llvm::Value *PtrVec = Builder.CreateGEP(Ty: ElemTy, Ptr, IdxList: Idx);
4826
4827 llvm::Value *Result = Builder.CreateMaskedGather(
4828 Ty: RetTy, Ptrs: PtrVec, Alignment: Align.getAsAlign(), Mask, PassThru, Name: "masked_gather");
4829 return RValue::get(V: Result);
4830 }
4831 case Builtin::BI__builtin_masked_store:
4832 case Builtin::BI__builtin_masked_compress_store: {
4833 llvm::Value *Mask = EmitScalarExpr(E: E->getArg(Arg: 0));
4834 llvm::Value *Val = EmitScalarExpr(E: E->getArg(Arg: 1));
4835 llvm::Value *Ptr = EmitScalarExpr(E: E->getArg(Arg: 2));
4836
4837 CharUnits Align = CGM.getNaturalTypeAlignment(
4838 T: E->getArg(Arg: 1)->getType()->getAs<VectorType>()->getElementType(),
4839 BaseInfo: nullptr);
4840
4841 if (BuiltinID == Builtin::BI__builtin_masked_store)
4842 Builder.CreateMaskedStore(Val, Ptr, Alignment: Align.getAsAlign(), Mask);
4843 else
4844 Builder.CreateMaskedCompressStore(Val, Ptr, Align: MaybeAlign(), Mask);
4845
4846 return RValue::get(V: nullptr);
4847 }
4848 case Builtin::BI__builtin_masked_scatter: {
4849 llvm::Value *Mask = EmitScalarExpr(E: E->getArg(Arg: 0));
4850 llvm::Value *Idx = EmitScalarExpr(E: E->getArg(Arg: 1));
4851 llvm::Value *Val = EmitScalarExpr(E: E->getArg(Arg: 2));
4852 llvm::Value *Ptr = EmitScalarExpr(E: E->getArg(Arg: 3));
4853
4854 CharUnits Align = CGM.getNaturalTypeAlignment(
4855 T: E->getArg(Arg: 2)->getType()->getAs<VectorType>()->getElementType(),
4856 BaseInfo: nullptr);
4857
4858 llvm::Type *ElemTy = CGM.getTypes().ConvertType(
4859 T: E->getArg(Arg: 1)->getType()->getAs<VectorType>()->getElementType());
4860 llvm::Value *PtrVec = Builder.CreateGEP(Ty: ElemTy, Ptr, IdxList: Idx);
4861
4862 Builder.CreateMaskedScatter(Val, Ptrs: PtrVec, Alignment: Align.getAsAlign(), Mask);
4863 return RValue();
4864 }
4865 case Builtin::BI__builtin_isinf_sign: {
4866 // isinf_sign(x) -> fabs(x) == infinity ? (signbit(x) ? -1 : 1) : 0
4867 CodeGenFunction::CGFPOptionsRAII FPOptsRAII(*this, E);
4868 // FIXME: for strictfp/IEEE-754 we need to not trap on SNaN here.
4869 Value *Arg = EmitScalarExpr(E: E->getArg(Arg: 0));
4870 Value *AbsArg = EmitFAbs(CGF&: *this, V: Arg);
4871 Value *IsInf = Builder.CreateFCmpOEQ(
4872 LHS: AbsArg, RHS: ConstantFP::getInfinity(Ty: Arg->getType()), Name: "isinf");
4873 Value *IsNeg = EmitSignBit(CGF&: *this, V: Arg);
4874
4875 llvm::Type *IntTy = ConvertType(T: E->getType());
4876 Value *Zero = Constant::getNullValue(Ty: IntTy);
4877 Value *One = ConstantInt::get(Ty: IntTy, V: 1);
4878 Value *NegativeOne = ConstantInt::getAllOnesValue(Ty: IntTy);
4879 Value *SignResult = Builder.CreateSelect(C: IsNeg, True: NegativeOne, False: One);
4880 Value *Result = Builder.CreateSelect(C: IsInf, True: SignResult, False: Zero);
4881 return RValue::get(V: Result);
4882 }
4883
4884 case Builtin::BI__builtin_flt_rounds: {
4885 Function *F = CGM.getIntrinsic(IID: Intrinsic::get_rounding);
4886
4887 llvm::Type *ResultType = ConvertType(T: E->getType());
4888 Value *Result = Builder.CreateCall(Callee: F);
4889 if (Result->getType() != ResultType)
4890 Result = Builder.CreateIntCast(V: Result, DestTy: ResultType, /*isSigned*/true,
4891 Name: "cast");
4892 return RValue::get(V: Result);
4893 }
4894
4895 case Builtin::BI__builtin_set_flt_rounds: {
4896 Function *F = CGM.getIntrinsic(IID: Intrinsic::set_rounding);
4897
4898 Value *V = EmitScalarExpr(E: E->getArg(Arg: 0));
4899 Builder.CreateCall(Callee: F, Args: V);
4900 return RValue::get(V: nullptr);
4901 }
4902
4903 case Builtin::BI__builtin_fpclassify: {
4904 CodeGenFunction::CGFPOptionsRAII FPOptsRAII(*this, E);
4905 // FIXME: for strictfp/IEEE-754 we need to not trap on SNaN here.
4906 Value *V = EmitScalarExpr(E: E->getArg(Arg: 5));
4907 llvm::Type *Ty = ConvertType(T: E->getArg(Arg: 5)->getType());
4908
4909 // Create Result
4910 BasicBlock *Begin = Builder.GetInsertBlock();
4911 BasicBlock *End = createBasicBlock(name: "fpclassify_end", parent: this->CurFn);
4912 Builder.SetInsertPoint(End);
4913 PHINode *Result =
4914 Builder.CreatePHI(Ty: ConvertType(T: E->getArg(Arg: 0)->getType()), NumReservedValues: 4,
4915 Name: "fpclassify_result");
4916
4917 // if (V==0) return FP_ZERO
4918 Builder.SetInsertPoint(Begin);
4919 Value *IsZero = Builder.CreateFCmpOEQ(LHS: V, RHS: Constant::getNullValue(Ty),
4920 Name: "iszero");
4921 Value *ZeroLiteral = EmitScalarExpr(E: E->getArg(Arg: 4));
4922 BasicBlock *NotZero = createBasicBlock(name: "fpclassify_not_zero", parent: this->CurFn);
4923 Builder.CreateCondBr(Cond: IsZero, True: End, False: NotZero);
4924 Result->addIncoming(V: ZeroLiteral, BB: Begin);
4925
4926 // if (V != V) return FP_NAN
4927 Builder.SetInsertPoint(NotZero);
4928 Value *IsNan = Builder.CreateFCmpUNO(LHS: V, RHS: V, Name: "cmp");
4929 Value *NanLiteral = EmitScalarExpr(E: E->getArg(Arg: 0));
4930 BasicBlock *NotNan = createBasicBlock(name: "fpclassify_not_nan", parent: this->CurFn);
4931 Builder.CreateCondBr(Cond: IsNan, True: End, False: NotNan);
4932 Result->addIncoming(V: NanLiteral, BB: NotZero);
4933
4934 // if (fabs(V) == infinity) return FP_INFINITY
4935 Builder.SetInsertPoint(NotNan);
4936 Value *VAbs = EmitFAbs(CGF&: *this, V);
4937 Value *IsInf =
4938 Builder.CreateFCmpOEQ(LHS: VAbs, RHS: ConstantFP::getInfinity(Ty: V->getType()),
4939 Name: "isinf");
4940 Value *InfLiteral = EmitScalarExpr(E: E->getArg(Arg: 1));
4941 BasicBlock *NotInf = createBasicBlock(name: "fpclassify_not_inf", parent: this->CurFn);
4942 Builder.CreateCondBr(Cond: IsInf, True: End, False: NotInf);
4943 Result->addIncoming(V: InfLiteral, BB: NotNan);
4944
4945 // if (fabs(V) >= MIN_NORMAL) return FP_NORMAL else FP_SUBNORMAL
4946 Builder.SetInsertPoint(NotInf);
4947 APFloat Smallest = APFloat::getSmallestNormalized(
4948 Sem: getContext().getFloatTypeSemantics(T: E->getArg(Arg: 5)->getType()));
4949 Value *IsNormal =
4950 Builder.CreateFCmpUGE(LHS: VAbs, RHS: ConstantFP::get(Context&: V->getContext(), V: Smallest),
4951 Name: "isnormal");
4952 Value *NormalResult =
4953 Builder.CreateSelect(C: IsNormal, True: EmitScalarExpr(E: E->getArg(Arg: 2)),
4954 False: EmitScalarExpr(E: E->getArg(Arg: 3)));
4955 Builder.CreateBr(Dest: End);
4956 Result->addIncoming(V: NormalResult, BB: NotInf);
4957
4958 // return Result
4959 Builder.SetInsertPoint(End);
4960 return RValue::get(V: Result);
4961 }
4962
4963 // An alloca will always return a pointer to the alloca (stack) address
4964 // space. This address space need not be the same as the AST / Language
4965 // default (e.g. in C / C++ auto vars are in the generic address space). At
4966 // the AST level this is handled within CreateTempAlloca et al., but for the
4967 // builtin / dynamic alloca we have to handle it here. We use an explicit cast
4968 // instead of passing an AS to CreateAlloca so as to not inhibit optimisation.
4969 case Builtin::BIalloca:
4970 case Builtin::BI_alloca:
4971 case Builtin::BI__builtin_alloca_uninitialized:
4972 case Builtin::BI__builtin_alloca: {
4973 Value *Size = EmitScalarExpr(E: E->getArg(Arg: 0));
4974 const TargetInfo &TI = getContext().getTargetInfo();
4975 // The alignment of the alloca should correspond to __BIGGEST_ALIGNMENT__.
4976 const Align SuitableAlignmentInBytes =
4977 CGM.getContext()
4978 .toCharUnitsFromBits(BitSize: TI.getSuitableAlign())
4979 .getAsAlign();
4980 AllocaInst *AI = Builder.CreateAlloca(Ty: Builder.getInt8Ty(), ArraySize: Size);
4981 AI->setAlignment(SuitableAlignmentInBytes);
4982 if (BuiltinID != Builtin::BI__builtin_alloca_uninitialized)
4983 initializeAlloca(CGF&: *this, AI, Size, AlignmentInBytes: SuitableAlignmentInBytes);
4984 if (AI->getAddressSpace() !=
4985 CGM.getContext().getTargetAddressSpace(
4986 AS: E->getType()->getPointeeType().getAddressSpace())) {
4987 llvm::Type *Ty = CGM.getTypes().ConvertType(T: E->getType());
4988 return RValue::get(V: performAddrSpaceCast(Src: AI, DestTy: Ty));
4989 }
4990 return RValue::get(V: AI);
4991 }
4992
4993 case Builtin::BI__builtin_alloca_with_align_uninitialized:
4994 case Builtin::BI__builtin_alloca_with_align: {
4995 Value *Size = EmitScalarExpr(E: E->getArg(Arg: 0));
4996 Value *AlignmentInBitsValue = EmitScalarExpr(E: E->getArg(Arg: 1));
4997 auto *AlignmentInBitsCI = cast<ConstantInt>(Val: AlignmentInBitsValue);
4998 unsigned AlignmentInBits = AlignmentInBitsCI->getZExtValue();
4999 const Align AlignmentInBytes =
5000 CGM.getContext().toCharUnitsFromBits(BitSize: AlignmentInBits).getAsAlign();
5001 AllocaInst *AI = Builder.CreateAlloca(Ty: Builder.getInt8Ty(), ArraySize: Size);
5002 AI->setAlignment(AlignmentInBytes);
5003 if (BuiltinID != Builtin::BI__builtin_alloca_with_align_uninitialized)
5004 initializeAlloca(CGF&: *this, AI, Size, AlignmentInBytes);
5005 if (AI->getAddressSpace() !=
5006 CGM.getContext().getTargetAddressSpace(
5007 AS: E->getType()->getPointeeType().getAddressSpace())) {
5008 llvm::Type *Ty = CGM.getTypes().ConvertType(T: E->getType());
5009 return RValue::get(V: performAddrSpaceCast(Src: AI, DestTy: Ty));
5010 }
5011 return RValue::get(V: AI);
5012 }
5013
5014 case Builtin::BI__builtin_infer_alloc_token: {
5015 llvm::MDNode *MDN = buildAllocToken(E);
5016 llvm::Value *MDV = MetadataAsValue::get(Context&: getLLVMContext(), MD: MDN);
5017 llvm::Function *F =
5018 CGM.getIntrinsic(IID: llvm::Intrinsic::alloc_token_id, Tys: {IntPtrTy});
5019 llvm::CallBase *TokenID = Builder.CreateCall(Callee: F, Args: MDV);
5020 return RValue::get(V: TokenID);
5021 }
5022
5023 case Builtin::BIbzero:
5024 case Builtin::BI__builtin_bzero: {
5025 Address Dest = EmitPointerWithAlignment(Addr: E->getArg(Arg: 0));
5026 Value *SizeVal = EmitScalarExpr(E: E->getArg(Arg: 1));
5027 EmitNonNullArgCheck(Addr: Dest, ArgType: E->getArg(Arg: 0)->getType(),
5028 ArgLoc: E->getArg(Arg: 0)->getExprLoc(), AC: FD, ParmNum: 0);
5029 auto *I = Builder.CreateMemSet(Dest, Value: Builder.getInt8(C: 0), Size: SizeVal, IsVolatile: false);
5030 addInstToNewSourceAtom(KeyInstruction: I, Backup: nullptr);
5031 return RValue::get(V: nullptr);
5032 }
5033
5034 case Builtin::BIbcopy:
5035 case Builtin::BI__builtin_bcopy: {
5036 Address Src = EmitPointerWithAlignment(Addr: E->getArg(Arg: 0));
5037 Address Dest = EmitPointerWithAlignment(Addr: E->getArg(Arg: 1));
5038 Value *SizeVal = EmitScalarExpr(E: E->getArg(Arg: 2));
5039 EmitNonNullArgCheck(RV: RValue::get(V: Src.emitRawPointer(CGF&: *this)),
5040 ArgType: E->getArg(Arg: 0)->getType(), ArgLoc: E->getArg(Arg: 0)->getExprLoc(), AC: FD,
5041 ParmNum: 0);
5042 EmitNonNullArgCheck(RV: RValue::get(V: Dest.emitRawPointer(CGF&: *this)),
5043 ArgType: E->getArg(Arg: 1)->getType(), ArgLoc: E->getArg(Arg: 1)->getExprLoc(), AC: FD,
5044 ParmNum: 0);
5045 auto *I = Builder.CreateMemMove(Dest, Src, Size: SizeVal, IsVolatile: false);
5046 addInstToNewSourceAtom(KeyInstruction: I, Backup: nullptr);
5047 return RValue::get(V: nullptr);
5048 }
5049
5050 case Builtin::BImemcpy:
5051 case Builtin::BI__builtin_memcpy:
5052 case Builtin::BImempcpy:
5053 case Builtin::BI__builtin_mempcpy: {
5054 Address Dest = EmitPointerWithAlignment(Addr: E->getArg(Arg: 0));
5055 Address Src = EmitPointerWithAlignment(Addr: E->getArg(Arg: 1));
5056 Value *SizeVal = EmitScalarExpr(E: E->getArg(Arg: 2));
5057 EmitArgCheck(TCK_Store, Dest, E->getArg(Arg: 0), 0);
5058 EmitArgCheck(TCK_Load, Src, E->getArg(Arg: 1), 1);
5059 auto *I = Builder.CreateMemCpy(Dest, Src, Size: SizeVal, IsVolatile: false);
5060 addInstToNewSourceAtom(KeyInstruction: I, Backup: nullptr);
5061 if (BuiltinID == Builtin::BImempcpy ||
5062 BuiltinID == Builtin::BI__builtin_mempcpy)
5063 return RValue::get(V: Builder.CreateInBoundsGEP(
5064 Ty: Dest.getElementType(), Ptr: Dest.emitRawPointer(CGF&: *this), IdxList: SizeVal));
5065 else
5066 return RValue::get(Addr: Dest, CGF&: *this);
5067 }
5068
5069 case Builtin::BI__builtin_memcpy_inline: {
5070 Address Dest = EmitPointerWithAlignment(Addr: E->getArg(Arg: 0));
5071 Address Src = EmitPointerWithAlignment(Addr: E->getArg(Arg: 1));
5072 uint64_t Size =
5073 E->getArg(Arg: 2)->EvaluateKnownConstInt(Ctx: getContext()).getZExtValue();
5074 EmitArgCheck(TCK_Store, Dest, E->getArg(Arg: 0), 0);
5075 EmitArgCheck(TCK_Load, Src, E->getArg(Arg: 1), 1);
5076 auto *I = Builder.CreateMemCpyInline(Dest, Src, Size);
5077 addInstToNewSourceAtom(KeyInstruction: I, Backup: nullptr);
5078 return RValue::get(V: nullptr);
5079 }
5080
5081 case Builtin::BI__builtin_char_memchr:
5082 BuiltinID = Builtin::BI__builtin_memchr;
5083 break;
5084
5085 case Builtin::BI__builtin___memcpy_chk: {
5086 // fold __builtin_memcpy_chk(x, y, cst1, cst2) to memcpy iff cst1<=cst2.
5087 Expr::EvalResult SizeResult, DstSizeResult;
5088 if (!E->getArg(Arg: 2)->EvaluateAsInt(Result&: SizeResult, Ctx: CGM.getContext()) ||
5089 !E->getArg(Arg: 3)->EvaluateAsInt(Result&: DstSizeResult, Ctx: CGM.getContext()))
5090 break;
5091 llvm::APSInt Size = SizeResult.Val.getInt();
5092 llvm::APSInt DstSize = DstSizeResult.Val.getInt();
5093 if (Size.ugt(RHS: DstSize))
5094 break;
5095 Address Dest = EmitPointerWithAlignment(Addr: E->getArg(Arg: 0));
5096 Address Src = EmitPointerWithAlignment(Addr: E->getArg(Arg: 1));
5097 Value *SizeVal = llvm::ConstantInt::get(Context&: Builder.getContext(), V: Size);
5098 auto *I = Builder.CreateMemCpy(Dest, Src, Size: SizeVal, IsVolatile: false);
5099 addInstToNewSourceAtom(KeyInstruction: I, Backup: nullptr);
5100 return RValue::get(Addr: Dest, CGF&: *this);
5101 }
5102
5103 case Builtin::BI__builtin_objc_memmove_collectable: {
5104 Address DestAddr = EmitPointerWithAlignment(Addr: E->getArg(Arg: 0));
5105 Address SrcAddr = EmitPointerWithAlignment(Addr: E->getArg(Arg: 1));
5106 Value *SizeVal = EmitScalarExpr(E: E->getArg(Arg: 2));
5107 CGM.getObjCRuntime().EmitGCMemmoveCollectable(CGF&: *this,
5108 DestPtr: DestAddr, SrcPtr: SrcAddr, Size: SizeVal);
5109 return RValue::get(Addr: DestAddr, CGF&: *this);
5110 }
5111
5112 case Builtin::BI__builtin___memmove_chk: {
5113 // fold __builtin_memmove_chk(x, y, cst1, cst2) to memmove iff cst1<=cst2.
5114 Expr::EvalResult SizeResult, DstSizeResult;
5115 if (!E->getArg(Arg: 2)->EvaluateAsInt(Result&: SizeResult, Ctx: CGM.getContext()) ||
5116 !E->getArg(Arg: 3)->EvaluateAsInt(Result&: DstSizeResult, Ctx: CGM.getContext()))
5117 break;
5118 llvm::APSInt Size = SizeResult.Val.getInt();
5119 llvm::APSInt DstSize = DstSizeResult.Val.getInt();
5120 if (Size.ugt(RHS: DstSize))
5121 break;
5122 Address Dest = EmitPointerWithAlignment(Addr: E->getArg(Arg: 0));
5123 Address Src = EmitPointerWithAlignment(Addr: E->getArg(Arg: 1));
5124 Value *SizeVal = llvm::ConstantInt::get(Context&: Builder.getContext(), V: Size);
5125 auto *I = Builder.CreateMemMove(Dest, Src, Size: SizeVal, IsVolatile: false);
5126 addInstToNewSourceAtom(KeyInstruction: I, Backup: nullptr);
5127 return RValue::get(Addr: Dest, CGF&: *this);
5128 }
5129
5130 case Builtin::BI__builtin_trivially_relocate:
5131 case Builtin::BImemmove:
5132 case Builtin::BI__builtin_memmove: {
5133 Address Dest = EmitPointerWithAlignment(Addr: E->getArg(Arg: 0));
5134 Address Src = EmitPointerWithAlignment(Addr: E->getArg(Arg: 1));
5135 Value *SizeVal = EmitScalarExpr(E: E->getArg(Arg: 2));
5136 if (BuiltinIDIfNoAsmLabel == Builtin::BI__builtin_trivially_relocate)
5137 SizeVal = Builder.CreateMul(
5138 LHS: SizeVal,
5139 RHS: ConstantInt::get(
5140 Ty: SizeVal->getType(),
5141 V: getContext()
5142 .getTypeSizeInChars(T: E->getArg(Arg: 0)->getType()->getPointeeType())
5143 .getQuantity()));
5144 EmitArgCheck(TCK_Store, Dest, E->getArg(Arg: 0), 0);
5145 EmitArgCheck(TCK_Load, Src, E->getArg(Arg: 1), 1);
5146 auto *I = Builder.CreateMemMove(Dest, Src, Size: SizeVal, IsVolatile: false);
5147 addInstToNewSourceAtom(KeyInstruction: I, Backup: nullptr);
5148 return RValue::get(Addr: Dest, CGF&: *this);
5149 }
5150 case Builtin::BImemset:
5151 case Builtin::BI__builtin_memset: {
5152 Address Dest = EmitPointerWithAlignment(Addr: E->getArg(Arg: 0));
5153 Value *ByteVal = Builder.CreateTrunc(V: EmitScalarExpr(E: E->getArg(Arg: 1)),
5154 DestTy: Builder.getInt8Ty());
5155 Value *SizeVal = EmitScalarExpr(E: E->getArg(Arg: 2));
5156 EmitNonNullArgCheck(Addr: Dest, ArgType: E->getArg(Arg: 0)->getType(),
5157 ArgLoc: E->getArg(Arg: 0)->getExprLoc(), AC: FD, ParmNum: 0);
5158 auto *I = Builder.CreateMemSet(Dest, Value: ByteVal, Size: SizeVal, IsVolatile: false);
5159 addInstToNewSourceAtom(KeyInstruction: I, Backup: ByteVal);
5160 return RValue::get(Addr: Dest, CGF&: *this);
5161 }
5162 case Builtin::BI__builtin_memset_inline: {
5163 Address Dest = EmitPointerWithAlignment(Addr: E->getArg(Arg: 0));
5164 Value *ByteVal =
5165 Builder.CreateTrunc(V: EmitScalarExpr(E: E->getArg(Arg: 1)), DestTy: Builder.getInt8Ty());
5166 uint64_t Size =
5167 E->getArg(Arg: 2)->EvaluateKnownConstInt(Ctx: getContext()).getZExtValue();
5168 EmitNonNullArgCheck(RV: RValue::get(V: Dest.emitRawPointer(CGF&: *this)),
5169 ArgType: E->getArg(Arg: 0)->getType(), ArgLoc: E->getArg(Arg: 0)->getExprLoc(), AC: FD,
5170 ParmNum: 0);
5171 auto *I = Builder.CreateMemSetInline(Dest, Value: ByteVal, Size);
5172 addInstToNewSourceAtom(KeyInstruction: I, Backup: nullptr);
5173 return RValue::get(V: nullptr);
5174 }
5175 case Builtin::BI__builtin___memset_chk: {
5176 // fold __builtin_memset_chk(x, y, cst1, cst2) to memset iff cst1<=cst2.
5177 Expr::EvalResult SizeResult, DstSizeResult;
5178 if (!E->getArg(Arg: 2)->EvaluateAsInt(Result&: SizeResult, Ctx: CGM.getContext()) ||
5179 !E->getArg(Arg: 3)->EvaluateAsInt(Result&: DstSizeResult, Ctx: CGM.getContext()))
5180 break;
5181 llvm::APSInt Size = SizeResult.Val.getInt();
5182 llvm::APSInt DstSize = DstSizeResult.Val.getInt();
5183 if (Size.ugt(RHS: DstSize))
5184 break;
5185 Address Dest = EmitPointerWithAlignment(Addr: E->getArg(Arg: 0));
5186 Value *ByteVal = Builder.CreateTrunc(V: EmitScalarExpr(E: E->getArg(Arg: 1)),
5187 DestTy: Builder.getInt8Ty());
5188 Value *SizeVal = llvm::ConstantInt::get(Context&: Builder.getContext(), V: Size);
5189 auto *I = Builder.CreateMemSet(Dest, Value: ByteVal, Size: SizeVal, IsVolatile: false);
5190 addInstToNewSourceAtom(KeyInstruction: I, Backup: nullptr);
5191 return RValue::get(Addr: Dest, CGF&: *this);
5192 }
5193 case Builtin::BI__builtin_wmemchr: {
5194 // The MSVC runtime library does not provide a definition of wmemchr, so we
5195 // need an inline implementation.
5196 if (!getTarget().getTriple().isOSMSVCRT())
5197 break;
5198
5199 llvm::Type *WCharTy = ConvertType(T: getContext().WCharTy);
5200 Value *Str = EmitScalarExpr(E: E->getArg(Arg: 0));
5201 Value *Chr = EmitScalarExpr(E: E->getArg(Arg: 1));
5202 Value *Size = EmitScalarExpr(E: E->getArg(Arg: 2));
5203
5204 BasicBlock *Entry = Builder.GetInsertBlock();
5205 BasicBlock *CmpEq = createBasicBlock(name: "wmemchr.eq");
5206 BasicBlock *Next = createBasicBlock(name: "wmemchr.next");
5207 BasicBlock *Exit = createBasicBlock(name: "wmemchr.exit");
5208 Value *SizeEq0 = Builder.CreateICmpEQ(LHS: Size, RHS: ConstantInt::get(Ty: SizeTy, V: 0));
5209 Builder.CreateCondBr(Cond: SizeEq0, True: Exit, False: CmpEq);
5210
5211 EmitBlock(BB: CmpEq);
5212 PHINode *StrPhi = Builder.CreatePHI(Ty: Str->getType(), NumReservedValues: 2);
5213 StrPhi->addIncoming(V: Str, BB: Entry);
5214 PHINode *SizePhi = Builder.CreatePHI(Ty: SizeTy, NumReservedValues: 2);
5215 SizePhi->addIncoming(V: Size, BB: Entry);
5216 CharUnits WCharAlign =
5217 getContext().getTypeAlignInChars(T: getContext().WCharTy);
5218 Value *StrCh = Builder.CreateAlignedLoad(Ty: WCharTy, Addr: StrPhi, Align: WCharAlign);
5219 Value *FoundChr = Builder.CreateConstInBoundsGEP1_32(Ty: WCharTy, Ptr: StrPhi, Idx0: 0);
5220 Value *StrEqChr = Builder.CreateICmpEQ(LHS: StrCh, RHS: Chr);
5221 Builder.CreateCondBr(Cond: StrEqChr, True: Exit, False: Next);
5222
5223 EmitBlock(BB: Next);
5224 Value *NextStr = Builder.CreateConstInBoundsGEP1_32(Ty: WCharTy, Ptr: StrPhi, Idx0: 1);
5225 Value *NextSize = Builder.CreateSub(LHS: SizePhi, RHS: ConstantInt::get(Ty: SizeTy, V: 1));
5226 Value *NextSizeEq0 =
5227 Builder.CreateICmpEQ(LHS: NextSize, RHS: ConstantInt::get(Ty: SizeTy, V: 0));
5228 Builder.CreateCondBr(Cond: NextSizeEq0, True: Exit, False: CmpEq);
5229 StrPhi->addIncoming(V: NextStr, BB: Next);
5230 SizePhi->addIncoming(V: NextSize, BB: Next);
5231
5232 EmitBlock(BB: Exit);
5233 PHINode *Ret = Builder.CreatePHI(Ty: Str->getType(), NumReservedValues: 3);
5234 Ret->addIncoming(V: llvm::Constant::getNullValue(Ty: Str->getType()), BB: Entry);
5235 Ret->addIncoming(V: llvm::Constant::getNullValue(Ty: Str->getType()), BB: Next);
5236 Ret->addIncoming(V: FoundChr, BB: CmpEq);
5237 return RValue::get(V: Ret);
5238 }
5239 case Builtin::BI__builtin_wmemcmp: {
5240 // The MSVC runtime library does not provide a definition of wmemcmp, so we
5241 // need an inline implementation.
5242 if (!getTarget().getTriple().isOSMSVCRT())
5243 break;
5244
5245 llvm::Type *WCharTy = ConvertType(T: getContext().WCharTy);
5246
5247 Value *Dst = EmitScalarExpr(E: E->getArg(Arg: 0));
5248 Value *Src = EmitScalarExpr(E: E->getArg(Arg: 1));
5249 Value *Size = EmitScalarExpr(E: E->getArg(Arg: 2));
5250
5251 BasicBlock *Entry = Builder.GetInsertBlock();
5252 BasicBlock *CmpGT = createBasicBlock(name: "wmemcmp.gt");
5253 BasicBlock *CmpLT = createBasicBlock(name: "wmemcmp.lt");
5254 BasicBlock *Next = createBasicBlock(name: "wmemcmp.next");
5255 BasicBlock *Exit = createBasicBlock(name: "wmemcmp.exit");
5256 Value *SizeEq0 = Builder.CreateICmpEQ(LHS: Size, RHS: ConstantInt::get(Ty: SizeTy, V: 0));
5257 Builder.CreateCondBr(Cond: SizeEq0, True: Exit, False: CmpGT);
5258
5259 EmitBlock(BB: CmpGT);
5260 PHINode *DstPhi = Builder.CreatePHI(Ty: Dst->getType(), NumReservedValues: 2);
5261 DstPhi->addIncoming(V: Dst, BB: Entry);
5262 PHINode *SrcPhi = Builder.CreatePHI(Ty: Src->getType(), NumReservedValues: 2);
5263 SrcPhi->addIncoming(V: Src, BB: Entry);
5264 PHINode *SizePhi = Builder.CreatePHI(Ty: SizeTy, NumReservedValues: 2);
5265 SizePhi->addIncoming(V: Size, BB: Entry);
5266 CharUnits WCharAlign =
5267 getContext().getTypeAlignInChars(T: getContext().WCharTy);
5268 Value *DstCh = Builder.CreateAlignedLoad(Ty: WCharTy, Addr: DstPhi, Align: WCharAlign);
5269 Value *SrcCh = Builder.CreateAlignedLoad(Ty: WCharTy, Addr: SrcPhi, Align: WCharAlign);
5270 Value *DstGtSrc = Builder.CreateICmpUGT(LHS: DstCh, RHS: SrcCh);
5271 Builder.CreateCondBr(Cond: DstGtSrc, True: Exit, False: CmpLT);
5272
5273 EmitBlock(BB: CmpLT);
5274 Value *DstLtSrc = Builder.CreateICmpULT(LHS: DstCh, RHS: SrcCh);
5275 Builder.CreateCondBr(Cond: DstLtSrc, True: Exit, False: Next);
5276
5277 EmitBlock(BB: Next);
5278 Value *NextDst = Builder.CreateConstInBoundsGEP1_32(Ty: WCharTy, Ptr: DstPhi, Idx0: 1);
5279 Value *NextSrc = Builder.CreateConstInBoundsGEP1_32(Ty: WCharTy, Ptr: SrcPhi, Idx0: 1);
5280 Value *NextSize = Builder.CreateSub(LHS: SizePhi, RHS: ConstantInt::get(Ty: SizeTy, V: 1));
5281 Value *NextSizeEq0 =
5282 Builder.CreateICmpEQ(LHS: NextSize, RHS: ConstantInt::get(Ty: SizeTy, V: 0));
5283 Builder.CreateCondBr(Cond: NextSizeEq0, True: Exit, False: CmpGT);
5284 DstPhi->addIncoming(V: NextDst, BB: Next);
5285 SrcPhi->addIncoming(V: NextSrc, BB: Next);
5286 SizePhi->addIncoming(V: NextSize, BB: Next);
5287
5288 EmitBlock(BB: Exit);
5289 PHINode *Ret = Builder.CreatePHI(Ty: IntTy, NumReservedValues: 4);
5290 Ret->addIncoming(V: ConstantInt::get(Ty: IntTy, V: 0), BB: Entry);
5291 Ret->addIncoming(V: ConstantInt::get(Ty: IntTy, V: 1), BB: CmpGT);
5292 Ret->addIncoming(V: ConstantInt::getAllOnesValue(Ty: IntTy), BB: CmpLT);
5293 Ret->addIncoming(V: ConstantInt::get(Ty: IntTy, V: 0), BB: Next);
5294 return RValue::get(V: Ret);
5295 }
5296 case Builtin::BI__builtin_dwarf_cfa: {
5297 // The offset in bytes from the first argument to the CFA.
5298 //
5299 // Why on earth is this in the frontend? Is there any reason at
5300 // all that the backend can't reasonably determine this while
5301 // lowering llvm.eh.dwarf.cfa()?
5302 //
5303 // TODO: If there's a satisfactory reason, add a target hook for
5304 // this instead of hard-coding 0, which is correct for most targets.
5305 int32_t Offset = 0;
5306
5307 Function *F = CGM.getIntrinsic(IID: Intrinsic::eh_dwarf_cfa);
5308 return RValue::get(V: Builder.CreateCall(Callee: F,
5309 Args: llvm::ConstantInt::get(Ty: Int32Ty, V: Offset)));
5310 }
5311 case Builtin::BI__builtin_return_address: {
5312 Value *Depth = ConstantEmitter(*this).emitAbstract(E: E->getArg(Arg: 0),
5313 T: getContext().UnsignedIntTy);
5314 Function *F =
5315 CGM.getIntrinsic(IID: Intrinsic::returnaddress, Tys: {CGM.ProgramPtrTy});
5316 return RValue::get(V: Builder.CreateCall(Callee: F, Args: Depth));
5317 }
5318 case Builtin::BI_ReturnAddress: {
5319 Function *F =
5320 CGM.getIntrinsic(IID: Intrinsic::returnaddress, Tys: {CGM.ProgramPtrTy});
5321 return RValue::get(V: Builder.CreateCall(Callee: F, Args: Builder.getInt32(C: 0)));
5322 }
5323 case Builtin::BI__builtin_frame_address: {
5324 Value *Depth = ConstantEmitter(*this).emitAbstract(E: E->getArg(Arg: 0),
5325 T: getContext().UnsignedIntTy);
5326 Function *F = CGM.getIntrinsic(IID: Intrinsic::frameaddress, Tys: AllocaInt8PtrTy);
5327 return RValue::get(V: Builder.CreateCall(Callee: F, Args: Depth));
5328 }
5329 case Builtin::BI__builtin_stack_address: {
5330 return RValue::get(V: Builder.CreateCall(
5331 Callee: CGM.getIntrinsic(IID: Intrinsic::stackaddress, Tys: AllocaInt8PtrTy)));
5332 }
5333 case Builtin::BI__builtin_extract_return_addr: {
5334 Value *Address = EmitScalarExpr(E: E->getArg(Arg: 0));
5335 Value *Result = getTargetHooks().decodeReturnAddress(CGF&: *this, Address);
5336 return RValue::get(V: Result);
5337 }
5338 case Builtin::BI__builtin_frob_return_addr: {
5339 Value *Address = EmitScalarExpr(E: E->getArg(Arg: 0));
5340 Value *Result = getTargetHooks().encodeReturnAddress(CGF&: *this, Address);
5341 return RValue::get(V: Result);
5342 }
5343 case Builtin::BI__builtin_dwarf_sp_column: {
5344 llvm::IntegerType *Ty
5345 = cast<llvm::IntegerType>(Val: ConvertType(T: E->getType()));
5346 int Column = getTargetHooks().getDwarfEHStackPointer(M&: CGM);
5347 if (Column == -1) {
5348 CGM.ErrorUnsupported(S: E, Type: "__builtin_dwarf_sp_column");
5349 return RValue::get(V: llvm::UndefValue::get(T: Ty));
5350 }
5351 return RValue::get(V: llvm::ConstantInt::get(Ty, V: Column, IsSigned: true));
5352 }
5353 case Builtin::BI__builtin_init_dwarf_reg_size_table: {
5354 Value *Address = EmitScalarExpr(E: E->getArg(Arg: 0));
5355 if (getTargetHooks().initDwarfEHRegSizeTable(CGF&: *this, Address))
5356 CGM.ErrorUnsupported(S: E, Type: "__builtin_init_dwarf_reg_size_table");
5357 return RValue::get(V: llvm::UndefValue::get(T: ConvertType(T: E->getType())));
5358 }
5359 case Builtin::BI__builtin_eh_return: {
5360 Value *Int = EmitScalarExpr(E: E->getArg(Arg: 0));
5361 Value *Ptr = EmitScalarExpr(E: E->getArg(Arg: 1));
5362
5363 llvm::IntegerType *IntTy = cast<llvm::IntegerType>(Val: Int->getType());
5364 assert((IntTy->getBitWidth() == 32 || IntTy->getBitWidth() == 64) &&
5365 "LLVM's __builtin_eh_return only supports 32- and 64-bit variants");
5366 Function *F =
5367 CGM.getIntrinsic(IID: IntTy->getBitWidth() == 32 ? Intrinsic::eh_return_i32
5368 : Intrinsic::eh_return_i64);
5369 Builder.CreateCall(Callee: F, Args: {Int, Ptr});
5370 Builder.CreateUnreachable();
5371
5372 // We do need to preserve an insertion point.
5373 EmitBlock(BB: createBasicBlock(name: "builtin_eh_return.cont"));
5374
5375 return RValue::get(V: nullptr);
5376 }
5377 case Builtin::BI__builtin_unwind_init: {
5378 Function *F = CGM.getIntrinsic(IID: Intrinsic::eh_unwind_init);
5379 Builder.CreateCall(Callee: F);
5380 return RValue::get(V: nullptr);
5381 }
5382 case Builtin::BI__builtin_extend_pointer: {
5383 // Extends a pointer to the size of an _Unwind_Word, which is
5384 // uint64_t on all platforms. Generally this gets poked into a
5385 // register and eventually used as an address, so if the
5386 // addressing registers are wider than pointers and the platform
5387 // doesn't implicitly ignore high-order bits when doing
5388 // addressing, we need to make sure we zext / sext based on
5389 // the platform's expectations.
5390 //
5391 // See: http://gcc.gnu.org/ml/gcc-bugs/2002-02/msg00237.html
5392
5393 // Cast the pointer to intptr_t.
5394 Value *Ptr = EmitScalarExpr(E: E->getArg(Arg: 0));
5395 Value *Result = Builder.CreatePtrToInt(V: Ptr, DestTy: IntPtrTy, Name: "extend.cast");
5396
5397 // If that's 64 bits, we're done.
5398 if (IntPtrTy->getBitWidth() == 64)
5399 return RValue::get(V: Result);
5400
5401 // Otherwise, ask the codegen data what to do.
5402 if (getTargetHooks().extendPointerWithSExt())
5403 return RValue::get(V: Builder.CreateSExt(V: Result, DestTy: Int64Ty, Name: "extend.sext"));
5404 else
5405 return RValue::get(V: Builder.CreateZExt(V: Result, DestTy: Int64Ty, Name: "extend.zext"));
5406 }
5407 case Builtin::BI__builtin_setjmp: {
5408 // Buffer is a void**.
5409 Address Buf = EmitPointerWithAlignment(Addr: E->getArg(Arg: 0));
5410
5411 if (getTarget().getTriple().getArch() == llvm::Triple::systemz) {
5412 // On this target, the back end fills in the context buffer completely.
5413 // It doesn't really matter if the frontend stores to the buffer before
5414 // calling setjmp, the back-end is going to overwrite them anyway.
5415 Function *F = CGM.getIntrinsic(IID: Intrinsic::eh_sjlj_setjmp);
5416 return RValue::get(V: Builder.CreateCall(Callee: F, Args: Buf.emitRawPointer(CGF&: *this)));
5417 }
5418
5419 // Store the frame pointer to the setjmp buffer.
5420 Value *FrameAddr = Builder.CreateCall(
5421 Callee: CGM.getIntrinsic(IID: Intrinsic::frameaddress, Tys: AllocaInt8PtrTy),
5422 Args: ConstantInt::get(Ty: Int32Ty, V: 0));
5423 Builder.CreateStore(Val: FrameAddr, Addr: Buf);
5424
5425 // Store the stack pointer to the setjmp buffer.
5426 Value *StackAddr = Builder.CreateStackSave();
5427 assert(Buf.emitRawPointer(*this)->getType() == StackAddr->getType());
5428
5429 Address StackSaveSlot = Builder.CreateConstInBoundsGEP(Addr: Buf, Index: 2);
5430 Builder.CreateStore(Val: StackAddr, Addr: StackSaveSlot);
5431
5432 // Call LLVM's EH setjmp, which is lightweight.
5433 Function *F = CGM.getIntrinsic(IID: Intrinsic::eh_sjlj_setjmp);
5434 return RValue::get(V: Builder.CreateCall(Callee: F, Args: Buf.emitRawPointer(CGF&: *this)));
5435 }
5436 case Builtin::BI__builtin_longjmp: {
5437 Value *Buf = EmitScalarExpr(E: E->getArg(Arg: 0));
5438
5439 // Call LLVM's EH longjmp, which is lightweight.
5440 Builder.CreateCall(Callee: CGM.getIntrinsic(IID: Intrinsic::eh_sjlj_longjmp), Args: Buf);
5441
5442 // longjmp doesn't return; mark this as unreachable.
5443 Builder.CreateUnreachable();
5444
5445 // We do need to preserve an insertion point.
5446 EmitBlock(BB: createBasicBlock(name: "longjmp.cont"));
5447
5448 return RValue::get(V: nullptr);
5449 }
5450 case Builtin::BI__builtin_launder: {
5451 const Expr *Arg = E->getArg(Arg: 0);
5452 QualType ArgTy = Arg->getType()->getPointeeType();
5453 Value *Ptr = EmitScalarExpr(E: Arg);
5454 if (TypeRequiresBuiltinLaunder(CGM, Ty: ArgTy))
5455 Ptr = Builder.CreateLaunderInvariantGroup(Ptr);
5456
5457 return RValue::get(V: Ptr);
5458 }
5459 case Builtin::BI__builtin_clear_padding: {
5460 Address Src = EmitPointerWithAlignment(Addr: E->getArg(Arg: 0));
5461 auto PointeeTy = E->getArg(Arg: 0)->getType()->getPointeeType();
5462 PaddingClearer clearer{*this};
5463 clearer.run(Src, Ty: PointeeTy);
5464 return RValue::get(V: nullptr);
5465 }
5466 case Builtin::BI__sync_fetch_and_add:
5467 case Builtin::BI__sync_fetch_and_sub:
5468 case Builtin::BI__sync_fetch_and_or:
5469 case Builtin::BI__sync_fetch_and_and:
5470 case Builtin::BI__sync_fetch_and_xor:
5471 case Builtin::BI__sync_fetch_and_nand:
5472 case Builtin::BI__sync_add_and_fetch:
5473 case Builtin::BI__sync_sub_and_fetch:
5474 case Builtin::BI__sync_and_and_fetch:
5475 case Builtin::BI__sync_or_and_fetch:
5476 case Builtin::BI__sync_xor_and_fetch:
5477 case Builtin::BI__sync_nand_and_fetch:
5478 case Builtin::BI__sync_val_compare_and_swap:
5479 case Builtin::BI__sync_bool_compare_and_swap:
5480 case Builtin::BI__sync_lock_test_and_set:
5481 case Builtin::BI__sync_lock_release:
5482 case Builtin::BI__sync_swap:
5483 llvm_unreachable("Shouldn't make it through sema");
5484 case Builtin::BI__sync_fetch_and_add_1:
5485 case Builtin::BI__sync_fetch_and_add_2:
5486 case Builtin::BI__sync_fetch_and_add_4:
5487 case Builtin::BI__sync_fetch_and_add_8:
5488 case Builtin::BI__sync_fetch_and_add_16:
5489 return EmitBinaryAtomic(CGF&: *this, Kind: llvm::AtomicRMWInst::Add, E);
5490 case Builtin::BI__sync_fetch_and_sub_1:
5491 case Builtin::BI__sync_fetch_and_sub_2:
5492 case Builtin::BI__sync_fetch_and_sub_4:
5493 case Builtin::BI__sync_fetch_and_sub_8:
5494 case Builtin::BI__sync_fetch_and_sub_16:
5495 return EmitBinaryAtomic(CGF&: *this, Kind: llvm::AtomicRMWInst::Sub, E);
5496 case Builtin::BI__sync_fetch_and_or_1:
5497 case Builtin::BI__sync_fetch_and_or_2:
5498 case Builtin::BI__sync_fetch_and_or_4:
5499 case Builtin::BI__sync_fetch_and_or_8:
5500 case Builtin::BI__sync_fetch_and_or_16:
5501 return EmitBinaryAtomic(CGF&: *this, Kind: llvm::AtomicRMWInst::Or, E);
5502 case Builtin::BI__sync_fetch_and_and_1:
5503 case Builtin::BI__sync_fetch_and_and_2:
5504 case Builtin::BI__sync_fetch_and_and_4:
5505 case Builtin::BI__sync_fetch_and_and_8:
5506 case Builtin::BI__sync_fetch_and_and_16:
5507 return EmitBinaryAtomic(CGF&: *this, Kind: llvm::AtomicRMWInst::And, E);
5508 case Builtin::BI__sync_fetch_and_xor_1:
5509 case Builtin::BI__sync_fetch_and_xor_2:
5510 case Builtin::BI__sync_fetch_and_xor_4:
5511 case Builtin::BI__sync_fetch_and_xor_8:
5512 case Builtin::BI__sync_fetch_and_xor_16:
5513 return EmitBinaryAtomic(CGF&: *this, Kind: llvm::AtomicRMWInst::Xor, E);
5514 case Builtin::BI__sync_fetch_and_nand_1:
5515 case Builtin::BI__sync_fetch_and_nand_2:
5516 case Builtin::BI__sync_fetch_and_nand_4:
5517 case Builtin::BI__sync_fetch_and_nand_8:
5518 case Builtin::BI__sync_fetch_and_nand_16:
5519 return EmitBinaryAtomic(CGF&: *this, Kind: llvm::AtomicRMWInst::Nand, E);
5520
5521 // Clang extensions: not overloaded yet.
5522 case Builtin::BI__sync_fetch_and_min:
5523 return EmitBinaryAtomic(CGF&: *this, Kind: llvm::AtomicRMWInst::Min, E);
5524 case Builtin::BI__sync_fetch_and_max:
5525 return EmitBinaryAtomic(CGF&: *this, Kind: llvm::AtomicRMWInst::Max, E);
5526 case Builtin::BI__sync_fetch_and_umin:
5527 return EmitBinaryAtomic(CGF&: *this, Kind: llvm::AtomicRMWInst::UMin, E);
5528 case Builtin::BI__sync_fetch_and_umax:
5529 return EmitBinaryAtomic(CGF&: *this, Kind: llvm::AtomicRMWInst::UMax, E);
5530
5531 case Builtin::BI__sync_add_and_fetch_1:
5532 case Builtin::BI__sync_add_and_fetch_2:
5533 case Builtin::BI__sync_add_and_fetch_4:
5534 case Builtin::BI__sync_add_and_fetch_8:
5535 case Builtin::BI__sync_add_and_fetch_16:
5536 return EmitBinaryAtomicPost(CGF&: *this, Kind: llvm::AtomicRMWInst::Add, E,
5537 Op: llvm::Instruction::Add);
5538 case Builtin::BI__sync_sub_and_fetch_1:
5539 case Builtin::BI__sync_sub_and_fetch_2:
5540 case Builtin::BI__sync_sub_and_fetch_4:
5541 case Builtin::BI__sync_sub_and_fetch_8:
5542 case Builtin::BI__sync_sub_and_fetch_16:
5543 return EmitBinaryAtomicPost(CGF&: *this, Kind: llvm::AtomicRMWInst::Sub, E,
5544 Op: llvm::Instruction::Sub);
5545 case Builtin::BI__sync_and_and_fetch_1:
5546 case Builtin::BI__sync_and_and_fetch_2:
5547 case Builtin::BI__sync_and_and_fetch_4:
5548 case Builtin::BI__sync_and_and_fetch_8:
5549 case Builtin::BI__sync_and_and_fetch_16:
5550 return EmitBinaryAtomicPost(CGF&: *this, Kind: llvm::AtomicRMWInst::And, E,
5551 Op: llvm::Instruction::And);
5552 case Builtin::BI__sync_or_and_fetch_1:
5553 case Builtin::BI__sync_or_and_fetch_2:
5554 case Builtin::BI__sync_or_and_fetch_4:
5555 case Builtin::BI__sync_or_and_fetch_8:
5556 case Builtin::BI__sync_or_and_fetch_16:
5557 return EmitBinaryAtomicPost(CGF&: *this, Kind: llvm::AtomicRMWInst::Or, E,
5558 Op: llvm::Instruction::Or);
5559 case Builtin::BI__sync_xor_and_fetch_1:
5560 case Builtin::BI__sync_xor_and_fetch_2:
5561 case Builtin::BI__sync_xor_and_fetch_4:
5562 case Builtin::BI__sync_xor_and_fetch_8:
5563 case Builtin::BI__sync_xor_and_fetch_16:
5564 return EmitBinaryAtomicPost(CGF&: *this, Kind: llvm::AtomicRMWInst::Xor, E,
5565 Op: llvm::Instruction::Xor);
5566 case Builtin::BI__sync_nand_and_fetch_1:
5567 case Builtin::BI__sync_nand_and_fetch_2:
5568 case Builtin::BI__sync_nand_and_fetch_4:
5569 case Builtin::BI__sync_nand_and_fetch_8:
5570 case Builtin::BI__sync_nand_and_fetch_16:
5571 return EmitBinaryAtomicPost(CGF&: *this, Kind: llvm::AtomicRMWInst::Nand, E,
5572 Op: llvm::Instruction::And, Invert: true);
5573
5574 case Builtin::BI__sync_val_compare_and_swap_1:
5575 case Builtin::BI__sync_val_compare_and_swap_2:
5576 case Builtin::BI__sync_val_compare_and_swap_4:
5577 case Builtin::BI__sync_val_compare_and_swap_8:
5578 case Builtin::BI__sync_val_compare_and_swap_16:
5579 return RValue::get(V: MakeAtomicCmpXchgValue(
5580 CGF&: *this, E, ReturnBool: false, SuccessOrdering: AtomicOrdering::SequentiallyConsistent,
5581 FailureOrdering: AtomicOrdering::SequentiallyConsistent));
5582
5583 case Builtin::BI__sync_bool_compare_and_swap_1:
5584 case Builtin::BI__sync_bool_compare_and_swap_2:
5585 case Builtin::BI__sync_bool_compare_and_swap_4:
5586 case Builtin::BI__sync_bool_compare_and_swap_8:
5587 case Builtin::BI__sync_bool_compare_and_swap_16:
5588 return RValue::get(V: MakeAtomicCmpXchgValue(
5589 CGF&: *this, E, ReturnBool: true, SuccessOrdering: AtomicOrdering::SequentiallyConsistent,
5590 FailureOrdering: AtomicOrdering::SequentiallyConsistent));
5591
5592 case Builtin::BI__sync_swap_1:
5593 case Builtin::BI__sync_swap_2:
5594 case Builtin::BI__sync_swap_4:
5595 case Builtin::BI__sync_swap_8:
5596 case Builtin::BI__sync_swap_16:
5597 return EmitBinaryAtomic(CGF&: *this, Kind: llvm::AtomicRMWInst::Xchg, E);
5598
5599 case Builtin::BI__sync_lock_test_and_set_1:
5600 case Builtin::BI__sync_lock_test_and_set_2:
5601 case Builtin::BI__sync_lock_test_and_set_4:
5602 case Builtin::BI__sync_lock_test_and_set_8:
5603 case Builtin::BI__sync_lock_test_and_set_16:
5604 return EmitBinaryAtomic(CGF&: *this, Kind: llvm::AtomicRMWInst::Xchg, E);
5605
5606 case Builtin::BI__sync_lock_release_1:
5607 case Builtin::BI__sync_lock_release_2:
5608 case Builtin::BI__sync_lock_release_4:
5609 case Builtin::BI__sync_lock_release_8:
5610 case Builtin::BI__sync_lock_release_16: {
5611 Address Ptr = CheckAtomicAlignment(CGF&: *this, E);
5612 QualType ElTy = E->getArg(Arg: 0)->getType()->getPointeeType();
5613
5614 llvm::Type *ITy = llvm::IntegerType::get(C&: getLLVMContext(),
5615 NumBits: getContext().getTypeSize(T: ElTy));
5616 llvm::StoreInst *Store =
5617 Builder.CreateStore(Val: llvm::Constant::getNullValue(Ty: ITy), Addr: Ptr);
5618 Store->setAtomic(Ordering: llvm::AtomicOrdering::Release);
5619 return RValue::get(V: nullptr);
5620 }
5621
5622 case Builtin::BI__sync_synchronize: {
5623 // We assume this is supposed to correspond to a C++0x-style
5624 // sequentially-consistent fence (i.e. this is only usable for
5625 // synchronization, not device I/O or anything like that). This intrinsic
5626 // is really badly designed in the sense that in theory, there isn't
5627 // any way to safely use it... but in practice, it mostly works
5628 // to use it with non-atomic loads and stores to get acquire/release
5629 // semantics.
5630 Builder.CreateFence(Ordering: llvm::AtomicOrdering::SequentiallyConsistent);
5631 return RValue::get(V: nullptr);
5632 }
5633
5634 case Builtin::BI__builtin_nontemporal_load:
5635 return RValue::get(V: EmitNontemporalLoad(CGF&: *this, E));
5636 case Builtin::BI__builtin_nontemporal_store:
5637 return RValue::get(V: EmitNontemporalStore(CGF&: *this, E));
5638 case Builtin::BI__c11_atomic_is_lock_free:
5639 case Builtin::BI__atomic_is_lock_free: {
5640 // Call "bool __atomic_is_lock_free(size_t size, void *ptr)". For the
5641 // __c11 builtin, ptr is 0 (indicating a properly-aligned object), since
5642 // _Atomic(T) is always properly-aligned.
5643 const char *LibCallName = "__atomic_is_lock_free";
5644 CallArgList Args;
5645 Args.add(rvalue: RValue::get(V: EmitScalarExpr(E: E->getArg(Arg: 0))),
5646 type: getContext().getSizeType());
5647 if (BuiltinID == Builtin::BI__atomic_is_lock_free)
5648 Args.add(rvalue: RValue::get(V: EmitScalarExpr(E: E->getArg(Arg: 1))),
5649 type: getContext().VoidPtrTy);
5650 else
5651 Args.add(rvalue: RValue::get(V: llvm::Constant::getNullValue(Ty: VoidPtrTy)),
5652 type: getContext().VoidPtrTy);
5653 const CGFunctionInfo &FuncInfo =
5654 CGM.getTypes().arrangeBuiltinFunctionCall(resultType: E->getType(), args: Args);
5655 llvm::FunctionType *FTy = CGM.getTypes().GetFunctionType(Info: FuncInfo);
5656 llvm::FunctionCallee Func = CGM.CreateRuntimeFunction(Ty: FTy, Name: LibCallName);
5657 return EmitCall(CallInfo: FuncInfo, Callee: CGCallee::forDirect(functionPtr: Func),
5658 ReturnValue: ReturnValueSlot(), Args);
5659 }
5660
5661 case Builtin::BI__atomic_thread_fence:
5662 case Builtin::BI__atomic_signal_fence:
5663 case Builtin::BI__c11_atomic_thread_fence:
5664 case Builtin::BI__c11_atomic_signal_fence: {
5665 llvm::SyncScope::ID SSID;
5666 if (BuiltinID == Builtin::BI__atomic_signal_fence ||
5667 BuiltinID == Builtin::BI__c11_atomic_signal_fence)
5668 SSID = llvm::SyncScope::SingleThread;
5669 else
5670 SSID = llvm::SyncScope::System;
5671 Value *Order = EmitScalarExpr(E: E->getArg(Arg: 0));
5672 if (isa<llvm::ConstantInt>(Val: Order)) {
5673 int ord = cast<llvm::ConstantInt>(Val: Order)->getZExtValue();
5674 switch (ord) {
5675 case 0: // memory_order_relaxed
5676 default: // invalid order
5677 break;
5678 case 1: // memory_order_consume
5679 case 2: // memory_order_acquire
5680 Builder.CreateFence(Ordering: llvm::AtomicOrdering::Acquire, SSID);
5681 break;
5682 case 3: // memory_order_release
5683 Builder.CreateFence(Ordering: llvm::AtomicOrdering::Release, SSID);
5684 break;
5685 case 4: // memory_order_acq_rel
5686 Builder.CreateFence(Ordering: llvm::AtomicOrdering::AcquireRelease, SSID);
5687 break;
5688 case 5: // memory_order_seq_cst
5689 Builder.CreateFence(Ordering: llvm::AtomicOrdering::SequentiallyConsistent, SSID);
5690 break;
5691 }
5692 return RValue::get(V: nullptr);
5693 }
5694
5695 llvm::BasicBlock *AcquireBB, *ReleaseBB, *AcqRelBB, *SeqCstBB;
5696 AcquireBB = createBasicBlock(name: "acquire", parent: CurFn);
5697 ReleaseBB = createBasicBlock(name: "release", parent: CurFn);
5698 AcqRelBB = createBasicBlock(name: "acqrel", parent: CurFn);
5699 SeqCstBB = createBasicBlock(name: "seqcst", parent: CurFn);
5700 llvm::BasicBlock *ContBB = createBasicBlock(name: "atomic.continue", parent: CurFn);
5701
5702 Order = Builder.CreateIntCast(V: Order, DestTy: Builder.getInt32Ty(), isSigned: false);
5703 llvm::SwitchInst *SI = Builder.CreateSwitch(V: Order, Dest: ContBB);
5704
5705 Builder.SetInsertPoint(AcquireBB);
5706 Builder.CreateFence(Ordering: llvm::AtomicOrdering::Acquire, SSID);
5707 Builder.CreateBr(Dest: ContBB);
5708 SI->addCase(OnVal: Builder.getInt32(C: 1), Dest: AcquireBB);
5709 SI->addCase(OnVal: Builder.getInt32(C: 2), Dest: AcquireBB);
5710
5711 Builder.SetInsertPoint(ReleaseBB);
5712 Builder.CreateFence(Ordering: llvm::AtomicOrdering::Release, SSID);
5713 Builder.CreateBr(Dest: ContBB);
5714 SI->addCase(OnVal: Builder.getInt32(C: 3), Dest: ReleaseBB);
5715
5716 Builder.SetInsertPoint(AcqRelBB);
5717 Builder.CreateFence(Ordering: llvm::AtomicOrdering::AcquireRelease, SSID);
5718 Builder.CreateBr(Dest: ContBB);
5719 SI->addCase(OnVal: Builder.getInt32(C: 4), Dest: AcqRelBB);
5720
5721 Builder.SetInsertPoint(SeqCstBB);
5722 Builder.CreateFence(Ordering: llvm::AtomicOrdering::SequentiallyConsistent, SSID);
5723 Builder.CreateBr(Dest: ContBB);
5724 SI->addCase(OnVal: Builder.getInt32(C: 5), Dest: SeqCstBB);
5725
5726 Builder.SetInsertPoint(ContBB);
5727 return RValue::get(V: nullptr);
5728 }
5729 case Builtin::BI__scoped_atomic_thread_fence: {
5730 auto ScopeModel = AtomicScopeModel::create(K: AtomicScopeModelKind::Generic);
5731
5732 Value *Order = EmitScalarExpr(E: E->getArg(Arg: 0));
5733 Value *Scope = EmitScalarExpr(E: E->getArg(Arg: 1));
5734 auto Ord = dyn_cast<llvm::ConstantInt>(Val: Order);
5735 auto Scp = dyn_cast<llvm::ConstantInt>(Val: Scope);
5736 if (Ord && Scp) {
5737 SyncScope SS = ScopeModel->isValid(S: Scp->getZExtValue())
5738 ? ScopeModel->map(S: Scp->getZExtValue())
5739 : ScopeModel->map(S: ScopeModel->getFallBackValue());
5740 switch (Ord->getZExtValue()) {
5741 case 0: // memory_order_relaxed
5742 default: // invalid order
5743 break;
5744 case 1: // memory_order_consume
5745 case 2: // memory_order_acquire
5746 Builder.CreateFence(
5747 Ordering: llvm::AtomicOrdering::Acquire,
5748 SSID: getTargetHooks().getLLVMSyncScopeID(LangOpts: getLangOpts(), Scope: SS,
5749 Ordering: llvm::AtomicOrdering::Acquire,
5750 Ctx&: getLLVMContext()));
5751 break;
5752 case 3: // memory_order_release
5753 Builder.CreateFence(
5754 Ordering: llvm::AtomicOrdering::Release,
5755 SSID: getTargetHooks().getLLVMSyncScopeID(LangOpts: getLangOpts(), Scope: SS,
5756 Ordering: llvm::AtomicOrdering::Release,
5757 Ctx&: getLLVMContext()));
5758 break;
5759 case 4: // memory_order_acq_rel
5760 Builder.CreateFence(Ordering: llvm::AtomicOrdering::AcquireRelease,
5761 SSID: getTargetHooks().getLLVMSyncScopeID(
5762 LangOpts: getLangOpts(), Scope: SS,
5763 Ordering: llvm::AtomicOrdering::AcquireRelease,
5764 Ctx&: getLLVMContext()));
5765 break;
5766 case 5: // memory_order_seq_cst
5767 Builder.CreateFence(Ordering: llvm::AtomicOrdering::SequentiallyConsistent,
5768 SSID: getTargetHooks().getLLVMSyncScopeID(
5769 LangOpts: getLangOpts(), Scope: SS,
5770 Ordering: llvm::AtomicOrdering::SequentiallyConsistent,
5771 Ctx&: getLLVMContext()));
5772 break;
5773 }
5774 return RValue::get(V: nullptr);
5775 }
5776
5777 llvm::BasicBlock *ContBB = createBasicBlock(name: "atomic.scope.continue", parent: CurFn);
5778
5779 llvm::SmallVector<std::pair<llvm::BasicBlock *, llvm::AtomicOrdering>>
5780 OrderBBs;
5781 if (Ord) {
5782 switch (Ord->getZExtValue()) {
5783 case 0: // memory_order_relaxed
5784 default: // invalid order
5785 ContBB->eraseFromParent();
5786 return RValue::get(V: nullptr);
5787 case 1: // memory_order_consume
5788 case 2: // memory_order_acquire
5789 OrderBBs.emplace_back(Args: Builder.GetInsertBlock(),
5790 Args: llvm::AtomicOrdering::Acquire);
5791 break;
5792 case 3: // memory_order_release
5793 OrderBBs.emplace_back(Args: Builder.GetInsertBlock(),
5794 Args: llvm::AtomicOrdering::Release);
5795 break;
5796 case 4: // memory_order_acq_rel
5797 OrderBBs.emplace_back(Args: Builder.GetInsertBlock(),
5798 Args: llvm::AtomicOrdering::AcquireRelease);
5799 break;
5800 case 5: // memory_order_seq_cst
5801 OrderBBs.emplace_back(Args: Builder.GetInsertBlock(),
5802 Args: llvm::AtomicOrdering::SequentiallyConsistent);
5803 break;
5804 }
5805 } else {
5806 llvm::BasicBlock *AcquireBB = createBasicBlock(name: "acquire", parent: CurFn);
5807 llvm::BasicBlock *ReleaseBB = createBasicBlock(name: "release", parent: CurFn);
5808 llvm::BasicBlock *AcqRelBB = createBasicBlock(name: "acqrel", parent: CurFn);
5809 llvm::BasicBlock *SeqCstBB = createBasicBlock(name: "seqcst", parent: CurFn);
5810
5811 Order = Builder.CreateIntCast(V: Order, DestTy: Builder.getInt32Ty(), isSigned: false);
5812 llvm::SwitchInst *SI = Builder.CreateSwitch(V: Order, Dest: ContBB);
5813 SI->addCase(OnVal: Builder.getInt32(C: 1), Dest: AcquireBB);
5814 SI->addCase(OnVal: Builder.getInt32(C: 2), Dest: AcquireBB);
5815 SI->addCase(OnVal: Builder.getInt32(C: 3), Dest: ReleaseBB);
5816 SI->addCase(OnVal: Builder.getInt32(C: 4), Dest: AcqRelBB);
5817 SI->addCase(OnVal: Builder.getInt32(C: 5), Dest: SeqCstBB);
5818
5819 OrderBBs.emplace_back(Args&: AcquireBB, Args: llvm::AtomicOrdering::Acquire);
5820 OrderBBs.emplace_back(Args&: ReleaseBB, Args: llvm::AtomicOrdering::Release);
5821 OrderBBs.emplace_back(Args&: AcqRelBB, Args: llvm::AtomicOrdering::AcquireRelease);
5822 OrderBBs.emplace_back(Args&: SeqCstBB,
5823 Args: llvm::AtomicOrdering::SequentiallyConsistent);
5824 }
5825
5826 for (auto &[OrderBB, Ordering] : OrderBBs) {
5827 Builder.SetInsertPoint(OrderBB);
5828 if (Scp) {
5829 SyncScope SS = ScopeModel->isValid(S: Scp->getZExtValue())
5830 ? ScopeModel->map(S: Scp->getZExtValue())
5831 : ScopeModel->map(S: ScopeModel->getFallBackValue());
5832 Builder.CreateFence(Ordering,
5833 SSID: getTargetHooks().getLLVMSyncScopeID(
5834 LangOpts: getLangOpts(), Scope: SS, Ordering, Ctx&: getLLVMContext()));
5835 Builder.CreateBr(Dest: ContBB);
5836 } else {
5837 llvm::DenseMap<unsigned, llvm::BasicBlock *> BBs;
5838 for (unsigned Scp : ScopeModel->getRuntimeValues())
5839 BBs[Scp] = createBasicBlock(name: getAsString(S: ScopeModel->map(S: Scp)), parent: CurFn);
5840
5841 auto *SC = Builder.CreateIntCast(V: Scope, DestTy: Builder.getInt32Ty(), isSigned: false);
5842 llvm::SwitchInst *SI = Builder.CreateSwitch(V: SC, Dest: ContBB);
5843 for (unsigned Scp : ScopeModel->getRuntimeValues()) {
5844 auto *B = BBs[Scp];
5845 SI->addCase(OnVal: Builder.getInt32(C: Scp), Dest: B);
5846
5847 Builder.SetInsertPoint(B);
5848 Builder.CreateFence(Ordering, SSID: getTargetHooks().getLLVMSyncScopeID(
5849 LangOpts: getLangOpts(), Scope: ScopeModel->map(S: Scp),
5850 Ordering, Ctx&: getLLVMContext()));
5851 Builder.CreateBr(Dest: ContBB);
5852 }
5853 }
5854 }
5855
5856 Builder.SetInsertPoint(ContBB);
5857 return RValue::get(V: nullptr);
5858 }
5859
5860 case Builtin::BI__builtin_signbit:
5861 case Builtin::BI__builtin_signbitf:
5862 case Builtin::BI__builtin_signbitl: {
5863 return RValue::get(
5864 V: Builder.CreateZExt(V: EmitSignBit(CGF&: *this, V: EmitScalarExpr(E: E->getArg(Arg: 0))),
5865 DestTy: ConvertType(T: E->getType())));
5866 }
5867 case Builtin::BI__warn_memset_zero_len:
5868 return RValue::getIgnored();
5869 case Builtin::BI__annotation: {
5870 // Re-encode each wide string to UTF8 and make an MDString.
5871 SmallVector<Metadata *, 1> Strings;
5872 for (const Expr *Arg : E->arguments()) {
5873 const auto *Str = cast<StringLiteral>(Val: Arg->IgnoreParenCasts());
5874 assert(Str->getCharByteWidth() == 2 || Str->getCharByteWidth() == 4);
5875 StringRef WideBytes = Str->getBytes();
5876 std::string StrUtf8;
5877 bool Converted =
5878 (Str->getCharByteWidth() == 2)
5879 ? convertUTF16ToUTF8String(
5880 SrcBytes: ArrayRef(WideBytes.data(), WideBytes.size()), Out&: StrUtf8)
5881 : convertUTF32ToUTF8String(
5882 SrcBytes: ArrayRef(WideBytes.data(), WideBytes.size()), Out&: StrUtf8);
5883 if (!Converted) {
5884 CGM.ErrorUnsupported(S: E, Type: "non-Unicode __annotation argument");
5885 continue;
5886 }
5887 Strings.push_back(Elt: llvm::MDString::get(Context&: getLLVMContext(), Str: StrUtf8));
5888 }
5889
5890 // Build and MDTuple of MDStrings and emit the intrinsic call.
5891 llvm::Function *F = CGM.getIntrinsic(IID: Intrinsic::codeview_annotation, Tys: {});
5892 MDTuple *StrTuple = MDTuple::get(Context&: getLLVMContext(), MDs: Strings);
5893 Builder.CreateCall(Callee: F, Args: MetadataAsValue::get(Context&: getLLVMContext(), MD: StrTuple));
5894 return RValue::getIgnored();
5895 }
5896 case Builtin::BI__builtin_annotation: {
5897 llvm::Value *AnnVal = EmitScalarExpr(E: E->getArg(Arg: 0));
5898 llvm::Function *F = CGM.getIntrinsic(
5899 IID: Intrinsic::annotation, Tys: {AnnVal->getType(), CGM.ConstGlobalsPtrTy});
5900
5901 // Get the annotation string, go through casts. Sema requires this to be a
5902 // non-wide string literal, potentially casted, so the cast<> is safe.
5903 const Expr *AnnotationStrExpr = E->getArg(Arg: 1)->IgnoreParenCasts();
5904 StringRef Str = cast<StringLiteral>(Val: AnnotationStrExpr)->getString();
5905 return RValue::get(
5906 V: EmitAnnotationCall(AnnotationFn: F, AnnotatedVal: AnnVal, AnnotationStr: Str, Location: E->getExprLoc(), Attr: nullptr));
5907 }
5908 case Builtin::BI__builtin_addcb:
5909 case Builtin::BI__builtin_addcs:
5910 case Builtin::BI__builtin_addc:
5911 case Builtin::BI__builtin_addcl:
5912 case Builtin::BI__builtin_addcll:
5913 case Builtin::BI__builtin_subcb:
5914 case Builtin::BI__builtin_subcs:
5915 case Builtin::BI__builtin_subc:
5916 case Builtin::BI__builtin_subcl:
5917 case Builtin::BI__builtin_subcll: {
5918
5919 // We translate all of these builtins from expressions of the form:
5920 // int x = ..., y = ..., carryin = ..., carryout, result;
5921 // result = __builtin_addc(x, y, carryin, &carryout);
5922 //
5923 // to LLVM IR of the form:
5924 //
5925 // %tmp1 = call {i32, i1} @llvm.uadd.with.overflow.i32(i32 %x, i32 %y)
5926 // %tmpsum1 = extractvalue {i32, i1} %tmp1, 0
5927 // %carry1 = extractvalue {i32, i1} %tmp1, 1
5928 // %tmp2 = call {i32, i1} @llvm.uadd.with.overflow.i32(i32 %tmpsum1,
5929 // i32 %carryin)
5930 // %result = extractvalue {i32, i1} %tmp2, 0
5931 // %carry2 = extractvalue {i32, i1} %tmp2, 1
5932 // %tmp3 = or i1 %carry1, %carry2
5933 // %tmp4 = zext i1 %tmp3 to i32
5934 // store i32 %tmp4, i32* %carryout
5935
5936 // Scalarize our inputs.
5937 llvm::Value *X = EmitScalarExpr(E: E->getArg(Arg: 0));
5938 llvm::Value *Y = EmitScalarExpr(E: E->getArg(Arg: 1));
5939 llvm::Value *Carryin = EmitScalarExpr(E: E->getArg(Arg: 2));
5940 Address CarryOutPtr = EmitPointerWithAlignment(Addr: E->getArg(Arg: 3));
5941
5942 // Decide if we are lowering to a uadd.with.overflow or usub.with.overflow.
5943 Intrinsic::ID IntrinsicId;
5944 switch (BuiltinID) {
5945 default: llvm_unreachable("Unknown multiprecision builtin id.");
5946 case Builtin::BI__builtin_addcb:
5947 case Builtin::BI__builtin_addcs:
5948 case Builtin::BI__builtin_addc:
5949 case Builtin::BI__builtin_addcl:
5950 case Builtin::BI__builtin_addcll:
5951 IntrinsicId = Intrinsic::uadd_with_overflow;
5952 break;
5953 case Builtin::BI__builtin_subcb:
5954 case Builtin::BI__builtin_subcs:
5955 case Builtin::BI__builtin_subc:
5956 case Builtin::BI__builtin_subcl:
5957 case Builtin::BI__builtin_subcll:
5958 IntrinsicId = Intrinsic::usub_with_overflow;
5959 break;
5960 }
5961
5962 // Construct our resulting LLVM IR expression.
5963 llvm::Value *Carry1;
5964 llvm::Value *Sum1 = EmitOverflowIntrinsic(CGF&: *this, IntrinsicID: IntrinsicId,
5965 X, Y, Carry&: Carry1);
5966 llvm::Value *Carry2;
5967 llvm::Value *Sum2 = EmitOverflowIntrinsic(CGF&: *this, IntrinsicID: IntrinsicId,
5968 X: Sum1, Y: Carryin, Carry&: Carry2);
5969 llvm::Value *CarryOut = Builder.CreateZExt(V: Builder.CreateOr(LHS: Carry1, RHS: Carry2),
5970 DestTy: X->getType());
5971 Builder.CreateStore(Val: CarryOut, Addr: CarryOutPtr);
5972 return RValue::get(V: Sum2);
5973 }
5974
5975 case Builtin::BI__builtin_add_overflow:
5976 case Builtin::BI__builtin_sub_overflow:
5977 case Builtin::BI__builtin_mul_overflow: {
5978 const clang::Expr *LeftArg = E->getArg(Arg: 0);
5979 const clang::Expr *RightArg = E->getArg(Arg: 1);
5980 const clang::Expr *ResultArg = E->getArg(Arg: 2);
5981
5982 clang::QualType ResultQTy =
5983 ResultArg->getType()->castAs<PointerType>()->getPointeeType();
5984
5985 WidthAndSignedness LeftInfo =
5986 getIntegerWidthAndSignedness(context: CGM.getContext(), Type: LeftArg->getType());
5987 WidthAndSignedness RightInfo =
5988 getIntegerWidthAndSignedness(context: CGM.getContext(), Type: RightArg->getType());
5989 WidthAndSignedness ResultInfo =
5990 getIntegerWidthAndSignedness(context: CGM.getContext(), Type: ResultQTy);
5991
5992 // Handle mixed-sign multiplication as a special case, because adding
5993 // runtime or backend support for our generic irgen would be too expensive.
5994 if (isSpecialMixedSignMultiply(BuiltinID, Op1Info: LeftInfo, Op2Info: RightInfo, ResultInfo))
5995 return EmitCheckedMixedSignMultiply(CGF&: *this, Op1: LeftArg, Op1Info: LeftInfo, Op2: RightArg,
5996 Op2Info: RightInfo, ResultArg, ResultQTy,
5997 ResultInfo);
5998
5999 if (isSpecialUnsignedMultiplySignedResult(BuiltinID, Op1Info: LeftInfo, Op2Info: RightInfo,
6000 ResultInfo))
6001 return EmitCheckedUnsignedMultiplySignedResult(
6002 CGF&: *this, Op1: LeftArg, Op1Info: LeftInfo, Op2: RightArg, Op2Info: RightInfo, ResultArg, ResultQTy,
6003 ResultInfo);
6004
6005 WidthAndSignedness EncompassingInfo =
6006 EncompassingIntegerType(Types: {LeftInfo, RightInfo, ResultInfo});
6007
6008 llvm::Type *EncompassingLLVMTy =
6009 llvm::IntegerType::get(C&: CGM.getLLVMContext(), NumBits: EncompassingInfo.Width);
6010
6011 llvm::Type *ResultLLVMTy = CGM.getTypes().ConvertType(T: ResultQTy);
6012
6013 Intrinsic::ID IntrinsicId;
6014 switch (BuiltinID) {
6015 default:
6016 llvm_unreachable("Unknown overflow builtin id.");
6017 case Builtin::BI__builtin_add_overflow:
6018 IntrinsicId = EncompassingInfo.Signed ? Intrinsic::sadd_with_overflow
6019 : Intrinsic::uadd_with_overflow;
6020 break;
6021 case Builtin::BI__builtin_sub_overflow:
6022 IntrinsicId = EncompassingInfo.Signed ? Intrinsic::ssub_with_overflow
6023 : Intrinsic::usub_with_overflow;
6024 break;
6025 case Builtin::BI__builtin_mul_overflow:
6026 IntrinsicId = EncompassingInfo.Signed ? Intrinsic::smul_with_overflow
6027 : Intrinsic::umul_with_overflow;
6028 break;
6029 }
6030
6031 llvm::Value *Left = EmitScalarExpr(E: LeftArg);
6032 llvm::Value *Right = EmitScalarExpr(E: RightArg);
6033 Address ResultPtr = EmitPointerWithAlignment(Addr: ResultArg);
6034
6035 // Extend each operand to the encompassing type.
6036 Left = Builder.CreateIntCast(V: Left, DestTy: EncompassingLLVMTy, isSigned: LeftInfo.Signed);
6037 Right = Builder.CreateIntCast(V: Right, DestTy: EncompassingLLVMTy, isSigned: RightInfo.Signed);
6038
6039 // Perform the operation on the extended values.
6040 llvm::Value *Overflow, *Result;
6041 Result = EmitOverflowIntrinsic(CGF&: *this, IntrinsicID: IntrinsicId, X: Left, Y: Right, Carry&: Overflow);
6042
6043 if (EncompassingInfo.Width > ResultInfo.Width) {
6044 // The encompassing type is wider than the result type, so we need to
6045 // truncate it.
6046 llvm::Value *ResultTrunc = Builder.CreateTrunc(V: Result, DestTy: ResultLLVMTy);
6047
6048 // To see if the truncation caused an overflow, we will extend
6049 // the result and then compare it to the original result.
6050 llvm::Value *ResultTruncExt = Builder.CreateIntCast(
6051 V: ResultTrunc, DestTy: EncompassingLLVMTy, isSigned: ResultInfo.Signed);
6052 llvm::Value *TruncationOverflow =
6053 Builder.CreateICmpNE(LHS: Result, RHS: ResultTruncExt);
6054
6055 Overflow = Builder.CreateOr(LHS: Overflow, RHS: TruncationOverflow);
6056 Result = ResultTrunc;
6057 }
6058
6059 // Finally, store the result using the pointer.
6060 bool isVolatile =
6061 ResultArg->getType()->getPointeeType().isVolatileQualified();
6062 Builder.CreateStore(Val: EmitToMemory(Value: Result, Ty: ResultQTy), Addr: ResultPtr, IsVolatile: isVolatile);
6063
6064 return RValue::get(V: Overflow);
6065 }
6066
6067 case Builtin::BI__builtin_uadd_overflow:
6068 case Builtin::BI__builtin_uaddl_overflow:
6069 case Builtin::BI__builtin_uaddll_overflow:
6070 case Builtin::BI__builtin_usub_overflow:
6071 case Builtin::BI__builtin_usubl_overflow:
6072 case Builtin::BI__builtin_usubll_overflow:
6073 case Builtin::BI__builtin_umul_overflow:
6074 case Builtin::BI__builtin_umull_overflow:
6075 case Builtin::BI__builtin_umulll_overflow:
6076 case Builtin::BI__builtin_sadd_overflow:
6077 case Builtin::BI__builtin_saddl_overflow:
6078 case Builtin::BI__builtin_saddll_overflow:
6079 case Builtin::BI__builtin_ssub_overflow:
6080 case Builtin::BI__builtin_ssubl_overflow:
6081 case Builtin::BI__builtin_ssubll_overflow:
6082 case Builtin::BI__builtin_smul_overflow:
6083 case Builtin::BI__builtin_smull_overflow:
6084 case Builtin::BI__builtin_smulll_overflow: {
6085
6086 // We translate all of these builtins directly to the relevant llvm IR node.
6087
6088 // Scalarize our inputs.
6089 llvm::Value *X = EmitScalarExpr(E: E->getArg(Arg: 0));
6090 llvm::Value *Y = EmitScalarExpr(E: E->getArg(Arg: 1));
6091 Address SumOutPtr = EmitPointerWithAlignment(Addr: E->getArg(Arg: 2));
6092
6093 // Decide which of the overflow intrinsics we are lowering to:
6094 Intrinsic::ID IntrinsicId;
6095 switch (BuiltinID) {
6096 default: llvm_unreachable("Unknown overflow builtin id.");
6097 case Builtin::BI__builtin_uadd_overflow:
6098 case Builtin::BI__builtin_uaddl_overflow:
6099 case Builtin::BI__builtin_uaddll_overflow:
6100 IntrinsicId = Intrinsic::uadd_with_overflow;
6101 break;
6102 case Builtin::BI__builtin_usub_overflow:
6103 case Builtin::BI__builtin_usubl_overflow:
6104 case Builtin::BI__builtin_usubll_overflow:
6105 IntrinsicId = Intrinsic::usub_with_overflow;
6106 break;
6107 case Builtin::BI__builtin_umul_overflow:
6108 case Builtin::BI__builtin_umull_overflow:
6109 case Builtin::BI__builtin_umulll_overflow:
6110 IntrinsicId = Intrinsic::umul_with_overflow;
6111 break;
6112 case Builtin::BI__builtin_sadd_overflow:
6113 case Builtin::BI__builtin_saddl_overflow:
6114 case Builtin::BI__builtin_saddll_overflow:
6115 IntrinsicId = Intrinsic::sadd_with_overflow;
6116 break;
6117 case Builtin::BI__builtin_ssub_overflow:
6118 case Builtin::BI__builtin_ssubl_overflow:
6119 case Builtin::BI__builtin_ssubll_overflow:
6120 IntrinsicId = Intrinsic::ssub_with_overflow;
6121 break;
6122 case Builtin::BI__builtin_smul_overflow:
6123 case Builtin::BI__builtin_smull_overflow:
6124 case Builtin::BI__builtin_smulll_overflow:
6125 IntrinsicId = Intrinsic::smul_with_overflow;
6126 break;
6127 }
6128
6129
6130 llvm::Value *Carry;
6131 llvm::Value *Sum = EmitOverflowIntrinsic(CGF&: *this, IntrinsicID: IntrinsicId, X, Y, Carry);
6132 Builder.CreateStore(Val: Sum, Addr: SumOutPtr);
6133
6134 return RValue::get(V: Carry);
6135 }
6136 case Builtin::BIaddressof:
6137 case Builtin::BI__addressof:
6138 case Builtin::BI__builtin_addressof:
6139 return RValue::get(V: EmitLValue(E: E->getArg(Arg: 0)).getPointer(CGF&: *this));
6140 case Builtin::BI__builtin_function_start:
6141 return RValue::get(V: CGM.GetFunctionStart(
6142 Decl: E->getArg(Arg: 0)->getAsBuiltinConstantDeclRef(Context: CGM.getContext())));
6143 case Builtin::BI__builtin_operator_new:
6144 return EmitBuiltinNewDeleteCall(
6145 Type: E->getCallee()->getType()->castAs<FunctionProtoType>(), TheCallExpr: E, IsDelete: false);
6146 case Builtin::BI__builtin_operator_delete:
6147 EmitBuiltinNewDeleteCall(
6148 Type: E->getCallee()->getType()->castAs<FunctionProtoType>(), TheCallExpr: E, IsDelete: true);
6149 return RValue::get(V: nullptr);
6150
6151 case Builtin::BI__builtin_is_aligned:
6152 return EmitBuiltinIsAligned(E);
6153 case Builtin::BI__builtin_align_up:
6154 return EmitBuiltinAlignTo(E, AlignUp: true);
6155 case Builtin::BI__builtin_align_down:
6156 return EmitBuiltinAlignTo(E, AlignUp: false);
6157
6158 case Builtin::BI__noop:
6159 // __noop always evaluates to an integer literal zero.
6160 return RValue::get(V: ConstantInt::get(Ty: IntTy, V: 0));
6161 case Builtin::BI__builtin_call_with_static_chain: {
6162 const CallExpr *Call = cast<CallExpr>(Val: E->getArg(Arg: 0));
6163 const Expr *Chain = E->getArg(Arg: 1);
6164 return EmitCall(FnType: Call->getCallee()->getType(),
6165 Callee: EmitCallee(E: Call->getCallee()), E: Call, ReturnValue,
6166 Chain: EmitScalarExpr(E: Chain));
6167 }
6168 case Builtin::BI_InterlockedExchange8:
6169 case Builtin::BI_InterlockedExchange16:
6170 case Builtin::BI_InterlockedExchange:
6171 case Builtin::BI_InterlockedExchangePointer:
6172 return RValue::get(
6173 V: EmitMSVCBuiltinExpr(BuiltinID: MSVCIntrin::_InterlockedExchange, E));
6174 case Builtin::BI_InterlockedCompareExchangePointer:
6175 return RValue::get(
6176 V: EmitMSVCBuiltinExpr(BuiltinID: MSVCIntrin::_InterlockedCompareExchange, E));
6177 case Builtin::BI_InterlockedCompareExchangePointer_nf:
6178 return RValue::get(
6179 V: EmitMSVCBuiltinExpr(BuiltinID: MSVCIntrin::_InterlockedCompareExchange_nf, E));
6180 case Builtin::BI_InterlockedCompareExchange8:
6181 case Builtin::BI_InterlockedCompareExchange16:
6182 case Builtin::BI_InterlockedCompareExchange:
6183 case Builtin::BI_InterlockedCompareExchange64:
6184 return RValue::get(V: EmitAtomicCmpXchgForMSIntrin(CGF&: *this, E));
6185 case Builtin::BI_InterlockedIncrement16:
6186 case Builtin::BI_InterlockedIncrement:
6187 return RValue::get(
6188 V: EmitMSVCBuiltinExpr(BuiltinID: MSVCIntrin::_InterlockedIncrement, E));
6189 case Builtin::BI_InterlockedDecrement16:
6190 case Builtin::BI_InterlockedDecrement:
6191 return RValue::get(
6192 V: EmitMSVCBuiltinExpr(BuiltinID: MSVCIntrin::_InterlockedDecrement, E));
6193 case Builtin::BI_InterlockedAnd8:
6194 case Builtin::BI_InterlockedAnd16:
6195 case Builtin::BI_InterlockedAnd:
6196 return RValue::get(V: EmitMSVCBuiltinExpr(BuiltinID: MSVCIntrin::_InterlockedAnd, E));
6197 case Builtin::BI_InterlockedExchangeAdd8:
6198 case Builtin::BI_InterlockedExchangeAdd16:
6199 case Builtin::BI_InterlockedExchangeAdd:
6200 return RValue::get(
6201 V: EmitMSVCBuiltinExpr(BuiltinID: MSVCIntrin::_InterlockedExchangeAdd, E));
6202 case Builtin::BI_InterlockedExchangeSub8:
6203 case Builtin::BI_InterlockedExchangeSub16:
6204 case Builtin::BI_InterlockedExchangeSub:
6205 return RValue::get(
6206 V: EmitMSVCBuiltinExpr(BuiltinID: MSVCIntrin::_InterlockedExchangeSub, E));
6207 case Builtin::BI_InterlockedOr8:
6208 case Builtin::BI_InterlockedOr16:
6209 case Builtin::BI_InterlockedOr:
6210 return RValue::get(V: EmitMSVCBuiltinExpr(BuiltinID: MSVCIntrin::_InterlockedOr, E));
6211 case Builtin::BI_InterlockedXor8:
6212 case Builtin::BI_InterlockedXor16:
6213 case Builtin::BI_InterlockedXor:
6214 return RValue::get(V: EmitMSVCBuiltinExpr(BuiltinID: MSVCIntrin::_InterlockedXor, E));
6215
6216 case Builtin::BI_bittest64:
6217 case Builtin::BI_bittest:
6218 case Builtin::BI_bittestandcomplement64:
6219 case Builtin::BI_bittestandcomplement:
6220 case Builtin::BI_bittestandreset64:
6221 case Builtin::BI_bittestandreset:
6222 case Builtin::BI_bittestandset64:
6223 case Builtin::BI_bittestandset:
6224 case Builtin::BI_interlockedbittestandreset:
6225 case Builtin::BI_interlockedbittestandreset64:
6226 case Builtin::BI_interlockedbittestandreset64_acq:
6227 case Builtin::BI_interlockedbittestandreset64_rel:
6228 case Builtin::BI_interlockedbittestandreset64_nf:
6229 case Builtin::BI_interlockedbittestandset64:
6230 case Builtin::BI_interlockedbittestandset64_acq:
6231 case Builtin::BI_interlockedbittestandset64_rel:
6232 case Builtin::BI_interlockedbittestandset64_nf:
6233 case Builtin::BI_interlockedbittestandset:
6234 case Builtin::BI_interlockedbittestandset_acq:
6235 case Builtin::BI_interlockedbittestandset_rel:
6236 case Builtin::BI_interlockedbittestandset_nf:
6237 case Builtin::BI_interlockedbittestandreset_acq:
6238 case Builtin::BI_interlockedbittestandreset_rel:
6239 case Builtin::BI_interlockedbittestandreset_nf:
6240 return RValue::get(V: EmitBitTestIntrinsic(CGF&: *this, BuiltinID, E));
6241
6242 // These builtins exist to emit regular volatile loads and stores not
6243 // affected by the -fms-volatile setting.
6244 case Builtin::BI__iso_volatile_load8:
6245 case Builtin::BI__iso_volatile_load16:
6246 case Builtin::BI__iso_volatile_load32:
6247 case Builtin::BI__iso_volatile_load64:
6248 return RValue::get(V: EmitISOVolatileLoad(CGF&: *this, E));
6249 case Builtin::BI__iso_volatile_store8:
6250 case Builtin::BI__iso_volatile_store16:
6251 case Builtin::BI__iso_volatile_store32:
6252 case Builtin::BI__iso_volatile_store64:
6253 return RValue::get(V: EmitISOVolatileStore(CGF&: *this, E));
6254
6255 case Builtin::BI__builtin_ptrauth_sign_constant:
6256 return RValue::get(V: ConstantEmitter(*this).emitAbstract(E, T: E->getType()));
6257
6258 case Builtin::BI__builtin_ptrauth_auth:
6259 case Builtin::BI__builtin_ptrauth_auth_and_resign:
6260 case Builtin::BI__builtin_ptrauth_auth_load_relative_and_sign:
6261 case Builtin::BI__builtin_ptrauth_blend_discriminator:
6262 case Builtin::BI__builtin_ptrauth_sign_generic_data:
6263 case Builtin::BI__builtin_ptrauth_sign_unauthenticated:
6264 case Builtin::BI__builtin_ptrauth_strip: {
6265 // Emit the arguments.
6266 SmallVector<llvm::Value *, 6> Args;
6267 for (auto argExpr : E->arguments())
6268 Args.push_back(Elt: EmitScalarExpr(E: argExpr));
6269
6270 // Cast the value to intptr_t, saving its original type.
6271 llvm::Type *OrigValueType = Args[0]->getType();
6272 if (OrigValueType->isPointerTy())
6273 Args[0] = Builder.CreatePtrToInt(V: Args[0], DestTy: IntPtrTy);
6274
6275 switch (BuiltinID) {
6276 case Builtin::BI__builtin_ptrauth_auth_and_resign:
6277 case Builtin::BI__builtin_ptrauth_auth_load_relative_and_sign:
6278 if (Args[4]->getType()->isPointerTy())
6279 Args[4] = Builder.CreatePtrToInt(V: Args[4], DestTy: IntPtrTy);
6280 [[fallthrough]];
6281
6282 case Builtin::BI__builtin_ptrauth_auth:
6283 case Builtin::BI__builtin_ptrauth_sign_unauthenticated:
6284 if (Args[2]->getType()->isPointerTy())
6285 Args[2] = Builder.CreatePtrToInt(V: Args[2], DestTy: IntPtrTy);
6286 break;
6287
6288 case Builtin::BI__builtin_ptrauth_sign_generic_data:
6289 if (Args[1]->getType()->isPointerTy())
6290 Args[1] = Builder.CreatePtrToInt(V: Args[1], DestTy: IntPtrTy);
6291 break;
6292
6293 case Builtin::BI__builtin_ptrauth_blend_discriminator:
6294 case Builtin::BI__builtin_ptrauth_strip:
6295 break;
6296 }
6297
6298 // Call the intrinsic.
6299 auto IntrinsicID = [&]() -> unsigned {
6300 switch (BuiltinID) {
6301 case Builtin::BI__builtin_ptrauth_auth:
6302 return Intrinsic::ptrauth_auth;
6303 case Builtin::BI__builtin_ptrauth_auth_and_resign:
6304 return Intrinsic::ptrauth_resign;
6305 case Builtin::BI__builtin_ptrauth_auth_load_relative_and_sign:
6306 return Intrinsic::ptrauth_resign_load_relative;
6307 case Builtin::BI__builtin_ptrauth_blend_discriminator:
6308 return Intrinsic::ptrauth_blend;
6309 case Builtin::BI__builtin_ptrauth_sign_generic_data:
6310 return Intrinsic::ptrauth_sign_generic;
6311 case Builtin::BI__builtin_ptrauth_sign_unauthenticated:
6312 return Intrinsic::ptrauth_sign;
6313 case Builtin::BI__builtin_ptrauth_strip:
6314 return Intrinsic::ptrauth_strip;
6315 }
6316 llvm_unreachable("bad ptrauth intrinsic");
6317 }();
6318 auto Intrinsic = CGM.getIntrinsic(IID: IntrinsicID);
6319 llvm::Value *Result = EmitRuntimeCall(callee: Intrinsic, args: Args);
6320
6321 if (BuiltinID != Builtin::BI__builtin_ptrauth_sign_generic_data &&
6322 BuiltinID != Builtin::BI__builtin_ptrauth_blend_discriminator &&
6323 OrigValueType->isPointerTy()) {
6324 Result = Builder.CreateIntToPtr(V: Result, DestTy: OrigValueType);
6325 }
6326 return RValue::get(V: Result);
6327 }
6328
6329 case Builtin::BI__builtin_get_vtable_pointer: {
6330 const Expr *Target = E->getArg(Arg: 0);
6331 QualType TargetType = Target->getType();
6332 const CXXRecordDecl *Decl = TargetType->getPointeeCXXRecordDecl();
6333 assert(Decl);
6334 auto ThisAddress = EmitPointerWithAlignment(Addr: Target);
6335 assert(ThisAddress.isValid());
6336 llvm::Value *VTablePointer =
6337 GetVTablePtr(This: ThisAddress, VTableTy: Int8PtrTy, VTableClass: Decl, AuthMode: VTableAuthMode::MustTrap);
6338 return RValue::get(V: VTablePointer);
6339 }
6340
6341 case Builtin::BI__exception_code:
6342 case Builtin::BI_exception_code:
6343 return RValue::get(V: EmitSEHExceptionCode());
6344 case Builtin::BI__exception_info:
6345 case Builtin::BI_exception_info:
6346 return RValue::get(V: EmitSEHExceptionInfo());
6347 case Builtin::BI__abnormal_termination:
6348 case Builtin::BI_abnormal_termination:
6349 return RValue::get(V: EmitSEHAbnormalTermination());
6350 case Builtin::BI_setjmpex:
6351 if (getTarget().getTriple().isOSMSVCRT() && E->getNumArgs() == 1 &&
6352 E->getArg(Arg: 0)->getType()->isPointerType())
6353 return EmitMSVCRTSetJmp(CGF&: *this, SJKind: MSVCSetJmpKind::_setjmpex, E);
6354 break;
6355 case Builtin::BI_setjmp:
6356 if (getTarget().getTriple().isOSMSVCRT() && E->getNumArgs() == 1 &&
6357 E->getArg(Arg: 0)->getType()->isPointerType()) {
6358 if (getTarget().getTriple().getArch() == llvm::Triple::x86)
6359 return EmitMSVCRTSetJmp(CGF&: *this, SJKind: MSVCSetJmpKind::_setjmp3, E);
6360 else if (getTarget().getTriple().getArch() == llvm::Triple::aarch64)
6361 return EmitMSVCRTSetJmp(CGF&: *this, SJKind: MSVCSetJmpKind::_setjmpex, E);
6362 return EmitMSVCRTSetJmp(CGF&: *this, SJKind: MSVCSetJmpKind::_setjmp, E);
6363 }
6364 break;
6365
6366 // C++ std:: builtins.
6367 case Builtin::BImove:
6368 case Builtin::BImove_if_noexcept:
6369 case Builtin::BIforward:
6370 case Builtin::BIforward_like:
6371 case Builtin::BIas_const:
6372 return RValue::get(V: EmitLValue(E: E->getArg(Arg: 0)).getPointer(CGF&: *this));
6373 case Builtin::BI__GetExceptionInfo: {
6374 if (llvm::GlobalVariable *GV =
6375 CGM.getCXXABI().getThrowInfo(T: FD->getParamDecl(i: 0)->getType()))
6376 return RValue::get(V: GV);
6377 break;
6378 }
6379
6380 case Builtin::BI__fastfail:
6381 return RValue::get(V: EmitMSVCBuiltinExpr(BuiltinID: MSVCIntrin::__fastfail, E));
6382
6383 case Builtin::BI__builtin_coro_id:
6384 return EmitCoroutineIntrinsic(E, IID: Intrinsic::coro_id);
6385 case Builtin::BI__builtin_coro_promise:
6386 return EmitCoroutineIntrinsic(E, IID: Intrinsic::coro_promise);
6387 case Builtin::BI__builtin_coro_resume:
6388 EmitCoroutineIntrinsic(E, IID: Intrinsic::coro_resume);
6389 return RValue::get(V: nullptr);
6390 case Builtin::BI__builtin_coro_frame:
6391 return EmitCoroutineIntrinsic(E, IID: Intrinsic::coro_frame);
6392 case Builtin::BI__builtin_coro_noop:
6393 return EmitCoroutineIntrinsic(E, IID: Intrinsic::coro_noop);
6394 case Builtin::BI__builtin_coro_free:
6395 return EmitCoroutineIntrinsic(E, IID: Intrinsic::coro_free);
6396 case Builtin::BI__builtin_coro_destroy:
6397 EmitCoroutineIntrinsic(E, IID: Intrinsic::coro_destroy);
6398 return RValue::get(V: nullptr);
6399 case Builtin::BI__builtin_coro_done:
6400 return EmitCoroutineIntrinsic(E, IID: Intrinsic::coro_done);
6401 case Builtin::BI__builtin_coro_alloc:
6402 return EmitCoroutineIntrinsic(E, IID: Intrinsic::coro_alloc);
6403 case Builtin::BI__builtin_coro_begin:
6404 return EmitCoroutineIntrinsic(E, IID: Intrinsic::coro_begin);
6405 case Builtin::BI__builtin_coro_end:
6406 return EmitCoroutineIntrinsic(E, IID: Intrinsic::coro_end);
6407 case Builtin::BI__builtin_coro_suspend:
6408 return EmitCoroutineIntrinsic(E, IID: Intrinsic::coro_suspend);
6409 case Builtin::BI__builtin_coro_size:
6410 return EmitCoroutineIntrinsic(E, IID: Intrinsic::coro_size);
6411 case Builtin::BI__builtin_coro_align:
6412 return EmitCoroutineIntrinsic(E, IID: Intrinsic::coro_align);
6413
6414 // OpenCL v2.0 s6.13.16.2, Built-in pipe read and write functions
6415 case Builtin::BIread_pipe:
6416 case Builtin::BIwrite_pipe: {
6417 Value *Arg0 = EmitScalarExpr(E: E->getArg(Arg: 0)),
6418 *Arg1 = EmitScalarExpr(E: E->getArg(Arg: 1));
6419 CGOpenCLRuntime OpenCLRT(CGM);
6420 Value *PacketSize = OpenCLRT.getPipeElemSize(PipeArg: E->getArg(Arg: 0));
6421 Value *PacketAlign = OpenCLRT.getPipeElemAlign(PipeArg: E->getArg(Arg: 0));
6422
6423 // Type of the generic packet parameter.
6424 unsigned GenericAS =
6425 getContext().getTargetAddressSpace(AS: LangAS::opencl_generic);
6426 llvm::Type *I8PTy = llvm::PointerType::get(C&: getLLVMContext(), AddressSpace: GenericAS);
6427
6428 // Testing which overloaded version we should generate the call for.
6429 if (2U == E->getNumArgs()) {
6430 const char *Name = (BuiltinID == Builtin::BIread_pipe) ? "__read_pipe_2"
6431 : "__write_pipe_2";
6432 // Creating a generic function type to be able to call with any builtin or
6433 // user defined type.
6434 llvm::Type *ArgTys[] = {Arg0->getType(), I8PTy, Int32Ty, Int32Ty};
6435 llvm::FunctionType *FTy = llvm::FunctionType::get(Result: Int32Ty, Params: ArgTys, isVarArg: false);
6436 Value *ACast = Builder.CreateAddrSpaceCast(V: Arg1, DestTy: I8PTy);
6437 return RValue::get(
6438 V: EmitRuntimeCall(callee: CGM.CreateRuntimeFunction(Ty: FTy, Name),
6439 args: {Arg0, ACast, PacketSize, PacketAlign}));
6440 } else {
6441 assert(4 == E->getNumArgs() &&
6442 "Illegal number of parameters to pipe function");
6443 const char *Name = (BuiltinID == Builtin::BIread_pipe) ? "__read_pipe_4"
6444 : "__write_pipe_4";
6445
6446 llvm::Type *ArgTys[] = {Arg0->getType(), Arg1->getType(), Int32Ty, I8PTy,
6447 Int32Ty, Int32Ty};
6448 Value *Arg2 = EmitScalarExpr(E: E->getArg(Arg: 2)),
6449 *Arg3 = EmitScalarExpr(E: E->getArg(Arg: 3));
6450 llvm::FunctionType *FTy = llvm::FunctionType::get(Result: Int32Ty, Params: ArgTys, isVarArg: false);
6451 Value *ACast = Builder.CreateAddrSpaceCast(V: Arg3, DestTy: I8PTy);
6452 // We know the third argument is an integer type, but we may need to cast
6453 // it to i32.
6454 if (Arg2->getType() != Int32Ty)
6455 Arg2 = Builder.CreateZExtOrTrunc(V: Arg2, DestTy: Int32Ty);
6456 return RValue::get(
6457 V: EmitRuntimeCall(callee: CGM.CreateRuntimeFunction(Ty: FTy, Name),
6458 args: {Arg0, Arg1, Arg2, ACast, PacketSize, PacketAlign}));
6459 }
6460 }
6461 // OpenCL v2.0 s6.13.16 ,s9.17.3.5 - Built-in pipe reserve read and write
6462 // functions
6463 case Builtin::BIreserve_read_pipe:
6464 case Builtin::BIreserve_write_pipe:
6465 case Builtin::BIwork_group_reserve_read_pipe:
6466 case Builtin::BIwork_group_reserve_write_pipe:
6467 case Builtin::BIsub_group_reserve_read_pipe:
6468 case Builtin::BIsub_group_reserve_write_pipe: {
6469 // Composing the mangled name for the function.
6470 const char *Name;
6471 if (BuiltinID == Builtin::BIreserve_read_pipe)
6472 Name = "__reserve_read_pipe";
6473 else if (BuiltinID == Builtin::BIreserve_write_pipe)
6474 Name = "__reserve_write_pipe";
6475 else if (BuiltinID == Builtin::BIwork_group_reserve_read_pipe)
6476 Name = "__work_group_reserve_read_pipe";
6477 else if (BuiltinID == Builtin::BIwork_group_reserve_write_pipe)
6478 Name = "__work_group_reserve_write_pipe";
6479 else if (BuiltinID == Builtin::BIsub_group_reserve_read_pipe)
6480 Name = "__sub_group_reserve_read_pipe";
6481 else
6482 Name = "__sub_group_reserve_write_pipe";
6483
6484 Value *Arg0 = EmitScalarExpr(E: E->getArg(Arg: 0)),
6485 *Arg1 = EmitScalarExpr(E: E->getArg(Arg: 1));
6486 llvm::Type *ReservedIDTy = ConvertType(T: getContext().OCLReserveIDTy);
6487 CGOpenCLRuntime OpenCLRT(CGM);
6488 Value *PacketSize = OpenCLRT.getPipeElemSize(PipeArg: E->getArg(Arg: 0));
6489 Value *PacketAlign = OpenCLRT.getPipeElemAlign(PipeArg: E->getArg(Arg: 0));
6490
6491 // Building the generic function prototype.
6492 llvm::Type *ArgTys[] = {Arg0->getType(), Int32Ty, Int32Ty, Int32Ty};
6493 llvm::FunctionType *FTy =
6494 llvm::FunctionType::get(Result: ReservedIDTy, Params: ArgTys, isVarArg: false);
6495 // We know the second argument is an integer type, but we may need to cast
6496 // it to i32.
6497 if (Arg1->getType() != Int32Ty)
6498 Arg1 = Builder.CreateZExtOrTrunc(V: Arg1, DestTy: Int32Ty);
6499 return RValue::get(V: EmitRuntimeCall(callee: CGM.CreateRuntimeFunction(Ty: FTy, Name),
6500 args: {Arg0, Arg1, PacketSize, PacketAlign}));
6501 }
6502 // OpenCL v2.0 s6.13.16, s9.17.3.5 - Built-in pipe commit read and write
6503 // functions
6504 case Builtin::BIcommit_read_pipe:
6505 case Builtin::BIcommit_write_pipe:
6506 case Builtin::BIwork_group_commit_read_pipe:
6507 case Builtin::BIwork_group_commit_write_pipe:
6508 case Builtin::BIsub_group_commit_read_pipe:
6509 case Builtin::BIsub_group_commit_write_pipe: {
6510 const char *Name;
6511 if (BuiltinID == Builtin::BIcommit_read_pipe)
6512 Name = "__commit_read_pipe";
6513 else if (BuiltinID == Builtin::BIcommit_write_pipe)
6514 Name = "__commit_write_pipe";
6515 else if (BuiltinID == Builtin::BIwork_group_commit_read_pipe)
6516 Name = "__work_group_commit_read_pipe";
6517 else if (BuiltinID == Builtin::BIwork_group_commit_write_pipe)
6518 Name = "__work_group_commit_write_pipe";
6519 else if (BuiltinID == Builtin::BIsub_group_commit_read_pipe)
6520 Name = "__sub_group_commit_read_pipe";
6521 else
6522 Name = "__sub_group_commit_write_pipe";
6523
6524 Value *Arg0 = EmitScalarExpr(E: E->getArg(Arg: 0)),
6525 *Arg1 = EmitScalarExpr(E: E->getArg(Arg: 1));
6526 CGOpenCLRuntime OpenCLRT(CGM);
6527 Value *PacketSize = OpenCLRT.getPipeElemSize(PipeArg: E->getArg(Arg: 0));
6528 Value *PacketAlign = OpenCLRT.getPipeElemAlign(PipeArg: E->getArg(Arg: 0));
6529
6530 // Building the generic function prototype.
6531 llvm::Type *ArgTys[] = {Arg0->getType(), Arg1->getType(), Int32Ty, Int32Ty};
6532 llvm::FunctionType *FTy = llvm::FunctionType::get(
6533 Result: llvm::Type::getVoidTy(C&: getLLVMContext()), Params: ArgTys, isVarArg: false);
6534
6535 return RValue::get(V: EmitRuntimeCall(callee: CGM.CreateRuntimeFunction(Ty: FTy, Name),
6536 args: {Arg0, Arg1, PacketSize, PacketAlign}));
6537 }
6538 // OpenCL v2.0 s6.13.16.4 Built-in pipe query functions
6539 case Builtin::BIget_pipe_num_packets:
6540 case Builtin::BIget_pipe_max_packets: {
6541 const char *BaseName;
6542 const auto *PipeTy = E->getArg(Arg: 0)->getType()->castAs<PipeType>();
6543 if (BuiltinID == Builtin::BIget_pipe_num_packets)
6544 BaseName = "__get_pipe_num_packets";
6545 else
6546 BaseName = "__get_pipe_max_packets";
6547 std::string Name = std::string(BaseName) +
6548 std::string(PipeTy->isReadOnly() ? "_ro" : "_wo");
6549
6550 // Building the generic function prototype.
6551 Value *Arg0 = EmitScalarExpr(E: E->getArg(Arg: 0));
6552 CGOpenCLRuntime OpenCLRT(CGM);
6553 Value *PacketSize = OpenCLRT.getPipeElemSize(PipeArg: E->getArg(Arg: 0));
6554 Value *PacketAlign = OpenCLRT.getPipeElemAlign(PipeArg: E->getArg(Arg: 0));
6555 llvm::Type *ArgTys[] = {Arg0->getType(), Int32Ty, Int32Ty};
6556 llvm::FunctionType *FTy = llvm::FunctionType::get(Result: Int32Ty, Params: ArgTys, isVarArg: false);
6557
6558 return RValue::get(V: EmitRuntimeCall(callee: CGM.CreateRuntimeFunction(Ty: FTy, Name),
6559 args: {Arg0, PacketSize, PacketAlign}));
6560 }
6561
6562 // OpenCL v2.0 s6.13.9 - Address space qualifier functions.
6563 case Builtin::BIto_global:
6564 case Builtin::BIto_local:
6565 case Builtin::BIto_private: {
6566 auto Arg0 = EmitScalarExpr(E: E->getArg(Arg: 0));
6567 auto NewArgT = llvm::PointerType::get(
6568 C&: getLLVMContext(),
6569 AddressSpace: CGM.getContext().getTargetAddressSpace(AS: LangAS::opencl_generic));
6570 auto NewRetT = llvm::PointerType::get(
6571 C&: getLLVMContext(),
6572 AddressSpace: CGM.getContext().getTargetAddressSpace(
6573 AS: E->getType()->getPointeeType().getAddressSpace()));
6574 auto FTy = llvm::FunctionType::get(Result: NewRetT, Params: {NewArgT}, isVarArg: false);
6575 llvm::Value *NewArg;
6576 if (Arg0->getType()->getPointerAddressSpace() !=
6577 NewArgT->getPointerAddressSpace())
6578 NewArg = Builder.CreateAddrSpaceCast(V: Arg0, DestTy: NewArgT);
6579 else
6580 NewArg = Builder.CreateBitOrPointerCast(V: Arg0, DestTy: NewArgT);
6581 auto NewName = std::string("__") + E->getDirectCallee()->getName().str();
6582 auto NewCall =
6583 EmitRuntimeCall(callee: CGM.CreateRuntimeFunction(Ty: FTy, Name: NewName), args: {NewArg});
6584 return RValue::get(V: Builder.CreateBitOrPointerCast(V: NewCall,
6585 DestTy: ConvertType(T: E->getType())));
6586 }
6587
6588 // OpenCL v2.0, s6.13.17 - Enqueue kernel function.
6589 // Table 6.13.17.1 specifies four overload forms of enqueue_kernel.
6590 // The code below expands the builtin call to a call to one of the following
6591 // functions that an OpenCL runtime library will have to provide:
6592 // __enqueue_kernel_basic
6593 // __enqueue_kernel_varargs
6594 // __enqueue_kernel_basic_events
6595 // __enqueue_kernel_events_varargs
6596 case Builtin::BIenqueue_kernel: {
6597 StringRef Name; // Generated function call name
6598 unsigned NumArgs = E->getNumArgs();
6599
6600 llvm::Type *QueueTy = ConvertType(T: getContext().OCLQueueTy);
6601 llvm::Type *GenericVoidPtrTy = Builder.getPtrTy(
6602 AddrSpace: getContext().getTargetAddressSpace(AS: LangAS::opencl_generic));
6603
6604 llvm::Value *Queue = EmitScalarExpr(E: E->getArg(Arg: 0));
6605 llvm::Value *Flags = EmitScalarExpr(E: E->getArg(Arg: 1));
6606 LValue NDRangeL = EmitAggExprToLValue(E: E->getArg(Arg: 2));
6607 llvm::Value *Range = NDRangeL.getAddress().emitRawPointer(CGF&: *this);
6608
6609 // FIXME: Look through the addrspacecast which may exist to the stack
6610 // temporary as a hack.
6611 //
6612 // This is hardcoding the assumed ABI of the target function. This assumes
6613 // direct passing for every argument except NDRange, which is assumed to be
6614 // byval or byref indirect passed.
6615 //
6616 // This should be fixed to query a signature from CGOpenCLRuntime, and go
6617 // through EmitCallArgs to get the correct target ABI.
6618 Range = Range->stripPointerCasts();
6619
6620 llvm::Type *RangePtrTy = Range->getType();
6621
6622 if (NumArgs == 4) {
6623 // The most basic form of the call with parameters:
6624 // queue_t, kernel_enqueue_flags_t, ndrange_t, block(void)
6625 Name = "__enqueue_kernel_basic";
6626 llvm::Type *ArgTys[] = {QueueTy, Int32Ty, RangePtrTy, GenericVoidPtrTy,
6627 GenericVoidPtrTy};
6628 llvm::FunctionType *FTy = llvm::FunctionType::get(Result: Int32Ty, Params: ArgTys, isVarArg: false);
6629
6630 auto Info =
6631 CGM.getOpenCLRuntime().emitOpenCLEnqueuedBlock(CGF&: *this, E: E->getArg(Arg: 3));
6632 llvm::Value *Kernel =
6633 Builder.CreatePointerCast(V: Info.KernelHandle, DestTy: GenericVoidPtrTy);
6634 llvm::Value *Block =
6635 Builder.CreatePointerCast(V: Info.BlockArg, DestTy: GenericVoidPtrTy);
6636
6637 auto RTCall = EmitRuntimeCall(callee: CGM.CreateRuntimeFunction(Ty: FTy, Name),
6638 args: {Queue, Flags, Range, Kernel, Block});
6639 return RValue::get(V: RTCall);
6640 }
6641 assert(NumArgs >= 5 && "Invalid enqueue_kernel signature");
6642
6643 // Create a temporary array to hold the sizes of local pointer arguments
6644 // for the block. \p First is the position of the first size argument.
6645 auto CreateArrayForSizeVar =
6646 [=](unsigned First) -> std::pair<llvm::Value *, llvm::Value *> {
6647 llvm::APInt ArraySize(32, NumArgs - First);
6648 QualType SizeArrayTy = getContext().getConstantArrayType(
6649 EltTy: getContext().getSizeType(), ArySize: ArraySize, SizeExpr: nullptr,
6650 ASM: ArraySizeModifier::Normal,
6651 /*IndexTypeQuals=*/0);
6652 auto Tmp = CreateMemTempWithoutCast(T: SizeArrayTy, Name: "block_sizes");
6653 llvm::Value *Alloca = Tmp.getPointer();
6654 llvm::Value *ElemPtr;
6655 EmitLifetimeStart(Addr: Alloca);
6656 // Each of the following arguments specifies the size of the corresponding
6657 // argument passed to the enqueued block.
6658 auto *Zero = llvm::ConstantInt::get(Ty: IntTy, V: 0);
6659 for (unsigned I = First; I < NumArgs; ++I) {
6660 auto *Index = llvm::ConstantInt::get(Ty: IntTy, V: I - First);
6661 auto *GEP =
6662 Builder.CreateGEP(Ty: Tmp.getElementType(), Ptr: Alloca, IdxList: {Zero, Index});
6663 if (I == First)
6664 ElemPtr = GEP;
6665 auto *V =
6666 Builder.CreateZExtOrTrunc(V: EmitScalarExpr(E: E->getArg(Arg: I)), DestTy: SizeTy);
6667 Builder.CreateAlignedStore(
6668 Val: V, Ptr: GEP, Align: CGM.getDataLayout().getPrefTypeAlign(Ty: SizeTy));
6669 }
6670 return {ElemPtr, Alloca};
6671 };
6672
6673 // Could have events and/or varargs.
6674 if (E->getArg(Arg: 3)->getType()->isBlockPointerType()) {
6675 // No events passed, but has variadic arguments.
6676 Name = "__enqueue_kernel_varargs";
6677 auto Info =
6678 CGM.getOpenCLRuntime().emitOpenCLEnqueuedBlock(CGF&: *this, E: E->getArg(Arg: 3));
6679 llvm::Value *Kernel =
6680 Builder.CreatePointerCast(V: Info.KernelHandle, DestTy: GenericVoidPtrTy);
6681 auto *Block = Builder.CreatePointerCast(V: Info.BlockArg, DestTy: GenericVoidPtrTy);
6682 auto [ElemPtr, TmpPtr] = CreateArrayForSizeVar(4);
6683
6684 // Create a vector of the arguments, as well as a constant value to
6685 // express to the runtime the number of variadic arguments.
6686 llvm::Value *const Args[] = {Queue, Flags,
6687 Range, Kernel,
6688 Block, ConstantInt::get(Ty: IntTy, V: NumArgs - 4),
6689 ElemPtr};
6690 llvm::Type *const ArgTys[] = {
6691 QueueTy, IntTy, RangePtrTy, GenericVoidPtrTy,
6692 GenericVoidPtrTy, IntTy, ElemPtr->getType()};
6693
6694 llvm::FunctionType *FTy = llvm::FunctionType::get(Result: Int32Ty, Params: ArgTys, isVarArg: false);
6695 auto Call = RValue::get(
6696 V: EmitRuntimeCall(callee: CGM.CreateRuntimeFunction(Ty: FTy, Name), args: Args));
6697 EmitLifetimeEnd(Addr: TmpPtr);
6698 return Call;
6699 }
6700 // Any calls now have event arguments passed.
6701 if (NumArgs >= 7) {
6702 llvm::PointerType *PtrTy = llvm::PointerType::get(
6703 C&: CGM.getLLVMContext(),
6704 AddressSpace: CGM.getContext().getTargetAddressSpace(AS: LangAS::opencl_generic));
6705
6706 llvm::Value *NumEvents =
6707 Builder.CreateZExtOrTrunc(V: EmitScalarExpr(E: E->getArg(Arg: 3)), DestTy: Int32Ty);
6708
6709 // Since SemaOpenCLBuiltinEnqueueKernel allows fifth and sixth arguments
6710 // to be a null pointer constant (including `0` literal), we can take it
6711 // into account and emit null pointer directly.
6712 llvm::Value *EventWaitList = nullptr;
6713 if (E->getArg(Arg: 4)->isNullPointerConstant(
6714 Ctx&: getContext(), NPC: Expr::NPC_ValueDependentIsNotNull)) {
6715 EventWaitList = llvm::ConstantPointerNull::get(T: PtrTy);
6716 } else {
6717 EventWaitList =
6718 E->getArg(Arg: 4)->getType()->isArrayType()
6719 ? EmitArrayToPointerDecay(Array: E->getArg(Arg: 4)).emitRawPointer(CGF&: *this)
6720 : EmitScalarExpr(E: E->getArg(Arg: 4));
6721 // Convert to generic address space.
6722 EventWaitList = Builder.CreatePointerCast(V: EventWaitList, DestTy: PtrTy);
6723 }
6724 llvm::Value *EventRet = nullptr;
6725 if (E->getArg(Arg: 5)->isNullPointerConstant(
6726 Ctx&: getContext(), NPC: Expr::NPC_ValueDependentIsNotNull)) {
6727 EventRet = llvm::ConstantPointerNull::get(T: PtrTy);
6728 } else {
6729 EventRet =
6730 Builder.CreatePointerCast(V: EmitScalarExpr(E: E->getArg(Arg: 5)), DestTy: PtrTy);
6731 }
6732
6733 auto Info =
6734 CGM.getOpenCLRuntime().emitOpenCLEnqueuedBlock(CGF&: *this, E: E->getArg(Arg: 6));
6735 llvm::Value *Kernel =
6736 Builder.CreatePointerCast(V: Info.KernelHandle, DestTy: GenericVoidPtrTy);
6737 llvm::Value *Block =
6738 Builder.CreatePointerCast(V: Info.BlockArg, DestTy: GenericVoidPtrTy);
6739
6740 std::vector<llvm::Type *> ArgTys = {
6741 QueueTy, Int32Ty, RangePtrTy, Int32Ty,
6742 PtrTy, PtrTy, GenericVoidPtrTy, GenericVoidPtrTy};
6743
6744 std::vector<llvm::Value *> Args = {Queue, Flags, Range,
6745 NumEvents, EventWaitList, EventRet,
6746 Kernel, Block};
6747
6748 if (NumArgs == 7) {
6749 // Has events but no variadics.
6750 Name = "__enqueue_kernel_basic_events";
6751 llvm::FunctionType *FTy =
6752 llvm::FunctionType::get(Result: Int32Ty, Params: ArgTys, isVarArg: false);
6753 return RValue::get(
6754 V: EmitRuntimeCall(callee: CGM.CreateRuntimeFunction(Ty: FTy, Name), args: Args));
6755 }
6756 // Has event info and variadics
6757 // Pass the number of variadics to the runtime function too.
6758 Args.push_back(x: ConstantInt::get(Ty: Int32Ty, V: NumArgs - 7));
6759 ArgTys.push_back(x: Int32Ty);
6760 Name = "__enqueue_kernel_events_varargs";
6761
6762 auto [ElemPtr, TmpPtr] = CreateArrayForSizeVar(7);
6763 Args.push_back(x: ElemPtr);
6764 ArgTys.push_back(x: ElemPtr->getType());
6765
6766 llvm::FunctionType *FTy = llvm::FunctionType::get(Result: Int32Ty, Params: ArgTys, isVarArg: false);
6767 auto Call = RValue::get(
6768 V: EmitRuntimeCall(callee: CGM.CreateRuntimeFunction(Ty: FTy, Name), args: Args));
6769 EmitLifetimeEnd(Addr: TmpPtr);
6770 return Call;
6771 }
6772 llvm_unreachable("Unexpected enqueue_kernel signature");
6773 }
6774 // OpenCL v2.0 s6.13.17.6 - Kernel query functions need bitcast of block
6775 // parameter.
6776 case Builtin::BIget_kernel_work_group_size: {
6777 llvm::Type *GenericVoidPtrTy = Builder.getPtrTy(
6778 AddrSpace: getContext().getTargetAddressSpace(AS: LangAS::opencl_generic));
6779 auto Info =
6780 CGM.getOpenCLRuntime().emitOpenCLEnqueuedBlock(CGF&: *this, E: E->getArg(Arg: 0));
6781 Value *Kernel =
6782 Builder.CreatePointerCast(V: Info.KernelHandle, DestTy: GenericVoidPtrTy);
6783 Value *Arg = Builder.CreatePointerCast(V: Info.BlockArg, DestTy: GenericVoidPtrTy);
6784 return RValue::get(V: EmitRuntimeCall(
6785 callee: CGM.CreateRuntimeFunction(
6786 Ty: llvm::FunctionType::get(Result: IntTy, Params: {GenericVoidPtrTy, GenericVoidPtrTy},
6787 isVarArg: false),
6788 Name: "__get_kernel_work_group_size_impl"),
6789 args: {Kernel, Arg}));
6790 }
6791 case Builtin::BIget_kernel_preferred_work_group_size_multiple: {
6792 llvm::Type *GenericVoidPtrTy = Builder.getPtrTy(
6793 AddrSpace: getContext().getTargetAddressSpace(AS: LangAS::opencl_generic));
6794 auto Info =
6795 CGM.getOpenCLRuntime().emitOpenCLEnqueuedBlock(CGF&: *this, E: E->getArg(Arg: 0));
6796 Value *Kernel =
6797 Builder.CreatePointerCast(V: Info.KernelHandle, DestTy: GenericVoidPtrTy);
6798 Value *Arg = Builder.CreatePointerCast(V: Info.BlockArg, DestTy: GenericVoidPtrTy);
6799 return RValue::get(V: EmitRuntimeCall(
6800 callee: CGM.CreateRuntimeFunction(
6801 Ty: llvm::FunctionType::get(Result: IntTy, Params: {GenericVoidPtrTy, GenericVoidPtrTy},
6802 isVarArg: false),
6803 Name: "__get_kernel_preferred_work_group_size_multiple_impl"),
6804 args: {Kernel, Arg}));
6805 }
6806 case Builtin::BIget_kernel_max_sub_group_size_for_ndrange:
6807 case Builtin::BIget_kernel_sub_group_count_for_ndrange: {
6808 llvm::Type *GenericVoidPtrTy = Builder.getPtrTy(
6809 AddrSpace: getContext().getTargetAddressSpace(AS: LangAS::opencl_generic));
6810 LValue NDRangeL = EmitAggExprToLValue(E: E->getArg(Arg: 0));
6811 llvm::Value *NDRange = NDRangeL.getAddress().emitRawPointer(CGF&: *this);
6812 auto Info =
6813 CGM.getOpenCLRuntime().emitOpenCLEnqueuedBlock(CGF&: *this, E: E->getArg(Arg: 1));
6814 Value *Kernel =
6815 Builder.CreatePointerCast(V: Info.KernelHandle, DestTy: GenericVoidPtrTy);
6816 Value *Block = Builder.CreatePointerCast(V: Info.BlockArg, DestTy: GenericVoidPtrTy);
6817 const char *Name =
6818 BuiltinID == Builtin::BIget_kernel_max_sub_group_size_for_ndrange
6819 ? "__get_kernel_max_sub_group_size_for_ndrange_impl"
6820 : "__get_kernel_sub_group_count_for_ndrange_impl";
6821 return RValue::get(V: EmitRuntimeCall(
6822 callee: CGM.CreateRuntimeFunction(
6823 Ty: llvm::FunctionType::get(
6824 Result: IntTy, Params: {NDRange->getType(), GenericVoidPtrTy, GenericVoidPtrTy},
6825 isVarArg: false),
6826 Name),
6827 args: {NDRange, Kernel, Block}));
6828 }
6829 case Builtin::BI__builtin_store_half:
6830 case Builtin::BI__builtin_store_halff: {
6831 CodeGenFunction::CGFPOptionsRAII FPOptsRAII(*this, E);
6832 Value *Val = EmitScalarExpr(E: E->getArg(Arg: 0));
6833 Address Address = EmitPointerWithAlignment(Addr: E->getArg(Arg: 1));
6834 Value *HalfVal = Builder.CreateFPTrunc(V: Val, DestTy: Builder.getHalfTy());
6835 Builder.CreateStore(Val: HalfVal, Addr: Address);
6836 return RValue::get(V: nullptr);
6837 }
6838 case Builtin::BI__builtin_load_half: {
6839 Address Address = EmitPointerWithAlignment(Addr: E->getArg(Arg: 0));
6840 Value *HalfVal = Builder.CreateLoad(Addr: Address);
6841 return RValue::get(V: Builder.CreateFPExt(V: HalfVal, DestTy: Builder.getDoubleTy()));
6842 }
6843 case Builtin::BI__builtin_load_halff: {
6844 Address Address = EmitPointerWithAlignment(Addr: E->getArg(Arg: 0));
6845 Value *HalfVal = Builder.CreateLoad(Addr: Address);
6846 return RValue::get(V: Builder.CreateFPExt(V: HalfVal, DestTy: Builder.getFloatTy()));
6847 }
6848 case Builtin::BI__builtin_printf:
6849 case Builtin::BIprintf:
6850 if (getTarget().getTriple().isNVPTX() ||
6851 getTarget().getTriple().isAMDGCN() ||
6852 (getTarget().getTriple().isSPIRV() &&
6853 getTarget().getTriple().getVendor() == Triple::VendorType::AMD)) {
6854 if (getTarget().getTriple().isNVPTX())
6855 return EmitNVPTXDevicePrintfCallExpr(E);
6856 if ((getTarget().getTriple().isAMDGCN() ||
6857 getTarget().getTriple().isSPIRV()) &&
6858 getLangOpts().HIP)
6859 return EmitAMDGPUDevicePrintfCallExpr(E);
6860 }
6861
6862 break;
6863 case Builtin::BI__builtin_canonicalize:
6864 case Builtin::BI__builtin_canonicalizef:
6865 case Builtin::BI__builtin_canonicalizef16:
6866 case Builtin::BI__builtin_canonicalizel:
6867 return RValue::get(
6868 V: emitBuiltinWithOneOverloadedType<1>(CGF&: *this, E, IntrinsicID: Intrinsic::canonicalize));
6869
6870 case Builtin::BI__builtin_thread_pointer: {
6871 if (!getContext().getTargetInfo().isTLSSupported())
6872 CGM.ErrorUnsupported(S: E, Type: "__builtin_thread_pointer");
6873
6874 return RValue::get(V: Builder.CreateIntrinsic(ID: llvm::Intrinsic::thread_pointer,
6875 OverloadTypes: {GlobalsInt8PtrTy}, Args: {}));
6876 }
6877 case Builtin::BI__builtin_os_log_format:
6878 return emitBuiltinOSLogFormat(E: *E);
6879
6880 case Builtin::BI__xray_customevent: {
6881 if (!ShouldXRayInstrumentFunction())
6882 return RValue::getIgnored();
6883
6884 if (!CGM.getCodeGenOpts().XRayInstrumentationBundle.has(
6885 K: XRayInstrKind::Custom))
6886 return RValue::getIgnored();
6887
6888 if (const auto *XRayAttr = CurFuncDecl->getAttr<XRayInstrumentAttr>())
6889 if (XRayAttr->neverXRayInstrument() && !AlwaysEmitXRayCustomEvents())
6890 return RValue::getIgnored();
6891
6892 Function *F = CGM.getIntrinsic(IID: Intrinsic::xray_customevent);
6893 auto FTy = F->getFunctionType();
6894 auto Arg0 = E->getArg(Arg: 0);
6895 auto Arg0Val = EmitScalarExpr(E: Arg0);
6896 auto Arg0Ty = Arg0->getType();
6897 auto PTy0 = FTy->getParamType(i: 0);
6898 if (PTy0 != Arg0Val->getType()) {
6899 if (Arg0Ty->isArrayType())
6900 Arg0Val = EmitArrayToPointerDecay(Array: Arg0).emitRawPointer(CGF&: *this);
6901 else
6902 Arg0Val = Builder.CreatePointerCast(V: Arg0Val, DestTy: PTy0);
6903 }
6904 auto Arg1 = EmitScalarExpr(E: E->getArg(Arg: 1));
6905 auto PTy1 = FTy->getParamType(i: 1);
6906 if (PTy1 != Arg1->getType())
6907 Arg1 = Builder.CreateTruncOrBitCast(V: Arg1, DestTy: PTy1);
6908 return RValue::get(V: Builder.CreateCall(Callee: F, Args: {Arg0Val, Arg1}));
6909 }
6910
6911 case Builtin::BI__xray_typedevent: {
6912 // TODO: There should be a way to always emit events even if the current
6913 // function is not instrumented. Losing events in a stream can cripple
6914 // a trace.
6915 if (!ShouldXRayInstrumentFunction())
6916 return RValue::getIgnored();
6917
6918 if (!CGM.getCodeGenOpts().XRayInstrumentationBundle.has(
6919 K: XRayInstrKind::Typed))
6920 return RValue::getIgnored();
6921
6922 if (const auto *XRayAttr = CurFuncDecl->getAttr<XRayInstrumentAttr>())
6923 if (XRayAttr->neverXRayInstrument() && !AlwaysEmitXRayTypedEvents())
6924 return RValue::getIgnored();
6925
6926 Function *F = CGM.getIntrinsic(IID: Intrinsic::xray_typedevent);
6927 auto FTy = F->getFunctionType();
6928 auto Arg0 = EmitScalarExpr(E: E->getArg(Arg: 0));
6929 auto PTy0 = FTy->getParamType(i: 0);
6930 if (PTy0 != Arg0->getType())
6931 Arg0 = Builder.CreateTruncOrBitCast(V: Arg0, DestTy: PTy0);
6932 auto Arg1 = E->getArg(Arg: 1);
6933 auto Arg1Val = EmitScalarExpr(E: Arg1);
6934 auto Arg1Ty = Arg1->getType();
6935 auto PTy1 = FTy->getParamType(i: 1);
6936 if (PTy1 != Arg1Val->getType()) {
6937 if (Arg1Ty->isArrayType())
6938 Arg1Val = EmitArrayToPointerDecay(Array: Arg1).emitRawPointer(CGF&: *this);
6939 else
6940 Arg1Val = Builder.CreatePointerCast(V: Arg1Val, DestTy: PTy1);
6941 }
6942 auto Arg2 = EmitScalarExpr(E: E->getArg(Arg: 2));
6943 auto PTy2 = FTy->getParamType(i: 2);
6944 if (PTy2 != Arg2->getType())
6945 Arg2 = Builder.CreateTruncOrBitCast(V: Arg2, DestTy: PTy2);
6946 return RValue::get(V: Builder.CreateCall(Callee: F, Args: {Arg0, Arg1Val, Arg2}));
6947 }
6948
6949 case Builtin::BI__builtin_ms_va_start:
6950 case Builtin::BI__builtin_ms_va_end:
6951 return RValue::get(
6952 V: EmitVAStartEnd(ArgValue: EmitMSVAListRef(E: E->getArg(Arg: 0)).emitRawPointer(CGF&: *this),
6953 IsStart: BuiltinID == Builtin::BI__builtin_ms_va_start));
6954
6955 case Builtin::BI__builtin_ms_va_copy: {
6956 // Lower this manually. We can't reliably determine whether or not any
6957 // given va_copy() is for a Win64 va_list from the calling convention
6958 // alone, because it's legal to do this from a System V ABI function.
6959 // With opaque pointer types, we won't have enough information in LLVM
6960 // IR to determine this from the argument types, either. Best to do it
6961 // now, while we have enough information.
6962 Address DestAddr = EmitMSVAListRef(E: E->getArg(Arg: 0));
6963 Address SrcAddr = EmitMSVAListRef(E: E->getArg(Arg: 1));
6964
6965 DestAddr = DestAddr.withElementType(ElemTy: Int8PtrTy);
6966 SrcAddr = SrcAddr.withElementType(ElemTy: Int8PtrTy);
6967
6968 Value *ArgPtr = Builder.CreateLoad(Addr: SrcAddr, Name: "ap.val");
6969 return RValue::get(V: Builder.CreateStore(Val: ArgPtr, Addr: DestAddr));
6970 }
6971
6972 case Builtin::BI__builtin_get_device_side_mangled_name: {
6973 auto Name = CGM.getCUDARuntime().getDeviceSideName(
6974 ND: cast<DeclRefExpr>(Val: E->getArg(Arg: 0)->IgnoreImpCasts())->getDecl());
6975 auto Str = CGM.GetAddrOfConstantCString(Str: Name, GlobalName: "");
6976 return RValue::get(V: Str.getPointer());
6977 }
6978 }
6979
6980 // If this is an alias for a lib function (e.g. __builtin_sin), emit
6981 // the call using the normal call path, but using the unmangled
6982 // version of the function name.
6983 const auto &BI = getContext().BuiltinInfo;
6984 if (!shouldEmitBuiltinAsIR(BuiltinID, BI, CGF: *this) &&
6985 BI.isLibFunction(ID: BuiltinID))
6986 return emitLibraryCall(CGF&: *this, FD, E,
6987 calleeValue: CGM.getBuiltinLibFunction(FD, BuiltinID));
6988
6989 // If this is a predefined lib function (e.g. malloc), emit the call
6990 // using exactly the normal call path.
6991 if (BI.isPredefinedLibFunction(ID: BuiltinID))
6992 return emitLibraryCall(CGF&: *this, FD, E, calleeValue: CGM.getRawFunctionPointer(GD: FD));
6993
6994 // Check that a call to a target specific builtin has the correct target
6995 // features.
6996 // This is down here to avoid non-target specific builtins, however, if
6997 // generic builtins start to require generic target features then we
6998 // can move this up to the beginning of the function.
6999 checkTargetFeatures(E, TargetDecl: FD);
7000
7001 if (unsigned VectorWidth = getContext().BuiltinInfo.getRequiredVectorWidth(ID: BuiltinID))
7002 LargestVectorWidth = std::max(a: LargestVectorWidth, b: VectorWidth);
7003
7004 // See if we have a target specific intrinsic.
7005 std::string Name = getContext().BuiltinInfo.getName(ID: BuiltinID);
7006 Intrinsic::ID IntrinsicID = Intrinsic::not_intrinsic;
7007 StringRef Prefix =
7008 llvm::Triple::getArchTypePrefix(Kind: getTarget().getTriple().getArch());
7009 if (!Prefix.empty()) {
7010 IntrinsicID = Intrinsic::getIntrinsicForClangBuiltin(TargetPrefix: Prefix.data(), BuiltinName: Name);
7011 if (IntrinsicID == Intrinsic::not_intrinsic && Prefix == "spv" &&
7012 getTarget().getTriple().getOS() == llvm::Triple::OSType::AMDHSA)
7013 IntrinsicID = Intrinsic::getIntrinsicForClangBuiltin(TargetPrefix: "amdgcn", BuiltinName: Name);
7014 // NOTE we don't need to perform a compatibility flag check here since the
7015 // intrinsics are declared in Builtins*.def via LANGBUILTIN which filter the
7016 // MS builtins via ALL_MS_LANGUAGES and are filtered earlier.
7017 if (IntrinsicID == Intrinsic::not_intrinsic)
7018 IntrinsicID = Intrinsic::getIntrinsicForMSBuiltin(TargetPrefix: Prefix.data(), BuiltinName: Name);
7019 }
7020
7021 if (IntrinsicID != Intrinsic::not_intrinsic) {
7022 SmallVector<Value*, 16> Args;
7023
7024 // Find out if any arguments are required to be integer constant
7025 // expressions.
7026 unsigned ICEArguments = 0;
7027 ASTContext::GetBuiltinTypeError Error;
7028 getContext().GetBuiltinType(ID: BuiltinID, Error, IntegerConstantArgs: &ICEArguments);
7029 assert(Error == ASTContext::GE_None && "Should not codegen an error");
7030
7031 Function *F = CGM.getIntrinsic(IID: IntrinsicID);
7032 llvm::FunctionType *FTy = F->getFunctionType();
7033
7034 for (unsigned i = 0, e = E->getNumArgs(); i != e; ++i) {
7035 Value *ArgValue = EmitScalarOrConstFoldImmArg(ICEArguments, Idx: i, E);
7036 // If the intrinsic arg type is different from the builtin arg type
7037 // we need to do a bit cast.
7038 llvm::Type *PTy = FTy->getParamType(i);
7039 if (PTy != ArgValue->getType()) {
7040 // XXX - vector of pointers?
7041 if (auto *PtrTy = dyn_cast<llvm::PointerType>(Val: PTy)) {
7042 if (PtrTy->getAddressSpace() !=
7043 ArgValue->getType()->getPointerAddressSpace()) {
7044 ArgValue = Builder.CreateAddrSpaceCast(
7045 V: ArgValue, DestTy: llvm::PointerType::get(C&: getLLVMContext(),
7046 AddressSpace: PtrTy->getAddressSpace()));
7047 }
7048 }
7049
7050 // Cast vector type (e.g., v256i32) to x86_amx, this only happen
7051 // in amx intrinsics.
7052 if (PTy->isX86_AMXTy())
7053 ArgValue = Builder.CreateIntrinsic(ID: Intrinsic::x86_cast_vector_to_tile,
7054 OverloadTypes: {ArgValue->getType()}, Args: {ArgValue});
7055 else
7056 ArgValue = Builder.CreateBitCast(V: ArgValue, DestTy: PTy);
7057 }
7058
7059 Args.push_back(Elt: ArgValue);
7060 }
7061
7062 Value *V = Builder.CreateCall(Callee: F, Args);
7063 QualType BuiltinRetType = E->getType();
7064
7065 llvm::Type *RetTy = VoidTy;
7066 if (!BuiltinRetType->isVoidType())
7067 RetTy = ConvertType(T: BuiltinRetType);
7068
7069 if (RetTy != V->getType()) {
7070 // XXX - vector of pointers?
7071 if (auto *PtrTy = dyn_cast<llvm::PointerType>(Val: RetTy)) {
7072 if (PtrTy->getAddressSpace() != V->getType()->getPointerAddressSpace()) {
7073 V = Builder.CreateAddrSpaceCast(
7074 V, DestTy: llvm::PointerType::get(C&: getLLVMContext(),
7075 AddressSpace: PtrTy->getAddressSpace()));
7076 }
7077 }
7078
7079 // Cast x86_amx to vector type (e.g., v256i32), this only happen
7080 // in amx intrinsics.
7081 if (V->getType()->isX86_AMXTy())
7082 V = Builder.CreateIntrinsic(ID: Intrinsic::x86_cast_tile_to_vector, OverloadTypes: {RetTy},
7083 Args: {V});
7084 else
7085 V = Builder.CreateBitCast(V, DestTy: RetTy);
7086 }
7087
7088 if (RetTy->isVoidTy())
7089 return RValue::get(V: nullptr);
7090
7091 return RValue::get(V);
7092 }
7093
7094 // Some target-specific builtins can have aggregate return values, e.g.
7095 // __builtin_arm_mve_vld2q_u32. So if the result is an aggregate, force
7096 // ReturnValue to be non-null, so that the target-specific emission code can
7097 // always just emit into it.
7098 TypeEvaluationKind EvalKind = getEvaluationKind(T: E->getType());
7099 if (EvalKind == TEK_Aggregate && ReturnValue.isNull()) {
7100 Address DestPtr = CreateMemTemp(T: E->getType(), Name: "agg.tmp");
7101 ReturnValue = ReturnValueSlot(DestPtr, false);
7102 }
7103
7104 // Now see if we can emit a target-specific builtin.
7105 if (Value *V = EmitTargetBuiltinExpr(BuiltinID, E, ReturnValue)) {
7106 switch (EvalKind) {
7107 case TEK_Scalar:
7108 if (V->getType()->isVoidTy())
7109 return RValue::get(V: nullptr);
7110 return RValue::get(V);
7111 case TEK_Aggregate:
7112 return RValue::getAggregate(addr: ReturnValue.getAddress(),
7113 isVolatile: ReturnValue.isVolatile());
7114 case TEK_Complex:
7115 llvm_unreachable("No current target builtin returns complex");
7116 }
7117 llvm_unreachable("Bad evaluation kind in EmitBuiltinExpr");
7118 }
7119
7120 // EmitHLSLBuiltinExpr will check getLangOpts().HLSL
7121 if (Value *V = EmitHLSLBuiltinExpr(BuiltinID, E, ReturnValue)) {
7122 switch (EvalKind) {
7123 case TEK_Scalar:
7124 if (V->getType()->isVoidTy())
7125 return RValue::get(V: nullptr);
7126 return RValue::get(V);
7127 case TEK_Aggregate:
7128 return RValue::getAggregate(addr: ReturnValue.getAddress(),
7129 isVolatile: ReturnValue.isVolatile());
7130 case TEK_Complex:
7131 llvm_unreachable("No current hlsl builtin returns complex");
7132 }
7133 llvm_unreachable("Bad evaluation kind in EmitBuiltinExpr");
7134 }
7135
7136 if (getLangOpts().HIPStdPar && getLangOpts().CUDAIsDevice)
7137 return EmitHipStdParUnsupportedBuiltin(CGF: this, FD);
7138
7139 ErrorUnsupported(S: E, Type: "builtin function");
7140
7141 // Unknown builtin, for now just dump it out and return undef.
7142 return GetUndefRValue(Ty: E->getType());
7143}
7144
7145namespace {
7146struct BuiltinAlignArgs {
7147 llvm::Value *Src = nullptr;
7148 llvm::Type *SrcType = nullptr;
7149 llvm::Value *Alignment = nullptr;
7150 llvm::Value *Mask = nullptr;
7151 llvm::IntegerType *IntType = nullptr;
7152
7153 BuiltinAlignArgs(const CallExpr *E, CodeGenFunction &CGF) {
7154 QualType AstType = E->getArg(Arg: 0)->getType();
7155 if (AstType->isArrayType())
7156 Src = CGF.EmitArrayToPointerDecay(Array: E->getArg(Arg: 0)).emitRawPointer(CGF);
7157 else
7158 Src = CGF.EmitScalarExpr(E: E->getArg(Arg: 0));
7159 SrcType = Src->getType();
7160 if (SrcType->isPointerTy()) {
7161 IntType = IntegerType::get(
7162 C&: CGF.getLLVMContext(),
7163 NumBits: CGF.CGM.getDataLayout().getIndexTypeSizeInBits(Ty: SrcType));
7164 } else {
7165 assert(SrcType->isIntegerTy());
7166 IntType = cast<llvm::IntegerType>(Val: SrcType);
7167 }
7168 Alignment = CGF.EmitScalarExpr(E: E->getArg(Arg: 1));
7169 Alignment = CGF.Builder.CreateZExtOrTrunc(V: Alignment, DestTy: IntType, Name: "alignment");
7170 auto *One = llvm::ConstantInt::get(Ty: IntType, V: 1);
7171 Mask = CGF.Builder.CreateSub(LHS: Alignment, RHS: One, Name: "mask");
7172 }
7173};
7174} // namespace
7175
7176/// Generate (x & (y-1)) == 0.
7177RValue CodeGenFunction::EmitBuiltinIsAligned(const CallExpr *E) {
7178 BuiltinAlignArgs Args(E, *this);
7179 llvm::Value *SrcAddress = Args.Src;
7180 if (Args.SrcType->isPointerTy())
7181 SrcAddress =
7182 Builder.CreateBitOrPointerCast(V: Args.Src, DestTy: Args.IntType, Name: "src_addr");
7183 return RValue::get(V: Builder.CreateICmpEQ(
7184 LHS: Builder.CreateAnd(LHS: SrcAddress, RHS: Args.Mask, Name: "set_bits"),
7185 RHS: llvm::Constant::getNullValue(Ty: Args.IntType), Name: "is_aligned"));
7186}
7187
7188/// Generate (x & ~(y-1)) to align down or ((x+(y-1)) & ~(y-1)) to align up.
7189/// Note: For pointer types we can avoid ptrtoint/inttoptr pairs by using the
7190/// llvm.ptrmask intrinsic (with a GEP before in the align_up case).
7191RValue CodeGenFunction::EmitBuiltinAlignTo(const CallExpr *E, bool AlignUp) {
7192 BuiltinAlignArgs Args(E, *this);
7193 llvm::Value *SrcForMask = Args.Src;
7194 if (AlignUp) {
7195 // When aligning up we have to first add the mask to ensure we go over the
7196 // next alignment value and then align down to the next valid multiple.
7197 // By adding the mask, we ensure that align_up on an already aligned
7198 // value will not change the value.
7199 if (Args.Src->getType()->isPointerTy()) {
7200 if (getLangOpts().PointerOverflowDefined)
7201 SrcForMask =
7202 Builder.CreateGEP(Ty: Int8Ty, Ptr: SrcForMask, IdxList: Args.Mask, Name: "over_boundary");
7203 else
7204 SrcForMask = EmitCheckedInBoundsGEP(ElemTy: Int8Ty, Ptr: SrcForMask, IdxList: Args.Mask,
7205 /*SignedIndices=*/true,
7206 /*isSubtraction=*/IsSubtraction: false,
7207 Loc: E->getExprLoc(), Name: "over_boundary");
7208 } else {
7209 SrcForMask = Builder.CreateAdd(LHS: SrcForMask, RHS: Args.Mask, Name: "over_boundary");
7210 }
7211 }
7212 // Invert the mask to only clear the lower bits.
7213 llvm::Value *InvertedMask = Builder.CreateNot(V: Args.Mask, Name: "inverted_mask");
7214 llvm::Value *Result = nullptr;
7215 if (Args.Src->getType()->isPointerTy()) {
7216 Result = Builder.CreateIntrinsic(
7217 ID: Intrinsic::ptrmask, OverloadTypes: {Args.SrcType, Args.IntType},
7218 Args: {SrcForMask, InvertedMask}, FMFSource: nullptr, Name: "aligned_result");
7219 } else {
7220 Result = Builder.CreateAnd(LHS: SrcForMask, RHS: InvertedMask, Name: "aligned_result");
7221 }
7222 assert(Result->getType() == Args.SrcType);
7223 return RValue::get(V: Result);
7224}
7225