1//===--- Function.h - Bytecode function for the VM --------------*- C++ -*-===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8//
9// Defines the Function class which holds all bytecode function-specific data.
10//
11// The scope class which describes local variables is also defined here.
12//
13//===----------------------------------------------------------------------===//
14
15#ifndef LLVM_CLANG_AST_INTERP_FUNCTION_H
16#define LLVM_CLANG_AST_INTERP_FUNCTION_H
17
18#include "Descriptor.h"
19#include "Source.h"
20#include "clang/AST/Attr.h"
21#include "clang/AST/Decl.h"
22#include "clang/AST/DeclCXX.h"
23#include "llvm/ADT/PointerUnion.h"
24#include "llvm/Support/raw_ostream.h"
25
26namespace clang {
27namespace interp {
28class Program;
29class ByteCodeEmitter;
30class Pointer;
31enum PrimType : uint8_t;
32
33/// Describes a scope block.
34///
35/// The block gathers all the descriptors of the locals defined in this block.
36class Scope final {
37public:
38 /// Information about a local's storage.
39 struct Local {
40 /// Offset of the local in frame.
41 unsigned Offset;
42 /// Descriptor of the local.
43 Descriptor *Desc;
44 /// If the cleanup for this local should be emitted.
45 bool EnabledByDefault = true;
46 };
47
48 using LocalVectorTy = llvm::SmallVector<Local, 8>;
49
50 Scope(LocalVectorTy &&Descriptors) : Descriptors(std::move(Descriptors)) {}
51
52 llvm::iterator_range<LocalVectorTy::const_iterator> locals() const {
53 return llvm::make_range(x: Descriptors.begin(), y: Descriptors.end());
54 }
55
56 llvm::iterator_range<LocalVectorTy::const_reverse_iterator>
57 locals_reverse() const {
58 return llvm::reverse(C: Descriptors);
59 }
60
61private:
62 /// Object descriptors in this block.
63 LocalVectorTy Descriptors;
64};
65
66using FunctionDeclTy =
67 llvm::PointerUnion<const FunctionDecl *, const BlockExpr *>;
68
69/// Bytecode function.
70///
71/// Contains links to the bytecode of the function, as well as metadata
72/// describing all arguments and stack-local variables.
73///
74/// # Calling Convention
75///
76/// When calling a function, all argument values must be on the stack.
77///
78/// If the function has a This pointer (i.e. hasThisPointer() returns true,
79/// the argument values need to be preceeded by a Pointer for the This object.
80///
81/// If the function uses Return Value Optimization, the arguments (and
82/// potentially the This pointer) need to be preceeded by a Pointer pointing
83/// to the location to construct the returned value.
84///
85/// After the function has been called, it will remove all arguments,
86/// including RVO and This pointer, from the stack.
87///
88/// The parameters saved in a clang::intepr::Function include both the
89/// instance pointer as well as the RVO pointer.
90///
91/// \verbatim
92/// Stack position when calling ─────┐
93/// this Function │
94///
95/// ┌─────┬──────┬────────┬────────┬─────┬────────────────────┐
96/// │ RVO │ This │ Param1 │ Param2 │ ... │ │
97/// └─────┴──────┴────────┴────────┴─────┴────────────────────┘
98/// \endverbatim
99class Function final {
100public:
101 enum class FunctionKind {
102 Normal,
103 Ctor,
104 Dtor,
105 LambdaStaticInvoker,
106 LambdaCallOperator,
107 CopyOrMoveOperator,
108 };
109
110 struct ParamDescriptor {
111 const Descriptor *Desc;
112 /// Offset on the stack.
113 unsigned Offset;
114 /// Offset in the InterpFrame.
115 unsigned BlockOffset;
116 PrimType T;
117 ParamDescriptor(const Descriptor *Desc, unsigned Offset,
118 unsigned BlockOffset, PrimType T)
119 : Desc(Desc), Offset(Offset), BlockOffset(BlockOffset), T(T) {}
120 };
121
122 /// Returns the size of the function's local stack.
123 unsigned getFrameSize() const { return FrameSize; }
124 /// Returns the size of the argument stack.
125 unsigned getArgSize() const { return ArgSize; }
126
127 /// Returns a pointer to the start of the code.
128 CodePtr getCodeBegin() const { return Code.data(); }
129 /// Returns a pointer to the end of the code.
130 CodePtr getCodeEnd() const { return Code.data() + Code.size(); }
131
132 /// Returns the original FunctionDecl.
133 const FunctionDecl *getDecl() const {
134 return dyn_cast<const FunctionDecl *>(Val: Source);
135 }
136 const BlockExpr *getExpr() const {
137 return dyn_cast<const BlockExpr *>(Val: Source);
138 }
139
140 /// Returns the name of the function decl this code
141 /// was generated for.
142 std::string getName() const {
143 if (!Source || !getDecl())
144 return "<<expr>>";
145
146 return getDecl()->getQualifiedNameAsString();
147 }
148
149 /// Returns a parameter descriptor.
150 ParamDescriptor getParamDescriptor(unsigned Index) const {
151 return ParamDescriptors[Index];
152 }
153
154 /// Checks if the first argument is a RVO pointer.
155 bool hasRVO() const { return HasRVO; }
156
157 bool hasNonNullAttr() const { return getDecl()->hasAttr<NonNullAttr>(); }
158
159 /// Range over the scope blocks.
160 llvm::iterator_range<llvm::SmallVector<Scope, 2>::const_iterator>
161 scopes() const {
162 return llvm::make_range(x: Scopes.begin(), y: Scopes.end());
163 }
164
165 /// Range over argument types.
166 using arg_reverse_iterator =
167 SmallVectorImpl<ParamDescriptor>::const_reverse_iterator;
168 llvm::iterator_range<arg_reverse_iterator> args_reverse() const {
169 return llvm::reverse(C: ParamDescriptors);
170 }
171
172 /// Returns a specific scope.
173 Scope &getScope(unsigned Idx) { return Scopes[Idx]; }
174 const Scope &getScope(unsigned Idx) const { return Scopes[Idx]; }
175
176 /// Returns the source information at a given PC.
177 SourceInfo getSource(CodePtr PC) const;
178
179 /// Checks if the function is valid to call.
180 bool isValid() const { return IsValid || isLambdaStaticInvoker(); }
181
182 /// Checks if the function is virtual.
183 bool isVirtual() const { return Virtual; };
184 bool isImmediate() const { return Immediate; }
185 bool isConstexpr() const { return Constexpr; }
186
187 /// Checks if the function is a constructor.
188 bool isConstructor() const { return Kind == FunctionKind::Ctor; }
189 /// Checks if the function is a destructor.
190 bool isDestructor() const { return Kind == FunctionKind::Dtor; }
191 /// Checks if the function is copy or move operator.
192 bool isCopyOrMoveOperator() const {
193 return Kind == FunctionKind::CopyOrMoveOperator;
194 }
195
196 /// Returns whether this function is a lambda static invoker,
197 /// which we generate custom byte code for.
198 bool isLambdaStaticInvoker() const {
199 return Kind == FunctionKind::LambdaStaticInvoker;
200 }
201
202 /// Returns whether this function is the call operator
203 /// of a lambda record decl.
204 bool isLambdaCallOperator() const {
205 return Kind == FunctionKind::LambdaCallOperator;
206 }
207
208 /// Returns the parent record decl, if any.
209 const CXXRecordDecl *getParentDecl() const {
210 if (const auto *MD = dyn_cast_if_present<CXXMethodDecl>(
211 Val: dyn_cast<const FunctionDecl *>(Val: Source)))
212 return MD->getParent();
213 return nullptr;
214 }
215
216 /// Checks if the function is fully done compiling.
217 bool isFullyCompiled() const { return IsFullyCompiled; }
218
219 bool hasThisPointer() const { return HasThisPointer; }
220
221 /// Checks if the function already has a body attached.
222 bool hasBody() const { return HasBody; }
223
224 /// Checks if the function is defined.
225 bool isDefined() const { return Defined; }
226
227 bool isVariadic() const { return Variadic; }
228
229 unsigned getNumParams() const {
230 return ParamDescriptors.size() + hasThisPointer() + hasRVO();
231 }
232
233 /// Returns the number of parameter this function takes when it's called,
234 /// i.e excluding the instance pointer and the RVO pointer.
235 unsigned getNumWrittenParams() const {
236 assert(getNumParams() >= (unsigned)(hasThisPointer() + hasRVO()));
237 return ParamDescriptors.size();
238 }
239 unsigned getWrittenArgSize() const {
240 return ArgSize - (align(Size: primSize(Type: PT_Ptr)) * (hasThisPointer() + hasRVO()));
241 }
242
243 bool isThisPointerExplicit() const {
244 if (const auto *MD = dyn_cast_if_present<CXXMethodDecl>(
245 Val: dyn_cast<const FunctionDecl *>(Val: Source)))
246 return MD->isExplicitObjectMemberFunction();
247 return false;
248 }
249
250private:
251 /// Construct a function representing an actual function.
252 Function(Program &P, FunctionDeclTy Source, unsigned ArgSize,
253 llvm::SmallVectorImpl<ParamDescriptor> &&ParamDescriptors,
254 bool HasThisPointer, bool HasRVO, bool IsLambdaStaticInvoker);
255
256 /// Sets the code of a function.
257 void setCode(FunctionDeclTy Source, unsigned NewFrameSize,
258 llvm::SmallVector<std::byte> &&NewCode, SourceMap &&NewSrcMap,
259 llvm::SmallVector<Scope, 2> &&NewScopes, bool NewHasBody,
260 bool NewIsValid) {
261 this->Source = Source;
262 FrameSize = NewFrameSize;
263 Code = std::move(NewCode);
264 SrcMap = std::move(NewSrcMap);
265 Scopes = std::move(NewScopes);
266 IsValid = NewIsValid;
267 HasBody = NewHasBody;
268 }
269
270 void setIsFullyCompiled(bool FC) { IsFullyCompiled = FC; }
271 void setDefined(bool D) { Defined = D; }
272
273private:
274 friend class Program;
275 friend class ByteCodeEmitter;
276 friend class Context;
277
278 /// Program reference.
279 Program &P;
280 /// Function Kind.
281 FunctionKind Kind;
282 /// Declaration this function was compiled from.
283 FunctionDeclTy Source;
284 /// Local area size: storage + metadata.
285 unsigned FrameSize = 0;
286 /// Size of the argument stack.
287 unsigned ArgSize;
288 /// Program code.
289 llvm::SmallVector<std::byte> Code;
290 /// Opcode-to-expression mapping.
291 SourceMap SrcMap;
292 /// List of block descriptors.
293 llvm::SmallVector<Scope, 2> Scopes;
294 /// List of all parameters, including RVO and instance pointer.
295 llvm::SmallVector<ParamDescriptor> ParamDescriptors;
296 /// Flag to indicate if the function is valid.
297 LLVM_PREFERRED_TYPE(bool)
298 unsigned IsValid : 1;
299 /// Flag to indicate if the function is done being
300 /// compiled to bytecode.
301 LLVM_PREFERRED_TYPE(bool)
302 unsigned IsFullyCompiled : 1;
303 /// Flag indicating if this function takes the this pointer
304 /// as the first implicit argument
305 LLVM_PREFERRED_TYPE(bool)
306 unsigned HasThisPointer : 1;
307 /// Whether this function has Return Value Optimization, i.e.
308 /// the return value is constructed in the caller's stack frame.
309 /// This is done for functions that return non-primive values.
310 LLVM_PREFERRED_TYPE(bool)
311 unsigned HasRVO : 1;
312 /// If we've already compiled the function's body.
313 LLVM_PREFERRED_TYPE(bool)
314 unsigned HasBody : 1;
315 LLVM_PREFERRED_TYPE(bool)
316 unsigned Defined : 1;
317 LLVM_PREFERRED_TYPE(bool)
318 unsigned Variadic : 1;
319 LLVM_PREFERRED_TYPE(bool)
320 unsigned Virtual : 1;
321 LLVM_PREFERRED_TYPE(bool)
322 unsigned Immediate : 1;
323 LLVM_PREFERRED_TYPE(bool)
324 unsigned Constexpr : 1;
325
326public:
327 /// Dumps the disassembled bytecode to \c llvm::errs().
328 void dump() const { dump(PC: {}); }
329 void dump(CodePtr PC) const;
330 void dump(llvm::raw_ostream &OS, CodePtr PC = {}) const;
331};
332
333} // namespace interp
334} // namespace clang
335
336#endif
337