1//===-- AMDGPULibFunc.cpp -------------------------------------------------===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8//
9// This file contains utility functions to work with Itanium mangled names
10//
11//===----------------------------------------------------------------------===//
12
#include "AMDGPULibFunc.h"
#include "AMDGPU.h"
#include "llvm/ADT/StringExtras.h"
#include "llvm/ADT/StringMap.h"
#include "llvm/ADT/StringSwitch.h"
#include "llvm/IR/DerivedTypes.h"
#include "llvm/IR/Function.h"
#include "llvm/IR/Module.h"
#include "llvm/IR/ValueSymbolTable.h"
#include "llvm/Support/CommandLine.h"
#include "llvm/Support/ModRef.h"
#include "llvm/Support/raw_ostream.h"
#include <limits>
25
26using namespace llvm;
27
28static cl::opt<bool> EnableOCLManglingMismatchWA(
29 "amdgpu-enable-ocl-mangling-mismatch-workaround", cl::init(Val: true),
30 cl::ReallyHidden,
31 cl::desc("Enable the workaround for OCL name mangling mismatch."));
32
33namespace {
34
// Rules describing how a formal parameter type is produced. The values are
// stored in ManglingRule::Param; zero (E_NONE) marks the end of a rule list.
// EX_* rules name a fixed type, E_* rules derive a type from a lead argument
// (see ParamIterator::getNextParam()).
enum EManglingParam {
  E_NONE,            // no parameter
  EX_EVENT,          // event type
  EX_FLOAT4,         // 4-element vector of F32
  EX_INTV4,          // 4-element vector of I32
  EX_RESERVEDID,     // not translated yet (TBD)
  EX_SAMPLER,        // sampler type
  EX_SIZET,          // U64
  EX_UINT,           // U32
  EX_UINTV4,         // 4-element vector of U32
  E_ANY,             // lead type, unchanged
  E_CONSTPTR_ANY,    // lead type with CONST added to the pointer kind
  E_CONSTPTR_SWAPGL, // lead type, global/local address space swapped, CONST
  E_COPY,            // lead type, unchanged
  E_IMAGECOORDS,     // by-value I32 vector sized from the lead image type
  E_POINTEE,         // lead type passed by value
  E_SETBASE_I32,     // lead type with ArgType replaced by I32
  E_SETBASE_U32,     // lead type with ArgType replaced by U32
  E_MAKEBASE_UNS,    // lead type with its base type replaced by UINT
  E_V16_OF_POINTEE,  // by-value 16-element vector of the lead type
  E_V2_OF_POINTEE,   // by-value 2-element vector of the lead type
  E_V3_OF_POINTEE,   // by-value 3-element vector of the lead type
  E_V4_OF_POINTEE,   // by-value 4-element vector of the lead type
  E_V8_OF_POINTEE,   // by-value 8-element vector of the lead type
  E_VLTLPTR_ANY,     // lead type with VOLATILE added to the pointer kind
};
61
62struct ManglingRule {
63 const char *Name;
64 unsigned char Lead[2];
65 unsigned char Param[5];
66
67 int maxLeadIndex() const { return (std::max)(a: Lead[0], b: Lead[1]); }
68 int getNumLeads() const { return (Lead[0] ? 1 : 0) + (Lead[1] ? 1 : 0); }
69
70 unsigned getNumArgs() const;
71
72 static StringMap<int> buildManglingRulesMap();
73};
74
75// Information about library functions with unmangled names.
76class UnmangledFuncInfo {
77 const char *Name;
78 unsigned NumArgs;
79
80 // Table for all lib functions with unmangled names.
81 static const UnmangledFuncInfo Table[];
82
83 // Number of entries in Table.
84 static const unsigned TableSize;
85
86 static StringMap<unsigned> buildNameMap();
87
88public:
89 using ID = AMDGPULibFunc::EFuncId;
90 constexpr UnmangledFuncInfo(const char *_Name, unsigned _NumArgs)
91 : Name(_Name), NumArgs(_NumArgs) {}
92 // Get index to Table by function name.
93 static bool lookup(StringRef Name, ID &Id);
94 static unsigned toIndex(ID Id) {
95 assert(static_cast<unsigned>(Id) >
96 static_cast<unsigned>(AMDGPULibFunc::EI_LAST_MANGLED) &&
97 "Invalid unmangled library function");
98 return static_cast<unsigned>(Id) - 1 -
99 static_cast<unsigned>(AMDGPULibFunc::EI_LAST_MANGLED);
100 }
101 static ID toFuncId(unsigned Index) {
102 assert(Index < TableSize &&
103 "Invalid unmangled library function");
104 return static_cast<ID>(
105 Index + 1 + static_cast<unsigned>(AMDGPULibFunc::EI_LAST_MANGLED));
106 }
107 static unsigned getNumArgs(ID Id) { return Table[toIndex(Id)].NumArgs; }
108 static StringRef getName(ID Id) { return Table[toIndex(Id)].Name; }
109};
110
111unsigned ManglingRule::getNumArgs() const {
112 unsigned I=0;
113 while (I < (sizeof Param/sizeof Param[0]) && Param[I]) ++I;
114 return I;
115}
116
117// This table describes function formal argument type rules. The order of rules
118// corresponds to the EFuncId enum at AMDGPULibFunc.h
119//
120// "<func name>", { <leads> }, { <param rules> }
121// where:
// <leads> - list of integers that are one-based indexes of formal argument
//    used to mangle a function name. Other argument types are derived from types
//    of these 'leads'. The order of integers in this list corresponds to the
//    order in which these arguments are mangled in the EDG mangling scheme. The
//    same order should be preserved for arguments in the AMDGPULibFunc structure
//    when it is used for mangling. For example:
//    { "vstorea_half", {3,1}, {E_ANY,EX_SIZET,E_ANY}},
//    will be mangled in EDG scheme as  vstorea_half_<3rdparam>_<1stparam>
//    When mangling from code use:
//    AMDGPULibFunc insc;
//    insc.param[0] = ... // describe 3rd parameter
//    insc.param[1] = ... // describe 1st parameter
134//
135// <param rules> - list of rules used to derive all of the function formal
136// argument types. EX_ prefixed are simple types, other derived from the
137// latest 'lead' argument type in the order of encoding from first to last.
138// E_ANY - use prev lead type, E_CONSTPTR_ANY - make const pointer out of
139// prev lead type, etc. see ParamIterator::getNextParam() for details.
140
141static constexpr ManglingRule manglingRules[] = {
142{ .Name: "", .Lead: {0}, .Param: {0} },
143{ .Name: "abs" , .Lead: {1}, .Param: {E_ANY}},
144{ .Name: "abs_diff" , .Lead: {1}, .Param: {E_ANY,E_COPY}},
145{ .Name: "acos" , .Lead: {1}, .Param: {E_ANY}},
146{ .Name: "acosh" , .Lead: {1}, .Param: {E_ANY}},
147{ .Name: "acospi" , .Lead: {1}, .Param: {E_ANY}},
148{ .Name: "add_sat" , .Lead: {1}, .Param: {E_ANY,E_COPY}},
149{ .Name: "all" , .Lead: {1}, .Param: {E_ANY}},
150{ .Name: "any" , .Lead: {1}, .Param: {E_ANY}},
151{ .Name: "asin" , .Lead: {1}, .Param: {E_ANY}},
152{ .Name: "asinh" , .Lead: {1}, .Param: {E_ANY}},
153{ .Name: "asinpi" , .Lead: {1}, .Param: {E_ANY}},
154{ .Name: "async_work_group_copy" , .Lead: {1}, .Param: {E_ANY,E_CONSTPTR_SWAPGL,EX_SIZET,EX_EVENT}},
155{ .Name: "async_work_group_strided_copy" , .Lead: {1}, .Param: {E_ANY,E_CONSTPTR_SWAPGL,EX_SIZET,EX_SIZET,EX_EVENT}},
156{ .Name: "atan" , .Lead: {1}, .Param: {E_ANY}},
157{ .Name: "atan2" , .Lead: {1}, .Param: {E_ANY,E_COPY}},
158{ .Name: "atan2pi" , .Lead: {1}, .Param: {E_ANY,E_COPY}},
159{ .Name: "atanh" , .Lead: {1}, .Param: {E_ANY}},
160{ .Name: "atanpi" , .Lead: {1}, .Param: {E_ANY}},
161{ .Name: "atomic_add" , .Lead: {1}, .Param: {E_VLTLPTR_ANY,E_POINTEE}},
162{ .Name: "atomic_and" , .Lead: {1}, .Param: {E_VLTLPTR_ANY,E_POINTEE}},
163{ .Name: "atomic_cmpxchg" , .Lead: {1}, .Param: {E_VLTLPTR_ANY,E_POINTEE,E_POINTEE}},
164{ .Name: "atomic_dec" , .Lead: {1}, .Param: {E_VLTLPTR_ANY}},
165{ .Name: "atomic_inc" , .Lead: {1}, .Param: {E_VLTLPTR_ANY}},
166{ .Name: "atomic_max" , .Lead: {1}, .Param: {E_VLTLPTR_ANY,E_POINTEE}},
167{ .Name: "atomic_min" , .Lead: {1}, .Param: {E_VLTLPTR_ANY,E_POINTEE}},
168{ .Name: "atomic_or" , .Lead: {1}, .Param: {E_VLTLPTR_ANY,E_POINTEE}},
169{ .Name: "atomic_sub" , .Lead: {1}, .Param: {E_VLTLPTR_ANY,E_POINTEE}},
170{ .Name: "atomic_xchg" , .Lead: {1}, .Param: {E_VLTLPTR_ANY,E_POINTEE}},
171{ .Name: "atomic_xor" , .Lead: {1}, .Param: {E_VLTLPTR_ANY,E_POINTEE}},
172{ .Name: "bitselect" , .Lead: {1}, .Param: {E_ANY,E_COPY,E_COPY}},
173{ .Name: "cbrt" , .Lead: {1}, .Param: {E_ANY}},
174{ .Name: "ceil" , .Lead: {1}, .Param: {E_ANY}},
175{ .Name: "clamp" , .Lead: {1}, .Param: {E_ANY,E_COPY,E_COPY}},
176{ .Name: "clz" , .Lead: {1}, .Param: {E_ANY}},
177{ .Name: "commit_read_pipe" , .Lead: {1}, .Param: {E_ANY,EX_RESERVEDID}},
178{ .Name: "commit_write_pipe" , .Lead: {1}, .Param: {E_ANY,EX_RESERVEDID}},
179{ .Name: "copysign" , .Lead: {1}, .Param: {E_ANY,E_COPY}},
180{ .Name: "cos" , .Lead: {1}, .Param: {E_ANY}},
181{ .Name: "cosh" , .Lead: {1}, .Param: {E_ANY}},
182{ .Name: "cospi" , .Lead: {1}, .Param: {E_ANY}},
183{ .Name: "cross" , .Lead: {1}, .Param: {E_ANY,E_COPY}},
184{ .Name: "ctz" , .Lead: {1}, .Param: {E_ANY}},
185{ .Name: "degrees" , .Lead: {1}, .Param: {E_ANY}},
186{ .Name: "distance" , .Lead: {1}, .Param: {E_ANY,E_COPY}},
187{ .Name: "divide" , .Lead: {1}, .Param: {E_ANY,E_COPY}},
188{ .Name: "dot" , .Lead: {1}, .Param: {E_ANY,E_COPY}},
189{ .Name: "erf" , .Lead: {1}, .Param: {E_ANY}},
190{ .Name: "erfc" , .Lead: {1}, .Param: {E_ANY}},
191{ .Name: "exp" , .Lead: {1}, .Param: {E_ANY}},
192{ .Name: "exp10" , .Lead: {1}, .Param: {E_ANY}},
193{ .Name: "exp2" , .Lead: {1}, .Param: {E_ANY}},
194{ .Name: "expm1" , .Lead: {1}, .Param: {E_ANY}},
195{ .Name: "fabs" , .Lead: {1}, .Param: {E_ANY}},
196{ .Name: "fast_distance" , .Lead: {1}, .Param: {E_ANY,E_COPY}},
197{ .Name: "fast_length" , .Lead: {1}, .Param: {E_ANY}},
198{ .Name: "fast_normalize" , .Lead: {1}, .Param: {E_ANY}},
199{ .Name: "fdim" , .Lead: {1}, .Param: {E_ANY,E_COPY}},
200{ .Name: "floor" , .Lead: {1}, .Param: {E_ANY}},
201{ .Name: "fma" , .Lead: {1}, .Param: {E_ANY,E_COPY,E_COPY}},
202{ .Name: "fmax" , .Lead: {1}, .Param: {E_ANY,E_COPY}},
203{ .Name: "fmin" , .Lead: {1}, .Param: {E_ANY,E_COPY}},
204{ .Name: "fmod" , .Lead: {1}, .Param: {E_ANY,E_COPY}},
205{ .Name: "fract" , .Lead: {2}, .Param: {E_POINTEE,E_ANY}},
206{ .Name: "frexp" , .Lead: {1,2}, .Param: {E_ANY,E_ANY}},
207{ .Name: "get_image_array_size" , .Lead: {1}, .Param: {E_ANY}},
208{ .Name: "get_image_channel_data_type" , .Lead: {1}, .Param: {E_ANY}},
209{ .Name: "get_image_channel_order" , .Lead: {1}, .Param: {E_ANY}},
210{ .Name: "get_image_dim" , .Lead: {1}, .Param: {E_ANY}},
211{ .Name: "get_image_height" , .Lead: {1}, .Param: {E_ANY}},
212{ .Name: "get_image_width" , .Lead: {1}, .Param: {E_ANY}},
213{ .Name: "get_pipe_max_packets" , .Lead: {1}, .Param: {E_ANY}},
214{ .Name: "get_pipe_num_packets" , .Lead: {1}, .Param: {E_ANY}},
215{ .Name: "hadd" , .Lead: {1}, .Param: {E_ANY,E_COPY}},
216{ .Name: "hypot" , .Lead: {1}, .Param: {E_ANY,E_COPY}},
217{ .Name: "ilogb" , .Lead: {1}, .Param: {E_ANY}},
218{ .Name: "isequal" , .Lead: {1}, .Param: {E_ANY,E_COPY}},
219{ .Name: "isfinite" , .Lead: {1}, .Param: {E_ANY}},
220{ .Name: "isgreater" , .Lead: {1}, .Param: {E_ANY,E_COPY}},
221{ .Name: "isgreaterequal" , .Lead: {1}, .Param: {E_ANY,E_COPY}},
222{ .Name: "isinf" , .Lead: {1}, .Param: {E_ANY}},
223{ .Name: "isless" , .Lead: {1}, .Param: {E_ANY,E_COPY}},
224{ .Name: "islessequal" , .Lead: {1}, .Param: {E_ANY,E_COPY}},
225{ .Name: "islessgreater" , .Lead: {1}, .Param: {E_ANY,E_COPY}},
226{ .Name: "isnan" , .Lead: {1}, .Param: {E_ANY}},
227{ .Name: "isnormal" , .Lead: {1}, .Param: {E_ANY}},
228{ .Name: "isnotequal" , .Lead: {1}, .Param: {E_ANY,E_COPY}},
229{ .Name: "isordered" , .Lead: {1}, .Param: {E_ANY,E_COPY}},
230{ .Name: "isunordered" , .Lead: {1}, .Param: {E_ANY,E_COPY}},
231{ .Name: "ldexp" , .Lead: {1}, .Param: {E_ANY,E_SETBASE_I32}},
232{ .Name: "length" , .Lead: {1}, .Param: {E_ANY}},
233{ .Name: "lgamma" , .Lead: {1}, .Param: {E_ANY}},
234{ .Name: "lgamma_r" , .Lead: {1,2}, .Param: {E_ANY,E_ANY}},
235{ .Name: "log" , .Lead: {1}, .Param: {E_ANY}},
236{ .Name: "log10" , .Lead: {1}, .Param: {E_ANY}},
237{ .Name: "log1p" , .Lead: {1}, .Param: {E_ANY}},
238{ .Name: "log2" , .Lead: {1}, .Param: {E_ANY}},
239{ .Name: "logb" , .Lead: {1}, .Param: {E_ANY}},
240{ .Name: "mad" , .Lead: {1}, .Param: {E_ANY,E_COPY,E_COPY}},
241{ .Name: "mad24" , .Lead: {1}, .Param: {E_ANY,E_COPY,E_COPY}},
242{ .Name: "mad_hi" , .Lead: {1}, .Param: {E_ANY,E_COPY,E_COPY}},
243{ .Name: "mad_sat" , .Lead: {1}, .Param: {E_ANY,E_COPY,E_COPY}},
244{ .Name: "max" , .Lead: {1}, .Param: {E_ANY,E_COPY}},
245{ .Name: "maxmag" , .Lead: {1}, .Param: {E_ANY,E_COPY}},
246{ .Name: "min" , .Lead: {1}, .Param: {E_ANY,E_COPY}},
247{ .Name: "minmag" , .Lead: {1}, .Param: {E_ANY,E_COPY}},
248{ .Name: "mix" , .Lead: {1}, .Param: {E_ANY,E_COPY,E_COPY}},
249{ .Name: "modf" , .Lead: {2}, .Param: {E_POINTEE,E_ANY}},
250{ .Name: "mul24" , .Lead: {1}, .Param: {E_ANY,E_COPY}},
251{ .Name: "mul_hi" , .Lead: {1}, .Param: {E_ANY,E_COPY}},
252{ .Name: "nan" , .Lead: {1}, .Param: {E_ANY}},
253{ .Name: "nextafter" , .Lead: {1}, .Param: {E_ANY,E_COPY}},
254{ .Name: "normalize" , .Lead: {1}, .Param: {E_ANY}},
255{ .Name: "popcount" , .Lead: {1}, .Param: {E_ANY}},
256{ .Name: "pow" , .Lead: {1}, .Param: {E_ANY,E_COPY}},
257{ .Name: "pown" , .Lead: {1}, .Param: {E_ANY,E_SETBASE_I32}},
258{ .Name: "powr" , .Lead: {1}, .Param: {E_ANY,E_COPY}},
259{ .Name: "prefetch" , .Lead: {1}, .Param: {E_CONSTPTR_ANY,EX_SIZET}},
260{ .Name: "radians" , .Lead: {1}, .Param: {E_ANY}},
261{ .Name: "recip" , .Lead: {1}, .Param: {E_ANY}},
262{ .Name: "remainder" , .Lead: {1}, .Param: {E_ANY,E_COPY}},
263{ .Name: "remquo" , .Lead: {1,3}, .Param: {E_ANY,E_COPY,E_ANY}},
264{ .Name: "reserve_read_pipe" , .Lead: {1}, .Param: {E_ANY,EX_UINT}},
265{ .Name: "reserve_write_pipe" , .Lead: {1}, .Param: {E_ANY,EX_UINT}},
266{ .Name: "rhadd" , .Lead: {1}, .Param: {E_ANY,E_COPY}},
267{ .Name: "rint" , .Lead: {1}, .Param: {E_ANY}},
268{ .Name: "rootn" , .Lead: {1}, .Param: {E_ANY,E_SETBASE_I32}},
269{ .Name: "rotate" , .Lead: {1}, .Param: {E_ANY,E_COPY}},
270{ .Name: "round" , .Lead: {1}, .Param: {E_ANY}},
271{ .Name: "rsqrt" , .Lead: {1}, .Param: {E_ANY}},
272{ .Name: "select" , .Lead: {1,3}, .Param: {E_ANY,E_COPY,E_ANY}},
273{ .Name: "shuffle" , .Lead: {1,2}, .Param: {E_ANY,E_ANY}},
274{ .Name: "shuffle2" , .Lead: {1,3}, .Param: {E_ANY,E_COPY,E_ANY}},
275{ .Name: "sign" , .Lead: {1}, .Param: {E_ANY}},
276{ .Name: "signbit" , .Lead: {1}, .Param: {E_ANY}},
277{ .Name: "sin" , .Lead: {1}, .Param: {E_ANY}},
278{ .Name: "sincos" , .Lead: {2}, .Param: {E_POINTEE,E_ANY}},
279{ .Name: "sinh" , .Lead: {1}, .Param: {E_ANY}},
280{ .Name: "sinpi" , .Lead: {1}, .Param: {E_ANY}},
281{ .Name: "smoothstep" , .Lead: {1}, .Param: {E_ANY,E_COPY,E_COPY}},
282{ .Name: "sqrt" , .Lead: {1}, .Param: {E_ANY}},
283{ .Name: "step" , .Lead: {1}, .Param: {E_ANY,E_COPY}},
284{ .Name: "sub_group_broadcast" , .Lead: {1}, .Param: {E_ANY,EX_UINT}},
285{ .Name: "sub_group_commit_read_pipe" , .Lead: {1}, .Param: {E_ANY,EX_RESERVEDID}},
286{ .Name: "sub_group_commit_write_pipe" , .Lead: {1}, .Param: {E_ANY,EX_RESERVEDID}},
287{ .Name: "sub_group_reduce_add" , .Lead: {1}, .Param: {E_ANY}},
288{ .Name: "sub_group_reduce_max" , .Lead: {1}, .Param: {E_ANY}},
289{ .Name: "sub_group_reduce_min" , .Lead: {1}, .Param: {E_ANY}},
290{ .Name: "sub_group_reserve_read_pipe" , .Lead: {1}, .Param: {E_ANY,EX_UINT}},
291{ .Name: "sub_group_reserve_write_pipe" , .Lead: {1}, .Param: {E_ANY,EX_UINT}},
292{ .Name: "sub_group_scan_exclusive_add" , .Lead: {1}, .Param: {E_ANY}},
293{ .Name: "sub_group_scan_exclusive_max" , .Lead: {1}, .Param: {E_ANY}},
294{ .Name: "sub_group_scan_exclusive_min" , .Lead: {1}, .Param: {E_ANY}},
295{ .Name: "sub_group_scan_inclusive_add" , .Lead: {1}, .Param: {E_ANY}},
296{ .Name: "sub_group_scan_inclusive_max" , .Lead: {1}, .Param: {E_ANY}},
297{ .Name: "sub_group_scan_inclusive_min" , .Lead: {1}, .Param: {E_ANY}},
298{ .Name: "sub_sat" , .Lead: {1}, .Param: {E_ANY,E_COPY}},
299{ .Name: "tan" , .Lead: {1}, .Param: {E_ANY}},
300{ .Name: "tanh" , .Lead: {1}, .Param: {E_ANY}},
301{ .Name: "tanpi" , .Lead: {1}, .Param: {E_ANY}},
302{ .Name: "tgamma" , .Lead: {1}, .Param: {E_ANY}},
303{ .Name: "trunc" , .Lead: {1}, .Param: {E_ANY}},
304{ .Name: "upsample" , .Lead: {1}, .Param: {E_ANY,E_MAKEBASE_UNS}},
305{ .Name: "vec_step" , .Lead: {1}, .Param: {E_ANY}},
306{ .Name: "vstore" , .Lead: {3}, .Param: {E_POINTEE,EX_SIZET,E_ANY}},
307{ .Name: "vstore16" , .Lead: {3}, .Param: {E_V16_OF_POINTEE,EX_SIZET,E_ANY}},
308{ .Name: "vstore2" , .Lead: {3}, .Param: {E_V2_OF_POINTEE,EX_SIZET,E_ANY}},
309{ .Name: "vstore3" , .Lead: {3}, .Param: {E_V3_OF_POINTEE,EX_SIZET,E_ANY}},
310{ .Name: "vstore4" , .Lead: {3}, .Param: {E_V4_OF_POINTEE,EX_SIZET,E_ANY}},
311{ .Name: "vstore8" , .Lead: {3}, .Param: {E_V8_OF_POINTEE,EX_SIZET,E_ANY}},
312{ .Name: "work_group_commit_read_pipe" , .Lead: {1}, .Param: {E_ANY,EX_RESERVEDID}},
313{ .Name: "work_group_commit_write_pipe" , .Lead: {1}, .Param: {E_ANY,EX_RESERVEDID}},
314{ .Name: "work_group_reduce_add" , .Lead: {1}, .Param: {E_ANY}},
315{ .Name: "work_group_reduce_max" , .Lead: {1}, .Param: {E_ANY}},
316{ .Name: "work_group_reduce_min" , .Lead: {1}, .Param: {E_ANY}},
317{ .Name: "work_group_reserve_read_pipe" , .Lead: {1}, .Param: {E_ANY,EX_UINT}},
318{ .Name: "work_group_reserve_write_pipe" , .Lead: {1}, .Param: {E_ANY,EX_UINT}},
319{ .Name: "work_group_scan_exclusive_add" , .Lead: {1}, .Param: {E_ANY}},
320{ .Name: "work_group_scan_exclusive_max" , .Lead: {1}, .Param: {E_ANY}},
321{ .Name: "work_group_scan_exclusive_min" , .Lead: {1}, .Param: {E_ANY}},
322{ .Name: "work_group_scan_inclusive_add" , .Lead: {1}, .Param: {E_ANY}},
323{ .Name: "work_group_scan_inclusive_max" , .Lead: {1}, .Param: {E_ANY}},
324{ .Name: "work_group_scan_inclusive_min" , .Lead: {1}, .Param: {E_ANY}},
325{ .Name: "write_imagef" , .Lead: {1}, .Param: {E_ANY,E_IMAGECOORDS,EX_FLOAT4}},
326{ .Name: "write_imagei" , .Lead: {1}, .Param: {E_ANY,E_IMAGECOORDS,EX_INTV4}},
327{ .Name: "write_imageui" , .Lead: {1}, .Param: {E_ANY,E_IMAGECOORDS,EX_UINTV4}},
328{ .Name: "ncos" , .Lead: {1}, .Param: {E_ANY} },
329{ .Name: "nexp2" , .Lead: {1}, .Param: {E_ANY} },
330{ .Name: "nfma" , .Lead: {1}, .Param: {E_ANY, E_COPY, E_COPY} },
331{ .Name: "nlog2" , .Lead: {1}, .Param: {E_ANY} },
332{ .Name: "nrcp" , .Lead: {1}, .Param: {E_ANY} },
333{ .Name: "nrsqrt" , .Lead: {1}, .Param: {E_ANY} },
334{ .Name: "nsin" , .Lead: {1}, .Param: {E_ANY} },
335{ .Name: "nsqrt" , .Lead: {1}, .Param: {E_ANY} },
336{ .Name: "ftz" , .Lead: {1}, .Param: {E_ANY} },
337{ .Name: "fldexp" , .Lead: {1}, .Param: {E_ANY, EX_UINT} },
338{ .Name: "class" , .Lead: {1}, .Param: {E_ANY, EX_UINT} },
339{ .Name: "rcbrt" , .Lead: {1}, .Param: {E_ANY} },
340};
341
342// Library functions with unmangled name.
343const UnmangledFuncInfo UnmangledFuncInfo::Table[] = {
344 {"__read_pipe_2", 4},
345 {"__read_pipe_4", 6},
346 {"__write_pipe_2", 4},
347 {"__write_pipe_4", 6},
348};
349
350const unsigned UnmangledFuncInfo::TableSize =
351 std::size(UnmangledFuncInfo::Table);
352
353static AMDGPULibFunc::Param getRetType(AMDGPULibFunc::EFuncId id,
354 const AMDGPULibFunc::Param (&Leads)[2]) {
355 AMDGPULibFunc::Param Res = Leads[0];
356 // TBD - This switch may require to be extended for other intrinsics
357 switch (id) {
358 case AMDGPULibFunc::EI_SINCOS:
359 Res.PtrKind = AMDGPULibFunc::BYVALUE;
360 break;
361 default:
362 break;
363 }
364 return Res;
365}
366
367class ParamIterator {
368 const AMDGPULibFunc::Param (&Leads)[2];
369 const ManglingRule& Rule;
370 int Index = 0;
371public:
372 ParamIterator(const AMDGPULibFunc::Param (&leads)[2],
373 const ManglingRule& rule)
374 : Leads(leads), Rule(rule) {}
375
376 AMDGPULibFunc::Param getNextParam();
377};
378
379AMDGPULibFunc::Param ParamIterator::getNextParam() {
380 AMDGPULibFunc::Param P;
381 if (Index >= int(sizeof Rule.Param/sizeof Rule.Param[0])) return P;
382
383 const char R = Rule.Param[Index];
384 switch (R) {
385 case E_NONE: break;
386 case EX_UINT:
387 P.ArgType = AMDGPULibFunc::U32; break;
388 case EX_INTV4:
389 P.ArgType = AMDGPULibFunc::I32; P.VectorSize = 4; break;
390 case EX_UINTV4:
391 P.ArgType = AMDGPULibFunc::U32; P.VectorSize = 4; break;
392 case EX_FLOAT4:
393 P.ArgType = AMDGPULibFunc::F32; P.VectorSize = 4; break;
394 case EX_SIZET:
395 P.ArgType = AMDGPULibFunc::U64; break;
396 case EX_EVENT:
397 P.ArgType = AMDGPULibFunc::EVENT; break;
398 case EX_SAMPLER:
399 P.ArgType = AMDGPULibFunc::SAMPLER; break;
400 case EX_RESERVEDID: break; // TBD
401 default:
402 if (Index == (Rule.Lead[1] - 1)) P = Leads[1];
403 else P = Leads[0];
404
405 switch (R) {
406 case E_ANY:
407 case E_COPY: break;
408
409 case E_POINTEE:
410 P.PtrKind = AMDGPULibFunc::BYVALUE; break;
411 case E_V2_OF_POINTEE:
412 P.VectorSize = 2; P.PtrKind = AMDGPULibFunc::BYVALUE; break;
413 case E_V3_OF_POINTEE:
414 P.VectorSize = 3; P.PtrKind = AMDGPULibFunc::BYVALUE; break;
415 case E_V4_OF_POINTEE:
416 P.VectorSize = 4; P.PtrKind = AMDGPULibFunc::BYVALUE; break;
417 case E_V8_OF_POINTEE:
418 P.VectorSize = 8; P.PtrKind = AMDGPULibFunc::BYVALUE; break;
419 case E_V16_OF_POINTEE:
420 P.VectorSize = 16; P.PtrKind = AMDGPULibFunc::BYVALUE; break;
421 case E_CONSTPTR_ANY:
422 P.PtrKind |= AMDGPULibFunc::CONST; break;
423 case E_VLTLPTR_ANY:
424 P.PtrKind |= AMDGPULibFunc::VOLATILE; break;
425 case E_SETBASE_I32:
426 P.ArgType = AMDGPULibFunc::I32; break;
427 case E_SETBASE_U32:
428 P.ArgType = AMDGPULibFunc::U32; break;
429
430 case E_MAKEBASE_UNS:
431 P.ArgType &= ~AMDGPULibFunc::BASE_TYPE_MASK;
432 P.ArgType |= AMDGPULibFunc::UINT;
433 break;
434
435 case E_IMAGECOORDS:
436 switch (P.ArgType) {
437 case AMDGPULibFunc::IMG1DA: P.VectorSize = 2; break;
438 case AMDGPULibFunc::IMG1DB: P.VectorSize = 1; break;
439 case AMDGPULibFunc::IMG2DA: P.VectorSize = 4; break;
440 case AMDGPULibFunc::IMG1D: P.VectorSize = 1; break;
441 case AMDGPULibFunc::IMG2D: P.VectorSize = 2; break;
442 case AMDGPULibFunc::IMG3D: P.VectorSize = 4; break;
443 }
444 P.PtrKind = AMDGPULibFunc::BYVALUE;
445 P.ArgType = AMDGPULibFunc::I32;
446 break;
447
448 case E_CONSTPTR_SWAPGL: {
449 unsigned AS = AMDGPULibFunc::getAddrSpaceFromEPtrKind(Kind: P.PtrKind);
450 switch (AS) {
451 case AMDGPUAS::GLOBAL_ADDRESS: AS = AMDGPUAS::LOCAL_ADDRESS; break;
452 case AMDGPUAS::LOCAL_ADDRESS: AS = AMDGPUAS::GLOBAL_ADDRESS; break;
453 }
454 P.PtrKind = AMDGPULibFunc::getEPtrKindFromAddrSpace(AS);
455 P.PtrKind |= AMDGPULibFunc::CONST;
456 break;
457 }
458
459 default:
460 llvm_unreachable("Unhandled param rule");
461 }
462 }
463 ++Index;
464 return P;
465}
466
467inline static void drop_front(StringRef& str, size_t n = 1) {
468 str = str.drop_front(N: n);
469}
470
471static bool eatTerm(StringRef& mangledName, const char c) {
472 if (mangledName.front() == c) {
473 drop_front(str&: mangledName);
474 return true;
475 }
476 return false;
477}
478
479template <size_t N>
480static bool eatTerm(StringRef& mangledName, const char (&str)[N]) {
481 if (mangledName.starts_with(Prefix: StringRef(str, N - 1))) {
482 drop_front(str&: mangledName, n: N-1);
483 return true;
484 }
485 return false;
486}
487
488static int eatNumber(StringRef& s) {
489 size_t const savedSize = s.size();
490 int n = 0;
491 while (!s.empty() && isDigit(C: s.front())) {
492 n = n*10 + s.front() - '0';
493 drop_front(str&: s);
494 }
495 return s.size() < savedSize ? n : -1;
496}
497
498static StringRef eatLengthPrefixedName(StringRef& mangledName) {
499 int const Len = eatNumber(s&: mangledName);
500 if (Len <= 0 || static_cast<size_t>(Len) > mangledName.size())
501 return StringRef();
502 StringRef Res = mangledName.substr(Start: 0, N: Len);
503 drop_front(str&: mangledName, n: Len);
504 return Res;
505}
506
507} // end anonymous namespace
508
509AMDGPUMangledLibFunc::AMDGPUMangledLibFunc() {
510 FuncId = EI_NONE;
511 FKind = NOPFX;
512 Leads[0].reset();
513 Leads[1].reset();
514 Name.clear();
515}
516
517AMDGPUUnmangledLibFunc::AMDGPUUnmangledLibFunc() {
518 FuncId = EI_NONE;
519 FuncTy = nullptr;
520}
521
522AMDGPUMangledLibFunc::AMDGPUMangledLibFunc(
523 EFuncId id, const AMDGPUMangledLibFunc &copyFrom) {
524 FuncId = id;
525 FKind = copyFrom.FKind;
526 Leads[0] = copyFrom.Leads[0];
527 Leads[1] = copyFrom.Leads[1];
528}
529
530AMDGPUMangledLibFunc::AMDGPUMangledLibFunc(EFuncId id, FunctionType *FT,
531 bool SignedInts) {
532 FuncId = id;
533 unsigned NumArgs = FT->getNumParams();
534 if (NumArgs >= 1)
535 Leads[0] = Param::getFromTy(Ty: FT->getParamType(i: 0), Signed: SignedInts);
536 if (NumArgs >= 2)
537 Leads[1] = Param::getFromTy(Ty: FT->getParamType(i: 1), Signed: SignedInts);
538}
539
540///////////////////////////////////////////////////////////////////////////////
541// Demangling
542
543static int parseVecSize(StringRef& mangledName) {
544 size_t const Len = eatNumber(s&: mangledName);
545 switch (Len) {
546 case 2: case 3: case 4: case 8: case 16:
547 return Len;
548 default:
549 break;
550 }
551 return 1;
552}
553
554static AMDGPULibFunc::ENamePrefix parseNamePrefix(StringRef& mangledName) {
555 std::pair<StringRef, StringRef> const P = mangledName.split(Separator: '_');
556 AMDGPULibFunc::ENamePrefix Pfx =
557 StringSwitch<AMDGPULibFunc::ENamePrefix>(P.first)
558 .Case(S: "native", Value: AMDGPULibFunc::NATIVE)
559 .Case(S: "half" , Value: AMDGPULibFunc::HALF)
560 .Default(Value: AMDGPULibFunc::NOPFX);
561
562 if (Pfx != AMDGPULibFunc::NOPFX)
563 mangledName = P.second;
564
565 return Pfx;
566}
567
568StringMap<int> ManglingRule::buildManglingRulesMap() {
569 StringMap<int> Map(std::size(manglingRules));
570 int Id = 0;
571 for (auto Rule : manglingRules)
572 Map.insert(KV: {Rule.Name, Id++});
573 return Map;
574}
575
576bool AMDGPUMangledLibFunc::parseUnmangledName(StringRef FullName) {
577 static const StringMap<int> manglingRulesMap =
578 ManglingRule::buildManglingRulesMap();
579 FuncId = static_cast<EFuncId>(manglingRulesMap.lookup(Key: FullName));
580 return FuncId != EI_NONE;
581}
582
583///////////////////////////////////////////////////////////////////////////////
584// Itanium Demangling
585
586namespace {
587struct ItaniumParamParser {
588 AMDGPULibFunc::Param Prev;
589 bool parseItaniumParam(StringRef& param, AMDGPULibFunc::Param &res);
590};
591} // namespace
592
593bool ItaniumParamParser::parseItaniumParam(StringRef& param,
594 AMDGPULibFunc::Param &res) {
595 res.reset();
596 if (param.empty()) return false;
597
598 // parse pointer prefix
599 if (eatTerm(mangledName&: param, c: 'P')) {
600 if (eatTerm(mangledName&: param, c: 'K')) res.PtrKind |= AMDGPULibFunc::CONST;
601 if (eatTerm(mangledName&: param, c: 'V')) res.PtrKind |= AMDGPULibFunc::VOLATILE;
602 unsigned AS;
603 if (!eatTerm(mangledName&: param, str: "U3AS")) {
604 AS = 0;
605 } else {
606 AS = param.front() - '0';
607 drop_front(str&: param, n: 1);
608 }
609 res.PtrKind |= AMDGPULibFuncBase::getEPtrKindFromAddrSpace(AS);
610 } else {
611 res.PtrKind = AMDGPULibFunc::BYVALUE;
612 }
613
614 // parse vector size
615 if (eatTerm(mangledName&: param,str: "Dv")) {
616 res.VectorSize = parseVecSize(mangledName&: param);
617 if (res.VectorSize==1 || !eatTerm(mangledName&: param, c: '_')) return false;
618 }
619
620 // parse type
621 char const TC = param.front();
622 if (isDigit(C: TC)) {
623 res.ArgType = StringSwitch<AMDGPULibFunc::EType>
624 (eatLengthPrefixedName(mangledName&: param))
625 .Case(S: "ocl_image1darray" , Value: AMDGPULibFunc::IMG1DA)
626 .Case(S: "ocl_image1dbuffer", Value: AMDGPULibFunc::IMG1DB)
627 .Case(S: "ocl_image2darray" , Value: AMDGPULibFunc::IMG2DA)
628 .Case(S: "ocl_image1d" , Value: AMDGPULibFunc::IMG1D)
629 .Case(S: "ocl_image2d" , Value: AMDGPULibFunc::IMG2D)
630 .Case(S: "ocl_image3d" , Value: AMDGPULibFunc::IMG3D)
631 .Case(S: "ocl_event" , Value: AMDGPULibFunc::DUMMY)
632 .Case(S: "ocl_sampler" , Value: AMDGPULibFunc::DUMMY)
633 .Default(Value: AMDGPULibFunc::DUMMY);
634 } else {
635 drop_front(str&: param);
636 switch (TC) {
637 case 'h': res.ArgType = AMDGPULibFunc::U8; break;
638 case 't': res.ArgType = AMDGPULibFunc::U16; break;
639 case 'j': res.ArgType = AMDGPULibFunc::U32; break;
640 case 'm': res.ArgType = AMDGPULibFunc::U64; break;
641 case 'c': res.ArgType = AMDGPULibFunc::I8; break;
642 case 's': res.ArgType = AMDGPULibFunc::I16; break;
643 case 'i': res.ArgType = AMDGPULibFunc::I32; break;
644 case 'l': res.ArgType = AMDGPULibFunc::I64; break;
645 case 'f': res.ArgType = AMDGPULibFunc::F32; break;
646 case 'd': res.ArgType = AMDGPULibFunc::F64; break;
647 case 'D': if (!eatTerm(mangledName&: param, c: 'h')) return false;
648 res.ArgType = AMDGPULibFunc::F16; break;
649 case 'S':
650 if (!eatTerm(mangledName&: param, c: '_')) {
651 eatNumber(s&: param);
652 if (!eatTerm(mangledName&: param, c: '_')) return false;
653 }
654 res.VectorSize = Prev.VectorSize;
655 res.ArgType = Prev.ArgType;
656 break;
657 default:;
658 }
659 }
660 if (res.ArgType == 0) return false;
661 Prev.VectorSize = res.VectorSize;
662 Prev.ArgType = res.ArgType;
663 return true;
664}
665
666bool AMDGPUMangledLibFunc::parseFuncName(StringRef &mangledName) {
667 StringRef Name = eatLengthPrefixedName(mangledName);
668 FKind = parseNamePrefix(mangledName&: Name);
669 if (!parseUnmangledName(FullName: Name))
670 return false;
671
672 const ManglingRule& Rule = manglingRules[FuncId];
673 ItaniumParamParser Parser;
674 for (int I=0; I < Rule.maxLeadIndex(); ++I) {
675 Param P;
676 if (!Parser.parseItaniumParam(param&: mangledName, res&: P))
677 return false;
678
679 if ((I + 1) == Rule.Lead[0]) Leads[0] = P;
680 if ((I + 1) == Rule.Lead[1]) Leads[1] = P;
681 }
682 return true;
683}
684
685bool AMDGPUUnmangledLibFunc::parseFuncName(StringRef &Name) {
686 if (!UnmangledFuncInfo::lookup(Name, Id&: FuncId))
687 return false;
688 setName(Name);
689 return true;
690}
691
692bool AMDGPULibFunc::parse(StringRef FuncName, AMDGPULibFunc &F) {
693 if (FuncName.empty()) {
694 F.Impl = std::unique_ptr<AMDGPULibFuncImpl>();
695 return false;
696 }
697
698 if (eatTerm(mangledName&: FuncName, str: "_Z"))
699 F.Impl = std::make_unique<AMDGPUMangledLibFunc>();
700 else
701 F.Impl = std::make_unique<AMDGPUUnmangledLibFunc>();
702 if (F.Impl->parseFuncName(mangledName&: FuncName))
703 return true;
704
705 F.Impl = std::unique_ptr<AMDGPULibFuncImpl>();
706 return false;
707}
708
709StringRef AMDGPUMangledLibFunc::getUnmangledName(StringRef mangledName) {
710 StringRef S = mangledName;
711 if (eatTerm(mangledName&: S, str: "_Z"))
712 return eatLengthPrefixedName(mangledName&: S);
713 return StringRef();
714}
715
716///////////////////////////////////////////////////////////////////////////////
717// Mangling
718
719template <typename Stream>
720void AMDGPUMangledLibFunc::writeName(Stream &OS) const {
721 const char *Pfx = "";
722 switch (FKind) {
723 case NATIVE: Pfx = "native_"; break;
724 case HALF: Pfx = "half_"; break;
725 default: break;
726 }
727 if (!Name.empty()) {
728 OS << Pfx << Name;
729 } else if (FuncId != EI_NONE) {
730 OS << Pfx;
731 const StringRef& S = manglingRules[FuncId].Name;
732 OS.write(S.data(), S.size());
733 }
734}
735
736std::string AMDGPUMangledLibFunc::mangle() const { return mangleNameItanium(); }
737
738///////////////////////////////////////////////////////////////////////////////
739// Itanium Mangling
740
741static const char *getItaniumTypeName(AMDGPULibFunc::EType T) {
742 switch (T) {
743 case AMDGPULibFunc::U8: return "h";
744 case AMDGPULibFunc::U16: return "t";
745 case AMDGPULibFunc::U32: return "j";
746 case AMDGPULibFunc::U64: return "m";
747 case AMDGPULibFunc::I8: return "c";
748 case AMDGPULibFunc::I16: return "s";
749 case AMDGPULibFunc::I32: return "i";
750 case AMDGPULibFunc::I64: return "l";
751 case AMDGPULibFunc::F16: return "Dh";
752 case AMDGPULibFunc::F32: return "f";
753 case AMDGPULibFunc::F64: return "d";
754 case AMDGPULibFunc::IMG1DA: return "16ocl_image1darray";
755 case AMDGPULibFunc::IMG1DB: return "17ocl_image1dbuffer";
756 case AMDGPULibFunc::IMG2DA: return "16ocl_image2darray";
757 case AMDGPULibFunc::IMG1D: return "11ocl_image1d";
758 case AMDGPULibFunc::IMG2D: return "11ocl_image2d";
759 case AMDGPULibFunc::IMG3D: return "11ocl_image3d";
760 case AMDGPULibFunc::SAMPLER: return "11ocl_sampler";
761 case AMDGPULibFunc::EVENT: return "9ocl_event";
762 default:
763 llvm_unreachable("Unhandled param type");
764 }
765 return nullptr;
766}
767
768namespace {
769// Itanium mangling ABI says:
770// "5.1.8. Compression
771// ... Each non-terminal in the grammar for which <substitution> appears on the
772// right-hand side is both a source of future substitutions and a candidate
773// for being substituted. There are two exceptions that appear to be
774// substitution candidates from the grammar, but are explicitly excluded:
775// 1. <builtin-type> other than vendor extended types ..."
776
777// For the purpose of functions the following productions make sense for the
778// substitution:
779// <type> ::= <builtin-type>
780// ::= <class-enum-type>
781// ::= <array-type>
782// ::=<CV-qualifiers> <type>
783// ::= P <type> # pointer-to
784// ::= <substitution>
785//
// Note that while types like images, samplers and events are encoded by the
// ABI using the <class-enum-type> production rule, they are not used for
// substitution because clang considers them builtin types.
//
// The DvNN_ type is a GCC extension for vectors and is subject to
// substitution.
792
793class ItaniumMangler {
794 SmallVector<AMDGPULibFunc::Param, 10> Str; // list of accumulated substitutions
795 bool UseAddrSpace;
796
797 int findSubst(const AMDGPULibFunc::Param& P) const {
798 for(unsigned I = 0; I < Str.size(); ++I) {
799 const AMDGPULibFunc::Param& T = Str[I];
800 if (P.PtrKind == T.PtrKind &&
801 P.VectorSize == T.VectorSize &&
802 P.ArgType == T.ArgType) {
803 return I;
804 }
805 }
806 return -1;
807 }
808
809 template <typename Stream>
810 bool trySubst(Stream& os, const AMDGPULibFunc::Param& p) {
811 int const subst = findSubst(P: p);
812 if (subst < 0) return false;
813 // Substitutions are mangled as S(XX)?_ where XX is a hexadecimal number
814 // 0 1 2
815 // S_ S0_ S1_
816 if (subst == 0) os << "S_";
817 else os << 'S' << (subst-1) << '_';
818 return true;
819 }
820
821public:
822 ItaniumMangler(bool useAddrSpace)
823 : UseAddrSpace(useAddrSpace) {}
824
825 template <typename Stream>
826 void operator()(Stream& os, AMDGPULibFunc::Param p) {
827
828 // Itanium mangling ABI 5.1.8. Compression:
829 // Logically, the substitutable components of a mangled name are considered
830 // left-to-right, components before the composite structure of which they
831 // are a part. If a component has been encountered before, it is substituted
832 // as described below. This decision is independent of whether its components
833 // have been substituted, so an implementation may optimize by considering
834 // large structures for substitution before their components. If a component
835 // has not been encountered before, its mangling is identified, and it is
836 // added to a dictionary of substitution candidates. No entity is added to
837 // the dictionary twice.
838 AMDGPULibFunc::Param Ptr;
839
840 if (p.PtrKind) {
841 if (trySubst(os, p)) return;
842 os << 'P';
843 if (p.PtrKind & AMDGPULibFunc::CONST) os << 'K';
844 if (p.PtrKind & AMDGPULibFunc::VOLATILE) os << 'V';
845 unsigned AS = UseAddrSpace
846 ? AMDGPULibFuncBase::getAddrSpaceFromEPtrKind(Kind: p.PtrKind)
847 : 0;
848 if (EnableOCLManglingMismatchWA || AS != 0)
849 os << "U3AS" << AS;
850 Ptr = p;
851 p.PtrKind = 0;
852 }
853
854 if (p.VectorSize > 1) {
855 if (trySubst(os, p)) goto exit;
856 Str.push_back(Elt: p);
857 os << "Dv" << static_cast<unsigned>(p.VectorSize) << '_';
858 }
859
860 os << getItaniumTypeName(T: (AMDGPULibFunc::EType)p.ArgType);
861
862 exit:
863 if (Ptr.ArgType) Str.push_back(Elt: Ptr);
864 }
865};
866} // namespace
867
868std::string AMDGPUMangledLibFunc::mangleNameItanium() const {
869 SmallString<128> Buf;
870 raw_svector_ostream S(Buf);
871 SmallString<128> NameBuf;
872 raw_svector_ostream Name(NameBuf);
873 writeName(OS&: Name);
874 const StringRef& NameStr = Name.str();
875 S << "_Z" << static_cast<int>(NameStr.size()) << NameStr;
876
877 ItaniumMangler Mangler(true);
878 ParamIterator I(Leads, manglingRules[FuncId]);
879 Param P;
880 while ((P = I.getNextParam()).ArgType != 0)
881 Mangler(S, P);
882 return std::string(S.str());
883}
884
885///////////////////////////////////////////////////////////////////////////////
886// Misc
887
888AMDGPULibFuncBase::Param AMDGPULibFuncBase::Param::getFromTy(Type *Ty,
889 bool Signed) {
890 Param P;
891 if (FixedVectorType *VT = dyn_cast<FixedVectorType>(Val: Ty)) {
892 P.VectorSize = VT->getNumElements();
893 Ty = VT->getElementType();
894 }
895
896 switch (Ty->getTypeID()) {
897 case Type::FloatTyID:
898 P.ArgType = AMDGPULibFunc::F32;
899 break;
900 case Type::DoubleTyID:
901 P.ArgType = AMDGPULibFunc::F64;
902 break;
903 case Type::HalfTyID:
904 P.ArgType = AMDGPULibFunc::F16;
905 break;
906 case Type::IntegerTyID:
907 switch (cast<IntegerType>(Val: Ty)->getBitWidth()) {
908 case 8:
909 P.ArgType = Signed ? AMDGPULibFunc::I8 : AMDGPULibFunc::U8;
910 break;
911 case 16:
912 P.ArgType = Signed ? AMDGPULibFunc::I16 : AMDGPULibFunc::U16;
913 break;
914 case 32:
915 P.ArgType = Signed ? AMDGPULibFunc::I32 : AMDGPULibFunc::U32;
916 break;
917 case 64:
918 P.ArgType = Signed ? AMDGPULibFunc::I64 : AMDGPULibFunc::U64;
919 break;
920 default:
921 llvm_unreachable("unhandled libcall argument type");
922 }
923
924 break;
925 default:
926 llvm_unreachable("unhandled libcall argument type");
927 }
928
929 return P;
930}
931
932static Type* getIntrinsicParamType(
933 LLVMContext& C,
934 const AMDGPULibFunc::Param& P,
935 bool useAddrSpace) {
936 Type* T = nullptr;
937 switch (P.ArgType) {
938 case AMDGPULibFunc::U8:
939 case AMDGPULibFunc::I8: T = Type::getInt8Ty(C); break;
940 case AMDGPULibFunc::U16:
941 case AMDGPULibFunc::I16: T = Type::getInt16Ty(C); break;
942 case AMDGPULibFunc::U32:
943 case AMDGPULibFunc::I32: T = Type::getInt32Ty(C); break;
944 case AMDGPULibFunc::U64:
945 case AMDGPULibFunc::I64: T = Type::getInt64Ty(C); break;
946 case AMDGPULibFunc::F16: T = Type::getHalfTy(C); break;
947 case AMDGPULibFunc::F32: T = Type::getFloatTy(C); break;
948 case AMDGPULibFunc::F64: T = Type::getDoubleTy(C); break;
949
950 case AMDGPULibFunc::IMG1DA:
951 case AMDGPULibFunc::IMG1DB:
952 case AMDGPULibFunc::IMG2DA:
953 case AMDGPULibFunc::IMG1D:
954 case AMDGPULibFunc::IMG2D:
955 case AMDGPULibFunc::IMG3D:
956 T = StructType::create(Context&: C,Name: "ocl_image")->getPointerTo(); break;
957 case AMDGPULibFunc::SAMPLER:
958 T = StructType::create(Context&: C,Name: "ocl_sampler")->getPointerTo(); break;
959 case AMDGPULibFunc::EVENT:
960 T = StructType::create(Context&: C,Name: "ocl_event")->getPointerTo(); break;
961 default:
962 llvm_unreachable("Unhandled param type");
963 return nullptr;
964 }
965 if (P.VectorSize > 1)
966 T = FixedVectorType::get(ElementType: T, NumElts: P.VectorSize);
967 if (P.PtrKind != AMDGPULibFunc::BYVALUE)
968 T = useAddrSpace ? T->getPointerTo(AddrSpace: (P.PtrKind & AMDGPULibFunc::ADDR_SPACE)
969 - 1)
970 : T->getPointerTo();
971 return T;
972}
973
974FunctionType *AMDGPUMangledLibFunc::getFunctionType(Module &M) const {
975 LLVMContext& C = M.getContext();
976 std::vector<Type*> Args;
977 ParamIterator I(Leads, manglingRules[FuncId]);
978 Param P;
979 while ((P=I.getNextParam()).ArgType != 0)
980 Args.push_back(x: getIntrinsicParamType(C, P, useAddrSpace: true));
981
982 return FunctionType::get(
983 Result: getIntrinsicParamType(C, P: getRetType(id: FuncId, Leads), useAddrSpace: true),
984 Params: Args, isVarArg: false);
985}
986
987unsigned AMDGPUMangledLibFunc::getNumArgs() const {
988 return manglingRules[FuncId].getNumArgs();
989}
990
991unsigned AMDGPUUnmangledLibFunc::getNumArgs() const {
992 return UnmangledFuncInfo::getNumArgs(Id: FuncId);
993}
994
995std::string AMDGPUMangledLibFunc::getName() const {
996 SmallString<128> Buf;
997 raw_svector_ostream OS(Buf);
998 writeName(OS);
999 return std::string(OS.str());
1000}
1001
1002bool AMDGPULibFunc::isCompatibleSignature(const FunctionType *FuncTy) const {
1003 // TODO: Validate types make sense
1004 return !FuncTy->isVarArg() && FuncTy->getNumParams() == getNumArgs();
1005}
1006
1007Function *AMDGPULibFunc::getFunction(Module *M, const AMDGPULibFunc &fInfo) {
1008 std::string FuncName = fInfo.mangle();
1009 Function *F = dyn_cast_or_null<Function>(
1010 Val: M->getValueSymbolTable().lookup(Name: FuncName));
1011 if (!F || F->isDeclaration())
1012 return nullptr;
1013
1014 if (F->hasFnAttribute(Kind: Attribute::NoBuiltin))
1015 return nullptr;
1016
1017 if (!fInfo.isCompatibleSignature(FuncTy: F->getFunctionType()))
1018 return nullptr;
1019
1020 return F;
1021}
1022
1023FunctionCallee AMDGPULibFunc::getOrInsertFunction(Module *M,
1024 const AMDGPULibFunc &fInfo) {
1025 std::string const FuncName = fInfo.mangle();
1026 Function *F = dyn_cast_or_null<Function>(
1027 Val: M->getValueSymbolTable().lookup(Name: FuncName));
1028
1029 if (F) {
1030 if (F->hasFnAttribute(Kind: Attribute::NoBuiltin))
1031 return nullptr;
1032 if (!F->isDeclaration() &&
1033 fInfo.isCompatibleSignature(FuncTy: F->getFunctionType()))
1034 return F;
1035 }
1036
1037 FunctionType *FuncTy = fInfo.getFunctionType(M&: *M);
1038
1039 bool hasPtr = false;
1040 for (FunctionType::param_iterator
1041 PI = FuncTy->param_begin(),
1042 PE = FuncTy->param_end();
1043 PI != PE; ++PI) {
1044 const Type* argTy = static_cast<const Type*>(*PI);
1045 if (argTy->isPointerTy()) {
1046 hasPtr = true;
1047 break;
1048 }
1049 }
1050
1051 FunctionCallee C;
1052 if (hasPtr) {
1053 // Do not set extra attributes for functions with pointer arguments.
1054 C = M->getOrInsertFunction(Name: FuncName, T: FuncTy);
1055 } else {
1056 AttributeList Attr;
1057 LLVMContext &Ctx = M->getContext();
1058 Attr = Attr.addFnAttribute(
1059 C&: Ctx, Attr: Attribute::getWithMemoryEffects(Context&: Ctx, ME: MemoryEffects::readOnly()));
1060 Attr = Attr.addFnAttribute(C&: Ctx, Kind: Attribute::NoUnwind);
1061 C = M->getOrInsertFunction(Name: FuncName, T: FuncTy, AttributeList: Attr);
1062 }
1063
1064 return C;
1065}
1066
1067StringMap<unsigned> UnmangledFuncInfo::buildNameMap() {
1068 StringMap<unsigned> Map;
1069 for (unsigned I = 0; I != TableSize; ++I)
1070 Map[Table[I].Name] = I;
1071 return Map;
1072}
1073
1074bool UnmangledFuncInfo::lookup(StringRef Name, ID &Id) {
1075 static const StringMap<unsigned> Map = buildNameMap();
1076 auto Loc = Map.find(Key: Name);
1077 if (Loc != Map.end()) {
1078 Id = toFuncId(Index: Loc->second);
1079 return true;
1080 }
1081 Id = AMDGPULibFunc::EI_NONE;
1082 return false;
1083}
1084
1085AMDGPULibFunc::AMDGPULibFunc(const AMDGPULibFunc &F) {
1086 if (auto *MF = dyn_cast<AMDGPUMangledLibFunc>(Val: F.Impl.get()))
1087 Impl = std::make_unique<AMDGPUMangledLibFunc>(args&: *MF);
1088 else if (auto *UMF = dyn_cast<AMDGPUUnmangledLibFunc>(Val: F.Impl.get()))
1089 Impl = std::make_unique<AMDGPUUnmangledLibFunc>(args&: *UMF);
1090 else
1091 Impl = std::unique_ptr<AMDGPULibFuncImpl>();
1092}
1093
1094AMDGPULibFunc &AMDGPULibFunc::operator=(const AMDGPULibFunc &F) {
1095 if (this == &F)
1096 return *this;
1097 new (this) AMDGPULibFunc(F);
1098 return *this;
1099}
1100
1101AMDGPULibFunc::AMDGPULibFunc(EFuncId Id, const AMDGPULibFunc &CopyFrom) {
1102 assert(AMDGPULibFuncBase::isMangled(Id) && CopyFrom.isMangled() &&
1103 "not supported");
1104 Impl = std::make_unique<AMDGPUMangledLibFunc>(
1105 args&: Id, args&: *cast<AMDGPUMangledLibFunc>(Val: CopyFrom.Impl.get()));
1106}
1107
1108AMDGPULibFunc::AMDGPULibFunc(EFuncId Id, FunctionType *FT, bool SignedInts) {
1109 Impl = std::make_unique<AMDGPUMangledLibFunc>(args&: Id, args&: FT, args&: SignedInts);
1110}
1111
1112AMDGPULibFunc::AMDGPULibFunc(StringRef Name, FunctionType *FT) {
1113 Impl = std::make_unique<AMDGPUUnmangledLibFunc>(args&: Name, args&: FT);
1114}
1115
1116void AMDGPULibFunc::initMangled() {
1117 Impl = std::make_unique<AMDGPUMangledLibFunc>();
1118}
1119
1120AMDGPULibFunc::Param *AMDGPULibFunc::getLeads() {
1121 if (!Impl)
1122 initMangled();
1123 return cast<AMDGPUMangledLibFunc>(Val: Impl.get())->Leads;
1124}
1125
1126const AMDGPULibFunc::Param *AMDGPULibFunc::getLeads() const {
1127 return cast<const AMDGPUMangledLibFunc>(Val: Impl.get())->Leads;
1128}
1129