Writer.cpp source code [llvm_projects/lld/ELF/Writer.cpp]

1	//===- Writer.cpp ---------------------------------------------------------===//
2	//
3	// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4	// See https://llvm.org/LICENSE.txt for license information.
5	// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6	//
7	//===----------------------------------------------------------------------===//
8
9	#include "Writer.h"
10	#include "AArch64ErrataFix.h"
11	#include "ARMErrataFix.h"
12	#include "BPSectionOrderer.h"
13	#include "CallGraphSort.h"
14	#include "Config.h"
15	#include "InputFiles.h"
16	#include "LinkerScript.h"
17	#include "MapFile.h"
18	#include "OutputSections.h"
19	#include "Relocations.h"
20	#include "SymbolTable.h"
21	#include "Symbols.h"
22	#include "SyntheticSections.h"
23	#include "Target.h"
24	#include "lld/Common/Arrays.h"
25	#include "lld/Common/CommonLinkerContext.h"
26	#include "lld/Common/Filesystem.h"
27	#include "lld/Common/Strings.h"
28	#include "llvm/ADT/STLExtras.h"
29	#include "llvm/ADT/StringMap.h"
30	#include "llvm/Support/BLAKE3.h"
31	#include "llvm/Support/Parallel.h"
32	#include "llvm/Support/RandomNumberGenerator.h"
33	#include "llvm/Support/TimeProfiler.h"
34	#include "llvm/Support/xxhash.h"
35	#include <climits>
36
37	#define DEBUG_TYPE "lld"
38
39	using namespace llvm;
40	using namespace llvm::ELF;
41	using namespace llvm::object;
42	using namespace llvm::support;
43	using namespace llvm::support::endian;
44	using namespace lld;
45	using namespace lld::elf;
46
47	namespace {
48	// The writer writes a SymbolTable result to a file.
49	template <class ELFT> class Writer {
50	public:
51	LLVM_ELF_IMPORT_TYPES_ELFT(ELFT)
52
53	Writer(Ctx &ctx) : ctx(ctx), buffer(ctx.e.outputBuffer), tc (ctx) {}
54
55	void run();
56
57	private:
58	void addSectionSymbols();
59	void sortSections();
60	void resolveShfLinkOrder();
61	void finalizeAddressDependentContent();
62	void optimizeBasicBlockJumps();
63	void sortInputSections();
64	void sortOrphanSections();
65	void finalizeSections();
66	void checkExecuteOnly();
67	void checkExecuteOnlyReport();
68	void setReservedSymbolSections();
69
70	SmallVector<std::unique_ptr<PhdrEntry>, `0`> createPhdrs(Partition &part);
71	void addPhdrForSection(Partition &part, unsigned shType, unsigned pType,
72	unsigned pFlags);
73	void assignFileOffsets();
74	void assignFileOffsetsBinary();
75	void setPhdrs(Partition &part);
76	void checkSections();
77	void fixSectionAlignments();
78	void openFile();
79	void writeTrapInstr();
80	void writeHeader();
81	void writeSections();
82	void writeSectionsBinary();
83	void writeBuildId();
84
85	Ctx &ctx;
86	std::unique_ptr<FileOutputBuffer> &buffer;
87	// ThunkCreator holds Thunks that are used at writeTo time.
88	ThunkCreator tc;
89
90	void addRelIpltSymbols();
91	void addStartEndSymbols();
92	void addStartStopSymbols(OutputSection &osec);
93
94	uint64_t fileSize;
95	uint64_t sectionHeaderOff;
96	};
97	} // anonymous namespace
98
99	template <class ELFT> void elf::writeResult(Ctx &ctx) {
100	Writer<ELFT>(ctx).run();
101	}
102
103	static void
104	removeEmptyPTLoad(Ctx &ctx, SmallVector<std::unique_ptr<PhdrEntry>, `0`> &phdrs) {
105	auto it = std::stable_partition(first: phdrs.begin(), last: phdrs.end(), pred: [&](auto &p) {
106	if (p->p_type != PT_LOAD)
107	return true;
108	if (!p->firstSec)
109	return false;
110	uint64_t size = p->lastSec->addr + p->lastSec->size - p->firstSec->addr;
111	return size != `0`;
112	});
113
114	// Clear OutputSection::ptLoad for sections contained in removed
115	// segments.
116	DenseSet<PhdrEntry *> removed;
117	for (auto it2 = it; it2 != phdrs.end(); ++it2)
118	removed.insert(V: it2->get());
119	for (OutputSection *sec : ctx.outputSections)
120	if (removed.contains(V: sec->ptLoad))
121	sec->ptLoad = nullptr;
122	phdrs.erase(CS: it, CE: phdrs.end());
123	}
124
125	void elf::copySectionsIntoPartitions(Ctx &ctx) {
126	SmallVector<InputSectionBase *, `0`> newSections;
127	const size_t ehSize = ctx.ehInputSections.size();
128	for (unsigned part = `2`; part != ctx.partitions.size() + `1`; ++part) {
129	for (InputSectionBase *s : ctx.inputSections) {
130	if (!(s->flags & SHF_ALLOC) \|\| !s->isLive() \|\| s->type != SHT_NOTE)
131	continue;
132	auto copy = make<InputSection>(args&: cast<InputSection>(Val&: s));
133	copy->partition = part;
134	newSections.push_back(Elt: copy);
135	}
136	for (size_t i = `0`; i != ehSize; ++i) {
137	assert(ctx.ehInputSections[i]->isLive());
138	auto copy = make<EhInputSection>(args&: ctx.ehInputSections [i]);
139	copy->partition = part;
140	ctx.ehInputSections.push_back(Elt: copy);
141	}
142	}
143
144	ctx.inputSections.insert(I: ctx.inputSections.end(), From: newSections.begin(),
145	To: newSections.end());
146	}
147
148	static Defined addOptionalRegular(Ctx &ctx, StringRef name, SectionBase sec,
149	uint64_t val, uint8_t stOther = STV_HIDDEN) {
150	Symbol *s = ctx.symtab ->find(name);
151	if (!s \|\| s->isDefined() \|\| s->isCommon())
152	return nullptr;
153
154	ctx.synthesizedSymbols.push_back(Elt: s);
155	s->resolve(ctx, other: Defined {ctx, ctx.internalFile, StringRef (), STB_GLOBAL,
156	stOther, STT_NOTYPE, val,
157	/size=/`0`, sec});
158	s->isUsedInRegularObj = true;
159	return cast<Defined>(Val: s);
160	}
161
162	// The linker is expected to define some symbols depending on
163	// the linking result. This function defines such symbols.
164	void elf::addReservedSymbols(Ctx &ctx) {
165	if (ctx.arg.emachine == EM_MIPS) {
166	auto addAbsolute = [&](StringRef name) {
167	Symbol *sym =
168	ctx.symtab ->addSymbol(newSym: Defined {ctx, ctx.internalFile, name, STB_GLOBAL,
169	STV_HIDDEN, STT_NOTYPE, `0`, `0`, nullptr});
170	sym->isUsedInRegularObj = true;
171	return cast<Defined>(Val: sym);
172	};
173	// Define _gp for MIPS. st_value of _gp symbol will be updated by Writer
174	// so that it points to an absolute address which by default is relative
175	// to GOT. Default offset is 0x7ff0.
176	// See "Global Data Symbols" in Chapter 6 in the following document:
177	// ftp://www.linux-mips.org/pub/linux/mips/doc/ABI/mipsabi.pdf
178	ctx.sym.mipsGp = addAbsolute ("_gp");
179
180	// On MIPS O32 ABI, _gp_disp is a magic symbol designates offset between
181	// start of function and 'gp' pointer into GOT.
182	if (ctx.symtab ->find(name: "_gp_disp"))
183	ctx.sym.mipsGpDisp = addAbsolute ("_gp_disp");
184
185	// The __gnu_local_gp is a magic symbol equal to the current value of 'gp'
186	// pointer. This symbol is used in the code generated by .cpload pseudo-op
187	// in case of using -mno-shared option.
188	// https://sourceware.org/ml/binutils/2004-12/msg00094.html
189	if (ctx.symtab ->find(name: "__gnu_local_gp"))
190	ctx.sym.mipsLocalGp = addAbsolute ("__gnu_local_gp");
191	} else if (ctx.arg.emachine == EM_PPC) {
192	// glibc crt1.o has a undefined reference to _SDA_BASE_. Since we don't*
193	// support Small Data Area, define it arbitrarily as 0.
194	addOptionalRegular(ctx, name: "_SDA_BASE_", sec: nullptr, val: `0`, stOther: STV_HIDDEN);
195	} else if (ctx.arg.emachine == EM_PPC64) {
196	addPPC64SaveRestore(ctx);
197	}
198
199	// The Power Architecture 64-bit v2 ABI defines a TableOfContents (TOC) which
200	// combines the typical ELF GOT with the small data sections. It commonly
201	// includes .got .toc .sdata .sbss. The .TOC. symbol replaces both
202	// _GLOBAL_OFFSET_TABLE_ and _SDA_BASE_ from the 32-bit ABI. It is used to
203	// represent the TOC base which is offset by 0x8000 bytes from the start of
204	// the .got section.
205	// We do not allow _GLOBAL_OFFSET_TABLE_ to be defined by input objects as the
206	// correctness of some relocations depends on its value.
207	StringRef gotSymName =
208	(ctx.arg.emachine == EM_PPC64) ? ".TOC." : "_GLOBAL_OFFSET_TABLE_";
209
210	if (Symbol *s = ctx.symtab ->find(name: gotSymName)) {
211	if (s->isDefined()) {
212	ErrAlways(ctx) << s->file << " cannot redefine linker defined symbol '"
213	<< gotSymName << "'";
214	return;
215	}
216
217	uint64_t gotOff = `0`;
218	if (ctx.arg.emachine == EM_PPC64)
219	gotOff = `0x8000`;
220
221	s->resolve(ctx, other: Defined {ctx, ctx.internalFile, StringRef(), STB_GLOBAL,
222	STV_HIDDEN, STT_NOTYPE, gotOff, /size=/`0`,
223	ctx.out.elfHeader.get()});
224	ctx.sym.globalOffsetTable = cast<Defined>(Val: s);
225	}
226
227	// __ehdr_start is the location of ELF file headers. Note that we define
228	// this symbol unconditionally even when using a linker script, which
229	// differs from the behavior implemented by GNU linker which only define
230	// this symbol if ELF headers are in the memory mapped segment.
231	addOptionalRegular(ctx, name: "__ehdr_start", sec: ctx.out.elfHeader.get(), val: `0`,
232	stOther: STV_HIDDEN);
233
234	// __executable_start is not documented, but the expectation of at
235	// least the Android libc is that it points to the ELF header.
236	addOptionalRegular(ctx, name: "__executable_start", sec: ctx.out.elfHeader.get(), val: `0`,
237	stOther: STV_HIDDEN);
238
239	// __dso_handle symbol is passed to cxa_finalize as a marker to identify
240	// each DSO. The address of the symbol doesn't matter as long as they are
241	// different in different DSOs, so we chose the start address of the DSO.
242	addOptionalRegular(ctx, name: "__dso_handle", sec: ctx.out.elfHeader.get(), val: `0`,
243	stOther: STV_HIDDEN);
244
245	// If linker script do layout we do not need to create any standard symbols.
246	if (ctx.script->hasSectionsCommand)
247	return;
248
249	auto add = [&](StringRef s, int64_t pos) {
250	return addOptionalRegular(ctx, name: s, sec: ctx.out.elfHeader.get(), val: pos,
251	stOther: STV_DEFAULT);
252	};
253
254	ctx.sym.bss = add ("__bss_start", `0`);
255	ctx.sym.end1 = add ("end", -`1`);
256	ctx.sym.end2 = add ("_end", -`1`);
257	ctx.sym.etext1 = add ("etext", -`1`);
258	ctx.sym.etext2 = add ("_etext", -`1`);
259	ctx.sym.edata1 = add ("edata", -`1`);
260	ctx.sym.edata2 = add ("_edata", -`1`);
261	}
262
263	static void demoteDefined(Defined &sym, DenseMap<SectionBase *, size_t> &map) {
264	if (map.empty())
265	for (auto [i, sec] : llvm::enumerate(First: sym.file->getSections()))
266	map.try_emplace(Key: sec, Args&: i);
267	// Change WEAK to GLOBAL so that if a scanned relocation references sym,
268	// maybeReportUndefined will report an error.
269	uint8_t binding = sym.isWeak() ? uint8_t(STB_GLOBAL) : sym.binding;
270	Undefined (sym.file, sym.getName(), binding, sym.stOther, sym.type,
271	/discardedSecIdx=/map.lookup(Val: sym.section))
272	.overwrite(sym);
273	// Eliminate from the symbol table, otherwise we would leave an undefined
274	// symbol if the symbol is unreferenced in the absence of GC.
275	sym.isUsedInRegularObj = false;
276	}
277
278	// If all references to a DSO happen to be weak, the DSO is not added to
279	// DT_NEEDED. If that happens, replace ShardSymbol with Undefined to avoid
280	// dangling references to an unneeded DSO. Use a weak binding to avoid
281	// --no-allow-shlib-undefined diagnostics. Similarly, demote lazy symbols.
282	//
283	// In addition, demote symbols defined in discarded sections, so that
284	// references to /DISCARD/ discarded symbols will lead to errors.
285	static void demoteSymbolsAndComputeIsPreemptible(Ctx &ctx) {
286	llvm::TimeTraceScope timeScope("Demote symbols");
287	DenseMap<InputFile , DenseMap<SectionBase , size_t>> sectionIndexMap;
288	for (Symbol *sym : ctx.symtab ->getSymbols()) {
289	if (auto *d = dyn_cast<Defined>(Val: sym)) {
290	if (d->section && !d->section->isLive())
291	demoteDefined(sym&: *d, map&: sectionIndexMap [d->file]);
292	} else {
293	auto *s = dyn_cast<SharedSymbol>(Val: sym);
294	if (sym->isLazy() \|\| (s && !cast<SharedFile>(Val: s->file)->isNeeded)) {
295	uint8_t binding = sym->isLazy() ? sym->binding : uint8_t(STB_WEAK);
296	Undefined (ctx.internalFile, sym->getName(), binding, sym->stOther,
297	sym->type)
298	.overwrite(sym&: *sym);
299	sym->versionId = VER_NDX_GLOBAL;
300	}
301	}
302
303	sym->isPreemptible = (sym->isUndefined() \|\| sym->isExported) &&
304	computeIsPreemptible(ctx, sym: *sym);
305	}
306	}
307
308	static OutputSection *findSection(Ctx &ctx, StringRef name,
309	unsigned partition = `1`) {
310	for (SectionCommand *cmd : ctx.script->sectionCommands)
311	if (auto *osd = dyn_cast<OutputDesc>(Val: cmd))
312	if (osd->osec.name == name && osd->osec.partition == partition)
313	return &osd->osec;
314	return nullptr;
315	}
316
317	// The main function of the writer.
318	template <class ELFT> void Writer<ELFT>::run() {
319	// Now that we have a complete set of output sections. This function
320	// completes section contents. For example, we need to add strings
321	// to the string table, and add entries to .got and .plt.
322	// finalizeSections does that.
323	finalizeSections();
324	checkExecuteOnly();
325	checkExecuteOnlyReport();
326
327	// If --compressed-debug-sections is specified, compress .debug_ sections.*
328	// Do it right now because it changes the size of output sections.
329	for (OutputSection *sec : ctx.outputSections)
330	sec->maybeCompress<ELFT>(ctx);
331
332	if (ctx.script->hasSectionsCommand)
333	ctx.script->allocateHeaders(phdrs&: ctx.mainPart->phdrs);
334
335	// Remove empty PT_LOAD to avoid causing the dynamic linker to try to mmap a
336	// 0 sized region. This has to be done late since only after assignAddresses
337	// we know the size of the sections.
338	for (Partition &part : ctx.partitions)
339	removeEmptyPTLoad(ctx, phdrs&: part.phdrs);
340
341	if (!ctx.arg.oFormatBinary)
342	assignFileOffsets();
343	else
344	assignFileOffsetsBinary();
345
346	for (Partition &part : ctx.partitions)
347	setPhdrs(part);
348
349	// Handle --print-map(-M)/--Map and --cref. Dump them before checkSections()
350	// because the files may be useful in case checkSections() or openFile()
351	// fails, for example, due to an erroneous file size.
352	writeMapAndCref(ctx);
353
354	// Handle --print-memory-usage option.
355	if (ctx.arg.printMemoryUsage)
356	ctx.script->printMemoryUsage(os&: ctx.e.outs());
357
358	if (ctx.arg.checkSections)
359	checkSections();
360
361	// It does not make sense try to open the file if we have error already.
362	if (errCount(ctx))
363	return;
364
365	{
366	llvm::TimeTraceScope timeScope("Write output file");
367	// Write the result down to a file.
368	openFile();
369	if (errCount(ctx))
370	return;
371
372	if (!ctx.arg.oFormatBinary) {
373	if (ctx.arg.zSeparate != SeparateSegmentKind::None)
374	writeTrapInstr();
375	writeHeader();
376	writeSections();
377	} else {
378	writeSectionsBinary();
379	}
380
381	// Backfill .note.gnu.build-id section content. This is done at last
382	// because the content is usually a hash value of the entire output file.
383	writeBuildId();
384	if (errCount(ctx))
385	return;
386
387	if (!ctx.e.disableOutput) {
388	if (auto e = buffer ->commit())
389	Err(ctx) << "failed to write output '" << buffer ->getPath()
390	<< "': " << std::move(e);
391	}
392
393	if (!ctx.arg.cmseOutputLib.empty())
394	writeARMCmseImportLib<ELFT>(ctx);
395	}
396	}
397
398	template <class ELFT, class RelTy>
399	static void markUsedLocalSymbolsImpl(ObjFile<ELFT> *file,
400	llvm::ArrayRef<RelTy> rels) {
401	for (const RelTy &rel : rels) {
402	Symbol &sym = file->getRelocTargetSym(rel);
403	if (sym.isLocal())
404	sym.used = true;
405	}
406	}
407
408	// The function ensures that the "used" field of local symbols reflects the fact
409	// that the symbol is used in a relocation from a live section.
410	template <class ELFT> static void markUsedLocalSymbols(Ctx &ctx) {
411	// With --gc-sections, the field is already filled.
412	// See MarkLive<ELFT>::resolveReloc().
413	if (ctx.arg.gcSections)
414	return;
415	for (ELFFileBase *file : ctx.objectFiles) {
416	ObjFile<ELFT> *f = cast<ObjFile<ELFT>>(file);
417	for (InputSectionBase *s : f->getSections()) {
418	InputSection *isec = dyn_cast_or_null<InputSection>(Val: s);
419	if (!isec)
420	continue;
421	if (isec->type == SHT_REL) {
422	markUsedLocalSymbolsImpl(f, isec->getDataAs<typename ELFT::Rel>());
423	} else if (isec->type == SHT_RELA) {
424	markUsedLocalSymbolsImpl(f, isec->getDataAs<typename ELFT::Rela>());
425	} else if (isec->type == SHT_CREL) {
426	// The is64=true variant also works with ELF32 since only the r_symidx
427	// member is used.
428	for (Elf_Crel_Impl<true> r : RelocsCrel<true>(isec->content_)) {
429	Symbol &sym = file->getSymbol(symbolIndex: r.r_symidx);
430	if (sym.isLocal())
431	sym.used = true;
432	}
433	}
434	}
435	}
436	}
437
438	static bool shouldKeepInSymtab(Ctx &ctx, const Defined &sym) {
439	if (sym.isSection())
440	return false;
441
442	// If --emit-reloc or -r is given, preserve symbols referenced by relocations
443	// from live sections.
444	if (sym.used && ctx.arg.copyRelocs)
445	return true;
446
447	// Exclude local symbols pointing to .ARM.exidx sections.
448	// They are probably mapping symbols "$d", which are optional for these
449	// sections. After merging the .ARM.exidx sections, some of these symbols
450	// may become dangling. The easiest way to avoid the issue is not to add
451	// them to the symbol table from the beginning.
452	if (ctx.arg.emachine == EM_ARM && sym.section &&
453	sym.section->type == SHT_ARM_EXIDX)
454	return false;
455
456	if (ctx.arg.discard == DiscardPolicy::None)
457	return true;
458	if (ctx.arg.discard == DiscardPolicy::All)
459	return false;
460
461	// In ELF assembly .L symbols are normally discarded by the assembler.
462	// If the assembler fails to do so, the linker discards them if
463	// --discard-locals is used.*
464	// The symbol is in a SHF_MERGE section, which is normally the reason for*
465	// the assembler keeping the .L symbol.
466	if (sym.getName().starts_with(Prefix: ".L") &&
467	(ctx.arg.discard == DiscardPolicy::Locals \|\|
468	(sym.section && (sym.section->flags & SHF_MERGE))))
469	return false;
470	return true;
471	}
472
473	bool elf::includeInSymtab(Ctx &ctx, const Symbol &b) {
474	if (auto *d = dyn_cast<Defined>(Val: &b)) {
475	// Always include absolute symbols.
476	SectionBase *sec = d->section;
477	if (!sec)
478	return true;
479	assert(sec->isLive());
480
481	if (auto *s = dyn_cast<MergeInputSection>(Val: sec))
482	return s->getSectionPiece(offset: d->value).live;
483	return true;
484	}
485	return b.used \|\| !ctx.arg.gcSections;
486	}
487
488	// Scan local symbols to:
489	//
490	// - demote symbols defined relative to /DISCARD/ discarded input sections so
491	// that relocations referencing them will lead to errors.
492	// - copy eligible symbols to .symTab
493	static void demoteAndCopyLocalSymbols(Ctx &ctx) {
494	llvm::TimeTraceScope timeScope("Add local symbols");
495	for (ELFFileBase *file : ctx.objectFiles) {
496	DenseMap<SectionBase *, size_t> sectionIndexMap;
497	for (Symbol *b : file->getLocalSymbols()) {
498	assert(b->isLocal() && "should have been caught in initializeSymbols()");
499	auto *dr = dyn_cast<Defined>(Val: b);
500	if (!dr)
501	continue;
502
503	if (dr->section && !dr->section->isLive())
504	demoteDefined(sym&: *dr, map&: sectionIndexMap);
505	else if (ctx.in.symTab && includeInSymtab(ctx, b: *b) &&
506	shouldKeepInSymtab(ctx, sym: *dr))
507	ctx.in.symTab ->addSymbol(sym: b);
508	}
509	}
510	}
511
512	// Create a section symbol for each output section so that we can represent
513	// relocations that point to the section. If we know that no relocation is
514	// referring to a section (that happens if the section is a synthetic one), we
515	// don't create a section symbol for that section.
516	template <class ELFT> void Writer<ELFT>::addSectionSymbols() {
517	for (SectionCommand *cmd : ctx.script->sectionCommands) {
518	auto *osd = dyn_cast<OutputDesc>(Val: cmd);
519	if (!osd)
520	continue;
521	OutputSection &osec = osd->osec;
522	InputSectionBase isec = nullptr*;
523	// Iterate over all input sections and add a STT_SECTION symbol if any input
524	// section may be a relocation target.
525	for (SectionCommand *cmd : osec.commands) {
526	auto *isd = dyn_cast<InputSectionDescription>(Val: cmd);
527	if (!isd)
528	continue;
529	for (InputSectionBase *s : isd->sections) {
530	// Relocations are not using REL[A] section symbols.
531	if (isStaticRelSecType(type: s->type))
532	continue;
533
534	// Unlike other synthetic sections, mergeable output sections contain
535	// data copied from input sections, and there may be a relocation
536	// pointing to its contents if -r or --emit-reloc is given.
537	if (isa<SyntheticSection>(Val: s) && !(s->flags & SHF_MERGE))
538	continue;
539
540	isec = s;
541	break;
542	}
543	}
544	if (!isec)
545	continue;
546
547	// Set the symbol to be relative to the output section so that its st_value
548	// equals the output section address. Note, there may be a gap between the
549	// start of the output section and isec.
550	ctx.in.symTab ->addSymbol(sym: makeDefined(args&: ctx, args&: isec->file, args: "", args: STB_LOCAL,
551	/stOther=/args: `0`, args: STT_SECTION,
552	/value=/args: `0`, /size=/args: `0`, args: &osec));
553	}
554	}
555
556	// Returns true if this is a variant of .data.rel.ro.
557	static bool isRelRoDataSection(Ctx &ctx, StringRef secName) {
558	if (!secName.consume_front(Prefix: ".data.rel.ro"))
559	return false;
560	if (secName.empty())
561	return true;
562	// If -z keep-data-section-prefix is specified, additionally allow
563	// '.data.rel.ro.hot' and '.data.rel.ro.unlikely'.
564	if (ctx.arg.zKeepDataSectionPrefix)
565	return secName == ".hot" \|\| secName == ".unlikely";
566	return false;
567	}
568
569	// Today's loaders have a feature to make segments read-only after
570	// processing dynamic relocations to enhance security. PT_GNU_RELRO
571	// is defined for that.
572	//
573	// This function returns true if a section needs to be put into a
574	// PT_GNU_RELRO segment.
575	static bool isRelroSection(Ctx &ctx, const OutputSection *sec) {
576	if (!ctx.arg.zRelro)
577	return false;
578	if (sec->relro)
579	return true;
580
581	uint64_t flags = sec->flags;
582
583	// Non-allocatable or non-writable sections don't need RELRO because
584	// they are not writable or not even mapped to memory in the first place.
585	// RELRO is for sections that are essentially read-only but need to
586	// be writable only at process startup to allow dynamic linker to
587	// apply relocations.
588	if (!(flags & SHF_ALLOC) \|\| !(flags & SHF_WRITE))
589	return false;
590
591	// Once initialized, TLS data segments are used as data templates
592	// for a thread-local storage. For each new thread, runtime
593	// allocates memory for a TLS and copy templates there. No thread
594	// are supposed to use templates directly. Thus, it can be in RELRO.
595	if (flags & SHF_TLS)
596	return true;
597
598	// .init_array, .preinit_array and .fini_array contain pointers to
599	// functions that are executed on process startup or exit. These
600	// pointers are set by the static linker, and they are not expected
601	// to change at runtime. But if you are an attacker, you could do
602	// interesting things by manipulating pointers in .fini_array, for
603	// example. So they are put into RELRO.
604	uint32_t type = sec->type;
605	if (type == SHT_INIT_ARRAY \|\| type == SHT_FINI_ARRAY \|\|
606	type == SHT_PREINIT_ARRAY)
607	return true;
608
609	// .got contains pointers to external symbols. They are resolved by
610	// the dynamic linker when a module is loaded into memory, and after
611	// that they are not expected to change. So, it can be in RELRO.
612	if (ctx.in.got && sec == ctx.in.got ->getParent())
613	return true;
614
615	// .toc is a GOT-ish section for PowerPC64. Their contents are accessed
616	// through r2 register, which is reserved for that purpose. Since r2 is used
617	// for accessing .got as well, .got and .toc need to be close enough in the
618	// virtual address space. Usually, .toc comes just after .got. Since we place
619	// .got into RELRO, .toc needs to be placed into RELRO too.
620	if (sec->name == ".toc")
621	return true;
622
623	// .got.plt contains pointers to external function symbols. They are
624	// by default resolved lazily, so we usually cannot put it into RELRO.
625	// However, if "-z now" is given, the lazy symbol resolution is
626	// disabled, which enables us to put it into RELRO.
627	if (sec == ctx.in.gotPlt ->getParent())
628	return ctx.arg.zNow;
629
630	if (ctx.in.relroPadding && sec == ctx.in.relroPadding ->getParent())
631	return true;
632
633	// .dynamic section contains data for the dynamic linker, and
634	// there's no need to write to it at runtime, so it's better to put
635	// it into RELRO.
636	if (sec->name == ".dynamic")
637	return true;
638
639	// Sections with some special names are put into RELRO. This is a
640	// bit unfortunate because section names shouldn't be significant in
641	// ELF in spirit. But in reality many linker features depend on
642	// magic section names.
643	StringRef s = sec->name;
644
645	bool abiAgnostic = isRelRoDataSection(ctx, secName: s) \|\| s == ".bss.rel.ro" \|\|
646	s == ".ctors" \|\| s == ".dtors" \|\| s == ".jcr" \|\|
647	s == ".eh_frame" \|\| s == ".fini_array" \|\|
648	s == ".init_array" \|\| s == ".preinit_array";
649
650	bool abiSpecific =
651	ctx.arg.osabi == ELFOSABI_OPENBSD && s == ".openbsd.randomdata";
652
653	return abiAgnostic \|\| abiSpecific;
654	}
655
// We compute a rank for each section. The rank indicates where the
// section should be placed in the file. Instead of using simple
// numbers (0,1,2...), we use a series of flags. One for each decision
// point when placing the section.
// Using flags has two key properties:
// * It is easy to check if a given branch was taken.
// * It is easy to see how similar two ranks are (see getRankProximity).
enum RankFlags {
  RF_NOT_ADDR_SET = 1 << 27,
  RF_NOT_ALLOC = 1 << 26,
  RF_PARTITION = 1 << 18, // Partition number (8 bits)
  RF_LARGE_EXEC_WRITE = 1 << 16,
  RF_LARGE_ALT = 1 << 15,
  RF_WRITE = 1 << 14,
  RF_EXEC_WRITE = 1 << 13,
  RF_EXEC = 1 << 12,
  RF_RODATA = 1 << 11,
  RF_LARGE_EXEC = 1 << 10,
  RF_LARGE = 1 << 9,
  RF_NOT_RELRO = 1 << 8,
  RF_NOT_TLS = 1 << 7,
  RF_BSS = 1 << 6,
};
679
680	unsigned elf::getSectionRank(Ctx &ctx, OutputSection &osec) {
681	unsigned rank = osec.partition * RF_PARTITION;
682
683	// We want to put section specified by -T option first, so we
684	// can start assigning VA starting from them later.
685	if (ctx.arg.sectionStartMap.contains(Key: osec.name))
686	return rank;
687	rank \|= RF_NOT_ADDR_SET;
688
689	// Allocatable sections go first to reduce the total PT_LOAD size and
690	// so debug info doesn't change addresses in actual code.
691	if (!(osec.flags & SHF_ALLOC))
692	return rank \| RF_NOT_ALLOC;
693
694	// Sort sections based on their access permission in the following
695	// order: R, RX, RXW, RW(RELRO), RW(non-RELRO).
696	//
697	// Read-only sections come first such that they go in the PT_LOAD covering the
698	// program headers at the start of the file.
699	//
700	// The layout for writable sections is PT_LOAD(PT_GNU_RELRO(.data.rel.ro
701	// .bss.rel.ro) \| .data .bss), where \| marks where page alignment happens.
702	// An alternative ordering is PT_LOAD(.data \| PT_GNU_RELRO( .data.rel.ro
703	// .bss.rel.ro) \| .bss), but it may waste more bytes due to 2 alignment
704	// places.
705	bool isExec = osec.flags & SHF_EXECINSTR;
706	bool isWrite = osec.flags & SHF_WRITE;
707	bool isLarge = osec.flags & SHF_X86_64_LARGE && ctx.arg.emachine == EM_X86_64;
708
709	if (!isWrite && !isExec) {
710	// Among PROGBITS sections, place .lrodata further from .text.
711	// For -z lrodata-after-bss, place .lrodata after .lbss like GNU ld. This
712	// layout has one extra PT_LOAD, but alleviates relocation overflow
713	// pressure for absolute relocations referencing small data from -fno-pic
714	// relocatable files.
715	if (isLarge)
716	rank \|= ctx.arg.zLrodataAfterBss ? RF_LARGE_ALT : `0`;
717	else
718	rank \|= ctx.arg.zLrodataAfterBss ? `0` : RF_LARGE;
719
720	if (osec.type == SHT_LLVM_PART_EHDR)
721	;
722	else if (osec.type == SHT_LLVM_PART_PHDR)
723	rank \|= `1`;
724	else if (osec.name == ".interp")
725	rank \|= `2`;
726	// Put .note sections at the beginning so that they are likely to be
727	// included in a truncate core file. In particular, .note.gnu.build-id, if
728	// available, can identify the object file.
729	else if (osec.type == SHT_NOTE)
730	rank \|= `3`;
731	// Make PROGBITS sections (e.g .rodata .eh_frame) closer to .text to
732	// alleviate relocation overflow pressure. Large special sections such as
733	// .dynstr and .dynsym can be away from .text.
734	else if (osec.type != SHT_PROGBITS)
735	rank \|= `4`;
736	else
737	rank \|= RF_RODATA;
738	} else if (isExec) {
739	// Place readonly .ltext before .lrodata and writable .ltext after .lbss to
740	// keep writable and readonly segments separate.
741	if (isLarge) {
742	rank \|= isWrite ? RF_LARGE_EXEC_WRITE : RF_LARGE_EXEC;
743	} else {
744	rank \|= isWrite ? RF_EXEC_WRITE : RF_EXEC;
745	}
746	} else {
747	rank \|= RF_WRITE;
748	// The TLS initialization block needs to be a single contiguous block. Place
749	// TLS sections directly before the other RELRO sections.
750	if (!(osec.flags & SHF_TLS))
751	rank \|= RF_NOT_TLS;
752	if (isRelroSection(ctx, sec: &osec))
753	osec.relro = true;
754	else
755	rank \|= RF_NOT_RELRO;
756	// Place .ldata and .lbss after .bss. Making .bss closer to .text
757	// alleviates relocation overflow pressure.
758	// For -z lrodata-after-bss, place .lbss/.lrodata/.ldata after .bss.
759	// .bss/.lbss being adjacent reuses the NOBITS size optimization.
760	if (isLarge) {
761	rank \|= ctx.arg.zLrodataAfterBss
762	? (osec.type == SHT_NOBITS ? `1` : RF_LARGE_ALT)
763	: RF_LARGE;
764	}
765	}
766
767	// Within TLS sections, or within other RelRo sections, or within non-RelRo
768	// sections, place non-NOBITS sections first.
769	if (osec.type == SHT_NOBITS)
770	rank \|= RF_BSS;
771
772	// Some architectures have additional ordering restrictions for sections
773	// within the same PT_LOAD.
774	if (ctx.arg.emachine == EM_PPC64) {
775	// PPC64 has a number of special SHT_PROGBITS+SHF_ALLOC+SHF_WRITE sections
776	// that we would like to make sure appear is a specific order to maximize
777	// their coverage by a single signed 16-bit offset from the TOC base
778	// pointer.
779	StringRef name = osec.name;
780	if (name == ".got")
781	rank \|= `1`;
782	else if (name == ".toc")
783	rank \|= `2`;
784	}
785
786	if (ctx.arg.emachine == EM_MIPS) {
787	if (osec.name != ".got")
788	rank \|= `1`;
789	// All sections with SHF_MIPS_GPREL flag should be grouped together
790	// because data in these sections is addressable with a gp relative address.
791	if (osec.flags & SHF_MIPS_GPREL)
792	rank \|= `2`;
793	}
794
795	if (ctx.arg.emachine == EM_RISCV) {
796	// .sdata and .sbss are placed closer to make GP relaxation more profitable
797	// and match GNU ld.
798	StringRef name = osec.name;
799	if (name == ".sdata" \|\| (osec.type == SHT_NOBITS && name != ".sbss"))
800	rank \|= `1`;
801	}
802
803	return rank;
804	}
805
806	static bool compareSections(Ctx &ctx, const SectionCommand *aCmd,
807	const SectionCommand *bCmd) {
808	const OutputSection *a = &cast<OutputDesc>(Val: aCmd)->osec;
809	const OutputSection *b = &cast<OutputDesc>(Val: bCmd)->osec;
810
811	if (a->sortRank != b->sortRank)
812	return a->sortRank < b->sortRank;
813
814	if (!(a->sortRank & RF_NOT_ADDR_SET))
815	return ctx.arg.sectionStartMap.lookup(Key: a->name) <
816	ctx.arg.sectionStartMap.lookup(Key: b->name);
817	return false;
818	}
819
820	void PhdrEntry::add(OutputSection *sec) {
821	lastSec = sec;
822	if (!firstSec)
823	firstSec = sec;
824	p_align = std::max(a: p_align, b: sec->addralign);
825	if (p_type == PT_LOAD)
826	sec->ptLoad = this;
827	}
828
829	// A statically linked position-dependent executable should only contain
830	// IRELATIVE relocations and no other dynamic relocations. Encapsulation symbols
831	// __rel[a]_iplt_{start,end} will be defined for .rel[a].dyn, to be
832	// processed by the libc runtime. Other executables or DSOs use dynamic tags
833	// instead.
834	template <class ELFT> void Writer<ELFT>::addRelIpltSymbols() {
835	if (ctx.arg.isPic)
836	return;
837
838	// __rela_iplt_{start,end} are initially defined relative to dummy section 0.
839	// We'll override ctx.out.elfHeader with relaDyn later when we are sure that
840	// .rela.dyn will be present in the output.
841	std::string name = ctx.arg.isRela ? "__rela_iplt_start" : "__rel_iplt_start";
842	ctx.sym.relaIpltStart =
843	addOptionalRegular(ctx, name, sec: ctx.out.elfHeader.get(), val: `0`, stOther: STV_HIDDEN);
844	name.replace(pos: name.size() - `5`, n1: `5`, s: "end");
845	ctx.sym.relaIpltEnd =
846	addOptionalRegular(ctx, name, sec: ctx.out.elfHeader.get(), val: `0`, stOther: STV_HIDDEN);
847	}
848
849	// This function generates assignments for predefined symbols (e.g. _end or
850	// _etext) and inserts them into the commands sequence to be processed at the
851	// appropriate time. This ensures that the value is going to be correct by the
852	// time any references to these symbols are processed and is equivalent to
853	// defining these symbols explicitly in the linker script.
854	template <class ELFT> void Writer<ELFT>::setReservedSymbolSections() {
855	if (ctx.sym.globalOffsetTable) {
856	// The _GLOBAL_OFFSET_TABLE_ symbol is defined by target convention usually
857	// to the start of the .got or .got.plt section.
858	InputSection *sec = ctx.in.gotPlt.get();
859	if (!ctx.target ->gotBaseSymInGotPlt)
860	sec = ctx.in.mipsGot ? cast<InputSection>(Val: ctx.in.mipsGot.get())
861	: cast<InputSection>(Val: ctx.in.got.get());
862	ctx.sym.globalOffsetTable->section = sec;
863	}
864
865	// .rela_iplt_{start,end} mark the start and the end of the section containing
866	// IRELATIVE relocations.
867	if (ctx.sym.relaIpltStart) {
868	auto &dyn = getIRelativeSection(ctx);
869	if (dyn.isNeeded()) {
870	ctx.sym.relaIpltStart->section = &dyn;
871	ctx.sym.relaIpltEnd->section = &dyn;
872	ctx.sym.relaIpltEnd->value = dyn.getSize();
873	}
874	}
875
876	PhdrEntry last = nullptr*;
877	OutputSection lastRO = nullptr*;
878	auto isLarge = [&ctx = ctx](OutputSection *osec) {
879	return ctx.arg.emachine == EM_X86_64 && osec->flags & SHF_X86_64_LARGE;
880	};
881	for (Partition &part : ctx.partitions) {
882	for (auto &p : part.phdrs) {
883	if (p ->p_type != PT_LOAD)
884	continue;
885	last = p.get();
886	if (!(p ->p_flags & PF_W) && p ->lastSec && !isLarge(p ->lastSec))
887	lastRO = p ->lastSec;
888	}
889	}
890
891	if (lastRO) {
892	// _etext is the first location after the last read-only loadable segment
893	// that does not contain large sections.
894	if (ctx.sym.etext1)
895	ctx.sym.etext1->section = lastRO;
896	if (ctx.sym.etext2)
897	ctx.sym.etext2->section = lastRO;
898	}
899
900	if (last) {
901	// _edata points to the end of the last non-large mapped initialized
902	// section.
903	OutputSection edata = nullptr*;
904	for (OutputSection *os : ctx.outputSections) {
905	if (os->type != SHT_NOBITS && !isLarge(os))
906	edata = os;
907	if (os == last->lastSec)
908	break;
909	}
910
911	if (ctx.sym.edata1)
912	ctx.sym.edata1->section = edata;
913	if (ctx.sym.edata2)
914	ctx.sym.edata2->section = edata;
915
916	// _end is the first location after the uninitialized data region.
917	if (ctx.sym.end1)
918	ctx.sym.end1->section = last->lastSec;
919	if (ctx.sym.end2)
920	ctx.sym.end2->section = last->lastSec;
921	}
922
923	if (ctx.sym.bss) {
924	// On RISC-V, set __bss_start to the start of .sbss if present.
925	OutputSection *sbss =
926	ctx.arg.emachine == EM_RISCV ? findSection(ctx, name: ".sbss") : nullptr;
927	ctx.sym.bss->section = sbss ? sbss : findSection(ctx, name: ".bss");
928	}
929
930	// Setup MIPS _gp_disp/__gnu_local_gp symbols which should
931	// be equal to the _gp symbol's value.
932	if (ctx.sym.mipsGp) {
933	// Find GP-relative section with the lowest address
934	// and use this address to calculate default _gp value.
935	for (OutputSection *os : ctx.outputSections) {
936	if (os->flags & SHF_MIPS_GPREL) {
937	ctx.sym.mipsGp->section = os;
938	ctx.sym.mipsGp->value = `0x7ff0`;
939	break;
940	}
941	}
942	}
943	}
944
945	// We want to find how similar two ranks are.
946	// The more branches in getSectionRank that match, the more similar they are.
947	// Since each branch corresponds to a bit flag, we can just use
948	// countLeadingZeros.
949	static int getRankProximity(OutputSection a, SectionCommand b) {
950	auto *osd = dyn_cast<OutputDesc>(Val: b);
951	return (osd && osd->osec.hasInputSections)
952	? llvm::countl_zero(Val: a->sortRank ^ osd->osec.sortRank)
953	: -`1`;
954	}
955
956	// When placing orphan sections, we want to place them after symbol assignments
957	// so that an orphan after
958	// begin_foo = .;
959	// foo : { (foo) }*
960	// end_foo = .;
961	// doesn't break the intended meaning of the begin/end symbols.
962	// We don't want to go over sections since findOrphanPos is the
963	// one in charge of deciding the order of the sections.
964	// We don't want to go over changes to '.', since doing so in
965	// rx_sec : { (rx_sec) }*
966	// . = ALIGN(0x1000);
967	// / The RW PT_LOAD starts here/
968	// rw_sec : { (rw_sec) }*
969	// would mean that the RW PT_LOAD would become unaligned.
970	static bool shouldSkip(SectionCommand *cmd) {
971	if (auto *assign = dyn_cast<SymbolAssignment>(Val: cmd))
972	return assign->name != ".";
973	return false;
974	}
975
976	// We want to place orphan sections so that they share as much
977	// characteristics with their neighbors as possible. For example, if
978	// both are rw, or both are tls.
979	static SmallVectorImpl<SectionCommand *>::iterator
980	findOrphanPos(Ctx &ctx, SmallVectorImpl<SectionCommand *>::iterator b,
981	SmallVectorImpl<SectionCommand *>::iterator e) {
982	// Place non-alloc orphan sections at the end. This matches how we assign file
983	// offsets to non-alloc sections.
984	OutputSection sec = &cast<OutputDesc>(Val: e)->osec;
985	if (!(sec->flags & SHF_ALLOC))
986	return e;
987
988	// As a special case, place .relro_padding before the SymbolAssignment using
989	// DATA_SEGMENT_RELRO_END, if present.
990	if (ctx.in.relroPadding && sec == ctx.in.relroPadding ->getParent()) {
991	auto i = std::find_if(first: b, last: e, pred: [=](SectionCommand *a) {
992	if (auto *assign = dyn_cast<SymbolAssignment>(Val: a))
993	return assign->dataSegmentRelroEnd;
994	return false;
995	});
996	if (i != e)
997	return i;
998	}
999
1000	// Find the most similar output section as the anchor. Rank Proximity is a
1001	// value in the range [-1, 32] where [0, 32] indicates potential anchors (0:
1002	// least similar; 32: identical). -1 means not an anchor.
1003	//
1004	// In the event of proximity ties, we select the first or last section
1005	// depending on whether the orphan's rank is smaller.
1006	int maxP = `0`;
1007	auto i = e;
1008	for (auto j = b; j != e; ++j) {
1009	int p = getRankProximity(a: sec, b: *j);
1010	if (p > maxP \|\|
1011	(p == maxP && cast<OutputDesc>(Val: *j)->osec.sortRank <= sec->sortRank)) {
1012	maxP = p;
1013	i = j;
1014	}
1015	}
1016	if (i == e)
1017	return e;
1018
1019	auto isOutputSecWithInputSections = [](SectionCommand *cmd) {
1020	auto *osd = dyn_cast<OutputDesc>(Val: cmd);
1021	return osd && osd->osec.hasInputSections;
1022	};
1023
1024	// Then, scan backward or forward through the script for a suitable insertion
1025	// point. If i's rank is larger, the orphan section can be placed before i.
1026	//
1027	// However, don't do this if custom program headers are defined. Otherwise,
1028	// adding the orphan to a previous segment can change its flags, for example,
1029	// making a read-only segment writable. If memory regions are defined, an
1030	// orphan section should continue the same region as the found section to
1031	// better resemble the behavior of GNU ld.
1032	bool mustAfter =
1033	ctx.script->hasPhdrsCommands() \|\| !ctx.script->memoryRegions.empty();
1034	if (cast<OutputDesc>(Val: *i)->osec.sortRank <= sec->sortRank \|\| mustAfter) {
1035	for (auto j = ++i; j != e; ++j) {
1036	if (!isOutputSecWithInputSections (*j))
1037	continue;
1038	if (getRankProximity(a: sec, b: *j) != maxP)
1039	break;
1040	i = j + `1`;
1041	}
1042	} else {
1043	for (; i != b; --i)
1044	if (isOutputSecWithInputSections (i[-`1`]))
1045	break;
1046	}
1047
1048	// As a special case, if the orphan section is the last section, put
1049	// it at the very end, past any other commands.
1050	// This matches bfd's behavior and is convenient when the linker script fully
1051	// specifies the start of the file, but doesn't care about the end (the non
1052	// alloc sections for example).
1053	if (std::none_of(first: i, last: e, pred: isOutputSecWithInputSections))
1054	return e;
1055
1056	while (i != e && shouldSkip(cmd: *i))
1057	++i;
1058	return i;
1059	}
1060
1061	// Adds random priorities to sections not already in the map.
1062	static void maybeShuffle(Ctx &ctx,
1063	DenseMap<const InputSectionBase , int*> &order) {
1064	if (ctx.arg.shuffleSections.empty())
1065	return;
1066
1067	SmallVector<InputSectionBase *, `0`> matched, sections = ctx.inputSections;
1068	matched.reserve(N: sections.size());
1069	for (const auto &patAndSeed : ctx.arg.shuffleSections) {
1070	matched.clear();
1071	for (InputSectionBase *sec : sections)
1072	if (patAndSeed.first.match(S: sec->name))
1073	matched.push_back(Elt: sec);
1074	const uint32_t seed = patAndSeed.second;
1075	if (seed == UINT32_MAX) {
1076	// If --shuffle-sections <section-glob>=-1, reverse the section order. The
1077	// section order is stable even if the number of sections changes. This is
1078	// useful to catch issues like static initialization order fiasco
1079	// reliably.
1080	std::reverse(first: matched.begin(), last: matched.end());
1081	} else {
1082	std::mt19937 g(seed ? seed : std::random_device ()());
1083	llvm::shuffle(first: matched.begin(), last: matched.end(), g);
1084	}
1085	size_t i = `0`;
1086	for (InputSectionBase *&sec : sections)
1087	if (patAndSeed.first.match(S: sec->name))
1088	sec = matched [i++];
1089	}
1090
1091	// Existing priorities are < 0, so use priorities >= 0 for the missing
1092	// sections.
1093	int prio = `0`;
1094	for (InputSectionBase *sec : sections) {
1095	if (order.try_emplace(Key: sec, Args&: prio).second)
1096	++prio;
1097	}
1098	}
1099
1100	// Return section order within an InputSectionDescription.
1101	// If both --symbol-ordering-file and call graph profile are present, the order
1102	// file takes precedence, but the call graph profile is still used for symbols
1103	// that don't appear in the order file.
1104	static DenseMap<const InputSectionBase , int*> buildSectionOrder(Ctx &ctx) {
1105	DenseMap<const InputSectionBase , int*> sectionOrder;
1106	if (ctx.arg.bpStartupFunctionSort \|\| ctx.arg.bpFunctionOrderForCompression \|\|
1107	ctx.arg.bpDataOrderForCompression) {
1108	TimeTraceScope timeScope("Balanced Partitioning Section Orderer");
1109	sectionOrder = runBalancedPartitioning(
1110	ctx, profilePath: ctx.arg.bpStartupFunctionSort ? ctx.arg.irpgoProfilePath : "",
1111	forFunctionCompression: ctx.arg.bpFunctionOrderForCompression,
1112	forDataCompression: ctx.arg.bpDataOrderForCompression,
1113	compressionSortStartupFunctions: ctx.arg.bpCompressionSortStartupFunctions,
1114	verbose: ctx.arg.bpVerboseSectionOrderer);
1115	} else if (!ctx.arg.callGraphProfile.empty()) {
1116	sectionOrder = computeCallGraphProfileOrder(ctx);
1117	}
1118
1119	if (ctx.arg.symbolOrderingFile.empty())
1120	return sectionOrder;
1121
1122	struct SymbolOrderEntry {
1123	int priority;
1124	bool present;
1125	};
1126
1127	// Build a map from symbols to their priorities. Symbols that didn't
1128	// appear in the symbol ordering file have the lowest priority 0.
1129	// All explicitly mentioned symbols have negative (higher) priorities.
1130	DenseMap<CachedHashStringRef, SymbolOrderEntry> symbolOrder;
1131	int priority = -sectionOrder.size() - ctx.arg.symbolOrderingFile.size();
1132	for (StringRef s : ctx.arg.symbolOrderingFile)
1133	symbolOrder.insert(KV: {CachedHashStringRef (s), {.priority: priority++, .present: false}});
1134
1135	// Build a map from sections to their priorities.
1136	auto addSym = [&](Symbol &sym) {
1137	auto it = symbolOrder.find(Val: CachedHashStringRef (sym.getName()));
1138	if (it == symbolOrder.end())
1139	return;
1140	SymbolOrderEntry &ent = it ->second;
1141	ent.present = true;
1142
1143	maybeWarnUnorderableSymbol(ctx, sym: &sym);
1144
1145	if (auto *d = dyn_cast<Defined>(Val: &sym)) {
1146	if (auto *sec = dyn_cast_or_null<InputSectionBase>(Val: d->section)) {
1147	int &priority = sectionOrder [cast<InputSectionBase>(Val: sec)];
1148	priority = std::min(a: priority, b: ent.priority);
1149	}
1150	}
1151	};
1152
1153	// We want both global and local symbols. We get the global ones from the
1154	// symbol table and iterate the object files for the local ones.
1155	for (Symbol *sym : ctx.symtab ->getSymbols())
1156	addSym (*sym);
1157
1158	for (ELFFileBase *file : ctx.objectFiles)
1159	for (Symbol *sym : file->getLocalSymbols())
1160	addSym (*sym);
1161
1162	if (ctx.arg.warnSymbolOrdering)
1163	for (auto orderEntry : symbolOrder)
1164	if (!orderEntry.second.present)
1165	Warn(ctx) << "symbol ordering file: no such symbol: "
1166	<< orderEntry.first.val();
1167
1168	return sectionOrder;
1169	}
1170
1171	// Sorts the sections in ISD according to the provided section order.
1172	static void
1173	sortISDBySectionOrder(Ctx &ctx, InputSectionDescription *isd,
1174	const DenseMap<const InputSectionBase , int*> &order,
1175	bool executableOutputSection) {
1176	SmallVector<InputSection *, `0`> unorderedSections;
1177	SmallVector<std::pair<InputSection , int*>, `0`> orderedSections;
1178	uint64_t unorderedSize = `0`;
1179	uint64_t totalSize = `0`;
1180
1181	for (InputSection *isec : isd->sections) {
1182	if (executableOutputSection)
1183	totalSize += isec->getSize();
1184	auto i = order.find(Val: isec);
1185	if (i == order.end()) {
1186	unorderedSections.push_back(Elt: isec);
1187	unorderedSize += isec->getSize();
1188	continue;
1189	}
1190	orderedSections.push_back(Elt: {isec, i ->second});
1191	}
1192	llvm::sort(C&: orderedSections, Comp: llvm::less_second ());
1193
1194	// Find an insertion point for the ordered section list in the unordered
1195	// section list. On targets with limited-range branches, this is the mid-point
1196	// of the unordered section list. This decreases the likelihood that a range
1197	// extension thunk will be needed to enter or exit the ordered region. If the
1198	// ordered section list is a list of hot functions, we can generally expect
1199	// the ordered functions to be called more often than the unordered functions,
1200	// making it more likely that any particular call will be within range, and
1201	// therefore reducing the number of thunks required.
1202	//
1203	// For example, imagine that you have 8MB of hot code and 32MB of cold code.
1204	// If the layout is:
1205	//
1206	// 8MB hot
1207	// 32MB cold
1208	//
1209	// only the first 8-16MB of the cold code (depending on which hot function it
1210	// is actually calling) can call the hot code without a range extension thunk.
1211	// However, if we use this layout:
1212	//
1213	// 16MB cold
1214	// 8MB hot
1215	// 16MB cold
1216	//
1217	// both the last 8-16MB of the first block of cold code and the first 8-16MB
1218	// of the second block of cold code can call the hot code without a thunk. So
1219	// we effectively double the amount of code that could potentially call into
1220	// the hot code without a thunk.
1221	//
1222	// The above is not necessary if total size of input sections in this "isd"
1223	// is small. Note that we assume all input sections are executable if the
1224	// output section is executable (which is not always true but supposed to
1225	// cover most cases).
1226	size_t insPt = `0`;
1227	if (executableOutputSection && !orderedSections.empty() &&
1228	ctx.target ->getThunkSectionSpacing() &&
1229	totalSize >= ctx.target ->getThunkSectionSpacing()) {
1230	uint64_t unorderedPos = `0`;
1231	for (; insPt != unorderedSections.size(); ++insPt) {
1232	unorderedPos += unorderedSections [insPt]->getSize();
1233	if (unorderedPos > unorderedSize / `2`)
1234	break;
1235	}
1236	}
1237
1238	isd->sections.clear();
1239	for (InputSection *isec : ArrayRef(unorderedSections).slice(N: `0`, M: insPt))
1240	isd->sections.push_back(Elt: isec);
1241	for (std::pair<InputSection , int*> p : orderedSections)
1242	isd->sections.push_back(Elt: p.first);
1243	for (InputSection *isec : ArrayRef(unorderedSections).slice(N: insPt))
1244	isd->sections.push_back(Elt: isec);
1245	}
1246
1247	static void sortSection(Ctx &ctx, OutputSection &osec,
1248	const DenseMap<const InputSectionBase , int*> &order) {
1249	StringRef name = osec.name;
1250
1251	// Never sort these.
1252	if (name == ".init" \|\| name == ".fini")
1253	return;
1254
1255	// Sort input sections by priority using the list provided by
1256	// --symbol-ordering-file or --shuffle-sections=. This is a least significant
1257	// digit radix sort. The sections may be sorted stably again by a more
1258	// significant key.
1259	if (!order.empty())
1260	for (SectionCommand *b : osec.commands)
1261	if (auto *isd = dyn_cast<InputSectionDescription>(Val: b))
1262	sortISDBySectionOrder(ctx, isd, order, executableOutputSection: osec.flags & SHF_EXECINSTR);
1263
1264	if (ctx.script->hasSectionsCommand)
1265	return;
1266
1267	if (name == ".init_array" \|\| name == ".fini_array") {
1268	osec.sortInitFini();
1269	} else if (name == ".ctors" \|\| name == ".dtors") {
1270	osec.sortCtorsDtors();
1271	} else if (ctx.arg.emachine == EM_PPC64 && name == ".toc") {
1272	// .toc is allocated just after .got and is accessed using GOT-relative
1273	// relocations. Object files compiled with small code model have an
1274	// addressable range of [.got, .got + 0xFFFC] for GOT-relative relocations.
1275	// To reduce the risk of relocation overflow, .toc contents are sorted so
1276	// that sections having smaller relocation offsets are at beginning of .toc
1277	assert(osec.commands.size() == `1`);
1278	auto *isd = cast<InputSectionDescription>(Val: osec.commands [`0`]);
1279	llvm::stable_sort(Range&: isd->sections,
1280	C: [](const InputSection a, const* InputSection b) -> bool* {
1281	return a->file->ppc64SmallCodeModelTocRelocs &&
1282	!b->file->ppc64SmallCodeModelTocRelocs;
1283	});
1284	}
1285	}
1286
1287	// Sort sections within each InputSectionDescription.
1288	template <class ELFT> void Writer<ELFT>::sortInputSections() {
1289	// Assign negative priorities.
1290	DenseMap<const InputSectionBase , int*> order = buildSectionOrder(ctx);
1291	// Assign non-negative priorities due to --shuffle-sections.
1292	maybeShuffle(ctx, order);
1293	for (SectionCommand *cmd : ctx.script->sectionCommands)
1294	if (auto *osd = dyn_cast<OutputDesc>(Val: cmd))
1295	sortSection(ctx, osec&: osd->osec, order);
1296	}
1297
1298	template <class ELFT> void Writer<ELFT>::sortSections() {
1299	llvm::TimeTraceScope timeScope("Sort sections");
1300
1301	// Don't sort if using -r. It is not necessary and we want to preserve the
1302	// relative order for SHF_LINK_ORDER sections.
1303	if (ctx.arg.relocatable) {
1304	ctx.script->adjustOutputSections();
1305	return;
1306	}
1307
1308	sortInputSections();
1309
1310	for (SectionCommand *cmd : ctx.script->sectionCommands)
1311	if (auto *osd = dyn_cast<OutputDesc>(Val: cmd))
1312	osd->osec.sortRank = getSectionRank(ctx, osec&: osd->osec);
1313	if (!ctx.script->hasSectionsCommand) {
1314	// OutputDescs are mostly contiguous, but may be interleaved with
1315	// SymbolAssignments in the presence of INSERT commands.
1316	auto mid = std::stable_partition(
1317	ctx.script->sectionCommands.begin(), ctx.script->sectionCommands.end(),
1318	[](SectionCommand cmd) { return* isa<OutputDesc>(Val: cmd); });
1319	std::stable_sort(
1320	ctx.script->sectionCommands.begin(), mid,
1321	[&ctx = ctx](auto l, auto* r) { return* compareSections(ctx, l, r); });
1322	}
1323
1324	// Process INSERT commands and update output section attributes. From this
1325	// point onwards the order of script->sectionCommands is fixed.
1326	ctx.script->processInsertCommands();
1327	ctx.script->adjustOutputSections();
1328
1329	if (ctx.script->hasSectionsCommand)
1330	sortOrphanSections();
1331
1332	ctx.script->adjustSectionsAfterSorting();
1333	}
1334
1335	template <class ELFT> void Writer<ELFT>::sortOrphanSections() {
1336	// Orphan sections are sections present in the input files which are
1337	// not explicitly placed into the output file by the linker script.
1338	//
1339	// The sections in the linker script are already in the correct
1340	// order. We have to figuere out where to insert the orphan
1341	// sections.
1342	//
1343	// The order of the sections in the script is arbitrary and may not agree with
1344	// compareSections. This means that we cannot easily define a strict weak
1345	// ordering. To see why, consider a comparison of a section in the script and
1346	// one not in the script. We have a two simple options:
1347	// Make them equivalent (a is not less than b, and b is not less than a).*
1348	// The problem is then that equivalence has to be transitive and we can
1349	// have sections a, b and c with only b in a script and a less than c
1350	// which breaks this property.
1351	// Use compareSectionsNonScript. Given that the script order doesn't have*
1352	// to match, we can end up with sections a, b, c, d where b and c are in the
1353	// script and c is compareSectionsNonScript less than b. In which case d
1354	// can be equivalent to c, a to b and d < a. As a concrete example:
1355	// .a (rx) # not in script
1356	// .b (rx) # in script
1357	// .c (ro) # in script
1358	// .d (ro) # not in script
1359	//
1360	// The way we define an order then is:
1361	// Sort only the orphan sections. They are in the end right now.*
1362	// Move each orphan section to its preferred position. We try*
1363	// to put each section in the last position where it can share
1364	// a PT_LOAD.
1365	//
1366	// There is some ambiguity as to where exactly a new entry should be
1367	// inserted, because Commands contains not only output section
1368	// commands but also other types of commands such as symbol assignment
1369	// expressions. There's no correct answer here due to the lack of the
1370	// formal specification of the linker script. We use heuristics to
1371	// determine whether a new output command should be added before or
1372	// after another commands. For the details, look at shouldSkip
1373	// function.
1374
1375	auto i = ctx.script->sectionCommands.begin();
1376	auto e = ctx.script->sectionCommands.end();
1377	auto nonScriptI = std::find_if(i, e, [](SectionCommand *cmd) {
1378	if (auto *osd = dyn_cast<OutputDesc>(Val: cmd))
1379	return osd->osec.sectionIndex == UINT32_MAX;
1380	return false;
1381	});
1382
1383	// Sort the orphan sections.
1384	std::stable_sort(nonScriptI, e, [&ctx = ctx](auto l, auto* *r) {
1385	return compareSections(ctx, l, r);
1386	});
1387
1388	// As a horrible special case, skip the first . assignment if it is before any
1389	// section. We do this because it is common to set a load address by starting
1390	// the script with ". = 0xabcd" and the expectation is that every section is
1391	// after that.
1392	auto firstSectionOrDotAssignment =
1393	std::find_if(i, e, [](SectionCommand cmd) { return* !shouldSkip(cmd); });
1394	if (firstSectionOrDotAssignment != e &&
1395	isa<SymbolAssignment>(**firstSectionOrDotAssignment))
1396	++firstSectionOrDotAssignment;
1397	i = firstSectionOrDotAssignment;
1398
1399	while (nonScriptI != e) {
1400	auto pos = findOrphanPos(ctx, i, nonScriptI);
1401	OutputSection orphan = &cast<OutputDesc>(nonScriptI)->osec;
1402
1403	// As an optimization, find all sections with the same sort rank
1404	// and insert them with one rotate.
1405	unsigned rank = orphan->sortRank;
1406	auto end = std::find_if(nonScriptI + `1`, e, [=](SectionCommand *cmd) {
1407	return cast<OutputDesc>(Val: cmd)->osec.sortRank != rank;
1408	});
1409	std::rotate(pos, nonScriptI, end);
1410	nonScriptI = end;
1411	}
1412	}
1413
1414	static bool compareByFilePosition(InputSection a, InputSection b) {
1415	InputSection la = a->flags & SHF_LINK_ORDER ? a->getLinkOrderDep() : nullptr*;
1416	InputSection lb = b->flags & SHF_LINK_ORDER ? b->getLinkOrderDep() : nullptr*;
1417	// SHF_LINK_ORDER sections with non-zero sh_link are ordered before
1418	// non-SHF_LINK_ORDER sections and SHF_LINK_ORDER sections with zero sh_link.
1419	if (!la \|\| !lb)
1420	return la && !lb;
1421	OutputSection *aOut = la->getParent();
1422	OutputSection *bOut = lb->getParent();
1423
1424	if (aOut == bOut)
1425	return la->outSecOff < lb->outSecOff;
1426	if (aOut->addr == bOut->addr)
1427	return aOut->sectionIndex < bOut->sectionIndex;
1428	return aOut->addr < bOut->addr;
1429	}
1430
1431	template <class ELFT> void Writer<ELFT>::resolveShfLinkOrder() {
1432	llvm::TimeTraceScope timeScope("Resolve SHF_LINK_ORDER");
1433	for (OutputSection *sec : ctx.outputSections) {
1434	if (!(sec->flags & SHF_LINK_ORDER))
1435	continue;
1436
1437	// The ARM.exidx section use SHF_LINK_ORDER, but we have consolidated
1438	// this processing inside the ARMExidxsyntheticsection::finalizeContents().
1439	if (!ctx.arg.relocatable && ctx.arg.emachine == EM_ARM &&
1440	sec->type == SHT_ARM_EXIDX)
1441	continue;
1442
1443	// Link order may be distributed across several InputSectionDescriptions.
1444	// Sorting is performed separately.
1445	SmallVector<InputSection **, `0`> scriptSections;
1446	SmallVector<InputSection *, `0`> sections;
1447	for (SectionCommand *cmd : sec->commands) {
1448	auto *isd = dyn_cast<InputSectionDescription>(Val: cmd);
1449	if (!isd)
1450	continue;
1451	bool hasLinkOrder = false;
1452	scriptSections.clear();
1453	sections.clear();
1454	for (InputSection *&isec : isd->sections) {
1455	if (isec->flags & SHF_LINK_ORDER) {
1456	InputSection *link = isec->getLinkOrderDep();
1457	if (link && !link->getParent())
1458	ErrAlways(ctx) << isec << ": sh_link points to discarded section "
1459	<< link;
1460	hasLinkOrder = true;
1461	}
1462	scriptSections.push_back(Elt: &isec);
1463	sections.push_back(Elt: isec);
1464	}
1465	if (hasLinkOrder && errCount(ctx) == `0`) {
1466	llvm::stable_sort(Range&: sections, C: compareByFilePosition);
1467	for (int i = `0`, n = sections.size(); i != n; ++i)
1468	*scriptSections [i] = sections [i];
1469	}
1470	}
1471	}
1472	}
1473
1474	static void finalizeSynthetic(Ctx &ctx, SyntheticSection *sec) {
1475	if (sec && sec->isNeeded() && sec->getParent()) {
1476	llvm::TimeTraceScope timeScope("Finalize synthetic sections", sec->name);
1477	sec->finalizeContents();
1478	}
1479	}
1480
1481	static bool canInsertPadding(OutputSection *sec) {
1482	StringRef s = sec->name;
1483	return s == ".bss" \|\| s == ".data" \|\| s == ".data.rel.ro" \|\| s == ".lbss" \|\|
1484	s == ".ldata" \|\| s == ".lrodata" \|\| s == ".ltext" \|\| s == ".rodata" \|\|
1485	s.starts_with(Prefix: ".text");
1486	}
1487
1488	static void randomizeSectionPadding(Ctx &ctx) {
1489	std::mt19937 g(*ctx.arg.randomizeSectionPadding);
1490	PhdrEntry curPtLoad = nullptr*;
1491	for (OutputSection *os : ctx.outputSections) {
1492	if (!canInsertPadding(sec: os))
1493	continue;
1494	for (SectionCommand *bc : os->commands) {
1495	if (auto *isd = dyn_cast<InputSectionDescription>(Val: bc)) {
1496	SmallVector<InputSection *, `0`> tmp;
1497	if (os->ptLoad != curPtLoad) {
1498	tmp.push_back(
1499	Elt: make<PaddingSection>(args&: ctx, args: g () % ctx.arg.maxPageSize, args&: os));
1500	curPtLoad = os->ptLoad;
1501	}
1502	for (InputSection *isec : isd->sections) {
1503	// Probability of inserting padding is 1 in 16.
1504	if (g () % `16` == `0`)
1505	tmp.push_back(Elt: make<PaddingSection>(args&: ctx, args&: isec->addralign, args&: os));
1506	tmp.push_back(Elt: isec);
1507	}
1508	isd->sections = std::move(tmp);
1509	}
1510	}
1511	}
1512	}
1513
1514	// We need to generate and finalize the content that depends on the address of
1515	// InputSections. As the generation of the content may also alter InputSection
1516	// addresses we must converge to a fixed point. We do that here. See the comment
1517	// in Writer<ELFT>::finalizeSections().
1518	template <class ELFT> void Writer<ELFT>::finalizeAddressDependentContent() {
1519	llvm::TimeTraceScope timeScope("Finalize address dependent content");
1520	AArch64Err843419Patcher a64p(ctx);
1521	ARMErr657417Patcher a32p(ctx);
1522	ctx.script->assignAddresses();
1523
1524	// .ARM.exidx and SHF_LINK_ORDER do not require precise addresses, but they
1525	// do require the relative addresses of OutputSections because linker scripts
1526	// can assign Virtual Addresses to OutputSections that are not monotonically
1527	// increasing. Anything here must be repeatable, since spilling may change
1528	// section order.
1529	const auto finalizeOrderDependentContent = [this] {
1530	for (Partition &part : ctx.partitions)
1531	finalizeSynthetic(ctx, sec: part.armExidx.get());
1532	resolveShfLinkOrder();
1533	};
1534	finalizeOrderDependentContent();
1535
1536	// Converts call x@GDPLT to call __tls_get_addr
1537	if (ctx.arg.emachine == EM_HEXAGON)
1538	hexagonTLSSymbolUpdate(ctx);
1539
1540	if (ctx.arg.randomizeSectionPadding)
1541	randomizeSectionPadding(ctx);
1542
1543	// Iterate until a fixed point is reached, skipping relocatable links since
1544	// the final addresses are unavailable.
1545	uint32_t pass = `0`, assignPasses = `0`;
1546	while (!ctx.arg.relocatable) {
1547	bool changed = ctx.target ->needsThunks
1548	? tc.createThunks(pass, outputSections: ctx.outputSections)
1549	: ctx.target ->relaxOnce(pass);
1550	bool spilled = ctx.script->spillSections();
1551	changed \|= spilled;
1552	++pass;
1553
1554	// With Thunk Size much smaller than branch range we expect to
1555	// converge quickly; if we get to 30 something has gone wrong.
1556	if (changed && pass >= `30`) {
1557	Err(ctx) << "address assignment did not converge";
1558	break;
1559	}
1560
1561	if (ctx.arg.fixCortexA53Errata843419) {
1562	if (changed)
1563	ctx.script->assignAddresses();
1564	changed \|= a64p.createFixes();
1565	}
1566	if (ctx.arg.fixCortexA8) {
1567	if (changed)
1568	ctx.script->assignAddresses();
1569	changed \|= a32p.createFixes();
1570	}
1571
1572	finalizeSynthetic(ctx, sec: ctx.in.got.get());
1573	if (ctx.in.mipsGot)
1574	ctx.in.mipsGot ->updateAllocSize(ctx);
1575
1576	for (Partition &part : ctx.partitions) {
1577	// The R_AARCH64_AUTH_RELATIVE has a smaller addend field as bits [63:32]
1578	// encode the signing schema. We've put relocations in .relr.auth.dyn
1579	// during RelocationScanner::processAux, but the target VA for some of
1580	// them might be wider than 32 bits. We can only know the final VA at this
1581	// point, so move relocations with large values from .relr.auth.dyn to
1582	// .rela.dyn. See also AArch64::relocate.
1583	if (part.relrAuthDyn) {
1584	auto it = llvm::remove_if(
1585	part.relrAuthDyn ->relocs, [this, &part](const RelativeReloc &elem) {
1586	Relocation &reloc = elem.inputSec->relocs()[elem.relocIdx];
1587	if (isInt<`32`>(x: reloc.sym->getVA(ctx, addend: reloc.addend)))
1588	return false;
1589	reloc.expr = R_NONE;
1590	part.relaDyn ->addReloc(reloc: {R_AARCH64_AUTH_RELATIVE, elem.inputSec,
1591	reloc.offset, false, *reloc.sym,
1592	reloc.addend, R_ABS});
1593	return true;
1594	});
1595	changed \|= (it != part.relrAuthDyn ->relocs.end());
1596	part.relrAuthDyn ->relocs.erase(it, part.relrAuthDyn ->relocs.end());
1597	}
1598	if (part.relaDyn)
1599	changed \|= part.relaDyn ->updateAllocSize(ctx);
1600	if (part.relrDyn)
1601	changed \|= part.relrDyn ->updateAllocSize(ctx);
1602	if (part.relrAuthDyn)
1603	changed \|= part.relrAuthDyn ->updateAllocSize(ctx);
1604	if (part.memtagGlobalDescriptors)
1605	changed \|= part.memtagGlobalDescriptors ->updateAllocSize(ctx);
1606	if (part.ehFrameHdr && part.ehFrameHdr ->isNeeded())
1607	changed \|= part.ehFrameHdr ->updateAllocSize(ctx);
1608	}
1609
1610	std::pair<const OutputSection , const* Defined *> changes =
1611	ctx.script->assignAddresses();
1612	if (!changed) {
1613	// Some symbols may be dependent on section addresses. When we break the
1614	// loop, the symbol values are finalized because a previous
1615	// assignAddresses() finalized section addresses.
1616	if (!changes.first && !changes.second)
1617	break;
1618	if (++assignPasses == `5`) {
1619	if (changes.first)
1620	Err(ctx) << "address (0x" << Twine::utohexstr(Val: changes.first->addr)
1621	<< ") of section '" << changes.first->name
1622	<< "' does not converge";
1623	if (changes.second)
1624	Err(ctx) << "assignment to symbol " << changes.second
1625	<< " does not converge";
1626	break;
1627	}
1628	} else if (spilled) {
1629	// Spilling can change relative section order.
1630	finalizeOrderDependentContent();
1631	}
1632	// If updateAllocSize reported errors (e.g. "unknown FDE size encoding" for
1633	// part.ehFrameHdr), break to avoid duplicate diagnostics from the loop.
1634	if (errCount(ctx))
1635	break;
1636	}
1637	if (!ctx.arg.relocatable)
1638	ctx.target ->finalizeRelax(passes: pass);
1639
1640	if (ctx.arg.relocatable)
1641	for (OutputSection *sec : ctx.outputSections)
1642	sec->addr = `0`;
1643
1644	uint64_t imageBase = ctx.script->hasSectionsCommand \|\| ctx.arg.relocatable
1645	? `0`
1646	: ctx.target ->getImageBase();
1647	for (SectionCommand *cmd : ctx.script->sectionCommands) {
1648	auto *osd = dyn_cast<OutputDesc>(Val: cmd);
1649	if (!osd)
1650	continue;
1651	OutputSection *osec = &osd->osec;
1652	// Error if the address is below the image base when SECTIONS is absent
1653	// (e.g. when -Ttext is specified and smaller than the default target image
1654	// base for no-pie).
1655	if (osec->addr < imageBase && (osec->flags & SHF_ALLOC)) {
1656	Err(ctx) << "section '" << osec->name << "' address (0x"
1657	<< Twine::utohexstr(Val: osec->addr)
1658	<< ") is smaller than image base (0x"
1659	<< Twine::utohexstr(Val: imageBase) << "); specify --image-base";
1660	}
1661
1662	// If addrExpr is set, the address may not be a multiple of the alignment.
1663	// Warn because this is error-prone.
1664	if (osec->addr % osec->addralign != `0`)
1665	Warn(ctx) << "address (0x" << Twine::utohexstr(Val: osec->addr)
1666	<< ") of section " << osec->name
1667	<< " is not a multiple of alignment (" << osec->addralign
1668	<< ")";
1669	}
1670
1671	// Sizes are no longer allowed to grow, so all allowable spills have been
1672	// taken. Remove any leftover potential spills.
1673	ctx.script->erasePotentialSpillSections();
1674	}
1675
1676	// If Input Sections have been shrunk (basic block sections) then
1677	// update symbol values and sizes associated with these sections. With basic
1678	// block sections, input sections can shrink when the jump instructions at
1679	// the end of the section are relaxed.
1680	static void fixSymbolsAfterShrinking(Ctx &ctx) {
1681	for (InputFile *File : ctx.objectFiles) {
1682	parallelForEach(R: File->getSymbols(), Fn: [&](Symbol *Sym) {
1683	auto *def = dyn_cast<Defined>(Val: Sym);
1684	if (!def)
1685	return;
1686
1687	const SectionBase *sec = def->section;
1688	if (!sec)
1689	return;
1690
1691	const InputSectionBase *inputSec = dyn_cast<InputSectionBase>(Val: sec);
1692	if (!inputSec \|\| !inputSec->bytesDropped)
1693	return;
1694
1695	const size_t OldSize = inputSec->content().size();
1696	const size_t NewSize = OldSize - inputSec->bytesDropped;
1697
1698	if (def->value > NewSize && def->value <= OldSize) {
1699	LLVM_DEBUG(llvm::dbgs()
1700	<< "Moving symbol " << Sym->getName() << " from "
1701	<< def->value << " to "
1702	<< def->value - inputSec->bytesDropped << " bytes\n");
1703	def->value -= inputSec->bytesDropped;
1704	return;
1705	}
1706
1707	if (def->value + def->size > NewSize && def->value <= OldSize &&
1708	def->value + def->size <= OldSize) {
1709	LLVM_DEBUG(llvm::dbgs()
1710	<< "Shrinking symbol " << Sym->getName() << " from "
1711	<< def->size << " to " << def->size - inputSec->bytesDropped
1712	<< " bytes\n");
1713	def->size -= inputSec->bytesDropped;
1714	}
1715	});
1716	}
1717	}
1718
1719	// If basic block sections exist, there are opportunities to delete fall thru
1720	// jumps and shrink jump instructions after basic block reordering. This
1721	// relaxation pass does that. It is only enabled when --optimize-bb-jumps
1722	// option is used.
1723	template <class ELFT> void Writer<ELFT>::optimizeBasicBlockJumps() {
1724	assert(ctx.arg.optimizeBBJumps);
1725	SmallVector<InputSection *, `0`> storage;
1726
1727	ctx.script->assignAddresses();
1728	// For every output section that has executable input sections, this
1729	// does the following:
1730	// 1. Deletes all direct jump instructions in input sections that
1731	// jump to the following section as it is not required.
1732	// 2. If there are two consecutive jump instructions, it checks
1733	// if they can be flipped and one can be deleted.
1734	for (OutputSection *osec : ctx.outputSections) {
1735	if (!(osec->flags & SHF_EXECINSTR))
1736	continue;
1737	ArrayRef<InputSection > sections = getInputSections(os: osec, storage);
1738	size_t numDeleted = `0`;
1739	// Delete all fall through jump instructions. Also, check if two
1740	// consecutive jump instructions can be flipped so that a fall
1741	// through jmp instruction can be deleted.
1742	for (size_t i = `0`, e = sections.size(); i != e; ++i) {
1743	InputSection next = i + `1` < sections.size() ? sections [i + `1`] : nullptr*;
1744	InputSection &sec = *sections [i];
1745	numDeleted += ctx.target ->deleteFallThruJmpInsn(is&: sec, nextIS: next);
1746	}
1747	if (numDeleted > `0`) {
1748	ctx.script->assignAddresses();
1749	LLVM_DEBUG(llvm::dbgs()
1750	<< "Removing " << numDeleted << " fall through jumps\n");
1751	}
1752	}
1753
1754	fixSymbolsAfterShrinking(ctx);
1755
1756	for (OutputSection *osec : ctx.outputSections)
1757	for (InputSection is : getInputSections(os: osec, storage))
1758	is->trim();
1759	}
1760
1761	// In order to allow users to manipulate linker-synthesized sections,
1762	// we had to add synthetic sections to the input section list early,
1763	// even before we make decisions whether they are needed. This allows
1764	// users to write scripts like this: ".mygot : { .got }".
1765	//
1766	// Doing it has an unintended side effects. If it turns out that we
1767	// don't need a .got (for example) at all because there's no
1768	// relocation that needs a .got, we don't want to emit .got.
1769	//
1770	// To deal with the above problem, this function is called after
1771	// scanRelocations is called to remove synthetic sections that turn
1772	// out to be empty.
1773	static void removeUnusedSyntheticSections(Ctx &ctx) {
1774	// All input synthetic sections that can be empty are placed after
1775	// all regular ones. Reverse iterate to find the first synthetic section
1776	// after a non-synthetic one which will be our starting point.
1777	auto start =
1778	llvm::find_if(Range: llvm::reverse(C&: ctx.inputSections), P: [](InputSectionBase *s) {
1779	return !isa<SyntheticSection>(Val: s);
1780	}).base();
1781
1782	// Remove unused synthetic sections from ctx.inputSections;
1783	DenseSet<InputSectionBase *> unused;
1784	auto end =
1785	std::remove_if(first: start, last: ctx.inputSections.end(), pred: [&](InputSectionBase *s) {
1786	auto *sec = cast<SyntheticSection>(Val: s);
1787	if (sec->getParent() && sec->isNeeded())
1788	return false;
1789	// .relr.auth.dyn relocations may be moved to .rela.dyn in
1790	// finalizeAddressDependentContent, making .rela.dyn no longer empty.
1791	// Conservatively keep .rela.dyn. .relr.auth.dyn can be made empty, but
1792	// we would fail to remove it here.
1793	if (ctx.arg.emachine == EM_AARCH64 && ctx.arg.relrPackDynRelocs &&
1794	sec == ctx.mainPart->relaDyn.get())
1795	return false;
1796	unused.insert(V: sec);
1797	return true;
1798	});
1799	ctx.inputSections.erase(CS: end, CE: ctx.inputSections.end());
1800
1801	// Remove unused synthetic sections from the corresponding input section
1802	// description and orphanSections.
1803	for (auto *sec : unused)
1804	if (OutputSection *osec = cast<SyntheticSection>(Val: sec)->getParent())
1805	for (SectionCommand *cmd : osec->commands)
1806	if (auto *isd = dyn_cast<InputSectionDescription>(Val: cmd))
1807	llvm::erase_if(C&: isd->sections, P: [&](InputSection *isec) {
1808	return unused.contains(V: isec);
1809	});
1810	llvm::erase_if(C&: ctx.script->orphanSections, P: [&](const InputSectionBase *sec) {
1811	return unused.contains(V: sec);
1812	});
1813	}
1814
1815	// Create output section objects and add them to OutputSections.
1816	template <class ELFT> void Writer<ELFT>::finalizeSections() {
1817	if (!ctx.arg.relocatable) {
1818	ctx.out.preinitArray = findSection(ctx, name: ".preinit_array");
1819	ctx.out.initArray = findSection(ctx, name: ".init_array");
1820	ctx.out.finiArray = findSection(ctx, name: ".fini_array");
1821
1822	// The linker needs to define SECNAME_start, SECNAME_end and SECNAME_stop
1823	// symbols for sections, so that the runtime can get the start and end
1824	// addresses of each section by section name. Add such symbols.
1825	addStartEndSymbols();
1826	for (SectionCommand *cmd : ctx.script->sectionCommands)
1827	if (auto *osd = dyn_cast<OutputDesc>(Val: cmd))
1828	addStartStopSymbols(osec&: osd->osec);
1829
1830	// Add _DYNAMIC symbol. Unlike GNU gold, our _DYNAMIC symbol has no type.
1831	// It should be okay as no one seems to care about the type.
1832	// Even the author of gold doesn't remember why gold behaves that way.
1833	// https://sourceware.org/ml/binutils/2002-03/msg00360.html
1834	if (ctx.mainPart->dynamic ->parent) {
1835	Symbol *s = ctx.symtab ->addSymbol(newSym: Defined {
1836	ctx, ctx.internalFile, "_DYNAMIC", STB_WEAK, STV_HIDDEN, STT_NOTYPE,
1837	/value=/`0`, /size=/`0`, ctx.mainPart->dynamic.get()});
1838	s->isUsedInRegularObj = true;
1839	}
1840
1841	// Define __rel[a]_iplt_{start,end} symbols if needed.
1842	addRelIpltSymbols();
1843
1844	// RISC-V's gp can address +/- 2 KiB, set it to .sdata + 0x800. This symbol
1845	// should only be defined in an executable. If .sdata does not exist, its
1846	// value/section does not matter but it has to be relative, so set its
1847	// st_shndx arbitrarily to 1 (ctx.out.elfHeader).
1848	if (ctx.arg.emachine == EM_RISCV) {
1849	if (!ctx.arg.shared) {
1850	OutputSection *sec = findSection(ctx, name: ".sdata");
1851	addOptionalRegular(ctx, name: "__global_pointer$",
1852	sec: sec ? sec : ctx.out.elfHeader.get(), val: `0x800`,
1853	stOther: STV_DEFAULT);
1854	// Set riscvGlobalPointer to be used by the optional global pointer
1855	// relaxation.
1856	if (ctx.arg.relaxGP) {
1857	Symbol *s = ctx.symtab ->find(name: "__global_pointer$");
1858	if (s && s->isDefined())
1859	ctx.sym.riscvGlobalPointer = cast<Defined>(Val: s);
1860	}
1861	}
1862	}
1863
1864	if (ctx.arg.emachine == EM_386 \|\| ctx.arg.emachine == EM_X86_64) {
1865	// On targets that support TLSDESC, _TLS_MODULE_BASE_ is defined in such a
1866	// way that:
1867	//
1868	// 1) Without relaxation: it produces a dynamic TLSDESC relocation that
1869	// computes 0.
1870	// 2) With LD->LE relaxation: _TLS_MODULE_BASE_@tpoff = 0 (lowest address
1871	// in the TLS block).
1872	//
1873	// 2) is special cased in @tpoff computation. To satisfy 1), we define it
1874	// as an absolute symbol of zero. This is different from GNU linkers which
1875	// define _TLS_MODULE_BASE_ relative to the first TLS section.
1876	Symbol *s = ctx.symtab ->find(name: "_TLS_MODULE_BASE_");
1877	if (s && s->isUndefined()) {
1878	s->resolve(ctx, other: Defined {ctx, ctx.internalFile, StringRef (), STB_GLOBAL,
1879	STV_HIDDEN, STT_TLS, /value=/`0`, `0`,
1880	/section=/nullptr});
1881	ctx.sym.tlsModuleBase = cast<Defined>(Val: s);
1882	}
1883	}
1884
1885	// This responsible for splitting up .eh_frame section into
1886	// pieces. The relocation scan uses those pieces, so this has to be
1887	// earlier.
1888	{
1889	llvm::TimeTraceScope timeScope("Finalize .eh_frame");
1890	for (Partition &part : ctx.partitions)
1891	finalizeSynthetic(ctx, sec: part.ehFrame.get());
1892	}
1893	}
1894
1895	// If the previous code block defines any non-hidden symbols (e.g.
1896	// __global_pointer$), they may be exported.
1897	if (ctx.arg.exportDynamic)
1898	for (Symbol *sym : ctx.synthesizedSymbols)
1899	if (sym->computeBinding(ctx) != STB_LOCAL)
1900	sym->isExported = true;
1901
1902	demoteSymbolsAndComputeIsPreemptible(ctx);
1903
1904	if (ctx.arg.copyRelocs && ctx.arg.discard != DiscardPolicy::None)
1905	markUsedLocalSymbols<ELFT>(ctx);
1906	demoteAndCopyLocalSymbols(ctx);
1907
1908	if (ctx.arg.copyRelocs)
1909	addSectionSymbols();
1910
1911	// Change values of linker-script-defined symbols from placeholders (assigned
1912	// by declareSymbols) to actual definitions.
1913	ctx.script->processSymbolAssignments();
1914
1915	if (!ctx.arg.relocatable) {
1916	llvm::TimeTraceScope timeScope("Scan relocations");
1917	// Scan relocations. This must be done after every symbol is declared so
1918	// that we can correctly decide if a dynamic relocation is needed. This is
1919	// called after processSymbolAssignments() because it needs to know whether
1920	// a linker-script-defined symbol is absolute.
1921	scanRelocations<ELFT>(ctx);
1922	reportUndefinedSymbols(ctx);
1923	postScanRelocations(ctx);
1924
1925	if (ctx.in.plt && ctx.in.plt ->isNeeded())
1926	ctx.in.plt ->addSymbols();
1927	if (ctx.in.iplt && ctx.in.iplt ->isNeeded())
1928	ctx.in.iplt ->addSymbols();
1929
1930	if (ctx.arg.unresolvedSymbolsInShlib != UnresolvedPolicy::Ignore) {
1931	auto diag =
1932	ctx.arg.unresolvedSymbolsInShlib == UnresolvedPolicy::ReportError &&
1933	!ctx.arg.noinhibitExec
1934	? DiagLevel::Err
1935	: DiagLevel::Warn;
1936	// Error on undefined symbols in a shared object, if all of its DT_NEEDED
1937	// entries are seen. These cases would otherwise lead to runtime errors
1938	// reported by the dynamic linker.
1939	//
1940	// ld.bfd traces all DT_NEEDED to emulate the logic of the dynamic linker
1941	// to catch more cases. That is too much for us. Our approach resembles
1942	// the one used in ld.gold, achieves a good balance to be useful but not
1943	// too smart.
1944	//
1945	// If a DSO reference is resolved by a SharedSymbol, but the SharedSymbol
1946	// is overridden by a hidden visibility Defined (which is later discarded
1947	// due to GC), don't report the diagnostic. However, this may indicate an
1948	// unintended SharedSymbol.
1949	for (SharedFile *file : ctx.sharedFiles) {
1950	bool allNeededIsKnown =
1951	llvm::all_of(file->dtNeeded, [&](StringRef needed) {
1952	return ctx.symtab ->soNames.contains(Val: CachedHashStringRef (needed));
1953	});
1954	if (!allNeededIsKnown)
1955	continue;
1956	for (Symbol *sym : file->requiredSymbols) {
1957	if (sym->dsoDefined)
1958	continue;
1959	if (sym->isUndefined() && !sym->isWeak()) {
1960	ELFSyncStream (ctx, diag)
1961	<< "undefined reference: " << sym << "\n>>> referenced by "
1962	<< file << " (disallowed by --no-allow-shlib-undefined)";
1963	} else if (sym->isDefined() &&
1964	sym->computeBinding(ctx) == STB_LOCAL) {
1965	ELFSyncStream (ctx, diag)
1966	<< "non-exported symbol '" << sym << "' in '" << sym->file
1967	<< "' is referenced by DSO '" << file << "'";
1968	}
1969	}
1970	}
1971	}
1972	}
1973
1974	{
1975	llvm::TimeTraceScope timeScope("Add symbols to symtabs");
1976	// Now that we have defined all possible global symbols including linker-
1977	// synthesized ones. Visit all symbols to give the finishing touches.
1978	for (Symbol *sym : ctx.symtab ->getSymbols()) {
1979	if (!sym->isUsedInRegularObj \|\| !includeInSymtab(ctx, b: *sym))
1980	continue;
1981	if (!ctx.arg.relocatable)
1982	sym->binding = sym->computeBinding(ctx);
1983	if (ctx.in.symTab)
1984	ctx.in.symTab ->addSymbol(sym);
1985
1986	// computeBinding might localize a symbol that was considered exported
1987	// but then synthesized as hidden (e.g. _DYNAMIC).
1988	if ((sym->isExported \|\| sym->isPreemptible) && !sym->isLocal()) {
1989	ctx.partitions [sym->partition - `1`].dynSymTab ->addSymbol(sym);
1990	if (auto *file = dyn_cast<SharedFile>(Val: sym->file))
1991	if (file->isNeeded && !sym->isUndefined())
1992	addVerneed(ctx, ss&: *sym);
1993	}
1994	}
1995
1996	// We also need to scan the dynamic relocation tables of the other
1997	// partitions and add any referenced symbols to the partition's dynsym.
1998	for (Partition &part :
1999	MutableArrayRef<Partition>(ctx.partitions).slice(N: `1`)) {
2000	DenseSet<Symbol *> syms;
2001	for (const SymbolTableEntry &e : part.dynSymTab ->getSymbols())
2002	syms.insert(V: e.sym);
2003	for (DynamicReloc &reloc : part.relaDyn ->relocs)
2004	if (reloc.sym && reloc.needsDynSymIndex() &&
2005	syms.insert(V: reloc.sym).second)
2006	part.dynSymTab ->addSymbol(sym: reloc.sym);
2007	}
2008	}
2009
2010	if (ctx.in.mipsGot)
2011	ctx.in.mipsGot ->build();
2012
2013	removeUnusedSyntheticSections(ctx);
2014	ctx.script->diagnoseOrphanHandling();
2015	ctx.script->diagnoseMissingSGSectionAddress();
2016
2017	sortSections();
2018
2019	// Create a list of OutputSections, assign sectionIndex, and populate
2020	// ctx.in.shStrTab. If -z nosectionheader is specified, drop non-ALLOC
2021	// sections.
2022	for (SectionCommand *cmd : ctx.script->sectionCommands)
2023	if (auto *osd = dyn_cast<OutputDesc>(Val: cmd)) {
2024	OutputSection *osec = &osd->osec;
2025	if (!ctx.in.shStrTab && !(osec->flags & SHF_ALLOC))
2026	continue;
2027	ctx.outputSections.push_back(Elt: osec);
2028	osec->sectionIndex = ctx.outputSections.size();
2029	if (ctx.in.shStrTab)
2030	osec->shName = ctx.in.shStrTab ->addString(s: osec->name);
2031	}
2032
2033	// Prefer command line supplied address over other constraints.
2034	for (OutputSection *sec : ctx.outputSections) {
2035	auto i = ctx.arg.sectionStartMap.find(Key: sec->name);
2036	if (i != ctx.arg.sectionStartMap.end())
2037	sec->addrExpr = [=] { return i ->second; };
2038	}
2039
2040	// With the ctx.outputSections available check for GDPLT relocations
2041	// and add __tls_get_addr symbol if needed.
2042	if (ctx.arg.emachine == EM_HEXAGON &&
2043	hexagonNeedsTLSSymbol(outputSections: ctx.outputSections)) {
2044	Symbol *sym =
2045	ctx.symtab ->addSymbol(newSym: Undefined {ctx.internalFile, "__tls_get_addr",
2046	STB_GLOBAL, STV_DEFAULT, STT_NOTYPE});
2047	sym->isPreemptible = true;
2048	ctx.partitions [`0`].dynSymTab ->addSymbol(sym);
2049	}
2050
2051	// This is a bit of a hack. A value of 0 means undef, so we set it
2052	// to 1 to make __ehdr_start defined. The section number is not
2053	// particularly relevant.
2054	ctx.out.elfHeader ->sectionIndex = `1`;
2055	ctx.out.elfHeader ->size = sizeof(typename ELFT::Ehdr);
2056
2057	// Binary and relocatable output does not have PHDRS.
2058	// The headers have to be created before finalize as that can influence the
2059	// image base and the dynamic section on mips includes the image base.
2060	if (!ctx.arg.relocatable && !ctx.arg.oFormatBinary) {
2061	for (Partition &part : ctx.partitions) {
2062	part.phdrs = ctx.script->hasPhdrsCommands() ? ctx.script->createPhdrs()
2063	: createPhdrs(part);
2064	if (ctx.arg.emachine == EM_ARM) {
2065	// PT_ARM_EXIDX is the ARM EHABI equivalent of PT_GNU_EH_FRAME
2066	addPhdrForSection(part, shType: SHT_ARM_EXIDX, pType: PT_ARM_EXIDX, pFlags: PF_R);
2067	}
2068	if (ctx.arg.emachine == EM_MIPS) {
2069	// Add separate segments for MIPS-specific sections.
2070	addPhdrForSection(part, shType: SHT_MIPS_REGINFO, pType: PT_MIPS_REGINFO, pFlags: PF_R);
2071	addPhdrForSection(part, shType: SHT_MIPS_OPTIONS, pType: PT_MIPS_OPTIONS, pFlags: PF_R);
2072	addPhdrForSection(part, shType: SHT_MIPS_ABIFLAGS, pType: PT_MIPS_ABIFLAGS, pFlags: PF_R);
2073	}
2074	if (ctx.arg.emachine == EM_RISCV)
2075	addPhdrForSection(part, shType: SHT_RISCV_ATTRIBUTES, pType: PT_RISCV_ATTRIBUTES,
2076	pFlags: PF_R);
2077	}
2078	ctx.out.programHeaders ->size =
2079	sizeof(Elf_Phdr) * ctx.mainPart->phdrs.size();
2080
2081	// Find the TLS segment. This happens before the section layout loop so that
2082	// Android relocation packing can look up TLS symbol addresses. We only need
2083	// to care about the main partition here because all TLS symbols were moved
2084	// to the main partition (see MarkLive.cpp).
2085	for (auto &p : ctx.mainPart->phdrs)
2086	if (p ->p_type == PT_TLS)
2087	ctx.tlsPhdr = p.get();
2088	}
2089
2090	// Some symbols are defined in term of program headers. Now that we
2091	// have the headers, we can find out which sections they point to.
2092	setReservedSymbolSections();
2093
2094	if (ctx.script->noCrossRefs.size()) {
2095	llvm::TimeTraceScope timeScope("Check NOCROSSREFS");
2096	checkNoCrossRefs<ELFT>(ctx);
2097	}
2098
2099	{
2100	llvm::TimeTraceScope timeScope("Finalize synthetic sections");
2101
2102	finalizeSynthetic(ctx, sec: ctx.in.bss.get());
2103	finalizeSynthetic(ctx, sec: ctx.in.bssRelRo.get());
2104	finalizeSynthetic(ctx, sec: ctx.in.symTabShndx.get());
2105	finalizeSynthetic(ctx, sec: ctx.in.shStrTab.get());
2106	finalizeSynthetic(ctx, sec: ctx.in.strTab.get());
2107	finalizeSynthetic(ctx, sec: ctx.in.got.get());
2108	finalizeSynthetic(ctx, sec: ctx.in.mipsGot.get());
2109	finalizeSynthetic(ctx, sec: ctx.in.igotPlt.get());
2110	finalizeSynthetic(ctx, sec: ctx.in.gotPlt.get());
2111	finalizeSynthetic(ctx, sec: ctx.in.relaPlt.get());
2112	finalizeSynthetic(ctx, sec: ctx.in.plt.get());
2113	finalizeSynthetic(ctx, sec: ctx.in.iplt.get());
2114	finalizeSynthetic(ctx, sec: ctx.in.ppc32Got2.get());
2115	finalizeSynthetic(ctx, sec: ctx.in.partIndex.get());
2116
2117	// Dynamic section must be the last one in this list and dynamic
2118	// symbol table section (dynSymTab) must be the first one.
2119	for (Partition &part : ctx.partitions) {
2120	finalizeSynthetic(ctx, sec: part.relaDyn.get());
2121	finalizeSynthetic(ctx, sec: part.relrDyn.get());
2122	finalizeSynthetic(ctx, sec: part.relrAuthDyn.get());
2123
2124	finalizeSynthetic(ctx, sec: part.dynSymTab.get());
2125	finalizeSynthetic(ctx, sec: part.gnuHashTab.get());
2126	finalizeSynthetic(ctx, sec: part.hashTab.get());
2127	finalizeSynthetic(ctx, sec: part.verDef.get());
2128	finalizeSynthetic(ctx, sec: part.ehFrameHdr.get());
2129	finalizeSynthetic(ctx, sec: part.verSym.get());
2130	finalizeSynthetic(ctx, sec: part.verNeed.get());
2131	finalizeSynthetic(ctx, sec: part.dynamic.get());
2132	}
2133	}
2134
2135	if (!ctx.script->hasSectionsCommand && !ctx.arg.relocatable)
2136	fixSectionAlignments();
2137
2138	// This is used to:
2139	// 1) Create "thunks":
2140	// Jump instructions in many ISAs have small displacements, and therefore
2141	// they cannot jump to arbitrary addresses in memory. For example, RISC-V
2142	// JAL instruction can target only +-1 MiB from PC. It is a linker's
2143	// responsibility to create and insert small pieces of code between
2144	// sections to extend the ranges if jump targets are out of range. Such
2145	// code pieces are called "thunks".
2146	//
2147	// We add thunks at this stage. We couldn't do this before this point
2148	// because this is the earliest point where we know sizes of sections and
2149	// their layouts (that are needed to determine if jump targets are in
2150	// range).
2151	//
2152	// 2) Update the sections. We need to generate content that depends on the
2153	// address of InputSections. For example, MIPS GOT section content or
2154	// android packed relocations sections content.
2155	//
2156	// 3) Assign the final values for the linker script symbols. Linker scripts
2157	// sometimes using forward symbol declarations. We want to set the correct
2158	// values. They also might change after adding the thunks.
2159	finalizeAddressDependentContent();
2160
2161	// All information needed for OutputSection part of Map file is available.
2162	if (errCount(ctx))
2163	return;
2164
2165	{
2166	llvm::TimeTraceScope timeScope("Finalize synthetic sections");
2167	// finalizeAddressDependentContent may have added local symbols to the
2168	// static symbol table.
2169	finalizeSynthetic(ctx, sec: ctx.in.symTab.get());
2170	finalizeSynthetic(ctx, sec: ctx.in.debugNames.get());
2171	finalizeSynthetic(ctx, sec: ctx.in.ppc64LongBranchTarget.get());
2172	finalizeSynthetic(ctx, sec: ctx.in.armCmseSGSection.get());
2173	}
2174
2175	// Relaxation to delete inter-basic block jumps created by basic block
2176	// sections. Run after ctx.in.symTab is finalized as optimizeBasicBlockJumps
2177	// can relax jump instructions based on symbol offset.
2178	if (ctx.arg.optimizeBBJumps)
2179	optimizeBasicBlockJumps();
2180
2181	// Fill other section headers. The dynamic table is finalized
2182	// at the end because some tags like RELSZ depend on result
2183	// of finalizing other sections.
2184	for (OutputSection *sec : ctx.outputSections)
2185	sec->finalize(ctx);
2186
2187	ctx.script->checkFinalScriptConditions();
2188
2189	if (ctx.arg.emachine == EM_ARM && !ctx.arg.isLE && ctx.arg.armBe8) {
2190	addArmInputSectionMappingSymbols(ctx);
2191	sortArmMappingSymbols(ctx);
2192	}
2193	}
2194
2195	// Ensure data sections are not mixed with executable sections when
2196	// --execute-only is used. --execute-only make pages executable but not
2197	// readable.
2198	template <class ELFT> void Writer<ELFT>::checkExecuteOnly() {
2199	if (!ctx.arg.executeOnly)
2200	return;
2201
2202	SmallVector<InputSection *, `0`> storage;
2203	for (OutputSection *osec : ctx.outputSections)
2204	if (osec->flags & SHF_EXECINSTR)
2205	for (InputSection isec : getInputSections(os: osec, storage))
2206	if (!(isec->flags & SHF_EXECINSTR))
2207	ErrAlways(ctx) << "cannot place " << isec << " into " << osec->name
2208	<< ": --execute-only does not support intermingling "
2209	"data and code";
2210	}
2211
2212	// Check which input sections of RX output sections don't have the
2213	// SHF_AARCH64_PURECODE or SHF_ARM_PURECODE flag set.
2214	template <class ELFT> void Writer<ELFT>::checkExecuteOnlyReport() {
2215	if (ctx.arg.zExecuteOnlyReport == ReportPolicy::None)
2216	return;
2217
2218	auto reportUnless = [&](bool cond) -> ELFSyncStream {
2219	if (cond)
2220	return {ctx, DiagLevel::None};
2221	return {ctx, toDiagLevel(policy: ctx.arg.zExecuteOnlyReport)};
2222	};
2223
2224	uint64_t purecodeFlag =
2225	ctx.arg.emachine == EM_AARCH64 ? SHF_AARCH64_PURECODE : SHF_ARM_PURECODE;
2226	StringRef purecodeFlagName = ctx.arg.emachine == EM_AARCH64
2227	? "SHF_AARCH64_PURECODE"
2228	: "SHF_ARM_PURECODE";
2229	SmallVector<InputSection *, `0`> storage;
2230	for (OutputSection *osec : ctx.outputSections) {
2231	if (osec->getPhdrFlags() != (PF_R \| PF_X))
2232	continue;
2233	for (InputSection sec : getInputSections(os: osec, storage)) {
2234	if (isa<SyntheticSection>(Val: sec))
2235	continue;
2236	reportUnless(sec->flags & purecodeFlag)
2237	<< "-z execute-only-report: " << sec << " does not have "
2238	<< purecodeFlagName << " flag set";
2239	}
2240	}
2241	}
2242
2243	// The linker is expected to define SECNAME_start and SECNAME_end
2244	// symbols for a few sections. This function defines them.
2245	template <class ELFT> void Writer<ELFT>::addStartEndSymbols() {
2246	// If the associated output section does not exist, there is ambiguity as to
2247	// how we define _start and _end symbols for an init/fini section. Users
2248	// expect no "undefined symbol" linker errors and loaders expect equal
2249	// st_value but do not particularly care whether the symbols are defined or
2250	// not. We retain the output section so that the section indexes will be
2251	// correct.
2252	auto define = [=](StringRef start, StringRef end, OutputSection *os) {
2253	if (os) {
2254	Defined *startSym = addOptionalRegular(ctx, name: start, sec: os, val: `0`);
2255	Defined *stopSym = addOptionalRegular(ctx, name: end, sec: os, val: -`1`);
2256	if (startSym \|\| stopSym)
2257	os->usedInExpression = true;
2258	} else {
2259	addOptionalRegular(ctx, name: start, sec: ctx.out.elfHeader.get(), val: `0`);
2260	addOptionalRegular(ctx, name: end, sec: ctx.out.elfHeader.get(), val: `0`);
2261	}
2262	};
2263
2264	define("__preinit_array_start", "__preinit_array_end", ctx.out.preinitArray);
2265	define("__init_array_start", "__init_array_end", ctx.out.initArray);
2266	define("__fini_array_start", "__fini_array_end", ctx.out.finiArray);
2267
2268	// As a special case, don't unnecessarily retain .ARM.exidx, which would
2269	// create an empty PT_ARM_EXIDX.
2270	if (OutputSection *sec = findSection(ctx, name: ".ARM.exidx"))
2271	define("__exidx_start", "__exidx_end", sec);
2272	}
2273
2274	// If a section name is valid as a C identifier (which is rare because of
2275	// the leading '.'), linkers are expected to define __start_<secname> and
2276	// __stop_<secname> symbols. They are at beginning and end of the section,
2277	// respectively. This is not requested by the ELF standard, but GNU ld and
2278	// gold provide the feature, and used by many programs.
2279	template <class ELFT>
2280	void Writer<ELFT>::addStartStopSymbols(OutputSection &osec) {
2281	StringRef s = osec.name;
2282	if (!isValidCIdentifier(s))
2283	return;
2284	StringSaver &ss = ctx.saver;
2285	Defined *startSym = addOptionalRegular(ctx, name: ss.save(S: "__start_" + s), sec: &osec, val: `0`,
2286	stOther: ctx.arg.zStartStopVisibility);
2287	Defined *stopSym = addOptionalRegular(ctx, name: ss.save(S: "__stop_" + s), sec: &osec, val: -`1`,
2288	stOther: ctx.arg.zStartStopVisibility);
2289	if (startSym \|\| stopSym)
2290	osec.usedInExpression = true;
2291	}
2292
2293	static bool needsPtLoad(OutputSection *sec) {
2294	if (!(sec->flags & SHF_ALLOC))
2295	return false;
2296
2297	// Don't allocate VA space for TLS NOBITS sections. The PT_TLS PHDR is
2298	// responsible for allocating space for them, not the PT_LOAD that
2299	// contains the TLS initialization image.
2300	if ((sec->flags & SHF_TLS) && sec->type == SHT_NOBITS)
2301	return false;
2302	return true;
2303	}
2304
2305	// Adjust phdr flags according to certain options.
2306	static uint64_t computeFlags(Ctx &ctx, uint64_t flags) {
2307	if (ctx.arg.omagic)
2308	return PF_R \| PF_W \| PF_X;
2309	if (ctx.arg.executeOnly && (flags & PF_X))
2310	return flags & ~PF_R;
2311	return flags;
2312	}
2313
2314	// Decide which program headers to create and which sections to include in each
2315	// one.
2316	template <class ELFT>
2317	SmallVector<std::unique_ptr<PhdrEntry>, `0`>
2318	Writer<ELFT>::createPhdrs(Partition &part) {
2319	SmallVector<std::unique_ptr<PhdrEntry>, `0`> ret;
2320	auto addHdr = [&, &ctx = ctx](unsigned type, unsigned flags) -> PhdrEntry * {
2321	ret.push_back(Elt: std::make_unique<PhdrEntry>(args&: ctx, args&: type, args&: flags));
2322	return ret.back().get();
2323	};
2324
2325	unsigned partNo = part.getNumber(ctx);
2326	bool isMain = partNo == `1`;
2327
2328	// Add the first PT_LOAD segment for regular output sections.
2329	uint64_t flags = computeFlags(ctx, flags: PF_R);
2330	PhdrEntry load = nullptr*;
2331
2332	// nmagic or omagic output does not have PT_PHDR, PT_INTERP, or the readonly
2333	// PT_LOAD.
2334	if (!ctx.arg.nmagic && !ctx.arg.omagic) {
2335	// The first phdr entry is PT_PHDR which describes the program header
2336	// itself.
2337	if (isMain)
2338	addHdr(PT_PHDR, PF_R)->add(ctx.out.programHeaders.get());
2339	else
2340	addHdr(PT_PHDR, PF_R)->add(part.programHeaders ->getParent());
2341
2342	// PT_INTERP must be the second entry if exists.
2343	if (OutputSection *cmd = findSection(ctx, name: ".interp", partition: partNo))
2344	addHdr(PT_INTERP, cmd->getPhdrFlags())->add(cmd);
2345
2346	// Add the headers. We will remove them if they don't fit.
2347	// In the other partitions the headers are ordinary sections, so they don't
2348	// need to be added here.
2349	if (isMain) {
2350	load = addHdr(PT_LOAD, flags);
2351	load->add(sec: ctx.out.elfHeader.get());
2352	load->add(sec: ctx.out.programHeaders.get());
2353	}
2354	}
2355
2356	// PT_GNU_RELRO includes all sections that should be marked as
2357	// read-only by dynamic linker after processing relocations.
2358	// Current dynamic loaders only support one PT_GNU_RELRO PHDR, give
2359	// an error message if more than one PT_GNU_RELRO PHDR is required.
2360	auto relRo = std::make_unique<PhdrEntry>(args&: ctx, args: PT_GNU_RELRO, args: PF_R);
2361	bool inRelroPhdr = false;
2362	OutputSection relroEnd = nullptr*;
2363	for (OutputSection *sec : ctx.outputSections) {
2364	if (sec->partition != partNo \|\| !needsPtLoad(sec))
2365	continue;
2366	if (isRelroSection(ctx, sec)) {
2367	inRelroPhdr = true;
2368	if (!relroEnd)
2369	relRo ->add(sec);
2370	else
2371	ErrAlways(ctx) << "section: " << sec->name
2372	<< " is not contiguous with other relro" << " sections";
2373	} else if (inRelroPhdr) {
2374	inRelroPhdr = false;
2375	relroEnd = sec;
2376	}
2377	}
2378	relRo ->p_align = `1`;
2379
2380	for (OutputSection *sec : ctx.outputSections) {
2381	if (!needsPtLoad(sec))
2382	continue;
2383
2384	// Normally, sections in partitions other than the current partition are
2385	// ignored. But partition number 255 is a special case: it contains the
2386	// partition end marker (.part.end). It needs to be added to the main
2387	// partition so that a segment is created for it in the main partition,
2388	// which will cause the dynamic loader to reserve space for the other
2389	// partitions.
2390	if (sec->partition != partNo) {
2391	if (isMain && sec->partition == `255`)
2392	addHdr(PT_LOAD, computeFlags(ctx, flags: sec->getPhdrFlags()))->add(sec);
2393	continue;
2394	}
2395
2396	// Segments are contiguous memory regions that has the same attributes
2397	// (e.g. executable or writable). There is one phdr for each segment.
2398	// Therefore, we need to create a new phdr when the next section has
2399	// incompatible flags or is loaded at a discontiguous address or memory
2400	// region using AT or AT> linker script command, respectively.
2401	//
2402	// As an exception, we don't create a separate load segment for the ELF
2403	// headers, even if the first "real" output has an AT or AT> attribute.
2404	//
2405	// In addition, NOBITS sections should only be placed at the end of a LOAD
2406	// segment (since it's represented as p_filesz < p_memsz). If we have a
2407	// not-NOBITS section after a NOBITS, we create a new LOAD for the latter
2408	// even if flags match, so as not to require actually writing the
2409	// supposed-to-be-NOBITS section to the output file. (However, we cannot do
2410	// so when hasSectionsCommand, since we cannot introduce the extra alignment
2411	// needed to create a new LOAD)
2412	uint64_t newFlags = computeFlags(ctx, flags: sec->getPhdrFlags());
2413	uint64_t incompatible = flags ^ newFlags;
2414	if (!(newFlags & PF_W)) {
2415	// When --no-rosegment is specified, RO and RX sections are compatible.
2416	if (ctx.arg.singleRoRx)
2417	incompatible &= ~PF_X;
2418	// When --no-xosegment is specified (the default), XO and RX sections are
2419	// compatible.
2420	if (ctx.arg.singleXoRx)
2421	incompatible &= ~PF_R;
2422	}
2423	if (incompatible)
2424	load = nullptr;
2425
2426	bool sameLMARegion =
2427	load && !sec->lmaExpr && sec->lmaRegion == load->firstSec->lmaRegion;
2428	if (load && sec != relroEnd &&
2429	sec->memRegion == load->firstSec->memRegion &&
2430	(sameLMARegion \|\| load->lastSec == ctx.out.programHeaders.get()) &&
2431	(ctx.script->hasSectionsCommand \|\| sec->type == SHT_NOBITS \|\|
2432	load->lastSec->type != SHT_NOBITS)) {
2433	load->p_flags \|= newFlags;
2434	} else {
2435	load = addHdr(PT_LOAD, newFlags);
2436	flags = newFlags;
2437	}
2438
2439	load->add(sec);
2440	}
2441
2442	// Add a TLS segment if any.
2443	auto tlsHdr = std::make_unique<PhdrEntry>(args&: ctx, args: PT_TLS, args: PF_R);
2444	for (OutputSection *sec : ctx.outputSections)
2445	if (sec->partition == partNo && sec->flags & SHF_TLS)
2446	tlsHdr ->add(sec);
2447	if (tlsHdr ->firstSec)
2448	ret.push_back(Elt: std::move(tlsHdr));
2449
2450	// Add an entry for .dynamic.
2451	if (OutputSection *sec = part.dynamic ->getParent())
2452	addHdr(PT_DYNAMIC, sec->getPhdrFlags())->add(sec);
2453
2454	if (relRo ->firstSec)
2455	ret.push_back(Elt: std::move(relRo));
2456
2457	// PT_GNU_EH_FRAME is a special section pointing on .eh_frame_hdr.
2458	if (part.ehFrameHdr && part.ehFrameHdr ->isNeeded())
2459	addHdr(PT_GNU_EH_FRAME, part.ehFrameHdr ->getParent()->getPhdrFlags())
2460	->add(part.ehFrameHdr ->getParent());
2461
2462	if (ctx.arg.osabi == ELFOSABI_OPENBSD) {
2463	// PT_OPENBSD_MUTABLE makes the dynamic linker fill the segment with
2464	// zero data, like bss, but it can be treated differently.
2465	if (OutputSection *cmd = findSection(ctx, name: ".openbsd.mutable", partition: partNo))
2466	addHdr(PT_OPENBSD_MUTABLE, cmd->getPhdrFlags())->add(cmd);
2467
2468	// PT_OPENBSD_RANDOMIZE makes the dynamic linker fill the segment
2469	// with random data.
2470	if (OutputSection *cmd = findSection(ctx, name: ".openbsd.randomdata", partition: partNo))
2471	addHdr(PT_OPENBSD_RANDOMIZE, cmd->getPhdrFlags())->add(cmd);
2472
2473	// PT_OPENBSD_SYSCALLS makes the kernel and dynamic linker register
2474	// system call sites.
2475	if (OutputSection *cmd = findSection(ctx, name: ".openbsd.syscalls", partition: partNo))
2476	addHdr(PT_OPENBSD_SYSCALLS, cmd->getPhdrFlags())->add(cmd);
2477	}
2478
2479	if (ctx.arg.zGnustack != GnuStackKind::None) {
2480	// PT_GNU_STACK is a special section to tell the loader to make the
2481	// pages for the stack non-executable. If you really want an executable
2482	// stack, you can pass -z execstack, but that's not recommended for
2483	// security reasons.
2484	unsigned perm = PF_R \| PF_W;
2485	if (ctx.arg.zGnustack == GnuStackKind::Exec)
2486	perm \|= PF_X;
2487	addHdr(PT_GNU_STACK, perm)->p_memsz = ctx.arg.zStackSize;
2488	}
2489
2490	// PT_OPENBSD_NOBTCFI is an OpenBSD-specific header to mark that the
2491	// executable is expected to violate branch-target CFI checks.
2492	if (ctx.arg.zNoBtCfi)
2493	addHdr(PT_OPENBSD_NOBTCFI, PF_X);
2494
2495	// PT_OPENBSD_WXNEEDED is a OpenBSD-specific header to mark the executable
2496	// is expected to perform W^X violations, such as calling mprotect(2) or
2497	// mmap(2) with PROT_WRITE \| PROT_EXEC, which is prohibited by default on
2498	// OpenBSD.
2499	if (ctx.arg.zWxneeded)
2500	addHdr(PT_OPENBSD_WXNEEDED, PF_X);
2501
2502	if (OutputSection *cmd = findSection(ctx, name: ".note.gnu.property", partition: partNo))
2503	addHdr(PT_GNU_PROPERTY, PF_R)->add(cmd);
2504
2505	// Create one PT_NOTE per a group of contiguous SHT_NOTE sections with the
2506	// same alignment.
2507	PhdrEntry note = nullptr*;
2508	for (OutputSection *sec : ctx.outputSections) {
2509	if (sec->partition != partNo)
2510	continue;
2511	if (sec->type == SHT_NOTE && (sec->flags & SHF_ALLOC)) {
2512	if (!note \|\| sec->lmaExpr \|\| note->lastSec->addralign != sec->addralign)
2513	note = addHdr(PT_NOTE, PF_R);
2514	note->add(sec);
2515	} else {
2516	note = nullptr;
2517	}
2518	}
2519	return ret;
2520	}
2521
2522	template <class ELFT>
2523	void Writer<ELFT>::addPhdrForSection(Partition &part, unsigned shType,
2524	unsigned pType, unsigned pFlags) {
2525	unsigned partNo = part.getNumber(ctx);
2526	auto i = llvm::find_if(ctx.outputSections, [=](OutputSection *cmd) {
2527	return cmd->partition == partNo && cmd->type == shType;
2528	});
2529	if (i == ctx.outputSections.end())
2530	return;
2531
2532	auto entry = std::make_unique<PhdrEntry>(args&: ctx, args&: pType, args&: pFlags);
2533	entry ->add(sec: *i);
2534	part.phdrs.push_back(Elt: std::move(entry));
2535	}
2536
2537	// Place the first section of each PT_LOAD to a different page (of maxPageSize).
2538	// This is achieved by assigning an alignment expression to addrExpr of each
2539	// such section.
2540	template <class ELFT> void Writer<ELFT>::fixSectionAlignments() {
2541	const PhdrEntry *prev;
2542	auto pageAlign = [&, &ctx = this->ctx](const PhdrEntry *p) {
2543	OutputSection *cmd = p->firstSec;
2544	if (!cmd)
2545	return;
2546	cmd->alignExpr = [align = cmd->addralign]() { return align; };
2547	if (!cmd->addrExpr) {
2548	// Prefer advancing to align(dot, maxPageSize) + dot%maxPageSize to avoid
2549	// padding in the file contents.
2550	//
2551	// When -z separate-code is used we must not have any overlap in pages
2552	// between an executable segment and a non-executable segment. We align to
2553	// the next maximum page size boundary on transitions between executable
2554	// and non-executable segments.
2555	//
2556	// SHT_LLVM_PART_EHDR marks the start of a partition. The partition
2557	// sections will be extracted to a separate file. Align to the next
2558	// maximum page size boundary so that we can find the ELF header at the
2559	// start. We cannot benefit from overlapping p_offset ranges with the
2560	// previous segment anyway.
2561	if (ctx.arg.zSeparate == SeparateSegmentKind::Loadable \|\|
2562	(ctx.arg.zSeparate == SeparateSegmentKind::Code && prev &&
2563	(prev->p_flags & PF_X) != (p->p_flags & PF_X)) \|\|
2564	cmd->type == SHT_LLVM_PART_EHDR)
2565	cmd->addrExpr = [&ctx = this->ctx] {
2566	return alignToPowerOf2(ctx.script->getDot(), ctx.arg.maxPageSize);
2567	};
2568	// PT_TLS is at the start of the first RW PT_LOAD. If `p` includes PT_TLS,
2569	// it must be the RW. Align to p_align(PT_TLS) to make sure
2570	// p_vaddr(PT_LOAD)%p_align(PT_LOAD) = 0. Otherwise, if
2571	// sh_addralign(.tdata) < sh_addralign(.tbss), we will set p_align(PT_TLS)
2572	// to sh_addralign(.tbss), while p_vaddr(PT_TLS)=p_vaddr(PT_LOAD) may not
2573	// be congruent to 0 modulo p_align(PT_TLS).
2574	//
2575	// Technically this is not required, but as of 2019, some dynamic loaders
2576	// don't handle p_vaddr%p_align != 0 correctly, e.g. glibc (i386 and
2577	// x86-64) doesn't make runtime address congruent to p_vaddr modulo
2578	// p_align for dynamic TLS blocks (PR/24606), FreeBSD rtld has the same
2579	// bug, musl (TLS Variant 1 architectures) before 1.1.23 handled TLS
2580	// blocks correctly. We need to keep the workaround for a while.
2581	else if (ctx.tlsPhdr && ctx.tlsPhdr->firstSec == p->firstSec)
2582	cmd->addrExpr = [&ctx] {
2583	return alignToPowerOf2(ctx.script->getDot(), ctx.arg.maxPageSize) +
2584	alignToPowerOf2(ctx.script->getDot() % ctx.arg.maxPageSize,
2585	ctx.tlsPhdr->p_align);
2586	};
2587	else
2588	cmd->addrExpr = [&ctx] {
2589	return alignToPowerOf2(ctx.script->getDot(), ctx.arg.maxPageSize) +
2590	ctx.script->getDot() % ctx.arg.maxPageSize;
2591	};
2592	}
2593	};
2594
2595	for (Partition &part : ctx.partitions) {
2596	prev = nullptr;
2597	for (auto &p : part.phdrs)
2598	if (p ->p_type == PT_LOAD && p ->firstSec) {
2599	pageAlign(p.get());
2600	prev = p.get();
2601	}
2602	}
2603	}
2604
2605	// Compute an in-file position for a given section. The file offset must be the
2606	// same with its virtual address modulo the page size, so that the loader can
2607	// load executables without any address adjustment.
2608	static uint64_t computeFileOffset(Ctx &ctx, OutputSection *os, uint64_t off) {
2609	// The first section in a PT_LOAD has to have congruent offset and address
2610	// modulo the maximum page size.
2611	if (os->ptLoad && os->ptLoad->firstSec == os)
2612	return alignTo(Value: off, Align: os->ptLoad->p_align, Skew: os->addr);
2613
2614	// File offsets are not significant for .bss sections other than the first one
2615	// in a PT_LOAD/PT_TLS. By convention, we keep section offsets monotonically
2616	// increasing rather than setting to zero.
2617	if (os->type == SHT_NOBITS && (!ctx.tlsPhdr \|\| ctx.tlsPhdr->firstSec != os))
2618	return off;
2619
2620	// If the section is not in a PT_LOAD, we just have to align it.
2621	if (!os->ptLoad)
2622	return alignToPowerOf2(Value: off, Align: os->addralign);
2623
2624	// If two sections share the same PT_LOAD the file offset is calculated
2625	// using this formula: Off2 = Off1 + (VA2 - VA1).
2626	OutputSection *first = os->ptLoad->firstSec;
2627	return first->offset + os->addr - first->addr;
2628	}
2629
2630	template <class ELFT> void Writer<ELFT>::assignFileOffsetsBinary() {
2631	// Compute the minimum LMA of all non-empty non-NOBITS sections as minAddr.
2632	auto needsOffset = [](OutputSection &sec) {
2633	return sec.type != SHT_NOBITS && (sec.flags & SHF_ALLOC) && sec.size > `0`;
2634	};
2635	uint64_t minAddr = UINT64_MAX;
2636	for (OutputSection *sec : ctx.outputSections)
2637	if (needsOffset(*sec)) {
2638	sec->offset = sec->getLMA();
2639	minAddr = std::min(a: minAddr, b: sec->offset);
2640	}
2641
2642	// Sections are laid out at LMA minus minAddr.
2643	fileSize = `0`;
2644	for (OutputSection *sec : ctx.outputSections)
2645	if (needsOffset(*sec)) {
2646	sec->offset -= minAddr;
2647	fileSize = std::max(a: fileSize, b: sec->offset + sec->size);
2648	}
2649	}
2650
2651	static std::string rangeToString(uint64_t addr, uint64_t len) {
2652	return "[0x" + utohexstr(X: addr) + ", 0x" + utohexstr(X: addr + len - `1`) + "]";
2653	}
2654
2655	// Assign file offsets to output sections.
2656	template <class ELFT> void Writer<ELFT>::assignFileOffsets() {
2657	ctx.out.programHeaders ->offset = ctx.out.elfHeader ->size;
2658	uint64_t off = ctx.out.elfHeader ->size + ctx.out.programHeaders ->size;
2659
2660	PhdrEntry lastRX = nullptr*;
2661	for (Partition &part : ctx.partitions)
2662	for (auto &p : part.phdrs)
2663	if (p ->p_type == PT_LOAD && (p ->p_flags & PF_X))
2664	lastRX = p.get();
2665
2666	// Layout SHF_ALLOC sections before non-SHF_ALLOC sections. A non-SHF_ALLOC
2667	// will not occupy file offsets contained by a PT_LOAD.
2668	for (OutputSection *sec : ctx.outputSections) {
2669	if (!(sec->flags & SHF_ALLOC))
2670	continue;
2671	off = computeFileOffset(ctx, os: sec, off);
2672	sec->offset = off;
2673	if (sec->type != SHT_NOBITS)
2674	off += sec->size;
2675
2676	// If this is a last section of the last executable segment and that
2677	// segment is the last loadable segment, align the offset of the
2678	// following section to avoid loading non-segments parts of the file.
2679	if (ctx.arg.zSeparate != SeparateSegmentKind::None && lastRX &&
2680	lastRX->lastSec == sec)
2681	off = alignToPowerOf2(Value: off, Align: ctx.arg.maxPageSize);
2682	}
2683	for (OutputSection *osec : ctx.outputSections) {
2684	if (osec->flags & SHF_ALLOC)
2685	continue;
2686	osec->offset = alignToPowerOf2(Value: off, Align: osec->addralign);
2687	off = osec->offset + osec->size;
2688	}
2689
2690	sectionHeaderOff = alignToPowerOf2(Value: off, Align: ctx.arg.wordsize);
2691	fileSize =
2692	sectionHeaderOff + (ctx.outputSections.size() + `1`) * sizeof(Elf_Shdr);
2693
2694	// Our logic assumes that sections have rising VA within the same segment.
2695	// With use of linker scripts it is possible to violate this rule and get file
2696	// offset overlaps or overflows. That should never happen with a valid script
2697	// which does not move the location counter backwards and usually scripts do
2698	// not do that. Unfortunately, there are apps in the wild, for example, Linux
2699	// kernel, which control segment distribution explicitly and move the counter
2700	// backwards, so we have to allow doing that to support linking them. We
2701	// perform non-critical checks for overlaps in checkSectionOverlap(), but here
2702	// we want to prevent file size overflows because it would crash the linker.
2703	for (OutputSection *sec : ctx.outputSections) {
2704	if (sec->type == SHT_NOBITS)
2705	continue;
2706	if ((sec->offset > fileSize) \|\| (sec->offset + sec->size > fileSize))
2707	ErrAlways(ctx) << "unable to place section " << sec->name
2708	<< " at file offset "
2709	<< rangeToString(addr: sec->offset, len: sec->size)
2710	<< "; check your linker script for overflows";
2711	}
2712	}
2713
2714	// Finalize the program headers. We call this function after we assign
2715	// file offsets and VAs to all sections.
2716	template <class ELFT> void Writer<ELFT>::setPhdrs(Partition &part) {
2717	for (std::unique_ptr<PhdrEntry> &p : part.phdrs) {
2718	OutputSection *first = p ->firstSec;
2719	OutputSection *last = p ->lastSec;
2720
2721	// .ARM.exidx sections may not be within a single .ARM.exidx
2722	// output section. We always want to describe just the
2723	// SyntheticSection.
2724	if (part.armExidx && p ->p_type == PT_ARM_EXIDX) {
2725	p ->p_filesz = part.armExidx ->getSize();
2726	p ->p_memsz = p ->p_filesz;
2727	p ->p_offset = first->offset + part.armExidx ->outSecOff;
2728	p ->p_vaddr = first->addr + part.armExidx ->outSecOff;
2729	p ->p_align = part.armExidx ->addralign;
2730	if (part.elfHeader)
2731	p ->p_offset -= part.elfHeader ->getParent()->offset;
2732
2733	if (!p ->hasLMA)
2734	p ->p_paddr = first->getLMA() + part.armExidx ->outSecOff;
2735	return;
2736	}
2737
2738	if (first) {
2739	p ->p_filesz = last->offset - first->offset;
2740	if (last->type != SHT_NOBITS)
2741	p ->p_filesz += last->size;
2742
2743	p ->p_memsz = last->addr + last->size - first->addr;
2744	p ->p_offset = first->offset;
2745	p ->p_vaddr = first->addr;
2746
2747	// File offsets in partitions other than the main partition are relative
2748	// to the offset of the ELF headers. Perform that adjustment now.
2749	if (part.elfHeader)
2750	p ->p_offset -= part.elfHeader ->getParent()->offset;
2751
2752	if (!p ->hasLMA)
2753	p ->p_paddr = first->getLMA();
2754	}
2755	}
2756	}
2757
2758	// A helper struct for checkSectionOverlap.
2759	namespace {
2760	struct SectionOffset {
2761	OutputSection *sec;
2762	uint64_t offset;
2763	};
2764	} // namespace
2765
2766	// Check whether sections overlap for a specific address range (file offsets,
2767	// load and virtual addresses).
2768	static void checkOverlap(Ctx &ctx, StringRef name,
2769	std::vector<SectionOffset> &sections,
2770	bool isVirtualAddr) {
2771	llvm::sort(C&: sections, Comp: [=](const SectionOffset &a, const SectionOffset &b) {
2772	return a.offset < b.offset;
2773	});
2774
2775	// Finding overlap is easy given a vector is sorted by start position.
2776	// If an element starts before the end of the previous element, they overlap.
2777	for (size_t i = `1`, end = sections.size(); i < end; ++i) {
2778	SectionOffset a = sections [i - `1`];
2779	SectionOffset b = sections [i];
2780	if (b.offset >= a.offset + a.sec->size)
2781	continue;
2782
2783	// If both sections are in OVERLAY we allow the overlapping of virtual
2784	// addresses, because it is what OVERLAY was designed for.
2785	if (isVirtualAddr && a.sec->inOverlay && b.sec->inOverlay)
2786	continue;
2787
2788	Err(ctx) << "section " << a.sec->name << " " << name
2789	<< " range overlaps with " << b.sec->name << "\n>>> "
2790	<< a.sec->name << " range is "
2791	<< rangeToString(addr: a.offset, len: a.sec->size) << "\n>>> " << b.sec->name
2792	<< " range is " << rangeToString(addr: b.offset, len: b.sec->size);
2793	}
2794	}
2795
2796	// Check for overlapping sections and address overflows.
2797	//
2798	// In this function we check that none of the output sections have overlapping
2799	// file offsets. For SHF_ALLOC sections we also check that the load address
2800	// ranges and the virtual address ranges don't overlap
2801	template <class ELFT> void Writer<ELFT>::checkSections() {
2802	// First, check that section's VAs fit in available address space for target.
2803	for (OutputSection *os : ctx.outputSections)
2804	if ((os->addr + os->size < os->addr) \|\|
2805	(!ELFT::Is64Bits && os->addr + os->size > uint64_t(UINT32_MAX) + `1`))
2806	Err(ctx) << "section " << os->name << " at 0x"
2807	<< utohexstr(X: os->addr, LowerCase: true) << " of size 0x"
2808	<< utohexstr(X: os->size, LowerCase: true)
2809	<< " exceeds available address space";
2810
2811	// Check for overlapping file offsets. In this case we need to skip any
2812	// section marked as SHT_NOBITS. These sections don't actually occupy space in
2813	// the file so Sec->Offset + Sec->Size can overlap with others. If --oformat
2814	// binary is specified only add SHF_ALLOC sections are added to the output
2815	// file so we skip any non-allocated sections in that case.
2816	std::vector<SectionOffset> fileOffs;
2817	for (OutputSection *sec : ctx.outputSections)
2818	if (sec->size > `0` && sec->type != SHT_NOBITS &&
2819	(!ctx.arg.oFormatBinary \|\| (sec->flags & SHF_ALLOC)))
2820	fileOffs.push_back(x: {.sec: sec, .offset: sec->offset});
2821	checkOverlap(ctx, name: "file", sections&: fileOffs, isVirtualAddr: false);
2822
2823	// When linking with -r there is no need to check for overlapping virtual/load
2824	// addresses since those addresses will only be assigned when the final
2825	// executable/shared object is created.
2826	if (ctx.arg.relocatable)
2827	return;
2828
2829	// Checking for overlapping virtual and load addresses only needs to take
2830	// into account SHF_ALLOC sections since others will not be loaded.
2831	// Furthermore, we also need to skip SHF_TLS sections since these will be
2832	// mapped to other addresses at runtime and can therefore have overlapping
2833	// ranges in the file.
2834	std::vector<SectionOffset> vmas;
2835	for (OutputSection *sec : ctx.outputSections)
2836	if (sec->size > `0` && (sec->flags & SHF_ALLOC) && !(sec->flags & SHF_TLS))
2837	vmas.push_back(x: {.sec: sec, .offset: sec->addr});
2838	checkOverlap(ctx, name: "virtual address", sections&: vmas, isVirtualAddr: true);
2839
2840	// Finally, check that the load addresses don't overlap. This will usually be
2841	// the same as the virtual addresses but can be different when using a linker
2842	// script with AT().
2843	std::vector<SectionOffset> lmas;
2844	for (OutputSection *sec : ctx.outputSections)
2845	if (sec->size > `0` && (sec->flags & SHF_ALLOC) && !(sec->flags & SHF_TLS))
2846	lmas.push_back(x: {.sec: sec, .offset: sec->getLMA()});
2847	checkOverlap(ctx, name: "load address", sections&: lmas, isVirtualAddr: false);
2848	}
2849
2850	// The entry point address is chosen in the following ways.
2851	//
2852	// 1. the '-e' entry command-line option;
2853	// 2. the ENTRY(symbol) command in a linker control script;
2854	// 3. the value of the symbol _start, if present;
2855	// 4. the number represented by the entry symbol, if it is a number;
2856	// 5. the address 0.
2857	static uint64_t getEntryAddr(Ctx &ctx) {
2858	// Case 1, 2 or 3
2859	if (Symbol *b = ctx.symtab ->find(name: ctx.arg.entry))
2860	return b->getVA(ctx);
2861
2862	// Case 4
2863	uint64_t addr;
2864	if (to_integer(S: ctx.arg.entry, Num&: addr))
2865	return addr;
2866
2867	// Case 5
2868	if (ctx.arg.warnMissingEntry)
2869	Warn(ctx) << "cannot find entry symbol " << ctx.arg.entry
2870	<< "; not setting start address";
2871	return `0`;
2872	}
2873
2874	static uint16_t getELFType(Ctx &ctx) {
2875	if (ctx.arg.isPic)
2876	return ET_DYN;
2877	if (ctx.arg.relocatable)
2878	return ET_REL;
2879	return ET_EXEC;
2880	}
2881
2882	template <class ELFT> void Writer<ELFT>::writeHeader() {
2883	writeEhdr<ELFT>(ctx, ctx.bufferStart, *ctx.mainPart);
2884	writePhdrs<ELFT>(ctx.bufferStart + sizeof(Elf_Ehdr), *ctx.mainPart);
2885
2886	auto eHdr = reinterpret_cast<Elf_Ehdr >(ctx.bufferStart);
2887	eHdr->e_type = getELFType(ctx);
2888	eHdr->e_entry = getEntryAddr(ctx);
2889
2890	// If -z nosectionheader is specified, omit the section header table.
2891	if (!ctx.in.shStrTab)
2892	return;
2893	eHdr->e_shoff = sectionHeaderOff;
2894
2895	// Write the section header table.
2896	//
2897	// The ELF header can only store numbers up to SHN_LORESERVE in the e_shnum
2898	// and e_shstrndx fields. When the value of one of these fields exceeds
2899	// SHN_LORESERVE ELF requires us to put sentinel values in the ELF header and
2900	// use fields in the section header at index 0 to store
2901	// the value. The sentinel values and fields are:
2902	// e_shnum = 0, SHdrs[0].sh_size = number of sections.
2903	// e_shstrndx = SHN_XINDEX, SHdrs[0].sh_link = .shstrtab section index.
2904	auto sHdrs = reinterpret_cast<Elf_Shdr >(ctx.bufferStart + eHdr->e_shoff);
2905	size_t num = ctx.outputSections.size() + `1`;
2906	if (num >= SHN_LORESERVE)
2907	sHdrs->sh_size = num;
2908	else
2909	eHdr->e_shnum = num;
2910
2911	uint32_t strTabIndex = ctx.in.shStrTab ->getParent()->sectionIndex;
2912	if (strTabIndex >= SHN_LORESERVE) {
2913	sHdrs->sh_link = strTabIndex;
2914	eHdr->e_shstrndx = SHN_XINDEX;
2915	} else {
2916	eHdr->e_shstrndx = strTabIndex;
2917	}
2918
2919	for (OutputSection *sec : ctx.outputSections)
2920	sec->writeHeaderTo<ELFT>(++sHdrs);
2921	}
2922
2923	// Open a result file.
2924	template <class ELFT> void Writer<ELFT>::openFile() {
2925	uint64_t maxSize = ctx.arg.is64 ? INT64_MAX : UINT32_MAX;
2926	if (fileSize != size_t(fileSize) \|\| maxSize < fileSize) {
2927	std::string msg;
2928	raw_string_ostream s(msg);
2929	s << "output file too large: " << fileSize << " bytes\n"
2930	<< "section sizes:\n";
2931	for (OutputSection *os : ctx.outputSections)
2932	s << os->name << `' '` << os->size << "\n";
2933	ErrAlways(ctx) << msg;
2934	return;
2935	}
2936
2937	unlinkAsync(path: ctx.arg.outputFile);
2938	unsigned flags = `0`;
2939	if (!ctx.arg.relocatable)
2940	flags \|= FileOutputBuffer::F_executable;
2941	if (ctx.arg.mmapOutputFile)
2942	flags \|= FileOutputBuffer::F_mmap;
2943	Expected<std::unique_ptr<FileOutputBuffer>> bufferOrErr =
2944	FileOutputBuffer::create(FilePath: ctx.arg.outputFile, Size: fileSize, Flags: flags);
2945
2946	if (!bufferOrErr) {
2947	ErrAlways(ctx) << "failed to open " << ctx.arg.outputFile << ": "
2948	<< bufferOrErr.takeError();
2949	return;
2950	}
2951	buffer = std::move(*bufferOrErr);
2952	ctx.bufferStart = buffer ->getBufferStart();
2953	}
2954
2955	template <class ELFT> void Writer<ELFT>::writeSectionsBinary() {
2956	parallel::TaskGroup tg;
2957	for (OutputSection *sec : ctx.outputSections)
2958	if (sec->flags & SHF_ALLOC)
2959	sec->writeTo<ELFT>(ctx, ctx.bufferStart + sec->offset, tg);
2960	}
2961
// Fill [i, end) with copies of the 4-byte trap instruction `trapInstr`. Only
// whole 4-byte slots are written; up to three trailing bytes are left
// untouched, and nothing is written when `i` is at or past `end`.
static void fillTrap(std::array<uint8_t, 4> trapInstr, uint8_t *i,
                     uint8_t *end) {
  // Compare the remaining length instead of forming `i + 4`, which could
  // point beyond one-past-the-end of the buffer when fewer than four bytes
  // remain.
  for (; end - i >= 4; i += 4)
    memcpy(i, trapInstr.data(), trapInstr.size());
}
2967
2968	// Fill executable segments with trap instructions. This includes both the
2969	// gaps between sections (due to alignment) and the tail padding to the page
2970	// boundary. Even though it is not required by any standard, it is in general
2971	// a good thing to do for security reasons.
2972	template <class ELFT> void Writer<ELFT>::writeTrapInstr() {
2973	for (Partition &part : ctx.partitions) {
2974	// Fill gaps between consecutive sections in the same executable segment.
2975	OutputSection prev = nullptr*;
2976	for (OutputSection *sec : ctx.outputSections) {
2977	PhdrEntry *p = sec->ptLoad;
2978	if (!p \|\| !(p->p_flags & PF_X))
2979	continue;
2980	if (prev && prev->ptLoad == p)
2981	fillTrap(trapInstr: ctx.target ->trapInstr,
2982	i: ctx.bufferStart + alignDown(Value: prev->offset + prev->size, Align: `4`),
2983	end: ctx.bufferStart + sec->offset);
2984	prev = sec;
2985	}
2986
2987	// Fill the last page.
2988	for (std::unique_ptr<PhdrEntry> &p : part.phdrs)
2989	if (p ->p_type == PT_LOAD && (p ->p_flags & PF_X))
2990	fillTrap(
2991	trapInstr: ctx.target ->trapInstr,
2992	i: ctx.bufferStart + alignDown(Value: p ->firstSec->offset + p ->p_filesz, Align: `4`),
2993	end: ctx.bufferStart + alignToPowerOf2(Value: p ->firstSec->offset + p ->p_filesz,
2994	Align: ctx.arg.maxPageSize));
2995
2996	// Round up the file size of the last segment to the page boundary iff it is
2997	// an executable segment to ensure that other tools don't accidentally
2998	// trim the instruction padding (e.g. when stripping the file).
2999	PhdrEntry last = nullptr*;
3000	for (std::unique_ptr<PhdrEntry> &p : part.phdrs)
3001	if (p ->p_type == PT_LOAD)
3002	last = p.get();
3003
3004	if (last && (last->p_flags & PF_X)) {
3005	last->p_filesz = alignToPowerOf2(Value: last->p_filesz, Align: ctx.arg.maxPageSize);
3006	// p_memsz might be larger than the aligned p_filesz due to trailing BSS
3007	// sections. Don't decrease it.
3008	last->p_memsz = std::max(a: last->p_memsz, b: last->p_filesz);
3009	}
3010	}
3011	}
3012
3013	// Write section contents to a mmap'ed file.
3014	template <class ELFT> void Writer<ELFT>::writeSections() {
3015	llvm::TimeTraceScope timeScope("Write sections");
3016
3017	{
3018	// In -r or --emit-relocs mode, write the relocation sections first as in
3019	// ELf_Rel targets we might find out that we need to modify the relocated
3020	// section while doing it.
3021	parallel::TaskGroup tg;
3022	for (OutputSection *sec : ctx.outputSections)
3023	if (isStaticRelSecType(type: sec->type))
3024	sec->writeTo<ELFT>(ctx, ctx.bufferStart + sec->offset, tg);
3025	}
3026	{
3027	parallel::TaskGroup tg;
3028	for (OutputSection *sec : ctx.outputSections)
3029	if (!isStaticRelSecType(type: sec->type))
3030	sec->writeTo<ELFT>(ctx, ctx.bufferStart + sec->offset, tg);
3031	}
3032
3033	// Finally, check that all dynamic relocation addends were written correctly.
3034	if (ctx.arg.checkDynamicRelocs && ctx.arg.writeAddends) {
3035	for (OutputSection *sec : ctx.outputSections)
3036	if (isStaticRelSecType(type: sec->type))
3037	sec->checkDynRelAddends(ctx);
3038	}
3039	}
3040
3041	// Computes a hash value of Data using a given hash function.
3042	// In order to utilize multiple cores, we first split data into 1MB
3043	// chunks, compute a hash for each chunk, and then compute a hash value
3044	// of the hash values.
3045	static void
3046	computeHash(llvm::MutableArrayRef<uint8_t> hashBuf,
3047	llvm::ArrayRef<uint8_t> data,
3048	std::function<void(uint8_t *dest, ArrayRef<uint8_t> arr)> hashFn) {
3049	std::vector<ArrayRef<uint8_t>> chunks = split(arr: data, chunkSize: `1024` * `1024`);
3050	const size_t hashesSize = chunks.size() * hashBuf.size();
3051	std::unique_ptr<uint8_t[]> hashes(new uint8_t[hashesSize]);
3052
3053	// Compute hash values.
3054	parallelFor(Begin: `0`, End: chunks.size(), Fn: [&](size_t i) {
3055	hashFn (hashes.get() + i * hashBuf.size(), chunks [i]);
3056	});
3057
3058	// Write to the final output buffer.
3059	hashFn (hashBuf.data(), ArrayRef(hashes.get(), hashesSize));
3060	}
3061
3062	template <class ELFT> void Writer<ELFT>::writeBuildId() {
3063	if (!ctx.mainPart->buildId \|\| !ctx.mainPart->buildId ->getParent())
3064	return;
3065
3066	if (ctx.arg.buildId == BuildIdKind::Hexstring) {
3067	for (Partition &part : ctx.partitions)
3068	part.buildId ->writeBuildId(buf: ctx.arg.buildIdVector);
3069	return;
3070	}
3071
3072	// Compute a hash of all sections of the output file.
3073	size_t hashSize = ctx.mainPart->buildId ->hashSize;
3074	std::unique_ptr<uint8_t[]> buildId(new uint8_t[hashSize]);
3075	MutableArrayRef<uint8_t> output(buildId.get(), hashSize);
3076	llvm::ArrayRef<uint8_t> input{ctx.bufferStart, size_t(fileSize)};
3077
3078	// Fedora introduced build ID as "approximation of true uniqueness across all
3079	// binaries that might be used by overlapping sets of people". It does not
3080	// need some security goals that some hash algorithms strive to provide, e.g.
3081	// (second-)preimage and collision resistance. In practice people use 'md5'
3082	// and 'sha1' just for different lengths. Implement them with the more
3083	// efficient BLAKE3.
3084	switch (ctx.arg.buildId) {
3085	case BuildIdKind::Fast:
3086	computeHash(output, input, [](uint8_t *dest, ArrayRef<uint8_t> arr) {
3087	write64le(P: dest, V: xxh3_64bits(data: arr));
3088	});
3089	break;
3090	case BuildIdKind::Md5:
3091	computeHash(output, input, [&](uint8_t *dest, ArrayRef<uint8_t> arr) {
3092	memcpy(dest: dest, src: BLAKE3::hash<`16`>(Data: arr).data(), n: hashSize);
3093	});
3094	break;
3095	case BuildIdKind::Sha1:
3096	computeHash(output, input, [&](uint8_t *dest, ArrayRef<uint8_t> arr) {
3097	memcpy(dest: dest, src: BLAKE3::hash<`20`>(Data: arr).data(), n: hashSize);
3098	});
3099	break;
3100	case BuildIdKind::Uuid:
3101	if (auto ec = llvm::getRandomBytes(Buffer: buildId.get(), Size: hashSize))
3102	ErrAlways(ctx) << "entropy source failure: " << ec.message();
3103	break;
3104	default:
3105	llvm_unreachable("unknown BuildIdKind");
3106	}
3107	for (Partition &part : ctx.partitions)
3108	part.buildId ->writeBuildId(buf: output);
3109	}
3110
3111	template void elf::writeResult<ELF32LE>(Ctx &);
3112	template void elf::writeResult<ELF32BE>(Ctx &);
3113	template void elf::writeResult<ELF64LE>(Ctx &);
3114	template void elf::writeResult<ELF64BE>(Ctx &);
3115

// Browse the source code of llvm_projects/lld/ELF/Writer.cpp