1 | //===- OutputSegment.cpp --------------------------------------------------===// |
2 | // |
3 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. |
4 | // See https://llvm.org/LICENSE.txt for license information. |
5 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception |
6 | // |
7 | //===----------------------------------------------------------------------===// |
8 | |
9 | #include "OutputSegment.h" |
10 | #include "ConcatOutputSection.h" |
11 | #include "InputSection.h" |
12 | #include "Sections.h" |
13 | #include "Symbols.h" |
14 | #include "SyntheticSections.h" |
15 | |
16 | #include "lld/Common/Memory.h" |
17 | #include "llvm/ADT/StringSwitch.h" |
18 | #include "llvm/BinaryFormat/MachO.h" |
19 | |
20 | using namespace llvm; |
21 | using namespace llvm::MachO; |
22 | using namespace lld; |
23 | using namespace lld::macho; |
24 | |
25 | static uint32_t initProt(StringRef name) { |
26 | auto it = find_if( |
27 | Range&: config->segmentProtections, |
28 | P: [&](const SegmentProtection &segprot) { return segprot.name == name; }); |
29 | if (it != config->segmentProtections.end()) |
30 | return it->initProt; |
31 | |
32 | if (name == segment_names::text) |
33 | return VM_PROT_READ | VM_PROT_EXECUTE; |
34 | if (name == segment_names::pageZero) |
35 | return 0; |
36 | if (name == segment_names::linkEdit) |
37 | return VM_PROT_READ; |
38 | return VM_PROT_READ | VM_PROT_WRITE; |
39 | } |
40 | |
41 | static uint32_t maxProt(StringRef name) { |
42 | assert(config->arch() != AK_i386 && |
43 | "TODO: i386 has different maxProt requirements" ); |
44 | auto it = find_if( |
45 | Range&: config->segmentProtections, |
46 | P: [&](const SegmentProtection &segprot) { return segprot.name == name; }); |
47 | if (it != config->segmentProtections.end()) |
48 | return it->maxProt; |
49 | |
50 | return initProt(name); |
51 | } |
52 | |
53 | static uint32_t flags(StringRef name) { |
54 | // If we ever implement shared cache output support, SG_READ_ONLY should not |
55 | // be used for dylibs that can be placed in it. |
56 | return name == segment_names::dataConst ? (uint32_t)SG_READ_ONLY : 0; |
57 | } |
58 | |
59 | size_t OutputSegment::numNonHiddenSections() const { |
60 | size_t count = 0; |
61 | for (const OutputSection *osec : sections) |
62 | count += (!osec->isHidden() ? 1 : 0); |
63 | return count; |
64 | } |
65 | |
66 | void OutputSegment::addOutputSection(OutputSection *osec) { |
67 | inputOrder = std::min(a: inputOrder, b: osec->inputOrder); |
68 | |
69 | osec->parent = this; |
70 | sections.push_back(x: osec); |
71 | |
72 | for (const SectionAlign §Align : config->sectionAlignments) |
73 | if (sectAlign.segName == name && sectAlign.sectName == osec->name) |
74 | osec->align = sectAlign.align; |
75 | } |
76 | |
/// Builds a strict "less than" comparator over values of type \p T that
/// compares the keys produced by \p ord instead of the values themselves.
/// \p ord is copied into the returned closure.
template <typename T, typename F> static auto compareByOrder(F ord) {
  return [ord](T lhs, T rhs) {
    return ord(lhs) < ord(rhs);
  };
}
80 | |
81 | static int segmentOrder(OutputSegment *seg) { |
82 | return StringSwitch<int>(seg->name) |
83 | .Case(S: segment_names::pageZero, Value: -4) |
84 | .Case(S: segment_names::text, Value: -3) |
85 | .Case(S: segment_names::dataConst, Value: -2) |
86 | .Case(S: segment_names::data, Value: -1) |
87 | .Case(S: segment_names::llvm, Value: std::numeric_limits<int>::max() - 1) |
88 | // Make sure __LINKEDIT is the last segment (i.e. all its hidden |
89 | // sections must be ordered after other sections). |
90 | .Case(S: segment_names::linkEdit, Value: std::numeric_limits<int>::max()) |
91 | .Default(Value: seg->inputOrder); |
92 | } |
93 | |
94 | static int sectionOrder(OutputSection *osec) { |
95 | StringRef segname = osec->parent->name; |
96 | // Sections are uniquely identified by their segment + section name. |
97 | if (segname == segment_names::text) { |
98 | if (osec->name == section_names::header) |
99 | return -7; |
100 | // `__text` needs to precede the other code sections since its |
101 | // expected to be the largest. This means in effect that it will |
102 | // be the section that determines whether we need thunks or not. |
103 | if (osec->name == section_names::text) |
104 | return -6; |
105 | |
106 | // Prioritize specific section ordering based on our knowledge. This ensures |
107 | // that certain sections are placed in a particular order, even if they |
108 | // are also categorized as code sections. This explicit ordering takes |
109 | // precedence over the general code section ordering. |
110 | int knownPriority = |
111 | StringSwitch<int>(osec->name) |
112 | .Case(S: section_names::stubs, Value: -4) |
113 | .Case(S: section_names::stubHelper, Value: -3) |
114 | .Case(S: section_names::objcStubs, Value: -2) |
115 | .Case(S: section_names::initOffsets, Value: -1) |
116 | .Case(S: section_names::unwindInfo, |
117 | Value: std::numeric_limits<int>::max() - 1) |
118 | .Case(S: section_names::ehFrame, Value: std::numeric_limits<int>::max()) |
119 | .Default(Value: 0); |
120 | |
121 | if (knownPriority != 0) |
122 | return knownPriority; |
123 | |
124 | // Ensure all code sections are contiguous with `__text` for thunk |
125 | // calculations. |
126 | if (sections::isCodeSection(name: osec->name, segName: segment_names::text, flags: osec->flags)) { |
127 | return -5; |
128 | } |
129 | |
130 | return osec->inputOrder; |
131 | } else if (segname == segment_names::data || |
132 | segname == segment_names::dataConst) { |
133 | // For each thread spawned, dyld will initialize its TLVs by copying the |
134 | // address range from the start of the first thread-local data section to |
135 | // the end of the last one. We therefore arrange these sections contiguously |
136 | // to minimize the amount of memory used. Additionally, since zerofill |
137 | // sections must be at the end of their segments, and since TLV data |
138 | // sections can be zerofills, we end up putting all TLV data sections at the |
139 | // end of the segment. |
140 | switch (sectionType(flags: osec->flags)) { |
141 | case S_THREAD_LOCAL_VARIABLE_POINTERS: |
142 | return std::numeric_limits<int>::max() - 3; |
143 | case S_THREAD_LOCAL_REGULAR: |
144 | return std::numeric_limits<int>::max() - 2; |
145 | case S_THREAD_LOCAL_ZEROFILL: |
146 | return std::numeric_limits<int>::max() - 1; |
147 | case S_ZEROFILL: |
148 | return std::numeric_limits<int>::max(); |
149 | default: |
150 | return StringSwitch<int>(osec->name) |
151 | .Case(S: section_names::got, Value: -3) |
152 | .Case(S: section_names::lazySymbolPtr, Value: -2) |
153 | .Case(S: section_names::const_, Value: -1) |
154 | .Default(Value: osec->inputOrder); |
155 | } |
156 | } else if (segname == segment_names::linkEdit) { |
157 | return StringSwitch<int>(osec->name) |
158 | .Case(S: section_names::chainFixups, Value: -11) |
159 | .Case(S: section_names::rebase, Value: -10) |
160 | .Case(S: section_names::binding, Value: -9) |
161 | .Case(S: section_names::weakBinding, Value: -8) |
162 | .Case(S: section_names::lazyBinding, Value: -7) |
163 | .Case(S: section_names::export_, Value: -6) |
164 | .Case(S: section_names::functionStarts, Value: -5) |
165 | .Case(S: section_names::dataInCode, Value: -4) |
166 | .Case(S: section_names::symbolTable, Value: -3) |
167 | .Case(S: section_names::indirectSymbolTable, Value: -2) |
168 | .Case(S: section_names::stringTable, Value: -1) |
169 | .Case(S: section_names::codeSignature, Value: std::numeric_limits<int>::max()) |
170 | .Default(Value: osec->inputOrder); |
171 | } |
172 | // ZeroFill sections must always be the at the end of their segments: |
173 | // dyld checks if a segment's file size is smaller than its in-memory |
174 | // size to detect if a segment has zerofill sections, and if so it maps |
175 | // the missing tail as zerofill. |
176 | if (sectionType(flags: osec->flags) == S_ZEROFILL) |
177 | return std::numeric_limits<int>::max(); |
178 | return osec->inputOrder; |
179 | } |
180 | |
181 | void OutputSegment::sortOutputSections() { |
182 | // Must be stable_sort() to keep special sections such as |
183 | // S_THREAD_LOCAL_REGULAR in input order. |
184 | llvm::stable_sort(Range&: sections, C: compareByOrder<OutputSection *>(ord: sectionOrder)); |
185 | } |
186 | |
187 | void OutputSegment::assignAddressesToStartEndSymbols() { |
188 | for (Defined *d : segmentStartSymbols) |
189 | d->value = addr; |
190 | for (Defined *d : segmentEndSymbols) |
191 | d->value = addr + vmSize; |
192 | } |
193 | |
194 | void macho::sortOutputSegments() { |
195 | llvm::stable_sort(Range&: outputSegments, |
196 | C: compareByOrder<OutputSegment *>(ord: segmentOrder)); |
197 | } |
198 | |
// Lookup table from segment name to the OutputSegment created for it. It is
// keyed by the name returned from maybeRenameSegment(), filled in by
// getOrCreateOutputSegment(), and emptied by resetOutputSegments().
static DenseMap<StringRef, OutputSegment *> nameToOutputSegment;
// Every OutputSegment created by getOrCreateOutputSegment(), appended in
// creation order; sortOutputSegments() reorders it in place.
std::vector<OutputSegment *> macho::outputSegments;
201 | |
202 | void macho::resetOutputSegments() { |
203 | outputSegments.clear(); |
204 | nameToOutputSegment.clear(); |
205 | } |
206 | |
207 | static StringRef maybeRenameSegment(StringRef name) { |
208 | auto newName = config->segmentRenameMap.find(Val: name); |
209 | if (newName != config->segmentRenameMap.end()) |
210 | return newName->second; |
211 | return name; |
212 | } |
213 | |
214 | OutputSegment *macho::getOrCreateOutputSegment(StringRef name) { |
215 | name = maybeRenameSegment(name); |
216 | |
217 | OutputSegment *&segRef = nameToOutputSegment[name]; |
218 | if (segRef) |
219 | return segRef; |
220 | |
221 | segRef = make<OutputSegment>(); |
222 | segRef->name = name; |
223 | segRef->maxProt = maxProt(name); |
224 | segRef->initProt = initProt(name); |
225 | segRef->flags = flags(name); |
226 | |
227 | outputSegments.push_back(x: segRef); |
228 | return segRef; |
229 | } |
230 | |