annotate lld/ELF/ARMErrataFix.cpp @ 192:d7606dcf6fce

Added tag llvm10 for changeset 0572611fdcc8
author Shinji KONO <kono@ie.u-ryukyu.ac.jp>
date Mon, 14 Dec 2020 18:01:34 +0900
parents 0572611fdcc8
children 2e18cbf3894f
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
150
anatofuz
parents:
diff changeset
1 //===- ARMErrataFix.cpp ---------------------------------------------------===//
anatofuz
parents:
diff changeset
2 //
anatofuz
parents:
diff changeset
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
anatofuz
parents:
diff changeset
4 // See https://llvm.org/LICENSE.txt for license information.
anatofuz
parents:
diff changeset
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
anatofuz
parents:
diff changeset
6 //
anatofuz
parents:
diff changeset
7 //===----------------------------------------------------------------------===//
anatofuz
parents:
diff changeset
8 // This file implements Section Patching for the purpose of working around the
anatofuz
parents:
diff changeset
9 // Cortex-a8 erratum 657417 "A 32bit branch instruction that spans 2 4K regions
anatofuz
parents:
diff changeset
10 // can result in an incorrect instruction fetch or processor deadlock." The
anatofuz
parents:
diff changeset
11 // erratum affects all but r1p7, r2p5, r2p6, r3p1 and r3p2 revisions of the
anatofuz
parents:
diff changeset
12 // Cortex-A8. A high level description of the patching technique is given in
anatofuz
parents:
diff changeset
13 // the opening comment of AArch64ErrataFix.cpp.
anatofuz
parents:
diff changeset
14 //===----------------------------------------------------------------------===//
anatofuz
parents:
diff changeset
15
anatofuz
parents:
diff changeset
16 #include "ARMErrataFix.h"
anatofuz
parents:
diff changeset
17
anatofuz
parents:
diff changeset
18 #include "Config.h"
anatofuz
parents:
diff changeset
19 #include "LinkerScript.h"
anatofuz
parents:
diff changeset
20 #include "OutputSections.h"
anatofuz
parents:
diff changeset
21 #include "Relocations.h"
anatofuz
parents:
diff changeset
22 #include "Symbols.h"
anatofuz
parents:
diff changeset
23 #include "SyntheticSections.h"
anatofuz
parents:
diff changeset
24 #include "Target.h"
anatofuz
parents:
diff changeset
25 #include "lld/Common/Memory.h"
anatofuz
parents:
diff changeset
26 #include "lld/Common/Strings.h"
anatofuz
parents:
diff changeset
27 #include "llvm/Support/Endian.h"
anatofuz
parents:
diff changeset
28 #include "llvm/Support/raw_ostream.h"
anatofuz
parents:
diff changeset
29 #include <algorithm>
anatofuz
parents:
diff changeset
30
anatofuz
parents:
diff changeset
31 using namespace llvm;
anatofuz
parents:
diff changeset
32 using namespace llvm::ELF;
anatofuz
parents:
diff changeset
33 using namespace llvm::object;
anatofuz
parents:
diff changeset
34 using namespace llvm::support;
anatofuz
parents:
diff changeset
35 using namespace llvm::support::endian;
173
0572611fdcc8 reorgnization done
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents: 150
diff changeset
36 using namespace lld;
0572611fdcc8 reorgnization done
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents: 150
diff changeset
37 using namespace lld::elf;
150
anatofuz
parents:
diff changeset
38
anatofuz
parents:
diff changeset
39 // The documented title for Erratum 657417 is:
anatofuz
parents:
diff changeset
40 // "A 32bit branch instruction that spans two 4K regions can result in an
anatofuz
parents:
diff changeset
41 // incorrect instruction fetch or processor deadlock". Graphically using a
anatofuz
parents:
diff changeset
42 // 32-bit B.w instruction encoded as a pair of halfwords 0xf7fe 0xbfff
anatofuz
parents:
diff changeset
43 // xxxxxx000 // Memory region 1 start
anatofuz
parents:
diff changeset
44 // target:
anatofuz
parents:
diff changeset
45 // ...
anatofuz
parents:
diff changeset
46 // xxxxxxffe f7fe // First halfword of branch to target:
anatofuz
parents:
diff changeset
47 // xxxxxx000 // Memory region 2 start
anatofuz
parents:
diff changeset
48 // xxxxxx002 bfff // Second halfword of branch to target:
anatofuz
parents:
diff changeset
49 //
anatofuz
parents:
diff changeset
50 // The specific trigger conditions that can be detected at link time are:
anatofuz
parents:
diff changeset
51 // - There is a 32-bit Thumb-2 branch instruction with an address of the form
anatofuz
parents:
diff changeset
52 // xxxxxxFFE. The first 2 bytes of the instruction are in 4KiB region 1, the
anatofuz
parents:
diff changeset
53 // second 2 bytes are in region 2.
anatofuz
parents:
diff changeset
54 // - The branch instruction is one of BLX, BL, B.w, BCC.w
anatofuz
parents:
diff changeset
55 // - The instruction preceding the branch is a 32-bit non-branch instruction.
anatofuz
parents:
diff changeset
56 // - The target of the branch is in region 1.
anatofuz
parents:
diff changeset
57 //
anatofuz
parents:
diff changeset
58 // The linker mitigation for the fix is to redirect any branch that meets the
anatofuz
parents:
diff changeset
59 // erratum conditions to a patch section containing a branch to the target.
anatofuz
parents:
diff changeset
60 //
anatofuz
parents:
diff changeset
61 // As adding patch sections may move branches onto region boundaries the patch
anatofuz
parents:
diff changeset
62 // must iterate until no more patches are added.
anatofuz
parents:
diff changeset
63 //
anatofuz
parents:
diff changeset
64 // Example, before:
anatofuz
parents:
diff changeset
65 // 00000FFA func: NOP.w // 32-bit Thumb function
anatofuz
parents:
diff changeset
66 // 00000FFE B.W func // 32-bit branch spanning 2 regions, dest in 1st.
anatofuz
parents:
diff changeset
67 // Example, after:
anatofuz
parents:
diff changeset
68 // 00000FFA func: NOP.w // 32-bit Thumb function
anatofuz
parents:
diff changeset
69 // 00000FFE B.w __CortexA8657417_00000FFE
anatofuz
parents:
diff changeset
70 // 00001002 2 - bytes padding
anatofuz
parents:
diff changeset
71 // 00001004 __CortexA8657417_00000FFE: B.w func
anatofuz
parents:
diff changeset
72
173
0572611fdcc8 reorgnization done
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents: 150
diff changeset
73 class elf::Patch657417Section : public SyntheticSection {
150
anatofuz
parents:
diff changeset
74 public:
anatofuz
parents:
diff changeset
75 Patch657417Section(InputSection *p, uint64_t off, uint32_t instr, bool isARM);
anatofuz
parents:
diff changeset
76
anatofuz
parents:
diff changeset
77 void writeTo(uint8_t *buf) override;
anatofuz
parents:
diff changeset
78
anatofuz
parents:
diff changeset
79 size_t getSize() const override { return 4; }
anatofuz
parents:
diff changeset
80
anatofuz
parents:
diff changeset
81 // Get the virtual address of the branch instruction at patcheeOffset.
anatofuz
parents:
diff changeset
82 uint64_t getBranchAddr() const;
anatofuz
parents:
diff changeset
83
anatofuz
parents:
diff changeset
84 static bool classof(const SectionBase *d) {
anatofuz
parents:
diff changeset
85 return d->kind() == InputSectionBase::Synthetic && d->name ==".text.patch";
anatofuz
parents:
diff changeset
86 }
anatofuz
parents:
diff changeset
87
anatofuz
parents:
diff changeset
88 // The Section we are patching.
anatofuz
parents:
diff changeset
89 const InputSection *patchee;
anatofuz
parents:
diff changeset
90 // The offset of the instruction in the Patchee section we are patching.
anatofuz
parents:
diff changeset
91 uint64_t patcheeOffset;
anatofuz
parents:
diff changeset
92 // A label for the start of the Patch that we can use as a relocation target.
anatofuz
parents:
diff changeset
93 Symbol *patchSym;
anatofuz
parents:
diff changeset
94 // A decoding of the branch instruction at patcheeOffset.
anatofuz
parents:
diff changeset
95 uint32_t instr;
anatofuz
parents:
diff changeset
96 // True If the patch is to be written in ARM state, otherwise the patch will
anatofuz
parents:
diff changeset
97 // be written in Thumb state.
anatofuz
parents:
diff changeset
98 bool isARM;
anatofuz
parents:
diff changeset
99 };
anatofuz
parents:
diff changeset
100
anatofuz
parents:
diff changeset
// Return true if the half-word, when taken as the first of a pair of halfwords
// is the first half of a 32-bit instruction.
// Reference from ARM Architecture Reference Manual ARMv7-A and ARMv7-R edition
// section A6.3: 32-bit Thumb instruction encoding
// |             HW1                   |               HW2                |
// | 1 1 1 | op1 (2) | op2 (7) | x (4) |op|           x (15)              |
// With op1 == 0b00, a 16-bit instruction is encoded.
//
// We test only the first halfword, looking for the 0b111 prefix in bits
// [15:13] and op1 (bits [12:11]) != 0b00.
static bool is32bitInstruction(uint16_t hw) {
  return (hw & 0xe000) == 0xe000 && (hw & 0x1800) != 0x0000;
}
anatofuz
parents:
diff changeset
113
anatofuz
parents:
diff changeset
// Reference from ARM Architecture Reference Manual ARMv7-A and ARMv7-R edition
// section A6.3.4 Branches and miscellaneous control.
// |             HW1              |               HW2                |
// | 1 1 1 | 1 0 | op (7) | x (4) | 1 | op1 (3) | op2 (4) | imm8 (8) |
// op1 == 0x0 op != x111xxx | Conditional branch (Bcc.W)
// op1 == 0x1               | Branch (B.W)
// op1 == 1x0               | Branch with Link and Exchange (BLX.w)
// op1 == 1x1               | Branch with Link (BL.W)
//
// In the predicates below instr holds HW1 in its upper 16 bits and HW2 in its
// lower 16 bits. The mask 0xf800d000 selects the fixed 0b11110 prefix of HW1
// together with bits 15, 14 and 12 of HW2.

// Return true if instr is a Thumb-2 conditional branch (Bcc.W). The second
// test rejects encodings whose op field matches x111xxx, which are not
// conditional branches.
static bool isBcc(uint32_t instr) {
  return (instr & 0xf800d000) == 0xf0008000 &&
         (instr & 0x03800000) != 0x03800000;
}
anatofuz
parents:
diff changeset
127
anatofuz
parents:
diff changeset
// Return true if instr (HW1 in the upper 16 bits, HW2 in the lower 16 bits) is
// a Thumb-2 unconditional branch (B.W): HW2 bits 15, 14, 12 == 1, 0, 1.
static bool isB(uint32_t instr) { return (instr & 0xf800d000) == 0xf0009000; }
anatofuz
parents:
diff changeset
129
anatofuz
parents:
diff changeset
// Return true if instr (HW1 in the upper 16 bits, HW2 in the lower 16 bits) is
// a Thumb-2 Branch with Link and Exchange (BLX): HW2 bits 15, 14, 12 == 1, 1, 0.
static bool isBLX(uint32_t instr) { return (instr & 0xf800d000) == 0xf000c000; }
anatofuz
parents:
diff changeset
131
anatofuz
parents:
diff changeset
// Return true if instr (HW1 in the upper 16 bits, HW2 in the lower 16 bits) is
// a Thumb-2 Branch with Link (BL): HW2 bits 15, 14, 12 == 1, 1, 1.
static bool isBL(uint32_t instr) { return (instr & 0xf800d000) == 0xf000d000; }
anatofuz
parents:
diff changeset
133
anatofuz
parents:
diff changeset
134 static bool is32bitBranch(uint32_t instr) {
anatofuz
parents:
diff changeset
135 return isBcc(instr) || isB(instr) || isBL(instr) || isBLX(instr);
anatofuz
parents:
diff changeset
136 }
anatofuz
parents:
diff changeset
137
anatofuz
parents:
diff changeset
138 Patch657417Section::Patch657417Section(InputSection *p, uint64_t off,
anatofuz
parents:
diff changeset
139 uint32_t instr, bool isARM)
anatofuz
parents:
diff changeset
140 : SyntheticSection(SHF_ALLOC | SHF_EXECINSTR, SHT_PROGBITS, 4,
anatofuz
parents:
diff changeset
141 ".text.patch"),
anatofuz
parents:
diff changeset
142 patchee(p), patcheeOffset(off), instr(instr), isARM(isARM) {
anatofuz
parents:
diff changeset
143 parent = p->getParent();
anatofuz
parents:
diff changeset
144 patchSym = addSyntheticLocal(
anatofuz
parents:
diff changeset
145 saver.save("__CortexA8657417_" + utohexstr(getBranchAddr())), STT_FUNC,
anatofuz
parents:
diff changeset
146 isARM ? 0 : 1, getSize(), *this);
anatofuz
parents:
diff changeset
147 addSyntheticLocal(saver.save(isARM ? "$a" : "$t"), STT_NOTYPE, 0, 0, *this);
anatofuz
parents:
diff changeset
148 }
anatofuz
parents:
diff changeset
149
anatofuz
parents:
diff changeset
150 uint64_t Patch657417Section::getBranchAddr() const {
anatofuz
parents:
diff changeset
151 return patchee->getVA(patcheeOffset);
anatofuz
parents:
diff changeset
152 }
anatofuz
parents:
diff changeset
153
anatofuz
parents:
diff changeset
154 // Given a branch instruction instr at sourceAddr work out its destination
anatofuz
parents:
diff changeset
155 // address. This is only used when the branch instruction has no relocation.
anatofuz
parents:
diff changeset
156 static uint64_t getThumbDestAddr(uint64_t sourceAddr, uint32_t instr) {
anatofuz
parents:
diff changeset
157 uint8_t buf[4];
anatofuz
parents:
diff changeset
158 write16le(buf, instr >> 16);
anatofuz
parents:
diff changeset
159 write16le(buf + 2, instr & 0x0000ffff);
anatofuz
parents:
diff changeset
160 int64_t offset;
anatofuz
parents:
diff changeset
161 if (isBcc(instr))
anatofuz
parents:
diff changeset
162 offset = target->getImplicitAddend(buf, R_ARM_THM_JUMP19);
anatofuz
parents:
diff changeset
163 else if (isB(instr))
anatofuz
parents:
diff changeset
164 offset = target->getImplicitAddend(buf, R_ARM_THM_JUMP24);
anatofuz
parents:
diff changeset
165 else
anatofuz
parents:
diff changeset
166 offset = target->getImplicitAddend(buf, R_ARM_THM_CALL);
anatofuz
parents:
diff changeset
167 return sourceAddr + offset + 4;
anatofuz
parents:
diff changeset
168 }
anatofuz
parents:
diff changeset
169
anatofuz
parents:
diff changeset
170 void Patch657417Section::writeTo(uint8_t *buf) {
anatofuz
parents:
diff changeset
171 // The base instruction of the patch is always a 32-bit unconditional branch.
anatofuz
parents:
diff changeset
172 if (isARM)
anatofuz
parents:
diff changeset
173 write32le(buf, 0xea000000);
anatofuz
parents:
diff changeset
174 else
anatofuz
parents:
diff changeset
175 write32le(buf, 0x9000f000);
anatofuz
parents:
diff changeset
176 // If we have a relocation then apply it. For a SyntheticSection buf already
anatofuz
parents:
diff changeset
177 // has outSecOff added, but relocateAlloc also adds outSecOff so we need to
anatofuz
parents:
diff changeset
178 // subtract to avoid double counting.
anatofuz
parents:
diff changeset
179 if (!relocations.empty()) {
anatofuz
parents:
diff changeset
180 relocateAlloc(buf - outSecOff, buf - outSecOff + getSize());
anatofuz
parents:
diff changeset
181 return;
anatofuz
parents:
diff changeset
182 }
anatofuz
parents:
diff changeset
183
anatofuz
parents:
diff changeset
184 // If we don't have a relocation then we must calculate and write the offset
anatofuz
parents:
diff changeset
185 // ourselves.
anatofuz
parents:
diff changeset
186 // Get the destination offset from the addend in the branch instruction.
anatofuz
parents:
diff changeset
187 // We cannot use the instruction in the patchee section as this will have
anatofuz
parents:
diff changeset
188 // been altered to point to us!
anatofuz
parents:
diff changeset
189 uint64_t s = getThumbDestAddr(getBranchAddr(), instr);
anatofuz
parents:
diff changeset
190 uint64_t p = getVA(4);
anatofuz
parents:
diff changeset
191 target->relocateNoSym(buf, isARM ? R_ARM_JUMP24 : R_ARM_THM_JUMP24, s - p);
anatofuz
parents:
diff changeset
192 }
anatofuz
parents:
diff changeset
193
anatofuz
parents:
diff changeset
194 // Given a branch instruction spanning two 4KiB regions, at offset off from the
anatofuz
parents:
diff changeset
195 // start of isec, return true if the destination of the branch is within the
anatofuz
parents:
diff changeset
196 // first of the two 4Kib regions.
anatofuz
parents:
diff changeset
197 static bool branchDestInFirstRegion(const InputSection *isec, uint64_t off,
anatofuz
parents:
diff changeset
198 uint32_t instr, const Relocation *r) {
anatofuz
parents:
diff changeset
199 uint64_t sourceAddr = isec->getVA(0) + off;
anatofuz
parents:
diff changeset
200 assert((sourceAddr & 0xfff) == 0xffe);
anatofuz
parents:
diff changeset
201 uint64_t destAddr = sourceAddr;
anatofuz
parents:
diff changeset
202 // If there is a branch relocation at the same offset we must use this to
anatofuz
parents:
diff changeset
203 // find the destination address as the branch could be indirected via a thunk
anatofuz
parents:
diff changeset
204 // or the PLT.
anatofuz
parents:
diff changeset
205 if (r) {
anatofuz
parents:
diff changeset
206 uint64_t dst = (r->expr == R_PLT_PC) ? r->sym->getPltVA() : r->sym->getVA();
anatofuz
parents:
diff changeset
207 // Account for Thumb PC bias, usually cancelled to 0 by addend of -4.
anatofuz
parents:
diff changeset
208 destAddr = dst + r->addend + 4;
anatofuz
parents:
diff changeset
209 } else {
anatofuz
parents:
diff changeset
210 // If there is no relocation, we must have an intra-section branch
anatofuz
parents:
diff changeset
211 // We must extract the offset from the addend manually.
anatofuz
parents:
diff changeset
212 destAddr = getThumbDestAddr(sourceAddr, instr);
anatofuz
parents:
diff changeset
213 }
anatofuz
parents:
diff changeset
214
anatofuz
parents:
diff changeset
215 return (destAddr & 0xfffff000) == (sourceAddr & 0xfffff000);
anatofuz
parents:
diff changeset
216 }
anatofuz
parents:
diff changeset
217
anatofuz
parents:
diff changeset
218 // Return true if a branch can reach a patch section placed after isec.
anatofuz
parents:
diff changeset
219 // The Bcc.w instruction has a range of 1 MiB, all others have 16 MiB.
anatofuz
parents:
diff changeset
220 static bool patchInRange(const InputSection *isec, uint64_t off,
anatofuz
parents:
diff changeset
221 uint32_t instr) {
anatofuz
parents:
diff changeset
222
anatofuz
parents:
diff changeset
223 // We need the branch at source to reach a patch section placed immediately
anatofuz
parents:
diff changeset
224 // after isec. As there can be more than one patch in the patch section we
anatofuz
parents:
diff changeset
225 // add 0x100 as contingency to account for worst case of 1 branch every 4KiB
anatofuz
parents:
diff changeset
226 // for a 1 MiB range.
anatofuz
parents:
diff changeset
227 return target->inBranchRange(
anatofuz
parents:
diff changeset
228 isBcc(instr) ? R_ARM_THM_JUMP19 : R_ARM_THM_JUMP24, isec->getVA(off),
anatofuz
parents:
diff changeset
229 isec->getVA() + isec->getSize() + 0x100);
anatofuz
parents:
diff changeset
230 }
anatofuz
parents:
diff changeset
231
anatofuz
parents:
diff changeset
232 struct ScanResult {
anatofuz
parents:
diff changeset
233 // Offset of branch within its InputSection.
anatofuz
parents:
diff changeset
234 uint64_t off;
anatofuz
parents:
diff changeset
235 // Cached decoding of the branch instruction.
anatofuz
parents:
diff changeset
236 uint32_t instr;
anatofuz
parents:
diff changeset
237 // Branch relocation at off. Will be nullptr if no relocation exists.
anatofuz
parents:
diff changeset
238 Relocation *rel;
anatofuz
parents:
diff changeset
239 };
anatofuz
parents:
diff changeset
240
anatofuz
parents:
diff changeset
241 // Detect the erratum sequence, returning the offset of the branch instruction
anatofuz
parents:
diff changeset
242 // and a decoding of the branch. If the erratum sequence is not found then
anatofuz
parents:
diff changeset
243 // return an offset of 0 for the branch. 0 is a safe value to use for no patch
anatofuz
parents:
diff changeset
244 // as there must be at least one 32-bit non-branch instruction before the
anatofuz
parents:
diff changeset
245 // branch so the minimum offset for a patch is 4.
anatofuz
parents:
diff changeset
246 static ScanResult scanCortexA8Errata657417(InputSection *isec, uint64_t &off,
anatofuz
parents:
diff changeset
247 uint64_t limit) {
anatofuz
parents:
diff changeset
248 uint64_t isecAddr = isec->getVA(0);
anatofuz
parents:
diff changeset
249 // Advance Off so that (isecAddr + off) modulo 0x1000 is at least 0xffa. We
anatofuz
parents:
diff changeset
250 // need to check for a 32-bit instruction immediately before a 32-bit branch
anatofuz
parents:
diff changeset
251 // at 0xffe modulo 0x1000.
anatofuz
parents:
diff changeset
252 off = alignTo(isecAddr + off, 0x1000, 0xffa) - isecAddr;
anatofuz
parents:
diff changeset
253 if (off >= limit || limit - off < 8) {
anatofuz
parents:
diff changeset
254 // Need at least 2 4-byte sized instructions to trigger erratum.
anatofuz
parents:
diff changeset
255 off = limit;
anatofuz
parents:
diff changeset
256 return {0, 0, nullptr};
anatofuz
parents:
diff changeset
257 }
anatofuz
parents:
diff changeset
258
anatofuz
parents:
diff changeset
259 ScanResult scanRes = {0, 0, nullptr};
anatofuz
parents:
diff changeset
260 const uint8_t *buf = isec->data().begin();
anatofuz
parents:
diff changeset
261 // ARMv7-A Thumb 32-bit instructions are encoded 2 consecutive
anatofuz
parents:
diff changeset
262 // little-endian halfwords.
anatofuz
parents:
diff changeset
263 const ulittle16_t *instBuf = reinterpret_cast<const ulittle16_t *>(buf + off);
anatofuz
parents:
diff changeset
264 uint16_t hw11 = *instBuf++;
anatofuz
parents:
diff changeset
265 uint16_t hw12 = *instBuf++;
anatofuz
parents:
diff changeset
266 uint16_t hw21 = *instBuf++;
anatofuz
parents:
diff changeset
267 uint16_t hw22 = *instBuf++;
anatofuz
parents:
diff changeset
268 if (is32bitInstruction(hw11) && is32bitInstruction(hw21)) {
anatofuz
parents:
diff changeset
269 uint32_t instr1 = (hw11 << 16) | hw12;
anatofuz
parents:
diff changeset
270 uint32_t instr2 = (hw21 << 16) | hw22;
anatofuz
parents:
diff changeset
271 if (!is32bitBranch(instr1) && is32bitBranch(instr2)) {
anatofuz
parents:
diff changeset
272 // Find a relocation for the branch if it exists. This will be used
anatofuz
parents:
diff changeset
273 // to determine the target.
anatofuz
parents:
diff changeset
274 uint64_t branchOff = off + 4;
anatofuz
parents:
diff changeset
275 auto relIt = llvm::find_if(isec->relocations, [=](const Relocation &r) {
anatofuz
parents:
diff changeset
276 return r.offset == branchOff &&
anatofuz
parents:
diff changeset
277 (r.type == R_ARM_THM_JUMP19 || r.type == R_ARM_THM_JUMP24 ||
anatofuz
parents:
diff changeset
278 r.type == R_ARM_THM_CALL);
anatofuz
parents:
diff changeset
279 });
anatofuz
parents:
diff changeset
280 if (relIt != isec->relocations.end())
anatofuz
parents:
diff changeset
281 scanRes.rel = &(*relIt);
anatofuz
parents:
diff changeset
282 if (branchDestInFirstRegion(isec, branchOff, instr2, scanRes.rel)) {
anatofuz
parents:
diff changeset
283 if (patchInRange(isec, branchOff, instr2)) {
anatofuz
parents:
diff changeset
284 scanRes.off = branchOff;
anatofuz
parents:
diff changeset
285 scanRes.instr = instr2;
anatofuz
parents:
diff changeset
286 } else {
anatofuz
parents:
diff changeset
287 warn(toString(isec->file) +
anatofuz
parents:
diff changeset
288 ": skipping cortex-a8 657417 erratum sequence, section " +
anatofuz
parents:
diff changeset
289 isec->name + " is too large to patch");
anatofuz
parents:
diff changeset
290 }
anatofuz
parents:
diff changeset
291 }
anatofuz
parents:
diff changeset
292 }
anatofuz
parents:
diff changeset
293 }
anatofuz
parents:
diff changeset
294 off += 0x1000;
anatofuz
parents:
diff changeset
295 return scanRes;
anatofuz
parents:
diff changeset
296 }
anatofuz
parents:
diff changeset
297
anatofuz
parents:
diff changeset
298 void ARMErr657417Patcher::init() {
anatofuz
parents:
diff changeset
299 // The Arm ABI permits a mix of ARM, Thumb and Data in the same
anatofuz
parents:
diff changeset
300 // InputSection. We must only scan Thumb instructions to avoid false
anatofuz
parents:
diff changeset
301 // matches. We use the mapping symbols in the InputObjects to identify this
anatofuz
parents:
diff changeset
302 // data, caching the results in sectionMap so we don't have to recalculate
anatofuz
parents:
diff changeset
303 // it each pass.
anatofuz
parents:
diff changeset
304
anatofuz
parents:
diff changeset
305 // The ABI Section 4.5.5 Mapping symbols; defines local symbols that describe
anatofuz
parents:
diff changeset
306 // half open intervals [Symbol Value, Next Symbol Value) of code and data
anatofuz
parents:
diff changeset
307 // within sections. If there is no next symbol then the half open interval is
anatofuz
parents:
diff changeset
308 // [Symbol Value, End of section). The type, code or data, is determined by
anatofuz
parents:
diff changeset
309 // the mapping symbol name, $a for Arm code, $t for Thumb code, $d for data.
anatofuz
parents:
diff changeset
310 auto isArmMapSymbol = [](const Symbol *s) {
anatofuz
parents:
diff changeset
311 return s->getName() == "$a" || s->getName().startswith("$a.");
anatofuz
parents:
diff changeset
312 };
anatofuz
parents:
diff changeset
313 auto isThumbMapSymbol = [](const Symbol *s) {
anatofuz
parents:
diff changeset
314 return s->getName() == "$t" || s->getName().startswith("$t.");
anatofuz
parents:
diff changeset
315 };
anatofuz
parents:
diff changeset
316 auto isDataMapSymbol = [](const Symbol *s) {
anatofuz
parents:
diff changeset
317 return s->getName() == "$d" || s->getName().startswith("$d.");
anatofuz
parents:
diff changeset
318 };
anatofuz
parents:
diff changeset
319
anatofuz
parents:
diff changeset
320 // Collect mapping symbols for every executable InputSection.
anatofuz
parents:
diff changeset
321 for (InputFile *file : objectFiles) {
anatofuz
parents:
diff changeset
322 auto *f = cast<ObjFile<ELF32LE>>(file);
anatofuz
parents:
diff changeset
323 for (Symbol *s : f->getLocalSymbols()) {
anatofuz
parents:
diff changeset
324 auto *def = dyn_cast<Defined>(s);
anatofuz
parents:
diff changeset
325 if (!def)
anatofuz
parents:
diff changeset
326 continue;
anatofuz
parents:
diff changeset
327 if (!isArmMapSymbol(def) && !isThumbMapSymbol(def) &&
anatofuz
parents:
diff changeset
328 !isDataMapSymbol(def))
anatofuz
parents:
diff changeset
329 continue;
anatofuz
parents:
diff changeset
330 if (auto *sec = dyn_cast_or_null<InputSection>(def->section))
anatofuz
parents:
diff changeset
331 if (sec->flags & SHF_EXECINSTR)
anatofuz
parents:
diff changeset
332 sectionMap[sec].push_back(def);
anatofuz
parents:
diff changeset
333 }
anatofuz
parents:
diff changeset
334 }
anatofuz
parents:
diff changeset
335 // For each InputSection make sure the mapping symbols are in sorted in
anatofuz
parents:
diff changeset
336 // ascending order and are in alternating Thumb, non-Thumb order.
anatofuz
parents:
diff changeset
337 for (auto &kv : sectionMap) {
anatofuz
parents:
diff changeset
338 std::vector<const Defined *> &mapSyms = kv.second;
anatofuz
parents:
diff changeset
339 llvm::stable_sort(mapSyms, [](const Defined *a, const Defined *b) {
anatofuz
parents:
diff changeset
340 return a->value < b->value;
anatofuz
parents:
diff changeset
341 });
anatofuz
parents:
diff changeset
342 mapSyms.erase(std::unique(mapSyms.begin(), mapSyms.end(),
anatofuz
parents:
diff changeset
343 [=](const Defined *a, const Defined *b) {
anatofuz
parents:
diff changeset
344 return (isThumbMapSymbol(a) ==
anatofuz
parents:
diff changeset
345 isThumbMapSymbol(b));
anatofuz
parents:
diff changeset
346 }),
anatofuz
parents:
diff changeset
347 mapSyms.end());
anatofuz
parents:
diff changeset
348 // Always start with a Thumb Mapping Symbol
anatofuz
parents:
diff changeset
349 if (!mapSyms.empty() && !isThumbMapSymbol(mapSyms.front()))
anatofuz
parents:
diff changeset
350 mapSyms.erase(mapSyms.begin());
anatofuz
parents:
diff changeset
351 }
anatofuz
parents:
diff changeset
352 initialized = true;
anatofuz
parents:
diff changeset
353 }
anatofuz
parents:
diff changeset
354
anatofuz
parents:
diff changeset
355 void ARMErr657417Patcher::insertPatches(
anatofuz
parents:
diff changeset
356 InputSectionDescription &isd, std::vector<Patch657417Section *> &patches) {
anatofuz
parents:
diff changeset
357 uint64_t spacing = 0x100000 - 0x7500;
anatofuz
parents:
diff changeset
358 uint64_t isecLimit;
anatofuz
parents:
diff changeset
359 uint64_t prevIsecLimit = isd.sections.front()->outSecOff;
anatofuz
parents:
diff changeset
360 uint64_t patchUpperBound = prevIsecLimit + spacing;
anatofuz
parents:
diff changeset
361 uint64_t outSecAddr = isd.sections.front()->getParent()->addr;
anatofuz
parents:
diff changeset
362
anatofuz
parents:
diff changeset
363 // Set the outSecOff of patches to the place where we want to insert them.
anatofuz
parents:
diff changeset
364 // We use a similar strategy to initial thunk placement, using 1 MiB as the
anatofuz
parents:
diff changeset
365 // range of the Thumb-2 conditional branch with a contingency accounting for
anatofuz
parents:
diff changeset
366 // thunk generation.
anatofuz
parents:
diff changeset
367 auto patchIt = patches.begin();
anatofuz
parents:
diff changeset
368 auto patchEnd = patches.end();
anatofuz
parents:
diff changeset
369 for (const InputSection *isec : isd.sections) {
anatofuz
parents:
diff changeset
370 isecLimit = isec->outSecOff + isec->getSize();
anatofuz
parents:
diff changeset
371 if (isecLimit > patchUpperBound) {
anatofuz
parents:
diff changeset
372 for (; patchIt != patchEnd; ++patchIt) {
anatofuz
parents:
diff changeset
373 if ((*patchIt)->getBranchAddr() - outSecAddr >= prevIsecLimit)
anatofuz
parents:
diff changeset
374 break;
anatofuz
parents:
diff changeset
375 (*patchIt)->outSecOff = prevIsecLimit;
anatofuz
parents:
diff changeset
376 }
anatofuz
parents:
diff changeset
377 patchUpperBound = prevIsecLimit + spacing;
anatofuz
parents:
diff changeset
378 }
anatofuz
parents:
diff changeset
379 prevIsecLimit = isecLimit;
anatofuz
parents:
diff changeset
380 }
anatofuz
parents:
diff changeset
381 for (; patchIt != patchEnd; ++patchIt)
anatofuz
parents:
diff changeset
382 (*patchIt)->outSecOff = isecLimit;
anatofuz
parents:
diff changeset
383
anatofuz
parents:
diff changeset
384 // Merge all patch sections. We use the outSecOff assigned above to
anatofuz
parents:
diff changeset
385 // determine the insertion point. This is ok as we only merge into an
anatofuz
parents:
diff changeset
386 // InputSectionDescription once per pass, and at the end of the pass
anatofuz
parents:
diff changeset
387 // assignAddresses() will recalculate all the outSecOff values.
anatofuz
parents:
diff changeset
388 std::vector<InputSection *> tmp;
anatofuz
parents:
diff changeset
389 tmp.reserve(isd.sections.size() + patches.size());
anatofuz
parents:
diff changeset
390 auto mergeCmp = [](const InputSection *a, const InputSection *b) {
anatofuz
parents:
diff changeset
391 if (a->outSecOff != b->outSecOff)
anatofuz
parents:
diff changeset
392 return a->outSecOff < b->outSecOff;
anatofuz
parents:
diff changeset
393 return isa<Patch657417Section>(a) && !isa<Patch657417Section>(b);
anatofuz
parents:
diff changeset
394 };
anatofuz
parents:
diff changeset
395 std::merge(isd.sections.begin(), isd.sections.end(), patches.begin(),
anatofuz
parents:
diff changeset
396 patches.end(), std::back_inserter(tmp), mergeCmp);
anatofuz
parents:
diff changeset
397 isd.sections = std::move(tmp);
anatofuz
parents:
diff changeset
398 }
anatofuz
parents:
diff changeset
399
anatofuz
parents:
diff changeset
400 // Given a branch instruction described by ScanRes redirect it to a patch
anatofuz
parents:
diff changeset
401 // section containing an unconditional branch instruction to the target.
anatofuz
parents:
diff changeset
402 // Ensure that this patch section is 4-byte aligned so that the branch cannot
anatofuz
parents:
diff changeset
403 // span two 4 KiB regions. Place the patch section so that it is always after
anatofuz
parents:
diff changeset
404 // isec so the branch we are patching always goes forwards.
anatofuz
parents:
diff changeset
405 static void implementPatch(ScanResult sr, InputSection *isec,
anatofuz
parents:
diff changeset
406 std::vector<Patch657417Section *> &patches) {
anatofuz
parents:
diff changeset
407
anatofuz
parents:
diff changeset
408 log("detected cortex-a8-657419 erratum sequence starting at " +
anatofuz
parents:
diff changeset
409 utohexstr(isec->getVA(sr.off)) + " in unpatched output.");
anatofuz
parents:
diff changeset
410 Patch657417Section *psec;
anatofuz
parents:
diff changeset
411 // We have two cases to deal with.
anatofuz
parents:
diff changeset
412 // Case 1. There is a relocation at patcheeOffset to a symbol. The
anatofuz
parents:
diff changeset
413 // unconditional branch in the patch must have a relocation so that any
anatofuz
parents:
diff changeset
414 // further redirection via the PLT or a Thunk happens as normal. At
anatofuz
parents:
diff changeset
415 // patcheeOffset we redirect the existing relocation to a Symbol defined at
anatofuz
parents:
diff changeset
416 // the start of the patch section.
anatofuz
parents:
diff changeset
417 //
anatofuz
parents:
diff changeset
418 // Case 2. There is no relocation at patcheeOffset. We are unlikely to have
anatofuz
parents:
diff changeset
419 // a symbol that we can use as a target for a relocation in the patch section.
anatofuz
parents:
diff changeset
420 // Luckily we know that the destination cannot be indirected via the PLT or
anatofuz
parents:
diff changeset
421 // a Thunk so we can just write the destination directly.
anatofuz
parents:
diff changeset
422 if (sr.rel) {
anatofuz
parents:
diff changeset
423 // Case 1. We have an existing relocation to redirect to patch and a
anatofuz
parents:
diff changeset
424 // Symbol target.
anatofuz
parents:
diff changeset
425
anatofuz
parents:
diff changeset
426 // Create a branch relocation for the unconditional branch in the patch.
anatofuz
parents:
diff changeset
427 // This can be redirected via the PLT or Thunks.
anatofuz
parents:
diff changeset
428 RelType patchRelType = R_ARM_THM_JUMP24;
anatofuz
parents:
diff changeset
429 int64_t patchRelAddend = sr.rel->addend;
anatofuz
parents:
diff changeset
430 bool destIsARM = false;
anatofuz
parents:
diff changeset
431 if (isBL(sr.instr) || isBLX(sr.instr)) {
anatofuz
parents:
diff changeset
432 // The final target of the branch may be ARM or Thumb, if the target
anatofuz
parents:
diff changeset
433 // is ARM then we write the patch in ARM state to avoid a state change
anatofuz
parents:
diff changeset
434 // Thunk from the patch to the target.
anatofuz
parents:
diff changeset
435 uint64_t dstSymAddr = (sr.rel->expr == R_PLT_PC) ? sr.rel->sym->getPltVA()
anatofuz
parents:
diff changeset
436 : sr.rel->sym->getVA();
anatofuz
parents:
diff changeset
437 destIsARM = (dstSymAddr & 1) == 0;
anatofuz
parents:
diff changeset
438 }
anatofuz
parents:
diff changeset
439 psec = make<Patch657417Section>(isec, sr.off, sr.instr, destIsARM);
anatofuz
parents:
diff changeset
440 if (destIsARM) {
anatofuz
parents:
diff changeset
441 // The patch will be in ARM state. Use an ARM relocation and account for
anatofuz
parents:
diff changeset
442 // the larger ARM PC-bias of 8 rather than Thumb's 4.
anatofuz
parents:
diff changeset
443 patchRelType = R_ARM_JUMP24;
anatofuz
parents:
diff changeset
444 patchRelAddend -= 4;
anatofuz
parents:
diff changeset
445 }
anatofuz
parents:
diff changeset
446 psec->relocations.push_back(
anatofuz
parents:
diff changeset
447 Relocation{sr.rel->expr, patchRelType, 0, patchRelAddend, sr.rel->sym});
anatofuz
parents:
diff changeset
448 // Redirect the existing branch relocation to the patch.
anatofuz
parents:
diff changeset
449 sr.rel->expr = R_PC;
anatofuz
parents:
diff changeset
450 sr.rel->addend = -4;
anatofuz
parents:
diff changeset
451 sr.rel->sym = psec->patchSym;
anatofuz
parents:
diff changeset
452 } else {
anatofuz
parents:
diff changeset
453 // Case 2. We do not have a relocation to the patch. Add a relocation of the
anatofuz
parents:
diff changeset
454 // appropriate type to the patch at patcheeOffset.
anatofuz
parents:
diff changeset
455
anatofuz
parents:
diff changeset
456 // The destination is ARM if we have a BLX.
anatofuz
parents:
diff changeset
457 psec = make<Patch657417Section>(isec, sr.off, sr.instr, isBLX(sr.instr));
anatofuz
parents:
diff changeset
458 RelType type;
anatofuz
parents:
diff changeset
459 if (isBcc(sr.instr))
anatofuz
parents:
diff changeset
460 type = R_ARM_THM_JUMP19;
anatofuz
parents:
diff changeset
461 else if (isB(sr.instr))
anatofuz
parents:
diff changeset
462 type = R_ARM_THM_JUMP24;
anatofuz
parents:
diff changeset
463 else
anatofuz
parents:
diff changeset
464 type = R_ARM_THM_CALL;
anatofuz
parents:
diff changeset
465 isec->relocations.push_back(
anatofuz
parents:
diff changeset
466 Relocation{R_PC, type, sr.off, -4, psec->patchSym});
anatofuz
parents:
diff changeset
467 }
anatofuz
parents:
diff changeset
468 patches.push_back(psec);
anatofuz
parents:
diff changeset
469 }
anatofuz
parents:
diff changeset
470
anatofuz
parents:
diff changeset
471 // Scan all the instructions in InputSectionDescription, for each instance of
anatofuz
parents:
diff changeset
472 // the erratum sequence create a Patch657417Section. We return the list of
anatofuz
parents:
diff changeset
473 // Patch657417Sections that need to be applied to the InputSectionDescription.
anatofuz
parents:
diff changeset
474 std::vector<Patch657417Section *>
anatofuz
parents:
diff changeset
475 ARMErr657417Patcher::patchInputSectionDescription(
anatofuz
parents:
diff changeset
476 InputSectionDescription &isd) {
anatofuz
parents:
diff changeset
477 std::vector<Patch657417Section *> patches;
anatofuz
parents:
diff changeset
478 for (InputSection *isec : isd.sections) {
anatofuz
parents:
diff changeset
479 // LLD doesn't use the erratum sequence in SyntheticSections.
anatofuz
parents:
diff changeset
480 if (isa<SyntheticSection>(isec))
anatofuz
parents:
diff changeset
481 continue;
anatofuz
parents:
diff changeset
482 // Use sectionMap to make sure we only scan Thumb code and not Arm or inline
anatofuz
parents:
diff changeset
483 // data. We have already sorted mapSyms in ascending order and removed
anatofuz
parents:
diff changeset
484 // consecutive mapping symbols of the same type. Our range of executable
anatofuz
parents:
diff changeset
485 // instructions to scan is therefore [thumbSym->value, nonThumbSym->value)
anatofuz
parents:
diff changeset
486 // or [thumbSym->value, section size).
anatofuz
parents:
diff changeset
487 std::vector<const Defined *> &mapSyms = sectionMap[isec];
anatofuz
parents:
diff changeset
488
anatofuz
parents:
diff changeset
489 auto thumbSym = mapSyms.begin();
anatofuz
parents:
diff changeset
490 while (thumbSym != mapSyms.end()) {
anatofuz
parents:
diff changeset
491 auto nonThumbSym = std::next(thumbSym);
anatofuz
parents:
diff changeset
492 uint64_t off = (*thumbSym)->value;
anatofuz
parents:
diff changeset
493 uint64_t limit = (nonThumbSym == mapSyms.end()) ? isec->data().size()
anatofuz
parents:
diff changeset
494 : (*nonThumbSym)->value;
anatofuz
parents:
diff changeset
495
anatofuz
parents:
diff changeset
496 while (off < limit) {
anatofuz
parents:
diff changeset
497 ScanResult sr = scanCortexA8Errata657417(isec, off, limit);
anatofuz
parents:
diff changeset
498 if (sr.off)
anatofuz
parents:
diff changeset
499 implementPatch(sr, isec, patches);
anatofuz
parents:
diff changeset
500 }
anatofuz
parents:
diff changeset
501 if (nonThumbSym == mapSyms.end())
anatofuz
parents:
diff changeset
502 break;
anatofuz
parents:
diff changeset
503 thumbSym = std::next(nonThumbSym);
anatofuz
parents:
diff changeset
504 }
anatofuz
parents:
diff changeset
505 }
anatofuz
parents:
diff changeset
506 return patches;
anatofuz
parents:
diff changeset
507 }
anatofuz
parents:
diff changeset
508
anatofuz
parents:
diff changeset
509 bool ARMErr657417Patcher::createFixes() {
anatofuz
parents:
diff changeset
510 if (!initialized)
anatofuz
parents:
diff changeset
511 init();
anatofuz
parents:
diff changeset
512
anatofuz
parents:
diff changeset
513 bool addressesChanged = false;
anatofuz
parents:
diff changeset
514 for (OutputSection *os : outputSections) {
anatofuz
parents:
diff changeset
515 if (!(os->flags & SHF_ALLOC) || !(os->flags & SHF_EXECINSTR))
anatofuz
parents:
diff changeset
516 continue;
anatofuz
parents:
diff changeset
517 for (BaseCommand *bc : os->sectionCommands)
anatofuz
parents:
diff changeset
518 if (auto *isd = dyn_cast<InputSectionDescription>(bc)) {
anatofuz
parents:
diff changeset
519 std::vector<Patch657417Section *> patches =
anatofuz
parents:
diff changeset
520 patchInputSectionDescription(*isd);
anatofuz
parents:
diff changeset
521 if (!patches.empty()) {
anatofuz
parents:
diff changeset
522 insertPatches(*isd, patches);
anatofuz
parents:
diff changeset
523 addressesChanged = true;
anatofuz
parents:
diff changeset
524 }
anatofuz
parents:
diff changeset
525 }
anatofuz
parents:
diff changeset
526 }
anatofuz
parents:
diff changeset
527 return addressesChanged;
anatofuz
parents:
diff changeset
528 }