//===- ARMErrataFix.cpp ---------------------------------------------------===// // // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. // See https://llvm.org/LICENSE.txt for license information. // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception // //===----------------------------------------------------------------------===// // This file implements Section Patching for the purpose of working around the // Cortex-a8 erratum 657417 "A 32bit branch instruction that spans 2 4K regions // can result in an incorrect instruction fetch or processor deadlock." The // erratum affects all but r1p7, r2p5, r2p6, r3p1 and r3p2 revisions of the // Cortex-A8. A high level description of the patching technique is given in // the opening comment of AArch64ErrataFix.cpp. //===----------------------------------------------------------------------===// #include "ARMErrataFix.h" #include "InputFiles.h" #include "LinkerScript.h" #include "OutputSections.h" #include "Relocations.h" #include "Symbols.h" #include "SyntheticSections.h" #include "Target.h" #include "lld/Common/CommonLinkerContext.h" #include "lld/Common/Strings.h" #include "llvm/Support/Endian.h" #include <algorithm> usingnamespacellvm; usingnamespacellvm::ELF; usingnamespacellvm::object; usingnamespacellvm::support; usingnamespacellvm::support::endian; usingnamespacelld; usingnamespacelld::elf; // The documented title for Erratum 657417 is: // "A 32bit branch instruction that spans two 4K regions can result in an // incorrect instruction fetch or processor deadlock". Graphically using a // 32-bit B.w instruction encoded as a pair of halfwords 0xf7fe 0xbfff // xxxxxx000 // Memory region 1 start // target: // ... // xxxxxxffe f7fe // First halfword of branch to target: // xxxxxx000 // Memory region 2 start // xxxxxx002 bfff // Second halfword of branch to target: // // The specific trigger conditions that can be detected at link time are: // - There is a 32-bit Thumb-2 branch instruction with an address of the form // xxxxxxFFE. The first 2 bytes of the instruction are in 4KiB region 1, the // second 2 bytes are in region 2. // - The branch instruction is one of BLX, BL, B.w BCC.w // - The instruction preceding the branch is a 32-bit non-branch instruction. // - The target of the branch is in region 1. // // The linker mitigation for the fix is to redirect any branch that meets the // erratum conditions to a patch section containing a branch to the target. // // As adding patch sections may move branches onto region boundaries the patch // must iterate until no more patches are added. // // Example, before: // 00000FFA func: NOP.w // 32-bit Thumb function // 00000FFE B.W func // 32-bit branch spanning 2 regions, dest in 1st. // Example, after: // 00000FFA func: NOP.w // 32-bit Thumb function // 00000FFE B.w __CortexA8657417_00000FFE // 00001002 2 - bytes padding // 00001004 __CortexA8657417_00000FFE: B.w func class elf::Patch657417Section final : public SyntheticSection { … }; // Return true if the half-word, when taken as the first of a pair of halfwords // is the first half of a 32-bit instruction. // Reference from ARM Architecture Reference Manual ARMv7-A and ARMv7-R edition // section A6.3: 32-bit Thumb instruction encoding // | HW1 | HW2 | // | 1 1 1 | op1 (2) | op2 (7) | x (4) |op| x (15) | // With op1 == 0b00, a 16-bit instruction is encoded. // // We test only the first halfword, looking for op != 0b00. static bool is32bitInstruction(uint16_t hw) { … } // Reference from ARM Architecture Reference Manual ARMv7-A and ARMv7-R edition // section A6.3.4 Branches and miscellaneous control. // | HW1 | HW2 | // | 1 1 1 | 1 0 | op (7) | x (4) | 1 | op1 (3) | op2 (4) | imm8 (8) | // op1 == 0x0 op != x111xxx | Conditional branch (Bcc.W) // op1 == 0x1 | Branch (B.W) // op1 == 1x0 | Branch with Link and Exchange (BLX.w) // op1 == 1x1 | Branch with Link (BL.W) static bool isBcc(uint32_t instr) { … } static bool isB(uint32_t instr) { … } static bool isBLX(uint32_t instr) { … } static bool isBL(uint32_t instr) { … } static bool is32bitBranch(uint32_t instr) { … } Patch657417Section::Patch657417Section(Ctx &ctx, InputSection *p, uint64_t off, uint32_t instr, bool isARM) : … { … } uint64_t Patch657417Section::getBranchAddr() const { … } // Given a branch instruction instr at sourceAddr work out its destination // address. This is only used when the branch instruction has no relocation. static uint64_t getThumbDestAddr(Ctx &ctx, uint64_t sourceAddr, uint32_t instr) { … } void Patch657417Section::writeTo(uint8_t *buf) { … } // Given a branch instruction spanning two 4KiB regions, at offset off from the // start of isec, return true if the destination of the branch is within the // first of the two 4Kib regions. static bool branchDestInFirstRegion(Ctx &ctx, const InputSection *isec, uint64_t off, uint32_t instr, const Relocation *r) { … } // Return true if a branch can reach a patch section placed after isec. // The Bcc.w instruction has a range of 1 MiB, all others have 16 MiB. static bool patchInRange(Ctx &ctx, const InputSection *isec, uint64_t off, uint32_t instr) { … } struct ScanResult { … }; // Detect the erratum sequence, returning the offset of the branch instruction // and a decoding of the branch. If the erratum sequence is not found then // return an offset of 0 for the branch. 0 is a safe value to use for no patch // as there must be at least one 32-bit non-branch instruction before the // branch so the minimum offset for a patch is 4. static ScanResult scanCortexA8Errata657417(InputSection *isec, uint64_t &off, uint64_t limit) { … } void ARMErr657417Patcher::init() { … } void ARMErr657417Patcher::insertPatches( InputSectionDescription &isd, std::vector<Patch657417Section *> &patches) { … } // Given a branch instruction described by ScanRes redirect it to a patch // section containing an unconditional branch instruction to the target. // Ensure that this patch section is 4-byte aligned so that the branch cannot // span two 4 KiB regions. Place the patch section so that it is always after // isec so the branch we are patching always goes forwards. static void implementPatch(ScanResult sr, InputSection *isec, std::vector<Patch657417Section *> &patches) { … } // Scan all the instructions in InputSectionDescription, for each instance of // the erratum sequence create a Patch657417Section. We return the list of // Patch657417Sections that need to be applied to the InputSectionDescription. std::vector<Patch657417Section *> ARMErr657417Patcher::patchInputSectionDescription( InputSectionDescription &isd) { … } bool ARMErr657417Patcher::createFixes() { … }