[lld-macho][nfc] Refactor to accommodate paired relocs

This is a refactor to pave the way for supporting paired-ADDEND for ARM64. The only paired reloc type for X86_64 is SUBTRACTOR. In a later diff, I will add SUBTRACTOR for both X86_64 and ARM64.

* s/`getImplicitAddend`/`getAddend`/ because it handles all forms of addend: implicit, explicit, paired.
* add predicate `bool isPairedReloc()`
* check range of `relInfo.r_symbolnum` is internal, unrelated to user-input, so use `assert()`, not `error()`
* minor cleanups & rearrangements in `InputFile::parseRelocations()`

Differential Revision: https://reviews.llvm.org/D90614
This commit is contained in:
Greg McGary 2020-10-14 09:49:54 -07:00
parent ed6a135246
commit d4ec3346b1
3 changed files with 54 additions and 25 deletions

View File

@ -25,8 +25,9 @@ namespace {
struct X86_64 : TargetInfo { struct X86_64 : TargetInfo {
X86_64(); X86_64();
uint64_t getImplicitAddend(MemoryBufferRef, const section_64 &, bool isPairedReloc(relocation_info) const override;
const relocation_info &) const override; uint64_t getAddend(MemoryBufferRef, const section_64 &, relocation_info,
relocation_info) const override;
void relocateOne(uint8_t *loc, const Reloc &, uint64_t val) const override; void relocateOne(uint8_t *loc, const Reloc &, uint64_t val) const override;
void writeStub(uint8_t *buf, const macho::Symbol &) const override; void writeStub(uint8_t *buf, const macho::Symbol &) const override;
@ -43,7 +44,7 @@ struct X86_64 : TargetInfo {
} // namespace } // namespace
static std::string getErrorLocation(MemoryBufferRef mb, const section_64 &sec, static std::string getErrorLocation(MemoryBufferRef mb, const section_64 &sec,
const relocation_info &rel) { relocation_info rel) {
return ("invalid relocation at offset " + std::to_string(rel.r_address) + return ("invalid relocation at offset " + std::to_string(rel.r_address) +
" of " + sec.segname + "," + sec.sectname + " in " + " of " + sec.segname + "," + sec.sectname + " in " +
mb.getBufferIdentifier()) mb.getBufferIdentifier())
@ -51,7 +52,7 @@ static std::string getErrorLocation(MemoryBufferRef mb, const section_64 &sec,
} }
static void validateLength(MemoryBufferRef mb, const section_64 &sec, static void validateLength(MemoryBufferRef mb, const section_64 &sec,
const relocation_info &rel, relocation_info rel,
ArrayRef<uint8_t> validLengths) { ArrayRef<uint8_t> validLengths) {
if (find(validLengths, rel.r_length) != validLengths.end()) if (find(validLengths, rel.r_length) != validLengths.end())
return; return;
@ -68,8 +69,13 @@ static void validateLength(MemoryBufferRef mb, const section_64 &sec,
fatal(msg); fatal(msg);
} }
uint64_t X86_64::getImplicitAddend(MemoryBufferRef mb, const section_64 &sec, bool X86_64::isPairedReloc(relocation_info rel) const {
const relocation_info &rel) const { return rel.r_type == X86_64_RELOC_SUBTRACTOR;
}
uint64_t X86_64::getAddend(MemoryBufferRef mb, const section_64 &sec,
relocation_info rel,
relocation_info pairedRel) const {
auto *buf = reinterpret_cast<const uint8_t *>(mb.getBufferStart()); auto *buf = reinterpret_cast<const uint8_t *>(mb.getBufferStart());
const uint8_t *loc = buf + sec.offset + rel.r_address; const uint8_t *loc = buf + sec.offset + rel.r_address;
@ -139,7 +145,7 @@ void X86_64::relocateOne(uint8_t *loc, const Reloc &r, uint64_t val) const {
break; break;
default: default:
llvm_unreachable( llvm_unreachable(
"getImplicitAddend should have flagged all unhandled relocation types"); "getAddend should have flagged all unhandled relocation types");
} }
switch (r.length) { switch (r.length) {

View File

@ -206,31 +206,53 @@ static InputSection *findContainingSubsection(SubsectionMap &map,
void ObjFile::parseRelocations(const section_64 &sec, void ObjFile::parseRelocations(const section_64 &sec,
SubsectionMap &subsecMap) { SubsectionMap &subsecMap) {
auto *buf = reinterpret_cast<const uint8_t *>(mb.getBufferStart()); auto *buf = reinterpret_cast<const uint8_t *>(mb.getBufferStart());
ArrayRef<any_relocation_info> anyRelInfos( ArrayRef<relocation_info> relInfos(
reinterpret_cast<const any_relocation_info *>(buf + sec.reloff), reinterpret_cast<const relocation_info *>(buf + sec.reloff), sec.nreloc);
sec.nreloc);
for (const any_relocation_info &anyRelInfo : anyRelInfos) { for (size_t i = 0; i < relInfos.size(); i++) {
if (anyRelInfo.r_word0 & R_SCATTERED) // Paired relocations serve as Mach-O's method for attaching a
// supplemental datum to a primary relocation record. ELF does not
// need them because the *_RELOC_RELA records contain the extra
// addend field, vs. *_RELOC_REL which omit the addend.
//
// The {X86_64,ARM64}_RELOC_SUBTRACTOR record holds the subtrahend,
// and the paired *_RELOC_UNSIGNED record holds the minuend. The
// datum for each is a symbolic address. The result is the runtime
// offset between two addresses.
//
// The ARM64_RELOC_ADDEND record holds the addend, and the paired
// ARM64_RELOC_BRANCH26 or ARM64_RELOC_PAGE21/PAGEOFF12 holds the
// base symbolic address.
//
// Note: X86 does not use *_RELOC_ADDEND because it can embed an
// addend into the instruction stream. On X86, a relocatable address
// field always occupies an entire contiguous sequence of byte(s),
// so there is no need to merge opcode bits with address
// bits. Therefore, it's easy and convenient to store addends in the
// instruction-stream bytes that would otherwise contain zeroes. By
// contrast, RISC ISAs such as ARM64 mix opcode bits with with
// address bits so that bitwise arithmetic is necessary to extract
// and insert them. Storing addends in the instruction stream is
// possible, but inconvenient and more costly at link time.
relocation_info pairedInfo = relInfos[i];
relocation_info relInfo =
target->isPairedReloc(pairedInfo) ? relInfos[++i] : pairedInfo;
assert(i < relInfos.size());
if (relInfo.r_address & R_SCATTERED)
fatal("TODO: Scattered relocations not supported"); fatal("TODO: Scattered relocations not supported");
auto relInfo = reinterpret_cast<const relocation_info &>(anyRelInfo);
Reloc r; Reloc r;
r.type = relInfo.r_type; r.type = relInfo.r_type;
r.pcrel = relInfo.r_pcrel; r.pcrel = relInfo.r_pcrel;
r.length = relInfo.r_length; r.length = relInfo.r_length;
uint64_t rawAddend = target->getImplicitAddend(mb, sec, relInfo); r.offset = relInfo.r_address;
// For unpaired relocs, pairdInfo (just a copy of relInfo) is ignored
uint64_t rawAddend = target->getAddend(mb, sec, relInfo, pairedInfo);
if (relInfo.r_extern) { if (relInfo.r_extern) {
r.referent = symbols[relInfo.r_symbolnum]; r.referent = symbols[relInfo.r_symbolnum];
r.addend = rawAddend; r.addend = rawAddend;
} else { } else {
if (relInfo.r_symbolnum == 0 || relInfo.r_symbolnum > subsections.size())
fatal("invalid section index in relocation for offset " +
std::to_string(r.offset) + " in section " + sec.sectname +
" of " + getName());
SubsectionMap &referentSubsecMap = subsections[relInfo.r_symbolnum - 1]; SubsectionMap &referentSubsecMap = subsections[relInfo.r_symbolnum - 1];
const section_64 &referentSec = sectionHeaders[relInfo.r_symbolnum - 1]; const section_64 &referentSec = sectionHeaders[relInfo.r_symbolnum - 1];
uint32_t referentOffset; uint32_t referentOffset;
@ -250,7 +272,6 @@ void ObjFile::parseRelocations(const section_64 &sec,
r.addend = referentOffset; r.addend = referentOffset;
} }
r.offset = relInfo.r_address;
InputSection *subsec = findContainingSubsection(subsecMap, &r.offset); InputSection *subsec = findContainingSubsection(subsecMap, &r.offset);
subsec->relocs.push_back(r); subsec->relocs.push_back(r);
} }

View File

@ -37,9 +37,11 @@ public:
virtual ~TargetInfo() = default; virtual ~TargetInfo() = default;
// Validate the relocation structure and get its addend. // Validate the relocation structure and get its addend.
virtual uint64_t virtual uint64_t getAddend(llvm::MemoryBufferRef,
getImplicitAddend(llvm::MemoryBufferRef, const llvm::MachO::section_64 &, const llvm::MachO::section_64 &,
const llvm::MachO::relocation_info &) const = 0; llvm::MachO::relocation_info,
llvm::MachO::relocation_info) const = 0;
virtual bool isPairedReloc(llvm::MachO::relocation_info) const = 0;
virtual void relocateOne(uint8_t *loc, const Reloc &, uint64_t val) const = 0; virtual void relocateOne(uint8_t *loc, const Reloc &, uint64_t val) const = 0;
// Write code for lazy binding. See the comments on StubsSection for more // Write code for lazy binding. See the comments on StubsSection for more