blob: 591a1fdadd1eb76f8e85beaa10b6b47e5f212117 [file] [log] [blame]
// Copyright 2014 The Chromium Authors. All rights reserved.
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.
#include "crazy_linker_elf_relocations.h"
#include <errno.h>
#include "crazy_linker_debug.h"
#include "crazy_linker_elf_symbols.h"
#include "crazy_linker_elf_view.h"
#include "crazy_linker_error.h"
#include "crazy_linker_util.h"
#include "linker_phdr.h"
#define DEBUG_RELOCATIONS 0
#define RLOG(...) LOG_IF(DEBUG_RELOCATIONS, __VA_ARGS__)
#define RLOG_ERRNO(...) LOG_ERRNO_IF(DEBUG_RELOCATIONS, __VA_ARGS__)
#ifndef DF_SYMBOLIC
#define DF_SYMBOLIC 2
#endif
#ifndef DF_TEXTREL
#define DF_TEXTREL 4
#endif
#ifndef DT_FLAGS
#define DT_FLAGS 30
#endif
// Processor-specific relocation types supported by the linker.
#ifdef __arm__
/* arm32 relocations */
#define R_ARM_ABS32 2
#define R_ARM_REL32 3
#define R_ARM_GLOB_DAT 21
#define R_ARM_JUMP_SLOT 22
#define R_ARM_COPY 20
#define R_ARM_RELATIVE 23
#endif // __arm__
#ifdef __aarch64__
/* arm64 relocations */
#define R_AARCH64_ABS64 257
#define R_AARCH64_COPY 1024
#define R_AARCH64_GLOB_DAT 1025
#define R_AARCH64_JUMP_SLOT 1026
#define R_AARCH64_RELATIVE 1027
#endif // __aarch64__
#ifdef __i386__
/* i386 relocations */
#define R_386_32 1
#define R_386_PC32 2
#define R_386_GLOB_DAT 6
#define R_386_JMP_SLOT 7
#define R_386_RELATIVE 8
#endif // __i386__
namespace crazy {
namespace {
// List of known relocation types the relocator knows about.
enum RelocationType {
RELOCATION_TYPE_UNKNOWN = 0,
RELOCATION_TYPE_ABSOLUTE = 1,
RELOCATION_TYPE_RELATIVE = 2,
RELOCATION_TYPE_PC_RELATIVE = 3,
RELOCATION_TYPE_COPY = 4,
};
// Convert an ELF relocation type info a RelocationType value.
RelocationType GetRelocationType(ELF::Word r_type) {
switch (r_type) {
#ifdef __arm__
case R_ARM_JUMP_SLOT:
case R_ARM_GLOB_DAT:
case R_ARM_ABS32:
return RELOCATION_TYPE_ABSOLUTE;
case R_ARM_REL32:
case R_ARM_RELATIVE:
return RELOCATION_TYPE_RELATIVE;
case R_ARM_COPY:
return RELOCATION_TYPE_COPY;
#endif
#ifdef __aarch64__
case R_AARCH64_JUMP_SLOT:
case R_AARCH64_GLOB_DAT:
case R_AARCH64_ABS64:
return RELOCATION_TYPE_ABSOLUTE;
case R_AARCH64_RELATIVE:
return RELOCATION_TYPE_RELATIVE;
case R_AARCH64_COPY:
return RELOCATION_TYPE_COPY;
#endif
#ifdef __i386__
case R_386_JMP_SLOT:
case R_386_GLOB_DAT:
case R_386_32:
return RELOCATION_TYPE_ABSOLUTE;
case R_386_RELATIVE:
return RELOCATION_TYPE_RELATIVE;
case R_386_PC32:
return RELOCATION_TYPE_PC_RELATIVE;
#endif
#ifdef __mips__
case R_MIPS_REL32:
return RELOCATION_TYPE_RELATIVE;
#endif
default:
return RELOCATION_TYPE_UNKNOWN;
}
}
} // namespace
bool ElfRelocations::Init(const ElfView* view, Error* error) {
// Save these for later.
phdr_ = view->phdr();
phdr_count_ = view->phdr_count();
load_bias_ = view->load_bias();
// We handle only Rel or Rela, but not both. If DT_RELA or DT_RELASZ
// then we require DT_PLTREL to agree.
bool has_rela_relocations = false;
bool has_rel_relocations = false;
// Parse the dynamic table.
ElfView::DynamicIterator dyn(view);
for (; dyn.HasNext(); dyn.GetNext()) {
ELF::Addr dyn_value = dyn.GetValue();
uintptr_t dyn_addr = dyn.GetAddress(view->load_bias());
const ELF::Addr tag = dyn.GetTag();
switch (tag) {
case DT_PLTREL:
RLOG(" DT_PLTREL value=%d\n", dyn_value);
if (dyn_value != DT_REL && dyn_value != DT_RELA) {
*error = "Invalid DT_PLTREL value in dynamic section";
return false;
}
relocations_type_ = dyn_value;
break;
case DT_JMPREL:
RLOG(" DT_JMPREL addr=%p\n", dyn_addr);
plt_relocations_ = dyn_addr;
break;
case DT_PLTRELSZ:
plt_relocations_size_ = dyn_value;
RLOG(" DT_PLTRELSZ size=%d\n", dyn_value);
break;
case DT_RELA:
case DT_REL:
RLOG(" %s addr=%p\n",
(tag == DT_RELA) ? "DT_RELA" : "DT_REL",
dyn_addr);
if (relocations_) {
*error = "Unsupported DT_RELA/DT_REL combination in dynamic section";
return false;
}
relocations_ = dyn_addr;
if (tag == DT_RELA)
has_rela_relocations = true;
else
has_rel_relocations = true;
break;
case DT_RELASZ:
case DT_RELSZ:
RLOG(" %s size=%d\n",
(tag == DT_RELASZ) ? "DT_RELASZ" : "DT_RELSZ",
dyn_addr);
if (relocations_size_) {
*error = "Unsupported DT_RELASZ/DT_RELSZ combination in dyn section";
return false;
}
relocations_size_ = dyn_value;
if (tag == DT_RELASZ)
has_rela_relocations = true;
else
has_rel_relocations = true;
break;
case DT_PLTGOT:
// Only used on MIPS currently. Could also be used on other platforms
// when lazy binding (i.e. RTLD_LAZY) is implemented.
RLOG(" DT_PLTGOT addr=%p\n", dyn_addr);
plt_got_ = reinterpret_cast<ELF::Addr*>(dyn_addr);
break;
case DT_TEXTREL:
RLOG(" DT_TEXTREL\n");
has_text_relocations_ = true;
break;
case DT_SYMBOLIC:
RLOG(" DT_SYMBOLIC\n");
has_symbolic_ = true;
break;
case DT_FLAGS:
if (dyn_value & DF_TEXTREL)
has_text_relocations_ = true;
if (dyn_value & DF_SYMBOLIC)
has_symbolic_ = true;
RLOG(" DT_FLAGS has_text_relocations=%s has_symbolic=%s\n",
has_text_relocations_ ? "true" : "false",
has_symbolic_ ? "true" : "false");
break;
#if defined(__mips__)
case DT_MIPS_SYMTABNO:
RLOG(" DT_MIPS_SYMTABNO value=%d\n", dyn_value);
mips_symtab_count_ = dyn_value;
break;
case DT_MIPS_LOCAL_GOTNO:
RLOG(" DT_MIPS_LOCAL_GOTNO value=%d\n", dyn_value);
mips_local_got_count_ = dyn_value;
break;
case DT_MIPS_GOTSYM:
RLOG(" DT_MIPS_GOTSYM value=%d\n", dyn_value);
mips_gotsym_ = dyn_value;
break;
#endif
default:
;
}
}
if (relocations_type_ != DT_REL && relocations_type_ != DT_RELA) {
*error = "Unsupported or missing DT_PLTREL in dynamic section";
return false;
}
if (relocations_type_ == DT_REL && has_rela_relocations) {
*error = "Found DT_RELA in dyn section, but DT_PLTREL is DT_REL";
return false;
}
if (relocations_type_ == DT_RELA && has_rel_relocations) {
*error = "Found DT_REL in dyn section, but DT_PLTREL is DT_RELA";
return false;
}
return true;
}
bool ElfRelocations::ApplyAll(const ElfSymbols* symbols,
SymbolResolver* resolver,
Error* error) {
LOG("%s: Enter\n", __FUNCTION__);
if (has_text_relocations_) {
if (phdr_table_unprotect_segments(phdr_, phdr_count_, load_bias_) < 0) {
error->Format("Can't unprotect loadable segments: %s", strerror(errno));
return false;
}
}
if (relocations_type_ == DT_REL) {
if (!ApplyRelRelocs(reinterpret_cast<ELF::Rel*>(plt_relocations_),
plt_relocations_size_ / sizeof(ELF::Rel),
symbols,
resolver,
error))
return false;
if (!ApplyRelRelocs(reinterpret_cast<ELF::Rel*>(relocations_),
relocations_size_ / sizeof(ELF::Rel),
symbols,
resolver,
error))
return false;
}
else if (relocations_type_ == DT_RELA) {
if (!ApplyRelaRelocs(reinterpret_cast<ELF::Rela*>(plt_relocations_),
plt_relocations_size_ / sizeof(ELF::Rela),
symbols,
resolver,
error))
return false;
if (!ApplyRelaRelocs(reinterpret_cast<ELF::Rela*>(relocations_),
relocations_size_ / sizeof(ELF::Rela),
symbols,
resolver,
error))
return false;
}
#ifdef __mips__
if (!RelocateMipsGot(symbols, resolver, error))
return false;
#endif
if (has_text_relocations_) {
if (phdr_table_protect_segments(phdr_, phdr_count_, load_bias_) < 0) {
error->Format("Can't reprotect loadable segments: %s", strerror(errno));
return false;
}
}
LOG("%s: Done\n", __FUNCTION__);
return true;
}
bool ElfRelocations::ApplyRelaReloc(const ELF::Rela* rela,
ELF::Addr sym_addr,
bool resolved CRAZY_UNUSED,
Error* error) {
const ELF::Word rela_type = ELF_R_TYPE(rela->r_info);
const ELF::Word CRAZY_UNUSED rela_symbol = ELF_R_SYM(rela->r_info);
const ELF::Sword CRAZY_UNUSED addend = rela->r_addend;
const ELF::Addr reloc = static_cast<ELF::Addr>(rela->r_offset + load_bias_);
RLOG(" rela reloc=%p offset=%p type=%d addend=%p\n",
reloc,
rela->r_offset,
rela_type,
addend);
// Apply the relocation.
ELF::Addr* CRAZY_UNUSED target = reinterpret_cast<ELF::Addr*>(reloc);
switch (rela_type) {
#ifdef __aarch64__
case R_AARCH64_JUMP_SLOT:
RLOG(" R_AARCH64_JUMP_SLOT target=%p addr=%p\n",
target,
sym_addr + addend);
*target = sym_addr + addend;
break;
case R_AARCH64_GLOB_DAT:
RLOG(" R_AARCH64_GLOB_DAT target=%p addr=%p\n",
target,
sym_addr + addend);
*target = sym_addr + addend;
break;
case R_AARCH64_ABS64:
RLOG(" R_AARCH64_ABS64 target=%p (%p) addr=%p\n",
target,
*target,
sym_addr + addend);
*target += sym_addr + addend;
break;
case R_AARCH64_RELATIVE:
RLOG(" R_AARCH64_RELATIVE target=%p (%p) bias=%p\n",
target,
*target,
load_bias_ + addend);
if (__builtin_expect(rela_symbol, 0)) {
*error = "Invalid relative relocation with symbol";
return false;
}
*target = load_bias_ + addend;
break;
case R_AARCH64_COPY:
// NOTE: These relocations are forbidden in shared libraries.
RLOG(" R_AARCH64_COPY\n");
*error = "Invalid R_AARCH64_COPY relocation in shared library";
return false;
#endif // __aarch64__
default:
error->Format("Invalid relocation type (%d)", rela_type);
return false;
}
return true;
}
bool ElfRelocations::ApplyRelReloc(const ELF::Rel* rel,
ELF::Addr sym_addr,
bool resolved CRAZY_UNUSED,
Error* error) {
const ELF::Word rel_type = ELF_R_TYPE(rel->r_info);
const ELF::Word CRAZY_UNUSED rel_symbol = ELF_R_SYM(rel->r_info);
const ELF::Addr reloc = static_cast<ELF::Addr>(rel->r_offset + load_bias_);
RLOG(" rel reloc=%p offset=%p type=%d\n", reloc, rel->r_offset, rel_type);
// Apply the relocation.
ELF::Addr* CRAZY_UNUSED target = reinterpret_cast<ELF::Addr*>(reloc);
switch (rel_type) {
#ifdef __arm__
case R_ARM_JUMP_SLOT:
RLOG(" R_ARM_JUMP_SLOT target=%p addr=%p\n", target, sym_addr);
*target = sym_addr;
break;
case R_ARM_GLOB_DAT:
RLOG(" R_ARM_GLOB_DAT target=%p addr=%p\n", target, sym_addr);
*target = sym_addr;
break;
case R_ARM_ABS32:
RLOG(" R_ARM_ABS32 target=%p (%p) addr=%p\n",
target,
*target,
sym_addr);
*target += sym_addr;
break;
case R_ARM_REL32:
RLOG(" R_ARM_REL32 target=%p (%p) addr=%p offset=%p\n",
target,
*target,
sym_addr,
rel->r_offset);
*target += sym_addr - rel->r_offset;
break;
case R_ARM_RELATIVE:
RLOG(" R_ARM_RELATIVE target=%p (%p) bias=%p\n",
target,
*target,
load_bias_);
if (__builtin_expect(rel_symbol, 0)) {
*error = "Invalid relative relocation with symbol";
return false;
}
*target += load_bias_;
break;
case R_ARM_COPY:
// NOTE: These relocations are forbidden in shared libraries.
// The Android linker has special code to deal with this, which
// is not needed here.
RLOG(" R_ARM_COPY\n");
*error = "Invalid R_ARM_COPY relocation in shared library";
return false;
#endif // __arm__
#ifdef __i386__
case R_386_JMP_SLOT:
*target = sym_addr;
break;
case R_386_GLOB_DAT:
*target = sym_addr;
break;
case R_386_RELATIVE:
if (rel_symbol) {
*error = "Invalid relative relocation with symbol";
return false;
}
*target += load_bias_;
break;
case R_386_32:
*target += sym_addr;
break;
case R_386_PC32:
*target += (sym_addr - reloc);
break;
#endif // __i386__
#ifdef __mips__
case R_MIPS_REL32:
if (resolved)
*target += sym_addr;
else
*target += load_bias_;
break;
#endif // __mips__
default:
error->Format("Invalid relocation type (%d)", rel_type);
return false;
}
return true;
}
bool ElfRelocations::ResolveSymbol(ELF::Word rel_type,
ELF::Word rel_symbol,
const ElfSymbols* symbols,
SymbolResolver* resolver,
ELF::Addr reloc,
ELF::Addr* sym_addr,
Error* error) {
const char* sym_name = symbols->LookupNameById(rel_symbol);
RLOG(" symbol name='%s'\n", sym_name);
void* address = resolver->Lookup(sym_name);
if (address) {
// The symbol was found, so compute its address.
RLOG("%s: symbol %s resolved to %p\n", __FUNCTION__, sym_name, address);
*sym_addr = reinterpret_cast<ELF::Addr>(address);
return true;
}
// The symbol was not found. Normally this is an error except
// if this is a weak reference.
if (!symbols->IsWeakById(rel_symbol)) {
error->Format("Could not find symbol '%s'", sym_name);
return false;
}
RLOG("%s: weak reference to unresolved symbol %s\n", __FUNCTION__, sym_name);
// IHI0044C AAELF 4.5.1.1:
// Libraries are not searched to resolve weak references.
// It is not an error for a weak reference to remain
// unsatisfied.
//
// During linking, the value of an undefined weak reference is:
// - Zero if the relocation type is absolute
// - The address of the place if the relocation is pc-relative
// - The address of nominal base address if the relocation
// type is base-relative.
RelocationType r = GetRelocationType(rel_type);
if (r == RELOCATION_TYPE_ABSOLUTE || r == RELOCATION_TYPE_RELATIVE) {
*sym_addr = 0;
return true;
}
if (r == RELOCATION_TYPE_PC_RELATIVE) {
*sym_addr = reloc;
return true;
}
error->Format(
"Invalid weak relocation type (%d) for unknown symbol '%s'",
r,
sym_name);
return false;
}
bool ElfRelocations::ApplyRelRelocs(const ELF::Rel* rel,
size_t rel_count,
const ElfSymbols* symbols,
SymbolResolver* resolver,
Error* error) {
RLOG("%s: rel=%p rel_count=%d\n", __FUNCTION__, rel, rel_count);
if (!rel)
return true;
for (size_t rel_n = 0; rel_n < rel_count; rel++, rel_n++) {
const ELF::Word rel_type = ELF_R_TYPE(rel->r_info);
const ELF::Word rel_symbol = ELF_R_SYM(rel->r_info);
ELF::Addr sym_addr = 0;
ELF::Addr reloc = static_cast<ELF::Addr>(rel->r_offset + load_bias_);
RLOG(" %d/%d reloc=%p offset=%p type=%d symbol=%d\n",
rel_n + 1,
rel_count,
reloc,
rel->r_offset,
rel_type,
rel_symbol);
if (rel_type == 0)
continue;
bool resolved = false;
// If this is a symbolic relocation, compute the symbol's address.
if (__builtin_expect(rel_symbol != 0, 0)) {
resolved = ResolveSymbol(rel_type,
rel_symbol,
symbols,
resolver,
reloc,
&sym_addr,
error);
}
if (!ApplyRelReloc(rel, sym_addr, resolved, error))
return false;
}
return true;
}
bool ElfRelocations::ApplyRelaRelocs(const ELF::Rela* rela,
size_t rela_count,
const ElfSymbols* symbols,
SymbolResolver* resolver,
Error* error) {
RLOG("%s: rela=%p rela_count=%d\n", __FUNCTION__, rela, rela_count);
if (!rela)
return true;
for (size_t rel_n = 0; rel_n < rela_count; rela++, rel_n++) {
const ELF::Word rel_type = ELF_R_TYPE(rela->r_info);
const ELF::Word rel_symbol = ELF_R_SYM(rela->r_info);
ELF::Addr sym_addr = 0;
ELF::Addr reloc = static_cast<ELF::Addr>(rela->r_offset + load_bias_);
RLOG(" %d/%d reloc=%p offset=%p type=%d symbol=%d\n",
rel_n + 1,
rela_count,
reloc,
rela->r_offset,
rel_type,
rel_symbol);
if (rel_type == 0)
continue;
bool resolved = false;
// If this is a symbolic relocation, compute the symbol's address.
if (__builtin_expect(rel_symbol != 0, 0)) {
resolved = ResolveSymbol(rel_type,
rel_symbol,
symbols,
resolver,
reloc,
&sym_addr,
error);
}
if (!ApplyRelaReloc(rela, sym_addr, resolved, error))
return false;
}
return true;
}
#ifdef __mips__
bool ElfRelocations::RelocateMipsGot(const ElfSymbols* symbols,
SymbolResolver* resolver,
Error* error) {
if (!plt_got_)
return true;
// Handle the local GOT entries.
// This mimics what the system linker does.
// Note from the system linker:
// got[0]: lazy resolver function address.
// got[1]: may be used for a GNU extension.
// Set it to a recognizable address in case someone calls it
// (should be _rtld_bind_start).
ELF::Addr* got = plt_got_;
got[0] = 0xdeadbeef;
if (got[1] & 0x80000000)
got[1] = 0xdeadbeef;
for (ELF::Addr n = 2; n < mips_local_got_count_; ++n)
got[n] += load_bias_;
// Handle the global GOT entries.
got += mips_local_got_count_;
for (size_t idx = mips_gotsym_; idx < mips_symtab_count_; idx++, got++) {
const char* sym_name = symbols->LookupNameById(idx);
void* sym_addr = resolver->Lookup(sym_name);
if (sym_addr) {
// Found symbol, update GOT entry.
*got = reinterpret_cast<ELF::Addr>(sym_addr);
continue;
}
if (symbols->IsWeakById(idx)) {
// Undefined symbols are only ok if this is a weak reference.
// Update GOT entry to 0 though.
*got = 0;
continue;
}
error->Format("Cannot locate symbol %s", sym_name);
return false;
}
return true;
}
#endif // __mips__
void ElfRelocations::AdjustRelocation(ELF::Word rel_type,
ELF::Addr src_reloc,
size_t dst_delta,
size_t map_delta) {
ELF::Addr* dst_ptr = reinterpret_cast<ELF::Addr*>(src_reloc + dst_delta);
switch (rel_type) {
#ifdef __arm__
case R_ARM_RELATIVE:
*dst_ptr += map_delta;
break;
#endif // __arm__
#ifdef __aarch64__
case R_AARCH64_RELATIVE:
*dst_ptr += map_delta;
break;
#endif // __aarch64__
#ifdef __i386__
case R_386_RELATIVE:
*dst_ptr += map_delta;
break;
#endif
#ifdef __mips__
case R_MIPS_REL32:
*dst_ptr += map_delta;
break;
#endif
default:
;
}
}
void ElfRelocations::RelocateRela(size_t src_addr,
size_t dst_addr,
size_t map_addr,
size_t size) {
// Add this value to each source address to get the corresponding
// destination address.
const size_t dst_delta = dst_addr - src_addr;
const size_t map_delta = map_addr - src_addr;
// Ignore PLT relocations, which all target symbols (ignored here).
const ELF::Rela* rel = reinterpret_cast<ELF::Rela*>(relocations_);
const size_t relocations_count = relocations_size_ / sizeof(ELF::Rela);
const ELF::Rela* rel_limit = rel + relocations_count;
for (; rel < rel_limit; ++rel) {
const ELF::Word rel_type = ELF_R_TYPE(rel->r_info);
const ELF::Word rel_symbol = ELF_R_SYM(rel->r_info);
ELF::Addr src_reloc = static_cast<ELF::Addr>(rel->r_offset + load_bias_);
if (rel_type == 0 || rel_symbol != 0) {
// Ignore empty and symbolic relocations
continue;
}
if (src_reloc < src_addr || src_reloc >= src_addr + size) {
// Ignore entries that don't relocate addresses inside the source section.
continue;
}
AdjustRelocation(rel_type, src_reloc, dst_delta, map_delta);
}
}
void ElfRelocations::RelocateRel(size_t src_addr,
size_t dst_addr,
size_t map_addr,
size_t size) {
// Add this value to each source address to get the corresponding
// destination address.
const size_t dst_delta = dst_addr - src_addr;
const size_t map_delta = map_addr - src_addr;
// Ignore PLT relocations, which all target symbols (ignored here).
const ELF::Rel* rel = reinterpret_cast<ELF::Rel*>(relocations_);
const size_t relocations_count = relocations_size_ / sizeof(ELF::Rel);
const ELF::Rel* rel_limit = rel + relocations_count;
for (; rel < rel_limit; ++rel) {
const ELF::Word rel_type = ELF_R_TYPE(rel->r_info);
const ELF::Word rel_symbol = ELF_R_SYM(rel->r_info);
ELF::Addr src_reloc = static_cast<ELF::Addr>(rel->r_offset + load_bias_);
if (rel_type == 0 || rel_symbol != 0) {
// Ignore empty and symbolic relocations
continue;
}
if (src_reloc < src_addr || src_reloc >= src_addr + size) {
// Ignore entries that don't relocate addresses inside the source section.
continue;
}
AdjustRelocation(rel_type, src_reloc, dst_delta, map_delta);
}
}
void ElfRelocations::CopyAndRelocate(size_t src_addr,
size_t dst_addr,
size_t map_addr,
size_t size) {
// First, a straight copy.
::memcpy(reinterpret_cast<void*>(dst_addr),
reinterpret_cast<void*>(src_addr),
size);
// Relocate relocations.
if (relocations_type_ == DT_REL)
RelocateRel(src_addr, dst_addr, map_addr, size);
else if (relocations_type_ == DT_RELA)
RelocateRela(src_addr, dst_addr, map_addr, size);
#ifdef __mips__
// Add this value to each source address to get the corresponding
// destination address.
const size_t dst_delta = dst_addr - src_addr;
const size_t map_delta = map_addr - src_addr;
// Only relocate local GOT entries.
ELF::Addr* got = plt_got_;
if (got) {
for (ELF::Addr n = 2; n < mips_local_got_count_; ++n) {
size_t got_addr = reinterpret_cast<size_t>(&got[n]);
if (got_addr < src_addr || got_addr >= src_addr + size)
continue;
ELF::Addr* dst_ptr = reinterpret_cast<ELF::Addr*>(got_addr + dst_delta);
*dst_ptr += map_delta;
}
}
#endif
}
} // namespace crazy