| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398 | // Copyright 2017 The Abseil Authors.//// Licensed under the Apache License, Version 2.0 (the "License");// you may not use this file except in compliance with the License.// You may obtain a copy of the License at////      http://www.apache.org/licenses/LICENSE-2.0//// Unless required by applicable law or agreed to in writing, software// distributed under the License is distributed on an "AS IS" BASIS,// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.// See the License for the specific language governing permissions and// limitations under the License.// Allow dynamic symbol lookup in an in-memory Elf image.//#include "absl/debugging/internal/elf_mem_image.h"#ifdef ABSL_HAVE_ELF_MEM_IMAGE  // defined in elf_mem_image.h#include <string.h>#include <cassert>#include <cstddef>#include "absl/base/internal/raw_logging.h"// From binutils/include/elf/common.h (this doesn't appear to be documented// anywhere else).////   /* This flag appears in a Versym structure.  It means that the symbol//      is hidden, and is only visible with an explicit version number.//      This is a GNU extension.  *///   #define VERSYM_HIDDEN           0x8000////   /* This is the mask for the rest of the Versym information.  *///   #define VERSYM_VERSION          0x7fff#define VERSYM_VERSION 0x7fffnamespace absl {namespace debugging_internal {namespace {#if __WORDSIZE == 32const int kElfClass = ELFCLASS32;int ElfBind(const ElfW(Sym) *symbol) { return ELF32_ST_BIND(symbol->st_info); }int ElfType(const ElfW(Sym) *symbol) { return ELF32_ST_TYPE(symbol->st_info); }#elif __WORDSIZE == 64const int kElfClass = ELFCLASS64;int ElfBind(const ElfW(Sym) *symbol) { return ELF64_ST_BIND(symbol->st_info); }int ElfType(const ElfW(Sym) *symbol) { return ELF64_ST_TYPE(symbol->st_info); }#elseconst int kElfClass = -1;int ElfBind(const ElfW(Sym) *) {  ABSL_RAW_LOG(FATAL, "Unexpected word size");  return 0;}int ElfType(const ElfW(Sym) *) {  ABSL_RAW_LOG(FATAL, "Unexpected word size");  return 0;}#endif// Extract an element from one of the ELF tables, cast it to desired type.// This is just a simple arithmetic and a glorified cast.// Callers are responsible for bounds checking.template <typename T>const T *GetTableElement(const ElfW(Ehdr) * ehdr, ElfW(Off) table_offset,                         ElfW(Word) element_size, size_t index) {  return reinterpret_cast<const T*>(reinterpret_cast<const char *>(ehdr)                                    + table_offset                                    + index * element_size);}}  // namespace// The value of this variable doesn't matter; it's used only for its// unique address.const int ElfMemImage::kInvalidBaseSentinel = 0;ElfMemImage::ElfMemImage(const void *base) {  ABSL_RAW_CHECK(base != kInvalidBase, "bad pointer");  Init(base);}int ElfMemImage::GetNumSymbols() const {  if (!hash_) {    return 0;  }  // See http://www.caldera.com/developers/gabi/latest/ch5.dynamic.html#hash  return hash_[1];}const ElfW(Sym) *ElfMemImage::GetDynsym(int index) const {  ABSL_RAW_CHECK(index < GetNumSymbols(), "index out of range");  return dynsym_ + index;}const ElfW(Versym) *ElfMemImage::GetVersym(int index) const {  ABSL_RAW_CHECK(index < GetNumSymbols(), "index out of range");  return versym_ + index;}const ElfW(Phdr) *ElfMemImage::GetPhdr(int index) const {  ABSL_RAW_CHECK(index < ehdr_->e_phnum, "index out of range");  return GetTableElement<ElfW(Phdr)>(ehdr_,                                     ehdr_->e_phoff,                                     ehdr_->e_phentsize,                                     index);}const char *ElfMemImage::GetDynstr(ElfW(Word) offset) const {  ABSL_RAW_CHECK(offset < strsize_, "offset out of range");  return dynstr_ + offset;}const void *ElfMemImage::GetSymAddr(const ElfW(Sym) *sym) const {  if (sym->st_shndx == SHN_UNDEF || sym->st_shndx >= SHN_LORESERVE) {    // Symbol corresponds to "special" (e.g. SHN_ABS) section.    return reinterpret_cast<const void *>(sym->st_value);  }  ABSL_RAW_CHECK(link_base_ < sym->st_value, "symbol out of range");  return GetTableElement<char>(ehdr_, 0, 1, sym->st_value) - link_base_;}const ElfW(Verdef) *ElfMemImage::GetVerdef(int index) const {  ABSL_RAW_CHECK(0 <= index && static_cast<size_t>(index) <= verdefnum_,                 "index out of range");  const ElfW(Verdef) *version_definition = verdef_;  while (version_definition->vd_ndx < index && version_definition->vd_next) {    const char *const version_definition_as_char =        reinterpret_cast<const char *>(version_definition);    version_definition =        reinterpret_cast<const ElfW(Verdef) *>(version_definition_as_char +                                               version_definition->vd_next);  }  return version_definition->vd_ndx == index ? version_definition : nullptr;}const ElfW(Verdaux) *ElfMemImage::GetVerdefAux(    const ElfW(Verdef) *verdef) const {  return reinterpret_cast<const ElfW(Verdaux) *>(verdef+1);}const char *ElfMemImage::GetVerstr(ElfW(Word) offset) const {  ABSL_RAW_CHECK(offset < strsize_, "offset out of range");  return dynstr_ + offset;}void ElfMemImage::Init(const void *base) {  ehdr_      = nullptr;  dynsym_    = nullptr;  dynstr_    = nullptr;  versym_    = nullptr;  verdef_    = nullptr;  hash_      = nullptr;  strsize_   = 0;  verdefnum_ = 0;  link_base_ = ~0L;  // Sentinel: PT_LOAD .p_vaddr can't possibly be this.  if (!base) {    return;  }  const intptr_t base_as_uintptr_t = reinterpret_cast<uintptr_t>(base);  // Fake VDSO has low bit set.  const bool fake_vdso = ((base_as_uintptr_t & 1) != 0);  base = reinterpret_cast<const void *>(base_as_uintptr_t & ~1);  const char *const base_as_char = reinterpret_cast<const char *>(base);  if (base_as_char[EI_MAG0] != ELFMAG0 || base_as_char[EI_MAG1] != ELFMAG1 ||      base_as_char[EI_MAG2] != ELFMAG2 || base_as_char[EI_MAG3] != ELFMAG3) {    assert(false);    return;  }  int elf_class = base_as_char[EI_CLASS];  if (elf_class != kElfClass) {    assert(false);    return;  }  switch (base_as_char[EI_DATA]) {    case ELFDATA2LSB: {      if (__LITTLE_ENDIAN != __BYTE_ORDER) {        assert(false);        return;      }      break;    }    case ELFDATA2MSB: {      if (__BIG_ENDIAN != __BYTE_ORDER) {        assert(false);        return;      }      break;    }    default: {      assert(false);      return;    }  }  ehdr_ = reinterpret_cast<const ElfW(Ehdr) *>(base);  const ElfW(Phdr) *dynamic_program_header = nullptr;  for (int i = 0; i < ehdr_->e_phnum; ++i) {    const ElfW(Phdr) *const program_header = GetPhdr(i);    switch (program_header->p_type) {      case PT_LOAD:        if (!~link_base_) {          link_base_ = program_header->p_vaddr;        }        break;      case PT_DYNAMIC:        dynamic_program_header = program_header;        break;    }  }  if (!~link_base_ || !dynamic_program_header) {    assert(false);    // Mark this image as not present. Can not recur infinitely.    Init(nullptr);    return;  }  ptrdiff_t relocation =      base_as_char - reinterpret_cast<const char *>(link_base_);  ElfW(Dyn) *dynamic_entry =      reinterpret_cast<ElfW(Dyn) *>(dynamic_program_header->p_vaddr +                                    relocation);  for (; dynamic_entry->d_tag != DT_NULL; ++dynamic_entry) {    ElfW(Xword) value = dynamic_entry->d_un.d_val;    if (fake_vdso) {      // A complication: in the real VDSO, dynamic entries are not relocated      // (it wasn't loaded by a dynamic loader). But when testing with a      // "fake" dlopen()ed vdso library, the loader relocates some (but      // not all!) of them before we get here.      if (dynamic_entry->d_tag == DT_VERDEF) {        // The only dynamic entry (of the ones we care about) libc-2.3.6        // loader doesn't relocate.        value += relocation;      }    } else {      // Real VDSO. Everything needs to be relocated.      value += relocation;    }    switch (dynamic_entry->d_tag) {      case DT_HASH:        hash_ = reinterpret_cast<ElfW(Word) *>(value);        break;      case DT_SYMTAB:        dynsym_ = reinterpret_cast<ElfW(Sym) *>(value);        break;      case DT_STRTAB:        dynstr_ = reinterpret_cast<const char *>(value);        break;      case DT_VERSYM:        versym_ = reinterpret_cast<ElfW(Versym) *>(value);        break;      case DT_VERDEF:        verdef_ = reinterpret_cast<ElfW(Verdef) *>(value);        break;      case DT_VERDEFNUM:        verdefnum_ = dynamic_entry->d_un.d_val;        break;      case DT_STRSZ:        strsize_ = dynamic_entry->d_un.d_val;        break;      default:        // Unrecognized entries explicitly ignored.        break;    }  }  if (!hash_ || !dynsym_ || !dynstr_ || !versym_ ||      !verdef_ || !verdefnum_ || !strsize_) {    assert(false);  // invalid VDSO    // Mark this image as not present. Can not recur infinitely.    Init(nullptr);    return;  }}bool ElfMemImage::LookupSymbol(const char *name,                               const char *version,                               int type,                               SymbolInfo *info_out) const {  for (const SymbolInfo& info : *this) {    if (strcmp(info.name, name) == 0 && strcmp(info.version, version) == 0 &&        ElfType(info.symbol) == type) {      if (info_out) {        *info_out = info;      }      return true;    }  }  return false;}bool ElfMemImage::LookupSymbolByAddress(const void *address,                                        SymbolInfo *info_out) const {  for (const SymbolInfo& info : *this) {    const char *const symbol_start =        reinterpret_cast<const char *>(info.address);    const char *const symbol_end = symbol_start + info.symbol->st_size;    if (symbol_start <= address && address < symbol_end) {      if (info_out) {        // Client wants to know details for that symbol (the usual case).        if (ElfBind(info.symbol) == STB_GLOBAL) {          // Strong symbol; just return it.          *info_out = info;          return true;        } else {          // Weak or local. Record it, but keep looking for a strong one.          *info_out = info;        }      } else {        // Client only cares if there is an overlapping symbol.        return true;      }    }  }  return false;}ElfMemImage::SymbolIterator::SymbolIterator(const void *const image, int index)    : index_(index), image_(image) {}const ElfMemImage::SymbolInfo *ElfMemImage::SymbolIterator::operator->() const {  return &info_;}const ElfMemImage::SymbolInfo& ElfMemImage::SymbolIterator::operator*() const {  return info_;}bool ElfMemImage::SymbolIterator::operator==(const SymbolIterator &rhs) const {  return this->image_ == rhs.image_ && this->index_ == rhs.index_;}bool ElfMemImage::SymbolIterator::operator!=(const SymbolIterator &rhs) const {  return !(*this == rhs);}ElfMemImage::SymbolIterator &ElfMemImage::SymbolIterator::operator++() {  this->Update(1);  return *this;}ElfMemImage::SymbolIterator ElfMemImage::begin() const {  SymbolIterator it(this, 0);  it.Update(0);  return it;}ElfMemImage::SymbolIterator ElfMemImage::end() const {  return SymbolIterator(this, GetNumSymbols());}void ElfMemImage::SymbolIterator::Update(int increment) {  const ElfMemImage *image = reinterpret_cast<const ElfMemImage *>(image_);  ABSL_RAW_CHECK(image->IsPresent() || increment == 0, "");  if (!image->IsPresent()) {    return;  }  index_ += increment;  if (index_ >= image->GetNumSymbols()) {    index_ = image->GetNumSymbols();    return;  }  const ElfW(Sym)    *symbol = image->GetDynsym(index_);  const ElfW(Versym) *version_symbol = image->GetVersym(index_);  ABSL_RAW_CHECK(symbol && version_symbol, "");  const char *const symbol_name = image->GetDynstr(symbol->st_name);  const ElfW(Versym) version_index = version_symbol[0] & VERSYM_VERSION;  const ElfW(Verdef) *version_definition = nullptr;  const char *version_name = "";  if (symbol->st_shndx == SHN_UNDEF) {    // Undefined symbols reference DT_VERNEED, not DT_VERDEF, and    // version_index could well be greater than verdefnum_, so calling    // GetVerdef(version_index) may trigger assertion.  } else {    version_definition = image->GetVerdef(version_index);  }  if (version_definition) {    // I am expecting 1 or 2 auxiliary entries: 1 for the version itself,    // optional 2nd if the version has a parent.    ABSL_RAW_CHECK(        version_definition->vd_cnt == 1 || version_definition->vd_cnt == 2,        "wrong number of entries");    const ElfW(Verdaux) *version_aux = image->GetVerdefAux(version_definition);    version_name = image->GetVerstr(version_aux->vda_name);  }  info_.name    = symbol_name;  info_.version = version_name;  info_.address = image->GetSymAddr(symbol);  info_.symbol  = symbol;}}  // namespace debugging_internal}  // namespace absl#endif  // ABSL_HAVE_ELF_MEM_IMAGE
 |