普通文本  |  325行  |  10.08 KB

// Copyright 2016, VIXL authors
// All rights reserved.
//
// Redistribution and use in source and binary forms, with or without
// modification, are permitted provided that the following conditions are met:
//
//   * Redistributions of source code must retain the above copyright notice,
//     this list of conditions and the following disclaimer.
//   * Redistributions in binary form must reproduce the above copyright notice,
//     this list of conditions and the following disclaimer in the documentation
//     and/or other materials provided with the distribution.
//   * Neither the name of ARM Limited nor the names of its contributors may be
//     used to endorse or promote products derived from this software without
//     specific prior written permission.
//
// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS CONTRIBUTORS "AS IS" AND
// ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
// WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE
// FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
// DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
// SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
// CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
// OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.


// The example assumes support for ELF binaries.
#ifdef __linux__

extern "C" {
#include <elf.h>
#include <fcntl.h>
#include <stdint.h>
#include <sys/mman.h>
#include <sys/stat.h>
#include <sys/types.h>
#include <unistd.h>
}

#include <cerrno>
#include <iostream>
#include <map>
#include <string>

#include "globals-vixl.h"
#include "aarch32/instructions-aarch32.h"
#include "aarch32/disasm-aarch32.h"

class Symbol {
  Elf32_Addr addr_;
  int32_t offset_;
  uint32_t size_;
  int section_;
  std::string name_;

 public:
  Symbol(const char* name,
         Elf32_Addr addr,
         int32_t offset,
         uint32_t size,
         int section)
      : addr_(addr),
        offset_(offset),
        size_(size),
        section_(section),
        name_(name) {}
  Symbol(const Symbol& ref)
      : addr_(ref.addr_),
        offset_(ref.offset_),
        size_(ref.size_),
        section_(ref.section_),
        name_(ref.name_) {}

  Elf32_Addr GetAddress() const { return addr_; }
  Elf32_Addr GetMemoryAddress() const { return (addr_ & ~1) + offset_; }
  uint32_t GetSize() const { return size_; }
  const std::string& GetName() const { return name_; }
  int GetSection() const { return section_; }
};


class SymbolTable : public std::map<Elf32_Addr, Symbol> {
 public:
  void insert(const Symbol& sym) {
    VIXL_ASSERT(find(sym.GetAddress()) == end());
    std::map<Elf32_Addr, Symbol>::insert(
        std::make_pair(sym.GetMemoryAddress(), sym));
  }
};


class SectionLocator {
  const Elf32_Shdr* shdr_;
  int nsections_;
  const char* shstrtab_;

 public:
  explicit SectionLocator(const Elf32_Ehdr* ehdr) {
    shdr_ = reinterpret_cast<const Elf32_Shdr*>(
        reinterpret_cast<const char*>(ehdr) + ehdr->e_shoff);
    // shstrtab holds the section names as an offset in the file.
    shstrtab_ =
        reinterpret_cast<const char*>(ehdr) + shdr_[ehdr->e_shstrndx].sh_offset;
    nsections_ = ehdr->e_shnum;
  }

  const Elf32_Shdr* Locate(Elf32_Word type,
                           const std::string& section_name) const {
    for (int shnum = 1; shnum < nsections_; shnum++) {
      if ((shdr_[shnum].sh_type == type) &&
          std::string(shstrtab_ + shdr_[shnum].sh_name) == section_name) {
        return &shdr_[shnum];
      }
    }
    return NULL;
  }
};


template <typename VISITOR>
void LocateSymbols(const Elf32_Ehdr* ehdr,
                   const Elf32_Shdr* symtab,
                   const Elf32_Shdr* strtab,
                   VISITOR* visitor) {
  if ((symtab != NULL) && (strtab != NULL)) {
    const Elf32_Shdr* shdr = reinterpret_cast<const Elf32_Shdr*>(
        reinterpret_cast<const char*>(ehdr) + ehdr->e_shoff);

    const char* symnames =
        reinterpret_cast<const char*>(ehdr) + strtab->sh_offset;
    VIXL_CHECK(symnames != NULL);

    int nsym = symtab->sh_size / symtab->sh_entsize;
    const Elf32_Sym* sym = reinterpret_cast<const Elf32_Sym*>(
        reinterpret_cast<const char*>(ehdr) + symtab->sh_offset);
    for (int snum = 0; snum < nsym; snum++) {
      if ((sym[snum].st_shndx > 0) && (sym[snum].st_shndx < ehdr->e_shnum) &&
          (sym[snum].st_value != 0) &&
          (shdr[sym[snum].st_shndx].sh_type == SHT_PROGBITS) &&
          ((ELF32_ST_BIND(sym[snum].st_info) == STB_LOCAL) ||
           (ELF32_ST_BIND(sym[snum].st_info) == STB_GLOBAL)) &&
          (ELF32_ST_TYPE(sym[snum].st_info) == STT_FUNC)) {
        visitor->visit(symnames + sym[snum].st_name, sym[snum]);
      }
    }
  }
}


class DynamicSymbolVisitor {
  SymbolTable* symbols_;

 public:
  explicit DynamicSymbolVisitor(SymbolTable* symbols) : symbols_(symbols) {}
  void visit(const char* symname, const Elf32_Sym& sym) {
    symbols_->insert(
        Symbol(symname, sym.st_value, 0, sym.st_size, sym.st_shndx));
  }
};


class StaticSymbolVisitor {
  const Elf32_Ehdr* ehdr_;
  const Elf32_Shdr* shdr_;
  SymbolTable* symbols_;

 public:
  StaticSymbolVisitor(const Elf32_Ehdr* ehdr, SymbolTable* symbols)
      : ehdr_(ehdr),
        shdr_(reinterpret_cast<const Elf32_Shdr*>(
            reinterpret_cast<const char*>(ehdr) + ehdr->e_shoff)),
        symbols_(symbols) {}
  void visit(const char* symname, const Elf32_Sym& sym) {
    if (ehdr_->e_type == ET_REL) {
      symbols_->insert(Symbol(symname,
                              sym.st_value,
                              shdr_[sym.st_shndx].sh_offset,
                              sym.st_size,
                              sym.st_shndx));
    } else {
      symbols_->insert(
          Symbol(symname,
                 sym.st_value,
                 shdr_[sym.st_shndx].sh_offset - shdr_[sym.st_shndx].sh_addr,
                 sym.st_size,
                 sym.st_shndx));
    }
  }
};


void usage() {
  std::cout << "usage: disasm-a32 <file>\n"
               "where <file> is an ELF ARM binaryfile, either an executable, "
               "a shared object, or an object file." << std::endl;
}


int main(int argc, char** argv) {
  const int kErrorNotARMELF32 = -1;
  const int kErrorArguments = -2;
  if (argc < 2) {
    usage();
    return kErrorArguments;
  }

  const char* filename = argv[1];
  struct stat sb;


  if (lstat(filename, &sb) == -1) {
    std::cerr << "Cannot stat this file" << filename << std::endl;
    return errno;
  }

  if (S_ISLNK(sb.st_mode)) {
    static char linkname[4096];
    filename = realpath(argv[1], linkname);
    if (lstat(linkname, &sb) == -1) {
      std::cerr << "Cannot stat this file: " << linkname << std::endl;
      return errno;
    }
  }

  int elf_in;
  if ((elf_in = open(filename, O_RDONLY)) < 0) {
    std::cerr << "Cannot open: " << argv[1];
    if (filename != argv[1]) std::cerr << " aka " << filename;
    std::cerr << std::endl;
    return errno;
  }

  char* base_addr;
  VIXL_CHECK((base_addr = reinterpret_cast<char*>(
                  mmap(0, sb.st_size, PROT_READ, MAP_PRIVATE, elf_in, 0))) !=
             0);

  const Elf32_Ehdr* ehdr = reinterpret_cast<const Elf32_Ehdr*>(base_addr);
  if ((ehdr->e_ident[0] != 0x7f) || (ehdr->e_ident[1] != 'E') ||
      (ehdr->e_ident[2] != 'L') || (ehdr->e_ident[3] != 'F') ||
      (ehdr->e_ehsize != sizeof(Elf32_Ehdr))) {
    std::cerr << "This file is not an 32-bit ELF file." << std::endl;
    munmap(base_addr, sb.st_size);
    return kErrorNotARMELF32;
  }

  if (ehdr->e_machine != EM_ARM) {
    std::cerr << "This file is not using the ARM isa." << std::endl;
    munmap(base_addr, sb.st_size);
    return kErrorNotARMELF32;
  }

  // shstrtab holds the section names as an offset in the file.
  const Elf32_Shdr* shdr =
      reinterpret_cast<const Elf32_Shdr*>(base_addr + ehdr->e_shoff);

  SectionLocator section_locator(ehdr);

  SymbolTable symbol_names;

  // Traverse the dynamic symbols defined in any text section
  DynamicSymbolVisitor dynamic_visitor(&symbol_names);
  LocateSymbols(ehdr,
                section_locator.Locate(SHT_DYNSYM, ".dynsym"),
                section_locator.Locate(SHT_STRTAB, ".dynstr"),
                &dynamic_visitor);

  // Traverse the static symbols defined in the any test section
  StaticSymbolVisitor static_visitor(ehdr, &symbol_names);
  LocateSymbols(ehdr,
                section_locator.Locate(SHT_SYMTAB, ".symtab"),
                section_locator.Locate(SHT_STRTAB, ".strtab"),
                &static_visitor);


  vixl::aarch32::PrintDisassembler dis(std::cout, 0);
  for (SymbolTable::iterator sres = symbol_names.begin();
       sres != symbol_names.end();
       sres++) {
    const Symbol& symbol = sres->second;
    uint32_t func_addr = symbol.GetAddress();
    uint32_t func_size = symbol.GetSize();
    if (func_size == 0) {
      SymbolTable::iterator next_func = sres;
      next_func++;
      if (next_func == symbol_names.end()) {
        const Elf32_Shdr& shndx = shdr[sres->second.GetSection()];
        func_size = (shndx.sh_offset + shndx.sh_size) - sres->first;
      } else {
        func_size = next_func->first - sres->first;
      }
    }

    std::cout << "--- " << symbol.GetName() << ":" << std::endl;
    if ((func_addr & 1) == 1) {
      func_addr &= ~1;
      dis.SetCodeAddress(func_addr);
      dis.DisassembleT32Buffer(reinterpret_cast<uint16_t*>(
                                   base_addr + symbol.GetMemoryAddress()),
                               func_size);
    } else {
      dis.SetCodeAddress(func_addr);
      dis.DisassembleA32Buffer(reinterpret_cast<uint32_t*>(
                                   base_addr + symbol.GetMemoryAddress()),
                               func_size);
    }
  }
  munmap(base_addr, sb.st_size);
  return 0;
}


#else

#include "globals-vixl.h"

// TODO: Implement this example for macOS.
int main(void) {
  VIXL_WARNING("This example has not been implemented for macOS.");
  return 0;
}

#endif  // __linux__