// Copyright (c) 2011 The Chromium Authors. All rights reserved. // Use of this source code is governed by a BSD-style license that can be // found in the LICENSE file. #ifndef COURGETTE_DISASSEMBLER_WIN32_X86_H_ #define COURGETTE_DISASSEMBLER_WIN32_X86_H_ #include "base/basictypes.h" #include "courgette/disassembler.h" #include "courgette/memory_allocator.h" #include "courgette/types_win_pe.h" #ifdef COURGETTE_HISTOGRAM_TARGETS #include <map> #endif namespace courgette { class AssemblyProgram; class DisassemblerWin32X86 : public Disassembler { public: explicit DisassemblerWin32X86(const void* start, size_t length); virtual ExecutableType kind() { return EXE_WIN_32_X86; } // Returns 'true' if the buffer appears to point to a Windows 32 bit // executable, 'false' otherwise. If ParseHeader() succeeds, other member // functions may be called. virtual bool ParseHeader(); virtual bool Disassemble(AssemblyProgram* target); // // Exposed for test purposes // bool has_text_section() const { return has_text_section_; } uint32 size_of_code() const { return size_of_code_; } bool is_32bit() const { return !is_PE32_plus_; } // Returns 'true' if the base relocation table can be parsed. // Output is a vector of the RVAs corresponding to locations within executable // that are listed in the base relocation table. bool ParseRelocs(std::vector<RVA> *addresses); // Returns Section containing the relative virtual address, or NULL if none. const Section* RVAToSection(RVA rva) const; static const int kNoOffset = -1; // Returns kNoOffset if there is no file offset corresponding to 'rva'. int RVAToFileOffset(RVA rva) const; // Returns same as FileOffsetToPointer(RVAToFileOffset(rva)) except that NULL // is returned if there is no file offset corresponding to 'rva'. const uint8* RVAToPointer(RVA rva) const; static std::string SectionName(const Section* section); protected: CheckBool ParseFile(AssemblyProgram* target) WARN_UNUSED_RESULT; bool ParseAbs32Relocs(); void ParseRel32RelocsFromSections(); void ParseRel32RelocsFromSection(const Section* section); CheckBool ParseNonSectionFileRegion(uint32 start_file_offset, uint32 end_file_offset, AssemblyProgram* program) WARN_UNUSED_RESULT; CheckBool ParseFileRegion(const Section* section, uint32 start_file_offset, uint32 end_file_offset, AssemblyProgram* program) WARN_UNUSED_RESULT; #if COURGETTE_HISTOGRAM_TARGETS void HistogramTargets(const char* kind, const std::map<RVA, int>& map); #endif // Most addresses are represented as 32-bit RVAs. The one address we can't // do this with is the image base address. 'image_base' is valid only for // 32-bit executables. 'image_base_64' is valid for 32- and 64-bit executable. uint32 image_base() const { return static_cast<uint32>(image_base_); } const ImageDataDirectory& base_relocation_table() const { return base_relocation_table_; } bool IsValidRVA(RVA rva) const { return rva < size_of_image_; } // Returns description of the RVA, e.g. ".text+0x1243". For debugging only. std::string DescribeRVA(RVA rva) const; // Finds the first section at file_offset or above. Does not return sections // that have no raw bytes in the file. const Section* FindNextSection(uint32 file_offset) const; // There are 2 'coordinate systems' for reasoning about executables. // FileOffset - the the offset within a single .EXE or .DLL *file*. // RVA - relative virtual address (offset within *loaded image*) // FileOffsetToRVA and RVAToFileOffset convert between these representations. RVA FileOffsetToRVA(uint32 offset) const; private: bool ReadDataDirectory(int index, ImageDataDirectory* dir); bool incomplete_disassembly_; // 'true' if can leave out 'uninteresting' bits std::vector<RVA> abs32_locations_; std::vector<RVA> rel32_locations_; // // Fields that are always valid. // // // Information that is valid after successful ParseHeader. // bool is_PE32_plus_; // PE32_plus is for 64 bit executables. // Location and size of IMAGE_OPTIONAL_HEADER in the buffer. const uint8 *optional_header_; uint16 size_of_optional_header_; uint16 offset_of_data_directories_; uint16 machine_type_; uint16 number_of_sections_; const Section *sections_; bool has_text_section_; uint32 size_of_code_; uint32 size_of_initialized_data_; uint32 size_of_uninitialized_data_; RVA base_of_code_; RVA base_of_data_; uint64 image_base_; // range limited to 32 bits for 32 bit executable uint32 size_of_image_; int number_of_data_directories_; ImageDataDirectory export_table_; ImageDataDirectory import_table_; ImageDataDirectory resource_table_; ImageDataDirectory exception_table_; ImageDataDirectory base_relocation_table_; ImageDataDirectory bound_import_table_; ImageDataDirectory import_address_table_; ImageDataDirectory delay_import_descriptor_; ImageDataDirectory clr_runtime_header_; #if COURGETTE_HISTOGRAM_TARGETS std::map<RVA, int> abs32_target_rvas_; std::map<RVA, int> rel32_target_rvas_; #endif DISALLOW_COPY_AND_ASSIGN(DisassemblerWin32X86); }; } // namespace courgette #endif // COURGETTE_DISASSEMBLER_WIN32_X86_H_