/* * Copyright (c) 2010 The WebM project authors. All Rights Reserved. * * Use of this source code is governed by a BSD-style license * that can be found in the LICENSE file in the root of the source * tree. An additional intellectual property rights grant can be found * in the file PATENTS. All contributing project authors may * be found in the AUTHORS file in the root of the source tree. */ #include <stdio.h> #include <stdlib.h> #include "vpx_config.h" #if defined(_MSC_VER) #include <io.h> #include <share.h> #include "vpx/vpx_integer.h" #else #include <stdint.h> #include <unistd.h> #endif #include <string.h> #include <sys/types.h> #include <sys/stat.h> #include <fcntl.h> #include <stdarg.h> typedef enum { OUTPUT_FMT_PLAIN, OUTPUT_FMT_RVDS, OUTPUT_FMT_GAS, } output_fmt_t; int log_msg(const char *fmt, ...) { int res; va_list ap; va_start(ap, fmt); res = vfprintf(stderr, fmt, ap); va_end(ap); return res; } #if defined(__GNUC__) && __GNUC__ #if defined(__MACH__) #include <mach-o/loader.h> #include <mach-o/nlist.h> int parse_macho(uint8_t *base_buf, size_t sz) { int i, j; struct mach_header header; uint8_t *buf = base_buf; int base_data_section = 0; memcpy(&header, buf, sizeof(struct mach_header)); buf += sizeof(struct mach_header); if (header.magic != MH_MAGIC) { log_msg("Bad magic number for object file. 0x%x expected, 0x%x found.\n", header.magic, MH_MAGIC); goto bail; } if (header.cputype != CPU_TYPE_ARM) { log_msg("Bad cputype for object file. Currently only tested for CPU_TYPE_ARM.\n"); goto bail; } if (header.filetype != MH_OBJECT) { log_msg("Bad filetype for object file. Currently only tested for MH_OBJECT.\n"); goto bail; } for (i = 0; i < header.ncmds; i++) { struct load_command lc; struct symtab_command sc; struct segment_command seg_c; memcpy(&lc, buf, sizeof(struct load_command)); if (lc.cmd == LC_SEGMENT) { uint8_t *seg_buf = buf; struct section s; memcpy(&seg_c, buf, sizeof(struct segment_command)); seg_buf += sizeof(struct segment_command); for (j = 0; j < seg_c.nsects; j++) { memcpy(&s, seg_buf + (j * sizeof(struct section)), sizeof(struct section)); // Need to get this offset which is the start of the symbol table // before matching the strings up with symbols. base_data_section = s.offset; } } else if (lc.cmd == LC_SYMTAB) { uint8_t *sym_buf = base_buf; uint8_t *str_buf = base_buf; if (base_data_section != 0) { memcpy(&sc, buf, sizeof(struct symtab_command)); if (sc.cmdsize != sizeof(struct symtab_command)) log_msg("Can't find symbol table!\n"); sym_buf += sc.symoff; str_buf += sc.stroff; for (j = 0; j < sc.nsyms; j++) { struct nlist nl; int val; memcpy(&nl, sym_buf + (j * sizeof(struct nlist)), sizeof(struct nlist)); val = *((int *)(base_buf + base_data_section + nl.n_value)); // Location of string is cacluated each time from the // start of the string buffer. On darwin the symbols // are prefixed by "_". On other platforms it is not // so it needs to be removed. That is the reason for // the +1. printf("%-40s EQU %5d\n", str_buf + nl.n_un.n_strx + 1, val); } } } buf += lc.cmdsize; } return 0; bail: return 1; } int main(int argc, char **argv) { int fd; char *f; struct stat stat_buf; uint8_t *file_buf; int res; if (argc < 2 || argc > 3) { fprintf(stderr, "Usage: %s [output format] <obj file>\n\n", argv[0]); fprintf(stderr, " <obj file>\tMachO format object file to parse\n"); fprintf(stderr, "Output Formats:\n"); fprintf(stderr, " gas - compatible with GNU assembler\n"); fprintf(stderr, " rvds - compatible with armasm\n"); goto bail; } f = argv[2]; if (!((!strcmp(argv[1], "rvds")) || (!strcmp(argv[1], "gas")))) f = argv[1]; fd = open(f, O_RDONLY); if (fd < 0) { perror("Unable to open file"); goto bail; } if (fstat(fd, &stat_buf)) { perror("stat"); goto bail; } file_buf = malloc(stat_buf.st_size); if (!file_buf) { perror("malloc"); goto bail; } if (read(fd, file_buf, stat_buf.st_size) != stat_buf.st_size) { perror("read"); goto bail; } if (close(fd)) { perror("close"); goto bail; } res = parse_macho(file_buf, stat_buf.st_size); free(file_buf); if (!res) return EXIT_SUCCESS; bail: return EXIT_FAILURE; } #else #include "elf.h" #define COPY_STRUCT(dst, buf, ofst, sz) do {\ if(ofst + sizeof((*(dst))) > sz) goto bail;\ memcpy(dst, buf+ofst, sizeof((*(dst))));\ } while(0) #define ENDIAN_ASSIGN(val, memb) do {\ if(!elf->le_data) {log_msg("Big Endian data not supported yet!\n");goto bail;}\ (val) = (memb);\ } while(0) #define ENDIAN_ASSIGN_IN_PLACE(memb) do {\ ENDIAN_ASSIGN(memb, memb);\ } while(0) typedef struct { uint8_t *buf; /* Buffer containing ELF data */ size_t sz; /* Buffer size */ int le_data; /* Data is little-endian */ Elf32_Ehdr hdr; } elf_obj_t; int parse_elf32_header(elf_obj_t *elf) { int res; /* Verify ELF32 header */ COPY_STRUCT(&elf->hdr, elf->buf, 0, elf->sz); res = elf->hdr.e_ident[EI_MAG0] == ELFMAG0; res &= elf->hdr.e_ident[EI_MAG1] == ELFMAG1; res &= elf->hdr.e_ident[EI_MAG2] == ELFMAG2; res &= elf->hdr.e_ident[EI_MAG3] == ELFMAG3; res &= elf->hdr.e_ident[EI_CLASS] == ELFCLASS32; res &= elf->hdr.e_ident[EI_DATA] == ELFDATA2LSB || elf->hdr.e_ident[EI_DATA] == ELFDATA2MSB; if (!res) goto bail; elf->le_data = elf->hdr.e_ident[EI_DATA] == ELFDATA2LSB; ENDIAN_ASSIGN_IN_PLACE(elf->hdr.e_type); ENDIAN_ASSIGN_IN_PLACE(elf->hdr.e_machine); ENDIAN_ASSIGN_IN_PLACE(elf->hdr.e_version); ENDIAN_ASSIGN_IN_PLACE(elf->hdr.e_entry); ENDIAN_ASSIGN_IN_PLACE(elf->hdr.e_phoff); ENDIAN_ASSIGN_IN_PLACE(elf->hdr.e_shoff); ENDIAN_ASSIGN_IN_PLACE(elf->hdr.e_flags); ENDIAN_ASSIGN_IN_PLACE(elf->hdr.e_ehsize); ENDIAN_ASSIGN_IN_PLACE(elf->hdr.e_phentsize); ENDIAN_ASSIGN_IN_PLACE(elf->hdr.e_phnum); ENDIAN_ASSIGN_IN_PLACE(elf->hdr.e_shentsize); ENDIAN_ASSIGN_IN_PLACE(elf->hdr.e_shnum); ENDIAN_ASSIGN_IN_PLACE(elf->hdr.e_shstrndx); return 0; bail: return 1; } int parse_elf32_section(elf_obj_t *elf, int idx, Elf32_Shdr *hdr) { if (idx >= elf->hdr.e_shnum) goto bail; COPY_STRUCT(hdr, elf->buf, elf->hdr.e_shoff + idx * elf->hdr.e_shentsize, elf->sz); ENDIAN_ASSIGN_IN_PLACE(hdr->sh_name); ENDIAN_ASSIGN_IN_PLACE(hdr->sh_type); ENDIAN_ASSIGN_IN_PLACE(hdr->sh_flags); ENDIAN_ASSIGN_IN_PLACE(hdr->sh_addr); ENDIAN_ASSIGN_IN_PLACE(hdr->sh_offset); ENDIAN_ASSIGN_IN_PLACE(hdr->sh_size); ENDIAN_ASSIGN_IN_PLACE(hdr->sh_link); ENDIAN_ASSIGN_IN_PLACE(hdr->sh_info); ENDIAN_ASSIGN_IN_PLACE(hdr->sh_addralign); ENDIAN_ASSIGN_IN_PLACE(hdr->sh_entsize); return 0; bail: return 1; } char *parse_elf32_string_table(elf_obj_t *elf, int s_idx, int idx) { Elf32_Shdr shdr; if (parse_elf32_section(elf, s_idx, &shdr)) { log_msg("Failed to parse ELF string table: section %d, index %d\n", s_idx, idx); return ""; } return (char *)(elf->buf + shdr.sh_offset + idx); } int parse_elf32_symbol(elf_obj_t *elf, unsigned int ofst, Elf32_Sym *sym) { COPY_STRUCT(sym, elf->buf, ofst, elf->sz); ENDIAN_ASSIGN_IN_PLACE(sym->st_name); ENDIAN_ASSIGN_IN_PLACE(sym->st_value); ENDIAN_ASSIGN_IN_PLACE(sym->st_size); ENDIAN_ASSIGN_IN_PLACE(sym->st_info); ENDIAN_ASSIGN_IN_PLACE(sym->st_other); ENDIAN_ASSIGN_IN_PLACE(sym->st_shndx); return 0; bail: return 1; } int parse_elf32(uint8_t *buf, size_t sz, output_fmt_t mode) { elf_obj_t elf; Elf32_Shdr shdr; unsigned int ofst; int i; Elf32_Off strtab_off; /* save String Table offset for later use */ memset(&elf, 0, sizeof(elf)); elf.buf = buf; elf.sz = sz; /* Parse Header */ if (parse_elf32_header(&elf)) { log_msg("Parse error: File does not appear to be valid ELF32\n"); return 1; } for (i = 0; i < elf.hdr.e_shnum; i++) { parse_elf32_section(&elf, i, &shdr); if (shdr.sh_type == SHT_STRTAB) { char strtsb_name[128]; strcpy(strtsb_name, (char *)(elf.buf + shdr.sh_offset + shdr.sh_name)); if (!(strcmp(strtsb_name, ".shstrtab"))) { log_msg("found section: %s\n", strtsb_name); strtab_off = shdr.sh_offset; break; } } } /* Parse all Symbol Tables */ for (i = 0; i < elf.hdr.e_shnum; i++) { parse_elf32_section(&elf, i, &shdr); if (shdr.sh_type == SHT_SYMTAB) { for (ofst = shdr.sh_offset; ofst < shdr.sh_offset + shdr.sh_size; ofst += shdr.sh_entsize) { Elf32_Sym sym; parse_elf32_symbol(&elf, ofst, &sym); /* For all OBJECTS (data objects), extract the value from the * proper data segment. */ if (ELF32_ST_TYPE(sym.st_info) == STT_OBJECT && sym.st_name) log_msg("found data object %s\n", parse_elf32_string_table(&elf, shdr.sh_link, sym.st_name)); if (ELF32_ST_TYPE(sym.st_info) == STT_OBJECT && sym.st_size == 4) { Elf32_Shdr dhdr; int32_t val; char section_name[128]; parse_elf32_section(&elf, sym.st_shndx, &dhdr); /* For explanition - refer to _MSC_VER version of code */ strcpy(section_name, (char *)(elf.buf + strtab_off + dhdr.sh_name)); log_msg("Section_name: %s, Section_type: %d\n", section_name, dhdr.sh_type); if (!(strcmp(section_name, ".bss"))) { val = 0; } else { memcpy(&val, elf.buf + dhdr.sh_offset + sym.st_value, sizeof(val)); } if (!elf.le_data) { log_msg("Big Endian data not supported yet!\n"); goto bail; }\ switch (mode) { case OUTPUT_FMT_RVDS: printf("%-40s EQU %5d\n", parse_elf32_string_table(&elf, shdr.sh_link, sym.st_name), val); break; case OUTPUT_FMT_GAS: printf(".equ %-40s, %5d\n", parse_elf32_string_table(&elf, shdr.sh_link, sym.st_name), val); break; default: printf("%s = %d\n", parse_elf32_string_table(&elf, shdr.sh_link, sym.st_name), val); } } } } } if (mode == OUTPUT_FMT_RVDS) printf(" END\n"); return 0; bail: log_msg("Parse error: File does not appear to be valid ELF32\n"); return 1; } int main(int argc, char **argv) { int fd; output_fmt_t mode; char *f; struct stat stat_buf; uint8_t *file_buf; int res; if (argc < 2 || argc > 3) { fprintf(stderr, "Usage: %s [output format] <obj file>\n\n", argv[0]); fprintf(stderr, " <obj file>\tELF format object file to parse\n"); fprintf(stderr, "Output Formats:\n"); fprintf(stderr, " gas - compatible with GNU assembler\n"); fprintf(stderr, " rvds - compatible with armasm\n"); goto bail; } f = argv[2]; if (!strcmp(argv[1], "rvds")) mode = OUTPUT_FMT_RVDS; else if (!strcmp(argv[1], "gas")) mode = OUTPUT_FMT_GAS; else f = argv[1]; fd = open(f, O_RDONLY); if (fd < 0) { perror("Unable to open file"); goto bail; } if (fstat(fd, &stat_buf)) { perror("stat"); goto bail; } file_buf = malloc(stat_buf.st_size); if (!file_buf) { perror("malloc"); goto bail; } if (read(fd, file_buf, stat_buf.st_size) != stat_buf.st_size) { perror("read"); goto bail; } if (close(fd)) { perror("close"); goto bail; } res = parse_elf32(file_buf, stat_buf.st_size, mode); //res = parse_coff(file_buf, stat_buf.st_size); free(file_buf); if (!res) return EXIT_SUCCESS; bail: return EXIT_FAILURE; } #endif #endif #if defined(_MSC_VER) /* See "Microsoft Portable Executable and Common Object File Format Specification" for reference. */ #define get_le32(x) ((*(x)) | (*(x+1)) << 8 |(*(x+2)) << 16 | (*(x+3)) << 24 ) #define get_le16(x) ((*(x)) | (*(x+1)) << 8) int parse_coff(unsigned __int8 *buf, size_t sz) { unsigned int nsections, symtab_ptr, symtab_sz, strtab_ptr; unsigned int sectionrawdata_ptr; unsigned int i; unsigned __int8 *ptr; unsigned __int32 symoffset; FILE *fp; char **sectionlist; //this array holds all section names in their correct order. //it is used to check if the symbol is in .bss or .data section. nsections = get_le16(buf + 2); symtab_ptr = get_le32(buf + 8); symtab_sz = get_le32(buf + 12); strtab_ptr = symtab_ptr + symtab_sz * 18; if (nsections > 96) goto bail; sectionlist = malloc(nsections * sizeof * sectionlist); //log_msg("COFF: Found %u symbols in %u sections.\n", symtab_sz, nsections); /* The size of optional header is always zero for an obj file. So, the section header follows the file header immediately. */ ptr = buf + 20; //section header for (i = 0; i < nsections; i++) { char sectionname[9] = {0, 0, 0, 0, 0, 0, 0, 0, 0}; strncpy(sectionname, ptr, 8); //log_msg("COFF: Parsing section %s\n",sectionname); sectionlist[i] = malloc(strlen(sectionname) + 1); strcpy(sectionlist[i], sectionname); if (!strcmp(sectionname, ".data")) sectionrawdata_ptr = get_le32(ptr + 20); ptr += 40; } //log_msg("COFF: Symbol table at offset %u\n", symtab_ptr); //log_msg("COFF: raw data pointer ofset for section .data is %u\n", sectionrawdata_ptr); fp = fopen("vpx_asm_offsets.asm", "w"); if (fp == NULL) { perror("open file"); goto bail; } /* The compiler puts the data with non-zero offset in .data section, but puts the data with zero offset in .bss section. So, if the data in in .bss section, set offset=0. Note from Wiki: In an object module compiled from C, the bss section contains the local variables (but not functions) that were declared with the static keyword, except for those with non-zero initial values. (In C, static variables are initialized to zero by default.) It also contains the non-local (both extern and static) variables that are also initialized to zero (either explicitly or by default). */ //move to symbol table /* COFF symbol table: offset field 0 Name(*) 8 Value 12 SectionNumber 14 Type 16 StorageClass 17 NumberOfAuxSymbols */ ptr = buf + symtab_ptr; for (i = 0; i < symtab_sz; i++) { __int16 section = get_le16(ptr + 12); //section number if (section > 0 && ptr[16] == 2) { //if(section > 0 && ptr[16] == 3 && get_le32(ptr+8)) { if (get_le32(ptr)) { char name[9] = {0, 0, 0, 0, 0, 0, 0, 0, 0}; strncpy(name, ptr, 8); //log_msg("COFF: Parsing symbol %s\n",name); fprintf(fp, "%-40s EQU ", name); } else { //log_msg("COFF: Parsing symbol %s\n", // buf + strtab_ptr + get_le32(ptr+4)); fprintf(fp, "%-40s EQU ", buf + strtab_ptr + get_le32(ptr + 4)); } if (!(strcmp(sectionlist[section-1], ".bss"))) { symoffset = 0; } else { symoffset = get_le32(buf + sectionrawdata_ptr + get_le32(ptr + 8)); } //log_msg(" Section: %d\n",section); //log_msg(" Class: %d\n",ptr[16]); //log_msg(" Address: %u\n",get_le32(ptr+8)); //log_msg(" Offset: %u\n", symoffset); fprintf(fp, "%5d\n", symoffset); } ptr += 18; } fprintf(fp, " END\n"); fclose(fp); for (i = 0; i < nsections; i++) { free(sectionlist[i]); } free(sectionlist); return 0; bail: for (i = 0; i < nsections; i++) { free(sectionlist[i]); } free(sectionlist); return 1; } int main(int argc, char **argv) { int fd; output_fmt_t mode; const char *f; struct _stat stat_buf; unsigned __int8 *file_buf; int res; if (argc < 2 || argc > 3) { fprintf(stderr, "Usage: %s [output format] <obj file>\n\n", argv[0]); fprintf(stderr, " <obj file>\tELF format object file to parse\n"); fprintf(stderr, "Output Formats:\n"); fprintf(stderr, " gas - compatible with GNU assembler\n"); fprintf(stderr, " rvds - compatible with armasm\n"); goto bail; } f = argv[2]; if (!strcmp(argv[1], "rvds")) mode = OUTPUT_FMT_RVDS; else if (!strcmp(argv[1], "gas")) mode = OUTPUT_FMT_GAS; else f = argv[1]; if (_sopen_s(&fd, f, _O_BINARY, _SH_DENYNO, _S_IREAD | _S_IWRITE)) { perror("Unable to open file"); goto bail; } if (_fstat(fd, &stat_buf)) { perror("stat"); goto bail; } file_buf = malloc(stat_buf.st_size); if (!file_buf) { perror("malloc"); goto bail; } if (_read(fd, file_buf, stat_buf.st_size) != stat_buf.st_size) { perror("read"); goto bail; } if (_close(fd)) { perror("close"); goto bail; } res = parse_coff(file_buf, stat_buf.st_size); free(file_buf); if (!res) return EXIT_SUCCESS; bail: return EXIT_FAILURE; } #endif