#!/usr/bin/env python # Copyright (c) 2011 The Chromium Authors. All rights reserved. # Use of this source code is governed by a BSD-style license that can be # found in the LICENSE file. # Usage: strip_save_dsym <whatever-arguments-you-would-pass-to-strip> # # strip_save_dsym is a wrapper around the standard strip utility. Given an # input Mach-O file, strip_save_dsym will save a copy of the file in a "fake" # .dSYM bundle for debugging, and then call strip to strip the Mach-O file. # Note that the .dSYM file is a "fake" in that it's not a self-contained # .dSYM bundle, it just contains a copy of the original (unstripped) Mach-O # file, and therefore contains references to object files on the filesystem. # The generated .dSYM bundle is therefore unsuitable for debugging in the # absence of these .o files. # # If a .dSYM already exists and has a newer timestamp than the Mach-O file, # this utility does nothing. That allows strip_save_dsym to be run on a file # that has already been stripped without trashing the .dSYM. # # Rationale: the "right" way to generate dSYM bundles, dsymutil, is incredibly # slow. On the other hand, doing a file copy (which is really all that # dsymutil does) is comparatively fast. Since we usually just want to strip # a release-mode executable but still be able to debug it, and we don't care # so much about generating a hermetic dSYM bundle, we'll prefer the file copy. # If a real dSYM is ever needed, it's still possible to create one by running # dsymutil and pointing it at the original Mach-O file inside the "fake" # bundle, provided that the object files are available. import errno import os import re import shutil import subprocess import sys import time # Returns a list of architectures contained in a Mach-O file. The file can be # a universal (fat) file, in which case there will be one list element for # each contained architecture, or it can be a thin single-architecture Mach-O # file, in which case the list will contain a single element identifying the # architecture. On error, returns an empty list. Determines the architecture # list by calling file. def macho_archs(macho): macho_types = ["executable", "dynamically linked shared library", "bundle"] macho_types_re = "Mach-O (?:64-bit )?(?:" + "|".join(macho_types) + ")" file_cmd = subprocess.Popen(["/usr/bin/file", "-b", "--", macho], stdout=subprocess.PIPE) archs = [] type_line = file_cmd.stdout.readline() type_match = re.match("^%s (.*)$" % macho_types_re, type_line) if type_match: archs.append(type_match.group(1)) return [type_match.group(1)] else: type_match = re.match("^Mach-O universal binary with (.*) architectures$", type_line) if type_match: for i in range(0, int(type_match.group(1))): arch_line = file_cmd.stdout.readline() arch_match = re.match( "^.* \(for architecture (.*)\):\t%s .*$" % macho_types_re, arch_line) if arch_match: archs.append(arch_match.group(1)) if file_cmd.wait() != 0: archs = [] if len(archs) == 0: print >> sys.stderr, "No architectures in %s" % macho return archs # Returns a dictionary mapping architectures contained in the file as returned # by macho_archs to the LC_UUID load command for that architecture. # Architectures with no LC_UUID load command are omitted from the dictionary. # Determines the UUID value by calling otool. def macho_uuids(macho): uuids = {} archs = macho_archs(macho) if len(archs) == 0: return uuids for arch in archs: if arch == "": continue otool_cmd = subprocess.Popen(["/usr/bin/otool", "-arch", arch, "-l", "-", macho], stdout=subprocess.PIPE) # state 0 is when nothing UUID-related has been seen yet. State 1 is # entered after a load command begins, but it may not be an LC_UUID load # command. States 2, 3, and 4 are intermediate states while reading an # LC_UUID command. State 5 is the terminal state for a successful LC_UUID # read. State 6 is the error state. state = 0 uuid = "" for otool_line in otool_cmd.stdout: if state == 0: if re.match("^Load command .*$", otool_line): state = 1 elif state == 1: if re.match("^ cmd LC_UUID$", otool_line): state = 2 else: state = 0 elif state == 2: if re.match("^ cmdsize 24$", otool_line): state = 3 else: state = 6 elif state == 3: # The UUID display format changed in the version of otool shipping # with the Xcode 3.2.2 prerelease. The new format is traditional: # uuid 4D7135B2-9C56-C5F5-5F49-A994258E0955 # and with Xcode 3.2.6, then line is indented one more space: # uuid 4D7135B2-9C56-C5F5-5F49-A994258E0955 # The old format, from cctools-750 and older's otool, breaks the UUID # up into a sequence of bytes: # uuid 0x4d 0x71 0x35 0xb2 0x9c 0x56 0xc5 0xf5 # 0x5f 0x49 0xa9 0x94 0x25 0x8e 0x09 0x55 new_uuid_match = re.match("^ {3,4}uuid (.{8}-.{4}-.{4}-.{4}-.{12})$", otool_line) if new_uuid_match: uuid = new_uuid_match.group(1) # Skip state 4, there is no second line to read. state = 5 else: old_uuid_match = re.match("^ uuid 0x(..) 0x(..) 0x(..) 0x(..) " "0x(..) 0x(..) 0x(..) 0x(..)$", otool_line) if old_uuid_match: state = 4 uuid = old_uuid_match.group(1) + old_uuid_match.group(2) + \ old_uuid_match.group(3) + old_uuid_match.group(4) + "-" + \ old_uuid_match.group(5) + old_uuid_match.group(6) + "-" + \ old_uuid_match.group(7) + old_uuid_match.group(8) + "-" else: state = 6 elif state == 4: old_uuid_match = re.match("^ 0x(..) 0x(..) 0x(..) 0x(..) " "0x(..) 0x(..) 0x(..) 0x(..)$", otool_line) if old_uuid_match: state = 5 uuid += old_uuid_match.group(1) + old_uuid_match.group(2) + "-" + \ old_uuid_match.group(3) + old_uuid_match.group(4) + \ old_uuid_match.group(5) + old_uuid_match.group(6) + \ old_uuid_match.group(7) + old_uuid_match.group(8) else: state = 6 if otool_cmd.wait() != 0: state = 6 if state == 5: uuids[arch] = uuid.upper() if len(uuids) == 0: print >> sys.stderr, "No UUIDs in %s" % macho return uuids # Given a path to a Mach-O file and possible information from the environment, # determines the desired path to the .dSYM. def dsym_path(macho): # If building a bundle, the .dSYM should be placed next to the bundle. Use # WRAPPER_NAME to make this determination. If called from xcodebuild, # WRAPPER_NAME will be set to the name of the bundle. dsym = "" if "WRAPPER_NAME" in os.environ: if "BUILT_PRODUCTS_DIR" in os.environ: dsym = os.path.join(os.environ["BUILT_PRODUCTS_DIR"], os.environ["WRAPPER_NAME"]) else: dsym = os.environ["WRAPPER_NAME"] else: dsym = macho dsym += ".dSYM" return dsym # Creates a fake .dSYM bundle at dsym for macho, a Mach-O image with the # architectures and UUIDs specified by the uuids map. def make_fake_dsym(macho, dsym): uuids = macho_uuids(macho) if len(uuids) == 0: return False dwarf_dir = os.path.join(dsym, "Contents", "Resources", "DWARF") dwarf_file = os.path.join(dwarf_dir, os.path.basename(macho)) try: os.makedirs(dwarf_dir) except OSError, (err, error_string): if err != errno.EEXIST: raise shutil.copyfile(macho, dwarf_file) # info_template is the same as what dsymutil would have written, with the # addition of the fake_dsym key. info_template = \ '''<?xml version="1.0" encoding="UTF-8"?> <!DOCTYPE plist PUBLIC "-//Apple Computer//DTD PLIST 1.0//EN" "http://www.apple.com/DTDs/PropertyList-1.0.dtd"> <plist version="1.0"> <dict> <key>CFBundleDevelopmentRegion</key> <string>English</string> <key>CFBundleIdentifier</key> <string>com.apple.xcode.dsym.%(root_name)s</string> <key>CFBundleInfoDictionaryVersion</key> <string>6.0</string> <key>CFBundlePackageType</key> <string>dSYM</string> <key>CFBundleSignature</key> <string>????</string> <key>CFBundleShortVersionString</key> <string>1.0</string> <key>CFBundleVersion</key> <string>1</string> <key>dSYM_UUID</key> <dict> %(uuid_dict)s </dict> <key>fake_dsym</key> <true/> </dict> </plist> ''' root_name = os.path.basename(dsym)[:-5] # whatever.dSYM without .dSYM uuid_dict = "" for arch in sorted(uuids): uuid_dict += "\t\t\t<key>" + arch + "</key>\n"\ "\t\t\t<string>" + uuids[arch] + "</string>\n" info_dict = { "root_name": root_name, "uuid_dict": uuid_dict, } info_contents = info_template % info_dict info_file = os.path.join(dsym, "Contents", "Info.plist") info_fd = open(info_file, "w") info_fd.write(info_contents) info_fd.close() return True # For a Mach-O file, determines where the .dSYM bundle should be located. If # the bundle does not exist or has a modification time older than the Mach-O # file, calls make_fake_dsym to create a fake .dSYM bundle there, then strips # the Mach-O file and sets the modification time on the .dSYM bundle and Mach-O # file to be identical. def strip_and_make_fake_dsym(macho): dsym = dsym_path(macho) macho_stat = os.stat(macho) dsym_stat = None try: dsym_stat = os.stat(dsym) except OSError, (err, error_string): if err != errno.ENOENT: raise if dsym_stat is None or dsym_stat.st_mtime < macho_stat.st_mtime: # Make a .dSYM bundle if not make_fake_dsym(macho, dsym): return False # Strip the Mach-O file remove_dsym = True try: strip_cmdline = ['xcrun', 'strip'] + sys.argv[1:] strip_cmd = subprocess.Popen(strip_cmdline) if strip_cmd.wait() == 0: remove_dsym = False finally: if remove_dsym: shutil.rmtree(dsym) # Update modification time on the Mach-O file and .dSYM bundle now = time.time() os.utime(macho, (now, now)) os.utime(dsym, (now, now)) return True def main(argv=None): if argv is None: argv = sys.argv # This only supports operating on one file at a time. Look at the arguments # to strip to figure out what the source to be stripped is. Arguments are # processed in the same way that strip does, although to reduce complexity, # this doesn't do all of the same checking as strip. For example, strip # has no -Z switch and would treat -Z on the command line as an error. For # the purposes this is needed for, that's fine. macho = None process_switches = True ignore_argument = False for arg in argv[1:]: if ignore_argument: ignore_argument = False continue if process_switches: if arg == "-": process_switches = False # strip has these switches accept an argument: if arg in ["-s", "-R", "-d", "-o", "-arch"]: ignore_argument = True if arg[0] == "-": continue if macho is None: macho = arg else: print >> sys.stderr, "Too many things to strip" return 1 if macho is None: print >> sys.stderr, "Nothing to strip" return 1 if not strip_and_make_fake_dsym(macho): return 1 return 0 if __name__ == "__main__": sys.exit(main(sys.argv))