tools/cygprofile/symbol_extractor.py - Issue 886563002: Switch from nm to objdump for the cygprofile tools.

Unified Diff: tools/cygprofile/symbol_extractor.py

Issue 886563002: Switch from nm to objdump for the cygprofile tools. (Closed) Base URL: https://chromium.googlesource.com/chromium/src.git@master

Patch Set: Address comments. Created 5 years, 11 months ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

View side-by-side diff with in-line comments

Download patch

« no previous file with comments | « tools/cygprofile/patch_orderfile_unittest.py ('k') | tools/cygprofile/symbol_extractor_unittest.py » ('j') | tools/cygprofile/symbol_extractor_unittest.py » ('J')
Expand Comments ('e') | Collapse Comments ('c') | Hide Comments ('s')

Index: tools/cygprofile/symbol_extractor.py

diff --git a/tools/cygprofile/symbol_extractor.py b/tools/cygprofile/symbol_extractor.py

new file mode 100755

index 0000000000000000000000000000000000000000..8996e1df3167aa31646599f60a09a6fa50099135

--- /dev/null

+++ b/tools/cygprofile/symbol_extractor.py

@@ -0,0 +1,113 @@

+#!/usr/bin/python

+# Use of this source code is governed by a BSD-style license that can be

+# found in the LICENSE file.

+"""Utilities to get and manipulate symbols from a binary."""

+import collections

+import os

+import re

+import subprocess

+import sys

+sys.path.insert(

+ 0, os.path.join(sys.path[0], '..', '..', 'third_party', 'android_platform',

pasko 2015/01/29 12:24:42 why not sys.path.append()? let's also not make an

Benoit L 2015/01/29 13:10:30 Because python's standard library also has a modul

+ 'development', 'scripts'))

+import symbol

# TODO(lizeb): Change symbol.ARCH to the proper value when "arm" is no longer
# the only possible value.
# Location of the objdump executable, as returned by symbol.ToolPath(). It is
# resolved once, when this module is imported.
# NOTE(review): presumably this is the objdump of the toolchain selected by
# symbol.ARCH -- confirm against the android_platform `symbol` module.
_OBJDUMP_BINARY = symbol.ToolPath('objdump')

# Immutable record describing one symbol parsed from an objdump output line:
#   name:    the symbol name (last field of the line).
#   offset:  int, parsed from the first field, which is hexadecimal.
#   size:    int, parsed from the hexadecimal size field.
#   section: the section field of the line, e.g. '.text.foo'.
SymbolInfo = collections.namedtuple(
    'SymbolInfo', ['name', 'offset', 'size', 'section'])

def _FromObjdumpLine(line):
  """Builds a SymbolInfo from a single line of objdump output.

  The lines of interest describe function symbols and look like
      0000000000 g F .text.foo 000000000 [.hidden] foo
  where the g (global) flag may also be l (local) or w (weak), and the
  ".hidden" token is optional.

  Args:
    line: One line of objdump output.

  Returns:
    A SymbolInfo when the line describes a function symbol, None otherwise.
  """
  fields = line.split()
  # A function symbol line has at least six whitespace-separated fields, with
  # the type flag 'F' in third position. Anything else is not a symbol we
  # care about.
  if not (len(fields) >= 6 and fields[2] == 'F'):
    return None
  # The numeric columns are hexadecimal.
  symbol_offset = int(fields[0], 16)
  symbol_size = int(fields[4], 16)
  # split() has already discarded all whitespace, including the trailing
  # newline, so the last field is the bare symbol name.
  symbol_name = fields[-1]
  return SymbolInfo(name=symbol_name, offset=symbol_offset,
                    size=symbol_size, section=fields[3])

def _SymbolInfosFromStream(objdump_lines):
  """Collects the SymbolInfo of every symbol line found in objdump output.

  Args:
    objdump_lines: An iterable of objdump output lines.

  Returns:
    A list of SymbolInfo, in the order the lines were read. Lines for which
    _FromObjdumpLine() returns None are skipped.
  """
  # Parse lazily so that the input is consumed line by line, exactly once.
  parsed_lines = (_FromObjdumpLine(line) for line in objdump_lines)
  return [info for info in parsed_lines if info is not None]

def SymbolInfosFromBinary(binary_filename):
  """Runs objdump to get all the symbols from a binary.

  Args:
    binary_filename: path to the binary.

  Returns:
    A list of SymbolInfo from the binary.
  """
  command = (_OBJDUMP_BINARY, '-t', '-w', binary_filename)
  # universal_newlines=True makes the pipe yield text lines. Without it,
  # Python 3 yields bytes, the string comparisons in the parser never match,
  # and the result is silently empty. The flag is also valid on Python 2.7.
  p = subprocess.Popen(command, shell=False, stdout=subprocess.PIPE,
                       universal_newlines=True)
  try:
    return _SymbolInfosFromStream(p.stdout)
  finally:
    # Close our end of the pipe before waiting. If parsing raised part-way
    # through the output, objdump may be blocked writing to a full pipe, and
    # wait() would then never return. Closing also releases the descriptor.
    p.stdout.close()
    p.wait()

def GroupSymbolInfosByOffset(symbol_infos):
  """Buckets symbols by their offset.

  Several symbols may live at the same offset, so each offset maps to the
  list of all symbols found there, in input order.

  Args:
    symbol_infos: iterable of SymbolInfo instances

  Returns:
    a plain dict {offset: [symbol_info1, ...], ...}
  """
  grouped = {}
  for info in symbol_infos:
    # setdefault() creates the bucket the first time an offset is seen.
    grouped.setdefault(info.offset, []).append(info)
  return grouped

# Code review thread attached to this function (the comment text is truncated
# on the review page):
#   pasko 2015/01/29 12:24:42: this function is only used in a test, is it
#     going ...
#   Benoit L 2015/01/29 13:10:30: Yes, it is going to be used. But I would
#     prefer to ...
#   pasko 2015/01/29 13:25:30: since it confuses reviewers, that's usually
#     worth ...
def CreateNameToSymbolInfo(symbol_infos):
  """Indexes symbols by name.

  If several symbols share a name, the last one in iteration order is kept.

  Args:
    symbol_infos: iterable of SymbolInfo instances

  Returns:
    a dict {name: symbol_info, ...}
  """
  name_to_info = {}
  for info in symbol_infos:
    name_to_info[info.name] = info
  return name_to_info