Chromium Code Reviews
chromiumcodereview-hr@appspot.gserviceaccount.com (chromiumcodereview-hr) | Please choose your nickname with Settings | Help | Chromium Project | Gerrit Changes | Sign out
(64)

Unified Diff: tools/cygprofile/symbols_extractor.py

Issue 884113002: Refactor the symbol parsing, and move to NDK's nm. (Closed) Base URL: https://chromium.googlesource.com/chromium/src.git@master
Patch Set: Typo. Created 5 years, 11 months ago
Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.
Jump to:
View side-by-side diff with in-line comments
Download patch
Index: tools/cygprofile/symbols_extractor.py
diff --git a/tools/cygprofile/symbols_extractor.py b/tools/cygprofile/symbols_extractor.py
new file mode 100755
index 0000000000000000000000000000000000000000..f87ce877cfeb3fc12cee3ffd9dbcacfedb20b894
--- /dev/null
+++ b/tools/cygprofile/symbols_extractor.py
@@ -0,0 +1,127 @@
+#!/usr/bin/python
+# Copyright 2015 The Chromium Authors. All rights reserved.
+# Use of this source code is governed by a BSD-style license that can be
+# found in the LICENSE file.
+
+"""Utilities to get and manipulate symbols from a binary."""
+
+import collections
+import os
+import subprocess
+import sys
+
+sys.path.append(os.path.join(sys.path[0], '..', '..', 'build', 'android'))
+from pylib import constants
+
+
+# TODO(lizeb): Fix this when the hardcoded assumptions (32-bit ARM, Linux
pasko 2015/01/28 14:37:01 Can this be trivially reused via ToolPath() from t
Benoit L 2015/01/28 15:20:41 Thank you for the tip ! Done.
+# x86_64) are no longer true. Even better, encapsulate the
+# architecture-dependent bits.
+_NM_BINARY = os.path.join(constants.ANDROID_NDK_ROOT, 'toolchains',
+ 'arm-linux-androideabi-4.9', 'prebuilt',
+ 'linux-x86_64', 'bin', 'arm-linux-androideabi-nm')
+
+__SymbolInfo = collections.namedtuple(
pasko 2015/01/28 14:37:01 Two blank lines between top-level definitions: htt
Benoit L 2015/01/28 15:20:41 Done.
+ '__SymbolInfo', ('name', 'offset', 'size'))
+
+class SymbolInfo(__SymbolInfo):
pasko 2015/01/28 14:37:01 Making this a class complicates reading without cl
Benoit L 2015/01/28 15:20:41 Done.
+ """Represent the information gathered from a symbol.
+ """
+ __slots__ = ()
+
+ @classmethod
+ def fromNmLine(cls, line):
+ """Create a SymbolInfo by parsing a properly formatted nm output line.
+
+ Args:
+ line: line from nm
+
+ Returns:
+ An instance of SymbolInfo if the line represents a symbol, None otherwise.
pasko 2015/01/28 14:37:01 s/represent/represents/
Benoit L 2015/01/28 15:20:41 Done.
+ """
+ # We are interested in two types of lines:
+ # This:
+ # 00210d59 00000002 t _ZN34BrowserPluginHostMsg_Attach_ParamsD2Ev
+ # offset size <symbol_type> symbol_name
+ # And that:
+ # 0070ee8c T WebRtcSpl_ComplexBitReverse
+ # In the second case we don't have a size, so use -1 as a sentinel.
+ if not any(x in line for x in (' t ', ' W ', ' T ')):
pasko 2015/01/28 14:37:02 I realize it was easy to write this line, but read
Benoit L 2015/01/28 15:20:41 Done.
+ return None
+ parts = line.split()
+ if len(parts) == 4:
+ return SymbolInfo(
+ offset=int(parts[0], 16), size=int(parts[1], 16), name=parts[3])
+ elif len(parts) == 3:
+ return SymbolInfo(
+ offset=int(parts[0], 16), size=-1, name=parts[2])
+ else:
+ return None
+
+
+def SymbolInfosFromStream(nm_lines):
+ """Parses the output of nm, and gets all the symbols from a binary.
+
+ Args:
+ nm_lines: An iterable of lines
+
+ Returns:
+ The same output as SymbolInfosFromBinary.
pasko 2015/01/28 14:37:01 did you mean SymbolInfosFromBinary? Saying that it
Benoit L 2015/01/28 15:20:41 Done.
+ """
+ # TODO(lizeb): Consider switching to objdump to simplify parsing.
+ symbol_infos = []
+ for line in nm_lines:
+ if not any(x in line for x in (' t ', ' W ', ' T ')):
pasko 2015/01/28 14:37:02 why check it again here? the checking for None
Benoit L 2015/01/28 15:20:41 Done.
+ continue
+ symbol_info = SymbolInfo.fromNmLine(line)
+ if symbol_info:
+ symbol_infos.append(symbol_info)
+ return symbol_infos
+
+
+def SymbolInfosFromBinary(binary_filename):
+ """Runs nm to get all the symbols from a binary.
+
+ Args:
+ binary_filename: path to the binary.
+
+ Returns:
+ A list of symbols from the binary.
+ """
+ command = (_NM_BINARY, '-S', '-n', binary_filename)
+ p = subprocess.Popen(command, shell=False, stdout=subprocess.PIPE)
+ try:
+ result = SymbolInfosFromStream(p.stdout)
+ return result
+ finally:
+ p.wait()
+
+
+def OffsetToSymbolInfos(symbol_infos):
pasko 2015/01/28 14:37:02 GroupSymbolInfosByOffset? GroupSymbolsByOffset? Gr
Benoit L 2015/01/28 15:20:41 Done.
+ """Create a dict {offset: [symbol_info1, ...], ...}.
+
+ As several symbols can be at the same offset, this is a 1-to-many
+ relationship.
+
+ Args:
+ symbol_infos: iterable of SymbolInfo instances
+
+ Returns:
+ a dict {offset: [symbol_info1, ...], ...}
+ """
+ offset_to_symbol_infos = collections.defaultdict(list)
+ for symbol_info in symbol_infos:
+ offset_to_symbol_infos[symbol_info.offset].append(symbol_info)
+ return dict(offset_to_symbol_infos)
+
+
+def NameToSymbolInfo(symbol_infos):
pasko 2015/01/28 14:37:01 CreateNameToSymbolInfo?
Benoit L 2015/01/28 15:20:41 Done.
+ """Create a dict {name: symbol_info, ...}.
+
+ Args:
+ symbol_infos: iterable of SymbolInfo instances
+
+ Returns:
+ a dict {name: symbol_info, ...}
+ """
+ return {symbol_info.name: symbol_info for symbol_info in symbol_infos}

Powered by Google App Engine
This is Rietveld 408576698