tools/deep_memory_profiler/dmprof - Issue 9812010: Breakdown nonprofiled memory regions (f.k.a. 'unknown'), and add new policy files.

Unified Diff: tools/deep_memory_profiler/dmprof

Issue 9812010: Breakdown nonprofiled memory regions (f.k.a. 'unknown'), and add new policy files. (Closed) Base URL: svn://svn.chromium.org/chrome/trunk/src

Patch Set: ready for review Created 8 years, 8 months ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

View side-by-side diff with in-line comments

Download patch

Index: tools/deep_memory_profiler/dmprof

diff --git a/tools/deep_memory_profiler/dmprof.py b/tools/deep_memory_profiler/dmprof

similarity index 86%

rename from tools/deep_memory_profiler/dmprof.py

rename to tools/deep_memory_profiler/dmprof

index e9c642c80d168cb82a2b455cabe0aa0efb16ccf0..1a4cd20933856d730b8a9138c95a959197b9e0ac 100755

--- a/tools/deep_memory_profiler/dmprof.py

+++ b/tools/deep_memory_profiler/dmprof

@@ -45,6 +45,11 @@ DUMP_DEEP_2 = 'DUMP_DEEP_2'

# They should be processed by POLICY_DEEP_2.

DUMP_DEEP_3 = 'DUMP_DEEP_3'

+# DUMP_DEEP_4 adds some features to DUMP_DEEP_3:

+# 1. Support comments starting with '#'

+# 2. Support additional global stats: e.g. nonprofiled-*.

+DUMP_DEEP_4 = 'DUMP_DEEP_4'

Alexander Potapenko 2012/04/12 12:51:33 I think it's time to stop adding DUMP_DEEP_X const

Dai Mikurube (NOT FULLTIME) 2012/04/13 05:41:10 I was planning to add other versions than 'DUMP_DE

# Heap Profile Policy versions

# POLICY_DEEP_1 DOES NOT include allocation_type columns.

@@ -109,8 +114,11 @@ class Log(object):

"""A class representing one dumped log data."""

def __init__(self, log_path, buckets):

self.log_path = log_path

+ self.log_lines = []

M-A Ruel 2012/04/12 12:40:36 Here's an example how to rewrite it in a functiona

Dai Mikurube (NOT FULLTIME) 2012/04/13 05:41:10 Finally, replaced it with: self.log_lines = [l for

with open(self.log_path, mode='r') as log_f:

- self.log_lines = log_f.readlines()

+ for log_line in log_f:

+ if log_line[0] != '#':

Alexander Potapenko 2012/04/12 12:51:33 I think "not log_line.startswith('#')" is more rea

Dai Mikurube (NOT FULLTIME) 2012/04/13 05:41:10 Exactly. I used startswith as above.

+ self.log_lines.append(log_line)

self.log_version = ''

sys.stderr.write('parsing a log file:%s\n' % log_path)

self.mmap_stacktrace_lines = []

@@ -303,7 +311,7 @@ class Log(object):

lambda n: self.check_stacktrace_line(log_lines[n], buckets))

return (log_lines[stacktrace_lines_start:ln], ln)

- def parse_stacktraces(self, buckets):

+ def parse_stacktraces(self, buckets, ln):

"""Parses lines in self.log_lines as stacktrace.

Valid stacktrace lines are stored into self.mmap_stacktrace_lines and

@@ -312,36 +320,10 @@ class Log(object):

Args:

buckets: A dict mapping bucket ids and their corresponding Bucket

objects.

- Returns:

- A string representing a version of the stacktrace dump. '' for invalid

- dump.

+ ln: An integer representing the starting line number in log_lines.

Alexander Potapenko 2012/04/12 12:51:33 Please don't select short cryptic names for the fu

Dai Mikurube (NOT FULLTIME) 2012/04/13 05:41:10 Done.

"""

- version = ''

- # Skip until an identifiable line.

- headers = ('STACKTRACES:\n', 'MMAP_STACKTRACES:\n', 'heap profile: ')

- ln = self.skip_lines_while(

- 0, len(self.log_lines),

- lambda n: not self.log_lines[n].startswith(headers))

- # Identify a version.

- if self.log_lines[ln].startswith('heap profile: '):

- version = self.log_lines[ln][13:].strip()

- if version == DUMP_DEEP_2 or version == DUMP_DEEP_3:

- ln = self.skip_lines_while(

- ln, len(self.log_lines),

- lambda n: self.log_lines[n] != 'MMAP_STACKTRACES:\n')

- else:

- sys.stderr.write(' invalid heap profile dump version:%s\n' % version)

- return ''

- elif self.log_lines[ln] == 'STACKTRACES:\n':

- version = DUMP_DEEP_1

- elif self.log_lines[ln] == 'MMAP_STACKTRACES:\n':

- version = DUMP_DEEP_2

- if version == DUMP_DEEP_3:

- sys.stderr.write(' heap profile dump version: %s\n' % version)

+ if self.log_version == DUMP_DEEP_3 or self.log_version == DUMP_DEEP_4:

Alexander Potapenko 2012/04/12 12:51:33 self.log_version in [DUMP_DEEP_3, DUMP_DEEP_4]

Dai Mikurube (NOT FULLTIME) 2012/04/13 05:41:10 Done.

+ sys.stderr.write(' heap profile dump version: %s\n' % self.log_version)

Alexander Potapenko 2012/04/12 12:51:33 Please move this line to the top of the method, as

Dai Mikurube (NOT FULLTIME) 2012/04/13 05:41:10 Done.

(self.mmap_stacktrace_lines, ln) = self.parse_stacktraces_while_valid(

buckets, self.log_lines, ln)

ln = self.skip_lines_while(

@@ -349,10 +331,9 @@ class Log(object):

lambda n: self.log_lines[n] != 'MALLOC_STACKTRACES:\n')

(self.malloc_stacktrace_lines, ln) = self.parse_stacktraces_while_valid(

buckets, self.log_lines, ln)

- return version

- elif version == DUMP_DEEP_2:

- sys.stderr.write(' heap profile dump version: %s\n' % version)

+ elif self.log_version == DUMP_DEEP_2:

+ sys.stderr.write(' heap profile dump version: %s\n' % self.log_version)

(self.mmap_stacktrace_lines, ln) = self.parse_stacktraces_while_valid(

buckets, self.log_lines, ln)

ln = self.skip_lines_while(

@@ -362,17 +343,15 @@ class Log(object):

buckets, self.log_lines, ln)

self.malloc_stacktrace_lines.extend(self.mmap_stacktrace_lines)

self.mmap_stacktrace_lines = []

- return version

- elif version == DUMP_DEEP_1:

- sys.stderr.write(' heap profile dump version: %s\n' % version)

+ elif self.log_version == DUMP_DEEP_1:

+ sys.stderr.write(' heap profile dump version: %s\n' % self.log_version)

(self.malloc_stacktrace_lines, ln) = self.parse_stacktraces_while_valid(

buckets, self.log_lines, ln)

- return version

else:

- sys.stderr.write(' invalid heap profile dump version:%s\n' % version)

- return ''

+ sys.stderr.write(' invalid heap profile dump version:%s\n' % (

+ self.log_version))

def parse_global_stats(self):

"""Parses lines in self.log_lines as global stats."""

@@ -380,7 +359,18 @@ class Log(object):

0, len(self.log_lines),

lambda n: self.log_lines[n] != 'GLOBAL_STATS:\n')

- for prefix in ['total', 'file', 'anonymous', 'other', 'mmap', 'tcmalloc']:

+ if self.log_version == DUMP_DEEP_4:

+ global_stat_names = [

+ 'total', 'file-exec', 'file-nonexec', 'anonymous', 'stack', 'other',

+ 'nonprofiled-absent', 'nonprofiled-anonymous',

+ 'nonprofiled-file-exec', 'nonprofiled-file-nonexec',

+ 'nonprofiled-stack', 'nonprofiled-other',

+ 'profiled-mmap', 'profiled-malloc']

+ else:

+ global_stat_names = [

+ 'total', 'file', 'anonymous', 'other', 'mmap', 'tcmalloc']

+ for prefix in global_stat_names:

ln = self.skip_lines_while(

ln, len(self.log_lines),

lambda n: self.log_lines[n].split()[0] != prefix)

@@ -388,9 +378,44 @@ class Log(object):

self.counters[prefix + '_virtual'] = int(words[-2])

self.counters[prefix + '_committed'] = int(words[-1])

+ def parse_version(self):

+ """Parses a version string in self.log_lines.

+ Returns:

+ A string representing a version of the stacktrace dump. '' for invalid

Alexander Potapenko 2012/04/12 12:51:33 Looks like you're returning two values here.

Dai Mikurube (NOT FULLTIME) 2012/04/13 05:41:10 Modified as follows : Returns: A pair of (a strin

+ dump.

+ """

+ version = ''

+ # Skip until an identifiable line.

+ headers = ('STACKTRACES:\n', 'MMAP_STACKTRACES:\n', 'heap profile: ')

+ ln = self.skip_lines_while(

+ 0, len(self.log_lines),

+ lambda n: not self.log_lines[n].startswith(headers))

+ # Identify a version.

+ if self.log_lines[ln].startswith('heap profile: '):

Alexander Potapenko 2012/04/12 12:51:33 I guess too much machinery is involved in getting

Dai Mikurube (NOT FULLTIME) 2012/04/13 05:41:10 The first versions didn't include version strings.

+ version = self.log_lines[ln][13:].strip()

+ if (version == DUMP_DEEP_2 or version == DUMP_DEEP_3 or

+ version == DUMP_DEEP_4):

+ ln = self.skip_lines_while(

+ ln, len(self.log_lines),

+ lambda n: self.log_lines[n] != 'MMAP_STACKTRACES:\n')

+ else:

+ sys.stderr.write(' invalid heap profile dump version:%s\n' % version)

Alexander Potapenko 2012/04/12 12:51:33 Maybe just raise an exception here? You won't need

Dai Mikurube (NOT FULLTIME) 2012/04/13 05:41:10 Sounds reasonable. Just raised an exception.

+ return ''

+ elif self.log_lines[ln] == 'STACKTRACES:\n':

+ version = DUMP_DEEP_1

+ elif self.log_lines[ln] == 'MMAP_STACKTRACES:\n':

+ version = DUMP_DEEP_2

Alexander Potapenko 2012/04/12 12:51:33 spare newline

Dai Mikurube (NOT FULLTIME) 2012/04/13 05:41:10 Hmm, this newline is helpful for readability for m

+ return (version, ln)

def parse_log(self, buckets):

+ self.log_version, ln = self.parse_version()

self.parse_global_stats()

- self.log_version = self.parse_stacktraces(buckets)

+ self.parse_stacktraces(buckets, ln)

@staticmethod

def accumulate_size_for_policy(stacktrace_lines,

@@ -434,32 +459,59 @@ class Log(object):

self.accumulate_size_for_policy(self.malloc_stacktrace_lines,

policy_list, buckets, sizes, False)

- sizes['mmap-no-log'] = self.counters['mmap_committed'] - sizes[

+ if self.log_version == DUMP_DEEP_4:

+ mmap_prefix = 'profiled-mmap'

+ malloc_prefix = 'profiled-malloc'

+ else:

+ mmap_prefix = 'mmap'

+ malloc_prefix = 'tcmalloc'

+ sizes['mmap-no-log'] = self.counters[

M-A Ruel 2012/04/12 12:40:36 I think this would be much more readable: sizes['m

Dai Mikurube (NOT FULLTIME) 2012/04/13 05:41:10 Agreed. I think it's more readable. Actaually, I

+ '%s_committed' % mmap_prefix] - sizes[

'mmap-total-log']

- sizes['mmap-total-record'] = self.counters['mmap_committed']

- sizes['mmap-total-record-vm'] = self.counters['mmap_virtual']

+ sizes['mmap-total-record'] = self.counters['%s_committed' % mmap_prefix]

+ sizes['mmap-total-record-vm'] = self.counters['%s_virtual' % mmap_prefix]

- sizes['tc-no-log'] = self.counters['tcmalloc_committed'] - sizes[

+ sizes['tc-no-log'] = self.counters[

+ '%s_committed' % malloc_prefix] - sizes[

'tc-total-log']

- sizes['tc-total-record'] = self.counters['tcmalloc_committed']

- sizes['tc-unused'] = sizes['mmap-tcmalloc'] - self.counters[

- 'tcmalloc_committed']

+ sizes['tc-total-record'] = self.counters['%s_committed' % malloc_prefix]

+ sizes['tc-unused'] = sizes[

+ 'mmap-tcmalloc'] - self.counters[

+ '%s_committed' % malloc_prefix]

sizes['tc-total'] = sizes['mmap-tcmalloc']

- for key, value in { 'total': 'total_committed',

- 'filemapped': 'file_committed',

- 'anonymous': 'anonymous_committed',

- 'other': 'other_committed',

- 'total-vm': 'total_virtual',

- 'filemapped-vm': 'file_virtual',

- 'anonymous-vm': 'anonymous_virtual',

- 'other-vm': 'other_virtual' }.items():

+ for key, value in {

Alexander Potapenko 2012/04/12 12:51:33 This can be generated automatically: map(lambda

Dai Mikurube (NOT FULLTIME) 2012/04/13 05:41:10 Just some of them doesn't have corresponding names

+ 'total': 'total_committed',

+ 'filemapped': 'file_committed',

+ 'file-exec': 'file-exec_committed',

+ 'file-nonexec': 'file-nonexec_committed',

+ 'anonymous': 'anonymous_committed',

+ 'stack': 'stack_committed',

+ 'other': 'other_committed',

+ 'nonprofiled-absent': 'nonprofiled-absent_committed',

+ 'nonprofiled-anonymous': 'nonprofiled-anonymous_committed',

+ 'nonprofiled-file-exec': 'nonprofiled-file-exec_committed',

+ 'nonprofiled-file-nonexec': 'nonprofiled-file-nonexec_committed',

+ 'nonprofiled-stack': 'nonprofiled-stack_committed',

+ 'nonprofiled-other': 'nonprofiled-other_committed',

+ 'total-vm': 'total_virtual',

+ 'filemapped-vm': 'file_virtual',

+ 'anonymous-vm': 'anonymous_virtual',

+ 'other-vm': 'other_virtual' }.items():

M-A Ruel 2012/04/12 12:40:36 Use iteritems() instead of items() Otherwise, you

Dai Mikurube (NOT FULLTIME) 2012/04/13 05:41:10 Done.

if key in sizes:

sizes[key] = self.counters[value]

- if 'unknown' in sizes:

- sizes['unknown'] = self.counters['total_committed'] - self.counters[

- 'mmap_committed']

+ if 'mustbezero' in sizes:

+ sizes['mustbezero'] = self.counters[

M-A Ruel 2012/04/12 12:40:36 Use this format instead: sizes['mustbezero'] = (

Dai Mikurube (NOT FULLTIME) 2012/04/13 05:41:10 Chose a loop. Thanks!

+ 'total_committed'] - self.counters[

+ '%s_committed' % mmap_prefix] - self.counters[

+ 'nonprofiled-absent_committed'] - self.counters[

+ 'nonprofiled-anonymous_committed'] - self.counters[

+ 'nonprofiled-file-exec_committed'] - self.counters[

+ 'nonprofiled-file-nonexec_committed'] - self.counters[

+ 'nonprofiled-stack_committed'] - self.counters[

+ 'nonprofiled-other_committed']

if 'total-exclude-profiler' in sizes:

sizes['total-exclude-profiler'] = self.counters[

'total_committed'] - sizes['mmap-profiler']

@@ -481,7 +533,7 @@ class Log(object):

component_match = get_component(policy_list, bucket, mmap)

if component_match == component_name:

stacktrace_sequence = ''

- for address in bucket.stacktrace[1 : min(len(bucket.stacktrace),

+ for address in bucket.stacktrace[0 : min(len(bucket.stacktrace),

1 + depth)]:

stacktrace_sequence += address_symbol_dict[address] + ' '

if not stacktrace_sequence in sizes:

« third_party/tcmalloc/chromium/src/deep-heap-profile.cc ('K') | « tools/deep_memory_profiler/dmpolicy ('k') | tools/deep_memory_profiler/dmprof.py » ('j') | no next file with comments »