Chromium Code Reviews
chromiumcodereview-hr@appspot.gserviceaccount.com (chromiumcodereview-hr) | Please choose your nickname with Settings | Help | Chromium Project | Gerrit Changes | Sign out
(352)

Side by Side Diff: tools/binary_size/models.py

Issue 2769933002: V2 of //tools/binary_size rewrite (diffs). (Closed)
Patch Set: __add__, __sub__ Created 3 years, 9 months ago
Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.
Jump to:
View unified diff | Download patch
OLDNEW
(Empty)
1 # Copyright 2017 The Chromium Authors. All rights reserved.
agrieve 2017/03/24 16:43:52 Yikes, there's actually not much changed here. Sad
2 # Use of this source code is governed by a BSD-style license that can be
3 # found in the LICENSE file.
4
5 import collections
6 import copy
7 import re
8
9
10 SECTION_TO_SECTION_NAME = {
11 'b': '.bss',
12 'd': '.data',
13 'r': '.rodata',
14 't': '.text',
15 }
16
17
18 class SizeInfo(object):
19 __slots__ = (
20 'symbols',
21 'section_sizes',
22 )
23
24 """Root size information."""
25 def __init__(self, symbols, section_sizes):
26 self.symbols = symbols
27 self.section_sizes = section_sizes # E.g. {'.text': 0}
28
29
30 class BaseSymbol(object):
31 """Base class for Symbol and SymbolGroup."""
32 __slots__ = ()
33
34 @property
35 def section(self):
36 return self.section_name[1]
37
38 @property
39 def size_without_padding(self):
40 return self.size - self.padding
41
42 @property
43 def end_address(self):
44 return self.address + self.size_without_padding
45
46 @property
47 def virtual_size(self):
48 return -self.padding if self.IsBss() else self.size
49
50 def IsBss(self):
51 return self.section_name is '.bss'
52
53 def IsGroup(self):
54 return False
55
56 def IsGenerated(self):
57 # TODO(agrieve): Also match generated functions such as:
58 # startup._GLOBAL__sub_I_page_allocator.cc
59 return self.name.endswith(']') and not self.name.endswith('[]')
60
61 def _Key(self):
62 return (self.section_name, self.function_signature or self.name)
63
64
65 class Symbol(BaseSymbol):
66 """Represents a single symbol within a binary."""
67
68 __slots__ = (
69 'section_name',
70 'address',
71 'size',
72 'padding',
73 'name',
74 'function_signature',
75 'path',
76 )
77
78 def __init__(self, section_name, address, size_without_padding, name, path):
79 section_name = intern(section_name)
80 self.section_name = section_name
81 self.address = address
82 self.name = name or ''
83 self.function_signature = ''
84 self.path = path or ''
85 if self.IsBss():
86 self.size = 0
87 self.padding = -size_without_padding
88 else:
89 self.size = size_without_padding
90 self.padding = 0
91
92 def __repr__(self):
93 return '%s@%x(size=%d,padding=%d,name=%s,path=%s)' % (
94 self.section_name, self.address, self.size_without_padding,
95 self.padding, self.name, self.path)
96
97
98 class SymbolGroup(BaseSymbol):
99 """Represents a group of symbols using the same interface as Symbol."""
100
101 __slots__ = (
102 'symbols',
103 'filtered_symbols',
104 'name',
105 'section_name',
106 )
107
108 def __init__(self, symbols, filtered_symbols=None, name=None,
109 section_name=None):
110 self.symbols = symbols
111 self.filtered_symbols = filtered_symbols or []
112 self.name = name or ''
113 self.section_name = section_name or '.*'
114 assert self.section_name is intern(self.section_name)
115
116 def __repr__(self):
117 return 'Group(name=%s,count=%d,size=%d)' % (
118 self.name, len(self), self.size)
119
120 def __iter__(self):
121 return iter(self.symbols)
122
123 def __len__(self):
124 return len(self.symbols)
125
126 def __getitem__(self, index):
127 return self.symbols[index]
128
129 def __sub__(self, other):
130 other_ids = set(id(s) for s in other)
131 new_symbols = [s for s in self if id(s) not in other_ids]
132 return self._CreateTransformed(new_symbols, section_name=self.section_name)
133
134 def __add__(self, other):
135 self_ids = set(id(s) for s in self)
136 new_symbols = self.symbols + [s for s in other if id(s) not in self_ids]
137 return self._CreateTransformed(new_symbols, section_name=self.section_name)
138
139 @property
140 def address(self):
141 return 0
142
143 @property
144 def function_signature(self):
145 return None
146
147 @property
148 def path(self):
149 return None
150
151 @property
152 def size(self):
153 return sum(s.size for s in self)
154
155 @property
156 def padding(self):
157 return sum(s.padding for s in self)
158
159 def IsGroup(self):
160 return True
161
162 def _CreateTransformed(self, symbols, filtered_symbols=None, name=None,
163 section_name=None):
164 return SymbolGroup(symbols, filtered_symbols=filtered_symbols, name=name,
165 section_name=section_name)
166
167 def Sorted(self, cmp_func=None, key=None, reverse=False):
168 # Default to sorting by abs(size) then name.
169 if cmp_func is None and key is None:
170 cmp_func = lambda a, b: cmp((abs(b.size), a.name), (abs(a.size), b.name))
171
172 new_symbols = sorted(self.symbols, cmp_func, key, reverse)
173 return self._CreateTransformed(new_symbols,
174 filtered_symbols=self.filtered_symbols,
175 section_name=self.section_name)
176
177 def Filter(self, func):
178 filtered_and_kept = ([], [])
179 for symbol in self:
180 filtered_and_kept[int(bool(func(symbol)))].append(symbol)
181 return self._CreateTransformed(filtered_and_kept[1],
182 filtered_symbols=filtered_and_kept[0],
183 section_name=self.section_name)
184
185 def WhereBiggerThan(self, min_size):
186 return self.Filter(lambda s: s.size >= min_size)
187
188 def WhereInSection(self, section):
189 section_name = intern(SECTION_TO_SECTION_NAME.get(section, section))
190 assert section_name
191 ret = self.Filter(lambda s: s.section_name is section_name)
192 ret.section_name = section_name
193 return ret
194
195 def WhereIsGenerated(self):
196 return self.Filter(lambda s: s.IsGenerated())
197
198 def WhereNameMatches(self, pattern):
199 regex = re.compile(pattern)
200 return self.Filter(lambda s: regex.search(s.name))
201
202 def WherePathMatches(self, pattern):
203 regex = re.compile(pattern)
204 return self.Filter(lambda s: s.path and regex.search(s.path))
205
206 def WhereAddressInRange(self, start, end):
207 return self.Filter(lambda s: s.address >= start and s.address <= end)
208
209 def WhereHasAnyAttribution(self):
210 return self.Filter(lambda s: s.name or s.path)
211
212 def Inverted(self):
213 return self._CreateTransformed(self.filtered_symbols,
214 filtered_symbols=self.symbols)
215
216 def GroupBy(self, func):
217 new_syms = []
218 filtered_symbols = []
219 symbols_by_token = collections.defaultdict(list)
220 for symbol in self:
221 token = func(symbol)
222 if not token:
223 filtered_symbols.append(symbol)
224 continue
225 symbols_by_token[token].append(symbol)
226 for token, symbols in symbols_by_token.iteritems():
227 new_syms.append(self._CreateTransformed(symbols, name=token,
228 section_name=self.section_name))
229 return self._CreateTransformed(new_syms, filtered_symbols=filtered_symbols,
230 section_name=self.section_name)
231
232 def GroupByNamespace(self, depth=1):
233 def extract_namespace(symbol):
234 # Does not distinguish between classes and namespaces.
235 idx = -2
236 for _ in xrange(depth):
237 idx = symbol.name.find('::', idx + 2)
238 if idx != -1:
239 ret = symbol.name[:idx]
240 if '<' not in ret:
241 return ret
242 return '{global}'
243 return self.GroupBy(extract_namespace)
244
245 def GroupByPath(self, depth=1):
246 def extract_path(symbol):
247 idx = -1
248 for _ in xrange(depth):
249 idx = symbol.path.find('/', idx + 1)
250 if idx != -1:
251 return symbol.path[:idx]
252 return '{path unknown}'
253 return self.GroupBy(extract_path)
254
255
256 class SymbolDiff(SymbolGroup):
257 __slots__ = (
258 '_added_ids',
259 '_removed_ids',
260 )
261
262 def __init__(self, added, removed, similar):
263 self._added_ids = set(id(s) for s in added)
264 self._removed_ids = set(id(s) for s in removed)
265 symbols = []
266 symbols.extend(added)
267 symbols.extend(removed)
268 symbols.extend(similar)
269 super(SymbolDiff, self).__init__(symbols)
270
271 def __repr__(self):
272 return '%s(%d added, %d removed, %d changed, %d unchanged, size=%d)' % (
273 'SymbolGroup', self.added_count, self.removed_count, self.changed_count,
274 self.unchanged_count, self.size)
275
276 def _CreateTransformed(self, symbols, filtered_symbols=None, name=None,
277 section_name=None):
278 ret = SymbolDiff.__new__(SymbolDiff)
279 # Printing sorts, so fast-path the same symbols case.
280 if len(symbols) == len(self.symbols):
281 ret._added_ids = self._added_ids
282 ret._removed_ids = self._removed_ids
283 else:
284 ret._added_ids = set(id(s) for s in symbols if self.IsAdded(s))
285 ret._removed_ids = set(id(s) for s in symbols if self.IsRemoved(s))
286 super(SymbolDiff, ret).__init__(symbols, filtered_symbols=filtered_symbols,
287 name=name, section_name=section_name)
288
289 return ret
290
291 @property
292 def added_count(self):
293 return len(self._added_ids)
294
295 @property
296 def removed_count(self):
297 return len(self._removed_ids)
298
299 @property
300 def changed_count(self):
301 not_changed = self.unchanged_count + self.added_count + self.removed_count
302 return len(self) - not_changed
303
304 @property
305 def unchanged_count(self):
306 return sum(1 for s in self if self.IsSimilar(s) and s.size == 0)
307
308 def IsAdded(self, sym):
309 return id(sym) in self._added_ids
310
311 def IsSimilar(self, sym):
312 key = id(sym)
313 return key not in self._added_ids and key not in self._removed_ids
314
315 def IsRemoved(self, sym):
316 return id(sym) in self._removed_ids
317
318 def WhereNotUnchanged(self):
319 return self.Filter(lambda s: not self.IsSimilar(s) or s.size)
320
321
322 def Diff(new, old):
323 """Diffs two SizeInfo or SymbolGroup objects.
324
325 When diffing SizeInfos, ret.section_sizes are the result of |new| - |old|, and
326 ret.symbols will be a SymbolDiff.
327
328 When diffing SymbolGroups, a SymbolDiff is returned.
329
330 Returns:
331 Returns a SizeInfo when args are of type SizeInfo.
332 Returns a SymbolDiff when args are of type SymbolGroup.
333 """
334 if isinstance(new, SizeInfo):
335 assert isinstance(old, SizeInfo)
336 section_sizes = {
337 k:new.section_sizes[k] - v for k, v in old.section_sizes.iteritems()}
338 symbol_diff = Diff(new.symbols, old.symbols)
339 return SizeInfo(symbol_diff, section_sizes)
340
341 assert isinstance(new, SymbolGroup) and isinstance(old, SymbolGroup)
342 symbols_by_key = collections.defaultdict(list)
343 for s in old:
344 symbols_by_key[s._Key()].append(s)
345
346 added = []
347 removed = []
348 similar = []
349 # For similar symbols, padding is zeroed out. In order to not lose the
350 # information entirely, store it in aggregate.
351 padding_by_section_name = collections.defaultdict(int)
352 for new_sym in new:
353 matching_syms = symbols_by_key.get(new_sym._Key())
354 if matching_syms:
355 old_sym = matching_syms.pop(0)
356 # More stable/useful to compare size without padding.
357 size_diff = (new_sym.size_without_padding -
358 old_sym.size_without_padding)
359 merged_sym = Symbol(old_sym.section_name, old_sym.address,
360 size_diff, old_sym.name, old_sym.path)
361 merged_sym.function_signature = old_sym.function_signature
362 similar.append(merged_sym)
363 padding_by_section_name[new_sym.section_name] += (
364 new_sym.padding - old_sym.padding)
365 else:
366 added.append(new_sym)
367
368 for remaining_syms in symbols_by_key.itervalues():
369 for old_sym in remaining_syms:
370 duped = copy.copy(old_sym)
371 duped.size = -duped.size
372 duped.padding = -duped.padding
373 removed.append(duped)
374
375 for section_name, padding in padding_by_section_name.iteritems():
376 similar.append(Symbol(section_name, 0, padding,
377 '** aggregate padding of delta symbols', None))
378 return SymbolDiff(added, removed, similar)
OLDNEW

Powered by Google App Engine
This is Rietveld 408576698