#!/usr/bin/env python
# Copyright 2014 The Chromium Authors. All rights reserved.
# Use of this source code is governed by a BSD-style license that can be
# found in the LICENSE file.

"""Primitive ninja parser.

Its primary use case is to be used by isolate_driver.py. It is a standalone
tool so its behavior can be verified more efficiently. It is a quirky tool
since it is designed only to gather binary dependencies.

<directory> is assumed to be relative to src/, so it will usually have the
form out/Release. Any target outside this directory is ignored.

This script is assumed to be run *after* the target was built, since it looks
for the +x bit on the files and only returns the ones that exist.
"""

import logging
import optparse
import os
import sys
import time

TOOLS_DIR = os.path.dirname(os.path.abspath(__file__))
SRC_DIR = os.path.dirname(TOOLS_DIR)


### Private stuff.


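# Hexadecimal alphabet, used by _should_process() below to recognize the
# 32 character hash suffix that identifies a phony rule.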
_HEX = frozenset('0123456789abcdef')


# Ignore any dependency with one of these extensions. In particular, we do
# not want to mark the tools that generated these files as binary
# dependencies; they are likely only used during the build process and are
# not necessary at runtime. The worst that can happen is either:
# - Mapping tools that generate a source file but are not needed at run time.
# - Slower processing.
# On the other hand, being too aggressive will hide legitimate runtime
# dependencies. In particular, .a may cause an explicit dependency on a .so.
_IGNORED_EXTENSIONS = frozenset([
    '.asm', '.c', '.cc', '.cpp', '.css', '.def', '.grd', '.gypcmd', '.h',
    '.html', '.idl', '.in', '.jinja2', '.js', '.json', '.manifest', '.mm',
    '.o', '.obj', '.pak', '.pickle', '.png', '.pdb', '.prep', '.proto',
    '.py', '.rc', '.strings', '.svg', '.tmp', '.ttf', '.txt', '.xtb', '.wav',
])


def _load_ninja_recursively(build_dir, ninja_path, build_steps):
  """Crudely extracts the subninja and build statements from ninja_path.

  In particular, it ignores rule and variable declarations. The goal is to be
  performant (well, as much as python can be performant), which is currently
  in the <200ms range for a complete chromium tree. As such the code is laid
  out for performance instead of readability.
  """
  logging.debug('Loading %s', ninja_path)
  try:
    with open(os.path.join(build_dir, ninja_path), 'rb') as f:
      line = None
      merge_line = ''
      subninja = []
      for line in f:
        line = line.rstrip()
        if not line:
          continue

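        # A trailing '$' continues the logical line onto the next physical
        # line. For example (an illustrative .ninja snippet):
        #   build foo.o: cxx $
        #       foo.cc
        # is accumulated below into 'build foo.o: cxx foo.cc'.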
        if line[-1] == '$':
          # The next line needs to be merged in.
          if merge_line:
            merge_line += ' ' + line[:-1].strip(' ')
          else:
            merge_line = line[:-1].strip(' ')
          continue

        if merge_line:
          line = merge_line + ' ' + line.strip(' ')
          merge_line = ''

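        # For an illustrative statement 'build chrome: link obj/a.o obj/b.o',
        # 'statement' is the first word ('build'), the target is 'chrome' and
        # the raw dependency string is 'link obj/a.o obj/b.o', whose first
        # token is the rule name.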
        statement = line[:line.find(' ')]
        if statement == 'build':
          # Save the dependency list as a raw string. Only the lines needed
          # will be processed within _recurse(). This saves a good 70ms of
          # processing time.
          build_target, dependencies = line[6:].split(': ', 1)
          # Interestingly, trying to be smart and only saving the build steps
          # with the intended extensions ('', '.stamp', '.so') slows down
          # parsing even if 90% of the build rules can be skipped.
          # On Windows, a single step may generate two targets, so split the
          # items accordingly. It has only been seen for .exe/.exe.pdb combos.
          for i in build_target.strip().split():
            build_steps[i] = dependencies
        elif statement == 'subninja':
          subninja.append(line[9:])
  except IOError:
    print >> sys.stderr, 'Failed to open %s' % ninja_path
    raise

  total = 1
  for rel_path in subninja:
    try:
      # Load each of the files referenced.
      # TODO(maruel): Skip the files known to not be needed. It saves an
      # awful lot of processing time.
      total += _load_ninja_recursively(build_dir, rel_path, build_steps)
    except IOError:
      print >> sys.stderr, '... as referenced by %s' % ninja_path
      raise
  return total


def _simple_blacklist(item):
  """Returns True if an item should be analyzed, i.e. it is not an empty
  token or one of ninja's '|' (implicit) and '||' (order-only) dependency
  separators.
  """
  return item not in ('', '|', '||')

def _using_blacklist(item):
  """Returns True if an item should be analyzed.

  Ignores many file types that are assumed to not depend on a dynamic
  library. If the assumption doesn't hold true anymore for a file format,
  remove it from this list. This is simply an optimization.
  """
  # ninja files use the native path format.
  ext = os.path.splitext(item)[1]
  if ext in _IGNORED_EXTENSIONS:
    return False
  # Special case Windows: keep .dll.lib but discard .lib.
  if item.endswith('.dll.lib'):
    return True
  if ext == '.lib':
    return False
  return _simple_blacklist(item)


def _should_process(build_dir, target, build_steps, rules_seen):
  """Returns the raw dependencies if the target should be processed."""
  if target in rules_seen:
    # The rule was already seen. Since rules_seen is not scoped at the target
    # visibility, it usually simply means that multiple targets depend on the
    # same dependencies. It's fine.
    return None

  raw_dependencies = build_steps.get(target, None)
  if raw_dependencies is None:
    # There is no build step defined to generate 'target'.
    parts = target.rsplit('_', 1)
    if len(parts) == 2 and len(parts[1]) == 32 and _HEX.issuperset(parts[1]):
      # It's because it is a phony rule.
      return None

    # Kind of a hack: assume source files are always outside build_dir.
    if (target.startswith('..') and
        os.path.exists(os.path.join(build_dir, target))):
      # It's because it is a source file.
      return None

    logging.debug('Failed to find a build step to generate: %s', target)
    return None
  return raw_dependencies


def _recurse(build_dir, target, build_steps, rules_seen, blacklist):
  raw_dependencies = _should_process(
      build_dir, target, build_steps, rules_seen)
  rules_seen.add(target)
  if raw_dependencies is None:
    return []

  out = [target]
  # Filter out what we don't want to speed things up. This cuts off large
  # parts of the dependency tree to analyze.
  # The first item is the build rule, e.g. 'link', 'cxx', 'phony', 'stamp',
  # etc.
  dependencies = filter(blacklist, raw_dependencies.split(' ')[1:])
  logging.debug('recurse(%s) -> %s', target, dependencies)
  for dependency in dependencies:
    out.extend(_recurse(
        build_dir, dependency, build_steps, rules_seen, blacklist))
  return out


def _find_link(build_dir, target, build_steps, rules_seen, search_for):
  raw_dependencies = _should_process(
      build_dir, target, build_steps, rules_seen)
  rules_seen.add(target)
  if raw_dependencies is None:
    return

  # Filter out what we don't want to speed things up. This cuts off large
  # parts of the dependency tree to analyze.
  # The first item is the build rule, e.g. 'link', 'cxx', 'phony', 'stamp',
  # etc.
  dependencies = filter(_simple_blacklist, raw_dependencies.split(' ')[1:])
  for dependency in dependencies:
    if dependency == search_for:
      yield [dependency]
    else:
      for out in _find_link(
          build_dir, dependency, build_steps, rules_seen, search_for):
        yield [dependency] + out


### Public API.
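# Illustrative use of this API (the paths and target are hypothetical):
#   build_steps = load_ninja('out/Release')
#   deps = recurse('out/Release', 'chrome', build_steps)
#   binary_deps = post_process_deps('out/Release', deps)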


def load_ninja(build_dir):
  """Loads build.ninja and the tree of .ninja files in build_dir.

  Returns:
    dict of target->build_step where build_step is an unprocessed str.

  TODO(maruel): This should really just be done by ninja itself, then simply
  process its output.
  """
  build_steps = {}
  total = _load_ninja_recursively(build_dir, 'build.ninja', build_steps)
  logging.info(
      'Loaded %d ninja files, %d build steps', total, len(build_steps))
  return build_steps


def recurse(build_dir, target, build_steps, blacklist=_using_blacklist):
  """Recursively returns all the interesting dependencies for the target
  specified.
  """
  return _recurse(build_dir, target, build_steps, set(), blacklist)


def find_link(build_dir, target, build_steps, search_for):
  """Finds all the links from 'target' to 'search_for'.

  Example:
    With target='foo' and search_for='baz', if foo depends on bar which
    depends on baz, it will yield only one list, ['bar', 'baz'], the path
    from 'foo' excluding 'foo' itself. If there were multiple dependency
    links in the DAG, each one would be yielded as a list.
  """
  for link in _find_link(build_dir, target, build_steps, set(), search_for):
    yield link


def post_process_deps(build_dir, dependencies):
  """Processes the dependency list with OS specific rules.

  It maps each dynamic library's import library or TOC file back to the
  actual dynamic library.

  Must be run after the build is completed.
  """
  def filter_item(i):
    if i.endswith('.so.TOC'):
      # Remove only the suffix .TOC, not the .so!
      return i[:-4]
    if i.endswith('.dylib.TOC'):
      # Remove only the suffix .TOC, not the .dylib!
      return i[:-4]
    if i.endswith('.dll.lib'):
      # Remove only the suffix .lib, not the .dll!
      return i[:-4]
    return i

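  # An illustrative run (hypothetical content): ['chrome', 'libbase.so.TOC',
  # 'obj/foo.o'] first maps to ['chrome', 'libbase.so', 'obj/foo.o'], then
  # the access check below drops the non-executable object file.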
  # Check for execute access. This gets rid of all the phony rules.
  return [
      i for i in map(filter_item, dependencies)
      if os.access(os.path.join(build_dir, i), os.X_OK)
  ]


def main():
  parser = optparse.OptionParser(
      usage='%prog [options] <directory> <target> <search_for>',
      description=sys.modules[__name__].__doc__)
  parser.add_option(
      '-v', '--verbose', action='count', default=0,
      help='Use twice for more info')
  options, args = parser.parse_args()

  levels = (logging.ERROR, logging.INFO, logging.DEBUG)
  logging.basicConfig(
      level=levels[min(len(levels) - 1, options.verbose)],
      format='%(levelname)7s %(message)s')
  if len(args) == 2:
    build_dir, target = args
    search_for = None
  elif len(args) == 3:
    build_dir, target, search_for = args
  else:
    parser.error('Please provide a directory, a target and optionally a '
                 'target to search for')

  start = time.time()
  build_dir = os.path.abspath(build_dir)
  if not os.path.isdir(build_dir):
    parser.error('build dir must exist')
  build_steps = load_ninja(build_dir)

  if search_for:
    found_one = False
    # Find how to get from target to search_for.
    for rules in find_link(build_dir, target, build_steps, search_for):
      found_one = True
      print('%s -> %s' % (target, ' -> '.join(rules)))
    if not found_one:
      print('Failed to find a link between %s and %s' % (target, search_for))
    end = time.time()
    logging.info('Processing took %.3fs', end - start)
  else:
    binary_deps = post_process_deps(
        build_dir, recurse(build_dir, target, build_steps))
    end = time.time()
    logging.info('Processing took %.3fs', end - start)
    print('Binary dependencies:%s' % ''.join('\n  ' + i for i in binary_deps))
  return 0


if __name__ == '__main__':
  sys.exit(main())