OLD | NEW |
1 #!/usr/bin/python | 1 #!/usr/bin/python |
2 # Copyright (c) 2012 The Native Client Authors. All rights reserved. | 2 # Copyright (c) 2012 The Native Client Authors. All rights reserved. |
3 # Use of this source code is governed by a BSD-style license that can be | 3 # Use of this source code is governed by a BSD-style license that can be |
4 # found in the LICENSE file. | 4 # found in the LICENSE file. |
5 # | 5 # |
6 # IMPORTANT NOTE: If you make local mods to this file, you must run: | 6 # IMPORTANT NOTE: If you make local mods to this file, you must run: |
7 # % pnacl/build.sh driver | 7 # % pnacl/build.sh driver |
8 # in order for them to take effect in the scons build. This command | 8 # in order for them to take effect in the scons build. This command |
9 # updates the copy in the toolchain/ tree. | 9 # updates the copy in the toolchain/ tree. |
10 # | 10 # |
(...skipping 106 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
117 ('-arm-reserve-r9 -sfi-disable-cp ' + | 117 ('-arm-reserve-r9 -sfi-disable-cp ' + |
118 '-sfi-load -sfi-store -sfi-stack -sfi-branch -sfi-data ' + | 118 '-sfi-load -sfi-store -sfi-stack -sfi-branch -sfi-data ' + |
119 '-no-inline-jumptables -float-abi=hard'), | 119 '-no-inline-jumptables -float-abi=hard'), |
120 | 120 |
121 'LLC_FLAGS_X8632' : '', | 121 'LLC_FLAGS_X8632' : '', |
122 'LLC_FLAGS_X8664' : '', | 122 'LLC_FLAGS_X8664' : '', |
123 | 123 |
124 'LLC_FLAGS_MIPS32': '-sfi-load -sfi-store -sfi-stack -sfi-branch -sfi-data', | 124 'LLC_FLAGS_MIPS32': '-sfi-load -sfi-store -sfi-stack -sfi-branch -sfi-data', |
125 | 125 |
126 # LLC flags which set the target and output type. | 126 # LLC flags which set the target and output type. |
127 # These are handled separately by libLTO. | 127 'LLC_FLAGS_TARGET' : '-mtriple=${TRIPLE} -filetype=${filetype}', |
128 'LLC_FLAGS_TARGET' : '-mcpu=${LLC_MCPU} ' + | 128 |
129 '-mtriple=${TRIPLE} ' + | |
130 '-filetype=${filetype}', | |
131 # Append additional non-default flags here. | 129 # Append additional non-default flags here. |
132 'LLC_FLAGS_EXTRA' : '${#OPT_LEVEL ? -O${OPT_LEVEL}} ' + | 130 'LLC_FLAGS_EXTRA' : '${FAST_TRANSLATION ? ${LLC_FLAGS_FAST}} ' + |
| 131 '${#OPT_LEVEL ? -O${OPT_LEVEL}} ' + |
133 '${OPT_LEVEL == 0 ? -disable-fp-elim}', | 132 '${OPT_LEVEL == 0 ? -disable-fp-elim}', |
134 | 133 |
135 # Opt level from command line (if any) | 134 # Opt level from command line (if any) |
136 'OPT_LEVEL' : '', | 135 'OPT_LEVEL' : '', |
137 | 136 |
138 # slower translation == faster code | |
139 'LLC_FLAGS_SLOW': | |
140 # Due to a quadratic algorithm used for tail merging | |
141 # capping it at 50 helps speed up translation | |
142 '-tail-merge-threshold=50', | |
143 | |
144 # faster translation == slower code | 137 # faster translation == slower code |
145 'LLC_FLAGS_FAST' : '${LLC_FLAGS_FAST_%ARCH%}', | 138 'LLC_FLAGS_FAST' : '${LLC_FLAGS_FAST_%ARCH%}', |
146 | 139 |
147 'LLC_FLAGS_FAST_X8632': | 140 'LLC_FLAGS_FAST_X8632': '-O0 ' + |
148 '-O0 ' + | 141 # This, surprisingly, makes a measurable difference |
149 # This, surprisingly, makes a measurable difference | |
150 '-tail-merge-threshold=20', | 142 '-tail-merge-threshold=20', |
151 'LLC_FLAGS_FAST_X8664': | 143 'LLC_FLAGS_FAST_X8664': '-O0 ' + |
152 '-O0 ' + | |
153 '-tail-merge-threshold=20', | 144 '-tail-merge-threshold=20', |
154 'LLC_FLAGS_FAST_ARM': | 145 'LLC_FLAGS_FAST_ARM': '-O0 ' + |
155 # due to slow turn around times ARM settings have not been explored in depth | |
156 '-O0 ' + | |
157 '-tail-merge-threshold=20', | 146 '-tail-merge-threshold=20', |
158 'LLC_FLAGS_FAST_MIPS32': '-fast-isel -tail-merge-threshold=20', | 147 'LLC_FLAGS_FAST_MIPS32': '-fast-isel -tail-merge-threshold=20', |
159 | 148 |
160 'LLC_FLAGS': '${LLC_FLAGS_TARGET} ' + | 149 'LLC_FLAGS': '${LLC_FLAGS_TARGET} ${LLC_FLAGS_COMMON} ${LLC_FLAGS_%ARCH%} ' + |
161 '${LLC_FLAGS_COMMON} ' + | |
162 '${LLC_FLAGS_%ARCH%} ' + | |
163 '${FAST_TRANSLATION ? ${LLC_FLAGS_FAST} : ${LLC_FLAGS_SLOW}} ' + | |
164 '${LLC_FLAGS_EXTRA}', | 150 '${LLC_FLAGS_EXTRA}', |
165 | 151 |
166 # CPU that is representative of baseline feature requirements for NaCl | 152 # CPU that is representative of baseline feature requirements for NaCl |
167 # and/or chrome. We may want to make this more like "-mtune" | 153 # and/or chrome. We may want to make this more like "-mtune" |
168 # by specifying both "-mcpu=X" and "-mattr=+feat1,-feat2,...". | 154 # by specifying both "-mcpu=X" and "-mattr=+feat1,-feat2,...". |
169 # Note: this may be different from the in-browser translator, which may | 155 # Note: this may be different from the in-browser translator, which may |
170 # do auto feature detection based on CPUID, but constrained by what is | 156 # do auto feature detection based on CPUID, but constrained by what is |
171 # accepted by NaCl validators. | 157 # accepted by NaCl validators. |
172 'LLC_MCPU' : '${LLC_MCPU_%ARCH%}', | 158 'LLC_MCPU' : '-mcpu=${LLC_MCPU_%ARCH%}', |
173 'LLC_MCPU_ARM' : 'cortex-a8', | 159 'LLC_MCPU_ARM' : 'cortex-a8', |
174 'LLC_MCPU_X8632' : 'pentium4', | 160 'LLC_MCPU_X8632' : 'pentium4', |
175 'LLC_MCPU_X8664' : 'core2', | 161 'LLC_MCPU_X8664' : 'core2', |
176 'LLC_MCPU_MIPS32' : 'mips32r2', | 162 'LLC_MCPU_MIPS32' : 'mips32r2', |
177 | 163 |
178 # Note: this is only used in the unsandboxed case | 164 # Note: this is only used in the unsandboxed case |
179 'RUN_LLC' : '${LLVM_LLC} ${LLC_FLAGS} ${input} -o ${output} ' + | 165 'RUN_LLC' : '${LLVM_LLC} ${LLC_FLAGS} ${LLC_MCPU} ' |
| 166 '${input} -o ${output} ' + |
180 '-metadata-text ${output}.meta', | 167 '-metadata-text ${output}.meta', |
181 # Rate in bits/sec to stream the bitcode from sel_universal over SRPC | 168 # Rate in bits/sec to stream the bitcode from sel_universal over SRPC |
182 # for testing. Defaults to 1Gbps (effectively unlimited). | 169 # for testing. Defaults to 1Gbps (effectively unlimited). |
183 'BITCODE_STREAM_RATE' : '1000000000', | 170 'BITCODE_STREAM_RATE' : '1000000000', |
184 } | 171 } |
185 | 172 |
186 TranslatorPatterns = [ | 173 TranslatorPatterns = [ |
187 ( '-o(.+)', "env.set('OUTPUT', pathtools.normalize($0))"), | 174 ( '-o(.+)', "env.set('OUTPUT', pathtools.normalize($0))"), |
188 ( ('-o', '(.+)'), "env.set('OUTPUT', pathtools.normalize($0))"), | 175 ( ('-o', '(.+)'), "env.set('OUTPUT', pathtools.normalize($0))"), |
189 | 176 |
190 ( '-S', "env.set('OUTPUT_TYPE', 's')"), # Stop at .s | 177 ( '-S', "env.set('OUTPUT_TYPE', 's')"), # Stop at .s |
191 ( '-c', "env.set('OUTPUT_TYPE', 'o')"), # Stop at .o | 178 ( '-c', "env.set('OUTPUT_TYPE', 'o')"), # Stop at .o |
192 | 179 |
193 # Expose a very limited set of llc flags. | 180 # Expose a very limited set of llc flags. |
194 ( '(-sfi-.+)', "env.append('LLC_FLAGS_EXTRA', $0)"), | 181 ( '(-sfi-.+)', "env.append('LLC_FLAGS_EXTRA', $0)"), |
195 ( '(-mtls-use-call)', "env.append('LLC_FLAGS_EXTRA', $0)"), | 182 ( '(-mtls-use-call)', "env.append('LLC_FLAGS_EXTRA', $0)"), |
196 # These flags are usually used for linktime dead code/data | 183 # These flags are usually used for linktime dead code/data |
197 # removal but also help with reloc overflows on ARM | 184 # removal but also help with reloc overflows on ARM |
198 ( '(-fdata-sections)', "env.append('LLC_FLAGS_EXTRA', $0)"), | 185 ( '(-fdata-sections)', "env.append('LLC_FLAGS_EXTRA', $0)"), |
199 ( '(-ffunction-sections)', "env.append('LLC_FLAGS_EXTRA', $0)"), | 186 ( '(-ffunction-sections)', "env.append('LLC_FLAGS_EXTRA', $0)"), |
200 ( '(--gc-sections)', "env.append('LD_FLAGS', $0)"), | 187 ( '(--gc-sections)', "env.append('LD_FLAGS', $0)"), |
201 ( '(-mattr=.*)', "env.append('LLC_FLAGS_EXTRA', $0)"), | 188 ( '(-mattr=.*)', "env.append('LLC_FLAGS_EXTRA', $0)"), |
202 ( '-mcpu=(.*)', "env.set('LLC_MCPU', $0)"), | 189 ( '(-mcpu=.*)', "env.set('LLC_MCPU', '')\n" |
| 190 "env.append('LLC_FLAGS_EXTRA', $0)"), |
203 # Allow overriding the -O level. | 191 # Allow overriding the -O level. |
204 ( '-O([0-3])', "env.set('OPT_LEVEL', $0)"), | 192 ( '-O([0-3])', "env.set('OPT_LEVEL', $0)"), |
205 | 193 |
206 # This adds arch specific flags to the llc invocation aimed at | 194 # This adds arch specific flags to the llc invocation aimed at |
207 # improving translation speed at the expense of code quality. | 195 # improving translation speed at the expense of code quality. |
208 ( '-translate-fast', "env.set('FAST_TRANSLATION', '1')"), | 196 ( '-translate-fast', "env.set('FAST_TRANSLATION', '1')"), |
209 | 197 |
210 # If translating a .pexe which was linked statically against | 198 # If translating a .pexe which was linked statically against |
211 # glibc, then you must do pnacl-translate -static. This will | 199 # glibc, then you must do pnacl-translate -static. This will |
212 # be removed once GLibC is actually statically linked. | 200 # be removed once GLibC is actually statically linked. |
(...skipping 245 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
458 | 446 |
459 def ToggleDefaultCommandlineLD(inputs, infile): | 447 def ToggleDefaultCommandlineLD(inputs, infile): |
460 if env.getbool('USE_DEFAULT_CMD_LINE'): | 448 if env.getbool('USE_DEFAULT_CMD_LINE'): |
461 reason, non_standard = RequiresNonStandardLDCommandline(inputs, infile) | 449 reason, non_standard = RequiresNonStandardLDCommandline(inputs, infile) |
462 if non_standard: | 450 if non_standard: |
463 Log.Info(reason + ' -- not using default SRPC commandline for LD!') | 451 Log.Info(reason + ' -- not using default SRPC commandline for LD!') |
464 inputs.append('--pnacl-driver-set-USE_DEFAULT_CMD_LINE=0') | 452 inputs.append('--pnacl-driver-set-USE_DEFAULT_CMD_LINE=0') |
465 | 453 |
466 | 454 |
467 def RequiresNonStandardLLCCommandline(): | 455 def RequiresNonStandardLLCCommandline(): |
468 if env.getbool('FAST_TRANSLATION'): | |
469 return ('FAST_TRANSLATION', True) | |
470 | |
471 extra_flags = env.get('LLC_FLAGS_EXTRA') | 456 extra_flags = env.get('LLC_FLAGS_EXTRA') |
472 if extra_flags != []: | 457 if extra_flags != []: |
473 reason = 'Has additional llc flags: %s' % extra_flags | 458 reason = 'Has additional llc flags: %s' % extra_flags |
474 return (reason, True) | 459 return (reason, True) |
475 | 460 |
476 return (None, False) | 461 return (None, False) |
477 | 462 |
478 | 463 |
479 def UseDefaultCommandlineLLC(): | 464 def UseDefaultCommandlineLLC(): |
480 if not env.getbool('USE_DEFAULT_CMD_LINE'): | 465 if not env.getbool('USE_DEFAULT_CMD_LINE'): |
(...skipping 35 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
516 # As a side effect, this creates a temporary file | 501 # As a side effect, this creates a temporary file |
517 if not env.getbool('SAVE_TEMPS'): | 502 if not env.getbool('SAVE_TEMPS'): |
518 TempFiles.add(outfile + '.meta') | 503 TempFiles.add(outfile + '.meta') |
519 env.pop() | 504 env.pop() |
520 return 0 | 505 return 0 |
521 | 506 |
522 def RunLLCSandboxed(): | 507 def RunLLCSandboxed(): |
523 driver_tools.CheckTranslatorPrerequisites() | 508 driver_tools.CheckTranslatorPrerequisites() |
524 infile = env.getone('input') | 509 infile = env.getone('input') |
525 outfile = env.getone('output') | 510 outfile = env.getone('output') |
526 flags = env.get('LLC_FLAGS') | |
527 if not driver_tools.IsBitcode(infile): | 511 if not driver_tools.IsBitcode(infile): |
528 Log.Fatal('Input to sandboxed translator must be bitcode') | 512 Log.Fatal('Input to sandboxed translator must be bitcode') |
529 script = MakeSelUniversalScriptForLLC(infile, outfile, flags) | 513 script = MakeSelUniversalScriptForLLC(infile, outfile) |
530 command = ('${SEL_UNIVERSAL_PREFIX} ${SEL_UNIVERSAL} ${SEL_UNIVERSAL_FLAGS} ' | 514 command = ('${SEL_UNIVERSAL_PREFIX} ${SEL_UNIVERSAL} ${SEL_UNIVERSAL_FLAGS} ' |
531 '-- ${LLC_SB}') | 515 '-- ${LLC_SB}') |
532 _, stdout, _ = driver_tools.Run(command, | 516 _, stdout, _ = driver_tools.Run(command, |
533 stdin_contents=script, | 517 stdin_contents=script, |
534 # stdout/stderr will be automatically dumped | 518 # stdout/stderr will be automatically dumped |
535 # upon failure | 519 # upon failure |
536 redirect_stderr=subprocess.PIPE, | 520 redirect_stderr=subprocess.PIPE, |
537 redirect_stdout=subprocess.PIPE) | 521 redirect_stdout=subprocess.PIPE) |
538 # Get the values returned from the llc RPC to use in input to ld | 522 # Get the values returned from the llc RPC to use in input to ld |
539 is_shared = re.search(r'output\s+0:\s+i\(([0|1])\)', stdout).group(1) | 523 is_shared = re.search(r'output\s+0:\s+i\(([0|1])\)', stdout).group(1) |
540 is_shared = (is_shared == '1') | 524 is_shared = (is_shared == '1') |
541 soname = re.search(r'output\s+1:\s+s\("(.*)"\)', stdout).group(1) | 525 soname = re.search(r'output\s+1:\s+s\("(.*)"\)', stdout).group(1) |
542 needed_str = re.search(r'output\s+2:\s+s\("(.*)"\)', stdout).group(1) | 526 needed_str = re.search(r'output\s+2:\s+s\("(.*)"\)', stdout).group(1) |
543 # If the delimiter changes, this line needs to change | 527 # If the delimiter changes, this line needs to change |
544 needed_libs = [ lib for lib in needed_str.split(r'\n') if lib] | 528 needed_libs = [ lib for lib in needed_str.split(r'\n') if lib] |
545 return is_shared, soname, needed_libs | 529 return is_shared, soname, needed_libs |
546 | 530 |
547 def BuildLLCCommandLine(flags): | 531 def BuildOverrideLLCCommandLine(): |
| 532 extra_flags = env.get('LLC_FLAGS_EXTRA') |
| 533 # The mcpu is not part of the default flags, so append that too. |
| 534 mcpu = env.getone('LLC_MCPU') |
| 535 if mcpu: |
| 536 extra_flags.append(mcpu) |
548 # command_line is a NUL (\x00) terminated sequence. | 537 # command_line is a NUL (\x00) terminated sequence. |
549 kTerminator = '\0' | 538 kTerminator = '\0' |
550 command_line = kTerminator.join(['llc'] + flags) + kTerminator | 539 command_line = kTerminator.join(extra_flags) + kTerminator |
551 command_line_escaped = command_line.replace(kTerminator, '\\x00') | 540 command_line_escaped = command_line.replace(kTerminator, '\\x00') |
552 return len(command_line), command_line_escaped | 541 return len(command_line), command_line_escaped |
553 | 542 |
554 def MakeSelUniversalScriptForLLC(infile, outfile, flags): | 543 def MakeSelUniversalScriptForLLC(infile, outfile): |
555 script = [] | 544 script = [] |
556 script.append('readwrite_file objfile %s' % outfile) | 545 script.append('readwrite_file objfile %s' % outfile) |
557 stream_rate = int(env.getraw('BITCODE_STREAM_RATE')) | 546 stream_rate = int(env.getraw('BITCODE_STREAM_RATE')) |
558 assert stream_rate != 0 | 547 assert stream_rate != 0 |
559 if UseDefaultCommandlineLLC(): | 548 if UseDefaultCommandlineLLC(): |
560 script.append('rpc StreamInit h(objfile) * s()') | 549 script.append('rpc StreamInit h(objfile) * s()') |
561 else: | 550 else: |
562 cmdline_len, cmdline_escaped = BuildLLCCommandLine(flags) | 551 cmdline_len, cmdline_escaped = BuildOverrideLLCCommandLine() |
563 script.append('rpc StreamInitWithCommandLine h(objfile) C(%d,%s) * s()' % | 552 script.append('rpc StreamInitWithOverrides h(objfile) C(%d,%s) * s()' % |
564 (cmdline_len, cmdline_escaped)) | 553 (cmdline_len, cmdline_escaped)) |
565 # specify filename, chunk size and rate in bits/s | 554 # specify filename, chunk size and rate in bits/s |
566 script.append('stream_file %s %s %s' % (infile, 64 * 1024, stream_rate)) | 555 script.append('stream_file %s %s %s' % (infile, 64 * 1024, stream_rate)) |
567 script.append('rpc StreamEnd * i() s() s() s()') | 556 script.append('rpc StreamEnd * i() s() s() s()') |
568 script.append('echo "llc complete"') | 557 script.append('echo "llc complete"') |
569 script.append('') | 558 script.append('') |
570 return '\n'.join(script) | 559 return '\n'.join(script) |
571 | 560 |
572 def get_help(argv): | 561 def get_help(argv): |
573 return """ | 562 return """ |
(...skipping 16 matching lines...) Expand all Loading... |
590 | 579 |
591 ADVANCED OPTIONS: | 580 ADVANCED OPTIONS: |
592 -mattr=<+feat1,-feat2> Toggle specific cpu features on and off. | 581 -mattr=<+feat1,-feat2> Toggle specific cpu features on and off. |
593 -mcpu=<cpu-name> Target a specific cpu type. Tunes code as well as | 582 -mcpu=<cpu-name> Target a specific cpu type. Tunes code as well as |
594 turns cpu features on and off. | 583 turns cpu features on and off. |
595 -S Generate native assembly only. | 584 -S Generate native assembly only. |
596 -c Generate native object file only. | 585 -c Generate native object file only. |
597 --pnacl-sb Use the translator which runs inside the NaCl sandbox. | 586 --pnacl-sb Use the translator which runs inside the NaCl sandbox. |
598 -O[0-3] Change translation-time optimization level. | 587 -O[0-3] Change translation-time optimization level. |
599 """ | 588 """ |
OLD | NEW |