OLD | NEW |
(Empty) | |
| 1 #!/usr/bin/python |
| 2 # Copyright (c) 2012 The Chromium Authors. All rights reserved. |
| 3 # Use of this source code is governed by a BSD-style license that can be |
| 4 # found in the LICENSE file. |
| 5 |
| 6 """Checks third-party licenses for the purposes of the Android WebView build. |
| 7 |
| 8 The Android tree includes a snapshot of Chromium in order to power the system |
| 9 WebView. This tool checks that all code uses open-source licenses compatible |
| 10 with Android, and that we meet the requirements of those licenses. It can also |
| 11 be used to generate an Android NOTICE file for the third-party code. |
| 12 |
| 13 It makes use of src/tools/licenses.py and the README.chromium files on which |
| 14 it depends. It also makes use of a data file, third_party_files_whitelist.txt, |
| 15 which whitelists indicidual files which contain third-party code but which |
| 16 aren't in a third-party directory with a README.chromium file. |
| 17 """ |
| 18 |
| 19 import optparse |
| 20 import os |
| 21 import re |
| 22 import subprocess |
| 23 import sys |
| 24 import textwrap |
| 25 |
| 26 |
| 27 REPOSITORY_ROOT = os.path.abspath(os.path.join( |
| 28 os.path.dirname(__file__), '..', '..')) |
| 29 |
| 30 sys.path.append(os.path.join(REPOSITORY_ROOT, 'tools')) |
| 31 import licenses |
| 32 |
| 33 |
| 34 def _CheckLicenseHeaders(directory_list, whitelisted_files): |
| 35 """Checks that all files which are not in a listed third-party directory, |
| 36 and which do not use the standard Chromium license, are listed. |
| 37 Args: |
| 38 directory_list: The list of directories. |
| 39 whitelisted_files: The list of files. |
| 40 Returns: |
| 41 True if all files with non-standard license headers are listed and the |
| 42 file list contains no stale entries, otherwise false. |
| 43 """ |
| 44 |
| 45 # Matches one of ... |
| 46 # - '[Cc]opyright', but not when followed by |
| 47 # ' (c) 20[0-9][0-9] The Chromium Authors.', with optional date range |
| 48 # - '([Cc]) (19|20)[0-9][0-9]', but not when preceeded by the word copyright, |
| 49 # as this is handled above |
| 50 regex = '[Cc]opyright(?! \(c\) 20[0-9][0-9](-20[0-9][0-9])? ' \ |
| 51 'The Chromium Authors\. All rights reserved\.)' \ |
| 52 '|' \ |
| 53 '(?<!(pyright |opyright))\([Cc]\) (19|20)[0-9][0-9]' |
| 54 |
| 55 args = ['grep', |
| 56 '-rPlI', |
| 57 '--exclude-dir', 'third_party', |
| 58 '--exclude-dir', 'out', |
| 59 '--exclude-dir', '.git', |
| 60 regex, |
| 61 '.'] |
| 62 p = subprocess.Popen(args=args, cwd=REPOSITORY_ROOT, stdout=subprocess.PIPE) |
| 63 files = p.communicate()[0].splitlines() |
| 64 |
| 65 # Exclude files under listed directories and some known offendors. |
| 66 offending_files = [] |
| 67 for x in files: |
| 68 x = os.path.normpath(x) |
| 69 is_in_listed_directory = False |
| 70 for y in directory_list: |
| 71 if x.startswith(y): |
| 72 is_in_listed_directory = True |
| 73 break |
| 74 if (not is_in_listed_directory |
| 75 # The tests use a number of licenses, including (L)GPL v3. |
| 76 and not x.startswith('chrome/test/data/') |
| 77 # Ignore these tools. |
| 78 and not x.startswith('android_webview/tools/') |
| 79 # This is a build intermediate directory. |
| 80 and not x.startswith('chrome/app/theme/google_chrome/') |
| 81 # This is a test output directory. |
| 82 and not x.startswith('data/page_cycler/') |
| 83 # 'Copyright' appears in strings. |
| 84 and not x.startswith('chrome/app/resources/')): |
| 85 offending_files += [x] |
| 86 |
| 87 result = True |
| 88 unknown = set(offending_files) - set(whitelisted_files) |
| 89 if unknown: |
| 90 print 'The following files contain a third-party license but are not in ' \ |
| 91 'a listed third-party directory and are not whitelisted. You must ' \ |
| 92 'add the following files to the whitelist.\n%s' % \ |
| 93 '\n'.join(sorted(unknown)) |
| 94 result = False |
| 95 |
| 96 stale = set(whitelisted_files) - set(offending_files) |
| 97 if stale: |
| 98 print 'The following files are whitelisted unnecessarily. You must ' \ |
| 99 ' remove the following files from the whitelist list.\n%s' % \ |
| 100 '\n'.join(sorted(stale)) |
| 101 result = False |
| 102 |
| 103 return result |
| 104 |
| 105 |
| 106 def _ReadFile(path): |
| 107 """Reads a file from disk. |
| 108 Args: |
| 109 path: The path of the file to read, relative to the root of the repository. |
| 110 Returns: |
| 111 The contents of the file as a string. |
| 112 """ |
| 113 |
| 114 with file(os.path.join(REPOSITORY_ROOT, path), 'r') as f: |
| 115 lines = f.read() |
| 116 return lines |
| 117 |
| 118 |
| 119 def _Scan(): |
| 120 """Checks that license meta-data is present for all third-party code. |
| 121 Returns: |
| 122 Whether the check succeeded. |
| 123 """ |
| 124 |
| 125 third_party_dirs = _FindThirdPartyDirs() |
| 126 |
| 127 # First, check designated third-party directories using src/tools/licenses.py. |
| 128 result = True |
| 129 for path in sorted(third_party_dirs): |
| 130 try: |
| 131 licenses.ParseDir(path) |
| 132 except licenses.LicenseError, e: |
| 133 print 'Got LicenseError "%s" while scanning %s' % (e, path) |
| 134 result = False |
| 135 |
| 136 # Second, check for non-standard license text. |
| 137 files_data = _ReadFile(os.path.join('android_webview', 'tools', |
| 138 'third_party_files_whitelist.txt')) |
| 139 whitelisted_files = [] |
| 140 for line in files_data.splitlines(): |
| 141 match = re.match(r'([^#\s]*)', line) |
| 142 if match and not len(match.group(1)) == 0: |
| 143 whitelisted_files += [match.group(1)] |
| 144 return _CheckLicenseHeaders(third_party_dirs, whitelisted_files) and result |
| 145 |
| 146 |
| 147 def _FindThirdPartyDirs(): |
| 148 """Gets the list of third-party directories. |
| 149 Returns: |
| 150 The list of third-party directories. |
| 151 """ |
| 152 |
| 153 prune_paths = [ |
| 154 # Placeholder directory, no third-party code. |
| 155 os.path.join('third_party', 'adobe'), |
| 156 # Apache 2.0 license. See |
| 157 # https://code.google.com/p/chromium/issues/detail?id=140478. |
| 158 os.path.join('third_party', 'bidichecker'), |
| 159 ] |
| 160 return licenses.FindThirdPartyDirs(prune_paths) |
| 161 |
| 162 |
| 163 def _GenerateNoticeFile(print_warnings): |
| 164 """Generates the contents of an Android NOTICE file for the third-party code. |
| 165 Args: |
| 166 print_warnings: Whether to print warnings. |
| 167 Returns: |
| 168 The contents of the NOTICE file. |
| 169 """ |
| 170 |
| 171 third_party_dirs = _FindThirdPartyDirs() |
| 172 |
| 173 # Don't forget Chromium's LICENSE file |
| 174 content = [_ReadFile('LICENSE')] |
| 175 |
| 176 # We provide attribution for all third-party directories. |
| 177 # TODO(steveblock): Limit this to only code used by the WebView binary. |
| 178 for directory in third_party_dirs: |
| 179 content += [_ReadFile(licenses.ParseDir(directory)['License File'])] |
| 180 |
| 181 return '\n'.join(content) |
| 182 |
| 183 |
| 184 def main(): |
| 185 class IndentedHelpFormatterWithNL(optparse.IndentedHelpFormatter): |
| 186 def format_description(self, description): |
| 187 if not description: return "" |
| 188 desc_width = self.width - self.current_indent |
| 189 indent = " "*self.current_indent |
| 190 bits = description.split('\n') |
| 191 formatted_bits = [ |
| 192 textwrap.fill(bit, |
| 193 desc_width, |
| 194 initial_indent=indent, |
| 195 subsequent_indent=indent) |
| 196 for bit in bits] |
| 197 result = '\n'.join(formatted_bits) + '\n' |
| 198 return result |
| 199 |
| 200 parser = optparse.OptionParser(formatter=IndentedHelpFormatterWithNL(), |
| 201 usage='%prog [options]') |
| 202 parser.description = (__doc__ + |
| 203 '\nCommands:\n' \ |
| 204 ' scan Check licenses.\n' \ |
| 205 ' notice Generate Android NOTICE file on stdout') |
| 206 (options, args) = parser.parse_args() |
| 207 if len(args) != 1: |
| 208 parser.print_help() |
| 209 return 1 |
| 210 |
| 211 if args[0] == 'scan': |
| 212 if _Scan(): |
| 213 print 'OK!' |
| 214 return 0 |
| 215 else: |
| 216 return 1 |
| 217 elif args[0] == 'notice': |
| 218 print _GenerateNoticeFile(print_warnings=False) |
| 219 return 0 |
| 220 |
| 221 parser.print_help() |
| 222 return 1 |
| 223 |
| 224 if __name__ == '__main__': |
| 225 sys.exit(main()) |
OLD | NEW |