Upstream version 9.38.198.0
[platform/framework/web/crosswalk.git] / src / tools / licenses.py
1 #!/usr/bin/env python
2 # Copyright (c) 2012 The Chromium Authors. All rights reserved.
3 # Use of this source code is governed by a BSD-style license that can be
4 # found in the LICENSE file.
5
6 """Utility for checking and processing licensing information in third_party
7 directories.
8
9 Usage: licenses.py <command>
10
11 Commands:
12   scan     scan third_party directories, verifying that we have licensing info
13   credits  generate about:credits on stdout
14
15 (You can also import this as a module.)
16 """
17
18 import cgi
19 import os
20 import sys
21
# Directories, given relative to the root of the tree, that are skipped.
# Every entry is written as a tuple of path components and joined with the
# platform's separator when the set is built.
PRUNE_PATHS = set(os.path.join(*parts) for parts in (
    # Same module occurs in crypto/third_party/nss and net/third_party/nss, so
    # skip this one.
    ('third_party', 'nss'),

    # Placeholder directory only, not third-party code.
    ('third_party', 'adobe'),

    # Build files only, not third-party code.
    ('third_party', 'widevine'),

    # Only binaries, used during development.
    ('third_party', 'valgrind'),

    # Used for development and test, not in the shipping product.
    ('build', 'secondary'),
    ('third_party', 'bison'),
    ('third_party', 'blanketjs'),
    ('third_party', 'cygwin'),
    ('third_party', 'gnu_binutils'),
    ('third_party', 'gold'),
    ('third_party', 'gperf'),
    ('third_party', 'lighttpd'),
    ('third_party', 'llvm'),
    ('third_party', 'llvm-build'),
    ('third_party', 'mingw-w64'),
    ('third_party', 'nacl_sdk_binaries'),
    ('third_party', 'pefile'),
    ('third_party', 'perl'),
    ('third_party', 'psyco_win32'),
    ('third_party', 'pylib'),
    ('third_party', 'pywebsocket'),
    ('third_party', 'qunit'),
    ('third_party', 'sinonjs'),
    ('third_party', 'syzygy'),
    ('tools', 'profile_chrome', 'third_party'),

    # Chromium code in third_party.
    ('third_party', 'fuzzymatch'),
    ('tools', 'swarming_client'),

    # Stuff pulled in from chrome-internal for official builds/tools.
    ('third_party', 'clear_cache'),
    ('third_party', 'gnu'),
    ('third_party', 'googlemac'),
    ('third_party', 'pcre'),
    ('third_party', 'psutils'),
    ('third_party', 'sawbuck'),

    # Redistribution does not require attribution in documentation.
    ('third_party', 'directxsdk'),
    ('third_party', 'platformsdk_win2008_6_1'),
    ('third_party', 'platformsdk_win7'),
))
77
# Version-control bookkeeping directories.
VCS_METADATA_DIRS = ('.svn', '.git')

# Directory names we don't scan through, wherever they appear in the tree.
PRUNE_DIRS = VCS_METADATA_DIRS + (
    'out', 'Debug', 'Release',  # build files
    'layout_tests',             # lots of subdirs
)
83
# Directories that are always added to the set of scanned components.
# Each entry is a tuple of path components relative to the source root.
ADDITIONAL_PATHS = tuple(os.path.join(*parts) for parts in (
    ('breakpad',),
    ('chrome', 'common', 'extensions', 'docs', 'examples'),
    ('chrome', 'test', 'chromeos', 'autotest'),
    ('chrome', 'test', 'data'),
    ('native_client',),
    ('net', 'tools', 'spdyshark'),
    ('sdch', 'open-vcdiff'),
    ('testing', 'gmock'),
    ('testing', 'gtest'),
    ('tools', 'grit'),
    ('tools', 'gyp'),
    ('tools', 'page_cycler', 'acid3'),
    ('url', 'third_party', 'mozilla'),
    ('v8',),
    # Fake directory so we can include the strongtalk license.
    ('v8', 'strongtalk'),
    ('v8', 'third_party', 'fdlibm'),
))
103
104
# Directories where we check out directly from upstream, and therefore
# can't provide a README.chromium.  Please prefer a README.chromium
# wherever possible.
#
# Keys are component paths relative to the source root.  Each value holds
# the metadata fields that ParseDir() would otherwise read from the
# component's README.chromium: "Name", "URL" and "License", plus optionally
# "License File" (ParseDir() defaults it to "LICENSE") and
# "License Android Compatible".  A "License File" of "NOT_SHIPPED" marks a
# component whose license text is not used in about:credits.
SPECIAL_CASES = {
    os.path.join('native_client'): {
        "Name": "native client",
        "URL": "http://code.google.com/p/nativeclient",
        "License": "BSD",
    },
    os.path.join('sdch', 'open-vcdiff'): {
        "Name": "open-vcdiff",
        "URL": "http://code.google.com/p/open-vcdiff",
        "License": "Apache 2.0, MIT, GPL v2 and custom licenses",
        "License Android Compatible": "yes",
    },
    os.path.join('testing', 'gmock'): {
        "Name": "gmock",
        "URL": "http://code.google.com/p/googlemock",
        "License": "BSD",
        "License File": "NOT_SHIPPED",
    },
    os.path.join('testing', 'gtest'): {
        "Name": "gtest",
        "URL": "http://code.google.com/p/googletest",
        "License": "BSD",
        "License File": "NOT_SHIPPED",
    },
    os.path.join('third_party', 'angle'): {
        "Name": "Almost Native Graphics Layer Engine",
        "URL": "http://code.google.com/p/angleproject/",
        "License": "BSD",
    },
    os.path.join('third_party', 'cros_system_api'): {
        "Name": "Chromium OS system API",
        "URL": "http://www.chromium.org/chromium-os",
        "License": "BSD",
        # Absolute path here is resolved as relative to the source root.
        "License File": "/LICENSE.chromium_os",
    },
    os.path.join('third_party', 'lss'): {
        "Name": "linux-syscall-support",
        "URL": "http://code.google.com/p/linux-syscall-support/",
        "License": "BSD",
        # Absolute path here is resolved as relative to the source root.
        "License File": "/LICENSE",
    },
    os.path.join('third_party', 'ots'): {
        "Name": "OTS (OpenType Sanitizer)",
        "URL": "http://code.google.com/p/ots/",
        "License": "BSD",
    },
    os.path.join('third_party', 'pdfium'): {
        "Name": "PDFium",
        "URL": "http://code.google.com/p/pdfium/",
        "License": "BSD",
    },
    os.path.join('third_party', 'pdfsqueeze'): {
        "Name": "pdfsqueeze",
        "URL": "http://code.google.com/p/pdfsqueeze/",
        "License": "Apache 2.0",
        "License File": "COPYING",
    },
    # NOTE(review): this entry has no "License" field, so ParseDir() raises
    # LicenseError for this path -- confirm whether that is intended.
    os.path.join('third_party', 'ppapi'): {
        "Name": "ppapi",
        "URL": "http://code.google.com/p/ppapi/",
    },
    os.path.join('third_party', 'scons-2.0.1'): {
        "Name": "scons-2.0.1",
        "URL": "http://www.scons.org",
        "License": "MIT",
        "License File": "NOT_SHIPPED",
    },
    os.path.join('third_party', 'trace-viewer'): {
        "Name": "trace-viewer",
        "URL": "http://code.google.com/p/trace-viewer",
        "License": "BSD",
        "License File": "NOT_SHIPPED",
    },
    os.path.join('third_party', 'v8-i18n'): {
        "Name": "Internationalization Library for v8",
        "URL": "http://code.google.com/p/v8-i18n/",
        "License": "Apache 2.0",
    },
    os.path.join('third_party', 'WebKit'): {
        "Name": "WebKit",
        "URL": "http://webkit.org/",
        "License": "BSD and GPL v2",
        # Absolute path here is resolved as relative to the source root.
        "License File": "/webkit/LICENSE",
    },
    os.path.join('third_party', 'webpagereplay'): {
        "Name": "webpagereplay",
        "URL": "http://code.google.com/p/web-page-replay",
        "License": "Apache 2.0",
        "License File": "NOT_SHIPPED",
    },
    os.path.join('tools', 'grit'): {
        "Name": "grit",
        "URL": "http://code.google.com/p/grit-i18n",
        "License": "BSD",
        "License File": "NOT_SHIPPED",
    },
    os.path.join('tools', 'gyp'): {
        "Name": "gyp",
        "URL": "http://code.google.com/p/gyp",
        "License": "BSD",
        "License File": "NOT_SHIPPED",
    },
    os.path.join('v8'): {
        "Name": "V8 JavaScript Engine",
        "URL": "http://code.google.com/p/v8",
        "License": "BSD",
    },
    os.path.join('v8', 'strongtalk'): {
        "Name": "Strongtalk",
        "URL": "http://www.strongtalk.org/",
        "License": "BSD",
        # Absolute path here is resolved as relative to the source root.
        "License File": "/v8/LICENSE.strongtalk",
    },
    os.path.join('v8', 'third_party', 'fdlibm'): {
        "Name": "fdlibm",
        "URL": "http://www.netlib.org/fdlibm/",
        "License": "Freely Distributable",
        # Absolute path here is resolved as relative to the source root.
        "License File" : "/v8/third_party/fdlibm/LICENSE",
        "License Android Compatible" : "yes",
    },
}
233
# Sentinel for the 'License File' field: a component carrying this value
# does not have its license file used in about:credits.
NOT_SHIPPED = 'NOT_SHIPPED'
237
238
class LicenseError(Exception):
    """Raised when a directory's licensing info isn't fully filled out."""
243
def AbsolutePath(path, filename, root):
    """Resolve a file named in README.chromium against the source root.

    A |filename| that starts with '/' is taken relative to |root|; any other
    |filename| is taken relative to the component directory |root|/|path|.

    Returns the joined path when it exists on disk, otherwise None.
    """
    if filename.startswith('/'):
        # Drop the leading slash so the join stays underneath the root.
        parts = [root, filename[1:]]
    else:
        parts = [root, path, filename]
    candidate = os.path.join(*parts)
    if not os.path.exists(candidate):
        return None
    return candidate
256
def ParseDir(path, root, require_license_file=True):
    """Examine a third_party/foo component and extract its metadata.

    The metadata comes from the SPECIAL_CASES entry for |path| when there is
    one, and otherwise from the leading block of "Key: value" lines in the
    component's README.chromium (parsing stops at the first blank line).

    Args:
      path: Component directory, relative to |root|.
      root: Source root that |path| and '/'-prefixed file names are
          resolved against.
      require_license_file: When true, a component that is shipped but has
          no license file on disk is an error.

    Returns:
      A dict with the keys "Name", "URL", "License" and "License File", plus
      "Required Text" / "License Android Compatible" when supplied.
      "License File" is NOT_SHIPPED, or the path returned by AbsolutePath(),
      or None if no file was found and |require_license_file| is false.
      "Required Text", when present, is the path returned by AbsolutePath().

    Raises:
      LicenseError: if the README.chromium is missing, a required field is
          empty, or a referenced file cannot be found.
    """

    # Parse metadata fields out of README.chromium.
    # We examine "LICENSE" for the license file by default.
    metadata = {
        "License File": "LICENSE",  # Relative path to license text.
        "Name": None,               # Short name (for header on about:credits).
        "URL": None,                # Project home page.
        "License": None,            # Software license.
        }

    # "Required Text" is a relative path to a file containing some html we're
    # required to place in about:credits.
    optional_keys = ["Required Text", "License Android Compatible"]

    if path in SPECIAL_CASES:
        metadata.update(SPECIAL_CASES[path])
    else:
        # Try to find README.chromium.
        readme_path = os.path.join(root, path, 'README.chromium')
        if not os.path.exists(readme_path):
            raise LicenseError("missing README.chromium or licenses.py "
                               "SPECIAL_CASES entry")

        # Build the list of recognised keys once instead of once per line.
        known_keys = list(metadata.keys()) + optional_keys
        # The 'with' block closes the README even if parsing stops early.
        with open(readme_path) as readme:
            for line in readme:
                line = line.strip()
                if not line:
                    # The metadata header ends at the first blank line.
                    break
                for key in known_keys:
                    field = key + ": "
                    if line.startswith(field):
                        metadata[key] = line[len(field):]

    # Check that all expected metadata is present.  Keys are visited in
    # sorted order so the field that gets reported is deterministic.
    for key in sorted(metadata):
        if not metadata[key]:
            raise LicenseError("couldn't find '" + key + "' line "
                               "in README.chromium or licenses.py "
                               "SPECIAL_CASES")

    # Special-case modules that aren't in the shipping product, so don't need
    # their license in about:credits.
    if metadata["License File"] != NOT_SHIPPED:
        # Check that the license file exists, falling back to upstream's
        # conventional COPYING file.
        license_path = None
        for filename in (metadata["License File"], "COPYING"):
            license_path = AbsolutePath(path, filename, root)
            if license_path is not None:
                break

        if require_license_file and not license_path:
            raise LicenseError("License file not found. "
                               "Either add a file named LICENSE, "
                               "import upstream's COPYING if available, "
                               "or add a 'License File:' line to "
                               "README.chromium with the appropriate path.")
        metadata["License File"] = license_path

    if "Required Text" in metadata:
        required_path = AbsolutePath(path, metadata["Required Text"], root)
        if required_path is None:
            raise LicenseError("Required text file listed but not found.")
        metadata["Required Text"] = required_path

    return metadata
323
324
def ContainsFiles(path, root):
    """Tell whether |root|/|path| holds at least one file at any depth.

    Version-control metadata directories are pruned from the walk, so files
    that live only inside them are not counted.
    """
    for _, subdirs, filenames in os.walk(os.path.join(root, path)):
        if filenames:
            return True
        # Assign through the slice so os.walk sees the pruned list.
        subdirs[:] = [name for name in subdirs
                      if name not in VCS_METADATA_DIRS]
    return False
335
336
def FilterDirsWithFiles(dirs_list, root):
    """Return a list of the entries of |dirs_list| that contain files.

    If a directory contains no files, assume it's a DEPS directory for a
    project not used by our current configuration and skip it.
    """
    populated = []
    for candidate in dirs_list:
        if ContainsFiles(candidate, root):
            populated.append(candidate)
    return populated
341
342
def FindThirdPartyDirs(prune_paths, root):
    """Find all third_party directories underneath the source root.

    Args:
      prune_paths: Collection of root-relative paths that are neither
          reported nor descended into.
      root: Directory to walk.  A trailing path separator is allowed.

    Returns:
      A set of root-relative paths: every immediate subdirectory of each
      directory named 'third_party' that is reached, plus every entry of
      ADDITIONAL_PATHS, minus anything listed in |prune_paths|.
    """
    third_party_dirs = set()
    for path, dirs, _ in os.walk(root):
        # Make the path relative to the root.  relpath() is used rather than
        # slicing off len(root)+1 characters, which drops one character too
        # many when |root| already ends with a separator.
        path = os.path.relpath(path, root)
        if path == os.curdir:
            path = ''

        if path in prune_paths:
            dirs[:] = []
            continue

        # Prune out directories we want to skip.
        # (Note that we loop over PRUNE_DIRS so we're not iterating over a
        # list that we're simultaneously mutating.)
        for skip in PRUNE_DIRS:
            if skip in dirs:
                dirs.remove(skip)

        if os.path.basename(path) == 'third_party':
            # Add all subdirectories that are not marked for skipping.
            for subdir in dirs:
                dirpath = os.path.join(path, subdir)
                if dirpath not in prune_paths:
                    third_party_dirs.add(dirpath)

            # Don't recurse into any subdirs from here.
            dirs[:] = []
            continue

        # Don't recurse into paths in ADDITIONAL_PATHS, like we do with regular
        # third_party/foo paths.
        if path in ADDITIONAL_PATHS:
            dirs[:] = []

    for extra in ADDITIONAL_PATHS:
        if extra not in prune_paths:
            third_party_dirs.add(extra)

    return third_party_dirs
381
382
def ScanThirdPartyDirs(root=None):
    """Scan a list of directories and report on any problems we find.

    Args:
      root: Source root to scan; defaults to the current working directory.

    Returns:
      True if every non-empty third-party directory parsed cleanly, False
      otherwise.  One "<path>: <message>" line is printed per failure.
    """
    if root is None:
        root = os.getcwd()
    third_party_dirs = FindThirdPartyDirs(PRUNE_PATHS, root)
    third_party_dirs = FilterDirsWithFiles(third_party_dirs, root)

    errors = []
    for path in sorted(third_party_dirs):
        try:
            # Only the validation matters here; the metadata is discarded.
            ParseDir(path, root)
        except LicenseError as e:
            errors.append((path, e.args[0]))

    for path, error in sorted(errors):
        # Single-argument print() behaves the same on Python 2 and 3.
        print(path + ": " + error)

    return len(errors) == 0
402
403
def GenerateCredits():
    """Generate about:credits.

    Renders about_credits_entry.tmpl once per third-party component whose
    metadata parses and whose license is shipped, then wraps the entries in
    about_credits.tmpl.  The page is written to the file named by
    sys.argv[2] when that argument is present, and printed to stdout
    otherwise.  Components for which ParseDir() raises LicenseError are
    skipped.

    Returns:
      True on success; False (after printing a usage line) when sys.argv
      does not hold exactly 2 or 3 items.
    """

    if len(sys.argv) not in (2, 3):
        print('usage: licenses.py credits [output_file]')
        return False

    def ReadFile(file_path):
        """Return the raw contents of |file_path|, closing the handle."""
        with open(file_path, 'rb') as handle:
            return handle.read()

    def EvaluateTemplate(template, env, escape=True):
        """Expand a template with variables like {{foo}} using a
        dictionary of expansions.

        Values are HTML-escaped unless |escape| is false or the key ends in
        "_unescaped".
        """
        # NOTE(review): placeholders are expanded one key at a time, so a
        # value that itself contains "{{key}}" for a key handled later is
        # expanded too.
        # NOTE(review): cgi.escape was removed in Python 3.8;
        # html.escape(val, quote=False) is the replacement when porting.
        for key, val in env.items():
            if escape and not key.endswith("_unescaped"):
                val = cgi.escape(val)
            template = template.replace('{{%s}}' % key, val)
        return template

    root = os.path.join(os.path.dirname(__file__), '..')
    resources_dir = os.path.join(root, 'chrome', 'browser', 'resources')
    third_party_dirs = FindThirdPartyDirs(PRUNE_PATHS, root)

    entry_template = ReadFile(
        os.path.join(resources_dir, 'about_credits_entry.tmpl'))
    entries = []
    for path in sorted(third_party_dirs):
        try:
            metadata = ParseDir(path, root)
        except LicenseError:
            # TODO(phajdan.jr): Convert to fatal error (http://crbug.com/39240).
            continue
        if metadata['License File'] == NOT_SHIPPED:
            continue
        env = {
            'name': metadata['Name'],
            'url': metadata['URL'],
            'license': ReadFile(metadata['License File']),
            'license_unescaped': '',
        }
        if 'Required Text' in metadata:
            # Required text is html, so it is inserted without escaping.
            env["license_unescaped"] = ReadFile(metadata['Required Text'])
        entries.append(EvaluateTemplate(entry_template, env))

    file_template = ReadFile(os.path.join(resources_dir, 'about_credits.tmpl'))
    template_contents = "<!-- Generated by licenses.py; do not edit. -->"
    template_contents += EvaluateTemplate(file_template,
                                          {'entries': '\n'.join(entries)},
                                          escape=False)

    # The argument count was validated above, so it is either 3 or 2 here.
    if len(sys.argv) == 3:
        with open(sys.argv[2], 'w') as output_file:
            output_file.write(template_contents)
    else:
        print(template_contents)

    return True
459
460
def main():
    """Run the command named by the first command-line argument.

    'scan' runs ScanThirdPartyDirs() and 'credits' runs GenerateCredits();
    anything else, or no argument at all, prints the module usage text.

    Returns:
      The process exit status: 0 when the command succeeded, 1 when it
      failed or when the usage text was printed.
    """
    command = 'help'
    if len(sys.argv) > 1:
        command = sys.argv[1]

    if command == 'scan':
        succeeded = ScanThirdPartyDirs()
    elif command == 'credits':
        succeeded = GenerateCredits()
    else:
        # Single-argument print() behaves the same on Python 2 and 3.
        print(__doc__)
        return 1

    # Return an explicit status instead of falling off the end with None.
    return 0 if succeeded else 1
475
476
# When run as a script, use main()'s return value as the process exit status.
if __name__ == '__main__':
  sys.exit(main())