# Copyright 2013 The Chromium Authors. All rights reserved. # Use of this source code is governed by a BSD-style license that can be # found in the LICENSE file. """Contains common helpers for GN action()s.""" import collections import contextlib import filecmp import fnmatch import json import os import pipes import re import shutil import stat import subprocess import sys import tempfile import zipfile # Any new non-system import must be added to: # //build/config/android/internal_rules.gni # Some clients do not add //build/android/gyp to PYTHONPATH. import build.android.gyp.util.md5_check as md5_check # pylint: disable=relative-import import build.gn_helpers as gn_helpers # Definition copied from pylib/constants/__init__.py to avoid adding # a dependency on pylib. DIR_SOURCE_ROOT = os.environ.get('CHECKOUT_SOURCE_ROOT', os.path.abspath(os.path.join(os.path.dirname(__file__), os.pardir, os.pardir, os.pardir, os.pardir))) HERMETIC_TIMESTAMP = (2001, 1, 1, 0, 0, 0) _HERMETIC_FILE_ATTR = (0o644 << 16) @contextlib.contextmanager def TempDir(): dirname = tempfile.mkdtemp() try: yield dirname finally: shutil.rmtree(dirname) def MakeDirectory(dir_path): try: os.makedirs(dir_path) except OSError: pass def DeleteDirectory(dir_path): if os.path.exists(dir_path): shutil.rmtree(dir_path) def Touch(path, fail_if_missing=False): if fail_if_missing and not os.path.exists(path): raise Exception(path + ' doesn\'t exist.') MakeDirectory(os.path.dirname(path)) with open(path, 'a'): os.utime(path, None) def FindInDirectory(directory, filename_filter): files = [] for root, _dirnames, filenames in os.walk(directory): matched_files = fnmatch.filter(filenames, filename_filter) files.extend((os.path.join(root, f) for f in matched_files)) return files def ReadBuildVars(path): """Parses a build_vars.txt into a dict.""" with open(path) as f: return dict(l.rstrip().split('=', 1) for l in f) def ParseGnList(gn_string): """Converts a command-line parameter into a list. If the input starts with a '[' it is assumed to be a GN-formatted list and it will be parsed accordingly. When empty an empty list will be returned. Otherwise, the parameter will be treated as a single raw string (not GN-formatted in that it's not assumed to have literal quotes that must be removed) and a list will be returned containing that string. The common use for this behavior is in the Android build where things can take lists of @FileArg references that are expanded via ExpandFileArgs. """ if gn_string.startswith('['): parser = gn_helpers.GNValueParser(gn_string) return parser.ParseList() if len(gn_string): return [ gn_string ] return [] def CheckOptions(options, parser, required=None): if not required: return for option_name in required: if getattr(options, option_name) is None: parser.error('--%s is required' % option_name.replace('_', '-')) def WriteJson(obj, path, only_if_changed=False): old_dump = None if os.path.exists(path): with open(path, 'r') as oldfile: old_dump = oldfile.read() new_dump = json.dumps(obj, sort_keys=True, indent=2, separators=(',', ': ')) if not only_if_changed or old_dump != new_dump: with open(path, 'w') as outfile: outfile.write(new_dump) @contextlib.contextmanager def AtomicOutput(path, only_if_changed=True): """Helper to prevent half-written outputs. Args: path: Path to the final output file, which will be written atomically. only_if_changed: If True (the default), do not touch the filesystem if the content has not changed. Returns: A python context manager that yelds a NamedTemporaryFile instance that must be used by clients to write the data to. On exit, the manager will try to replace the final output file with the temporary one if necessary. The temporary file is always destroyed on exit. Example: with build_utils.AtomicOutput(output_path) as tmp_file: subprocess.check_call(['prog', '--output', tmp_file.name]) """ # Create in same directory to ensure same filesystem when moving. with tempfile.NamedTemporaryFile(suffix=os.path.basename(path), dir=os.path.dirname(path), delete=False) as f: try: yield f # file should be closed before comparison/move. f.close() if not (only_if_changed and os.path.exists(path) and filecmp.cmp(f.name, path)): shutil.move(f.name, path) finally: if os.path.exists(f.name): os.unlink(f.name) class CalledProcessError(Exception): """This exception is raised when the process run by CheckOutput exits with a non-zero exit code.""" def __init__(self, cwd, args, output): super(CalledProcessError, self).__init__() self.cwd = cwd self.args = args self.output = output def __str__(self): # A user should be able to simply copy and paste the command that failed # into their shell. copyable_command = '( cd {}; {} )'.format(os.path.abspath(self.cwd), ' '.join(map(pipes.quote, self.args))) return 'Command failed: {}\n{}'.format(copyable_command, self.output) # This can be used in most cases like subprocess.check_output(). The output, # particularly when the command fails, better highlights the command's failure. # If the command fails, raises a build_utils.CalledProcessError. def CheckOutput(args, cwd=None, env=None, print_stdout=False, print_stderr=True, stdout_filter=None, stderr_filter=None, fail_func=lambda returncode, stderr: returncode != 0): if not cwd: cwd = os.getcwd() child = subprocess.Popen(args, stdout=subprocess.PIPE, stderr=subprocess.PIPE, cwd=cwd, env=env) stdout, stderr = child.communicate() if stdout_filter is not None: stdout = stdout_filter(stdout) if stderr_filter is not None: stderr = stderr_filter(stderr) if fail_func(child.returncode, stderr): raise CalledProcessError(cwd, args, stdout + stderr) if print_stdout: sys.stdout.write(stdout) if print_stderr: sys.stderr.write(stderr) return stdout def GetModifiedTime(path): # For a symlink, the modified time should be the greater of the link's # modified time and the modified time of the target. return max(os.lstat(path).st_mtime, os.stat(path).st_mtime) def IsTimeStale(output, inputs): if not os.path.exists(output): return True output_time = GetModifiedTime(output) for i in inputs: if GetModifiedTime(i) > output_time: return True return False def _CheckZipPath(name): if os.path.normpath(name) != name: raise Exception('Non-canonical zip path: %s' % name) if os.path.isabs(name): raise Exception('Absolute zip path: %s' % name) def _IsSymlink(zip_file, name): zi = zip_file.getinfo(name) # The two high-order bytes of ZipInfo.external_attr represent # UNIX permissions and file type bits. return stat.S_ISLNK(zi.external_attr >> 16) def ExtractAll(zip_path, path=None, no_clobber=True, pattern=None, predicate=None): if path is None: path = os.getcwd() elif not os.path.exists(path): MakeDirectory(path) if not zipfile.is_zipfile(zip_path): raise Exception('Invalid zip file: %s' % zip_path) extracted = [] with zipfile.ZipFile(zip_path) as z: for name in z.namelist(): if name.endswith('/'): MakeDirectory(os.path.join(path, name)) continue if pattern is not None: if not fnmatch.fnmatch(name, pattern): continue if predicate and not predicate(name): continue _CheckZipPath(name) if no_clobber: output_path = os.path.join(path, name) if os.path.exists(output_path): raise Exception( 'Path already exists from zip: %s %s %s' % (zip_path, name, output_path)) if _IsSymlink(z, name): dest = os.path.join(path, name) MakeDirectory(os.path.dirname(dest)) os.symlink(z.read(name), dest) extracted.append(dest) else: z.extract(name, path) extracted.append(os.path.join(path, name)) return extracted def AddToZipHermetic(zip_file, zip_path, src_path=None, data=None, compress=None): """Adds a file to the given ZipFile with a hard-coded modified time. Args: zip_file: ZipFile instance to add the file to. zip_path: Destination path within the zip file. src_path: Path of the source file. Mutually exclusive with |data|. data: File data as a string. compress: Whether to enable compression. Default is taken from ZipFile constructor. """ assert (src_path is None) != (data is None), ( '|src_path| and |data| are mutually exclusive.') _CheckZipPath(zip_path) zipinfo = zipfile.ZipInfo(filename=zip_path, date_time=HERMETIC_TIMESTAMP) zipinfo.external_attr = _HERMETIC_FILE_ATTR if src_path and os.path.islink(src_path): zipinfo.filename = zip_path zipinfo.external_attr |= stat.S_IFLNK << 16 # mark as a symlink zip_file.writestr(zipinfo, os.readlink(src_path)) return if src_path: with open(src_path) as f: data = f.read() # zipfile will deflate even when it makes the file bigger. To avoid # growing files, disable compression at an arbitrary cut off point. if len(data) < 16: compress = False # None converts to ZIP_STORED, when passed explicitly rather than the # default passed to the ZipFile constructor. compress_type = zip_file.compression if compress is not None: compress_type = zipfile.ZIP_DEFLATED if compress else zipfile.ZIP_STORED zip_file.writestr(zipinfo, data, compress_type) def DoZip(inputs, output, base_dir=None, compress_fn=None): """Creates a zip file from a list of files. Args: inputs: A list of paths to zip, or a list of (zip_path, fs_path) tuples. output: Destination .zip file. base_dir: Prefix to strip from inputs. compress_fn: Applied to each input to determine whether or not to compress. By default, items will be |zipfile.ZIP_STORED|. """ input_tuples = [] for tup in inputs: if isinstance(tup, str): tup = (os.path.relpath(tup, base_dir), tup) input_tuples.append(tup) # Sort by zip path to ensure stable zip ordering. input_tuples.sort(key=lambda tup: tup[0]) with zipfile.ZipFile(output, 'w') as outfile: for zip_path, fs_path in input_tuples: compress = compress_fn(zip_path) if compress_fn else None AddToZipHermetic(outfile, zip_path, src_path=fs_path, compress=compress) def ZipDir(output, base_dir, compress_fn=None): """Creates a zip file from a directory.""" inputs = [] for root, _, files in os.walk(base_dir): for f in files: inputs.append(os.path.join(root, f)) with AtomicOutput(output) as f: DoZip(inputs, f, base_dir, compress_fn=compress_fn) def MatchesGlob(path, filters): """Returns whether the given path matches any of the given glob patterns.""" return filters and any(fnmatch.fnmatch(path, f) for f in filters) def MergeZips(output, input_zips, path_transform=None): """Combines all files from |input_zips| into |output|. Args: output: Path or ZipFile instance to add files to. input_zips: Iterable of paths to zip files to merge. path_transform: Called for each entry path. Returns a new path, or None to skip the file. """ path_transform = path_transform or (lambda p: p) added_names = set() output_is_already_open = not isinstance(output, str) if output_is_already_open: assert isinstance(output, zipfile.ZipFile) out_zip = output else: out_zip = zipfile.ZipFile(output, 'w') try: for in_file in input_zips: with zipfile.ZipFile(in_file, 'r') as in_zip: # ijar creates zips with null CRCs. in_zip._expected_crc = None for info in in_zip.infolist(): # Ignore directories. if info.filename[-1] == '/': continue dst_name = path_transform(info.filename) if not dst_name: continue already_added = dst_name in added_names if not already_added: AddToZipHermetic(out_zip, dst_name, data=in_zip.read(info), compress=info.compress_type != zipfile.ZIP_STORED) added_names.add(dst_name) finally: if not output_is_already_open: out_zip.close() def GetSortedTransitiveDependencies(top, deps_func): """Gets the list of all transitive dependencies in sorted order. There should be no cycles in the dependency graph (crashes if cycles exist). Args: top: A list of the top level nodes deps_func: A function that takes a node and returns a list of its direct dependencies. Returns: A list of all transitive dependencies of nodes in top, in order (a node will appear in the list at a higher index than all of its dependencies). """ # Find all deps depth-first, maintaining original order in the case of ties. deps_map = collections.OrderedDict() def discover(nodes): for node in nodes: if node in deps_map: continue deps = deps_func(node) discover(deps) deps_map[node] = deps discover(top) return deps_map.keys() def _ComputePythonDependencies(): """Gets the paths of imported non-system python modules. A path is assumed to be a "system" import if it is outside of chromium's src/. The paths will be relative to the current directory. """ _ForceLazyModulesToLoad() module_paths = (m.__file__ for m in sys.modules.values() if m is not None and hasattr(m, '__file__')) abs_module_paths = map(os.path.abspath, module_paths) assert os.path.isabs(DIR_SOURCE_ROOT) non_system_module_paths = [ p for p in abs_module_paths if p.startswith(DIR_SOURCE_ROOT)] def ConvertPycToPy(s): if s.endswith('.pyc'): return s[:-1] return s non_system_module_paths = map(ConvertPycToPy, non_system_module_paths) non_system_module_paths = map(os.path.relpath, non_system_module_paths) return sorted(set(non_system_module_paths)) def _ForceLazyModulesToLoad(): """Forces any lazily imported modules to fully load themselves. Inspecting the modules' __file__ attribute causes lazily imported modules (e.g. from email) to get fully imported and update sys.modules. Iterate over the values until sys.modules stabilizes so that no modules are missed. """ while True: num_modules_before = len(sys.modules.keys()) for m in sys.modules.values(): if m is not None and hasattr(m, '__file__'): _ = m.__file__ num_modules_after = len(sys.modules.keys()) if num_modules_before == num_modules_after: break def AddDepfileOption(parser): # TODO(agrieve): Get rid of this once we've moved to argparse. if hasattr(parser, 'add_option'): func = parser.add_option else: func = parser.add_argument func('--depfile', help='Path to depfile (refer to `gn help depfile`)') def WriteDepfile(depfile_path, first_gn_output, inputs=None, add_pydeps=True): assert depfile_path != first_gn_output # http://crbug.com/646165 inputs = inputs or [] if add_pydeps: inputs = _ComputePythonDependencies() + inputs MakeDirectory(os.path.dirname(depfile_path)) # Ninja does not support multiple outputs in depfiles. with open(depfile_path, 'w') as depfile: depfile.write(first_gn_output.replace(' ', '\\ ')) depfile.write(': ') depfile.write(' '.join(i.replace(' ', '\\ ') for i in inputs)) depfile.write('\n') def ExpandFileArgs(args): """Replaces file-arg placeholders in args. These placeholders have the form: @FileArg(filename:key1:key2:...:keyn) The value of such a placeholder is calculated by reading 'filename' as json. And then extracting the value at [key1][key2]...[keyn]. Note: This intentionally does not return the list of files that appear in such placeholders. An action that uses file-args *must* know the paths of those files prior to the parsing of the arguments (typically by explicitly listing them in the action's inputs in build files). """ new_args = list(args) file_jsons = dict() r = re.compile('@FileArg\((.*?)\)') for i, arg in enumerate(args): match = r.search(arg) if not match: continue if match.end() != len(arg): raise Exception('Unexpected characters after FileArg: ' + arg) lookup_path = match.group(1).split(':') file_path = lookup_path[0] if not file_path in file_jsons: with open(file_path) as f: file_jsons[file_path] = json.load(f) expansion = file_jsons[file_path] for k in lookup_path[1:]: expansion = expansion[k] # This should match ParseGNList. The output is either a GN-formatted list # or a literal (with no quotes). if isinstance(expansion, list): new_args[i] = arg[:match.start()] + gn_helpers.ToGNString(expansion) else: new_args[i] = arg[:match.start()] + str(expansion) return new_args def ReadSourcesList(sources_list_file_name): """Reads a GN-written file containing list of file names and returns a list. Note that this function should not be used to parse response files. """ with open(sources_list_file_name) as f: return [file_name.strip() for file_name in f] def CallAndWriteDepfileIfStale(function, options, record_path=None, input_paths=None, input_strings=None, output_paths=None, force=False, pass_changes=False, depfile_deps=None, add_pydeps=True): """Wraps md5_check.CallAndRecordIfStale() and writes a depfile if applicable. Depfiles are automatically added to output_paths when present in the |options| argument. They are then created after |function| is called. By default, only python dependencies are added to the depfile. If there are other input paths that are not captured by GN deps, then they should be listed in depfile_deps. It's important to write paths to the depfile that are already captured by GN deps since GN args can cause GN deps to change, and such changes are not immediately reflected in depfiles (http://crbug.com/589311). """ if not output_paths: raise Exception('At least one output_path must be specified.') input_paths = list(input_paths or []) input_strings = list(input_strings or []) output_paths = list(output_paths or []) python_deps = None if hasattr(options, 'depfile') and options.depfile: python_deps = _ComputePythonDependencies() input_paths += python_deps output_paths += [options.depfile] def on_stale_md5(changes): args = (changes,) if pass_changes else () function(*args) if python_deps is not None: all_depfile_deps = list(python_deps) if add_pydeps else [] if depfile_deps: all_depfile_deps.extend(depfile_deps) WriteDepfile(options.depfile, output_paths[0], all_depfile_deps, add_pydeps=False) md5_check.CallAndRecordIfStale( on_stale_md5, record_path=record_path, input_paths=input_paths, input_strings=input_strings, output_paths=output_paths, force=force, pass_changes=True)