blob: d1d3a726731d82ba1251f1310d2e65ce80be7d2c [file] [log] [blame]
# Copyright 2013 The Chromium Authors. All rights reserved.
# Use of this source code is governed by a BSD-style license that can be
# found in the LICENSE file.
"""Contains common helpers for GN action()s."""
import atexit
import collections
import contextlib
import filecmp
import fnmatch
import json
import logging
import os
import pipes
import re
import shutil
import stat
import subprocess
import sys
import tempfile
import time
import zipfile
sys.path.append(os.path.join(os.path.dirname(__file__),
os.pardir, os.pardir, os.pardir))
import gn_helpers
# Use relative paths to improve the hermetic property of build scripts.
# The checkout root comes from $CHECKOUT_SOURCE_ROOT when set; otherwise it is
# taken to be four directory levels above the directory holding this file.
DIR_SOURCE_ROOT = os.path.relpath(
    os.environ.get(
        'CHECKOUT_SOURCE_ROOT',
        os.path.join(os.path.dirname(__file__), *([os.pardir] * 4))))

# Locations of the checked-in JDK and its tools, relative to the source root.
JAVA_HOME = os.path.join(DIR_SOURCE_ROOT, 'third_party', 'jdk', 'current')
JAVAC_PATH = os.path.join(JAVA_HOME, 'bin', 'javac')
JAVAP_PATH = os.path.join(JAVA_HOME, 'bin', 'javap')
RT_JAR_PATH = os.path.join(DIR_SOURCE_ROOT, 'third_party', 'jdk', 'extras',
                           'java_8', 'jre', 'lib', 'rt.jar')

# |basestring| only exists on Python 2; fall back to (str, bytes) elsewhere.
try:
  string_types = basestring
except NameError:
  string_types = (str, bytes)
def JavaCmd(verify=True, xmx='1G'):
  """Returns the leading argv entries for running the checked-in `java`.

  Args:
    verify: When False, '-noverify' is appended to the command.
    xmx: Heap limit, appended verbatim to '-Xmx'.

  Returns:
    A new list: [java binary, '-Xmx<xmx>'] plus '-noverify' if requested.
  """
  java_binary = os.path.join(JAVA_HOME, 'bin', 'java')
  # Limit heap to avoid Java not GC'ing when it should, and causing
  # bots to OOM when many java commands are running at the same time.
  # https://crbug.com/1098333
  cmd = [java_binary, '-Xmx' + xmx]
  if not verify:
    # Disabling bytecode verification for local builds gives a ~2% speed-up.
    cmd.append('-noverify')
  return cmd
@contextlib.contextmanager
def TempDir(**kwargs):
  """Context manager yielding a fresh temporary directory path.

  Args:
    **kwargs: Forwarded unchanged to tempfile.mkdtemp().

  Yields:
    The path of the created directory. The directory tree is removed when the
    context exits, whether normally or via an exception.
  """
  tmp_path = tempfile.mkdtemp(**kwargs)
  try:
    yield tmp_path
  finally:
    shutil.rmtree(tmp_path)
def MakeDirectory(dir_path):
  """Creates |dir_path| (and missing parents) unless it already exists.

  An empty |dir_path|, as produced by os.path.dirname('file'), is ignored.

  Args:
    dir_path: Directory to create.

  Raises:
    OSError: If creation failed and |dir_path| is not an existing directory
        (e.g. permission denied, or a path component is a regular file).
  """
  try:
    os.makedirs(dir_path)
  except OSError:
    # Only "nothing to do" cases are benign: the empty path, or a directory
    # that already exists (possibly created concurrently by another process).
    # Anything else would otherwise surface later as a confusing error.
    if dir_path and not os.path.isdir(dir_path):
      raise
def DeleteDirectory(dir_path):
  """Recursively removes |dir_path|; does nothing if the path is absent."""
  if not os.path.exists(dir_path):
    return
  shutil.rmtree(dir_path)
def Touch(path, fail_if_missing=False):
  """Updates the access/modification times of |path|, creating it if needed.

  Args:
    path: File to touch. Its parent directory is created via MakeDirectory.
    fail_if_missing: When True, raise instead of creating a missing file.

  Raises:
    Exception: If |fail_if_missing| is set and |path| does not exist.
  """
  if fail_if_missing:
    if not os.path.exists(path):
      raise Exception(path + " doesn't exist.")

  MakeDirectory(os.path.dirname(path))
  # Opening in append mode creates the file without truncating existing data.
  with open(path, 'a'):
    os.utime(path, None)
def FindInDirectory(directory, filename_filter='*'):
  """Lists files under |directory| whose basename matches a glob.

  Args:
    directory: Root of the tree to walk with os.walk().
    filename_filter: fnmatch-style pattern applied to file names only.

  Returns:
    A list of paths (each joined onto the walked root) in os.walk() order.
  """
  return [
      os.path.join(root, name)
      for root, _, names in os.walk(directory)
      for name in fnmatch.filter(names, filename_filter)
  ]
def ParseGnList(value):
  """Converts a "GN-list" command-line parameter into a list.

  Conversions handled:
    * None -> []
    * '' -> []
    * 'asdf' -> ['asdf']
    * '["a", "b"]' -> ['a', 'b']
    * ['["a", "b"]', 'c'] -> ['a', 'b', 'c'] (flattened list)

  The common use for this behavior is in the Android build where things can
  take lists of @FileArg references that are expanded via ExpandFileArgs.
  """
  # Any falsy value (None, '', []) becomes an empty list.
  if not value:
    return []

  # A list of GN lists is parsed element by element and flattened.
  if isinstance(value, list):
    return [item for element in value for item in ParseGnList(element)]

  # A plain string is wrapped as a single-element list.
  if not value.startswith('['):
    return [value]

  # Otherwise it is a serialized GN list.
  return gn_helpers.GNValueParser(value).ParseList()
def CheckOptions(options, parser, required=None):
  """Reports every required option that was left as None.

  Args:
    options: Parsed options object; attributes are read with getattr().
    parser: Object whose error(message) method is called per missing option.
    required: Iterable of attribute names that must not be None (optional).
  """
  for option_name in required or ():
    if getattr(options, option_name) is None:
      parser.error('--%s is required' % option_name.replace('_', '-'))
def WriteJson(obj, path, only_if_changed=False):
  """Serializes |obj| as sorted, 2-space-indented JSON into |path|.

  Args:
    obj: JSON-serializable object.
    path: Destination file path.
    only_if_changed: When True, leave |path| untouched if it already holds
        exactly the serialized text.
  """
  new_dump = json.dumps(obj, sort_keys=True, indent=2, separators=(',', ': '))

  # The previous contents only matter when a rewrite may be skipped. Reading
  # them unconditionally wastes I/O and can fail on an undecodable stale file.
  if only_if_changed and os.path.exists(path):
    with open(path, 'r') as old_file:
      if old_file.read() == new_dump:
        return

  with open(path, 'w') as out_file:
    out_file.write(new_dump)
@contextlib.contextmanager
def AtomicOutput(path, only_if_changed=True, mode='w+b'):
  """Helper to prevent half-written outputs.

  Args:
    path: Path to the final output file, which will be written atomically.
    only_if_changed: If True (the default), do not touch the filesystem
        if the content has not changed.
    mode: The mode to open the file in (str).

  Returns:
    A python context manager that yields a NamedTemporaryFile instance
    that must be used by clients to write the data to. On exit, the
    manager will try to replace the final output file with the
    temporary one if necessary. The temporary file is always destroyed
    on exit.

  Example:
    with build_utils.AtomicOutput(output_path) as tmp_file:
      subprocess.check_call(['prog', '--output', tmp_file.name])
  """
  # The temporary file lives next to |path| so the final move stays on one
  # filesystem.
  out_dir = os.path.dirname(path)
  if not os.path.exists(out_dir):
    MakeDirectory(out_dir)

  with tempfile.NamedTemporaryFile(
      mode, suffix=os.path.basename(path), dir=out_dir,
      delete=False) as tmp_file:
    tmp_name = tmp_file.name
    try:
      yield tmp_file

      # The file must be closed before it is compared or moved.
      tmp_file.close()
      unchanged = (only_if_changed and os.path.exists(path) and
                   filecmp.cmp(tmp_name, path))
      if not unchanged:
        shutil.move(tmp_name, path)
    finally:
      # Still present when the move was skipped or the body raised.
      if os.path.exists(tmp_name):
        os.unlink(tmp_name)
class CalledProcessError(Exception):
  """This exception is raised when the process run by CheckOutput
  exits with a non-zero exit code."""

  def __init__(self, cwd, args, output):
    """Records the failing command.

    Args:
      cwd: Working directory the command was run from.
      args: The command's argv sequence.
      output: Text to show below the command in the error message.
    """
    super(CalledProcessError, self).__init__()
    self.cwd = cwd
    self.args = args
    self.output = output

  def __str__(self):
    # The |pipes| module was removed in Python 3.13; shlex.quote is the
    # supported equivalent. Fall back to pipes only where shlex lacks quote()
    # (Python 2).
    try:
      from shlex import quote
    except ImportError:
      from pipes import quote

    # A user should be able to simply copy and paste the command that failed
    # into their shell.
    copyable_command = '( cd {}; {} )'.format(
        os.path.abspath(self.cwd), ' '.join(map(quote, self.args)))
    return 'Command failed: {}\n{}'.format(copyable_command, self.output)
def FilterLines(output, filter_string):
  """Output filter from build_utils.CheckOutput.

  Args:
    output: Executable output as from build_utils.CheckOutput.
    filter_string: An RE string that will filter (remove) matching
        lines from |output|.

  Returns:
    The filtered output, as a single string.
  """
  matcher = re.compile(filter_string)
  kept_lines = [
      line for line in output.split('\n') if matcher.search(line) is None
  ]
  return '\n'.join(kept_lines)
def FilterReflectiveAccessJavaWarnings(output):
  """Filters out warnings about illegal reflective access operation.

  These warnings were introduced in Java 9, and generally mean that dependencies
  need to be updated.
  """
  # Lines being removed look like:
  #  WARNING: An illegal reflective access operation has occurred
  #  WARNING: Illegal reflective access by ...
  #  WARNING: Please consider reporting this to the maintainers of ...
  #  WARNING: Use --illegal-access=warn to enable warnings of further ...
  #  WARNING: All illegal access operations will be denied in a future release
  warning_starts = (
      'An illegal reflective',
      'Illegal reflective access',
      'Please consider reporting this to',
      'Use --illegal-access=warn',
      'All illegal access operations',
  )
  pattern = 'WARNING: (' + '|'.join(warning_starts) + ')'
  return FilterLines(output, pattern)
# This can be used in most cases like subprocess.check_output(). The output,
# particularly when the command fails, better highlights the command's failure.
# If the command fails, raises a build_utils.CalledProcessError.
def CheckOutput(args,
                cwd=None,
                env=None,
                print_stdout=False,
                print_stderr=True,
                stdout_filter=None,
                stderr_filter=None,
                fail_on_output=True,
                fail_func=lambda returncode, stderr: returncode != 0):
  """Runs |args| to completion and returns its (filtered) stdout.

  Args:
    args: Command argv passed to subprocess.Popen.
    cwd: Working directory; the current directory when falsy.
    env: Environment passed to subprocess.Popen.
    print_stdout: Whether to echo the command's stdout to sys.stdout.
    print_stderr: Whether to echo the command's stderr to sys.stderr.
    stdout_filter: Optional callable applied to stdout text.
    stderr_filter: Optional callable applied to stderr text.
    fail_on_output: Raise if any echoed stream turned out to be non-empty.
    fail_func: Callable(returncode, stderr) deciding whether the run failed.

  Returns:
    The command's stdout after filtering.

  Raises:
    CalledProcessError: If |fail_func| reports failure, or if
        |fail_on_output| is set and an echoed stream was non-empty.
  """
  cwd = cwd or os.getcwd()

  process = subprocess.Popen(
      args, stdout=subprocess.PIPE, stderr=subprocess.PIPE, cwd=cwd, env=env)
  stdout, stderr = process.communicate()

  # For Python3 only:
  if isinstance(stdout, bytes) and sys.version_info >= (3, ):
    stdout = stdout.decode('utf-8')
    stderr = stderr.decode('utf-8')

  if stdout_filter is not None:
    stdout = stdout_filter(stdout)
  if stderr_filter is not None:
    stderr = stderr_filter(stderr)

  if fail_func and fail_func(process.returncode, stderr):
    raise CalledProcessError(cwd, args, stdout + stderr)

  # Echo the requested streams, remembering which ones actually had content.
  noisy_streams = []
  if print_stdout:
    sys.stdout.write(stdout)
    if stdout:
      noisy_streams.append('stdout')
  if print_stderr:
    sys.stderr.write(stderr)
    if stderr:
      noisy_streams.append('stderr')

  if fail_on_output and noisy_streams:
    message = ('Command failed because it wrote to {}.\n'
               'You can often set treat_warnings_as_errors=false to not treat '
               'output as failure (useful when developing locally).')
    raise CalledProcessError(cwd, args,
                             message.format(' and '.join(noisy_streams)))

  return stdout
def GetModifiedTime(path):
  """Returns the newer of |path|'s own mtime and the mtime of what it names.

  For a symlink, the modified time should be the greater of the link's
  modified time and the modified time of the target.
  """
  link_mtime = os.lstat(path).st_mtime
  target_mtime = os.stat(path).st_mtime
  return max(link_mtime, target_mtime)
def IsTimeStale(output, inputs):
  """Returns True if |output| is missing or older than any of |inputs|.

  Args:
    output: Path of the generated file.
    inputs: Iterable of input paths, compared using GetModifiedTime().
  """
  if not os.path.exists(output):
    return True

  output_time = GetModifiedTime(output)
  return any(GetModifiedTime(path) > output_time for path in inputs)
def _CheckZipPath(name):
if os.path.normpath(name) != name:
raise Exception('Non-canonical zip path: %s' % name)
if os.path.isabs(name):
raise Exception('Absolute zip path: %s' % name)
def _IsSymlink(zip_file, name):
zi = zip_file.getinfo(name)
# The two high-order bytes of ZipInfo.external_attr represent
# UNIX permissions and file type bits.
return stat.S_ISLNK(zi.external_attr >> 16)
def ExtractAll(zip_path, path=None, no_clobber=True, pattern=None,
               predicate=None):
  """Extracts entries of |zip_path| into |path|.

  Args:
    zip_path: Zip archive to read.
    path: Destination directory; the current directory when None. Created via
        MakeDirectory if it does not exist.
    no_clobber: Raise if an entry's destination path already exists.
    pattern: Optional fnmatch pattern; non-matching file entries are skipped.
    predicate: Optional callable(name); file entries for which it returns a
        falsy value are skipped.

  Returns:
    List of destination paths of the extracted file and symlink entries.

  Raises:
    Exception: If |zip_path| is not a zip file, an entry path fails
        _CheckZipPath, or |no_clobber| is violated.
  """
  if path is None:
    path = os.getcwd()
  elif not os.path.exists(path):
    MakeDirectory(path)

  if not zipfile.is_zipfile(zip_path):
    raise Exception('Invalid zip file: %s' % zip_path)

  extracted = []
  with zipfile.ZipFile(zip_path) as z:
    for name in z.namelist():
      dest = os.path.join(path, name)

      # Directory entries are always created, regardless of the filters.
      if name.endswith('/'):
        MakeDirectory(dest)
        continue
      if pattern is not None and not fnmatch.fnmatch(name, pattern):
        continue
      if predicate and not predicate(name):
        continue

      _CheckZipPath(name)
      if no_clobber and os.path.exists(dest):
        raise Exception(
            'Path already exists from zip: %s %s %s'
            % (zip_path, name, dest))

      if _IsSymlink(z, name):
        # The entry's data is the link target; recreate it as a symlink.
        MakeDirectory(os.path.dirname(dest))
        os.symlink(z.read(name), dest)
      else:
        z.extract(name, path)
      extracted.append(dest)

  return extracted
def HermeticDateTime(timestamp=None):
  """Returns a constant ZipInfo.date_time tuple.

  Args:
    timestamp: Unix timestamp to use for files in the archive.

  Returns:
    A ZipInfo.date_time tuple for Jan 1, 2001, or the given timestamp.
  """
  if timestamp:
    # The first six struct_time fields are year, month, day, hour, min, sec.
    return tuple(time.gmtime(timestamp)[:6])
  return (2001, 1, 1, 0, 0, 0)
def HermeticZipInfo(*args, **kwargs):
  """Creates a zipfile.ZipInfo with a constant timestamp and external_attr.

  If a date_time value is not provided in the positional or keyword arguments,
  the default value from HermeticDateTime is used.

  Args:
    See zipfile.ZipInfo.

  Returns:
    A zipfile.ZipInfo whose external_attr is set to 0o644 << 16.
  """
  # The caller may have provided a date_time either as a positional parameter
  # (args[1]) or as a keyword parameter. Use the default hermetic date_time if
  # none was provided.
  if len(args) >= 2:
    if not args[1]:
      # Substitute in place: also passing date_time as a keyword here would
      # make ZipInfo() fail with "multiple values for argument".
      args = (args[0], HermeticDateTime()) + tuple(args[2:])
  elif not kwargs.get('date_time'):
    kwargs['date_time'] = HermeticDateTime()

  ret = zipfile.ZipInfo(*args, **kwargs)
  ret.external_attr = (0o644 << 16)
  return ret
def AddToZipHermetic(zip_file,
                     zip_path,
                     src_path=None,
                     data=None,
                     compress=None,
                     date_time=None):
  """Adds a file to the given ZipFile with a hard-coded modified time.

  Args:
    zip_file: ZipFile instance to add the file to.
    zip_path: Destination path within the zip file (or ZipInfo instance).
    src_path: Path of the source file. Mutually exclusive with |data|.
    data: File data as a string.
    compress: Whether to enable compression. Default is taken from ZipFile
        constructor.
    date_time: The last modification date and time for the archive member.
        Only used when |zip_path| is not already a ZipInfo.
  """
  assert (src_path is None) != (data is None), (
      '|src_path| and |data| are mutually exclusive.')

  if isinstance(zip_path, zipfile.ZipInfo):
    zipinfo = zip_path
    zip_path = zipinfo.filename
  else:
    zipinfo = HermeticZipInfo(filename=zip_path, date_time=date_time)
  _CheckZipPath(zip_path)

  if src_path:
    if os.path.islink(src_path):
      zipinfo.filename = zip_path
      zipinfo.external_attr |= stat.S_IFLNK << 16  # mark as a symlink
      zip_file.writestr(zipinfo, os.readlink(src_path))
      return

    # zipfile.write() does
    #     external_attr = (os.stat(src_path)[0] & 0xFFFF) << 16
    # but the ZipInfo's existing attributes should be kept, so only the
    # executable bits are copied over from the source file.
    executable_bits = stat.S_IXUSR | stat.S_IXGRP | stat.S_IXOTH
    zipinfo.external_attr |= (os.stat(src_path).st_mode & executable_bits) << 16

    with open(src_path, 'rb') as src_file:
      data = src_file.read()

  # zipfile will deflate even when it makes the file bigger. To avoid
  # growing files, disable compression at an arbitrary cut off point.
  if len(data) < 16:
    compress = False

  # None converts to ZIP_STORED, when passed explicitly rather than the
  # default passed to the ZipFile constructor.
  compress_type = zip_file.compression
  if compress is not None:
    if compress:
      compress_type = zipfile.ZIP_DEFLATED
    else:
      compress_type = zipfile.ZIP_STORED
  zip_file.writestr(zipinfo, data, compress_type)
def DoZip(inputs,
          output,
          base_dir=None,
          compress_fn=None,
          zip_prefix_path=None,
          timestamp=None):
  """Creates a zip file from a list of files.

  Args:
    inputs: A list of paths to zip, or a list of (zip_path, fs_path) tuples.
    output: Path, fileobj, or ZipFile instance to add files to.
    base_dir: Prefix to strip from inputs.
    compress_fn: Applied to each input to determine whether or not to compress.
        When not given, the output ZipFile's own compression setting is used.
    zip_prefix_path: Path prepended to file path in zip file.
    timestamp: Unix timestamp to use for files in the archive.

  Raises:
    Exception: If a plain path input lies outside |base_dir|.
  """
  if base_dir is None:
    base_dir = '.'

  entries = []
  for item in inputs:
    if isinstance(item, string_types):
      relative = os.path.relpath(item, base_dir)
      if relative.startswith('..'):
        raise Exception('Invalid zip_path: ' + relative)
      item = (relative, item)
    entries.append(item)

  # Sort by zip path to ensure stable zip ordering.
  entries = sorted(entries, key=lambda entry: entry[0])

  # Only a ZipFile opened here is closed here; a caller-supplied one is not.
  owns_zip = not isinstance(output, zipfile.ZipFile)
  out_zip = zipfile.ZipFile(output, 'w') if owns_zip else output

  date_time = HermeticDateTime(timestamp)
  try:
    for zip_path, fs_path in entries:
      if zip_prefix_path:
        zip_path = os.path.join(zip_prefix_path, zip_path)
      should_compress = compress_fn(zip_path) if compress_fn else None
      AddToZipHermetic(out_zip,
                       zip_path,
                       src_path=fs_path,
                       compress=should_compress,
                       date_time=date_time)
  finally:
    if owns_zip:
      out_zip.close()
def ZipDir(output, base_dir, compress_fn=None, zip_prefix_path=None):
  """Creates a zip file from a directory.

  Args:
    output: Destination path, or a ZipFile instance to add entries to. A path
        is written through AtomicOutput.
    base_dir: Directory whose files (found with os.walk) are archived.
    compress_fn: Forwarded to DoZip.
    zip_prefix_path: Forwarded to DoZip.
  """
  inputs = [
      os.path.join(root, name)
      for root, _, names in os.walk(base_dir)
      for name in names
  ]

  if isinstance(output, zipfile.ZipFile):
    DoZip(
        inputs,
        output,
        base_dir,
        compress_fn=compress_fn,
        zip_prefix_path=zip_prefix_path)
    return

  with AtomicOutput(output) as tmp_file:
    DoZip(
        inputs,
        tmp_file,
        base_dir,
        compress_fn=compress_fn,
        zip_prefix_path=zip_prefix_path)
def MatchesGlob(path, filters):
  """Returns whether the given path matches any of the given glob patterns.

  Args:
    path: Path to test.
    filters: Iterable of fnmatch-style patterns; may be None or empty.

  Returns:
    True if at least one pattern matches, otherwise False. A missing or empty
    |filters| yields False rather than the falsy |filters| object itself.
  """
  if not filters:
    return False
  return any(fnmatch.fnmatch(path, pattern) for pattern in filters)
def MergeZips(output, input_zips, path_transform=None, compress=None):
  """Combines all files from |input_zips| into |output|.

  When several inputs map to the same destination name, only the first one
  encountered is written.

  Args:
    output: Path, fileobj, or ZipFile instance to add files to.
    input_zips: Iterable of paths to zip files to merge.
    path_transform: Called for each entry path. Returns a new path, or None to
        skip the file.
    compress: Overrides compression setting from origin zip entries.
  """
  transform = path_transform or (lambda p: p)
  seen_names = set()

  # Only a ZipFile opened here is closed here; a caller-supplied one is not.
  owns_zip = not isinstance(output, zipfile.ZipFile)
  out_zip = zipfile.ZipFile(output, 'w') if owns_zip else output

  try:
    for in_path in input_zips:
      with zipfile.ZipFile(in_path, 'r') as in_zip:
        for info in in_zip.infolist():
          # Ignore directories.
          if info.filename[-1] == '/':
            continue
          dst_name = transform(info.filename)
          if not dst_name or dst_name in seen_names:
            continue

          if compress is None:
            # Keep whatever the source entry used.
            compress_entry = info.compress_type != zipfile.ZIP_STORED
          else:
            compress_entry = compress
          AddToZipHermetic(
              out_zip,
              dst_name,
              data=in_zip.read(info),
              compress=compress_entry)
          seen_names.add(dst_name)
  finally:
    if owns_zip:
      out_zip.close()
def GetSortedTransitiveDependencies(top, deps_func):
  """Gets the list of all transitive dependencies in sorted order.

  There should be no cycles in the dependency graph (crashes if cycles exist).

  Args:
    top: A list of the top level nodes
    deps_func: A function that takes a node and returns a list of its direct
        dependencies.

  Returns:
    A list of all transitive dependencies of nodes in top, in order (a node will
    appear in the list at a higher index than all of its dependencies).
  """
  # Depth-first post-order walk: a node is emitted only after all of its
  # dependencies, and ties keep the order in which nodes were first reached.
  ordered = []
  finished = set()

  def visit_all(nodes):
    for node in nodes:
      if node in finished:
        continue
      visit_all(deps_func(node))
      finished.add(node)
      ordered.append(node)

  visit_all(top)
  return ordered
def InitLogging(enabling_env):
  """Configures the root logger and logs script start and exit.

  Args:
    enabling_env: Name of an environment variable; a non-empty value selects
        DEBUG level, otherwise WARNING is used.
  """
  if os.environ.get(enabling_env):
    level = logging.DEBUG
  else:
    level = logging.WARNING
  logging.basicConfig(
      level=level,
      format='%(levelname).1s %(process)d %(relativeCreated)6d %(message)s')

  script_name = os.path.basename(sys.argv[0])
  logging.info('Started (%s)', script_name)

  starting_pid = os.getpid()

  def log_exit():
    # Do not log for fork'ed processes.
    if os.getpid() != starting_pid:
      return
    logging.info("Job's done (%s)", script_name)

  atexit.register(log_exit)
def AddDepfileOption(parser):
  """Registers the --depfile flag on an optparse or argparse parser."""
  # TODO(agrieve): Get rid of this once we've moved to argparse.
  # optparse parsers expose add_option(); anything else is assumed to provide
  # argparse's add_argument().
  add_flag = (parser.add_option
              if hasattr(parser, 'add_option') else parser.add_argument)
  add_flag('--depfile',
           help='Path to depfile (refer to `gn help depfile`)')
def WriteDepfile(depfile_path, first_gn_output, inputs=None):
  """Writes a depfile with a single "<output>: <inputs...>" line.

  Spaces inside paths are backslash-escaped.

  Args:
    depfile_path: Where to write the depfile; its directory is created.
    first_gn_output: The output path to name in the depfile.
    inputs: Optional iterable of input paths (must not be a single string).
  """
  assert depfile_path != first_gn_output  # http://crbug.com/646165
  assert not isinstance(inputs, string_types)  # Easy mistake to make
  inputs = inputs or []
  MakeDirectory(os.path.dirname(depfile_path))

  def escape(file_path):
    return file_path.replace(' ', '\\ ')

  # Ninja does not support multiple outputs in depfiles.
  with open(depfile_path, 'w') as depfile:
    target = escape(first_gn_output)
    dependencies = ' '.join(escape(i) for i in inputs)
    depfile.write(target + ': ' + dependencies + '\n')
def _SplitFlattenSuffix(key):
  """Returns (key without a trailing '[]', whether the suffix was present)."""
  if key.endswith('[]'):
    return key[:-2], True
  return key, False


def ExpandFileArgs(args):
  """Replaces file-arg placeholders in args.

  These placeholders have the form:
    @FileArg(filename:key1:key2:...:keyn)

  The value of such a placeholder is calculated by reading 'filename' as json.
  And then extracting the value at [key1][key2]...[keyn]. If a key has a '[]'
  suffix the (intermediate) value will be interpreted as a single item list and
  the single item will be returned or used for further traversal.

  Only the first placeholder found in each argument is expanded.

  Note: This intentionally does not return the list of files that appear in such
  placeholders. An action that uses file-args *must* know the paths of those
  files prior to the parsing of the arguments (typically by explicitly listing
  them in the action's inputs in build files).

  Args:
    args: Iterable of argument strings; it is not modified.

  Returns:
    A new list of arguments with placeholders replaced.

  Raises:
    Exception: If a '[]' key does not refer to a single-item list.
  """
  new_args = list(args)
  # Parsed JSON keyed by file path, so each file is loaded at most once.
  file_jsons = {}
  # Raw string: '\(' in a plain literal is an invalid escape sequence.
  file_arg_re = re.compile(r'@FileArg\((.*?)\)')
  for i, arg in enumerate(args):
    match = file_arg_re.search(arg)
    if not match:
      continue

    lookup_path = match.group(1).split(':')
    file_path, _ = _SplitFlattenSuffix(lookup_path[0])
    if file_path not in file_jsons:
      with open(file_path) as f:
        file_jsons[file_path] = json.load(f)

    # The first lookup key is the file path itself, so start from the cache.
    expansion = file_jsons
    for k in lookup_path:
      k, flatten = _SplitFlattenSuffix(k)
      expansion = expansion[k]
      if flatten:
        if not isinstance(expansion, list) or len(expansion) != 1:
          raise Exception('Expected single item list but got %s' % expansion)
        expansion = expansion[0]

    # This should match ParseGnList. The output is either a GN-formatted list
    # or a literal (with no quotes).
    if isinstance(expansion, list):
      replacement = gn_helpers.ToGNString(expansion)
    else:
      replacement = str(expansion)
    new_args[i] = arg[:match.start()] + replacement + arg[match.end():]
  return new_args
def ReadSourcesList(sources_list_file_name):
  """Reads a GN-written file containing list of file names and returns a list.

  Each line is returned with surrounding whitespace stripped.

  Note that this function should not be used to parse response files.
  """
  file_names = []
  with open(sources_list_file_name) as sources_file:
    for line in sources_file:
      file_names.append(line.strip())
  return file_names