"""
                    The LLVM Compiler Infrastructure

This file is distributed under the University of Illinois Open Source
License. See LICENSE.TXT for details.

Provides classes used by the test results reporting infrastructure
within the LLDB test suite.
"""
from __future__ import print_function
from __future__ import absolute_import
# System modules
import argparse
import os
import re
import sys
import threading
# Third-party modules
# LLDB modules
from lldbsuite.test import configuration
from ..event_builder import EventBuilder
import lldbsuite
FILE_LEVEL_KEY_RE = re.compile(r"^(.+\.py)[^.:]*$")
class ResultsFormatter(object):
"""Provides interface to formatting test results out to a file-like object.
This class allows the LLDB test framework's raw test-related
events to be processed and formatted in any manner desired.
    Test events are represented by Python dictionaries, built and
    formatted by the EventBuilder class (see the event_builder module).
    ResultsFormatter instances are given a file-like object in which
    to write their results.

    ResultsFormatter lifetime looks like the following:
# The result formatter is created.
# The argparse options dictionary is generated from calling
# the SomeResultFormatter.arg_parser() with the options data
    # passed to dotest.py via the "--results-formatter-options"
# argument. See the help on that for syntactic requirements
# on getting that parsed correctly.
formatter = SomeResultFormatter(file_like_object, argparse_options_dict)
    # Single call to session start, before parsing any events.
    formatter.begin_session()
# Zero or more calls specified for events recorded during the test session.
# The parallel test runner manages getting results from all the inferior
# dotest processes, so from a new format perspective, don't worry about
# that. The formatter will be presented with a single stream of events
# sandwiched between a single begin_session()/end_session() pair in the
# parallel test runner process/thread.
    for event in zero_or_more_test_events():
        formatter.handle_event(event)
# Single call to terminate/wrap-up. For formatters that need all the
# data before they can print a correct result (e.g. xUnit/JUnit),
    # this is where the final report can be generated.
    formatter.handle_event({"event": "terminate", ...})
It is not the formatter's responsibility to close the file_like_object.
(i.e. do not close it).
    The lldb test framework passes these test events in real time, so they
    arrive as the test session progresses rather than in one batch at the end.
In the case of the parallel test runner, the dotest inferiors
add a 'pid' field to the dictionary that indicates which inferior
pid generated the event.
Note more events may be added in the future to support richer test
reporting functionality. One example: creating a true flaky test
result category so that unexpected successes really mean the test
is marked incorrectly (either should be marked flaky, or is indeed
passing consistently now and should have the xfail marker
removed). In this case, a flaky_success and flaky_fail event
likely will be added to capture these and support reporting things
    like percentages of flaky tests passing so we can see if we're
making some things worse/better with regards to failure rates.
Another example: announcing all the test methods that are planned
to be run, so we can better support redo operations of various kinds
(redo all non-run tests, redo non-run tests except the one that
was running [perhaps crashed], etc.)
Implementers are expected to override all the public methods
provided in this class. See each method's docstring to see
    expectations about when the call should be chained.
    """
    @classmethod
    def arg_parser(cls):
        """@return arg parser used to parse formatter-specific options."""
        parser = argparse.ArgumentParser(
            description='{} options'.format(cls.__name__),
            usage=('dotest.py --results-formatter-options='
                   '"--option1 value1 [--option2 value2 [...]]"'))
        parser.add_argument(
            "--dump-results",
            action="store_true",
            help=('dump the raw results data after printing '
                  'the summary output.'))
        return parser
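    # Illustrative sketch only (not part of this class's API): the test
    # driver is expected to split the "--results-formatter-options" string
    # and hand it to this parser, roughly along the lines of:
    #   options = SomeResultFormatter.arg_parser().parse_args(
    #       shlex.split('--dump-results'))
    #   formatter = SomeResultFormatter(sys.stdout, options, False)
    # The exact splitting/quoting rules are owned by the driver, not here.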
def __init__(self, out_file, options, file_is_stream):
super(ResultsFormatter, self).__init__()
self.out_file = out_file
self.options = options
self.using_terminal = False
if not self.out_file:
raise Exception("ResultsFormatter created with no file object")
self.start_time_by_test = {}
self.terminate_called = False
self.file_is_stream = file_is_stream
# Track the most recent test start event by worker index.
# We'll use this to assign TIMEOUT and exceptional
# exits to the most recent test started on a given
# worker index.
self.started_tests_by_worker = {}
# Store the most recent test_method/job status.
self.result_events = {}
# Track the number of test method reruns.
self.test_method_rerun_count = 0
        # Lock that we use while mutating inner state, like the
        # total test count and the elements.  We hold the lock only
        # long enough to keep inner state safe, not to make it appear
        # fully consistent from the outside.
self.lock = threading.RLock()
# Keeps track of the test base filenames for tests that
# are expected to timeout. If a timeout occurs in any test
# basename that matches this list, that result should be
# converted into a non-issue. We'll create an expected
# timeout test status for this.
self.expected_timeouts_by_basename = set()
# Tests which have reported that they are expecting to fail. These will
# be marked as expected failures even if they return a failing status,
# probably because they crashed or deadlocked.
self.expected_failures = set()
# Keep track of rerun-eligible tests.
# This is a set that contains tests saved as:
# {test_filename}:{test_class}:{test_name}
self.rerun_eligible_tests = set()
# A dictionary of test files that had a failing
# test, in the format of:
# key = test path, value = array of test methods that need rerun
self.tests_for_rerun = {}
    @classmethod
    def _make_key(cls, result_event):
"""Creates a key from a test or job result event.
This key attempts to be as unique as possible. For
test result events, it will be unique per test method.
For job events (ones not promoted to a test result event),
it will be unique per test case file.
        @return a string-based key of the form:
          {test_filename}:{test_class}.{test_name}
        """
if result_event is None:
return None
component_count = 0
if "test_filename" in result_event:
key = result_event["test_filename"]
            component_count += 1
        else:
            key = "<no_filename>"
if "test_class" in result_event:
if component_count > 0:
key += ":"
key += result_event["test_class"]
component_count += 1
if "test_name" in result_event:
if component_count > 0:
key += "."
key += result_event["test_name"]
component_count += 1
return key
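    # Example key shapes (hypothetical names): a full test_result event with
    # test_filename "TestFoo.py", test_class "FooTestCase" and test_name
    # "test_bar" produces "TestFoo.py:FooTestCase.test_bar", while a job-level
    # event carrying only a test_filename produces just "TestFoo.py".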
    @classmethod
    def _is_file_level_issue(cls, key, event):
"""Returns whether a given key represents a file-level event.
@param cls this class. Unused, but following PEP8 for
preferring @classmethod over @staticmethod.
@param key the key for the issue being tested.
@param event the event for the issue being tested.
@return True when the given key (as made by _make_key())
represents an event that is at the test file level (i.e.
        it isn't scoped to a test class or method).
        """
if key is None:
return False
return FILE_LEVEL_KEY_RE.match(key) is not None
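    # Illustration (hypothetical keys): FILE_LEVEL_KEY_RE accepts keys that
    # stop at the .py filename, e.g. "TestFoo.py", but rejects method-scoped
    # keys such as "TestFoo.py:FooTestCase.test_bar", because everything
    # after the filename must be free of '.' and ':' characters.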
def _mark_test_as_expected_failure(self, test_result_event):
key = self._make_key(test_result_event)
        if key is not None:
            self.expected_failures.add(key)
        else:
            sys.stderr.write(
                "\nerror: test marked as expected failure but "
                "failed to create key.\n")
def _mark_test_for_rerun_eligibility(self, test_result_event):
key = self._make_key(test_result_event)
        if key is not None:
            self.rerun_eligible_tests.add(key)
        else:
            sys.stderr.write(
                "\nerror: test marked for re-run eligibility but "
                "failed to create key.\n")
def _maybe_add_test_to_rerun_list(self, result_event):
key = self._make_key(result_event)
        if key is not None:
            if (key in self.rerun_eligible_tests or
                    configuration.rerun_all_issues):
                test_filename = result_event.get("test_filename", None)
                if test_filename is not None:
                    test_name = result_event.get("test_name", None)
                    if test_filename not in self.tests_for_rerun:
                        self.tests_for_rerun[test_filename] = []
                    if test_name is not None:
                        self.tests_for_rerun[test_filename].append(test_name)
        else:
            sys.stderr.write(
                "\nerror: couldn't add testrun-failing test to rerun "
                "list because no eligibility key could be created.\n")
def _maybe_remap_job_result_event(self, test_event):
"""Remaps timeout/exceptional exit job results to last test method running.
@param test_event the job_result test event. This is an in/out
parameter. It will be modified if it can be mapped to a test_result
of the same status, using details from the last-running test method
        known to be most recently started on the same worker index.
        """
test_start = None
job_status = test_event["status"]
        if job_status in [
                EventBuilder.STATUS_TIMEOUT,
                EventBuilder.STATUS_EXCEPTIONAL_EXIT]:
worker_index = test_event.get("worker_index", None)
if worker_index is not None:
test_start = self.started_tests_by_worker.get(
worker_index, None)
# If we have a test start to remap, do it here.
if test_start is not None:
test_event["event"] = EventBuilder.TYPE_TEST_RESULT
# Fill in all fields from test start not present in
# job status message.
for (start_key, start_value) in test_start.items():
if start_key not in test_event:
test_event[start_key] = start_value
def _maybe_remap_expected_timeout(self, event):
        if event is None:
            return
        status = event.get("status", None)
        if status is None or status != EventBuilder.STATUS_TIMEOUT:
            return
# Check if the timeout test's basename is in the expected timeout
# list. If so, convert to an expected timeout.
basename = os.path.basename(event.get("test_filename", ""))
if basename in self.expected_timeouts_by_basename:
# Convert to an expected timeout.
event["status"] = EventBuilder.STATUS_EXPECTED_TIMEOUT
def _maybe_remap_expected_failure(self, event):
        if event is None:
            return
        key = self._make_key(event)
        if key not in self.expected_failures:
            return
status = event.get("status", None)
if status in EventBuilder.TESTRUN_ERROR_STATUS_VALUES:
event["status"] = EventBuilder.STATUS_EXPECTED_FAILURE
elif status == EventBuilder.STATUS_SUCCESS:
event["status"] = EventBuilder.STATUS_UNEXPECTED_SUCCESS
def handle_event(self, test_event):
"""Handles the test event for collection into the formatter output.
Derived classes may override this but should call down to this
implementation first.
@param test_event the test event as formatted by one of the
        event_for_* calls.
        """
with self.lock:
# Keep track of whether terminate was received. We do this so
# that a process can call the 'terminate' event on its own, to
# close down a formatter at the appropriate time. Then the
# atexit() cleanup can call the "terminate if it hasn't been
# called yet".
if test_event is not None:
event_type = test_event.get("event", "")
# We intentionally allow event_type to be checked anew
# after this check below since this check may rewrite
# the event type
                if event_type == EventBuilder.TYPE_JOB_RESULT:
                    # Possibly convert the job status (timeout, exceptional
                    # exit) to an appropriate test_result event.
                    self._maybe_remap_job_result_event(test_event)
                    event_type = test_event.get("event", "")
                # Remap timeouts to expected timeouts.
                if event_type in EventBuilder.RESULT_TYPES:
                    self._maybe_remap_expected_timeout(test_event)
                    self._maybe_remap_expected_failure(test_event)
                    event_type = test_event.get("event", "")
if event_type == "terminate":
self.terminate_called = True
elif event_type in EventBuilder.RESULT_TYPES:
# Clear the most recently started test for the related
# worker.
worker_index = test_event.get("worker_index", None)
if worker_index is not None:
self.started_tests_by_worker.pop(worker_index, None)
status = test_event["status"]
if status in EventBuilder.TESTRUN_ERROR_STATUS_VALUES:
                        # A test/job status value in any of those status
                        # values causes a testrun failure.  If such a test
                        # fails, check whether it can be rerun.  If it can
                        # be rerun, add it to the rerun job.
                        self._maybe_add_test_to_rerun_list(test_event)

                    # Build the test key.
test_key = self._make_key(test_event)
if test_key is None:
raise Exception(
"failed to find test filename for "
"test event {}".format(test_event))
# Save the most recent test event for the test key. This
# allows a second test phase to overwrite the most recent
# result for the test key (unique per method). We do final
# reporting at the end, so we'll report based on final
# results. We do this so that a re-run caused by, perhaps,
# the need to run a low-load, single-worker test run can
# have the final run's results to always be used.
if test_key in self.result_events:
self.test_method_rerun_count += 1
self.result_events[test_key] = test_event
elif event_type == EventBuilder.TYPE_TEST_START:
                    # Track the start time for the test method.
                    self.track_start_time(
                        test_event["test_class"],
                        test_event["test_name"],
                        test_event["event_time"])
                    # Track the most recent test method start event
# for the related worker. This allows us to figure
# out whether a process timeout or exceptional exit
# can be charged (i.e. assigned) to a test method.
worker_index = test_event.get("worker_index", None)
if worker_index is not None:
self.started_tests_by_worker[worker_index] = test_event
                elif event_type == EventBuilder.TYPE_MARK_TEST_RERUN_ELIGIBLE:
                    self._mark_test_for_rerun_eligibility(test_event)
                elif (event_type ==
                      EventBuilder.TYPE_MARK_TEST_EXPECTED_FAILURE):
                    self._mark_test_as_expected_failure(test_event)
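    # For reference, a minimal test_result-style event dictionary, using only
    # the fields this method actually reads (values here are hypothetical;
    # real events built by EventBuilder carry more fields), might look like:
    #   {"event": EventBuilder.TYPE_TEST_RESULT,
    #    "status": EventBuilder.STATUS_SUCCESS,
    #    "test_filename": "TestFoo.py",
    #    "test_class": "FooTestCase",
    #    "test_name": "test_bar",
    #    "worker_index": 3}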
def set_expected_timeouts_by_basename(self, basenames):
"""Specifies a list of test file basenames that are allowed to timeout
without being called out as a timeout issue.
        These fall into a new status category called STATUS_EXPECTED_TIMEOUT.
        """
        if basenames is not None:
            for basename in basenames:
                self.expected_timeouts_by_basename.add(basename)
def track_start_time(self, test_class, test_name, start_time):
"""tracks the start time of a test so elapsed time can be computed.
this alleviates the need for test results to be processed serially
by test. it will save the start time for the test so that
        elapsed_time_for_test() can compute the elapsed time properly.
        """
        if test_class is None or test_name is None:
            return
test_key = "{}.{}".format(test_class, test_name)
self.start_time_by_test[test_key] = start_time
def elapsed_time_for_test(self, test_class, test_name, end_time):
"""returns the elapsed time for a test.
this function can only be called once per test and requires that
the track_start_time() method be called sometime prior to calling
        this method.
        """
if test_class is None or test_name is None:
return -2.0
test_key = "{}.{}".format(test_class, test_name)
if test_key not in self.start_time_by_test:
return -1.0
start_time = self.start_time_by_test[test_key]
del self.start_time_by_test[test_key]
return end_time - start_time
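    # Sketch of the intended pairing (timestamps are hypothetical):
    #   formatter.track_start_time("FooTestCase", "test_bar", 100.0)
    #   ...
    #   formatter.elapsed_time_for_test("FooTestCase", "test_bar", 102.5)
    # returns 2.5; asking again for the same test returns -1.0 because the
    # stored start time is consumed on first use.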
def is_using_terminal(self):
"""returns true if this results formatter is using the terminal and
output should be avoided."""
return self.using_terminal
def send_terminate_as_needed(self):
"""sends the terminate event if it hasn't been received yet."""
if not self.terminate_called:
            terminate_event = EventBuilder.bare_event("terminate")
            self.handle_event(terminate_event)
# Derived classes may require self access
# pylint: disable=no-self-use
    # noinspection PyMethodMayBeStatic
def replaces_summary(self):
"""Returns whether the results formatter includes a summary
suitable to replace the old lldb test run results.
@return True if the lldb test runner can skip its summary
        generation when using this results formatter; False otherwise.
        """
return False
def counts_by_test_result_status(self, status):
"""Returns number of test method results for the given status.
        @param status a test result status (e.g. success, fail, skip)
        as defined by the EventBuilder.STATUS_* class members.

        @return an integer giving the number of test methods matching
        the given test result status.
        """
return len([
[key, event] for (key, event) in self.result_events.items()
if event.get("status", "") == status])
    @classmethod
    def _event_sort_key(cls, event):
"""Returns the sort key to be used for a test event.
This method papers over the differences in a test method result vs. a
job (i.e. inferior process) result.
@param event a test result or job result event.
@return a key useful for sorting events by name (test name preferably,
        then by test filename).
        """
if "test_name" in event:
return event["test_name"]
return event.get("test_filename", None)
def _partition_results_by_status(self, categories):
"""Partitions the captured test results by event status.
This permits processing test results by the category ids.
@param categories the list of categories on which to partition.
Follows the format described in _report_category_details().
@return a dictionary where each key is the test result status,
and each entry is a list containing all the test result events
that matched that test result status. Result status IDs with
        no matching entries will have a zero-length list.
        """
partitioned_events = {}
for category in categories:
result_status_id = category[0]
matching_events = [
[key, event] for (key, event) in self.result_events.items()
if event.get("status", "") == result_status_id]
            partitioned_events[result_status_id] = sorted(
                matching_events,
                key=lambda x: self._event_sort_key(x[1]))
return partitioned_events
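    # Shape of the returned mapping (statuses and keys are illustrative):
    #   {EventBuilder.STATUS_SUCCESS: [[key_a, event_a], [key_b, event_b]],
    #    EventBuilder.STATUS_FAILURE: [],
    #    ...}
    # i.e. one entry per category id passed in, each holding [key, event]
    # pairs sorted by _event_sort_key().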
    @staticmethod
    def _print_banner(out_file, banner_text):
"""Prints an ASCII banner around given text.
Output goes to the out file for the results formatter.
@param out_file a file-like object where output will be written.
@param banner_text the text to display, with a banner
        of '=' around the line above and line below.
        """
        banner_separator = "".ljust(len(banner_text), "=")
        out_file.write("\n{}\n{}\n{}\n".format(
            banner_separator,
            banner_text,
            banner_separator))
def _print_summary_counts(
self, out_file, categories, result_events_by_status, extra_rows):
"""Prints summary counts for all categories.
@param out_file a file-like object used to print output.
@param categories the list of categories on which to partition.
Follows the format described in _report_category_details().
@param result_events_by_status the partitioned list of test
result events in a dictionary, with the key set to the test
result status id and the value set to the list of test method
        results that match the status id.

        @param extra_rows an optional list of [row_label, row_value] entries
        printed ahead of the category counts (e.g. totals); may be None.
        """
# Get max length for category printed name
category_with_max_printed_name = max(
categories, key=lambda x: len(x[1]))
max_category_name_length = len(category_with_max_printed_name[1])
# If we are provided with extra rows, consider these row name lengths.
if extra_rows is not None:
for row in extra_rows:
name_length = len(row[0])
if name_length > max_category_name_length:
max_category_name_length = name_length
self._print_banner(out_file, "Test Result Summary")
# Prepend extra rows
if extra_rows is not None:
for row in extra_rows:
extra_label = "{}:".format(row[0]).ljust(
max_category_name_length + 1)
out_file.write("{} {:4}\n".format(extra_label, row[1]))
for category in categories:
result_status_id = category[0]
result_label = "{}:".format(category[1]).ljust(
max_category_name_length + 1)
count = len(result_events_by_status[result_status_id])
            out_file.write("{} {:4}\n".format(
                result_label, count))
    @classmethod
    def _has_printable_details(cls, categories, result_events_by_status):
"""Returns whether there are any test result details that need to be printed.
This will spin through the results and see if any result in a category
that is printable has any results to print.
@param categories the list of categories on which to partition.
Follows the format described in _report_category_details().
@param result_events_by_status the partitioned list of test
result events in a dictionary, with the key set to the test
result status id and the value set to the list of test method
results that match the status id.
@return True if there are any details (i.e. test results
        for failures, errors, unexpected successes); False otherwise.
        """
for category in categories:
result_status_id = category[0]
print_matching_tests = category[2]
if print_matching_tests:
if len(result_events_by_status[result_status_id]) > 0:
# We found a printable details test result status
# that has details to print.
return True
# We didn't find any test result category with printable
# details.
return False
    @staticmethod
    def _report_category_details(out_file, category, result_events_by_status):
"""Reports all test results matching the given category spec.
@param out_file a file-like object used to print output.
        @param category a category spec of the format [result_status_id,
        printed_category_name, print_matching_entries?, detail_label]
@param result_events_by_status the partitioned list of test
result events in a dictionary, with the key set to the test
result status id and the value set to the list of test method
        results that match the status id.
        """
result_status_id = category[0]
print_matching_tests = category[2]
detail_label = category[3]
if print_matching_tests:
# Sort by test name
for (_, event) in result_events_by_status[result_status_id]:
# Convert full test path into test-root-relative.
                test_relative_path = os.path.relpath(
                    os.path.realpath(event["test_filename"]),
                    lldbsuite.lldb_test_root)
# Create extra info component (used for exceptional exit info)
if result_status_id == EventBuilder.STATUS_EXCEPTIONAL_EXIT:
                    extra_info = "[EXCEPTIONAL EXIT {} ({})] ".format(
                        event["exception_code"],
                        event["exception_description"])
                else:
                    extra_info = ""
# Figure out the identity we will use for this test.
if configuration.verbose and ("test_class" in event):
test_id = "{}.{}".format(
event["test_class"], event["test_name"])
elif "test_name" in event:
                    test_id = event["test_name"]
                else:
                    test_id = "<no_running_test_method>"
# Display the info.
                out_file.write("{}: {}{} ({})\n".format(
                    detail_label, extra_info, test_id, test_relative_path))
def print_results(self, out_file):
"""Writes the test result report to the output file.
@param out_file a file-like object used for printing summary
results. This is different than self.out_file, which might
        be something else for non-summary data.
        """
extra_results = [
# Total test methods processed, excluding reruns.
["Test Methods", len(self.result_events)],
["Reruns", self.test_method_rerun_count]]
# Output each of the test result entries.
        categories = [
            # result id, printed name, print matching tests?, detail label
            [EventBuilder.STATUS_SUCCESS,
             "Success", False, None],
            [EventBuilder.STATUS_EXPECTED_FAILURE,
             "Expected Failure", False, None],
            [EventBuilder.STATUS_FAILURE,
             "Failure", True, "FAIL"],
            [EventBuilder.STATUS_ERROR,
             "Error", True, "ERROR"],
            [EventBuilder.STATUS_EXCEPTIONAL_EXIT,
             "Exceptional Exit", True, "ERROR"],
            [EventBuilder.STATUS_UNEXPECTED_SUCCESS,
             "Unexpected Success", True, "UNEXPECTED SUCCESS"],
            [EventBuilder.STATUS_SKIP, "Skip", False, None],
            [EventBuilder.STATUS_TIMEOUT,
             "Timeout", True, "TIMEOUT"],
            [EventBuilder.STATUS_EXPECTED_TIMEOUT,
             # Intentionally using the unusual hyphenation in TIME-OUT to
             # prevent buildbots from thinking it is an issue when scanning
             # for TIMEOUT.
             "Expected Timeout", True, "EXPECTED TIME-OUT"]]
# Partition all the events by test result status
        result_events_by_status = self._partition_results_by_status(
            categories)
# Print the details
have_details = self._has_printable_details(
categories, result_events_by_status)
if have_details:
self._print_banner(out_file, "Issue Details")
            for category in categories:
                self._report_category_details(
                    out_file, category, result_events_by_status)
        # Print the summary
        self._print_summary_counts(
            out_file, categories, result_events_by_status, extra_results)
if self.options.dump_results:
# Debug dump of the key/result info for all categories.
self._print_banner(out_file, "Results Dump")
for status, events_by_key in result_events_by_status.items():
out_file.write("\nSTATUS: {}\n".format(status))
for key, event in events_by_key:
out_file.write("key: {}\n".format(key))
out_file.write("event: {}\n".format(event))
def clear_file_level_issues(self, tests_for_rerun, out_file):
"""Clear file-charged issues in any of the test rerun files.
@param tests_for_rerun the list of test-dir-relative paths that have
functions that require rerunning. This is the test list
        returned by the results_formatter at the end of the previous run.

        @param out_file a file-like object used to report any issues that
        get cleared; may be None to suppress that output.

        @return the number of file-level issues that were cleared.
        """
if tests_for_rerun is None:
return 0
cleared_file_level_issues = 0
# Find the unique set of files that are covered by the given tests
# that are to be rerun. We derive the files that are eligible for
# having their markers cleared, because we support running in a mode
# where only flaky tests are eligible for rerun. If the file-level
# issue occurred in a file that was not marked as flaky, then we
# shouldn't be clearing the event here.
basename_set = set()
        for test_file_relpath in tests_for_rerun:
            basename_set.add(os.path.basename(test_file_relpath))
# Find all the keys for file-level events that are considered
# test issues.
file_level_issues = [(key, event)
for key, event in self.result_events.items()
if ResultsFormatter._is_file_level_issue(
key, event)
                             and event.get("status", "") in
                             EventBuilder.TESTRUN_ERROR_STATUS_VALUES]
# Now remove any file-level error for the given test base name.
for key, event in file_level_issues:
# If the given file base name is in the rerun set, then we
# clear that entry from the result set.
if os.path.basename(key) in basename_set:
self.result_events.pop(key, None)
cleared_file_level_issues += 1
                if out_file is not None:
                    out_file.write(
                        "clearing file-level issue for file {} "
"(issue type: {})"
.format(key, event.get("status", "<unset-status>")))
return cleared_file_level_issues