third_party/blink/tools/blinkpy/web_tests/controllers/web_test_runner.py - chromium/src - Git at Google

 # Copyright (C) 2011 Google Inc. All rights reserved.
 #
 # Redistribution and use in source and binary forms, with or without
 # modification, are permitted provided that the following conditions are
 # met:
 #
 #     * Redistributions of source code must retain the above copyright
 # notice, this list of conditions and the following disclaimer.
 #     * Redistributions in binary form must reproduce the above
 # copyright notice, this list of conditions and the following disclaimer
 # in the documentation and/or other materials provided with the
 # distribution.
 #     * Neither the name of Google Inc. nor the names of its
 # contributors may be used to endorse or promote products derived from
 # this software without specific prior written permission.
 #
 # THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
 # "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
 # LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
 # A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
 # OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
 # SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
 # LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
 # DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
 # THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
 # (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
 # OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

 import collections
 import itertools
 import logging
 import math
 import time

 from blinkpy.common import message_pool
 from blinkpy.tool import grammar
 from blinkpy.web_tests.controllers import single_test_runner
 from blinkpy.web_tests.models.test_run_results import TestRunResults
 from blinkpy.web_tests.models import test_expectations
 from blinkpy.web_tests.models import test_failures
 from blinkpy.web_tests.models import test_results

 _log = logging.getLogger(__name__)


 class TestRunInterruptedException(Exception):
     """Raised when a test run should be stopped immediately."""

     def __init__(self, reason):
         Exception.__init__(self)
         self.reason = reason
         self.msg = reason

     def __reduce__(self):
         return self.__class__, (self.reason,)


 class WebTestRunner(object):

     def __init__(self, options, port, printer, results_directory, test_is_slow_fn):
         self._options = options
         self._port = port
         self._printer = printer
         self._results_directory = results_directory
         self._test_is_slow = test_is_slow_fn
         self._sharder = Sharder(self._port.split_test, self._options.max_locked_shards)
         self._filesystem = self._port.host.filesystem

         self._expectations = None
         self._test_inputs = []
         self._retry_attempt = 0
         self._shards_to_redo = []

         self._current_run_results = None

     def run_tests(self, expectations, test_inputs, tests_to_skip, num_workers, retry_attempt):
         batch_size = self._options.derived_batch_size

         # If we're retrying a test, then it's because we think it might be flaky
         # and rerunning it might provide a different result. We must restart
         # content shell to get a valid result, as otherwise state can leak
         # from previous tests. To do so, we set a batch size of 1, as that
         # prevents content shell reuse.
         if not self._options.must_use_derived_batch_size and retry_attempt >= 1:
             batch_size = 1

         self._expectations = expectations
         self._test_inputs = test_inputs
         self._retry_attempt = retry_attempt

         test_run_results = TestRunResults(self._expectations, len(test_inputs) + len(tests_to_skip))
         self._current_run_results = test_run_results
         self._printer.num_tests = len(test_inputs)
         self._printer.num_completed = 0

         if retry_attempt < 1:
             self._printer.print_expected(test_run_results, self._expectations.get_tests_with_result_type)

         for test_name in set(tests_to_skip):
             result = test_results.TestResult(test_name)
             result.type = test_expectations.SKIP
             test_run_results.add(result, expected=True, test_is_slow=self._test_is_slow(test_name))

         self._printer.write_update('Sharding tests ...')
         locked_shards, unlocked_shards = self._sharder.shard_tests(
             test_inputs,
             int(self._options.child_processes),
             self._options.fully_parallel,
             batch_size == 1)

         self._reorder_tests_by_args(locked_shards)
         self._reorder_tests_by_args(unlocked_shards)

         # We don't have a good way to coordinate the workers so that they don't
         # try to run the shards that need a lock. The easiest solution is to
         # run all of the locked shards first.
         all_shards = locked_shards + unlocked_shards
         num_workers = min(num_workers, len(all_shards))

         if retry_attempt < 1:
             self._printer.print_workers_and_shards(self._port, num_workers, len(all_shards), len(locked_shards))

         if self._options.dry_run:
             return test_run_results

         self._printer.write_update('Starting %s ...' % grammar.pluralize('worker', num_workers))

         start_time = time.time()
         try:
             with message_pool.get(self, self._worker_factory, num_workers, self._port.host) as pool:
                 pool.run(('test_list', shard.name, shard.test_inputs, batch_size) for shard in all_shards)

             if self._shards_to_redo:
                 num_workers -= len(self._shards_to_redo)
                 if num_workers > 0:
                     with message_pool.get(self, self._worker_factory, num_workers, self._port.host) as pool:
                         pool.run(('test_list', shard.name, shard.test_inputs, batch_size) for shard in self._shards_to_redo)
         except TestRunInterruptedException as error:
             _log.warning(error.reason)
             test_run_results.interrupted = True
         except KeyboardInterrupt:
             self._printer.flush()
             self._printer.writeln('Interrupted, exiting ...')
             test_run_results.keyboard_interrupted = True
         except Exception as error:
             _log.debug('%s("%s") raised, exiting', error.__class__.__name__, error)
             raise
         finally:
             test_run_results.run_time = time.time() - start_time

         return test_run_results

     def _reorder_tests_by_args(self, shards):
         reordered_shards = []
         for shard in shards:
             tests_by_args = collections.OrderedDict()
             for test_input in shard.test_inputs:
                 args = tuple(self._port.args_for_test(test_input.test_name))
                 if args not in tests_by_args:
                     tests_by_args[args] = []
                 tests_by_args[args].append(test_input)
             shard.test_inputs = list(itertools.chain(*tests_by_args.values()))

     def _worker_factory(self, worker_connection):
         results_directory = self._results_directory
         if self._retry_attempt > 0:
             results_directory = self._filesystem.join(self._results_directory,
                                                       'retry_%d' % self._retry_attempt)
             self._filesystem.maybe_make_directory(results_directory)
         return Worker(worker_connection, results_directory, self._options)

     def _mark_interrupted_tests_as_skipped(self, test_run_results):
         for test_input in self._test_inputs:
             if test_input.test_name not in test_run_results.results_by_name:
                 result = test_results.TestResult(test_input.test_name, [test_failures.FailureEarlyExit()])
                 # FIXME: We probably need to loop here if there are multiple iterations.
                 # FIXME: Also, these results are really neither expected nor unexpected. We probably
                 # need a third type of result.
                 test_run_results.add(result, expected=False, test_is_slow=self._test_is_slow(test_input.test_name))

     def _interrupt_if_at_failure_limits(self, test_run_results):

         def interrupt_if_at_failure_limit(limit, failure_count, test_run_results, message):
             if limit and failure_count >= limit:
                 message += ' %d tests run.' % (test_run_results.expected + test_run_results.unexpected)
                 self._mark_interrupted_tests_as_skipped(test_run_results)
                 raise TestRunInterruptedException(message)

         interrupt_if_at_failure_limit(
             self._options.exit_after_n_failures,
             test_run_results.unexpected_failures,
             test_run_results,
             'Exiting early after %d failures.' % test_run_results.unexpected_failures)
         interrupt_if_at_failure_limit(
             self._options.exit_after_n_crashes_or_timeouts,
             test_run_results.unexpected_crashes + test_run_results.unexpected_timeouts,
             test_run_results,
             'Exiting early after %d crashes and %d timeouts.' % (
                 test_run_results.unexpected_crashes, test_run_results.unexpected_timeouts))

     def _update_summary_with_result(self, test_run_results, result):
         expected = self._expectations.matches_an_expected_result(
             result.test_name, result.type, self._options.enable_sanitizer)
         expectation_string = self._expectations.get_expectations_string(result.test_name)
         actual_string = self._expectations.expectation_to_string(result.type)

         if result.device_failed:
             self._printer.print_finished_test(self._port, result, False, expectation_string, 'Aborted')
             return

         test_run_results.add(result, expected, self._test_is_slow(result.test_name))
         self._printer.print_finished_test(self._port, result, expected, expectation_string, actual_string)
         self._interrupt_if_at_failure_limits(test_run_results)

     def handle(self, name, source, *args):
         method = getattr(self, '_handle_' + name)
         if method:
             return method(source, *args)
         raise AssertionError('unknown message %s received from %s, args=%s' % (name, source, repr(args)))

     # The _handle_* methods below are called indirectly by handle(),
     # and may not use all of their arguments - pylint: disable=unused-argument
     def _handle_started_test(self, worker_name, test_input):
         self._printer.print_started_test(test_input.test_name)

     def _handle_finished_test_list(self, worker_name, list_name):
         pass

     def _handle_finished_test(self, worker_name, result, log_messages=None):
         self._update_summary_with_result(self._current_run_results, result)

     def _handle_device_failed(self, worker_name, list_name, remaining_tests):
         _log.warning('%s has failed', worker_name)
         if remaining_tests:
             self._shards_to_redo.append(TestShard(list_name, remaining_tests))


 class Worker(object):

     def __init__(self, caller, results_directory, options):
         self._caller = caller
         self._worker_number = caller.worker_number
         self._name = caller.name
         self._results_directory = results_directory
         self._options = options

         # The remaining fields are initialized in start()
         self._host = None
         self._port = None
         self._batch_count = None
         self._filesystem = None
         self._primary_driver = None
         self._secondary_driver = None
         self._num_tests = 0

     def __del__(self):
         self.stop()

     def start(self):
         """This method is called when the object is starting to be used and it is safe
         for the object to create state that does not need to be pickled (usually this means
         it is called in a child process).
         """
         self._host = self._caller.host
         self._filesystem = self._host.filesystem
         self._port = self._host.port_factory.get(self._options.platform, self._options)
         self._primary_driver = self._port.create_driver(self._worker_number)

         if self._port.max_drivers_per_process() > 1:
             self._secondary_driver = self._port.create_driver(self._worker_number)

         self._batch_count = 0

     def handle(self, name, source, test_list_name, test_inputs, batch_size):
         assert name == 'test_list'
         for i, test_input in enumerate(test_inputs):
             device_failed = self._run_test(test_input, test_list_name, batch_size)
             if device_failed:
                 self._caller.post('device_failed', test_list_name, test_inputs[i:])
                 self._caller.stop_running()
                 return

         # Kill the secondary driver at the end of each test shard.
         self._kill_driver(self._secondary_driver, 'secondary')

         self._caller.post('finished_test_list', test_list_name)

     def _update_test_input(self, test_input):
         if test_input.reference_files is None:
             # Lazy initialization.
             test_input.reference_files = self._port.reference_files(test_input.test_name)

     def _run_test(self, test_input, shard_name, batch_size):
         # If the batch size has been exceeded, kill the drivers.
         if batch_size > 0 and self._batch_count >= batch_size:
             self._kill_driver(self._primary_driver, 'primary')
             self._kill_driver(self._secondary_driver, 'secondary')
             self._batch_count = 0

         self._batch_count += 1

         self._update_test_input(test_input)
         start = time.time()

         # TODO(crbug.com/673207): Re-add logging if it doesn't make the logs too large.
         self._caller.post('started_test', test_input)
         result = single_test_runner.run_single_test(
             self._port, self._options, self._results_directory, self._name,
             self._primary_driver, self._secondary_driver, test_input)

         result.shard_name = shard_name
         result.worker_name = self._name
         result.total_run_time = time.time() - start
         result.test_number = self._num_tests
         self._num_tests += 1
         self._caller.post('finished_test', result)
         self._clean_up_after_test(test_input, result)
         return result.device_failed

     def stop(self):
         _log.debug('%s cleaning up', self._name)
         self._kill_driver(self._primary_driver, 'primary')
         self._kill_driver(self._secondary_driver, 'secondary')

     def _kill_driver(self, driver, label):
         # Be careful about how and when we kill the driver; if driver.stop()
         # raises an exception, this routine may get re-entered via __del__.
         if driver:
             # When tracing we need to go through the standard shutdown path to
             # ensure that the trace is recorded properly.
             if any(i in ['--trace-startup', '--trace-shutdown']
                    for i in self._options.additional_driver_flag):
                 _log.debug('%s waiting %d seconds for %s driver to shutdown',
                            self._name, self._port.driver_stop_timeout(), label)
                 driver.stop(timeout_secs=self._port.driver_stop_timeout())
                 return

             # Otherwise, kill the driver immediately to speed up shutdown.
             _log.debug('%s killing %s driver', self._name, label)
             driver.stop()

     def _clean_up_after_test(self, test_input, result):
         test_name = test_input.test_name

         if result.failures:
             # Check and kill the driver if we need to.
             if any([f.driver_needs_restart() for f in result.failures]):
                 # FIXME: Need more information in failure reporting so
                 # we know which driver needs to be restarted. For now
                 # we kill both drivers.
                 self._kill_driver(self._primary_driver, 'primary')
                 self._kill_driver(self._secondary_driver, 'secondary')

                 # Reset the batch count since the shell just bounced.
                 self._batch_count = 0

             # Print the error message(s).
             _log.debug('%s %s failed:', self._name, test_name)
             for f in result.failures:
                 _log.debug('%s  %s', self._name, f.message())
         elif result.type == test_expectations.SKIP:
             _log.debug('%s %s skipped', self._name, test_name)
         else:
             _log.debug('%s %s passed', self._name, test_name)


 class TestShard(object):
     """A test shard is a named list of TestInputs."""

     def __init__(self, name, test_inputs):
         self.name = name
         self.test_inputs = test_inputs
         self.requires_lock = test_inputs[0].requires_lock

     def __repr__(self):
         return 'TestShard(name=%r, test_inputs=%r, requires_lock=%r)' % (
             self.name, self.test_inputs, self.requires_lock)

     def __eq__(self, other):
         return self.name == other.name and self.test_inputs == other.test_inputs


 class Sharder(object):

     def __init__(self, test_split_fn, max_locked_shards):
         self._split = test_split_fn
         self._max_locked_shards = max_locked_shards

     def shard_tests(self, test_inputs, num_workers, fully_parallel, run_singly):
         """Groups tests into batches.
         This helps ensure that tests that depend on each other (aka bad tests!)
         continue to run together as most cross-tests dependencies tend to
         occur within the same directory.
         Return:
             Two list of TestShards. The first contains tests that must only be
             run under the server lock, the second can be run whenever.
         """

         # FIXME: Move all of the sharding logic out of manager into its
         # own class or module. Consider grouping it with the chunking logic
         # in prepare_lists as well.
         if num_workers == 1:
             return self._shard_in_two(test_inputs)
         elif fully_parallel:
             return self._shard_every_file(test_inputs, run_singly)
         return self._shard_by_directory(test_inputs)

     def _shard_in_two(self, test_inputs):
         """Returns two lists of shards: tests requiring a lock and all others.

         This is used when there's only one worker, to minimize the per-shard overhead.
         """
         locked_inputs = []
         unlocked_inputs = []
         for test_input in test_inputs:
             if test_input.requires_lock:
                 locked_inputs.append(test_input)
             else:
                 unlocked_inputs.append(test_input)

         locked_shards = []
         unlocked_shards = []
         if locked_inputs:
             locked_shards = [TestShard('locked_tests', locked_inputs)]
         if unlocked_inputs:
             unlocked_shards = [TestShard('unlocked_tests', unlocked_inputs)]

         return locked_shards, unlocked_shards

     def _shard_every_file(self, test_inputs, run_singly):
         """Returns two lists of shards, each shard containing a single test file.

         This mode gets maximal parallelism at the cost of much higher flakiness.
         """
         locked_shards = []
         unlocked_shards = []
         virtual_inputs = []

         for test_input in test_inputs:
             # Note that we use a '.' for the shard name; the name doesn't really
             # matter, and the only other meaningful value would be the filename,
             # which would be really redundant.
             if test_input.requires_lock:
                 locked_shards.append(TestShard('.', [test_input]))
             elif test_input.test_name.startswith('virtual') and not run_singly:
                 # This violates the spirit of sharding every file, but in practice, since the
                 # virtual test suites require a different commandline flag and thus a restart
                 # of content_shell, it's too slow to shard them fully.
                 virtual_inputs.append(test_input)
             else:
                 unlocked_shards.append(TestShard('.', [test_input]))

         locked_virtual_shards, unlocked_virtual_shards = self._shard_by_directory(virtual_inputs)

         # The locked shards still need to be limited to self._max_locked_shards in order to not
         # overload the http server for the http tests.
         return (self._resize_shards(locked_virtual_shards + locked_shards, self._max_locked_shards, 'locked_shard'),
                 unlocked_virtual_shards + unlocked_shards)

     def _shard_by_directory(self, test_inputs):
         """Returns two lists of shards, each shard containing all the files in a directory.

         This is the default mode, and gets as much parallelism as we can while
         minimizing flakiness caused by inter-test dependencies.
         """
         locked_shards = []
         unlocked_shards = []
         unlocked_slow_shards = []
         tests_by_dir = {}
         # FIXME: Given that the tests are already sorted by directory,
         # we can probably rewrite this to be clearer and faster.
         for test_input in test_inputs:
             directory = self._split(test_input.test_name)[0]
             tests_by_dir.setdefault(directory, [])
             tests_by_dir[directory].append(test_input)

         for directory, test_inputs in tests_by_dir.iteritems():
             shard = TestShard(directory, test_inputs)
             if test_inputs[0].requires_lock:
                 locked_shards.append(shard)
             # In practice, virtual test suites are slow to run. It's a bit hacky, but
             # put them first since they're the long-tail of test runtime.
             elif directory.startswith('virtual'):
                 unlocked_slow_shards.append(shard)
             else:
                 unlocked_shards.append(shard)

         # Sort the shards by directory name.
         locked_shards.sort(key=lambda shard: shard.name)
         unlocked_slow_shards.sort(key=lambda shard: shard.name)
         unlocked_shards.sort(key=lambda shard: shard.name)

         # Put a ceiling on the number of locked shards, so that we
         # don't hammer the servers too badly.

         # FIXME: For now, limit to one shard or set it
         # with the --max-locked-shards. After testing to make sure we
         # can handle multiple shards, we should probably do something like
         # limit this to no more than a quarter of all workers, e.g.:
         # return max(math.ceil(num_workers / 4.0), 1)
         return (self._resize_shards(locked_shards, self._max_locked_shards, 'locked_shard'),
                 unlocked_slow_shards + unlocked_shards)

     def _resize_shards(self, old_shards, max_new_shards, shard_name_prefix):
         """Takes a list of shards and redistributes the tests into no more
         than |max_new_shards| new shards.
         """

         # This implementation assumes that each input shard only contains tests from a
         # single directory, and that tests in each shard must remain together; as a
         # result, a given input shard is never split between output shards.
         #
         # Each output shard contains the tests from one or more input shards and
         # hence may contain tests from multiple directories.

         def divide_and_round_up(numerator, divisor):
             return int(math.ceil(float(numerator) / divisor))

         def extract_and_flatten(shards):
             test_inputs = []
             for shard in shards:
                 test_inputs.extend(shard.test_inputs)
             return test_inputs

         def split_at(seq, index):
             return (seq[:index], seq[index:])

         num_old_per_new = divide_and_round_up(len(old_shards), max_new_shards)
         new_shards = []
         remaining_shards = old_shards
         while remaining_shards:
             some_shards, remaining_shards = split_at(remaining_shards, num_old_per_new)
             new_shards.append(
                 TestShard('%s_%d' % (shard_name_prefix, len(new_shards) + 1),
                           extract_and_flatten(some_shards)))
         return new_shards
	# Copyright (C) 2011 Google Inc. All rights reserved.
	#
	# Redistribution and use in source and binary forms, with or without
	# modification, are permitted provided that the following conditions are
	# met:
	#
	# * Redistributions of source code must retain the above copyright
	# notice, this list of conditions and the following disclaimer.
	# * Redistributions in binary form must reproduce the above
	# copyright notice, this list of conditions and the following disclaimer
	# in the documentation and/or other materials provided with the
	# distribution.
	# * Neither the name of Google Inc. nor the names of its
	# contributors may be used to endorse or promote products derived from
	# this software without specific prior written permission.
	#
	# THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
	# "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
	# LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
	# A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
	# OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
	# SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
	# LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
	# DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
	# THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
	# (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
	# OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

	import collections
	import itertools
	import logging
	import math
	import time

	from blinkpy.common import message_pool
	from blinkpy.tool import grammar
	from blinkpy.web_tests.controllers import single_test_runner
	from blinkpy.web_tests.models.test_run_results import TestRunResults
	from blinkpy.web_tests.models import test_expectations
	from blinkpy.web_tests.models import test_failures
	from blinkpy.web_tests.models import test_results

	_log = logging.getLogger(__name__)


	class TestRunInterruptedException(Exception):
	"""Raised when a test run should be stopped immediately."""

	def __init__(self, reason):
	Exception.__init__(self)
	self.reason = reason
	self.msg = reason

	def __reduce__(self):
	return self.__class__, (self.reason,)


	class WebTestRunner(object):

	def __init__(self, options, port, printer, results_directory, test_is_slow_fn):
	self._options = options
	self._port = port
	self._printer = printer
	self._results_directory = results_directory
	self._test_is_slow = test_is_slow_fn
	self._sharder = Sharder(self._port.split_test, self._options.max_locked_shards)
	self._filesystem = self._port.host.filesystem

	self._expectations = None
	self._test_inputs = []
	self._retry_attempt = 0
	self._shards_to_redo = []

	self._current_run_results = None

	def run_tests(self, expectations, test_inputs, tests_to_skip, num_workers, retry_attempt):
	batch_size = self._options.derived_batch_size

	# If we're retrying a test, then it's because we think it might be flaky
	# and rerunning it might provide a different result. We must restart
	# content shell to get a valid result, as otherwise state can leak
	# from previous tests. To do so, we set a batch size of 1, as that
	# prevents content shell reuse.
	if not self._options.must_use_derived_batch_size and retry_attempt >= 1:
	batch_size = 1

	self._expectations = expectations
	self._test_inputs = test_inputs
	self._retry_attempt = retry_attempt

	test_run_results = TestRunResults(self._expectations, len(test_inputs) + len(tests_to_skip))
	self._current_run_results = test_run_results
	self._printer.num_tests = len(test_inputs)
	self._printer.num_completed = 0

	if retry_attempt < 1:
	self._printer.print_expected(test_run_results, self._expectations.get_tests_with_result_type)

	for test_name in set(tests_to_skip):
	result = test_results.TestResult(test_name)
	result.type = test_expectations.SKIP
	test_run_results.add(result, expected=True, test_is_slow=self._test_is_slow(test_name))

	self._printer.write_update('Sharding tests ...')
	locked_shards, unlocked_shards = self._sharder.shard_tests(
	test_inputs,
	int(self._options.child_processes),
	self._options.fully_parallel,
	batch_size == 1)

	self._reorder_tests_by_args(locked_shards)
	self._reorder_tests_by_args(unlocked_shards)

	# We don't have a good way to coordinate the workers so that they don't
	# try to run the shards that need a lock. The easiest solution is to
	# run all of the locked shards first.
	all_shards = locked_shards + unlocked_shards
	num_workers = min(num_workers, len(all_shards))

	if retry_attempt < 1:
	self._printer.print_workers_and_shards(self._port, num_workers, len(all_shards), len(locked_shards))

	if self._options.dry_run:
	return test_run_results

	self._printer.write_update('Starting %s ...' % grammar.pluralize('worker', num_workers))

	start_time = time.time()
	try:
	with message_pool.get(self, self._worker_factory, num_workers, self._port.host) as pool:
	pool.run(('test_list', shard.name, shard.test_inputs, batch_size) for shard in all_shards)

	if self._shards_to_redo:
	num_workers -= len(self._shards_to_redo)
	if num_workers > 0:
	with message_pool.get(self, self._worker_factory, num_workers, self._port.host) as pool:
	pool.run(('test_list', shard.name, shard.test_inputs, batch_size) for shard in self._shards_to_redo)
	except TestRunInterruptedException as error:
	_log.warning(error.reason)
	test_run_results.interrupted = True
	except KeyboardInterrupt:
	self._printer.flush()
	self._printer.writeln('Interrupted, exiting ...')
	test_run_results.keyboard_interrupted = True
	except Exception as error:
	_log.debug('%s("%s") raised, exiting', error.__class__.__name__, error)
	raise
	finally:
	test_run_results.run_time = time.time() - start_time

	return test_run_results

	def _reorder_tests_by_args(self, shards):
	reordered_shards = []
	for shard in shards:
	tests_by_args = collections.OrderedDict()
	for test_input in shard.test_inputs:
	args = tuple(self._port.args_for_test(test_input.test_name))
	if args not in tests_by_args:
	tests_by_args[args] = []
	tests_by_args[args].append(test_input)
	shard.test_inputs = list(itertools.chain(*tests_by_args.values()))

	def _worker_factory(self, worker_connection):
	results_directory = self._results_directory
	if self._retry_attempt > 0:
	results_directory = self._filesystem.join(self._results_directory,
	'retry_%d' % self._retry_attempt)
	self._filesystem.maybe_make_directory(results_directory)
	return Worker(worker_connection, results_directory, self._options)

	def _mark_interrupted_tests_as_skipped(self, test_run_results):
	for test_input in self._test_inputs:
	if test_input.test_name not in test_run_results.results_by_name:
	result = test_results.TestResult(test_input.test_name, [test_failures.FailureEarlyExit()])
	# FIXME: We probably need to loop here if there are multiple iterations.
	# FIXME: Also, these results are really neither expected nor unexpected. We probably
	# need a third type of result.
	test_run_results.add(result, expected=False, test_is_slow=self._test_is_slow(test_input.test_name))

	def _interrupt_if_at_failure_limits(self, test_run_results):

	def interrupt_if_at_failure_limit(limit, failure_count, test_run_results, message):
	if limit and failure_count >= limit:
	message += ' %d tests run.' % (test_run_results.expected + test_run_results.unexpected)
	self._mark_interrupted_tests_as_skipped(test_run_results)
	raise TestRunInterruptedException(message)

	interrupt_if_at_failure_limit(
	self._options.exit_after_n_failures,
	test_run_results.unexpected_failures,
	test_run_results,
	'Exiting early after %d failures.' % test_run_results.unexpected_failures)
	interrupt_if_at_failure_limit(
	self._options.exit_after_n_crashes_or_timeouts,
	test_run_results.unexpected_crashes + test_run_results.unexpected_timeouts,
	test_run_results,
	'Exiting early after %d crashes and %d timeouts.' % (
	test_run_results.unexpected_crashes, test_run_results.unexpected_timeouts))

	def _update_summary_with_result(self, test_run_results, result):
	expected = self._expectations.matches_an_expected_result(
	result.test_name, result.type, self._options.enable_sanitizer)
	expectation_string = self._expectations.get_expectations_string(result.test_name)
	actual_string = self._expectations.expectation_to_string(result.type)

	if result.device_failed:
	self._printer.print_finished_test(self._port, result, False, expectation_string, 'Aborted')
	return

	test_run_results.add(result, expected, self._test_is_slow(result.test_name))
	self._printer.print_finished_test(self._port, result, expected, expectation_string, actual_string)
	self._interrupt_if_at_failure_limits(test_run_results)

	def handle(self, name, source, *args):
	method = getattr(self, '_handle_' + name)
	if method:
	return method(source, *args)
	raise AssertionError('unknown message %s received from %s, args=%s' % (name, source, repr(args)))

	# The _handle_* methods below are called indirectly by handle(),
	# and may not use all of their arguments - pylint: disable=unused-argument
	def _handle_started_test(self, worker_name, test_input):
	self._printer.print_started_test(test_input.test_name)

	def _handle_finished_test_list(self, worker_name, list_name):
	pass

	def _handle_finished_test(self, worker_name, result, log_messages=None):
	self._update_summary_with_result(self._current_run_results, result)

	def _handle_device_failed(self, worker_name, list_name, remaining_tests):
	_log.warning('%s has failed', worker_name)
	if remaining_tests:
	self._shards_to_redo.append(TestShard(list_name, remaining_tests))


	class Worker(object):

	def __init__(self, caller, results_directory, options):
	self._caller = caller
	self._worker_number = caller.worker_number
	self._name = caller.name
	self._results_directory = results_directory
	self._options = options

	# The remaining fields are initialized in start()
	self._host = None
	self._port = None
	self._batch_count = None
	self._filesystem = None
	self._primary_driver = None
	self._secondary_driver = None
	self._num_tests = 0

	def __del__(self):
	self.stop()

	def start(self):
	"""This method is called when the object is starting to be used and it is safe
	for the object to create state that does not need to be pickled (usually this means
	it is called in a child process).
	"""
	self._host = self._caller.host
	self._filesystem = self._host.filesystem
	self._port = self._host.port_factory.get(self._options.platform, self._options)
	self._primary_driver = self._port.create_driver(self._worker_number)

	if self._port.max_drivers_per_process() > 1:
	self._secondary_driver = self._port.create_driver(self._worker_number)

	self._batch_count = 0

	def handle(self, name, source, test_list_name, test_inputs, batch_size):
	assert name == 'test_list'
	for i, test_input in enumerate(test_inputs):
	device_failed = self._run_test(test_input, test_list_name, batch_size)
	if device_failed:
	self._caller.post('device_failed', test_list_name, test_inputs[i:])
	self._caller.stop_running()
	return

	# Kill the secondary driver at the end of each test shard.
	self._kill_driver(self._secondary_driver, 'secondary')

	self._caller.post('finished_test_list', test_list_name)

	def _update_test_input(self, test_input):
	if test_input.reference_files is None:
	# Lazy initialization.
	test_input.reference_files = self._port.reference_files(test_input.test_name)

	def _run_test(self, test_input, shard_name, batch_size):
	# If the batch size has been exceeded, kill the drivers.
	if batch_size > 0 and self._batch_count >= batch_size:
	self._kill_driver(self._primary_driver, 'primary')
	self._kill_driver(self._secondary_driver, 'secondary')
	self._batch_count = 0

	self._batch_count += 1

	self._update_test_input(test_input)
	start = time.time()

	# TODO(crbug.com/673207): Re-add logging if it doesn't make the logs too large.
	self._caller.post('started_test', test_input)
	result = single_test_runner.run_single_test(
	self._port, self._options, self._results_directory, self._name,
	self._primary_driver, self._secondary_driver, test_input)

	result.shard_name = shard_name
	result.worker_name = self._name
	result.total_run_time = time.time() - start
	result.test_number = self._num_tests
	self._num_tests += 1
	self._caller.post('finished_test', result)
	self._clean_up_after_test(test_input, result)
	return result.device_failed

	def stop(self):
	_log.debug('%s cleaning up', self._name)
	self._kill_driver(self._primary_driver, 'primary')
	self._kill_driver(self._secondary_driver, 'secondary')

	def _kill_driver(self, driver, label):
	# Be careful about how and when we kill the driver; if driver.stop()
	# raises an exception, this routine may get re-entered via __del__.
	if driver:
	# When tracing we need to go through the standard shutdown path to
	# ensure that the trace is recorded properly.
	if any(i in ['--trace-startup', '--trace-shutdown']
	for i in self._options.additional_driver_flag):
	_log.debug('%s waiting %d seconds for %s driver to shutdown',
	self._name, self._port.driver_stop_timeout(), label)
	driver.stop(timeout_secs=self._port.driver_stop_timeout())
	return

	# Otherwise, kill the driver immediately to speed up shutdown.
	_log.debug('%s killing %s driver', self._name, label)
	driver.stop()

	def _clean_up_after_test(self, test_input, result):
	test_name = test_input.test_name

	if result.failures:
	# Check and kill the driver if we need to.
	if any([f.driver_needs_restart() for f in result.failures]):
	# FIXME: Need more information in failure reporting so
	# we know which driver needs to be restarted. For now
	# we kill both drivers.
	self._kill_driver(self._primary_driver, 'primary')
	self._kill_driver(self._secondary_driver, 'secondary')

	# Reset the batch count since the shell just bounced.
	self._batch_count = 0

	# Print the error message(s).
	_log.debug('%s %s failed:', self._name, test_name)
	for f in result.failures:
	_log.debug('%s %s', self._name, f.message())
	elif result.type == test_expectations.SKIP:
	_log.debug('%s %s skipped', self._name, test_name)
	else:
	_log.debug('%s %s passed', self._name, test_name)


	class TestShard(object):
	"""A test shard is a named list of TestInputs."""

	def __init__(self, name, test_inputs):
	self.name = name
	self.test_inputs = test_inputs
	self.requires_lock = test_inputs[0].requires_lock

	def __repr__(self):
	return 'TestShard(name=%r, test_inputs=%r, requires_lock=%r)' % (
	self.name, self.test_inputs, self.requires_lock)

	def __eq__(self, other):
	return self.name == other.name and self.test_inputs == other.test_inputs


	class Sharder(object):

	def __init__(self, test_split_fn, max_locked_shards):
	self._split = test_split_fn
	self._max_locked_shards = max_locked_shards

	def shard_tests(self, test_inputs, num_workers, fully_parallel, run_singly):
	"""Groups tests into batches.
	This helps ensure that tests that depend on each other (aka bad tests!)
	continue to run together as most cross-tests dependencies tend to
	occur within the same directory.
	Return:
	Two list of TestShards. The first contains tests that must only be
	run under the server lock, the second can be run whenever.
	"""

	# FIXME: Move all of the sharding logic out of manager into its
	# own class or module. Consider grouping it with the chunking logic
	# in prepare_lists as well.
	if num_workers == 1:
	return self._shard_in_two(test_inputs)
	elif fully_parallel:
	return self._shard_every_file(test_inputs, run_singly)
	return self._shard_by_directory(test_inputs)

	def _shard_in_two(self, test_inputs):
	"""Returns two lists of shards: tests requiring a lock and all others.

	This is used when there's only one worker, to minimize the per-shard overhead.
	"""
	locked_inputs = []
	unlocked_inputs = []
	for test_input in test_inputs:
	if test_input.requires_lock:
	locked_inputs.append(test_input)
	else:
	unlocked_inputs.append(test_input)

	locked_shards = []
	unlocked_shards = []
	if locked_inputs:
	locked_shards = [TestShard('locked_tests', locked_inputs)]
	if unlocked_inputs:
	unlocked_shards = [TestShard('unlocked_tests', unlocked_inputs)]

	return locked_shards, unlocked_shards

	def _shard_every_file(self, test_inputs, run_singly):
	"""Returns two lists of shards, each shard containing a single test file.

	This mode gets maximal parallelism at the cost of much higher flakiness.
	"""
	locked_shards = []
	unlocked_shards = []
	virtual_inputs = []

	for test_input in test_inputs:
	# Note that we use a '.' for the shard name; the name doesn't really
	# matter, and the only other meaningful value would be the filename,
	# which would be really redundant.
	if test_input.requires_lock:
	locked_shards.append(TestShard('.', [test_input]))
	elif test_input.test_name.startswith('virtual') and not run_singly:
	# This violates the spirit of sharding every file, but in practice, since the
	# virtual test suites require a different commandline flag and thus a restart
	# of content_shell, it's too slow to shard them fully.
	virtual_inputs.append(test_input)
	else:
	unlocked_shards.append(TestShard('.', [test_input]))

	locked_virtual_shards, unlocked_virtual_shards = self._shard_by_directory(virtual_inputs)

	# The locked shards still need to be limited to self._max_locked_shards in order to not
	# overload the http server for the http tests.
	return (self._resize_shards(locked_virtual_shards + locked_shards, self._max_locked_shards, 'locked_shard'),
	unlocked_virtual_shards + unlocked_shards)

	def _shard_by_directory(self, test_inputs):
	"""Returns two lists of shards, each shard containing all the files in a directory.

	This is the default mode, and gets as much parallelism as we can while
	minimizing flakiness caused by inter-test dependencies.
	"""
	locked_shards = []
	unlocked_shards = []
	unlocked_slow_shards = []
	tests_by_dir = {}
	# FIXME: Given that the tests are already sorted by directory,
	# we can probably rewrite this to be clearer and faster.
	for test_input in test_inputs:
	directory = self._split(test_input.test_name)[0]
	tests_by_dir.setdefault(directory, [])
	tests_by_dir[directory].append(test_input)

	for directory, test_inputs in tests_by_dir.iteritems():
	shard = TestShard(directory, test_inputs)
	if test_inputs[0].requires_lock:
	locked_shards.append(shard)
	# In practice, virtual test suites are slow to run. It's a bit hacky, but
	# put them first since they're the long-tail of test runtime.
	elif directory.startswith('virtual'):
	unlocked_slow_shards.append(shard)
	else:
	unlocked_shards.append(shard)

	# Sort the shards by directory name.
	locked_shards.sort(key=lambda shard: shard.name)
	unlocked_slow_shards.sort(key=lambda shard: shard.name)
	unlocked_shards.sort(key=lambda shard: shard.name)

	# Put a ceiling on the number of locked shards, so that we
	# don't hammer the servers too badly.

	# FIXME: For now, limit to one shard or set it
	# with the --max-locked-shards. After testing to make sure we
	# can handle multiple shards, we should probably do something like
	# limit this to no more than a quarter of all workers, e.g.:
	# return max(math.ceil(num_workers / 4.0), 1)
	return (self._resize_shards(locked_shards, self._max_locked_shards, 'locked_shard'),
	unlocked_slow_shards + unlocked_shards)

	def _resize_shards(self, old_shards, max_new_shards, shard_name_prefix):
	"""Takes a list of shards and redistributes the tests into no more
	than \|max_new_shards\| new shards.
	"""

	# This implementation assumes that each input shard only contains tests from a
	# single directory, and that tests in each shard must remain together; as a
	# result, a given input shard is never split between output shards.
	#
	# Each output shard contains the tests from one or more input shards and
	# hence may contain tests from multiple directories.

	def divide_and_round_up(numerator, divisor):
	return int(math.ceil(float(numerator) / divisor))

	def extract_and_flatten(shards):
	test_inputs = []
	for shard in shards:
	test_inputs.extend(shard.test_inputs)
	return test_inputs

	def split_at(seq, index):
	return (seq[:index], seq[index:])

	num_old_per_new = divide_and_round_up(len(old_shards), max_new_shards)
	new_shards = []
	remaining_shards = old_shards
	while remaining_shards:
	some_shards, remaining_shards = split_at(remaining_shards, num_old_per_new)
	new_shards.append(
	TestShard('%s_%d' % (shard_name_prefix, len(new_shards) + 1),
	extract_and_flatten(some_shards)))
	return new_shards