server/site_tests/telemetry_AFDOGenerate/telemetry_AFDOGenerate.py - mirrors/cros/chromiumos/third_party/autotest - Git at Google

 # Copyright (c) 2013 The Chromium OS Authors. All rights reserved.
 # Use of this source code is governed by a BSD-style license that can be
 # found in the LICENSE file.

 """
 Test to generate the AFDO profile for a set of ChromeOS benchmarks.

 This will run a pre-determined set of benchmarks on the DUT under
 the monitoring of the linux "perf" tool. The resulting perf.data
 file will then be copied to Google Storage (GS) where it can be
 used by the AFDO optimized build.

 Given that the telemetry benchmarks are quite unstable on ChromeOS at
 this point, this test also supports a mode where the benchmarks are
 executed outside of the telemetry framework. It is not the same as
 executing the benchmarks under telemetry because there is no telemetry
 measurement taken but, for the purposes of profiling Chrome, it should
 be pretty close.

 Example invocation:
 /usr/bin/test_that --debug --board=lumpy <DUT IP>
   --args="ignore_failures=True local=True gs_test_location=True"
   telemetry_AFDOGenerate
 """

 import bz2
 import logging
 import os
 import time

 from autotest_lib.client.common_lib import error
 from autotest_lib.server import autotest
 from autotest_lib.server import profilers
 from autotest_lib.server import test
 from autotest_lib.server import utils
 from autotest_lib.server.cros import telemetry_runner

 # List of benchmarks to run to capture profile information. This is
 # based on the "superhero" and "perf_v2" list and other telemetry
 # benchmarks. Goal is to have a short list that is as representative
 # as possible and takes a short time to execute. At this point the
 # list of benchmarks is in flux.
 TELEMETRY_AFDO_BENCHMARKS = (
     ('page_cycler_v2.typical_25', ('--pageset-repeat=1',)),
     ('page_cycler_v2.intl_ja_zh', ('--pageset-repeat=1',)),
     # Temporarily disable these two benchmarks to finish in 60 minutes.
     # ('page_cycler_v2.intl_ar_fa_he', ('--pageset-repeat=1',)),
     # ('page_cycler_v2.intl_es_fr_pt-BR', ('--pageset-repeat=1',)),
     # ('page_cycler_v2.intl_ko_th_vi', ('--pageset-repeat=1',)),
     # ('page_cycler_v2.intl_hi_ru', ('--pageset-repeat=1',)),
     ('octane',),
     ('kraken',),
     ('speedometer',),
     ('dromaeo.domcoreattr',),
     ('dromaeo.domcoremodify',),
     )

 # Temporarily disable this benchmark because it is failing a
 # lot. Filed chromium:590127
 # ('smoothness.tough_webgl_cases',)

 # Some benchmarks removed from the profile set:
 # 'page_cycler.morejs' -> uninteresting, seems to fail frequently,
 # 'page_cycler.moz' -> seems very old.
 # 'media.tough_video_cases' -> removed this because it does not bring
 #                              any benefit and takes more than 12 mins

 # List of boards where this test can be run.  Currently, it needs a
 # machines with at least 4GB of memory or 2GB of /tmp.
 # This must be consistent with chromite.
 GCC_BOARDS = ['lumpy']

 # Should be disjoint with GCC_BOARDS
 LLVM_BOARDS = ['chell', 'samus']

 class telemetry_AFDOGenerate(test.test):
     """
     Run one or more telemetry benchmarks under the "perf" monitoring
     tool, generate a "perf.data" file and upload to GS for comsumption
     by the AFDO optimized build.
     """
     version = 1


     def run_once(self, host, args):
         """Run a set of telemetry benchmarks.

         @param host: Host machine where test is run
         @param args: A dictionary of the arguments that were passed
                 to this test.
         @returns None.
         """
         self._host = host
         host_board = host.get_board().split(':')[1]

         if not (host_board in LLVM_BOARDS or host_board in GCC_BOARDS):
             raise error.TestFail(
                     'This test cannot be run on board %s' % host_board)

         self._parse_args(args)

         if self._minimal_telemetry:
             self._run_tests_minimal_telemetry()
         else:
             self._telemetry_runner = telemetry_runner.TelemetryRunner(
                     self._host, self._local, telemetry_on_dut=False)

             for benchmark_info in TELEMETRY_AFDO_BENCHMARKS:
                 benchmark = benchmark_info[0]
                 args = () if len(benchmark_info) == 1 else benchmark_info[1]
                 try:
                     self._run_test_with_retry(benchmark, *args)
                 except error.TestBaseException:
                     if not self._ignore_failures:
                         raise
                     else:
                         logging.info('Ignoring failure from benchmark %s.',
                                      benchmark)


     def after_run_once(self):
         """After the profile information has been collected, compress it
         and upload it to GS
         """
         PERF_FILE = 'perf.data'
         COMP_PERF_FILE = 'chromeos-chrome-%s-%s.perf.data'
         perf_data = os.path.join(self.profdir, PERF_FILE)
         comp_data = os.path.join(self.profdir, COMP_PERF_FILE % (
                 self._arch, self._version))
         compressed = self._compress_file(perf_data, comp_data)
         self._gs_upload(compressed, os.path.basename(compressed))

         # Also create copy of this file using "LATEST" as version so
         # it can be found in case the builder is looking for a version
         # number that does not match. It is ok to use a slighly old
         # version of the this file for the optimized build
         latest_data =  COMP_PERF_FILE % (self._arch, 'LATEST')
         latest_compressed = self._get_compressed_name(latest_data)
         self._gs_upload(compressed, latest_compressed)


     def _parse_args(self, args):
         """Parses input arguments to this autotest.

         @param args: Options->values dictionary.
         @raises error.TestFail if a bad option is passed.
         """

         # Set default values for the options.
         # Architecture for which we are collecting afdo data.
         self._arch = 'amd64'
         # Use an alternate GS location where everyone can write.
         # Set default depending on whether this is executing in
         # the lab environment or not
         self._gs_test_location = not utils.host_is_in_lab_zone(
                 self._host.hostname)
         # Ignore individual test failures.
         self._ignore_failures = False
         # Use local copy of telemetry instead of using the dev server copy.
         self._local = False
         # Chrome version to which the AFDO data corresponds.
         self._version, _ = self._host.get_chrome_version()
         # Try to use the minimal support from Telemetry. The Telemetry
         # benchmarks in ChromeOS are too flaky at this point. So, initially,
         # this will be set to True by default.
         self._minimal_telemetry = False

         for option_name, value in args.iteritems():
             if option_name == 'arch':
                 self._arch = value
             elif option_name == 'gs_test_location':
                 self._gs_test_location = (value == 'True')
             elif option_name == 'ignore_failures':
                 self._ignore_failures = (value == 'True')
             elif option_name == 'local':
                 self._local = (value == 'True')
             elif option_name == 'minimal_telemetry':
                 self._minimal_telemetry = (value == 'True')
             elif option_name == 'version':
                 self._version = value
             else:
                 raise error.TestFail('Unknown option passed: %s' % option_name)


     def _run_test(self, benchmark, *args):
         """Run the benchmark using Telemetry.

         @param benchmark: Name of the benchmark to run.
         @param args: Additional arguments to pass to the telemetry execution
                      script.
         @raises Raises error.TestFail if execution of test failed.
                 Also re-raise any exceptions thrown by run_telemetry benchmark.
         """
         try:
             logging.info('Starting run for Telemetry benchmark %s', benchmark)
             start_time = time.time()
             result = self._telemetry_runner.run_telemetry_benchmark(
                     benchmark, None, *args)
             end_time = time.time()
             logging.info('Completed Telemetry benchmark %s in %f seconds',
                          benchmark, end_time - start_time)
         except error.TestBaseException as e:
             end_time = time.time()
             logging.info('Got exception from Telemetry benchmark %s '
                          'after %f seconds. Exception: %s',
                          benchmark, end_time - start_time, str(e))
             raise

         # We dont generate any keyvals for this run. This is not
         # an official run of the benchmark. We are just running it to get
         # a profile from it.

         if result.status is telemetry_runner.SUCCESS_STATUS:
             logging.info('Benchmark %s succeeded', benchmark)
         else:
             raise error.TestFail('An error occurred while executing'
                                  ' benchmark: %s' % benchmark)


     def _run_test_with_retry(self, benchmark, *args):
         """Run the benchmark using Telemetry. Retry in case of failure.

         @param benchmark: Name of the benchmark to run.
         @param args: Additional arguments to pass to the telemetry execution
                      script.
         @raises Re-raise any exceptions thrown by _run_test.
         """

         tried = False
         while True:
             try:
                 self._run_test(benchmark, *args)
                 logging.info('Benchmark %s succeeded on %s try',
                              benchmark,
                              'first' if not tried else 'second')
                 break
             except error.TestBaseException:
                 if not tried:
                    tried = True
                    logging.info('Benchmark %s failed. Retrying ...',
                                 benchmark)
                 else:
                     logging.info('Benchmark %s failed twice. Not retrying',
                                   benchmark)
                     raise


     def _run_tests_minimal_telemetry(self):
         """Run the benchmarks using the minimal support from Telemetry.

         The benchmarks are run using a client side autotest test. This test
         will control Chrome directly using the chrome.Chrome support and it
         will ask Chrome to display the benchmark pages directly instead of
         using the "page sets" and "measurements" support from Telemetry.
         In this way we avoid using Telemetry benchmark support which is not
         stable on ChromeOS yet.
         """
         AFDO_GENERATE_CLIENT_TEST = 'telemetry_AFDOGenerateClient'

         # We dont want to "inherit" the profiler settings for this test
         # to the client test. Doing so will end up in two instances of
         # the profiler (perf) being executed at the same time.
         # Filed a feature request about this. See crbug/342958.

         # Save the current settings for profilers.
         saved_profilers = self.job.profilers
         saved_default_profile_only = self.job.default_profile_only

         # Reset the state of the profilers.
         self.job.default_profile_only = False
         self.job.profilers = profilers.profilers(self.job)

         # Execute the client side test.
         client_at = autotest.Autotest(self._host)
         client_at.run_test(AFDO_GENERATE_CLIENT_TEST, args='')

         # Restore the settings for the profilers.
         self.job.default_profile_only = saved_default_profile_only
         self.job.profiler = saved_profilers


     @staticmethod
     def _get_compressed_name(name):
         """Given a file name, return bz2 compressed name.
         @param name: Name of uncompressed file.
         @returns name of compressed file.
         """
         return name + '.bz2'

     @staticmethod
     def _compress_file(unc_file, com_file):
         """Compresses specified file with bz2.

         @param unc_file: name of file to compress.
         @param com_file: prefix name of compressed file.
         @raises error.TestFail if compression failed
         @returns Name of compressed file.
         """
         dest = ''
         with open(unc_file, 'r') as inp:
             dest = telemetry_AFDOGenerate._get_compressed_name(com_file)
             with bz2.BZ2File(dest, 'w') as out:
                 for data in inp:
                     out.write(data)
         if not dest or not os.path.isfile(dest):
             raise error.TestFail('Could not compress %s' % unc_file)
         return dest


     def _gs_upload(self, local_file, remote_basename):
         """Uploads file to google storage specific location.

         @param local_file: name of file to upload.
         @param remote_basename: basename of remote file.
         @raises error.TestFail if upload failed.
         @returns nothing.
         """
         GS_GCC_DEST = 'gs://chromeos-prebuilt/afdo-job/canonicals/%s'
         GS_LLVM_DEST = 'gs://chromeos-prebuilt/afdo-job/llvm/%s'
         GS_TEST_DEST = 'gs://chromeos-throw-away-bucket/afdo-job/canonicals/%s'
         GS_ACL = 'project-private'

         board = self._host.get_board().split(':')[1]

         if self._gs_test_location:
             gs_dest = GS_TEST_DEST
         elif board in GCC_BOARDS:
             gs_dest = GS_GCC_DEST
         elif board in LLVM_BOARDS:
             gs_dest = GS_LLVM_DEST
         else:
             raise error.TestFail(
                     'This test cannot be run on board %s' % board)

         remote_file = gs_dest % remote_basename

         logging.info('About to upload to GS: %s', remote_file)
         if not utils.gs_upload(local_file,
                                remote_file,
                                GS_ACL, result_dir=self.resultsdir):
             logging.info('Failed upload to GS: %s', remote_file)
             raise error.TestFail('Unable to gs upload %s to %s' %
                                  (local_file, remote_file))

         logging.info('Successfull upload to GS: %s', remote_file)
	# Copyright (c) 2013 The Chromium OS Authors. All rights reserved.
	# Use of this source code is governed by a BSD-style license that can be
	# found in the LICENSE file.

	"""
	Test to generate the AFDO profile for a set of ChromeOS benchmarks.

	This will run a pre-determined set of benchmarks on the DUT under
	the monitoring of the linux "perf" tool. The resulting perf.data
	file will then be copied to Google Storage (GS) where it can be
	used by the AFDO optimized build.

	Given that the telemetry benchmarks are quite unstable on ChromeOS at
	this point, this test also supports a mode where the benchmarks are
	executed outside of the telemetry framework. It is not the same as
	executing the benchmarks under telemetry because there is no telemetry
	measurement taken but, for the purposes of profiling Chrome, it should
	be pretty close.

	Example invocation:
	/usr/bin/test_that --debug --board=lumpy <DUT IP>
	--args="ignore_failures=True local=True gs_test_location=True"
	telemetry_AFDOGenerate
	"""

	import bz2
	import logging
	import os
	import time

	from autotest_lib.client.common_lib import error
	from autotest_lib.server import autotest
	from autotest_lib.server import profilers
	from autotest_lib.server import test
	from autotest_lib.server import utils
	from autotest_lib.server.cros import telemetry_runner

	# List of benchmarks to run to capture profile information. This is
	# based on the "superhero" and "perf_v2" list and other telemetry
	# benchmarks. Goal is to have a short list that is as representative
	# as possible and takes a short time to execute. At this point the
	# list of benchmarks is in flux.
	TELEMETRY_AFDO_BENCHMARKS = (
	('page_cycler_v2.typical_25', ('--pageset-repeat=1',)),
	('page_cycler_v2.intl_ja_zh', ('--pageset-repeat=1',)),
	# Temporarily disable these two benchmarks to finish in 60 minutes.
	# ('page_cycler_v2.intl_ar_fa_he', ('--pageset-repeat=1',)),
	# ('page_cycler_v2.intl_es_fr_pt-BR', ('--pageset-repeat=1',)),
	# ('page_cycler_v2.intl_ko_th_vi', ('--pageset-repeat=1',)),
	# ('page_cycler_v2.intl_hi_ru', ('--pageset-repeat=1',)),
	('octane',),
	('kraken',),
	('speedometer',),
	('dromaeo.domcoreattr',),
	('dromaeo.domcoremodify',),
	)

	# Temporarily disable this benchmark because it is failing a
	# lot. Filed chromium:590127
	# ('smoothness.tough_webgl_cases',)

	# Some benchmarks removed from the profile set:
	# 'page_cycler.morejs' -> uninteresting, seems to fail frequently,
	# 'page_cycler.moz' -> seems very old.
	# 'media.tough_video_cases' -> removed this because it does not bring
	# any benefit and takes more than 12 mins

	# List of boards where this test can be run. Currently, it needs a
	# machines with at least 4GB of memory or 2GB of /tmp.
	# This must be consistent with chromite.
	GCC_BOARDS = ['lumpy']

	# Should be disjoint with GCC_BOARDS
	LLVM_BOARDS = ['chell', 'samus']

	class telemetry_AFDOGenerate(test.test):
	"""
	Run one or more telemetry benchmarks under the "perf" monitoring
	tool, generate a "perf.data" file and upload to GS for comsumption
	by the AFDO optimized build.
	"""
	version = 1


	def run_once(self, host, args):
	"""Run a set of telemetry benchmarks.

	@param host: Host machine where test is run
	@param args: A dictionary of the arguments that were passed
	to this test.
	@returns None.
	"""
	self._host = host
	host_board = host.get_board().split(':')[1]

	if not (host_board in LLVM_BOARDS or host_board in GCC_BOARDS):
	raise error.TestFail(
	'This test cannot be run on board %s' % host_board)

	self._parse_args(args)

	if self._minimal_telemetry:
	self._run_tests_minimal_telemetry()
	else:
	self._telemetry_runner = telemetry_runner.TelemetryRunner(
	self._host, self._local, telemetry_on_dut=False)

	for benchmark_info in TELEMETRY_AFDO_BENCHMARKS:
	benchmark = benchmark_info[0]
	args = () if len(benchmark_info) == 1 else benchmark_info[1]
	try:
	self._run_test_with_retry(benchmark, *args)
	except error.TestBaseException:
	if not self._ignore_failures:
	raise
	else:
	logging.info('Ignoring failure from benchmark %s.',
	benchmark)


	def after_run_once(self):
	"""After the profile information has been collected, compress it
	and upload it to GS
	"""
	PERF_FILE = 'perf.data'
	COMP_PERF_FILE = 'chromeos-chrome-%s-%s.perf.data'
	perf_data = os.path.join(self.profdir, PERF_FILE)
	comp_data = os.path.join(self.profdir, COMP_PERF_FILE % (
	self._arch, self._version))
	compressed = self._compress_file(perf_data, comp_data)
	self._gs_upload(compressed, os.path.basename(compressed))

	# Also create copy of this file using "LATEST" as version so
	# it can be found in case the builder is looking for a version
	# number that does not match. It is ok to use a slighly old
	# version of the this file for the optimized build
	latest_data = COMP_PERF_FILE % (self._arch, 'LATEST')
	latest_compressed = self._get_compressed_name(latest_data)
	self._gs_upload(compressed, latest_compressed)


	def _parse_args(self, args):
	"""Parses input arguments to this autotest.

	@param args: Options->values dictionary.
	@raises error.TestFail if a bad option is passed.
	"""

	# Set default values for the options.
	# Architecture for which we are collecting afdo data.
	self._arch = 'amd64'
	# Use an alternate GS location where everyone can write.
	# Set default depending on whether this is executing in
	# the lab environment or not
	self._gs_test_location = not utils.host_is_in_lab_zone(
	self._host.hostname)
	# Ignore individual test failures.
	self._ignore_failures = False
	# Use local copy of telemetry instead of using the dev server copy.
	self._local = False
	# Chrome version to which the AFDO data corresponds.
	self._version, _ = self._host.get_chrome_version()
	# Try to use the minimal support from Telemetry. The Telemetry
	# benchmarks in ChromeOS are too flaky at this point. So, initially,
	# this will be set to True by default.
	self._minimal_telemetry = False

	for option_name, value in args.iteritems():
	if option_name == 'arch':
	self._arch = value
	elif option_name == 'gs_test_location':
	self._gs_test_location = (value == 'True')
	elif option_name == 'ignore_failures':
	self._ignore_failures = (value == 'True')
	elif option_name == 'local':
	self._local = (value == 'True')
	elif option_name == 'minimal_telemetry':
	self._minimal_telemetry = (value == 'True')
	elif option_name == 'version':
	self._version = value
	else:
	raise error.TestFail('Unknown option passed: %s' % option_name)


	def _run_test(self, benchmark, *args):
	"""Run the benchmark using Telemetry.

	@param benchmark: Name of the benchmark to run.
	@param args: Additional arguments to pass to the telemetry execution
	script.
	@raises Raises error.TestFail if execution of test failed.
	Also re-raise any exceptions thrown by run_telemetry benchmark.
	"""
	try:
	logging.info('Starting run for Telemetry benchmark %s', benchmark)
	start_time = time.time()
	result = self._telemetry_runner.run_telemetry_benchmark(
	benchmark, None, *args)
	end_time = time.time()
	logging.info('Completed Telemetry benchmark %s in %f seconds',
	benchmark, end_time - start_time)
	except error.TestBaseException as e:
	end_time = time.time()
	logging.info('Got exception from Telemetry benchmark %s '
	'after %f seconds. Exception: %s',
	benchmark, end_time - start_time, str(e))
	raise

	# We dont generate any keyvals for this run. This is not
	# an official run of the benchmark. We are just running it to get
	# a profile from it.

	if result.status is telemetry_runner.SUCCESS_STATUS:
	logging.info('Benchmark %s succeeded', benchmark)
	else:
	raise error.TestFail('An error occurred while executing'
	' benchmark: %s' % benchmark)


	def _run_test_with_retry(self, benchmark, *args):
	"""Run the benchmark using Telemetry. Retry in case of failure.

	@param benchmark: Name of the benchmark to run.
	@param args: Additional arguments to pass to the telemetry execution
	script.
	@raises Re-raise any exceptions thrown by _run_test.
	"""

	tried = False
	while True:
	try:
	self._run_test(benchmark, *args)
	logging.info('Benchmark %s succeeded on %s try',
	benchmark,
	'first' if not tried else 'second')
	break
	except error.TestBaseException:
	if not tried:
	tried = True
	logging.info('Benchmark %s failed. Retrying ...',
	benchmark)
	else:
	logging.info('Benchmark %s failed twice. Not retrying',
	benchmark)
	raise


	def _run_tests_minimal_telemetry(self):
	"""Run the benchmarks using the minimal support from Telemetry.

	The benchmarks are run using a client side autotest test. This test
	will control Chrome directly using the chrome.Chrome support and it
	will ask Chrome to display the benchmark pages directly instead of
	using the "page sets" and "measurements" support from Telemetry.
	In this way we avoid using Telemetry benchmark support which is not
	stable on ChromeOS yet.
	"""
	AFDO_GENERATE_CLIENT_TEST = 'telemetry_AFDOGenerateClient'

	# We dont want to "inherit" the profiler settings for this test
	# to the client test. Doing so will end up in two instances of
	# the profiler (perf) being executed at the same time.
	# Filed a feature request about this. See crbug/342958.

	# Save the current settings for profilers.
	saved_profilers = self.job.profilers
	saved_default_profile_only = self.job.default_profile_only

	# Reset the state of the profilers.
	self.job.default_profile_only = False
	self.job.profilers = profilers.profilers(self.job)

	# Execute the client side test.
	client_at = autotest.Autotest(self._host)
	client_at.run_test(AFDO_GENERATE_CLIENT_TEST, args='')

	# Restore the settings for the profilers.
	self.job.default_profile_only = saved_default_profile_only
	self.job.profiler = saved_profilers


	@staticmethod
	def _get_compressed_name(name):
	"""Given a file name, return bz2 compressed name.
	@param name: Name of uncompressed file.
	@returns name of compressed file.
	"""
	return name + '.bz2'

	@staticmethod
	def _compress_file(unc_file, com_file):
	"""Compresses specified file with bz2.

	@param unc_file: name of file to compress.
	@param com_file: prefix name of compressed file.
	@raises error.TestFail if compression failed
	@returns Name of compressed file.
	"""
	dest = ''
	with open(unc_file, 'r') as inp:
	dest = telemetry_AFDOGenerate._get_compressed_name(com_file)
	with bz2.BZ2File(dest, 'w') as out:
	for data in inp:
	out.write(data)
	if not dest or not os.path.isfile(dest):
	raise error.TestFail('Could not compress %s' % unc_file)
	return dest


	def _gs_upload(self, local_file, remote_basename):
	"""Uploads file to google storage specific location.

	@param local_file: name of file to upload.
	@param remote_basename: basename of remote file.
	@raises error.TestFail if upload failed.
	@returns nothing.
	"""
	GS_GCC_DEST = 'gs://chromeos-prebuilt/afdo-job/canonicals/%s'
	GS_LLVM_DEST = 'gs://chromeos-prebuilt/afdo-job/llvm/%s'
	GS_TEST_DEST = 'gs://chromeos-throw-away-bucket/afdo-job/canonicals/%s'
	GS_ACL = 'project-private'

	board = self._host.get_board().split(':')[1]

	if self._gs_test_location:
	gs_dest = GS_TEST_DEST
	elif board in GCC_BOARDS:
	gs_dest = GS_GCC_DEST
	elif board in LLVM_BOARDS:
	gs_dest = GS_LLVM_DEST
	else:
	raise error.TestFail(
	'This test cannot be run on board %s' % board)

	remote_file = gs_dest % remote_basename

	logging.info('About to upload to GS: %s', remote_file)
	if not utils.gs_upload(local_file,
	remote_file,
	GS_ACL, result_dir=self.resultsdir):
	logging.info('Failed upload to GS: %s', remote_file)
	raise error.TestFail('Unable to gs upload %s to %s' %
	(local_file, remote_file))

	logging.info('Successfull upload to GS: %s', remote_file)