bootperf-bin/resultset.py - mirrors/cros/chromiumos/platform/crosutils - Git at Google

 # Copyright (c) 2010 The Chromium OS Authors. All rights reserved.
 # Use of this source code is governed by a BSD-style license that can be
 # found in the LICENSE file.

 """Classes and functions for managing platform_BootPerf results.

 Results from the platform_BootPerf test in the ChromiumOS autotest
 package are stored in as performance 'keyvals', that is, a mapping
 of names to numeric values.  For each iteration of the test, one
 set of keyvals is recorded.

 This module currently tracks two kinds of keyval results, the boot
 time results, and the disk read results.  These results are stored
 with keyval names such as 'seconds_kernel_to_login' and
 'rdbytes_kernel_to_login'.  Additionally, some older versions of the
 test produced keyval names such as 'sectors_read_kernel_to_login'.
 These keyvals record an accumulated total measured from a fixed
 time in the past (kernel startup), e.g. 'seconds_kernel_to_login'
 records the total seconds from kernel startup to login screen
 ready.

 The boot time keyval names all start with the prefix
 'seconds_kernel_to_', and record time in seconds since kernel
 startup.

 The disk read keyval names all start with the prefix
 'rdbytes_kernel_to_', and record bytes read from the boot device
 since kernel startup.  The obsolete disk keyvals start with the
 prefix 'sectors_read_kernel_to_' and record the same statistic
 measured in 512-byte sectors.

 Boot time and disk kevyal values have a consistent ordering
 across iterations.  For instance, if in one iteration the value of
 'seconds_kernel_to_login' is greater than the value of
 'seconds_kernel_to_x_started', then it will be greater in *all*
 iterations.  This property is a consequence of the underlying
 measurement procedure; it is not enforced by this module.

 """

 import math


 def _ListStats(list_):
   # Utility function - calculate the average and (sample) standard
   # deviation of a list of numbers.  Result is float, even if the
   # input list is full of int's
   sum_ = 0.0
   sumsq = 0.0
   for v in list_:
     sum_ += v
     sumsq += v * v
   n = len(list_)
   avg = sum_ / n
   var = (sumsq - sum_ * avg) / (n - 1)
   if var < 0.0:
     var = 0.0
   dev = math.sqrt(var)
   return (avg, dev)


 def _DoCheck(dict_):
   # Utility function - check the that all keyvals occur the same
   # number of times.  On success, return the number of occurrences;
   # on failure return None
   check = map(len, dict_.values())
   if not check:
     return None
   for i in range(1, len(check)):
     if check[i] != check[i-1]:
       return None
   return check[0]


 def _KeyDelta(dict_, key0, key1):
   # Utility function - return a list of the vector difference between
   # two keyvals.
   return map(lambda a, b: b - a, dict_[key0], dict_[key1])


 class TestResultSet(object):
   """A set of boot time and disk usage result statistics.

   Objects of this class consist of two sets of result statistics:
   the boot time statistics and the disk statistics.

   Class TestResultsSet does not interpret or store keyval mappings
   directly; iteration results are processed by attached _KeySet
   objects, one for boot time (`_timekeys`), one for disk read
   (`_diskkeys`).  These attached _KeySet objects can be obtained
   with appropriate methods; various methods on these objects will
   calculate statistics on the results, and provide the raw data.

   """

   def __init__(self, name):
     self.name = name
     self._timekeys = _TimeKeySet()
     self._diskkeys = _DiskKeySet()
     self._olddiskkeys = _OldDiskKeySet()

   def AddIterationResults(self, runkeys):
     """Add keyval results from a single iteration.

     A TestResultSet is constructed by repeatedly calling
     AddRunResults(), iteration by iteration.  Iteration results are
     passed in as a dictionary mapping keyval attributes to values.
     When all iteration results have been added, FinalizeResults()
     makes the results available for analysis.

     """

     self._timekeys.AddRunResults(runkeys)
     self._diskkeys.AddRunResults(runkeys)
     self._olddiskkeys.AddRunResults(runkeys)

   def FinalizeResults(self):
     """Make results available for analysis.

     A TestResultSet is constructed by repeatedly feeding it results,
     iteration by iteration.  Iteration results are passed in as a
     dictionary mapping keyval attributes to values.  When all iteration
     results have been added, FinalizeResults() makes the results
     available for analysis.

     """

     self._timekeys.FinalizeResults()
     if not self._diskkeys.FinalizeResults():
       self._olddiskkeys.FinalizeResults()
       self._diskkeys = self._olddiskkeys
     self._olddiskkeys = None

   def TimeKeySet(self):
     """Return the boot time statistics result set."""
     return self._timekeys

   def DiskKeySet(self):
     """Return the disk read statistics result set."""
     return self._diskkeys


 class _KeySet(object):
   """Container for a set of related statistics.

   _KeySet is an abstract superclass for containing collections of
   either boot time or disk read statistics.  Statistics are stored
   as a dictionary (`_keyvals`) mapping keyval names to lists of
   values.

   The mapped keyval names are shortened by stripping the prefix
   that identifies the type of prefix (keyvals that don't start with
   the proper prefix are ignored).  So, for example, with boot time
   keyvals, 'seconds_kernel_to_login' becomes 'login' (and
   'rdbytes_kernel_to_login' is ignored).

   A list of all valid keyval names is stored in the `markers`
   instance variable.  The list is sorted by the natural ordering of
   the underlying values (see the module comments for more details).

   The list of values associated with a given keyval name are indexed
   in the order in which they were added.  So, all values for a given
   iteration are stored at the same index.

   """

   def __init__(self):
     self._keyvals = {}

   def AddRunResults(self, runkeys):
     """Add results for one iteration."""

     for key, value in runkeys.iteritems():
       if not key.startswith(self.PREFIX):
         continue
       shortkey = key[len(self.PREFIX):]
       keylist = self._keyvals.setdefault(shortkey, [])
       keylist.append(self._ConvertVal(value))

   def FinalizeResults(self):
     """Finalize this object's results.

     This method makes available the `markers` and `num_iterations`
     instance variables.  It also ensures that every keyval occurred
     in every iteration by requiring that all keyvals have the same
     number of data points.

     """

     count = _DoCheck(self._keyvals)
     if count is None:
       self.num_iterations = 0
       self.markers = []
       return False
     self.num_iterations = count
     keylist = map(lambda k: (self._keyvals[k][0], k),
                   self._keyvals.keys())
     keylist.sort(key=lambda tp: tp[0])
     self.markers = map(lambda tp: tp[1], keylist)
     return True

   def RawData(self, key):
     """Return the list of values for the given marker key."""
     return self._keyvals[key]

   def DeltaData(self, key0, key1):
     """Return vector difference of the values of the given keys."""
     return _KeyDelta(self._keyvals, key0, key1)

   def Statistics(self, key):
     """Return the average and standard deviation of the key's values."""
     return _ListStats(self._keyvals[key])

   def DeltaStatistics(self, key0, key1):
     """Return the average and standard deviation of the differences
     between two keys.

     """

     return _ListStats(self.DeltaData(key0, key1))


 class _TimeKeySet(_KeySet):
   """Concrete subclass of _KeySet for boot time statistics."""

   # TIME_KEY_PREFIX = 'seconds_kernel_to_'
   PREFIX = 'seconds_kernel_to_'

   # Time-based keyvals are reported in seconds and get converted to
   # milliseconds
   TIME_SCALE = 1000

   def _ConvertVal(self, value):
     # We use a "round to nearest int" formula here to make sure we
     # don't lose anything in the conversion from decimal.
     return int(self.TIME_SCALE * float(value) + 0.5)

   def PrintableStatistic(self, value):
     v = int(value + 0.5)
     return ("%d" % v, v)


 class _DiskKeySet(_KeySet):
   """Concrete subclass of _KeySet for disk read statistics."""

   PREFIX = 'rdbytes_kernel_to_'

   # Disk read keyvals are reported in bytes and get converted to
   # MBytes (1 MByte = 1 million bytes, not 2**20)
   DISK_SCALE = 1.0e-6

   def _ConvertVal(self, value):
     return self.DISK_SCALE * float(value)

   def PrintableStatistic(self, value):
     v = round(value, 1)
     return ("%.1fM" % v, v)


 class _OldDiskKeySet(_DiskKeySet):
   """Concrete subclass of _KeySet for the old-style disk read statistics."""

   # Older versions of platform_BootPerf reported total sectors read
   # using names of the form sectors_read_kernel_to_* (instead of the
   # more recent rdbytes_kernel_to_*), but some of those names
   # exceeded the 30-character limit in the MySQL database schema.
   PREFIX = 'sectors_read_kernel_to_'

   # Old sytle disk read keyvals are reported in 512-byte sectors and
   # get converted to MBytes (1 MByte = 1 million bytes, not 2**20)
   SECTOR_SCALE = 512 * _DiskKeySet.DISK_SCALE

   def _ConvertVal(self, value):
     return self.SECTOR_SCALE * float(value)
	# Copyright (c) 2010 The Chromium OS Authors. All rights reserved.
	# Use of this source code is governed by a BSD-style license that can be
	# found in the LICENSE file.

	"""Classes and functions for managing platform_BootPerf results.

	Results from the platform_BootPerf test in the ChromiumOS autotest
	package are stored in as performance 'keyvals', that is, a mapping
	of names to numeric values. For each iteration of the test, one
	set of keyvals is recorded.

	This module currently tracks two kinds of keyval results, the boot
	time results, and the disk read results. These results are stored
	with keyval names such as 'seconds_kernel_to_login' and
	'rdbytes_kernel_to_login'. Additionally, some older versions of the
	test produced keyval names such as 'sectors_read_kernel_to_login'.
	These keyvals record an accumulated total measured from a fixed
	time in the past (kernel startup), e.g. 'seconds_kernel_to_login'
	records the total seconds from kernel startup to login screen
	ready.

	The boot time keyval names all start with the prefix
	'seconds_kernel_to_', and record time in seconds since kernel
	startup.

	The disk read keyval names all start with the prefix
	'rdbytes_kernel_to_', and record bytes read from the boot device
	since kernel startup. The obsolete disk keyvals start with the
	prefix 'sectors_read_kernel_to_' and record the same statistic
	measured in 512-byte sectors.

	Boot time and disk kevyal values have a consistent ordering
	across iterations. For instance, if in one iteration the value of
	'seconds_kernel_to_login' is greater than the value of
	'seconds_kernel_to_x_started', then it will be greater in all
	iterations. This property is a consequence of the underlying
	measurement procedure; it is not enforced by this module.

	"""

	import math


	def _ListStats(list_):
	# Utility function - calculate the average and (sample) standard
	# deviation of a list of numbers. Result is float, even if the
	# input list is full of int's
	sum_ = 0.0
	sumsq = 0.0
	for v in list_:
	sum_ += v
	sumsq += v * v
	n = len(list_)
	avg = sum_ / n
	var = (sumsq - sum_ * avg) / (n - 1)
	if var < 0.0:
	var = 0.0
	dev = math.sqrt(var)
	return (avg, dev)


	def _DoCheck(dict_):
	# Utility function - check the that all keyvals occur the same
	# number of times. On success, return the number of occurrences;
	# on failure return None
	check = map(len, dict_.values())
	if not check:
	return None
	for i in range(1, len(check)):
	if check[i] != check[i-1]:
	return None
	return check[0]


	def _KeyDelta(dict_, key0, key1):
	# Utility function - return a list of the vector difference between
	# two keyvals.
	return map(lambda a, b: b - a, dict_[key0], dict_[key1])


	class TestResultSet(object):
	"""A set of boot time and disk usage result statistics.

	Objects of this class consist of two sets of result statistics:
	the boot time statistics and the disk statistics.

	Class TestResultsSet does not interpret or store keyval mappings
	directly; iteration results are processed by attached _KeySet
	objects, one for boot time (`_timekeys`), one for disk read
	(`_diskkeys`). These attached _KeySet objects can be obtained
	with appropriate methods; various methods on these objects will
	calculate statistics on the results, and provide the raw data.

	"""

	def __init__(self, name):
	self.name = name
	self._timekeys = _TimeKeySet()
	self._diskkeys = _DiskKeySet()
	self._olddiskkeys = _OldDiskKeySet()

	def AddIterationResults(self, runkeys):
	"""Add keyval results from a single iteration.

	A TestResultSet is constructed by repeatedly calling
	AddRunResults(), iteration by iteration. Iteration results are
	passed in as a dictionary mapping keyval attributes to values.
	When all iteration results have been added, FinalizeResults()
	makes the results available for analysis.

	"""

	self._timekeys.AddRunResults(runkeys)
	self._diskkeys.AddRunResults(runkeys)
	self._olddiskkeys.AddRunResults(runkeys)

	def FinalizeResults(self):
	"""Make results available for analysis.

	A TestResultSet is constructed by repeatedly feeding it results,
	iteration by iteration. Iteration results are passed in as a
	dictionary mapping keyval attributes to values. When all iteration
	results have been added, FinalizeResults() makes the results
	available for analysis.

	"""

	self._timekeys.FinalizeResults()
	if not self._diskkeys.FinalizeResults():
	self._olddiskkeys.FinalizeResults()
	self._diskkeys = self._olddiskkeys
	self._olddiskkeys = None

	def TimeKeySet(self):
	"""Return the boot time statistics result set."""
	return self._timekeys

	def DiskKeySet(self):
	"""Return the disk read statistics result set."""
	return self._diskkeys


	class _KeySet(object):
	"""Container for a set of related statistics.

	_KeySet is an abstract superclass for containing collections of
	either boot time or disk read statistics. Statistics are stored
	as a dictionary (`_keyvals`) mapping keyval names to lists of
	values.

	The mapped keyval names are shortened by stripping the prefix
	that identifies the type of prefix (keyvals that don't start with
	the proper prefix are ignored). So, for example, with boot time
	keyvals, 'seconds_kernel_to_login' becomes 'login' (and
	'rdbytes_kernel_to_login' is ignored).

	A list of all valid keyval names is stored in the `markers`
	instance variable. The list is sorted by the natural ordering of
	the underlying values (see the module comments for more details).

	The list of values associated with a given keyval name are indexed
	in the order in which they were added. So, all values for a given
	iteration are stored at the same index.

	"""

	def __init__(self):
	self._keyvals = {}

	def AddRunResults(self, runkeys):
	"""Add results for one iteration."""

	for key, value in runkeys.iteritems():
	if not key.startswith(self.PREFIX):
	continue
	shortkey = key[len(self.PREFIX):]
	keylist = self._keyvals.setdefault(shortkey, [])
	keylist.append(self._ConvertVal(value))

	def FinalizeResults(self):
	"""Finalize this object's results.

	This method makes available the `markers` and `num_iterations`
	instance variables. It also ensures that every keyval occurred
	in every iteration by requiring that all keyvals have the same
	number of data points.

	"""

	count = _DoCheck(self._keyvals)
	if count is None:
	self.num_iterations = 0
	self.markers = []
	return False
	self.num_iterations = count
	keylist = map(lambda k: (self._keyvals[k][0], k),
	self._keyvals.keys())
	keylist.sort(key=lambda tp: tp[0])
	self.markers = map(lambda tp: tp[1], keylist)
	return True

	def RawData(self, key):
	"""Return the list of values for the given marker key."""
	return self._keyvals[key]

	def DeltaData(self, key0, key1):
	"""Return vector difference of the values of the given keys."""
	return _KeyDelta(self._keyvals, key0, key1)

	def Statistics(self, key):
	"""Return the average and standard deviation of the key's values."""
	return _ListStats(self._keyvals[key])

	def DeltaStatistics(self, key0, key1):
	"""Return the average and standard deviation of the differences
	between two keys.

	"""

	return _ListStats(self.DeltaData(key0, key1))


	class _TimeKeySet(_KeySet):
	"""Concrete subclass of _KeySet for boot time statistics."""

	# TIME_KEY_PREFIX = 'seconds_kernel_to_'
	PREFIX = 'seconds_kernel_to_'

	# Time-based keyvals are reported in seconds and get converted to
	# milliseconds
	TIME_SCALE = 1000

	def _ConvertVal(self, value):
	# We use a "round to nearest int" formula here to make sure we
	# don't lose anything in the conversion from decimal.
	return int(self.TIME_SCALE * float(value) + 0.5)

	def PrintableStatistic(self, value):
	v = int(value + 0.5)
	return ("%d" % v, v)


	class _DiskKeySet(_KeySet):
	"""Concrete subclass of _KeySet for disk read statistics."""

	PREFIX = 'rdbytes_kernel_to_'

	# Disk read keyvals are reported in bytes and get converted to
	# MBytes (1 MByte = 1 million bytes, not 2**20)
	DISK_SCALE = 1.0e-6

	def _ConvertVal(self, value):
	return self.DISK_SCALE * float(value)

	def PrintableStatistic(self, value):
	v = round(value, 1)
	return ("%.1fM" % v, v)


	class _OldDiskKeySet(_DiskKeySet):
	"""Concrete subclass of _KeySet for the old-style disk read statistics."""

	# Older versions of platform_BootPerf reported total sectors read
	# using names of the form sectors_read_kernel_to_* (instead of the
	# more recent rdbytes_kernel_to_*), but some of those names
	# exceeded the 30-character limit in the MySQL database schema.
	PREFIX = 'sectors_read_kernel_to_'

	# Old sytle disk read keyvals are reported in 512-byte sectors and
	# get converted to MBytes (1 MByte = 1 million bytes, not 2**20)
	SECTOR_SCALE = 512 * _DiskKeySet.DISK_SCALE

	def _ConvertVal(self, value):
	return self.SECTOR_SCALE * float(value)