catapult/dashboard/dashboard/find_change_points_test.py - platform/external/chromium-trace - Git at Google

 # Copyright 2015 The Chromium Authors. All rights reserved.
 # Use of this source code is governed by a BSD-style license that can be
 # found in the LICENSE file.

 import unittest

 from dashboard import find_change_points
 from dashboard import math_utils


 class FindChangePointsTest(unittest.TestCase):

   def testFindChangePoints(self):
     # Simple test that the output is as expected for a clear change.
     # Tests for specific aspects of the algorithm are below.
     data = [1, 1, 2, 1, 1, 8, 8, 8, 9, 8, 9]
     series = list(enumerate(data))
     expected = [
         find_change_points.ChangePoint(
             x_value=5,
             median_before=1,
             median_after=8,
             window_start=1,
             window_end=10,
             size_before=4,
             size_after=6,
             relative_change=7,
             std_dev_before=0.4330127018922193,
             t_statistic=-24.452628375754593,
             degrees_of_freedom=6.9938793160801023,
             p_value=0.001)
     ]
     actual = find_change_points.FindChangePoints(
         series,
         max_window_size=10,
         multiple_of_std_dev=3,
         min_relative_change=0.5,
         min_absolute_change=1,
         min_steppiness=0.4,
         min_segment_size=3)
     self.assertEqual(expected, actual)

   def testFindChangePoints_EmptySeries(self):
     # For an empty series, there are certainly no change points.
     self.assertEqual([], find_change_points.FindChangePoints([]))

   def testFindSplit(self):
     # Find split returns the first index of the segment after the split.
     self.assertEqual(3, find_change_points._FindSplit([3, 2, 3, 5, 6, 5]))

     # If there are several splits that are equally interesting, or no
     # interesting splits, then the first one is returned.
     self.assertEqual(2, find_change_points._FindSplit([2, 2, 4, 4, 6, 6]))
     self.assertEqual(1, find_change_points._FindSplit([4, 4, 4, 4, 4, 4]))

   def _PassesThresholds(
       self, data, index, multiple_of_std_dev=0, min_relative_change=0,
       min_absolute_change=0, min_segment_size=0, min_steppiness=0):
     """Tests whether a split passes the thresholds with the given parameters."""
     # All of the threshold parameters are set to zero by default here, so that
     # we can test just one threshold at a time.
     return find_change_points._PassesThresholds(
         data, index,
         min_segment_size=min_segment_size,
         min_absolute_change=min_absolute_change,
         min_relative_change=min_relative_change,
         min_steppiness=min_steppiness,
         multiple_of_std_dev=multiple_of_std_dev)

   def testIsAnomalous_FiltersOnSegmentSize(self):
     sample = [1, 1, 5, 5, 5, 9, 9]
     self.assertFalse(self._PassesThresholds(sample, 2, min_segment_size=3))
     self.assertFalse(self._PassesThresholds(sample, 5, min_segment_size=3))
     self.assertTrue(self._PassesThresholds(sample, 2, min_segment_size=2))
     self.assertTrue(self._PassesThresholds(sample, 5, min_segment_size=2))

   def testIsAnomalous_FiltersOnAbsoluteChange(self):
     sample = [2, 2, 2, 4, 4, 4, 4, 8, 8, 8]
     self.assertTrue(self._PassesThresholds(sample, 7))
     self.assertTrue(self._PassesThresholds(sample, 7, min_absolute_change=4))
     self.assertFalse(self._PassesThresholds(sample, 3, min_absolute_change=4))

   def testIsAnomalous_FiltersOnRelativeChange(self):
     sample = [2, 2, 2, 6, 6, 6, 6, 10, 10, 10]
     self.assertTrue(self._PassesThresholds(sample, 3))
     self.assertTrue(self._PassesThresholds(sample, 3, min_relative_change=1))
     self.assertFalse(self._PassesThresholds(sample, 7, min_relative_change=1))

   def testIsAnomalous_FiltersOnMultipleOfStdDev(self):
     # In the first sample, the standard deviation on either side of index 5
     # is between 2 and 4. In the second sample, the standard deviation within
     # each of the two segments is 0.
     noisy = [2, 8, 5, 1, 7, 13, 19, 10, 15, 17]
     steady = [5, 5, 5, 5, 5, 15, 15, 15, 15, 15]
     self.assertTrue(self._PassesThresholds(steady, 5, multiple_of_std_dev=1))
     self.assertTrue(self._PassesThresholds(steady, 5, multiple_of_std_dev=8))
     self.assertTrue(self._PassesThresholds(noisy, 5, multiple_of_std_dev=1))
     self.assertFalse(self._PassesThresholds(noisy, 5, multiple_of_std_dev=8))

   def testIsAnomalous_MultipleOfStdDevFilter_LowOnOneSide(self):
     # The standard deviation to use is the lower of the standard deviations
     # of the two sides, so if either side doesn't have a high standard
     # deviation then an alert can be fired.
     left = [3, 2, 3, 4, 3, 5, 30, 1, 50, 10]
     right = [5, 30, 1, 50, 10, 3, 2, 3, 4, 3]
     # Note that stddev([3, 2, 3, 4, 3]) is less than 1, and the difference
     # between the medians of the two sides is 7.
     self.assertTrue(self._PassesThresholds(left, 5, multiple_of_std_dev=7))
     self.assertTrue(self._PassesThresholds(right, 5, multiple_of_std_dev=7))

   def testZeroMedian_ReturnsValuesWithMedianEqualToZero(self):
     # The _ZeroMedian function adjusts values so that the median is zero.
     self.assertEqual([0, 0, 1], find_change_points._ZeroMedian([1, 1, 2]))
     self.assertEqual([-0.5, 0.5], find_change_points._ZeroMedian([45, 46]))

   def testZeroMedian_ResultProperties(self):
     nums = [3.4, 8, 100.2, 78, 3, -4, 12, 3.14, 1024]
     zeroed_nums = find_change_points._ZeroMedian(nums)
     # The output of _ZeroMedian has the same standard deviation as the input.
     self.assertEqual(
         math_utils.StandardDeviation(nums),
         math_utils.StandardDeviation(zeroed_nums))
     # Also, the median of the output is always zero.
     self.assertEqual(0, math_utils.Median(zeroed_nums))

   def _AssertFindsChangePoints(
       self, y_values, expected_indexes, max_window_size=50, min_segment_size=6,
       min_absolute_change=0, min_relative_change=0.01, min_steppiness=0.4,
       multiple_of_std_dev=2.5):
     """Asserts that change points are found at particular indexes."""
     series = list(enumerate(y_values))
     results = find_change_points.FindChangePoints(
         series,
         max_window_size=max_window_size,
         min_segment_size=min_segment_size,
         min_absolute_change=min_absolute_change,
         min_relative_change=min_relative_change,
         min_steppiness=min_steppiness,
         multiple_of_std_dev=multiple_of_std_dev)
     actual_indexes = [a.x_value for a in results]
     self.assertEqual(expected_indexes, actual_indexes)

   def testFindChangePoints_ShortSequences(self):
     self._AssertFindsChangePoints(
         [1, 1, 1, 5, 5, 5, 5, 9, 9, 9], [3],
         max_window_size=10, min_segment_size=3)
     self._AssertFindsChangePoints(
         [1, 1, 5, 5, 5, 5, 9, 9, 9, 9], [6],
         max_window_size=10, min_segment_size=3)
     self._AssertFindsChangePoints(
         [1, 1, 1, 1, 5, 5, 5, 5, 9, 9, 9], [8],
         max_window_size=11, min_segment_size=3)
     self._AssertFindsChangePoints(
         [1, 1, 1, 5, 5, 5, 5, 9, 9, 9, 9], [3],
         max_window_size=11, min_segment_size=3)
     self._AssertFindsChangePoints(
         [1, 1, 5, 5, 5, 5, 9, 9, 9, 9, 9], [6],
         max_window_size=11, min_segment_size=3)

   def testChangePoint_CanBeMadeAndConvertedToDict(self):
     series = list(enumerate([4, 4, 4, 8, 8, 8, 8]))
     change_point = find_change_points.MakeChangePoint(series, 3)
     self.assertEqual(
         find_change_points.ChangePoint(
             x_value=3, median_before=4.0, median_after=8.0, size_before=3,
             size_after=4, window_start=0, window_end=6, relative_change=1.0,
             std_dev_before=0.0, t_statistic=float('inf'),
             degrees_of_freedom=1.0, p_value=0.001),
         change_point)
     self.assertEqual(
         {
             'x_value': 3,
             'median_before': 4.0,
             'median_after': 8.0,
             'size_before': 3,
             'size_after': 4,
             'window_start': 0,
             'window_end': 6,
             'relative_change': 1.0,
             'std_dev_before': 0.0,
             't_statistic': float('inf'),
             'degrees_of_freedom': 1.0,
             'p_value': 0.001,
         },
         change_point.AsDict())


 # Run this module's tests when the file is executed directly.
 if __name__ == '__main__':
   unittest.main()
	# Copyright 2015 The Chromium Authors. All rights reserved.
	# Use of this source code is governed by a BSD-style license that can be
	# found in the LICENSE file.

	import unittest

	from dashboard import find_change_points
	from dashboard import math_utils


	class FindChangePointsTest(unittest.TestCase):

	def testFindChangePoints(self):
	# Simple test that the output is as expected for a clear change.
	# Tests for specific aspects of the algorithm are below.
	data = [1, 1, 2, 1, 1, 8, 8, 8, 9, 8, 9]
	series = list(enumerate(data))
	expected = [
	find_change_points.ChangePoint(
	x_value=5,
	median_before=1,
	median_after=8,
	window_start=1,
	window_end=10,
	size_before=4,
	size_after=6,
	relative_change=7,
	std_dev_before=0.4330127018922193,
	t_statistic=-24.452628375754593,
	degrees_of_freedom=6.9938793160801023,
	p_value=0.001)
	]
	actual = find_change_points.FindChangePoints(
	series,
	max_window_size=10,
	multiple_of_std_dev=3,
	min_relative_change=0.5,
	min_absolute_change=1,
	min_steppiness=0.4,
	min_segment_size=3)
	self.assertEqual(expected, actual)

	def testFindChangePoints_EmptySeries(self):
	# For an empty series, there are certainly no change points.
	self.assertEqual([], find_change_points.FindChangePoints([]))

	def testFindSplit(self):
	# Find split returns the first index of the segment after the split.
	self.assertEqual(3, find_change_points._FindSplit([3, 2, 3, 5, 6, 5]))

	# If there are several splits that are equally interesting, or no
	# interesting splits, then the first one is returned.
	self.assertEqual(2, find_change_points._FindSplit([2, 2, 4, 4, 6, 6]))
	self.assertEqual(1, find_change_points._FindSplit([4, 4, 4, 4, 4, 4]))

	def _PassesThresholds(
	self, data, index, multiple_of_std_dev=0, min_relative_change=0,
	min_absolute_change=0, min_segment_size=0, min_steppiness=0):
	"""Tests whether a split passes the thresholds with the given parameters."""
	# All of the threshold parameters are set to zero by default here, so that
	# we can test just one threshold at a time.
	return find_change_points._PassesThresholds(
	data, index,
	min_segment_size=min_segment_size,
	min_absolute_change=min_absolute_change,
	min_relative_change=min_relative_change,
	min_steppiness=min_steppiness,
	multiple_of_std_dev=multiple_of_std_dev)

	def testIsAnomalous_FiltersOnSegmentSize(self):
	sample = [1, 1, 5, 5, 5, 9, 9]
	self.assertFalse(self._PassesThresholds(sample, 2, min_segment_size=3))
	self.assertFalse(self._PassesThresholds(sample, 5, min_segment_size=3))
	self.assertTrue(self._PassesThresholds(sample, 2, min_segment_size=2))
	self.assertTrue(self._PassesThresholds(sample, 5, min_segment_size=2))

	def testIsAnomalous_FiltersOnAbsoluteChange(self):
	sample = [2, 2, 2, 4, 4, 4, 4, 8, 8, 8]
	self.assertTrue(self._PassesThresholds(sample, 7))
	self.assertTrue(self._PassesThresholds(sample, 7, min_absolute_change=4))
	self.assertFalse(self._PassesThresholds(sample, 3, min_absolute_change=4))

	def testIsAnomalous_FiltersOnRelativeChange(self):
	sample = [2, 2, 2, 6, 6, 6, 6, 10, 10, 10]
	self.assertTrue(self._PassesThresholds(sample, 3))
	self.assertTrue(self._PassesThresholds(sample, 3, min_relative_change=1))
	self.assertFalse(self._PassesThresholds(sample, 7, min_relative_change=1))

	def testIsAnomalous_FiltersOnMultipleOfStdDev(self):
	# In the first sample, the standard deviation on either side of index 5
	# is between 2 and 4. In the second sample, the standard deviation within
	# each of the two segments is 0.
	noisy = [2, 8, 5, 1, 7, 13, 19, 10, 15, 17]
	steady = [5, 5, 5, 5, 5, 15, 15, 15, 15, 15]
	self.assertTrue(self._PassesThresholds(steady, 5, multiple_of_std_dev=1))
	self.assertTrue(self._PassesThresholds(steady, 5, multiple_of_std_dev=8))
	self.assertTrue(self._PassesThresholds(noisy, 5, multiple_of_std_dev=1))
	self.assertFalse(self._PassesThresholds(noisy, 5, multiple_of_std_dev=8))

	def testIsAnomalous_MultipleOfStdDevFilter_LowOnOneSide(self):
	# The standard deviation to use is the lower of the standard deviations
	# of the two sides, so if either side doesn't have a high standard
	# deviation then an alert can be fired.
	left = [3, 2, 3, 4, 3, 5, 30, 1, 50, 10]
	right = [5, 30, 1, 50, 10, 3, 2, 3, 4, 3]
	# Note that stddev([3, 2, 3, 4, 3]) is less than 1, and the difference
	# between the medians of the two sides is 7.
	self.assertTrue(self._PassesThresholds(left, 5, multiple_of_std_dev=7))
	self.assertTrue(self._PassesThresholds(right, 5, multiple_of_std_dev=7))

	def testZeroMedian_ReturnsValuesWithMedianEqualToZero(self):
	# The _ZeroMedian function adjusts values so that the median is zero.
	self.assertEqual([0, 0, 1], find_change_points._ZeroMedian([1, 1, 2]))
	self.assertEqual([-0.5, 0.5], find_change_points._ZeroMedian([45, 46]))

	def testZeroMedian_ResultProperties(self):
	nums = [3.4, 8, 100.2, 78, 3, -4, 12, 3.14, 1024]
	zeroed_nums = find_change_points._ZeroMedian(nums)
	# The output of _ZeroMedian has the same standard deviation as the input.
	self.assertEqual(
	math_utils.StandardDeviation(nums),
	math_utils.StandardDeviation(zeroed_nums))
	# Also, the median of the output is always zero.
	self.assertEqual(0, math_utils.Median(zeroed_nums))

	def _AssertFindsChangePoints(
	self, y_values, expected_indexes, max_window_size=50, min_segment_size=6,
	min_absolute_change=0, min_relative_change=0.01, min_steppiness=0.4,
	multiple_of_std_dev=2.5):
	"""Asserts that change points are found at particular indexes."""
	series = list(enumerate(y_values))
	results = find_change_points.FindChangePoints(
	series,
	max_window_size=max_window_size,
	min_segment_size=min_segment_size,
	min_absolute_change=min_absolute_change,
	min_relative_change=min_relative_change,
	min_steppiness=min_steppiness,
	multiple_of_std_dev=multiple_of_std_dev)
	actual_indexes = [a.x_value for a in results]
	self.assertEqual(expected_indexes, actual_indexes)

	def testFindChangePoints_ShortSequences(self):
	self._AssertFindsChangePoints(
	[1, 1, 1, 5, 5, 5, 5, 9, 9, 9], [3],
	max_window_size=10, min_segment_size=3)
	self._AssertFindsChangePoints(
	[1, 1, 5, 5, 5, 5, 9, 9, 9, 9], [6],
	max_window_size=10, min_segment_size=3)
	self._AssertFindsChangePoints(
	[1, 1, 1, 1, 5, 5, 5, 5, 9, 9, 9], [8],
	max_window_size=11, min_segment_size=3)
	self._AssertFindsChangePoints(
	[1, 1, 1, 5, 5, 5, 5, 9, 9, 9, 9], [3],
	max_window_size=11, min_segment_size=3)
	self._AssertFindsChangePoints(
	[1, 1, 5, 5, 5, 5, 9, 9, 9, 9, 9], [6],
	max_window_size=11, min_segment_size=3)

	def testChangePoint_CanBeMadeAndConvertedToDict(self):
	series = list(enumerate([4, 4, 4, 8, 8, 8, 8]))
	change_point = find_change_points.MakeChangePoint(series, 3)
	self.assertEqual(
	find_change_points.ChangePoint(
	x_value=3, median_before=4.0, median_after=8.0, size_before=3,
	size_after=4, window_start=0, window_end=6, relative_change=1.0,
	std_dev_before=0.0, t_statistic=float('inf'),
	degrees_of_freedom=1.0, p_value=0.001),
	change_point)
	self.assertEqual(
	{
	'x_value': 3,
	'median_before': 4.0,
	'median_after': 8.0,
	'size_before': 3,
	'size_after': 4,
	'window_start': 0,
	'window_end': 6,
	'relative_change': 1.0,
	'std_dev_before': 0.0,
	't_statistic': float('inf'),
	'degrees_of_freedom': 1.0,
	'p_value': 0.001,
	},
	change_point.AsDict())


	# Run this module's tests when the file is executed directly.
	if __name__ == '__main__':
	  unittest.main()