Files
mongo/buildscripts/tests/test_update_test_lifecycle.py
2019-04-08 14:08:49 -04:00

1122 lines
44 KiB
Python

"""
Tests for buildscripts/update_test_lifecycle.py.
"""
import collections
import copy
import datetime
import unittest
from buildscripts import update_test_lifecycle as utl
from buildscripts.ciconfig import tags as ci_tags
# pylint: disable=invalid-name,missing-docstring,protected-access,too-many-lines
class TestTestCombination(unittest.TestCase):
    """
    Tests for the utl.TestCombination class.
    """

    # Full (test, task, variant, distro) argument list; the tests also exercise its prefixes.
    _ARGS = ("test1", "task1", "variant1", "distro1")

    @classmethod
    def _arg_prefixes(cls):
        """
        Yields the prefixes of _ARGS from the longest (all four values) down to the shortest
        (only the test name).
        """
        for size in range(len(cls._ARGS), 0, -1):
            yield cls._ARGS[:size]

    def test_equal(self):
        """
        Tests that two combinations built from the same arguments compare equal both ways.
        """
        for args in self._arg_prefixes():
            first = utl.TestCombination(*args)
            second = utl.TestCombination(*args)
            self.assertTrue(first == second)
            self.assertTrue(second == first)

    def test_properties(self):
        """
        Tests that each constructor argument is exposed through the matching property.
        """
        combination = utl.TestCombination("test1", "task1", "variant1", "distro1")
        self.assertEqual("test1", combination.test)
        self.assertEqual("task1", combination.task)
        self.assertEqual("variant1", combination.variant)
        self.assertEqual("distro1", combination.distro)

    def test_equal_group_by(self):
        """
        Tests that 'group_by' reflects how many of the arguments were supplied.
        """
        # Ordered to match _arg_prefixes(): four arguments first, one argument last.
        # yapf: disable
        expected_group_by = [
            utl.TestCombination.GROUP_BY_DISTRO,
            utl.TestCombination.GROUP_BY_VARIANT,
            utl.TestCombination.GROUP_BY_TASK,
            utl.TestCombination.GROUP_BY_TEST,
        ]
        # yapf: enable
        for args, group_by in zip(self._arg_prefixes(), expected_group_by):
            first = utl.TestCombination(*args)
            second = utl.TestCombination(*args)
            self.assertTrue(first == second)
            self.assertTrue(second == first)
            self.assertEqual(group_by, first.group_by)

    def test_tag(self):
        """
        Tests that 'tag' is "unreliable" followed by the supplied task, variant and distro.
        """
        # Ordered to match _arg_prefixes(): four arguments first, one argument last.
        expected_tags = [
            "unreliable|task1|variant1|distro1",
            "unreliable|task1|variant1",
            "unreliable|task1",
            "unreliable",
        ]
        for args, tag in zip(self._arg_prefixes(), expected_tags):
            self.assertEqual(tag, utl.TestCombination(*args).tag)

    def test_from_tag(self):
        """
        Tests that from_tag() builds the combination described by a tag string.
        """
        test = "testA"
        cases = [
            ("unreliable", (None, None, None)),
            ("unreliable|taskA", ("taskA", None, None)),
            ("unreliable|taskA|variantA", ("taskA", "variantA", None)),
            ("unreliable|taskA|variantA|distroA", ("taskA", "variantA", "distroA")),
        ]
        for tag, (task, variant, distro) in cases:
            combination = utl.TestCombination.from_tag(test, tag)
            self.assertEqual(combination, utl.TestCombination(test, task, variant, distro))
class TestTestHistory(unittest.TestCase):
    """
    Tests for utl.TestHistory.get_reliable_period_rates() at each 'group_by' level.
    """

    @staticmethod
    def _stat(task, variant, distro, num_pass, num_fail):
        """
        Returns one stats entry for "test1.js" in the dict layout passed to
        add_reliable_period_stats().
        """
        return {
            "test_file": "test1.js", "task_name": task, "variant": variant, "distro": distro,
            "num_pass": num_pass, "num_fail": num_fail
        }

    def _assert_rates(self, group_by, stats, expected):
        """
        Loads 'stats' as the reliable period of "test1.js" and checks that the rates computed
        with the given 'group_by' equal 'expected'.
        """
        history = utl.TestHistory("test1.js")
        history.add_reliable_period_stats(stats)
        rates = history.get_reliable_period_rates(group_by=group_by)
        self.assertListEqual(expected, rates)

    def test_get_rates_by_distro(self):
        stats = [
            self._stat("task1", "v", "d1", 1, 0),
            self._stat("task1", "v", "d1", 0, 1),
            self._stat("task1", "v", "d2", 0, 1),
            self._stat("task2", "v", "d2", 1, 0),
        ]
        expected = [
            (utl.TestCombination("test1.js", "task1", "v", "d1"), 0.5, 2),
            (utl.TestCombination("test1.js", "task1", "v", "d2"), 1.0, 1),
            (utl.TestCombination("test1.js", "task2", "v", "d2"), 0.0, 1),
        ]
        self._assert_rates(utl.TestCombination.GROUP_BY_DISTRO, stats, expected)

    def test_get_rates_by_variant(self):
        stats = [
            self._stat("task1", "v1", "d1", 1, 0),
            self._stat("task1", "v1", "d2", 0, 1),
            self._stat("task1", "v2", "d2", 0, 1),
            self._stat("task2", "v2", "d2", 1, 0),
        ]
        expected = [
            (utl.TestCombination("test1.js", "task1", "v1", None), 0.5, 2),
            (utl.TestCombination("test1.js", "task1", "v2", None), 1.0, 1),
            (utl.TestCombination("test1.js", "task2", "v2", None), 0.0, 1),
        ]
        self._assert_rates(utl.TestCombination.GROUP_BY_VARIANT, stats, expected)

    def test_get_rates_by_task(self):
        stats = [
            self._stat("task1", "v1", "d1", 1, 0),
            self._stat("task1", "v1", "d2", 0, 1),
            self._stat("task2", "v2", "d3", 2, 1),
            self._stat("task2", "v2", "d4", 1, 0),
        ]
        expected = [
            (utl.TestCombination("test1.js", "task1", None, None), 0.5, 2),
            (utl.TestCombination("test1.js", "task2", None, None), 0.25, 4),
        ]
        self._assert_rates(utl.TestCombination.GROUP_BY_TASK, stats, expected)

    def test_get_rates_by_test(self):
        stats = [
            self._stat("task1", "v1", "d1", 1, 0),
            self._stat("task1", "v1", "d2", 0, 1),
            self._stat("task2", "v2", "d3", 2, 1),
            self._stat("task3", "v2", "d4", 1, 0),
        ]
        expected = [
            (utl.TestCombination("test1.js", None, None, None), 1.0 / 3, 6),
        ]
        self._assert_rates(utl.TestCombination.GROUP_BY_TEST, stats, expected)
class TestValidateConfig(unittest.TestCase):
    """
    Tests for the validate_config() function.
    """

    # yapf: disable
    CONFIG = utl.Config(
        test_fail_rates=utl.Rates(acceptable=0, unacceptable=1),
        task_fail_rates=utl.Rates(acceptable=0, unacceptable=1),
        variant_fail_rates=utl.Rates(acceptable=0, unacceptable=1),
        distro_fail_rates=utl.Rates(acceptable=0, unacceptable=1),
        reliable_min_runs=2,
        reliable_time_period=datetime.timedelta(days=1),
        unreliable_min_runs=2,
        unreliable_time_period=datetime.timedelta(days=1))
    # yapf: enable

    def _assert_invalid(self, expected_exception, **overrides):
        """
        Asserts that validate_config() raises 'expected_exception' for CONFIG with 'overrides'
        applied.

        The modified config is built outside of the assertRaises() context so that only an
        exception raised by validate_config() itself can satisfy the assertion. An exception
        raised while building the config (e.g. by _replace() on a misspelled field name)
        propagates and fails the test instead of being mistaken for a validation error.
        """
        config = self.CONFIG._replace(**overrides)
        with self.assertRaises(expected_exception):
            utl.validate_config(config)

    def _assert_invalid_rates(self, expected_exception, rates_field, **rate_overrides):
        """
        Asserts that validate_config() raises 'expected_exception' when the 'rates_field'
        attribute of CONFIG has 'rate_overrides' applied.
        """
        rates = getattr(self.CONFIG, rates_field)._replace(**rate_overrides)
        self._assert_invalid(expected_exception, **{rates_field: rates})

    def _check_rate_bounds(self, rates_field, attribute):
        """
        Checks that a non-numeric rate is rejected with a TypeError and that rates of -1 and 2
        are each rejected with a ValueError.
        """
        cases = [
            (TypeError, "not a number"),
            (ValueError, -1),
            (ValueError, 2),
        ]
        for expected_exception, value in cases:
            self._assert_invalid_rates(expected_exception, rates_field, **{attribute: value})

    def _check_rate_ordering(self, rates_field):
        """
        Checks that an acceptable rate greater than the unacceptable rate is rejected.
        """
        self._assert_invalid_rates(ValueError, rates_field, acceptable=0.9, unacceptable=0.1)

    def _check_min_runs(self, field):
        """
        Checks that a non-numeric, negative, zero or fractional minimum number of runs is
        rejected.
        """
        self._assert_invalid(TypeError, **{field: "not a number"})
        for value in (-1, 0, 1.5):
            self._assert_invalid(ValueError, **{field: value})

    def _check_time_period(self, field):
        """
        Checks that a time period is rejected when it is not a datetime.timedelta, or when it
        is negative, zero, or one day plus one hour.
        """
        self._assert_invalid(TypeError, **{field: "not a datetime.timedelta"})
        invalid_periods = [
            datetime.timedelta(days=-1),
            datetime.timedelta(days=0),
            datetime.timedelta(days=1, hours=1),
        ]
        for period in invalid_periods:
            self._assert_invalid(ValueError, **{field: period})

    def test_acceptable_test_fail_rate(self):
        """
        Tests the validation of the 'test_fail_rates.acceptable' attribute.
        """
        self._check_rate_bounds("test_fail_rates", "acceptable")

    def test_unacceptable_test_fail_rate(self):
        """
        Tests the validation of the 'test_fail_rates.unacceptable' attribute.
        """
        self._check_rate_bounds("test_fail_rates", "unacceptable")

    def test_test_fail_rates(self):
        """
        Tests the validation of the 'test_fail_rates' attribute.
        """
        self._check_rate_ordering("test_fail_rates")

    def test_acceptable_task_fail_rate(self):
        """
        Tests the validation of the 'task_fail_rates.acceptable' attribute.
        """
        self._check_rate_bounds("task_fail_rates", "acceptable")

    def test_unacceptable_task_fail_rate(self):
        """
        Tests the validation of the 'task_fail_rates.unacceptable' attribute.
        """
        self._check_rate_bounds("task_fail_rates", "unacceptable")

    def test_task_fail_rates(self):
        """
        Tests the validation of the 'task_fail_rates' attribute.
        """
        self._check_rate_ordering("task_fail_rates")

    def test_acceptable_variant_fail_rate(self):
        """
        Tests the validation of the 'variant_fail_rates.acceptable' attribute.
        """
        self._check_rate_bounds("variant_fail_rates", "acceptable")

    def test_unacceptable_variant_fail_rate(self):
        """
        Tests the validation of the 'variant_fail_rates.unacceptable' attribute.
        """
        self._check_rate_bounds("variant_fail_rates", "unacceptable")

    def test_variant_fail_rates(self):
        """
        Tests the validation of the 'variant_fail_rates' attribute.
        """
        self._check_rate_ordering("variant_fail_rates")

    def test_acceptable_distro_fail_rate(self):
        """
        Tests the validation of the 'distro_fail_rates.acceptable' attribute.
        """
        self._check_rate_bounds("distro_fail_rates", "acceptable")

    def test_unacceptable_distro_fail_rate(self):
        """
        Tests the validation of the 'distro_fail_rates.unacceptable' attribute.
        """
        self._check_rate_bounds("distro_fail_rates", "unacceptable")

    def test_distro_fail_rates(self):
        """
        Tests the validation of the 'distro_fail_rates' attribute.
        """
        self._check_rate_ordering("distro_fail_rates")

    def test_reliable_min_runs(self):
        """
        Tests the validation of the 'reliable_min_runs' attribute.
        """
        self._check_min_runs("reliable_min_runs")

    def test_reliable_time_period(self):
        """
        Tests the validation of the 'reliable_time_period' attribute.
        """
        self._check_time_period("reliable_time_period")

    def test_unreliable_min_runs(self):
        """
        Tests the validation of the 'unreliable_min_runs' attribute.
        """
        self._check_min_runs("unreliable_min_runs")

    def test_unreliable_time_period(self):
        """
        Tests the validation of the 'unreliable_time_period' attribute.
        """
        self._check_time_period("unreliable_time_period")
class TestUpdateTags(unittest.TestCase):  # pylint: disable=too-many-public-methods
    """
    Tests for the update_tags() function.
    """

    # yapf: disable
    CONFIG = utl.Config(
        test_fail_rates=utl.Rates(acceptable=0, unacceptable=1),
        task_fail_rates=utl.Rates(acceptable=0, unacceptable=1),
        variant_fail_rates=utl.Rates(acceptable=0, unacceptable=1),
        distro_fail_rates=utl.Rates(acceptable=0, unacceptable=1),
        reliable_min_runs=2,
        reliable_time_period=datetime.timedelta(days=1),
        unreliable_min_runs=2,
        unreliable_time_period=datetime.timedelta(days=1))
    # yapf: enable

    STATS = {
        "test": "jstests/core/all.js", "task": "jsCore_WT", "variant": "linux-64",
        "distro": "rhel62", "num_pass": 0, "num_fail": 0
    }

    # Names of the four per-level failure rate attributes of CONFIG.
    _RATE_FIELDS = ("test_fail_rates", "task_fail_rates", "variant_fail_rates",
                    "distro_fail_rates")

    # One "unreliable" tag per level for the default combination produced by _stats().
    _ALL_TAGS = (
        "unreliable",
        "unreliable|jsCore_WT",
        "unreliable|jsCore_WT|linux-64",
        "unreliable|jsCore_WT|linux-64|rhel62",
    )

    @staticmethod
    def _stats(  # pylint: disable=too-many-arguments
            test="jstests/core/all.js", task="jsCore_WT", variant="linux-64", distro="rhel62",
            num_pass=0, num_fail=0):
        """
        Returns one stats entry in the dict layout passed to the add_*_period_stats() methods.
        """
        return {
            "test_file": test,
            "task_name": task,
            "variant": variant,
            "distro": distro,
            "num_pass": num_pass,
            "num_fail": num_fail,
        }

    @classmethod
    def _skewed_stats(cls, failing):
        """
        Returns five stats entries, each recording a single run.

        The default combination gets one run with the majority outcome and one with the opposite
        outcome; a different task, a different variant and a different distro each get one run
        with the majority outcome. The majority outcome is a failure if 'failing' is true and a
        pass otherwise.
        """
        fail = dict(num_pass=0, num_fail=1)
        succeed = dict(num_pass=1, num_fail=0)
        majority, minority = (fail, succeed) if failing else (succeed, fail)
        return [
            cls._stats(**majority),
            cls._stats(task="jsCore", **majority),
            cls._stats(variant="linux-64-debug", **majority),
            cls._stats(**minority),
            cls._stats(distro="rhel55", **majority),
        ]

    @classmethod
    def _config_with_rates(cls, rate_overrides, rate_fields=_RATE_FIELDS, **config_overrides):
        """
        Returns CONFIG with 'rate_overrides' (a dict such as {"unacceptable": 0.1}) applied to
        each failure rate attribute named in 'rate_fields', and with 'config_overrides' applied
        to the config itself.
        """
        replacements = {
            field: getattr(cls.CONFIG, field)._replace(**rate_overrides)
            for field in rate_fields
        }
        replacements.update(config_overrides)
        return cls.CONFIG._replace(**replacements)

    @classmethod
    def _tagged(cls, tags, test="jstests/core/all.js"):
        """
        Returns the js_test tags mapping in which 'test' carries exactly 'tags'.
        """
        return collections.OrderedDict([(test, list(tags))])

    def _make_lifecycle(self, initial_tags):
        """
        Builds a TagsConfig whose js_test selector holds a copy of 'initial_tags', wraps it in a
        TagsConfigWithChangelog, checks the initial state and returns both objects.
        """
        lifecycle = ci_tags.TagsConfig.from_dict(
            dict(selector=dict(js_test=copy.deepcopy(initial_tags))))
        summary_lifecycle = utl.TagsConfigWithChangelog(lifecycle)
        self.assertEqual(initial_tags, self.assert_has_only_js_tests(lifecycle))
        return lifecycle, summary_lifecycle

    def _update_and_get_tags(self, lifecycle, summary_lifecycle, config, *test_histories):
        """
        Validates 'config', runs update_tags() once per test history (in order) and returns the
        resulting js_test tags of 'lifecycle'.
        """
        utl.validate_config(config)
        for test_history in test_histories:
            utl.update_tags(summary_lifecycle, config, test_history)
        return self.assert_has_only_js_tests(lifecycle)

    def assert_has_only_js_tests(self, lifecycle):
        """
        Raises an AssertionError exception if 'lifecycle' is not of the following form:
        selector:
        js_test:
        ...

        Returns the contents of the 'js_test' section.
        """
        self.assertIn("selector", lifecycle.raw)
        self.assertEqual(1, len(lifecycle.raw), msg=str(lifecycle.raw))
        self.assertIn("js_test", lifecycle.raw["selector"])
        self.assertEqual(1, len(lifecycle.raw["selector"]), msg=str(lifecycle.raw))
        return lifecycle.raw["selector"]["js_test"]

    def transition_from_reliable_to_unreliable(self, config, expected_tags):
        """
        Tests that update_tags() tags a formerly reliable combination as being unreliable.
        """
        lifecycle, summary_lifecycle = self._make_lifecycle(collections.OrderedDict())
        test_history = utl.TestHistory("jstests/core/all.js")
        stats = self._skewed_stats(failing=True)
        test_history.add_reliable_period_stats(stats)
        test_history.add_unreliable_period_stats(stats)
        updated_tags = self._update_and_get_tags(lifecycle, summary_lifecycle, config,
                                                 test_history)
        self.assertEqual(updated_tags, expected_tags)

    def test_transition_test_from_reliable_to_unreliable(self):
        """
        Tests that update_tags() tags a formerly reliable (test,) combination as being unreliable.
        """
        config = self._config_with_rates({"unacceptable": 0.1}, rate_fields=["test_fail_rates"])
        self.transition_from_reliable_to_unreliable(config, self._tagged(["unreliable"]))

    def test_transition_task_from_reliable_to_unreliable(self):
        """
        Tests that update_tags() tags a formerly reliable (test, task) combination as being
        unreliable.
        """
        config = self._config_with_rates({"unacceptable": 0.1}, rate_fields=["task_fail_rates"])
        self.transition_from_reliable_to_unreliable(config,
                                                    self._tagged(["unreliable|jsCore_WT"]))

    def test_transition_variant_from_reliable_to_unreliable(self):
        """
        Tests that update_tags() tags a formerly reliable (test, task, variant) combination as being
        unreliable.
        """
        config = self._config_with_rates({"unacceptable": 0.1},
                                         rate_fields=["variant_fail_rates"])
        self.transition_from_reliable_to_unreliable(
            config, self._tagged(["unreliable|jsCore_WT|linux-64"]))

    def test_transition_distro_from_reliable_to_unreliable(self):
        """
        Tests that update_tags() tags a formerly reliable (test, task, variant, distro) combination
        as being unreliable.
        """
        config = self._config_with_rates({"unacceptable": 0.1},
                                         rate_fields=["distro_fail_rates"])
        self.transition_from_reliable_to_unreliable(
            config, self._tagged(["unreliable|jsCore_WT|linux-64|rhel62"]))

    def test_transition_from_reliable_to_unreliable(self):
        """
        Tests that update_tags() tags multiple formerly reliable combination as being unreliable.
        """
        config = self._config_with_rates({"unacceptable": 0.1})
        self.transition_from_reliable_to_unreliable(config, self._tagged(self._ALL_TAGS))

    def transition_from_unreliable_to_reliable(self, config, initial_tags):
        """
        Tests that update_tags() untags a formerly unreliable combination after it has become
        reliable again.
        """
        lifecycle, summary_lifecycle = self._make_lifecycle(initial_tags)
        test_history = utl.TestHistory("jstests/core/all.js")
        stats = self._skewed_stats(failing=False)
        test_history.add_reliable_period_stats(stats)
        test_history.add_unreliable_period_stats(stats)
        updated_tags = self._update_and_get_tags(lifecycle, summary_lifecycle, config,
                                                 test_history)
        self.assertEqual(updated_tags, collections.OrderedDict())

    def test_non_running_in_reliable_period_is_reliable(self):
        """
        Tests that tests that have a failure rate above the unacceptable rate during the unreliable
        period but haven't run during the reliable period are marked as reliable.
        """
        config = self._config_with_rates({"unacceptable": 0.1},
                                         unreliable_time_period=datetime.timedelta(days=2))
        lifecycle, summary_lifecycle = self._make_lifecycle(self._tagged(self._ALL_TAGS))
        test_history = utl.TestHistory("jstests/core/all.js")
        # The test did not run on the reliable period on linux-64.
        reliable_period_stats = [
            self._stats(num_pass=3, num_fail=0, variant="linux-alt", distro="debian7"),
        ]
        unreliable_period_stats = [
            # Failing.
            self._stats(num_pass=0, num_fail=2),
            self._stats(num_pass=3, num_fail=0, variant="linux-alt", distro="debian7"),
        ]
        test_history.add_reliable_period_stats(reliable_period_stats)
        test_history.add_unreliable_period_stats(unreliable_period_stats)
        updated_tags = self._update_and_get_tags(lifecycle, summary_lifecycle, config,
                                                 test_history)
        # The tags for variant and distro have been removed.
        self.assertEqual(updated_tags, self._tagged(["unreliable", "unreliable|jsCore_WT"]))

    def test_non_running_at_all_is_reliable(self):
        """
        Tests that tests that are tagged as unreliable but no longer running (either during the
        reliable or the unreliable period) have their tags removed.
        """
        config = self.CONFIG
        test_history = utl.TestHistory("jstests/core/all.js")
        test_history2 = utl.TestHistory("jstests/core/all2.js")
        initial_tags = self._tagged(self._ALL_TAGS, test="jstests/core/all2.js")
        lifecycle, summary_lifecycle = self._make_lifecycle(initial_tags)
        # all2.js did not run at all
        test_history.add_reliable_period_stats([self._stats()])
        updated_tags = self._update_and_get_tags(lifecycle, summary_lifecycle, config,
                                                 test_history, test_history2)
        # All the tags of all2.js have been removed.
        self.assertEqual(updated_tags, collections.OrderedDict([]))

    def test_transition_test_from_unreliable_to_reliable(self):
        """
        Tests that update_tags() untags a formerly unreliable (test,) combination after it has
        become reliable again.
        """
        config = self._config_with_rates({"acceptable": 0.9}, rate_fields=["test_fail_rates"])
        self.transition_from_unreliable_to_reliable(config, self._tagged(["unreliable"]))

    def test_transition_task_from_unreliable_to_reliable(self):
        """
        Tests that update_tags() untags a formerly unreliable (test, task) combination after it has
        become reliable again.
        """
        config = self._config_with_rates({"acceptable": 0.9}, rate_fields=["task_fail_rates"])
        self.transition_from_unreliable_to_reliable(config,
                                                    self._tagged(["unreliable|jsCore_WT"]))

    def test_transition_variant_from_unreliable_to_reliable(self):
        """
        Tests that update_tags() untags a formerly unreliable (test, task, variant) combination
        after it has become reliable again.
        """
        config = self._config_with_rates({"acceptable": 0.9}, rate_fields=["variant_fail_rates"])
        self.transition_from_unreliable_to_reliable(
            config, self._tagged(["unreliable|jsCore_WT|linux-64"]))

    def test_transition_distro_from_unreliable_to_reliable(self):
        """
        Tests that update_tags() untags a formerly unreliable (test, task, variant, distro)
        combination after it has become reliable again.
        """
        config = self._config_with_rates({"acceptable": 0.9}, rate_fields=["distro_fail_rates"])
        self.transition_from_unreliable_to_reliable(
            config, self._tagged(["unreliable|jsCore_WT|linux-64|rhel62"]))

    def test_transition_from_unreliable_to_reliable(self):
        """
        Tests that update_tags() untags multiple formerly unreliable combination after it has become
        reliable again.
        """
        config = self._config_with_rates({"acceptable": 0.9})
        self.transition_from_unreliable_to_reliable(config, self._tagged(self._ALL_TAGS))

    def test_remain_reliable(self):
        """
        Tests that update_tags() preserves the absence of tags for reliable combinations.
        """
        config = self._config_with_rates({"acceptable": 0.9})
        initial_tags = collections.OrderedDict()
        lifecycle, summary_lifecycle = self._make_lifecycle(initial_tags)
        test_history = utl.TestHistory("jstests/core/all.js")
        # Only the reliable period is populated here.
        test_history.add_reliable_period_stats(self._skewed_stats(failing=False))
        updated_tags = self._update_and_get_tags(lifecycle, summary_lifecycle, config,
                                                 test_history)
        self.assertEqual(updated_tags, initial_tags)

    def test_remain_unreliable(self):
        """
        Tests that update_tags() preserves the tags for unreliable combinations.
        """
        config = self._config_with_rates({"unacceptable": 0.1})
        initial_tags = self._tagged(self._ALL_TAGS)
        lifecycle, summary_lifecycle = self._make_lifecycle(initial_tags)
        test_history = utl.TestHistory("jstests/core/all.js")
        # Only the reliable period is populated here.
        test_history.add_reliable_period_stats(self._skewed_stats(failing=True))
        updated_tags = self._update_and_get_tags(lifecycle, summary_lifecycle, config,
                                                 test_history)
        self.assertEqual(updated_tags, initial_tags)

    def test_obeys_reliable_min_runs(self):
        """
        Tests that update_tags() considers a test reliable if it has fewer than 'reliable_min_runs'.
        """
        config = self._config_with_rates({"acceptable": 0.9}, reliable_min_runs=100)
        self.transition_from_unreliable_to_reliable(config, self._tagged(self._ALL_TAGS))

    def test_obeys_unreliable_min_runs(self):
        """
        Tests that update_tags() only considers a test unreliable if it has more than
        'unreliable_min_runs'.
        """
        config = self._config_with_rates({"unacceptable": 0.1}, unreliable_min_runs=100)
        initial_tags = collections.OrderedDict()
        lifecycle, summary_lifecycle = self._make_lifecycle(initial_tags)
        test_history = utl.TestHistory("jstests/core/all.js")
        stats = self._skewed_stats(failing=True)
        test_history.add_reliable_period_stats(stats)
        test_history.add_unreliable_period_stats(stats)
        updated_tags = self._update_and_get_tags(lifecycle, summary_lifecycle, config,
                                                 test_history)
        self.assertEqual(updated_tags, initial_tags)
class TestCleanUpTags(unittest.TestCase):
    """
    Tests for utl._is_tag_still_relevant() against a mock Evergreen configuration.
    """

    @classmethod
    def setUpClass(cls):
        # variant1 runs task1 and task2 on distro1; variant2 runs task3 on distro2.
        known_tasks = ["task1", "task2", "task3"]
        known_variants = {
            "variant1": {"tasks": ["task1", "task2"], "distros": ["distro1"]},
            "variant2": {"tasks": ["task3"], "distros": ["distro2"]}
        }
        cls.evg = MockEvergreenConfig(known_tasks, known_variants)

    def _assert_relevant(self, *tags):
        """
        Asserts that each of 'tags' is reported as still relevant.
        """
        for tag in tags:
            self.assertTrue(utl._is_tag_still_relevant(self.evg, tag))

    def _assert_not_relevant(self, *tags):
        """
        Asserts that each of 'tags' is reported as no longer relevant.
        """
        for tag in tags:
            self.assertFalse(utl._is_tag_still_relevant(self.evg, tag))

    def test_is_unreliable_tag_relevant(self):
        self._assert_relevant("unreliable")

    def test_is_unknown_task_relevant(self):
        self._assert_not_relevant("unreliable|task_unknown")

    def test_is_known_task_relevant(self):
        self._assert_relevant(
            "unreliable|task1",
            "unreliable|task2",
            "unreliable|task3",
        )

    def test_is_unknown_variant_relevant(self):
        self._assert_not_relevant("unreliable|task1|variant3")

    def test_is_unknown_task_variant_relevant(self):
        # Both the task and the variant exist, but the variant does not run the task.
        self._assert_not_relevant(
            "unreliable|task3|variant1",
            "unreliable|task1|variant2",
        )

    def test_is_known_task_variant_relevant(self):
        self._assert_relevant(
            "unreliable|task1|variant1",
            "unreliable|task2|variant1",
            "unreliable|task3|variant2",
        )

    def test_is_unknown_task_variant_distro_relevant(self):
        # The distro exists, but it belongs to the other variant.
        self._assert_not_relevant(
            "unreliable|task1|variant1|distro2",
            "unreliable|task3|variant2|distro1",
        )

    def test_is_known_task_variant_distro_relevant(self):
        self._assert_relevant(
            "unreliable|task1|variant1|distro1",
            "unreliable|task3|variant2|distro2",
        )
class MockEvergreenConfig(object):
    """Minimal stand-in for an Evergreen configuration: task names plus named variants."""

    def __init__(self, tasks, variants):
        """Store 'tasks' and build one MockVariant per entry of 'variants'.

        'variants' maps a variant name to a dict with "tasks" and "distros" keys.
        """
        self.task_names = tasks
        self.variants = {
            variant_name: MockVariant(spec["tasks"], spec["distros"])
            for variant_name, spec in variants.items()
        }

    def get_variant(self, variant_name):
        """Return the MockVariant stored under 'variant_name', or None if there is none."""
        return self.variants.get(variant_name)
class MockVariant(object):
    """Minimal stand-in for an Evergreen build variant."""

    def __init__(self, task_names, distros):
        """Record the variant's task names and its distro names."""
        self.distro_names = distros
        self.task_names = task_names
class TestJiraIssueCreator(unittest.TestCase):
    """Tests for the description-building helpers of utl.JiraIssueCreator."""

    def test_description(self):
        """Updated tags are rendered as a nested list with rates shown to two decimals."""
        data = {
            "js_test": {
                "testfile1": {"tag1": 0.1, "tag2": 0.2}, "testfile2": {"tag1": 0.1, "tag3": 0.3}
            }
        }
        desc = utl.JiraIssueCreator._make_updated_tags_description(data)
        expected = ("- *js_test*\n"
                    "-- {{testfile1}}\n"
                    "--- {{tag1}} (0.10)\n"
                    "--- {{tag2}} (0.20)\n"
                    "-- {{testfile2}}\n"
                    "--- {{tag1}} (0.10)\n"
                    "--- {{tag3}} (0.30)")
        self.assertEqual(expected, desc)

    def test_description_empty(self):
        """With no updated tags the description is the '_None_' placeholder."""
        data = {}
        desc = utl.JiraIssueCreator._make_updated_tags_description(data)
        expected = "_None_"
        self.assertEqual(expected, desc)

    def test_clean_up_description(self):
        """Cleaned-up tags are listed per file; an empty tag list is rendered as 'ALL'."""
        data = {"js_test": {"testfile1": ["tag1", "tag2"], "testfile2": []}}
        desc = utl.JiraIssueCreator._make_tags_cleaned_up_description(data)
        expected = ("- *js_test*\n"
                    "-- {{testfile1}}\n"
                    "--- {{tag1}}\n"
                    "--- {{tag2}}\n"
                    "-- {{testfile2}}\n"
                    "--- ALL (test file removed or renamed as part of an earlier commit)")
        self.assertEqual(expected, desc)

    def test_clean_up_description_empty(self):
        """With no cleaned-up tags the description is the '_None_' placeholder."""
        data = {}
        desc = utl.JiraIssueCreator._make_tags_cleaned_up_description(data)
        expected = "_None_"
        self.assertEqual(expected, desc)

    def test_truncate_description(self):
        """Descriptions up to the maximum size are kept; longer ones are cut to fit."""
        max_size = utl.JiraIssueCreator._MAX_DESCRIPTION_SIZE

        # One character below the limit: returned unchanged.
        desc = "a" * (max_size - 1)
        self.assertEqual(desc, utl.JiraIssueCreator._truncate_description(desc))

        # Exactly at the limit: still returned unchanged.
        desc += "a"
        self.assertEqual(desc, utl.JiraIssueCreator._truncate_description(desc))

        # One character over the limit: the result must fit within the limit.
        desc += "a"
        self.assertLessEqual(len(utl.JiraIssueCreator._truncate_description(desc)), max_size)
class TestTagsConfigWithChangelog(unittest.TestCase):
    """Tests for the 'added' / 'removed' bookkeeping of utl.TagsConfigWithChangelog."""

    def setUp(self):
        # Every test starts from a changelog wrapped around an empty selector.
        self.summary_lifecycle = utl.TagsConfigWithChangelog(
            ci_tags.TagsConfig({"selector": {}}))

    def test_add_tag(self):
        """Adding a tag records it, with its rate, under 'added'."""
        changelog = self.summary_lifecycle
        changelog.add_tag("js_test", "testfile1", "tag1", 0.1)
        expected_added = {"js_test": {"testfile1": {"tag1": 0.1}}}
        self.assertEqual(expected_added, changelog.added)

    def test_remove_tag(self):
        """Removing a pre-existing tag records it, with its rate, under 'removed'."""
        changelog = self.summary_lifecycle
        # Seed the tag on the underlying lifecycle object rather than through the wrapper.
        changelog.lifecycle.add_tag("js_test", "testfile1", "tag1")
        changelog.remove_tag("js_test", "testfile1", "tag1", 0.1)
        expected_removed = {"js_test": {"testfile1": {"tag1": 0.1}}}
        self.assertEqual(expected_removed, changelog.removed)

    def test_add_remove_tag(self):
        """Adding then removing the same tag leaves both 'added' and 'removed' empty."""
        changelog = self.summary_lifecycle
        changelog.add_tag("js_test", "testfile1", "tag1", 0.1)
        changelog.remove_tag("js_test", "testfile1", "tag1", 0.4)
        self.assertEqual({}, changelog.added)
        self.assertEqual({}, changelog.removed)

    def test_remove_add_tag(self):
        """Removing then re-adding a pre-existing tag leaves both records empty."""
        changelog = self.summary_lifecycle
        # Seed the tag on the underlying lifecycle object rather than through the wrapper.
        changelog.lifecycle.add_tag("js_test", "testfile1", "tag1")
        changelog.remove_tag("js_test", "testfile1", "tag1", 0.1)
        changelog.add_tag("js_test", "testfile1", "tag1", 0.1)
        self.assertEqual({}, changelog.added)
        self.assertEqual({}, changelog.removed)