mongo/buildscripts/tests/test_update_test_lifecycle.py

"""
Tests for buildscripts/update_test_lifecycle.py.
"""

import collections
import copy
import datetime
import unittest

from buildscripts import update_test_lifecycle as utl
from buildscripts.ciconfig import tags as ci_tags

# pylint: disable=invalid-name,missing-docstring,protected-access,too-many-lines


class TestTestCombination(unittest.TestCase):
    """
    Tests for the utl.TestCombination class.
    """

    def test_equal(self):
        """
        Tests that two combinations built from the same arguments compare equal in both
        directions, for every number of leading arguments from four down to one.
        """
        fields = ["test1", "task1", "variant1", "distro1"]
        for count in range(len(fields), 0, -1):
            prefix = fields[:count]
            left = utl.TestCombination(*prefix)
            right = utl.TestCombination(*prefix)
            self.assertTrue(left == right)
            self.assertTrue(right == left)

    def test_properties(self):
        """
        Tests that each constructor argument is exposed through the matching attribute.
        """
        combination = utl.TestCombination("test1", "task1", "variant1", "distro1")
        expected_attributes = (
            ("test", "test1"),
            ("task", "task1"),
            ("variant", "variant1"),
            ("distro", "distro1"),
        )
        for attribute, value in expected_attributes:
            self.assertEqual(value, getattr(combination, attribute))

    def test_equal_group_by(self):
        """
        Tests that 'group_by' reflects the number of arguments the combination was built with.
        """
        fields = ["test1", "task1", "variant1", "distro1"]
        # Entry i is the value expected when i + 1 arguments are supplied.
        expected_group_bys = [
            utl.TestCombination.GROUP_BY_TEST,
            utl.TestCombination.GROUP_BY_TASK,
            utl.TestCombination.GROUP_BY_VARIANT,
            utl.TestCombination.GROUP_BY_DISTRO,
        ]
        for count in range(len(fields), 0, -1):
            prefix = fields[:count]
            left = utl.TestCombination(*prefix)
            right = utl.TestCombination(*prefix)
            self.assertTrue(left == right)
            self.assertTrue(right == left)
            self.assertEqual(expected_group_bys[count - 1], left.group_by)

    def test_tag(self):
        """
        Tests the 'tag' string generated for one to four constructor arguments.
        """
        fields = ["test1", "task1", "variant1", "distro1"]
        # Entry i is the tag expected when i + 1 arguments are supplied.
        expected_tags = [
            "unreliable",
            "unreliable|task1",
            "unreliable|task1|variant1",
            "unreliable|task1|variant1|distro1",
        ]
        for count in range(len(fields), 0, -1):
            combination = utl.TestCombination(*fields[:count])
            self.assertEqual(expected_tags[count - 1], combination.tag)

    def test_from_tag(self):
        """
        Tests that from_tag() turns a tag string back into the corresponding combination.
        """
        test = "testA"
        cases = [
            ("unreliable", (None, None, None)),
            ("unreliable|taskA", ("taskA", None, None)),
            ("unreliable|taskA|variantA", ("taskA", "variantA", None)),
            ("unreliable|taskA|variantA|distroA", ("taskA", "variantA", "distroA")),
        ]
        for tag, (task, variant, distro) in cases:
            parsed = utl.TestCombination.from_tag(test, tag)
            self.assertEqual(parsed, utl.TestCombination(test, task, variant, distro))


class TestTestHistory(unittest.TestCase):
    """
    Tests for the failure rates computed by utl.TestHistory.get_reliable_period_rates().
    """

    TEST_FILE = "test1.js"

    @classmethod
    def _stat(cls, task, variant, distro, num_pass, num_fail):
        """
        Returns one stats entry for TEST_FILE with the given task, variant, distro and counts.
        """
        return {
            "test_file": cls.TEST_FILE, "task_name": task, "variant": variant, "distro": distro,
            "num_pass": num_pass, "num_fail": num_fail
        }

    @classmethod
    def _history(cls, stats):
        """
        Returns a TestHistory for TEST_FILE whose reliable period holds 'stats'.
        """
        history = utl.TestHistory(cls.TEST_FILE)
        history.add_reliable_period_stats(stats)
        return history

    def test_get_rates_by_distro(self):
        """
        Tests the rates obtained when grouping by (test, task, variant, distro).
        """
        history = self._history([
            self._stat("task1", "v", "d1", 1, 0),
            self._stat("task1", "v", "d1", 0, 1),
            self._stat("task1", "v", "d2", 0, 1),
            self._stat("task2", "v", "d2", 1, 0),
        ])

        rates = history.get_reliable_period_rates(group_by=utl.TestCombination.GROUP_BY_DISTRO)

        self.assertListEqual([
            (utl.TestCombination("test1.js", "task1", "v", "d1"), 0.5, 2),
            (utl.TestCombination("test1.js", "task1", "v", "d2"), 1.0, 1),
            (utl.TestCombination("test1.js", "task2", "v", "d2"), 0.0, 1),
        ], rates)

    def test_get_rates_by_variant(self):
        """
        Tests the rates obtained when grouping by (test, task, variant).
        """
        history = self._history([
            self._stat("task1", "v1", "d1", 1, 0),
            self._stat("task1", "v1", "d2", 0, 1),
            self._stat("task1", "v2", "d2", 0, 1),
            self._stat("task2", "v2", "d2", 1, 0),
        ])

        rates = history.get_reliable_period_rates(group_by=utl.TestCombination.GROUP_BY_VARIANT)

        self.assertListEqual([
            (utl.TestCombination("test1.js", "task1", "v1", None), 0.5, 2),
            (utl.TestCombination("test1.js", "task1", "v2", None), 1.0, 1),
            (utl.TestCombination("test1.js", "task2", "v2", None), 0.0, 1),
        ], rates)

    def test_get_rates_by_task(self):
        """
        Tests the rates obtained when grouping by (test, task).
        """
        history = self._history([
            self._stat("task1", "v1", "d1", 1, 0),
            self._stat("task1", "v1", "d2", 0, 1),
            self._stat("task2", "v2", "d3", 2, 1),
            self._stat("task2", "v2", "d4", 1, 0),
        ])

        rates = history.get_reliable_period_rates(group_by=utl.TestCombination.GROUP_BY_TASK)

        self.assertListEqual([
            (utl.TestCombination("test1.js", "task1", None, None), 0.5, 2),
            (utl.TestCombination("test1.js", "task2", None, None), 0.25, 4),
        ], rates)

    def test_get_rates_by_test(self):
        """
        Tests the rates obtained when grouping by (test,) only.
        """
        history = self._history([
            self._stat("task1", "v1", "d1", 1, 0),
            self._stat("task1", "v1", "d2", 0, 1),
            self._stat("task2", "v2", "d3", 2, 1),
            self._stat("task3", "v2", "d4", 1, 0),
        ])

        rates = history.get_reliable_period_rates(group_by=utl.TestCombination.GROUP_BY_TEST)

        self.assertListEqual([
            (utl.TestCombination("test1.js", None, None, None), 1.0 / 3, 6),
        ], rates)


class TestValidateConfig(unittest.TestCase):
    """
    Tests for the validate_config() function.
    """

    # Valid baseline configuration. Every test replaces exactly one attribute (or one
    # Rates tuple) of it with an invalid value.
    # yapf: disable
    CONFIG = utl.Config(
        test_fail_rates=utl.Rates(acceptable=0, unacceptable=1),
        task_fail_rates=utl.Rates(acceptable=0, unacceptable=1),
        variant_fail_rates=utl.Rates(acceptable=0, unacceptable=1),
        distro_fail_rates=utl.Rates(acceptable=0, unacceptable=1),
        reliable_min_runs=2,
        reliable_time_period=datetime.timedelta(days=1),
        unreliable_min_runs=2,
        unreliable_time_period=datetime.timedelta(days=1))
    # yapf: enable

    def _assert_rejected(self, expected_error, **overrides):
        """
        Asserts that validate_config() raises 'expected_error' for a copy of CONFIG in which the
        attributes named by 'overrides' have been replaced.
        """

        # Build the config outside of the assertRaises() block so that only an exception raised
        # by validate_config() itself can satisfy the assertion.
        config = self.CONFIG._replace(**overrides)
        with self.assertRaises(expected_error):
            utl.validate_config(config)

    def _assert_rates_rejected(self, rates_attr, expected_error, **rate_overrides):
        """
        Same as _assert_rejected(), but replaces members of the Rates tuple stored in the CONFIG
        attribute named 'rates_attr'.
        """

        rates = getattr(self.CONFIG, rates_attr)._replace(**rate_overrides)
        self._assert_rejected(expected_error, **{rates_attr: rates})

    def _check_rate_bound(self, rates_attr, bound):
        """
        Checks that the 'bound' member ("acceptable" or "unacceptable") of 'rates_attr' is
        rejected when it is not a number (TypeError) or is -1 or 2 (ValueError).
        """

        self._assert_rates_rejected(rates_attr, TypeError, **{bound: "not a number"})
        self._assert_rates_rejected(rates_attr, ValueError, **{bound: -1})
        self._assert_rates_rejected(rates_attr, ValueError, **{bound: 2})

    def _check_inverted_rates(self, rates_attr):
        """
        Checks that 'rates_attr' is rejected when 'acceptable' is greater than 'unacceptable'.
        """

        self._assert_rates_rejected(rates_attr, ValueError, acceptable=0.9, unacceptable=0.1)

    def _check_min_runs(self, attr):
        """
        Checks that the min-runs attribute 'attr' is rejected when it is not a number (TypeError)
        or is -1, 0 or 1.5 (ValueError).
        """

        self._assert_rejected(TypeError, **{attr: "not a number"})
        for invalid in (-1, 0, 1.5):
            self._assert_rejected(ValueError, **{attr: invalid})

    def _check_time_period(self, attr):
        """
        Checks that the time-period attribute 'attr' is rejected when it is not a
        datetime.timedelta (TypeError) or is -1 day, 0 days or 1 day and 1 hour (ValueError).
        """

        self._assert_rejected(TypeError, **{attr: "not a datetime.timedelta"})
        invalid_periods = (
            datetime.timedelta(days=-1),
            datetime.timedelta(days=0),
            datetime.timedelta(days=1, hours=1),
        )
        for invalid in invalid_periods:
            self._assert_rejected(ValueError, **{attr: invalid})

    def test_acceptable_test_fail_rate(self):
        """
        Tests the validation of the 'test_fail_rates.acceptable' attribute.
        """

        self._check_rate_bound("test_fail_rates", "acceptable")

    def test_unacceptable_test_fail_rate(self):
        """
        Tests the validation of the 'test_fail_rates.unacceptable' attribute.
        """

        self._check_rate_bound("test_fail_rates", "unacceptable")

    def test_test_fail_rates(self):
        """
        Tests the validation of the 'test_fail_rates' attribute.
        """

        self._check_inverted_rates("test_fail_rates")

    def test_acceptable_task_fail_rate(self):
        """
        Tests the validation of the 'task_fail_rates.acceptable' attribute.
        """

        self._check_rate_bound("task_fail_rates", "acceptable")

    def test_unacceptable_task_fail_rate(self):
        """
        Tests the validation of the 'task_fail_rates.unacceptable' attribute.
        """

        self._check_rate_bound("task_fail_rates", "unacceptable")

    def test_task_fail_rates(self):
        """
        Tests the validation of the 'task_fail_rates' attribute.
        """

        self._check_inverted_rates("task_fail_rates")

    def test_acceptable_variant_fail_rate(self):
        """
        Tests the validation of the 'variant_fail_rates.acceptable' attribute.
        """

        self._check_rate_bound("variant_fail_rates", "acceptable")

    def test_unacceptable_variant_fail_rate(self):
        """
        Tests the validation of the 'variant_fail_rates.unacceptable' attribute.
        """

        self._check_rate_bound("variant_fail_rates", "unacceptable")

    def test_variant_fail_rates(self):
        """
        Tests the validation of the 'variant_fail_rates' attribute.
        """

        self._check_inverted_rates("variant_fail_rates")

    def test_acceptable_distro_fail_rate(self):
        """
        Tests the validation of the 'distro_fail_rates.acceptable' attribute.
        """

        self._check_rate_bound("distro_fail_rates", "acceptable")

    def test_unacceptable_distro_fail_rate(self):
        """
        Tests the validation of the 'distro_fail_rates.unacceptable' attribute.
        """

        self._check_rate_bound("distro_fail_rates", "unacceptable")

    def test_distro_fail_rates(self):
        """
        Tests the validation of the 'distro_fail_rates' attribute.
        """

        self._check_inverted_rates("distro_fail_rates")

    def test_reliable_min_runs(self):
        """
        Tests the validation of the 'reliable_min_runs' attribute.
        """

        self._check_min_runs("reliable_min_runs")

    def test_reliable_time_period(self):
        """
        Tests the validation of the 'reliable_time_period' attribute.
        """

        self._check_time_period("reliable_time_period")

    def test_unreliable_min_runs(self):
        """
        Tests the validation of the 'unreliable_min_runs' attribute.
        """

        self._check_min_runs("unreliable_min_runs")

    def test_unreliable_time_period(self):
        """
        Tests the validation of the 'unreliable_time_period' attribute.
        """

        self._check_time_period("unreliable_time_period")


class TestUpdateTags(unittest.TestCase):  # pylint: disable=too-many-public-methods
    """
    Tests for the update_tags() function.
    """
    # Baseline configuration shared by the tests of this class. Individual tests derive their
    # own configuration from it with _replace(), changing only the thresholds they exercise.
    # yapf: disable
    CONFIG = utl.Config(
        test_fail_rates=utl.Rates(acceptable=0, unacceptable=1),
        task_fail_rates=utl.Rates(acceptable=0, unacceptable=1),
        variant_fail_rates=utl.Rates(acceptable=0, unacceptable=1),
        distro_fail_rates=utl.Rates(acceptable=0, unacceptable=1),
        reliable_min_runs=2,
        reliable_time_period=datetime.timedelta(days=1),
        unreliable_min_runs=2,
        unreliable_time_period=datetime.timedelta(days=1))
    # yapf: enable

    # NOTE(review): this template uses the keys "test" and "task", whereas _stats() below
    # produces "test_file" and "task_name". It is not referenced by the tests visible in this
    # part of the file -- confirm whether it is still needed.
    STATS = {
        "test": "jstests/core/all.js", "task": "jsCore_WT", "variant": "linux-64",
        "distro": "rhel62", "num_pass": 0, "num_fail": 0
    }

    @staticmethod
    def _stats(  # pylint: disable=too-many-arguments
            test="jstests/core/all.js", task="jsCore_WT", variant="linux-64", distro="rhel62",
            num_pass=0, num_fail=0):
        return {
            "test_file": test,
            "task_name": task,
            "variant": variant,
            "distro": distro,
            "num_pass": num_pass,
            "num_fail": num_fail,
        }

    def assert_has_only_js_tests(self, lifecycle):
        """
        Raises an AssertionError exception if 'lifecycle' is not of the following form:

            selector:
              js_test:
                ...
        """

        self.assertIn("selector", lifecycle.raw)
        self.assertEqual(1, len(lifecycle.raw), msg=str(lifecycle.raw))
        self.assertIn("js_test", lifecycle.raw["selector"])
        self.assertEqual(1, len(lifecycle.raw["selector"]), msg=str(lifecycle.raw))

        return lifecycle.raw["selector"]["js_test"]

    def transition_from_reliable_to_unreliable(self, config, expected_tags):
        """
        Runs update_tags() with 'config' on a lifecycle that starts without any tag and on a
        history containing four failing entries and one passing entry, then checks that the
        resulting tags are equal to 'expected_tags'.
        """

        no_tags = collections.OrderedDict()
        raw_lifecycle = {"selector": {"js_test": copy.deepcopy(no_tags)}}
        lifecycle = ci_tags.TagsConfig.from_dict(raw_lifecycle)
        summary_lifecycle = utl.TagsConfigWithChangelog(lifecycle)
        self.assertEqual(collections.OrderedDict(), self.assert_has_only_js_tests(lifecycle))

        one_failure = {"num_pass": 0, "num_fail": 1}
        stats = [
            self._stats(**one_failure),
            self._stats(task="jsCore", **one_failure),
            self._stats(variant="linux-64-debug", **one_failure),
            self._stats(num_pass=1, num_fail=0),
            self._stats(distro="rhel55", **one_failure),
        ]
        # The same entries are used for both the reliable and the unreliable period.
        history = utl.TestHistory("jstests/core/all.js")
        history.add_reliable_period_stats(stats)
        history.add_unreliable_period_stats(stats)

        utl.validate_config(config)
        utl.update_tags(summary_lifecycle, config, history)
        self.assertEqual(self.assert_has_only_js_tests(lifecycle), expected_tags)

    def test_transition_test_from_reliable_to_unreliable(self):
        """
        Tests that update_tags() adds the "unreliable" tag for a formerly reliable (test,)
        combination.
        """

        lowered_rates = self.CONFIG.test_fail_rates._replace(unacceptable=0.1)
        config = self.CONFIG._replace(test_fail_rates=lowered_rates)

        expected_tags = collections.OrderedDict()
        expected_tags["jstests/core/all.js"] = ["unreliable"]

        self.transition_from_reliable_to_unreliable(config, expected_tags)

    def test_transition_task_from_reliable_to_unreliable(self):
        """
        Tests that update_tags() adds the task-level tag for a formerly reliable (test, task)
        combination.
        """

        lowered_rates = self.CONFIG.task_fail_rates._replace(unacceptable=0.1)
        config = self.CONFIG._replace(task_fail_rates=lowered_rates)

        expected_tags = collections.OrderedDict()
        expected_tags["jstests/core/all.js"] = ["unreliable|jsCore_WT"]

        self.transition_from_reliable_to_unreliable(config, expected_tags)

    def test_transition_variant_from_reliable_to_unreliable(self):
        """
        Tests that update_tags() adds the variant-level tag for a formerly reliable
        (test, task, variant) combination.
        """

        lowered_rates = self.CONFIG.variant_fail_rates._replace(unacceptable=0.1)
        config = self.CONFIG._replace(variant_fail_rates=lowered_rates)

        expected_tags = collections.OrderedDict()
        expected_tags["jstests/core/all.js"] = ["unreliable|jsCore_WT|linux-64"]

        self.transition_from_reliable_to_unreliable(config, expected_tags)

    def test_transition_distro_from_reliable_to_unreliable(self):
        """
        Tests that update_tags() adds the distro-level tag for a formerly reliable
        (test, task, variant, distro) combination.
        """

        lowered_rates = self.CONFIG.distro_fail_rates._replace(unacceptable=0.1)
        config = self.CONFIG._replace(distro_fail_rates=lowered_rates)

        expected_tags = collections.OrderedDict()
        expected_tags["jstests/core/all.js"] = ["unreliable|jsCore_WT|linux-64|rhel62"]

        self.transition_from_reliable_to_unreliable(config, expected_tags)

    def test_transition_from_reliable_to_unreliable(self):
        """
        Tests that update_tags() tags several formerly reliable combinations as being unreliable
        when the test, task, variant and distro thresholds are all lowered together.
        """

        rate_fields = ("test_fail_rates", "task_fail_rates", "variant_fail_rates",
                       "distro_fail_rates")
        lowered = {}
        for field in rate_fields:
            lowered[field] = getattr(self.CONFIG, field)._replace(unacceptable=0.1)
        config = self.CONFIG._replace(**lowered)

        expected_tags = collections.OrderedDict()
        expected_tags["jstests/core/all.js"] = [
            "unreliable",
            "unreliable|jsCore_WT",
            "unreliable|jsCore_WT|linux-64",
            "unreliable|jsCore_WT|linux-64|rhel62",
        ]

        self.transition_from_reliable_to_unreliable(config, expected_tags)

    def transition_from_unreliable_to_reliable(self, config, initial_tags):
        """
        Runs update_tags() with 'config' on a lifecycle that starts with 'initial_tags' and on a
        history containing four passing entries and one failing entry, then checks that no tag is
        left.
        """

        raw_lifecycle = {"selector": {"js_test": copy.deepcopy(initial_tags)}}
        lifecycle = ci_tags.TagsConfig.from_dict(raw_lifecycle)
        summary_lifecycle = utl.TagsConfigWithChangelog(lifecycle)
        self.assertEqual(initial_tags, self.assert_has_only_js_tests(lifecycle))

        one_success = {"num_pass": 1, "num_fail": 0}
        stats = [
            self._stats(**one_success),
            self._stats(task="jsCore", **one_success),
            self._stats(variant="linux-64-debug", **one_success),
            self._stats(num_pass=0, num_fail=1),
            self._stats(distro="rhel55", **one_success),
        ]
        # The same entries are used for both the reliable and the unreliable period.
        history = utl.TestHistory("jstests/core/all.js")
        history.add_reliable_period_stats(stats)
        history.add_unreliable_period_stats(stats)

        utl.validate_config(config)
        utl.update_tags(summary_lifecycle, config, history)
        self.assertEqual(self.assert_has_only_js_tests(lifecycle), collections.OrderedDict())

    def test_non_running_in_reliable_period_is_reliable(self):
        """
        Tests that update_tags() removes the variant and distro tags of a combination that fails
        during the unreliable period but did not run during the reliable period, while the test
        and task tags are kept.
        """
        overrides = {"unreliable_time_period": datetime.timedelta(days=2)}
        rate_fields = ("test_fail_rates", "task_fail_rates", "variant_fail_rates",
                       "distro_fail_rates")
        for field in rate_fields:
            overrides[field] = getattr(self.CONFIG, field)._replace(unacceptable=0.1)
        config = self.CONFIG._replace(**overrides)

        initial_tags = collections.OrderedDict()
        initial_tags["jstests/core/all.js"] = [
            "unreliable",
            "unreliable|jsCore_WT",
            "unreliable|jsCore_WT|linux-64",
            "unreliable|jsCore_WT|linux-64|rhel62",
        ]

        raw_lifecycle = {"selector": {"js_test": copy.deepcopy(initial_tags)}}
        lifecycle = ci_tags.TagsConfig.from_dict(raw_lifecycle)
        summary_lifecycle = utl.TagsConfigWithChangelog(lifecycle)
        self.assertEqual(initial_tags, self.assert_has_only_js_tests(lifecycle))

        history = utl.TestHistory("jstests/core/all.js")
        # During the reliable period the test only ran on linux-alt, not on linux-64.
        history.add_reliable_period_stats([
            self._stats(num_pass=3, num_fail=0, variant="linux-alt", distro="debian7"),
        ])
        history.add_unreliable_period_stats([
            # Failing on the default linux-64 / rhel62 combination.
            self._stats(num_pass=0, num_fail=2),
            self._stats(num_pass=3, num_fail=0, variant="linux-alt", distro="debian7"),
        ])

        utl.validate_config(config)
        utl.update_tags(summary_lifecycle, config, history)

        # Only the variant and distro tags have been removed.
        remaining_tags = collections.OrderedDict()
        remaining_tags["jstests/core/all.js"] = ["unreliable", "unreliable|jsCore_WT"]
        self.assertEqual(self.assert_has_only_js_tests(lifecycle), remaining_tags)

    def test_non_running_at_all_is_reliable(self):
        """
        Tests that tests that are tagged as unreliable but no longer running (either during the
        reliable or the unreliable period) have their tags removed.
        """
        config = self.CONFIG

        test_history = utl.TestHistory("jstests/core/all.js")
        test_history2 = utl.TestHistory("jstests/core/all2.js")
        initial_tags = collections.OrderedDict([
            ("jstests/core/all2.js", [
                "unreliable",
                "unreliable|jsCore_WT",
                "unreliable|jsCore_WT|linux-64",
                "unreliable|jsCore_WT|linux-64|rhel62",
            ]),
        ])

        lifecycle = ci_tags.TagsConfig.from_dict(
            dict(selector=dict(js_test=copy.deepcopy(initial_tags))))
        summary_lifecycle = utl.TagsConfigWithChangelog(lifecycle)
        self.assertEqual(initial_tags, self.assert_has_only_js_tests(lifecycle))

        # Only all.js gets a stats entry; the history of all2.js is left empty because it did
        # not run at all.
        test_history.add_reliable_period_stats([self._stats()])

        utl.validate_config(config)
        utl.update_tags(summary_lifecycle, config, test_history)
        utl.update_tags(summary_lifecycle, config, test_history2)
        updated_tags = self.assert_has_only_js_tests(lifecycle)
        # All of the tags of all2.js (test, task, variant and distro) have been removed.
        self.assertEqual(updated_tags, collections.OrderedDict([]))

    def test_transition_test_from_unreliable_to_reliable(self):
        """
        Tests that update_tags() removes the "unreliable" tag of a formerly unreliable (test,)
        combination once it is reliable again.
        """

        raised_rates = self.CONFIG.test_fail_rates._replace(acceptable=0.9)
        config = self.CONFIG._replace(test_fail_rates=raised_rates)

        initial_tags = collections.OrderedDict()
        initial_tags["jstests/core/all.js"] = ["unreliable"]

        self.transition_from_unreliable_to_reliable(config, initial_tags)

    def test_transition_task_from_unreliable_to_reliable(self):
        """
        Tests that update_tags() removes the task-level tag of a formerly unreliable (test, task)
        combination once it is reliable again.
        """

        raised_rates = self.CONFIG.task_fail_rates._replace(acceptable=0.9)
        config = self.CONFIG._replace(task_fail_rates=raised_rates)

        initial_tags = collections.OrderedDict()
        initial_tags["jstests/core/all.js"] = ["unreliable|jsCore_WT"]

        self.transition_from_unreliable_to_reliable(config, initial_tags)

    def test_transition_variant_from_unreliable_to_reliable(self):
        """
        Tests that update_tags() removes the variant-level tag of a formerly unreliable
        (test, task, variant) combination once it is reliable again.
        """

        raised_rates = self.CONFIG.variant_fail_rates._replace(acceptable=0.9)
        config = self.CONFIG._replace(variant_fail_rates=raised_rates)

        initial_tags = collections.OrderedDict()
        initial_tags["jstests/core/all.js"] = ["unreliable|jsCore_WT|linux-64"]

        self.transition_from_unreliable_to_reliable(config, initial_tags)

    def test_transition_distro_from_unreliable_to_reliable(self):
        """
        Tests that update_tags() removes the tag of a (test, task, variant, distro) combination
        that was marked as unreliable once that combination is reliable again.
        """

        # Only the distro-level acceptable fail rate is changed from the base configuration.
        relaxed_rates = self.CONFIG.distro_fail_rates._replace(acceptable=0.9)
        config = self.CONFIG._replace(distro_fail_rates=relaxed_rates)

        initial_tags = collections.OrderedDict()
        initial_tags["jstests/core/all.js"] = ["unreliable|jsCore_WT|linux-64|rhel62"]
        self.transition_from_unreliable_to_reliable(config, initial_tags)

    def test_transition_from_unreliable_to_reliable(self):
        """
        Tests that update_tags() removes the tags of multiple formerly unreliable combinations
        once they are reliable again.
        """

        # Raise the acceptable fail rate to 0.9 at every level (test, task, variant, distro).
        overrides = {}
        for level in ("test", "task", "variant", "distro"):
            field = level + "_fail_rates"
            overrides[field] = getattr(self.CONFIG, field)._replace(acceptable=0.9)
        config = self.CONFIG._replace(**overrides)

        tags_at_every_level = [
            "unreliable",
            "unreliable|jsCore_WT",
            "unreliable|jsCore_WT|linux-64",
            "unreliable|jsCore_WT|linux-64|rhel62",
        ]
        initial_tags = collections.OrderedDict([("jstests/core/all.js", tags_at_every_level)])
        self.transition_from_unreliable_to_reliable(config, initial_tags)

    def test_remain_reliable(self):
        """
        Tests that update_tags() leaves combinations without tags untouched when they are
        reliable.
        """

        # Raise the acceptable fail rate to 0.9 at every level (test, task, variant, distro).
        overrides = {}
        for level in ("test", "task", "variant", "distro"):
            field = level + "_fail_rates"
            overrides[field] = getattr(self.CONFIG, field)._replace(acceptable=0.9)
        config = self.CONFIG._replace(**overrides)

        # Start from a lifecycle that has no tagged JS tests at all.
        initial_tags = collections.OrderedDict()
        selector = {"js_test": copy.deepcopy(initial_tags)}
        lifecycle = ci_tags.TagsConfig.from_dict({"selector": selector})
        summary_lifecycle = utl.TagsConfigWithChangelog(lifecycle)
        self.assertEqual(initial_tags, self.assert_has_only_js_tests(lifecycle))

        # Only reliable-period stats are supplied. The entries use the _stats() defaults except
        # where a task, variant or distro is overridden.
        test_history = utl.TestHistory("jstests/core/all.js")
        test_history.add_reliable_period_stats([
            self._stats(num_pass=1, num_fail=0),
            self._stats(num_pass=1, num_fail=0, task="jsCore"),
            self._stats(num_pass=1, num_fail=0, variant="linux-64-debug"),
            self._stats(num_pass=0, num_fail=1),
            self._stats(num_pass=1, num_fail=0, distro="rhel55"),
        ])

        utl.validate_config(config)
        utl.update_tags(summary_lifecycle, config, test_history)

        # The lifecycle must still be empty after the update.
        updated_tags = self.assert_has_only_js_tests(lifecycle)
        self.assertEqual(updated_tags, initial_tags)

    def test_remain_unreliable(self):
        """
        Tests that update_tags() keeps the existing tags of combinations that are unreliable.
        """

        # Lower the unacceptable fail rate to 0.1 at every level (test, task, variant, distro).
        overrides = {}
        for level in ("test", "task", "variant", "distro"):
            field = level + "_fail_rates"
            overrides[field] = getattr(self.CONFIG, field)._replace(unacceptable=0.1)
        config = self.CONFIG._replace(**overrides)

        # The test file starts out tagged at every level.
        tags_at_every_level = [
            "unreliable",
            "unreliable|jsCore_WT",
            "unreliable|jsCore_WT|linux-64",
            "unreliable|jsCore_WT|linux-64|rhel62",
        ]
        initial_tags = collections.OrderedDict([("jstests/core/all.js", tags_at_every_level)])

        selector = {"js_test": copy.deepcopy(initial_tags)}
        lifecycle = ci_tags.TagsConfig.from_dict({"selector": selector})
        summary_lifecycle = utl.TagsConfigWithChangelog(lifecycle)
        self.assertEqual(initial_tags, self.assert_has_only_js_tests(lifecycle))

        # Only reliable-period stats are supplied. The entries use the _stats() defaults except
        # where a task, variant or distro is overridden.
        test_history = utl.TestHistory("jstests/core/all.js")
        test_history.add_reliable_period_stats([
            self._stats(num_pass=0, num_fail=1),
            self._stats(num_pass=0, num_fail=1, task="jsCore"),
            self._stats(num_pass=0, num_fail=1, variant="linux-64-debug"),
            self._stats(num_pass=1, num_fail=0),
            self._stats(num_pass=0, num_fail=1, distro="rhel55"),
        ])

        utl.validate_config(config)
        utl.update_tags(summary_lifecycle, config, test_history)

        # All of the initial tags must still be present after the update.
        updated_tags = self.assert_has_only_js_tests(lifecycle)
        self.assertEqual(updated_tags, initial_tags)

    def test_obeys_reliable_min_runs(self):
        """
        Tests that update_tags() treats a test as reliable when it has fewer runs than
        'reliable_min_runs'.
        """

        # Raise the acceptable fail rate to 0.9 at every level and require 100 runs.
        overrides = {}
        for level in ("test", "task", "variant", "distro"):
            field = level + "_fail_rates"
            overrides[field] = getattr(self.CONFIG, field)._replace(acceptable=0.9)
        config = self.CONFIG._replace(reliable_min_runs=100, **overrides)

        tags_at_every_level = [
            "unreliable",
            "unreliable|jsCore_WT",
            "unreliable|jsCore_WT|linux-64",
            "unreliable|jsCore_WT|linux-64|rhel62",
        ]
        initial_tags = collections.OrderedDict([("jstests/core/all.js", tags_at_every_level)])
        self.transition_from_unreliable_to_reliable(config, initial_tags)

    def test_obeys_unreliable_min_runs(self):
        """
        Tests that update_tags() does not consider a test unreliable unless it has more runs than
        'unreliable_min_runs'.
        """

        # Lower the unacceptable fail rate to 0.1 at every level and require 100 runs.
        overrides = {}
        for level in ("test", "task", "variant", "distro"):
            field = level + "_fail_rates"
            overrides[field] = getattr(self.CONFIG, field)._replace(unacceptable=0.1)
        config = self.CONFIG._replace(unreliable_min_runs=100, **overrides)

        # Start from a lifecycle that has no tagged JS tests at all.
        initial_tags = collections.OrderedDict()
        selector = {"js_test": copy.deepcopy(initial_tags)}
        lifecycle = ci_tags.TagsConfig.from_dict({"selector": selector})
        summary_lifecycle = utl.TagsConfigWithChangelog(lifecycle)
        self.assertEqual(initial_tags, self.assert_has_only_js_tests(lifecycle))

        # The same five entries are recorded for both the reliable and the unreliable period.
        stats = [
            self._stats(num_pass=0, num_fail=1),
            self._stats(num_pass=0, num_fail=1, task="jsCore"),
            self._stats(num_pass=0, num_fail=1, variant="linux-64-debug"),
            self._stats(num_pass=1, num_fail=0),
            self._stats(num_pass=0, num_fail=1, distro="rhel55"),
        ]
        test_history = utl.TestHistory("jstests/core/all.js")
        test_history.add_reliable_period_stats(stats)
        test_history.add_unreliable_period_stats(stats)

        utl.validate_config(config)
        utl.update_tags(summary_lifecycle, config, test_history)

        # No tag may have been added by the update.
        updated_tags = self.assert_has_only_js_tests(lifecycle)
        self.assertEqual(updated_tags, initial_tags)


class TestCleanUpTags(unittest.TestCase):
    """
    Tests for utl._is_tag_still_relevant() using a mocked Evergreen configuration.
    """

    @classmethod
    def setUpClass(cls):
        # variant1 runs task1 and task2 on distro1; variant2 runs task3 on distro2.
        task_names = ["task1", "task2", "task3"]
        variants = {
            "variant1": {"tasks": ["task1", "task2"], "distros": ["distro1"]},
            "variant2": {"tasks": ["task3"], "distros": ["distro2"]},
        }
        cls.evg = MockEvergreenConfig(task_names, variants)

    def _check_relevant(self, *tags):
        """Asserts, in order, that each of 'tags' is reported as still relevant."""
        for tag in tags:
            self.assertTrue(utl._is_tag_still_relevant(self.evg, tag))

    def _check_not_relevant(self, *tags):
        """Asserts, in order, that each of 'tags' is reported as no longer relevant."""
        for tag in tags:
            self.assertFalse(utl._is_tag_still_relevant(self.evg, tag))

    def test_is_unreliable_tag_relevant(self):
        self._check_relevant("unreliable")

    def test_is_unknown_task_relevant(self):
        self._check_not_relevant("unreliable|task_unknown")

    def test_is_known_task_relevant(self):
        self._check_relevant(
            "unreliable|task1",
            "unreliable|task2",
            "unreliable|task3",
        )

    def test_is_unknown_variant_relevant(self):
        self._check_not_relevant("unreliable|task1|variant3")

    def test_is_unknown_task_variant_relevant(self):
        # Both the task and the variant exist, but the variant does not list the task.
        self._check_not_relevant(
            "unreliable|task3|variant1",
            "unreliable|task1|variant2",
        )

    def test_is_known_task_variant_relevant(self):
        self._check_relevant(
            "unreliable|task1|variant1",
            "unreliable|task2|variant1",
            "unreliable|task3|variant2",
        )

    def test_is_unknown_task_variant_distro_relevant(self):
        # The distro exists, but it is not listed for the variant named in the tag.
        self._check_not_relevant(
            "unreliable|task1|variant1|distro2",
            "unreliable|task3|variant2|distro1",
        )

    def test_is_known_task_variant_distro_relevant(self):
        self._check_relevant(
            "unreliable|task1|variant1|distro1",
            "unreliable|task3|variant2|distro2",
        )


class MockEvergreenConfig(object):
    """
    Minimal stand-in for an Evergreen configuration.

    Exposes the 'task_names' it was given, a 'variants' dict mapping each variant name to a
    MockVariant, and get_variant() to look a variant up by name.
    """

    def __init__(self, tasks, variants):
        """
        Stores 'tasks' as the task names and builds one MockVariant per entry of 'variants',
        a dict mapping a variant name to a dict with "tasks" and "distros" keys.
        """
        self.task_names = tasks
        self.variants = {
            variant_name: MockVariant(spec["tasks"], spec["distros"])
            for variant_name, spec in variants.items()
        }

    def get_variant(self, variant_name):
        """Returns the MockVariant registered under 'variant_name', or None if there is none."""
        return self.variants.get(variant_name)


class MockVariant(object):
    """Minimal stand-in for a build variant: holds its task names and its distro names."""

    def __init__(self, task_names, distros):
        """Stores 'task_names' as 'task_names' and 'distros' as 'distro_names'."""
        self.task_names, self.distro_names = task_names, distros


class TestJiraIssueCreator(unittest.TestCase):
    """
    Tests for the description helpers of utl.JiraIssueCreator.
    """

    def test_description(self):
        """
        Tests that the updated tags are rendered as a nested list of test kind, test file and
        tag, with each tag's value formatted with two decimals.
        """
        data = {
            "js_test": {
                "testfile1": {"tag1": 0.1, "tag2": 0.2}, "testfile2": {"tag1": 0.1, "tag3": 0.3}
            }
        }
        desc = utl.JiraIssueCreator._make_updated_tags_description(data)
        expected = ("- *js_test*\n"
                    "-- {{testfile1}}\n"
                    "--- {{tag1}} (0.10)\n"
                    "--- {{tag2}} (0.20)\n"
                    "-- {{testfile2}}\n"
                    "--- {{tag1}} (0.10)\n"
                    "--- {{tag3}} (0.30)")
        self.assertEqual(expected, desc)

    def test_description_empty(self):
        """
        Tests that an empty set of updated tags is rendered as "_None_".
        """
        data = {}
        desc = utl.JiraIssueCreator._make_updated_tags_description(data)
        expected = "_None_"
        self.assertEqual(expected, desc)

    def test_clean_up_description(self):
        """
        Tests that cleaned up tags are rendered as a nested list, and that a test file with an
        empty tag list is reported as having had ALL of its tags removed.
        """
        data = {"js_test": {"testfile1": ["tag1", "tag2"], "testfile2": []}}
        desc = utl.JiraIssueCreator._make_tags_cleaned_up_description(data)
        expected = ("- *js_test*\n"
                    "-- {{testfile1}}\n"
                    "--- {{tag1}}\n"
                    "--- {{tag2}}\n"
                    "-- {{testfile2}}\n"
                    "--- ALL (test file removed or renamed as part of an earlier commit)")
        self.assertEqual(expected, desc)

    def test_clean_up_description_empty(self):
        """
        Tests that an empty set of cleaned up tags is rendered as "_None_".
        """
        data = {}
        desc = utl.JiraIssueCreator._make_tags_cleaned_up_description(data)
        expected = "_None_"
        self.assertEqual(expected, desc)

    def test_truncate_description(self):
        """
        Tests that a description is returned unchanged while its length is at most
        _MAX_DESCRIPTION_SIZE, and is cut down to at most that size once it is longer.
        """
        max_size = utl.JiraIssueCreator._MAX_DESCRIPTION_SIZE

        # One character below the limit: returned as-is.
        desc = "a" * (max_size - 1)
        self.assertEqual(desc, utl.JiraIssueCreator._truncate_description(desc))

        # Exactly at the limit: still returned as-is.
        desc += "a"
        self.assertEqual(desc, utl.JiraIssueCreator._truncate_description(desc))

        # One character above the limit: the result must fit within the limit.
        desc += "a"
        self.assertLessEqual(len(utl.JiraIssueCreator._truncate_description(desc)), max_size)


class TestTagsConfigWithChangelog(unittest.TestCase):
    """
    Tests for the 'added' and 'removed' bookkeeping of utl.TagsConfigWithChangelog.
    """

    def setUp(self):
        # Every test starts from a tags configuration with an empty selector.
        empty_config = ci_tags.TagsConfig({"selector": {}})
        self.summary_lifecycle = utl.TagsConfigWithChangelog(empty_config)

    def _assert_changelog_is_empty(self):
        """Asserts that neither an added nor a removed tag is recorded."""
        self.assertEqual({}, self.summary_lifecycle.added)
        self.assertEqual({}, self.summary_lifecycle.removed)

    def test_add_tag(self):
        """Tests that adding a tag records it, with the 0.1 value passed along, in 'added'."""
        changelog = self.summary_lifecycle
        changelog.add_tag("js_test", "testfile1", "tag1", 0.1)
        expected_added = {"js_test": {"testfile1": {"tag1": 0.1}}}
        self.assertEqual(expected_added, changelog.added)

    def test_remove_tag(self):
        """Tests that removing a pre-existing tag records it in 'removed'."""
        changelog = self.summary_lifecycle
        # The tag is put on the wrapped lifecycle directly, bypassing the changelog.
        changelog.lifecycle.add_tag("js_test", "testfile1", "tag1")
        changelog.remove_tag("js_test", "testfile1", "tag1", 0.1)
        expected_removed = {"js_test": {"testfile1": {"tag1": 0.1}}}
        self.assertEqual(expected_removed, changelog.removed)

    def test_add_remove_tag(self):
        """Tests that adding and then removing the same tag leaves the changelog empty."""
        changelog = self.summary_lifecycle
        changelog.add_tag("js_test", "testfile1", "tag1", 0.1)
        changelog.remove_tag("js_test", "testfile1", "tag1", 0.4)
        self._assert_changelog_is_empty()

    def test_remove_add_tag(self):
        """Tests that removing and then re-adding a pre-existing tag leaves the changelog empty."""
        changelog = self.summary_lifecycle
        # The tag is put on the wrapped lifecycle directly, bypassing the changelog.
        changelog.lifecycle.add_tag("js_test", "testfile1", "tag1")
        changelog.remove_tag("js_test", "testfile1", "tag1", 0.1)
        changelog.add_tag("js_test", "testfile1", "tag1", 0.1)
        self._assert_changelog_is_empty()