bugbug/scripts/test_scheduling_history_ret...

# -*- coding: utf-8 -*-

import argparse
import json
import os
import subprocess
import tarfile
from datetime import datetime
from logging import INFO, basicConfig, getLogger

import dateutil.parser
import requests
from dateutil.relativedelta import relativedelta
from tqdm import tqdm

from bugbug import db, repository, test_scheduling
from bugbug.utils import ExpQueue, download_check_etag, zstd_compress

basicConfig(level=INFO)
logger = getLogger(__name__)

JOBS_TO_CONSIDER = ("test-", "build-")


URL = "https://index.taskcluster.net/v1/task/project.relman.bugbug.data_test_scheduling_history.latest/artifacts/public/adr_cache.tar.xz"

TRAINING_MONTHS = 6


class Retriever(object):
    def retrieve_test_scheduling_history(self):
        os.makedirs("data", exist_ok=True)

        # Download previous cache.
        cache_path = os.path.abspath("data/adr_cache")
        if not os.path.exists(cache_path):
            try:
                download_check_etag(URL, "adr_cache.tar.xz")
                with tarfile.open("adr_cache.tar.xz", "r:xz") as tar:
                    tar.extractall()
                assert os.path.exists("data/adr_cache"), "Decompressed adr cache exists"
            except requests.exceptions.HTTPError:
                logger.info("The adr cache is not available yet")

        # Setup adr cache configuration.
        os.makedirs(os.path.expanduser("~/.config/adr"), exist_ok=True)
        with open(os.path.expanduser("~/.config/adr/config.toml"), "w") as f:
            f.write(
                f"""[adr.cache.stores]
file = {{ driver = "file", path = "{cache_path}" }}
"""
            )

        # Get the commits DB.
        if db.is_old_version(repository.COMMITS_DB) or not db.exists(
            repository.COMMITS_DB
        ):
            db.download(repository.COMMITS_DB, force=True)

        # We'll use the past TRAINING_MONTHS months only for training the model,
        # but we use 3 months more than that to calculate the failure statistics.
        subprocess.run(
            [
                "run-adr",
                "ahal/ci-recipes",
                "recipe",
                "-o",
                os.path.abspath("push_data.json"),
                "-f",
                "json",
                "push_data",
                "--",
                "--from",
                f"today-{TRAINING_MONTHS + 3}month",
                "--to",
                "today-2day",
                "--branch",
                "autoland",
            ],
            check=True,
            stdout=subprocess.DEVNULL,  # Redirect to /dev/null, as the logs are too big otherwise.
        )

        HISTORY_DATE_START = datetime.now() - relativedelta(months=TRAINING_MONTHS)

        with open("push_data.json", "r") as f:
            data = json.load(f)

        push_data = {}
        for row in data[1:]:
            # Revision -> (all tasks, possible regressions, likely regressions)
            push_data[row[0]] = (row[1], row[2], row[3])

        HISTORICAL_TIMESPAN = 56

        past_failures = {}

        def get_and_update_past_failures(type_, task, items, push_num, is_regression):
            if type_ not in past_failures:
                past_failures[type_] = {}

            if task not in past_failures[type_]:
                past_failures[type_][task] = {}

            values_total = []
            values_prev_7 = []
            values_prev_14 = []
            values_prev_28 = []
            values_prev_56 = []

            for item in items:
                if item not in past_failures[type_][task]:
                    past_failures[type_][task][item] = ExpQueue(
                        push_num, HISTORICAL_TIMESPAN + 1, 0
                    )

                value = past_failures[type_][task][item][push_num]

                values_total.append(value)
                values_prev_7.append(
                    value - past_failures[type_][task][item][push_num - 7]
                )
                values_prev_14.append(
                    value - past_failures[type_][task][item][push_num - 14]
                )
                values_prev_28.append(
                    value - past_failures[type_][task][item][push_num - 28]
                )
                values_prev_56.append(
                    value - past_failures[type_][task][item][push_num - 56]
                )

                if is_regression:
                    past_failures[type_][task][item][push_num] = value + 1

            return (
                sum(values_total),
                sum(values_prev_7),
                sum(values_prev_14),
                sum(values_prev_28),
                sum(values_prev_56),
            )

        def generate_data():
            commits_with_data = set()
            saved_nodes = set()

            push_num = 0
            for commit_data in tqdm(repository.get_commits()):
                node = commit_data["node"]

                if node not in push_data:
                    continue

                commits_with_data.add(node)

                commit_push_data = push_data[node]

                for task in commit_push_data[0]:
                    if not any(task.startswith(j) for j in JOBS_TO_CONSIDER):
                        continue

                    is_regression = (
                        task in commit_push_data[1] or task in commit_push_data[2]
                    )

                    total_failures, past_7_pushes_failures, past_14_pushes_failures, past_28_pushes_failures, past_56_pushes_failures = get_and_update_past_failures(
                        "all", task, ["all"], push_num, is_regression
                    )

                    total_types_failures, past_7_pushes_types_failures, past_14_pushes_types_failures, past_28_pushes_types_failures, past_56_pushes_types_failures = get_and_update_past_failures(
                        "type", task, commit_data["types"], push_num, is_regression
                    )

                    total_files_failures, past_7_pushes_files_failures, past_14_pushes_files_failures, past_28_pushes_files_failures, past_56_pushes_files_failures = get_and_update_past_failures(
                        "file", task, commit_data["files"], push_num, is_regression
                    )

                    total_directories_failures, past_7_pushes_directories_failures, past_14_pushes_directories_failures, past_28_pushes_directories_failures, past_56_pushes_directories_failures = get_and_update_past_failures(
                        "directory",
                        task,
                        commit_data["directories"],
                        push_num,
                        is_regression,
                    )

                    total_components_failures, past_7_pushes_components_failures, past_14_pushes_components_failures, past_28_pushes_components_failures, past_56_pushes_components_failures = get_and_update_past_failures(
                        "component",
                        task,
                        commit_data["components"],
                        push_num,
                        is_regression,
                    )

                    pushdate = dateutil.parser.parse(commit_data["pushdate"])
                    if pushdate > HISTORY_DATE_START:
                        saved_nodes.add(node)

                        yield {
                            "rev": node,
                            "name": task,
                            "failures": total_failures,
                            "failures_past_7_pushes": past_7_pushes_failures,
                            "failures_past_14_pushes": past_14_pushes_failures,
                            "failures_past_28_pushes": past_28_pushes_failures,
                            "failures_past_56_pushes": past_56_pushes_failures,
                            "failures_in_types": total_types_failures,
                            "failures_past_7_pushes_in_types": past_7_pushes_types_failures,
                            "failures_past_14_pushes_in_types": past_14_pushes_types_failures,
                            "failures_past_28_pushes_in_types": past_28_pushes_types_failures,
                            "failures_past_56_pushes_in_types": past_56_pushes_types_failures,
                            "failures_in_files": total_files_failures,
                            "failures_past_7_pushes_in_files": past_7_pushes_files_failures,
                            "failures_past_14_pushes_in_files": past_14_pushes_files_failures,
                            "failures_past_28_pushes_in_files": past_28_pushes_files_failures,
                            "failures_past_56_pushes_in_files": past_56_pushes_files_failures,
                            "failures_in_directories": total_directories_failures,
                            "failures_past_7_pushes_in_directories": past_7_pushes_directories_failures,
                            "failures_past_14_pushes_in_directories": past_14_pushes_directories_failures,
                            "failures_past_28_pushes_in_directories": past_28_pushes_directories_failures,
                            "failures_past_56_pushes_in_directories": past_56_pushes_directories_failures,
                            "failures_in_components": total_components_failures,
                            "failures_past_7_pushes_in_components": past_7_pushes_components_failures,
                            "failures_past_14_pushes_in_components": past_14_pushes_components_failures,
                            "failures_past_28_pushes_in_components": past_28_pushes_components_failures,
                            "failures_past_56_pushes_in_components": past_56_pushes_components_failures,
                            "is_possible_regression": task in commit_push_data[1],
                            "is_likely_regression": task in commit_push_data[2],
                        }

                push_num += 1

            logger.info(f"push data nodes: {len(push_data)}")

            logger.info(f"commits linked to push data: {len(commits_with_data)}")

            logger.info(f"saved push data nodes: {len(saved_nodes)}")

        db.write(test_scheduling.TEST_SCHEDULING_DB, generate_data())

        zstd_compress(test_scheduling.TEST_SCHEDULING_DB)

        with tarfile.open("data/adr_cache.tar.xz", "w:xz") as tar:
            tar.add("data/adr_cache")


def main():
    description = "Retrieve and extract the test scheduling history from ActiveData"
    parser = argparse.ArgumentParser(description=description)

    # Parse args to show the help if `--help` is passed
    parser.parse_args()

    retriever = Retriever()
    retriever.retrieve_test_scheduling_history()


if __name__ == "__main__":
    main()
Add a task to retrieve test scheduling history 2019-09-11 21:17:02 +03:00			`# -- coding: utf-8 --`

			`import argparse`
Keep using standard json library in the test scheduling history retrieval task The orjson library doesn't support stream reading from a file, so here the standard json library is preferable. 2019-10-18 03:23:53 +03:00			`import json`
Add a task to retrieve test scheduling history 2019-09-11 21:17:02 +03:00			`import os`
			`import subprocess`
			`import tarfile`
Generate a DB of past test runs, with their failure history Also move the artifacts to be in relative directories rather than absolute 2019-09-18 14:10:22 +03:00			`from datetime import datetime`
Add a task to retrieve test scheduling history 2019-09-11 21:17:02 +03:00			`from logging import INFO, basicConfig, getLogger`

Generate a DB of past test runs, with their failure history Also move the artifacts to be in relative directories rather than absolute 2019-09-18 14:10:22 +03:00			`import dateutil.parser`
Add a task to retrieve test scheduling history 2019-09-11 21:17:02 +03:00			`import requests`
Generate a DB of past test runs, with their failure history Also move the artifacts to be in relative directories rather than absolute 2019-09-18 14:10:22 +03:00			`from dateutil.relativedelta import relativedelta`
Show progress while generating test scheduling history data 2019-09-19 02:32:01 +03:00			`from tqdm import tqdm`
Add a task to retrieve test scheduling history 2019-09-11 21:17:02 +03:00
Move TEST_SCHEDULING_DB definition in a module 2019-09-19 12:21:21 +03:00			`from bugbug import db, repository, test_scheduling`
Move exp_queue from repository.py to utils.py (#974) Fixes #971 2019-09-25 16:52:37 +03:00			`from bugbug.utils import ExpQueue, download_check_etag, zstd_compress`
Add a task to retrieve test scheduling history 2019-09-11 21:17:02 +03:00
			`basicConfig(level=INFO)`
			`logger = getLogger(__name__)`

Only consider build-* and test-* tasks 2019-09-24 23:42:44 +03:00			`JOBS_TO_CONSIDER = ("test-", "build-")`
Generate a DB of past test runs, with their failure history Also move the artifacts to be in relative directories rather than absolute 2019-09-18 14:10:22 +03:00
Move TEST_SCHEDULING_DB definition in a module 2019-09-19 12:21:21 +03:00
Add a task to retrieve test scheduling history 2019-09-11 21:17:02 +03:00			`URL = "https://index.taskcluster.net/v1/task/project.relman.bugbug.data_test_scheduling_history.latest/artifacts/public/adr_cache.tar.xz"`

Retrieve past 6 months test scheduling history instead of just 3 2019-09-24 23:32:16 +03:00			`TRAINING_MONTHS = 6`

Add a task to retrieve test scheduling history 2019-09-11 21:17:02 +03:00
			`class Retriever(object):`
			`def retrieve_test_scheduling_history(self):`
Generate a DB of past test runs, with their failure history Also move the artifacts to be in relative directories rather than absolute 2019-09-18 14:10:22 +03:00			`os.makedirs("data", exist_ok=True)`
Add a task to retrieve test scheduling history 2019-09-11 21:17:02 +03:00
			`# Download previous cache.`
Generate a DB of past test runs, with their failure history Also move the artifacts to be in relative directories rather than absolute 2019-09-18 14:10:22 +03:00			`cache_path = os.path.abspath("data/adr_cache")`
Add a task to retrieve test scheduling history 2019-09-11 21:17:02 +03:00			`if not os.path.exists(cache_path):`
			`try:`
Generate a DB of past test runs, with their failure history Also move the artifacts to be in relative directories rather than absolute 2019-09-18 14:10:22 +03:00			`download_check_etag(URL, "adr_cache.tar.xz")`
			`with tarfile.open("adr_cache.tar.xz", "r:xz") as tar:`
			`tar.extractall()`
			`assert os.path.exists("data/adr_cache"), "Decompressed adr cache exists"`
Add a task to retrieve test scheduling history 2019-09-11 21:17:02 +03:00			`except requests.exceptions.HTTPError:`
			`logger.info("The adr cache is not available yet")`

			`# Setup adr cache configuration.`
Create adr configuration directory before writing the configuration file 2019-09-12 13:35:04 +03:00			`os.makedirs(os.path.expanduser("~/.config/adr"), exist_ok=True)`
Add a task to retrieve test scheduling history 2019-09-11 21:17:02 +03:00			`with open(os.path.expanduser("~/.config/adr/config.toml"), "w") as f:`
			`f.write(`
			`f"""[adr.cache.stores]`
			`file = {{ driver = "file", path = "{cache_path}" }}`
Don't write useless whitespaces in adr configuration 2019-10-09 17:01:02 +03:00			`"""`
Add a task to retrieve test scheduling history 2019-09-11 21:17:02 +03:00			`)`

Generate a DB of past test runs, with their failure history Also move the artifacts to be in relative directories rather than absolute 2019-09-18 14:10:22 +03:00			`# Get the commits DB.`
			`if db.is_old_version(repository.COMMITS_DB) or not db.exists(`
			`repository.COMMITS_DB`
			`):`
			`db.download(repository.COMMITS_DB, force=True)`

Retrieve past 6 months test scheduling history instead of just 3 2019-09-24 23:32:16 +03:00			`# We'll use the past TRAINING_MONTHS months only for training the model,`
			`# but we use 3 months more than that to calculate the failure statistics.`
Add a task to retrieve test scheduling history 2019-09-11 21:17:02 +03:00			`subprocess.run(`
			`[`
			`"run-adr",`
			`"ahal/ci-recipes",`
			`"recipe",`
			`"-o",`
Generate a DB of past test runs, with their failure history Also move the artifacts to be in relative directories rather than absolute 2019-09-18 14:10:22 +03:00			`os.path.abspath("push_data.json"),`
Add a task to retrieve test scheduling history 2019-09-11 21:17:02 +03:00			`"-f",`
			`"json",`
			`"push_data",`
			`"--",`
			`"--from",`
Retrieve past 6 months test scheduling history instead of just 3 2019-09-24 23:32:16 +03:00			`f"today-{TRAINING_MONTHS + 3}month",`
Add a task to retrieve test scheduling history 2019-09-11 21:17:02 +03:00			`"--to",`
			`"today-2day",`
			`"--branch",`
			`"autoland",`
			`],`
			`check=True,`
Redirect adr stdout to /dev/null to reduce the size of the logs 2019-09-13 11:09:33 +03:00			`stdout=subprocess.DEVNULL, # Redirect to /dev/null, as the logs are too big otherwise.`
Add a task to retrieve test scheduling history 2019-09-11 21:17:02 +03:00			`)`

Retrieve past 6 months test scheduling history instead of just 3 2019-09-24 23:32:16 +03:00			`HISTORY_DATE_START = datetime.now() - relativedelta(months=TRAINING_MONTHS)`
Generate a DB of past test runs, with their failure history Also move the artifacts to be in relative directories rather than absolute 2019-09-18 14:10:22 +03:00
			`with open("push_data.json", "r") as f:`
Keep using standard json library in the test scheduling history retrieval task The orjson library doesn't support stream reading from a file, so here the standard json library is preferable. 2019-10-18 03:23:53 +03:00			`data = json.load(f)`
Generate a DB of past test runs, with their failure history Also move the artifacts to be in relative directories rather than absolute 2019-09-18 14:10:22 +03:00
			`push_data = {}`
			`for row in data[1:]:`
			`# Revision -> (all tasks, possible regressions, likely regressions)`
			`push_data[row[0]] = (row[1], row[2], row[3])`

			`HISTORICAL_TIMESPAN = 56`

			`past_failures = {}`

Get past task failures with specific files, directories, components, file types 2019-10-09 17:02:58 +03:00			`def get_and_update_past_failures(type_, task, items, push_num, is_regression):`
			`if type_ not in past_failures:`
			`past_failures[type_] = {}`

			`if task not in past_failures[type_]:`
			`past_failures[type_][task] = {}`

			`values_total = []`
			`values_prev_7 = []`
			`values_prev_14 = []`
			`values_prev_28 = []`
			`values_prev_56 = []`

			`for item in items:`
			`if item not in past_failures[type_][task]:`
			`past_failures[type_][task][item] = ExpQueue(`
			`push_num, HISTORICAL_TIMESPAN + 1, 0`
			`)`
Generate a DB of past test runs, with their failure history Also move the artifacts to be in relative directories rather than absolute 2019-09-18 14:10:22 +03:00
Get past task failures with specific files, directories, components, file types 2019-10-09 17:02:58 +03:00			`value = past_failures[type_][task][item][push_num]`

			`values_total.append(value)`
			`values_prev_7.append(`
			`value - past_failures[type_][task][item][push_num - 7]`
			`)`
			`values_prev_14.append(`
			`value - past_failures[type_][task][item][push_num - 14]`
			`)`
			`values_prev_28.append(`
			`value - past_failures[type_][task][item][push_num - 28]`
			`)`
			`values_prev_56.append(`
			`value - past_failures[type_][task][item][push_num - 56]`
			`)`

			`if is_regression:`
			`past_failures[type_][task][item][push_num] = value + 1`

			`return (`
			`sum(values_total),`
			`sum(values_prev_7),`
			`sum(values_prev_14),`
			`sum(values_prev_28),`
			`sum(values_prev_56),`
			`)`
Generate a DB of past test runs, with their failure history Also move the artifacts to be in relative directories rather than absolute 2019-09-18 14:10:22 +03:00
			`def generate_data():`
			`commits_with_data = set()`
			`saved_nodes = set()`

			`push_num = 0`
Show progress while generating test scheduling history data 2019-09-19 02:32:01 +03:00			`for commit_data in tqdm(repository.get_commits()):`
Generate a DB of past test runs, with their failure history Also move the artifacts to be in relative directories rather than absolute 2019-09-18 14:10:22 +03:00			`node = commit_data["node"]`

			`if node not in push_data:`
			`continue`

			`commits_with_data.add(node)`

			`commit_push_data = push_data[node]`

			`for task in commit_push_data[0]:`
Only consider build-* and test-* tasks 2019-09-24 23:42:44 +03:00			`if not any(task.startswith(j) for j in JOBS_TO_CONSIDER):`
Generate a DB of past test runs, with their failure history Also move the artifacts to be in relative directories rather than absolute 2019-09-18 14:10:22 +03:00			`continue`

Get past task failures with specific files, directories, components, file types 2019-10-09 17:02:58 +03:00			`is_regression = (`
			`task in commit_push_data[1] or task in commit_push_data[2]`
			`)`

			`total_failures, past_7_pushes_failures, past_14_pushes_failures, past_28_pushes_failures, past_56_pushes_failures = get_and_update_past_failures(`
			`"all", task, ["all"], push_num, is_regression`
			`)`

			`total_types_failures, past_7_pushes_types_failures, past_14_pushes_types_failures, past_28_pushes_types_failures, past_56_pushes_types_failures = get_and_update_past_failures(`
			`"type", task, commit_data["types"], push_num, is_regression`
Generate a DB of past test runs, with their failure history Also move the artifacts to be in relative directories rather than absolute 2019-09-18 14:10:22 +03:00			`)`
Get past task failures with specific files, directories, components, file types 2019-10-09 17:02:58 +03:00
			`total_files_failures, past_7_pushes_files_failures, past_14_pushes_files_failures, past_28_pushes_files_failures, past_56_pushes_files_failures = get_and_update_past_failures(`
			`"file", task, commit_data["files"], push_num, is_regression`
Generate a DB of past test runs, with their failure history Also move the artifacts to be in relative directories rather than absolute 2019-09-18 14:10:22 +03:00			`)`
Get past task failures with specific files, directories, components, file types 2019-10-09 17:02:58 +03:00
			`total_directories_failures, past_7_pushes_directories_failures, past_14_pushes_directories_failures, past_28_pushes_directories_failures, past_56_pushes_directories_failures = get_and_update_past_failures(`
			`"directory",`
			`task,`
			`commit_data["directories"],`
			`push_num,`
			`is_regression,`
Generate a DB of past test runs, with their failure history Also move the artifacts to be in relative directories rather than absolute 2019-09-18 14:10:22 +03:00			`)`
Get past task failures with specific files, directories, components, file types 2019-10-09 17:02:58 +03:00
			`total_components_failures, past_7_pushes_components_failures, past_14_pushes_components_failures, past_28_pushes_components_failures, past_56_pushes_components_failures = get_and_update_past_failures(`
			`"component",`
			`task,`
			`commit_data["components"],`
			`push_num,`
			`is_regression,`
Generate a DB of past test runs, with their failure history Also move the artifacts to be in relative directories rather than absolute 2019-09-18 14:10:22 +03:00			`)`

			`pushdate = dateutil.parser.parse(commit_data["pushdate"])`
			`if pushdate > HISTORY_DATE_START:`
			`saved_nodes.add(node)`

			`yield {`
			`"rev": node,`
			`"name": task,`
			`"failures": total_failures,`
			`"failures_past_7_pushes": past_7_pushes_failures,`
			`"failures_past_14_pushes": past_14_pushes_failures,`
			`"failures_past_28_pushes": past_28_pushes_failures,`
			`"failures_past_56_pushes": past_56_pushes_failures,`
Get past task failures with specific files, directories, components, file types 2019-10-09 17:02:58 +03:00			`"failures_in_types": total_types_failures,`
			`"failures_past_7_pushes_in_types": past_7_pushes_types_failures,`
			`"failures_past_14_pushes_in_types": past_14_pushes_types_failures,`
			`"failures_past_28_pushes_in_types": past_28_pushes_types_failures,`
			`"failures_past_56_pushes_in_types": past_56_pushes_types_failures,`
			`"failures_in_files": total_files_failures,`
			`"failures_past_7_pushes_in_files": past_7_pushes_files_failures,`
			`"failures_past_14_pushes_in_files": past_14_pushes_files_failures,`
			`"failures_past_28_pushes_in_files": past_28_pushes_files_failures,`
			`"failures_past_56_pushes_in_files": past_56_pushes_files_failures,`
			`"failures_in_directories": total_directories_failures,`
			`"failures_past_7_pushes_in_directories": past_7_pushes_directories_failures,`
			`"failures_past_14_pushes_in_directories": past_14_pushes_directories_failures,`
			`"failures_past_28_pushes_in_directories": past_28_pushes_directories_failures,`
			`"failures_past_56_pushes_in_directories": past_56_pushes_directories_failures,`
			`"failures_in_components": total_components_failures,`
			`"failures_past_7_pushes_in_components": past_7_pushes_components_failures,`
			`"failures_past_14_pushes_in_components": past_14_pushes_components_failures,`
			`"failures_past_28_pushes_in_components": past_28_pushes_components_failures,`
			`"failures_past_56_pushes_in_components": past_56_pushes_components_failures,`
Generate a DB of past test runs, with their failure history Also move the artifacts to be in relative directories rather than absolute 2019-09-18 14:10:22 +03:00			`"is_possible_regression": task in commit_push_data[1],`
			`"is_likely_regression": task in commit_push_data[2],`
			`}`

			`push_num += 1`

			`logger.info(f"push data nodes: {len(push_data)}")`

			`logger.info(f"commits linked to push data: {len(commits_with_data)}")`

			`logger.info(f"saved push data nodes: {len(saved_nodes)}")`

Move TEST_SCHEDULING_DB definition in a module 2019-09-19 12:21:21 +03:00			`db.write(test_scheduling.TEST_SCHEDULING_DB, generate_data())`
Generate a DB of past test runs, with their failure history Also move the artifacts to be in relative directories rather than absolute 2019-09-18 14:10:22 +03:00
Move TEST_SCHEDULING_DB definition in a module 2019-09-19 12:21:21 +03:00			`zstd_compress(test_scheduling.TEST_SCHEDULING_DB)`
Add a task to retrieve test scheduling history 2019-09-11 21:17:02 +03:00
Generate a DB of past test runs, with their failure history Also move the artifacts to be in relative directories rather than absolute 2019-09-18 14:10:22 +03:00			`with tarfile.open("data/adr_cache.tar.xz", "w:xz") as tar:`
			`tar.add("data/adr_cache")`
Add a task to retrieve test scheduling history 2019-09-11 21:17:02 +03:00

			`def main():`
			`description = "Retrieve and extract the test scheduling history from ActiveData"`
			`parser = argparse.ArgumentParser(description=description)`

			# Parse args to show the help if `--help` is passed
			`parser.parse_args()`

			`retriever = Retriever()`
			`retriever.retrieve_test_scheduling_history()`


			`if __name__ == "__main__":`
			`main()`