Refactor run_test.py (#6816)

Over the last few months run_test.py got more and more complex. This
refactors the code in `run_test.py` to be better understandable. Mostly
this splits up separate pieces of logic into separate functions.
push-down-window-functs
Jelte Fennema 2023-04-05 11:11:30 +02:00 committed by GitHub
parent d4f9de7875
commit e5e5eb35c7
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23
3 changed files with 277 additions and 247 deletions

View File

@ -35,3 +35,6 @@ norecursedirs = [
'data', 'data',
'__pycache__', '__pycache__',
] ]
# Don't find files with test at the end such as run_test.py
python_files = ['test_*.py']

View File

@ -2,6 +2,7 @@ import asyncio
import atexit import atexit
import concurrent.futures import concurrent.futures
import os import os
import pathlib
import platform import platform
import random import random
import re import re
@ -43,6 +44,8 @@ BSD = MACOS or FREEBSD or OPENBSD
TIMEOUT_DEFAULT = timedelta(seconds=int(os.getenv("PG_TEST_TIMEOUT_DEFAULT", "10"))) TIMEOUT_DEFAULT = timedelta(seconds=int(os.getenv("PG_TEST_TIMEOUT_DEFAULT", "10")))
FORCE_PORTS = os.getenv("PG_FORCE_PORTS", "NO").lower() not in ("no", "0", "n", "") FORCE_PORTS = os.getenv("PG_FORCE_PORTS", "NO").lower() not in ("no", "0", "n", "")
REGRESS_DIR = pathlib.Path(os.path.realpath(__file__)).parent.parent
def initialize_temp_dir(temp_dir): def initialize_temp_dir(temp_dir):
if os.path.exists(temp_dir): if os.path.exists(temp_dir):

View File

@ -9,68 +9,30 @@ import re
import shutil import shutil
import sys import sys
from collections import OrderedDict from collections import OrderedDict
from contextlib import contextmanager
from typing import Optional from typing import Optional
import common import common
from common import REGRESS_DIR, capture, run
from config import ARBITRARY_SCHEDULE_NAMES, MASTER_VERSION, CitusDefaultClusterConfig from config import ARBITRARY_SCHEDULE_NAMES, MASTER_VERSION, CitusDefaultClusterConfig
def main():
    """Entry point: decide which kind of test was requested and run it."""
    args = parse_arguments()
    test_name = get_test_name(args)

    # All python tests start with test_ and all other tests don't. This is by
    # convention.
    if test_name.startswith("test_"):
        # run_python_test never returns: it replaces this process with pytest.
        run_python_test(test_name, args)
    else:
        run_regress_test(test_name, args)
def run_python_test(test_file_name, repeat): def parse_arguments():
"""Runs the test using pytest
This function never returns as it uses os.execlp to replace the current
process with a new pytest process.
"""
test_path = regress_dir / "citus_tests" / "test" / f"{test_file_name}.py"
if not test_path.exists():
raise Exception("Test could not be found in any schedule")
os.execlp(
"pytest",
"pytest",
"--numprocesses",
"auto",
"--count",
str(repeat),
str(test_path),
)
def run_schedule_with_python(schedule):
bindir = common.capture("pg_config --bindir").rstrip()
pgxs_path = pathlib.Path(common.capture("pg_config --pgxs").rstrip())
os.chdir(regress_dir)
os.environ["PATH"] = str(regress_dir / "bin") + os.pathsep + os.environ["PATH"]
os.environ["PG_REGRESS_DIFF_OPTS"] = "-dU10 -w"
os.environ["CITUS_OLD_VERSION"] = f"v{MASTER_VERSION}.0"
args = {
"--pgxsdir": str(pgxs_path.parent.parent.parent),
"--bindir": bindir,
}
config = CitusDefaultClusterConfig(args)
common.initialize_temp_dir(config.temp_dir)
common.initialize_citus_cluster(
config.bindir, config.datadir, config.settings, config
)
common.run_pg_regress(
config.bindir, config.pg_srcdir, config.coordinator_port(), schedule
)
if __name__ == "__main__":
args = argparse.ArgumentParser() args = argparse.ArgumentParser()
args.add_argument( args.add_argument(
"test_name", help="Test name (must be included in a schedule.)", nargs="?" "test_name", help="Test name (must be included in a schedule.)", nargs="?"
@ -106,208 +68,125 @@ if __name__ == "__main__":
action="store_true", action="store_true",
) )
args = vars(args.parse_args()) return vars(args.parse_args())
regress_dir = pathlib.Path(
os.path.dirname(os.path.dirname(os.path.realpath(__file__)))
)
test_file_path = args["path"]
test_file_name = args["test_name"]
use_base_schedule = args["use_base_schedule"]
use_whole_schedule_line = args["use_whole_schedule_line"]
class TestDeps:
    """What a regress test needs before it can run: a base schedule, other
    tests that must run first, whether it may be repeated, and how many
    workers the cluster needs."""

    schedule: Optional[str]
    direct_extra_tests: list[str]

    def __init__(self, schedule, extra_tests=None, repeatable=True, worker_count=2):
        self.schedule = schedule
        self.direct_extra_tests = extra_tests or []
        self.repeatable = repeatable
        self.worker_count = worker_count

    def extra_tests(self):
        """Return the transitive dependency tests, deduplicated, with each
        indirect dependency ordered before the test that needs it."""
        ordered = OrderedDict()
        for dep in self.direct_extra_tests:
            if dep in DEPS:
                for transitive in DEPS[dep].extra_tests():
                    ordered[transitive] = True
            ordered[dep] = True
        return list(ordered)
deps = {
"multi_cluster_management": TestDeps(
None, ["multi_test_helpers_superuser"], repeatable=False
),
"create_role_propagation": TestDeps(None, ["multi_cluster_management"]),
"single_node_enterprise": TestDeps(None),
"single_node": TestDeps(None),
"single_node_truncate": TestDeps(None),
"multi_extension": TestDeps(None, repeatable=False),
"multi_test_helpers": TestDeps(None),
"multi_insert_select": TestDeps("base_schedule"),
"multi_mx_create_table": TestDeps(
None,
[
"multi_test_helpers_superuser",
"multi_mx_node_metadata",
"multi_cluster_management",
"multi_mx_function_table_reference",
],
),
"background_rebalance_parallel": TestDeps(
None,
[
"multi_test_helpers",
"multi_cluster_management",
],
worker_count=6,
),
"multi_mx_modifying_xacts": TestDeps(None, ["multi_mx_create_table"]),
"multi_mx_router_planner": TestDeps(None, ["multi_mx_create_table"]),
"multi_mx_copy_data": TestDeps(None, ["multi_mx_create_table"]),
"multi_mx_schema_support": TestDeps(None, ["multi_mx_copy_data"]),
"multi_simple_queries": TestDeps("base_schedule"),
}
# Extra requirements for specific tests. Any test not listed here gets the
# TestDeps defaults (computed in test_dependencies below).
DEPS = {
    "multi_cluster_management": TestDeps(
        None, ["multi_test_helpers_superuser"], repeatable=False
    ),
    "create_role_propagation": TestDeps(None, ["multi_cluster_management"]),
    "single_node_enterprise": TestDeps(None),
    "single_node": TestDeps(None),
    "single_node_truncate": TestDeps(None),
    "multi_extension": TestDeps(None, repeatable=False),
    "multi_test_helpers": TestDeps(None),
    "multi_insert_select": TestDeps("base_schedule"),
    "multi_mx_create_table": TestDeps(
        None,
        [
            "multi_test_helpers_superuser",
            "multi_mx_node_metadata",
            "multi_cluster_management",
            "multi_mx_function_table_reference",
        ],
    ),
    "background_rebalance_parallel": TestDeps(
        None,
        [
            "multi_test_helpers",
            "multi_cluster_management",
        ],
        worker_count=6,
    ),
    "multi_mx_modifying_xacts": TestDeps(None, ["multi_mx_create_table"]),
    "multi_mx_router_planner": TestDeps(None, ["multi_mx_create_table"]),
    "multi_mx_copy_data": TestDeps(None, ["multi_mx_create_table"]),
    "multi_mx_schema_support": TestDeps(None, ["multi_mx_copy_data"]),
    "multi_simple_queries": TestDeps("base_schedule"),
}
if test_file_path:
test_file_path = os.path.join(os.getcwd(), args["path"])
def run_python_test(test_name, args):
    """Run a pytest-based test.

    Never returns: os.execlp replaces the current process with pytest.
    """
    test_path = REGRESS_DIR / "citus_tests" / "test" / f"{test_name}.py"
    if not test_path.exists():
        raise Exception("Test could not be found in any schedule")

    pytest_argv = [
        "pytest",
        "--numprocesses",
        "auto",
        "--count",
        str(args["repeat"]),
        str(test_path),
    ]
    os.execlp("pytest", *pytest_argv)
if "upgrade" in test_schedule_line: def run_regress_test(test_name, args):
try: original_schedule, schedule_line = find_test_schedule_and_line(test_name, args)
run_schedule_with_python(pathlib.Path(tmp_schedule_path).stem)
finally: dependencies = test_dependencies(test_name, original_schedule, schedule_line, args)
# remove temp schedule file
os.remove(tmp_schedule_path) with tmp_schedule(test_name, dependencies, schedule_line, args) as schedule:
sys.exit(0) if "upgrade" in original_schedule:
run_schedule_with_python(schedule)
else:
run_schedule_with_multiregress(test_name, schedule, dependencies, args)
def run_schedule_with_python(schedule):
    """Run *schedule* on a Citus cluster that is set up and driven from Python.

    Sets up the environment the common helpers expect, creates a default
    cluster, and runs pg_regress against it via common.run_pg_regress.
    Side effects: changes the working directory and mutates os.environ.
    """
    # Locate the postgres binaries and the extension build (PGXS) directory.
    bindir = capture("pg_config --bindir").rstrip()
    pgxs_path = pathlib.Path(capture("pg_config --pgxs").rstrip())

    os.chdir(REGRESS_DIR)
    # Put the regress helper binaries first on PATH.
    os.environ["PATH"] = str(REGRESS_DIR / "bin") + os.pathsep + os.environ["PATH"]
    os.environ["PG_REGRESS_DIFF_OPTS"] = "-dU10 -w"
    # NOTE(review): presumably consumed by upgrade schedules — confirm.
    os.environ["CITUS_OLD_VERSION"] = f"v{MASTER_VERSION}.0"

    args = {
        "--pgxsdir": str(pgxs_path.parent.parent.parent),
        "--bindir": bindir,
    }

    config = CitusDefaultClusterConfig(args)
    common.initialize_temp_dir(config.temp_dir)
    common.initialize_citus_cluster(
        config.bindir, config.datadir, config.settings, config
    )
    common.run_pg_regress(
        config.bindir, config.pg_srcdir, config.coordinator_port(), schedule
    )
def run_schedule_with_multiregress(test_name, schedule, dependencies, args):
worker_count = needed_worker_count(test_name, dependencies)
# find suitable make recipe # find suitable make recipe
if dependencies.schedule == "base_isolation_schedule": if dependencies.schedule == "base_isolation_schedule":
@ -322,15 +201,160 @@ if __name__ == "__main__":
# prepare command to run tests # prepare command to run tests
test_command = ( test_command = (
f"make -C {regress_dir} {make_recipe} " f"make -C {REGRESS_DIR} {make_recipe} "
f"WORKERCOUNT={test_worker_count} " f"WORKERCOUNT={worker_count} "
f"SCHEDULE='{pathlib.Path(tmp_schedule_path).stem}'" f"SCHEDULE='{schedule}'"
)
run(test_command)
def default_base_schedule(test_schedule, args):
    """Map a schedule name to the base schedule the test should run on top of.

    Checks are ordered: the first matching substring wins (in particular
    "after_citus_upgrade" must be checked before "citus_upgrade").
    Exits the process for schedule kinds that this runner does not support.
    Returns None when no base schedule is needed.
    """
    plain_substring_bases = (
        ("isolation", "base_isolation_schedule"),
        ("failure", "failure_base_schedule"),
        ("enterprise", "enterprise_minimal_schedule"),
        ("split", "minimal_schedule"),
    )
    for needle, base in plain_substring_bases:
        if needle in test_schedule:
            return base

    if "mx" in test_schedule:
        return "mx_base_schedule" if args["use_base_schedule"] else "mx_minimal_schedule"

    if "operations" in test_schedule:
        return "minimal_schedule"

    if "after_citus_upgrade" in test_schedule:
        print(
            f"WARNING: After citus upgrade schedule ({test_schedule}) is not supported."
        )
        sys.exit(0)

    if "citus_upgrade" in test_schedule:
        return None

    if "pg_upgrade" in test_schedule:
        return "minimal_schedule"

    if test_schedule in ARBITRARY_SCHEDULE_NAMES:
        print(f"WARNING: Arbitrary config schedule ({test_schedule}) is not supported.")
        sys.exit(0)

    return "base_schedule" if args["use_base_schedule"] else "minimal_schedule"
# we run the tests with 2 workers by default.
# If we find any dependency which requires more workers, we update the worker count.
def worker_count_for(test_name):
    """Return the worker count required by *test_name* (default 2)."""
    try:
        return DEPS[test_name].worker_count
    except KeyError:
        return 2
def get_test_name(args):
    """Resolve the test name from the parsed CLI arguments.

    Takes an explicit test_name if given; otherwise derives the name from
    the given file path after validating that it exists and has a test
    extension. Exits the process on bad input.
    """
    if args["test_name"]:
        return args["test_name"]

    if not args["path"]:
        print("FATAL: No test given.")
        sys.exit(2)

    full_path = os.path.join(os.getcwd(), args["path"])
    if not os.path.isfile(full_path):
        print(f"ERROR: test file '{full_path}' does not exist")
        sys.exit(2)

    if pathlib.Path(full_path).suffix not in (".spec", ".sql", ".py"):
        print(
            "ERROR: Unrecognized test extension. Valid extensions are: .sql, .spec, and .py"
        )
        sys.exit(1)

    return pathlib.Path(full_path).stem
def find_test_schedule_and_line(test_name, args):
    """Find the schedule that contains *test_name*.

    Returns a (schedule name, schedule line) tuple, where the schedule line
    is either the full matching line (--use-whole-schedule-line) or a fresh
    "test: <name>" line. Raises if no schedule mentions the test.
    """
    for schedule_file_path in sorted(REGRESS_DIR.glob("*_schedule")):
        # BUGFIX: open the schedule file in a `with` block; the original left
        # one file handle open per schedule file scanned.
        with open(schedule_file_path, "r") as schedule_file:
            for schedule_line in schedule_file:
                if re.search(r"\b" + test_name + r"\b", schedule_line):
                    test_schedule = pathlib.Path(schedule_file_path).stem
                    if args["use_whole_schedule_line"]:
                        return test_schedule, schedule_line
                    return test_schedule, f"test: {test_name}\n"
    raise Exception("Test could not be found in any schedule")
def test_dependencies(test_name, test_schedule, schedule_line, args):
    """Return the TestDeps describing what must run before *test_name*."""
    if test_name in DEPS:
        return DEPS[test_name]

    base = default_base_schedule(test_schedule, args)

    if schedule_line_is_upgrade_after(schedule_line):
        # upgrade_xxx_after tests always depend on upgrade_xxx_before
        return TestDeps(base, [test_name.replace("_after", "_before")])

    # before_ tests leave stuff around on purpose for the after tests. So they
    # are not repeatable by definition.
    return TestDeps(base, repeatable="before_" not in test_schedule)
def schedule_line_is_upgrade_after(test_schedule_line: str) -> bool:
    """Return True for schedule lines of the form "test: upgrade_..._after ..."."""
    if not test_schedule_line.startswith("test: upgrade_"):
        return False
    return "_after" in test_schedule_line
# run test command n times
@contextmanager
def tmp_schedule(test_name, dependencies, schedule_line, args):
    """Yield the name of a temporary schedule file tailored to this test run.

    The file starts from the dependency base schedule (if any), then lists
    the extra dependency tests, then the requested test line (possibly
    repeated). The file is removed again when the context exits.
    """
    tmp_schedule_path = REGRESS_DIR / f"tmp_schedule_{random.randint(1, 10000)}"

    # Prefill the temporary schedule with the base schedule that this test
    # depends on. Some tests don't need a base schedule to run though,
    # e.g tests that are in the first place in their own schedule
    if dependencies.schedule:
        shutil.copy2(REGRESS_DIR / dependencies.schedule, tmp_schedule_path)

    with open(tmp_schedule_path, "a") as schedule_file:
        # Add any specific dependencies
        for dependency in dependencies.extra_tests():
            schedule_file.write(f"test: {dependency}\n")

        repetition_cnt = args["repeat"]
        if repetition_cnt > 1 and not dependencies.repeatable:
            repetition_cnt = 1
            print(f"WARNING: Cannot repeatably run this test: '{test_name}'")
        for _ in range(repetition_cnt):
            schedule_file.write(schedule_line)

    try:
        yield tmp_schedule_path.stem
    finally:
        os.remove(tmp_schedule_path)
def needed_worker_count(test_name, dependencies):
    """Return the worker count needed by *test_name* and all its extra tests.

    Takes the maximum of the test's own requirement and the requirement of
    every dependency test that will be added to the schedule.
    """
    worker_count = worker_count_for(test_name)
    for dependency in dependencies.extra_tests():
        worker_count = max(worker_count_for(dependency), worker_count)
    # BUGFIX: the shown version fell off the end and returned None, which
    # would be interpolated into the make WORKERCOUNT variable by the caller.
    return worker_count
if __name__ == "__main__":
main()