From 3ffcfe2c4b19ecee4559891755153cb0b819ba34 Mon Sep 17 00:00:00 2001
From: imcdo <ian_mcdonald@rocketmail.com>
Date: Fri, 27 Sep 2024 09:28:08 -0700
Subject: [PATCH] =?UTF-8?q?=E2=80=9Cother=E2=80=9D?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

---
 ducktape/cluster/cluster_node.py |  18 ++
 ducktape/cluster/consts.py       |  19 ++
 ducktape/cluster/node_spec.py    |  38 ++++
 ducktape/mark/consts.py          |   2 +
 ducktape/tests/test_context.py   | 307 +++++++++++++++++++++++++++++++
 5 files changed, 384 insertions(+)
 create mode 100644 ducktape/cluster/cluster_node.py
 create mode 100644 ducktape/cluster/consts.py
 create mode 100644 ducktape/cluster/node_spec.py
 create mode 100644 ducktape/mark/consts.py
 create mode 100644 ducktape/tests/test_context.py

diff --git a/ducktape/cluster/cluster_node.py b/ducktape/cluster/cluster_node.py
new file mode 100644
index 000000000..f120e4a52
--- /dev/null
+++ b/ducktape/cluster/cluster_node.py
@@ -0,0 +1,18 @@
+from typing import Optional
+
+from ducktape.cluster.remoteaccount import RemoteAccount
+
+
+class ClusterNode(object):
+    def __init__(self, account: RemoteAccount, **kwargs):
+        self.account = account
+        for k, v in kwargs.items():
+            setattr(self, k, v)
+
+    @property
+    def name(self) -> Optional[str]:
+        return self.account.hostname
+
+    @property
+    def operating_system(self) -> Optional[str]:
+        return self.account.operating_system
diff --git a/ducktape/cluster/consts.py b/ducktape/cluster/consts.py
new file mode 100644
index 000000000..b5a6395c1
--- /dev/null
+++ b/ducktape/cluster/consts.py
@@ -0,0 +1,19 @@
+# Copyright 2017 Confluent Inc.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+LINUX = "linux"
+
+WINDOWS = "windows"
+
+SUPPORTED_OS_TYPES = [LINUX, WINDOWS]
diff --git a/ducktape/cluster/node_spec.py b/ducktape/cluster/node_spec.py
new file mode 100644
index 000000000..1f0204ca8
--- /dev/null
+++ b/ducktape/cluster/node_spec.py
@@ -0,0 +1,38 @@
+# Copyright 2017 Confluent Inc.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+from __future__ import absolute_import
+
+import json
+
+from .consts import LINUX, SUPPORTED_OS_TYPES
+
+
+class NodeSpec(object):
+    """
+    The specification for a ducktape cluster node.
+
+    :param operating_system:    The operating system of the node.
+    """
+
+    def __init__(self, operating_system=LINUX):
+        self.operating_system = operating_system
+        if self.operating_system not in SUPPORTED_OS_TYPES:
+            raise RuntimeError("Unsupported os type %s" % self.operating_system)
+
+    def __str__(self):
+        dict = {
+            "os": self.operating_system,
+        }
+        return json.dumps(dict, sort_keys=True)
diff --git a/ducktape/mark/consts.py b/ducktape/mark/consts.py
new file mode 100644
index 000000000..7e64059e0
--- /dev/null
+++ b/ducktape/mark/consts.py
@@ -0,0 +1,2 @@
+CLUSTER_SPEC_KEYWORD = "cluster_spec"
+CLUSTER_SIZE_KEYWORD = "num_nodes"
diff --git a/ducktape/tests/test_context.py b/ducktape/tests/test_context.py
new file mode 100644
index 000000000..2adabfc69
--- /dev/null
+++ b/ducktape/tests/test_context.py
@@ -0,0 +1,307 @@
+# Copyright 2015 Confluent Inc.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+import copy
+import logging
+import os
+import re
+import shutil
+import sys
+import tempfile
+from typing import TYPE_CHECKING, Dict, Optional, Tuple
+
+from ducktape.cluster.cluster_spec import ClusterSpec
+from ducktape.command_line.defaults import ConsoleDefaults
+from ducktape.mark.consts import CLUSTER_SIZE_KEYWORD, CLUSTER_SPEC_KEYWORD
+from ducktape.services.service_registry import ServiceRegistry
+from ducktape.tests.loggermaker import LoggerMaker, close_logger
+from ducktape.tests.session import SessionContext
+from ducktape.utils.local_filesystem_utils import mkdir_p
+
+if TYPE_CHECKING:
+    from ducktape.services.service import Service
+
+
+def _escape_pathname(s):
+    """Remove fishy characters, replace most with dots"""
+    # Remove all whitespace completely
+    s = re.sub(r"\s+", "", s)
+
+    # Replace bad characters with dots
+    blacklist = r"[^\.\-=_\w\d]+"
+    s = re.sub(blacklist, ".", s)
+
+    # Multiple dots -> single dot (and no leading or trailing dot)
+    s = re.sub(r"[\.]+", ".", s)
+    return re.sub(r"^\.|\.$", "", s)
+
+
+class TestLoggerMaker(LoggerMaker):
+    def __init__(self, logger_name, log_dir, debug):
+        super(TestLoggerMaker, self).__init__(logger_name)
+        self.log_dir = log_dir
+        self.debug = debug
+
+    def configure_logger(self):
+        """Set up the logger to log to stdout and files.
+        This creates a directory and a few files as a side-effect.
+        """
+        if self.configured:
+            return
+
+        self._logger.setLevel(logging.DEBUG)
+        mkdir_p(self.log_dir)
+
+        # Create info and debug level handlers to pipe to log files
+        info_fh = logging.FileHandler(os.path.join(self.log_dir, "test_log.info"))
+        debug_fh = logging.FileHandler(os.path.join(self.log_dir, "test_log.debug"))
+
+        info_fh.setLevel(logging.INFO)
+        debug_fh.setLevel(logging.DEBUG)
+
+        formatter = logging.Formatter(ConsoleDefaults.TEST_LOG_FORMATTER)
+        info_fh.setFormatter(formatter)
+        debug_fh.setFormatter(formatter)
+
+        self._logger.addHandler(info_fh)
+        self._logger.addHandler(debug_fh)
+
+        ch = logging.StreamHandler(sys.stdout)
+        ch.setFormatter(formatter)
+        if self.debug:
+            # If debug flag is set, pipe debug logs to stdout
+            ch.setLevel(logging.DEBUG)
+        else:
+            # default - pipe warning level logging to stdout
+            ch.setLevel(logging.WARNING)
+        self._logger.addHandler(ch)
+
+
+def test_logger(logger_name, log_dir, debug):
+    """Helper method for getting a test logger object
+
+    Note that if this method is called multiple times with the same ``logger_name``, it returns the same logger object.
+    Note also, that for a fixed ``logger_name``, configuration occurs only the first time this function is called.
+    """
+    return TestLoggerMaker(logger_name, log_dir, debug).logger
+
+
+class TestContext(object):
+    """Wrapper class for state variables needed to properly run a single 'test unit'."""
+
+    def __init__(self, **kwargs) -> None:
+        """
+        :param session_context:
+        :param cluster: the cluster object which will be used by this test
+        :param module: name of the module containing the test class/method
+        :param cls: class object containing the test method
+        :param function: the test method
+        :param file: file containing this module
+        :param injected_args: a dict containing keyword args which will be passed to the test method
+        :param cluster_use_metadata: dict containing information about how this test will use cluster resources
+        """
+
+        self.session_context: SessionContext = kwargs["session_context"]
+        self.cluster = kwargs.get("cluster")
+        self.module = kwargs.get("module")
+        self.test_suite_name = kwargs.get("test_suite_name")
+
+        if kwargs.get("file") is not None:
+            self.file = os.path.abspath(kwargs["file"])
+        else:
+            self.file = None
+        self.cls = kwargs.get("cls")
+        self.function = kwargs.get("function")
+        self.injected_args = kwargs.get("injected_args")
+        self.ignore = kwargs.get("ignore", False)
+
+        # cluster_use_metadata is a dict containing information about how this test will use cluster resources
+        self.cluster_use_metadata = copy.copy(kwargs.get("cluster_use_metadata", {}))
+
+        self.services = ServiceRegistry()
+        self.test_index = None
+
+        # dict for toggling service log collection on/off
+        self.log_collect: Dict[Tuple[str, Service], bool] = {}
+
+        self._logger = None
+        self._local_scratch_dir = None
+
+    def __repr__(self) -> str:
+        return (
+            f"<module={self.module}, cls={self.cls_name}, function={self.function_name}, "
+            f"injected_args={self.injected_args}, file={self.file}, ignore={self.ignore}, "
+            f"cluster_spec={self.expected_cluster_spec}>"
+        )
+
+    def copy(self, **kwargs) -> "TestContext":
+        """Construct a new TestContext object from another TestContext object
+        Note that this is not a true copy, since a fresh ServiceRegistry instance will be created.
+        """
+        ctx_copy = TestContext(**self.__dict__)
+        ctx_copy.__dict__.update(**kwargs)
+
+        return ctx_copy
+
+    @property
+    def local_scratch_dir(self):
+        """This local scratch directory is created/destroyed on the test driver before/after each test is run."""
+        if not self._local_scratch_dir:
+            self._local_scratch_dir = tempfile.mkdtemp()
+        return self._local_scratch_dir
+
+    @property
+    def test_metadata(self):
+        return {
+            "directory": os.path.dirname(self.file),
+            "file_name": os.path.basename(self.file),
+            "cls_name": self.cls_name,
+            "method_name": self.function_name,
+            "injected_args": self.injected_args,
+        }
+
+    @staticmethod
+    def logger_name(test_context, test_index):
+        if test_index is None:
+            return test_context.test_id
+        else:
+            return "%s-%s" % (test_context.test_id, str(test_index))
+
+    @staticmethod
+    def results_dir(test_context, test_index):
+        d = test_context.session_context.results_dir
+
+        if test_context.cls is not None:
+            d = os.path.join(d, test_context.cls.__name__)
+        if test_context.function is not None:
+            d = os.path.join(d, test_context.function.__name__)
+        if test_context.injected_args is not None:
+            d = os.path.join(d, test_context.injected_args_name)
+        if test_index is not None:
+            d = os.path.join(d, str(test_index))
+
+        return d
+
+    @property
+    def expected_num_nodes(self) -> int:
+        """
+        How many nodes of any type we expect this test to consume when run.
+        Note that this will be 0 for both unschedulable tests and the tests that legitimately need 0 nodes.
+
+        :return:            an integer number of nodes.
+        """
+        return self.expected_cluster_spec.size() if self.expected_cluster_spec else 0
+
+    @property
+    def expected_cluster_spec(self) -> Optional[ClusterSpec]:
+        """
+        The cluster spec we expect this test to consume when run.
+
+        :return:            A ClusterSpec object or None if the test cannot be run
+                            (e.g. session context settings disallow tests with no cluster metadata attached).
+        """
+        cluster_spec = self.cluster_use_metadata.get(CLUSTER_SPEC_KEYWORD)
+        cluster_size = self.cluster_use_metadata.get(CLUSTER_SIZE_KEYWORD)
+        if cluster_spec is not None:
+            return cluster_spec
+        elif cluster_size is not None:
+            return ClusterSpec.simple_linux(cluster_size)
+        elif not self.cluster:
+            return ClusterSpec.empty()
+        elif self.session_context.fail_greedy_tests:
+            return None
+        else:
+            return self.cluster.all()
+
+    @property
+    def globals(self):
+        return self.session_context.globals
+
+    @property
+    def module_name(self) -> str:
+        return "" if self.module is None else self.module
+
+    @property
+    def cls_name(self) -> str:
+        return "" if self.cls is None else self.cls.__name__
+
+    @property
+    def function_name(self) -> str:
+        return "" if self.function is None else self.function.__name__
+
+    @property
+    def description(self):
+        """Description of the test, needed in particular for reporting.
+        If the function has a docstring, return that, otherwise return the class docstring or "".
+        """
+        if self.function.__doc__:
+            return self.function.__doc__
+        elif self.cls.__doc__ is not None:
+            return self.cls.__doc__
+        else:
+            return ""
+
+    @property
+    def injected_args_name(self) -> str:
+        if self.injected_args is None:
+            return ""
+        else:
+            params = ".".join(["%s=%s" % (k, self.injected_args[k]) for k in self.injected_args])
+            return _escape_pathname(params)
+
+    @property
+    def test_id(self) -> str:
+        return self.test_name
+
+    @property
+    def test_name(self) -> str:
+        """
+        The fully-qualified name of the test. This is similar to test_id, but does not include the session ID. It
+        includes the module, class, and method name.
+        """
+        name_components = [
+            self.module_name,
+            self.cls_name,
+            self.function_name,
+            self.injected_args_name,
+        ]
+
+        return ".".join(filter(lambda x: x is not None and len(x) > 0, name_components))
+
+    @property
+    def logger(self):
+        if self._logger is None:
+            self._logger = test_logger(
+                TestContext.logger_name(self, self.test_index),
+                TestContext.results_dir(self, self.test_index),
+                self.session_context.debug,
+            )
+        return self._logger
+
+    def close(self):
+        """Release resources, etc."""
+        if hasattr(self, "services"):
+            for service in self.services:
+                service.close()
+            # Remove reference to services. This is important to prevent potential memory leaks if users write services
+            # which themselves have references to large memory-intensive objects
+            del self.services
+
+        # Remove local scratch directory
+        if self._local_scratch_dir and os.path.exists(self._local_scratch_dir):
+            shutil.rmtree(self._local_scratch_dir)
+
+        # Release file handles held by logger
+        if self._logger:
+            close_logger(self._logger)