From 6954ae842a83440c7b6110c074bebb238a049cbd Mon Sep 17 00:00:00 2001
From: Dominik Jain <dominik.jain@jambit.com>
Date: Fri, 4 Feb 2022 16:57:58 +0100
Subject: [PATCH 001/131] Sync dcs

  commit 6a9104f3e1a38ddf28d4f9346b24593288cc2edb
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Fri Feb 4 16:27:09 2022 +0100

      Allow to parametrise default TorchDataSetProviderFactories in order to enable
      dynamic tensorisation

  dcs/sensai/torch/torch_base.py
  dcs/sensai/torch/torch_data.py

  commit 9857b52fc6b479035547182defee82a209a63526
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Mon Jan 31 18:51:38 2022 +0100

      EvaluationUtil.compareModelsCrossValidation: Fixed data frame string conversion (could contain ellipses)

  dcs/sensai/evaluation/eval_util.py

  commit e91067624eac7f736ae34613099d8c00b309ac02
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Sat Jan 29 21:03:42 2022 +0100

      TorchDataSetFromTensors: Avoid last batch containing but one item

  dcs/sensai/torch/torch_data.py

  commit 5de914517185af04110ac44992c372bd5deea272
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Thu Jan 20 11:44:16 2022 +0100

      TorchModel.apply:
        * Improved docstring
        * Report normalisation issue on a per input tensor basis

  dcs/sensai/torch/torch_base.py
---
 src/sensai/evaluation/eval_util.py |  3 ++-
 src/sensai/torch/torch_base.py     | 29 +++++++++++++++++------------
 src/sensai/torch/torch_data.py     | 25 +++++++++++++++++++++++--
 3 files changed, 42 insertions(+), 15 deletions(-)

diff --git a/src/sensai/evaluation/eval_util.py b/src/sensai/evaluation/eval_util.py
index 1c1ccb0a..5b29a77f 100644
--- a/src/sensai/evaluation/eval_util.py
+++ b/src/sensai/evaluation/eval_util.py
@@ -239,7 +239,8 @@ def performCrossValidation(self, model: TModel, showPlots=False, logResults=True
         crossValidationData = crossValidator.evalModel(model)
         aggStatsByVar = {varName: crossValidationData.getEvalStatsCollection(predictedVarName=varName).aggStats()
                 for varName in crossValidationData.predictedVarNames}
-        strEvalResults = str(pd.DataFrame.from_dict(aggStatsByVar, orient="index"))
+        df = pd.DataFrame.from_dict(aggStatsByVar, orient="index")
+        strEvalResults = df.to_string()
         if logResults:
             log.info(f"Cross-validation results:\n{strEvalResults}")
         if resultWriter is not None:
diff --git a/src/sensai/torch/torch_base.py b/src/sensai/torch/torch_base.py
index 1dc18613..8d9bddc2 100644
--- a/src/sensai/torch/torch_base.py
+++ b/src/sensai/torch/torch_base.py
@@ -10,7 +10,8 @@
 from torch.nn import functional as F
 
 from .torch_data import TensorScaler, VectorDataUtil, ClassificationVectorDataUtil, TorchDataSet, \
-    TorchDataSetProviderFromDataUtil, TorchDataSetProvider, Tensoriser, TorchDataSetFromDataFrames, RuleBasedTensoriser
+    TorchDataSetProvider, Tensoriser, TorchDataSetFromDataFrames, RuleBasedTensoriser, \
+    TorchDataSetProviderFromVectorDataUtil
 from .torch_enums import ClassificationOutputMode
 from .torch_opt import NNOptimiser, NNLossEvaluatorRegression, NNLossEvaluatorClassification, NNOptimiserParams, TrainingInfo
 from ..data import DataFrameSplitter
@@ -185,7 +186,7 @@ def apply(self, X: Union[torch.Tensor, np.ndarray, TorchDataSet, Sequence[torch.
             mcDropoutSamples: Optional[int] = None, mcDropoutProbability: Optional[float] = None, scaleOutput: bool = False,
             scaleInput: bool = False) -> Union[torch.Tensor, np.ndarray, Tuple]:
         """
-        Applies the model to the given input tensor and returns the result (normalized)
+        Applies the model to the given input tensor and returns the result
 
         :param X: the input tensor (either a batch or, if createBatch=True, a single data point), a data set or a tuple/list of tensors
             (if the model accepts more than one input).
@@ -194,8 +195,8 @@ def apply(self, X: Union[torch.Tensor, np.ndarray, TorchDataSet, Sequence[torch.
         :param createBatch: whether to add an additional tensor dimension for a batch containing just one data point
         :param mcDropoutSamples: if not None, apply MC-Dropout-based inference with the respective number of samples; if None, apply regular inference
         :param mcDropoutProbability: the probability with which to apply dropouts in MC-Dropout-based inference; if None, use model's default
-        :param scaleOutput: whether to scale the output that is produced by the underlying model (using this instance's output scaler)
-        :param scaleInput: whether to scale the input (using this instance's input scaler) before applying the underlying model
+        :param scaleOutput: whether to scale the output that is produced by the underlying model (using this instance's output scaler, if any)
+        :param scaleInput: whether to scale the input (using this instance's input scaler, if any) before applying the underlying model
 
         :return: an output tensor or, if MC-Dropout is applied, a pair (y, sd) where y the mean output tensor and sd is a tensor of the same dimension
             containing standard deviations
@@ -234,13 +235,11 @@ def extract(z):
 
         # check input normalisation
         if self.NORMALISATION_CHECK_THRESHOLD is not None:
-            maxValue = 0.0
-            for t in inputs:
+            for i, t in enumerate(inputs):
                 if t.is_floating_point() and t.numel() > 0:  # skip any integer tensors (which typically contain lengths) and empty tensors
-                    maxValue = max(t.abs().max().item(), maxValue)
-            if maxValue > self.NORMALISATION_CHECK_THRESHOLD:
-                log.warning("Received input which is likely to not be correctly normalised: maximum abs. value in input tensor is %f" % maxValue)
-
+                    maxValue = t.abs().max().item()
+                    if maxValue > self.NORMALISATION_CHECK_THRESHOLD:
+                        log.warning(f"Received value in input tensor {i} which is likely to not be correctly normalised: maximum abs. value in tensor is %f" % maxValue)
         if mcDropoutSamples is None:
             y = model(*inputs)
             return extract(y)
@@ -621,22 +620,28 @@ def createDataSetProvider(self, inputs: pd.DataFrame, outputs: pd.DataFrame,
 
 
 class TorchDataSetProviderFactoryClassificationDefault(TorchDataSetProviderFactory):
+    def __init__(self, tensoriseDynamically=False):
+        self.tensoriseDynamically = tensoriseDynamically
+
     def createDataSetProvider(self, inputs: pd.DataFrame, outputs: pd.DataFrame, model: TorchVectorClassificationModel,
             trainingContext: TrainingContext, inputTensoriser: Optional[Tensoriser], outputTensoriser: Optional[Tensoriser],
             dataFrameSplitter: Optional[DataFrameSplitter]) -> TorchDataSetProvider:
         dataUtil = ClassificationVectorDataUtil(inputs, outputs, model.model.cuda, len(model._labels),
             normalisationMode=model.normalisationMode, inputTensoriser=inputTensoriser, outputTensoriser=outputTensoriser,
             dataFrameSplitter=dataFrameSplitter)
-        return TorchDataSetProviderFromDataUtil(dataUtil, model.model.cuda)
+        return TorchDataSetProviderFromVectorDataUtil(dataUtil, model.model.cuda, tensoriseDynamically=self.tensoriseDynamically)
 
 
 class TorchDataSetProviderFactoryRegressionDefault(TorchDataSetProviderFactory):
+    def __init__(self, tensoriseDynamically=False):
+        self.tensoriseDynamically = tensoriseDynamically
+
     def createDataSetProvider(self, inputs: pd.DataFrame, outputs: pd.DataFrame, model: TorchVectorRegressionModel,
             trainingContext: TrainingContext, inputTensoriser: Optional[Tensoriser], outputTensoriser: Optional[Tensoriser],
             dataFrameSplitter: Optional[DataFrameSplitter]) -> TorchDataSetProvider:
         dataUtil = VectorDataUtil(inputs, outputs, model.model.cuda, normalisationMode=model.normalisationMode,
             inputTensoriser=inputTensoriser, outputTensoriser=outputTensoriser, dataFrameSplitter=dataFrameSplitter)
-        return TorchDataSetProviderFromDataUtil(dataUtil, model.model.cuda)
+        return TorchDataSetProviderFromVectorDataUtil(dataUtil, model.model.cuda, tensoriseDynamically=self.tensoriseDynamically)
 
 
 class OutputTensorToArrayConverter(ABC):
diff --git a/src/sensai/torch/torch_data.py b/src/sensai/torch/torch_data.py
index 51f58630..1a0dac6b 100644
--- a/src/sensai/torch/torch_data.py
+++ b/src/sensai/torch/torch_data.py
@@ -1,5 +1,6 @@
 import logging
 from abc import ABC, abstractmethod
+import math
 from typing import Tuple, Sequence, Optional, Union, List, Iterator
 
 import numpy as np
@@ -485,7 +486,15 @@ def _get_batches(self, tensorTuples: Sequence[TensorTuple], batch_size, shuffle)
             index = torch.LongTensor(range(length))
         start_idx = 0
         while start_idx < length:
-            end_idx = min(length, start_idx + batch_size)
+            remaining_items = length - start_idx
+            is_second_last_batch = remaining_items <= 2*batch_size and remaining_items > batch_size
+            if is_second_last_batch:
+                # to avoid cases where the last batch is excessively small (1 item in the worst case, where e.g. batch
+                # normalisation would not be applicable), we evenly distribute the items across the last two batches
+                adjusted_batch_size = math.ceil(remaining_items / 2)
+                end_idx = min(length, start_idx + adjusted_batch_size)
+            else:
+                end_idx = min(length, start_idx + batch_size)
             excerpt = index[start_idx:end_idx]
             batch = []
             for tensorTuple in tensorTuples:
@@ -504,7 +513,7 @@ def _get_batches(self, tensorTuples: Sequence[TensorTuple], batch_size, shuffle)
                 yield batch[0]
             else:
                 yield tuple(batch)
-            start_idx += batch_size
+            start_idx = end_idx
 
     def size(self):
         return len(self.x)
@@ -598,6 +607,18 @@ def provideSplit(self, fractionalSizeOfFirstSet: float) -> Tuple[TorchDataSet, T
         return TorchDataSetFromTensors(x1, y1, self.cuda), TorchDataSetFromTensors(x2, y2, self.cuda)
 
 
+class TorchDataSetProviderFromVectorDataUtil(TorchDataSetProvider):
+    def __init__(self, dataUtil: VectorDataUtil, cuda: bool, tensoriseDynamically=False):
+        super().__init__(inputTensorScaler=dataUtil.getInputTensorScaler(), outputTensorScaler=dataUtil.getOutputTensorScaler(),
+            inputDim=dataUtil.inputDim(), modelOutputDim=dataUtil.modelOutputDim())
+        self.dataUtil = dataUtil
+        self.cuda = cuda
+        self.tensoriseDynamically = tensoriseDynamically
+
+    def provideSplit(self, fractionalSizeOfFirstSet: float) -> Tuple[TorchDataSet, TorchDataSet]:
+        return self.dataUtil.splitIntoDataSets(fractionalSizeOfFirstSet, self.cuda, tensoriseDynamically=self.tensoriseDynamically)
+
+
 class TensorTransformer(ABC):
     @abstractmethod
     def transform(self, t: torch.Tensor) -> torch.Tensor:

From 437a912693423215b645e95ccddffa53496ad061 Mon Sep 17 00:00:00 2001
From: Dominik Jain <dominik.jain@jambit.com>
Date: Mon, 14 Mar 2022 12:37:13 +0100
Subject: [PATCH 002/131] Sync dcs

  commit f6f0689ec30faeccaf129fac14a32d8ac372c4ca
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Thu Mar 10 15:03:46 2022 +0100

      SortedKeysAndValues:
        * Fixed valueSliceInner
        * Added parameter 'fallback' to valueSliceOuter

  dcs/sensai/util/datastruct.py

  commit 718cd1126aa16b37076f7afbda7b0a11dc20a704
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Thu Mar 10 15:03:18 2022 +0100

      valueSliceOuter: Improved docstring, changed default value of fallbackBounds to False

  dcs/sensai/util/sequences.py

  commit d0c84bcda4655a75dbd7b2c08c86297a19f0f152
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Thu Mar 10 14:37:17 2022 +0100

      Apply setstate

  dcs/sensai/torch/torch_base.py

  commit c6b2df5e708250e95a7ccc32a25c5939da5e22e4
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Thu Mar 10 14:29:46 2022 +0100

      Added docstrings

  dcs/sensai/torch/torch_base.py

  commit feace45bebde85c02ef90cb9d7cf7ea75a9e2e75
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Tue Mar 8 15:20:07 2022 +0100

      LogTime: Allow to configure logger

  dcs/sensai/util/logging.py

  commit cfa9bac815f3e785906720f00aa87c72c0c89cb4
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Tue Mar 8 15:14:10 2022 +0100

      Vectoriser.applyMulti: Log application time in verbose mode

  dcs/sensai/vectoriser.py

  commit 96049012c66c7943b772911241d676ee9caba5b9
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Tue Mar 8 15:13:33 2022 +0100

      LogTime: Allow logging to be disabled via a flag given at construction

  dcs/sensai/util/logging.py

  commit e59cba1f25307f8e00c4fc63588c4a38db9de560
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Tue Mar 8 13:29:03 2022 +0100

      Vectoriser, SequenceVectoriser: Added optional caching of value-generating function
        when using applyMulti

  dcs/sensai/vectoriser.py

  commit f51a63826cca586df1dc4eab1d681076f7eb3e75
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Tue Mar 8 12:56:52 2022 +0100

      Vectoriser, SequenceVectoriser: Added verbose mode for more information during training

  dcs/sensai/vectoriser.py

  commit 66c8c7948a3a94310763667f345a77331bd84135
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Tue Mar 8 11:50:28 2022 +0100

      Fixed check for L-BFGS assuming string representation

  dcs/sensai/torch/torch_opt.py

  commit 1caf1b2907a126b48c5b37d9dde36299416baee8
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Tue Mar 8 11:34:56 2022 +0100

      StopWatch: Extended time retrieval options

      LogTime: Improved logging of duration (depending on elapsed time)

  dcs/sensai/util/logging.py
---
 src/sensai/torch/torch_base.py | 82 +++++++++++++++++++++++++---------
 src/sensai/torch/torch_opt.py  | 16 ++++---
 src/sensai/util/datastruct.py  |  6 +--
 src/sensai/util/logging.py     | 44 +++++++++++++++---
 src/sensai/util/sequences.py   |  7 +--
 src/sensai/vectoriser.py       | 61 +++++++++++++++++++++----
 6 files changed, 167 insertions(+), 49 deletions(-)

diff --git a/src/sensai/torch/torch_base.py b/src/sensai/torch/torch_base.py
index 8d9bddc2..fabb16af 100644
--- a/src/sensai/torch/torch_base.py
+++ b/src/sensai/torch/torch_base.py
@@ -17,6 +17,7 @@
 from ..data import DataFrameSplitter
 from ..normalisation import NormalisationMode
 from ..util.dtype import toFloatArray
+from ..util.pickle import setstate
 from ..util.string import ToStringMixin
 from ..vector_model import VectorRegressionModel, VectorClassificationModel, TrainingContext
 
@@ -389,7 +390,7 @@ def __init__(self, modelClass: Callable[..., TorchModel], modelArgs: Sequence =
         self.model: Optional[TorchModel] = None
         self.inputTensoriser: Optional[Tensoriser] = None
         self.outputTensoriser: Optional[Tensoriser] = None
-        self.outputTensorToArrayConverter = None
+        self.outputTensorToArrayConverter: Optional[OutputTensorToArrayConverter] = None
         self.torchDataSetProviderFactory: Optional[TorchDataSetProviderFactory] = None
         self.dataFrameSplitter: Optional[DataFrameSplitter] = None
 
@@ -397,36 +398,40 @@ def __setstate__(self, state) -> None:
         state["nnOptimiserParams"] = NNOptimiserParams.fromDictOrInstance(state["nnOptimiserParams"])
         newOptionalMembers = ["inputTensoriser", "torchDataSetProviderFactory", "dataFrameSplitter", "outputTensoriser",
             "outputTensorToArrayConverter"]
-        for m in newOptionalMembers:
-            if m not in state:
-                state[m] = None
-        s = super()
-        if hasattr(s, '__setstate__'):
-            s.__setstate__(state)
-        else:
-            self.__dict__ = state
+        setstate(TorchVectorRegressionModel, self, state, newOptionalProperties=newOptionalMembers)
 
     def withInputTensoriser(self, tensoriser: Tensoriser) -> __qualname__:
+        """
+        :param tensoriser: tensoriser to use in order to convert input data frames to (one or more) tensors.
+            The default tensoriser directly converts the data frame's values (which is assumed to contain only scalars that
+            can be coerced to floats) to a float tensor.
+            The use of a custom tensoriser is necessary if a non-trivial conversion is necessary or if the data frame
+            is to be converted to more than one input tensor.
+        :return: self
+        """
         self.inputTensoriser = tensoriser
         return self
 
     def withOutputTensoriser(self, tensoriser: RuleBasedTensoriser) -> __qualname__:
         """
         :param tensoriser: tensoriser to use in order to convert the output data frame to a tensor.
+            The default output tensoriser directly converts the data frame's values to a float tensor.
+
             NOTE: It is required to be a rule-based tensoriser, because mechanisms that require fitting on the data
             and thus perform a data-dependendent conversion are likely to cause problems because they would need
             to be reversed at inference time (since the model will be trained on the converted values). If you require
             a transformation, use a target transformer, which will be applied before the tensoriser.
+        :return: self
         """
         self.outputTensoriser = tensoriser
         return self
 
-    def withOutputTensorToArrayConverter(self, outputTensorToArrayConverter) -> __qualname__:
+    def withOutputTensorToArrayConverter(self, outputTensorToArrayConverter: "OutputTensorToArrayConverter") -> __qualname__:
         """
         Configures the use of a custom converter from tensors to numpy arrays, which is applied during inference.
         A custom converter can be required, for example, to handle variable-length outputs (where the output tensor
         will typically contain unwanted padding). Note that since the converter is for inference only, it may be
-        required to use a custom loss evaluator during training.
+        required to use a custom loss evaluator during training if the use of a custom converter is necessary.
 
         :param outputTensorToArrayConverter: the converter
         :return: self
@@ -434,10 +439,23 @@ def withOutputTensorToArrayConverter(self, outputTensorToArrayConverter) -> __qu
         self.outputTensorToArrayConverter = outputTensorToArrayConverter
 
     def withTorchDataSetProviderFactory(self, torchDataSetProviderFactory: "TorchDataSetProviderFactory") -> __qualname__:
+        """
+        :param torchDataSetProviderFactory: the torch data set provider factory, which is used to instantiate the provider which
+            will provide the training and validation data sets from the input data frame that is passed in for learning.
+            By default, TorchDataSetProviderFactoryRegressionDefault is used.
+        :return: self
+        """
         self.torchDataSetProviderFactory = torchDataSetProviderFactory
         return self
 
     def withDataFrameSplitter(self, dataFrameSplitter: DataFrameSplitter) -> __qualname__:
+        """
+        :param dataFrameSplitter: the data frame splitter which is used to split the input/output data frames that are passed for
+            learning into a data frame that is used for training and a data frame that is used for validation.
+            The input data frame is the data frame that is passed as input to the splitter, and the returned indices
+            are used to split both the input and output data frames in the same way.
+        :return: self
+        """
         self.dataFrameSplitter = dataFrameSplitter
         return self
 
@@ -525,18 +543,19 @@ def __init__(self, outputMode: ClassificationOutputMode,
     def __setstate__(self, state) -> None:
         state["nnOptimiserParams"] = NNOptimiserParams.fromDictOrInstance(state["nnOptimiserParams"])
         newOptionalMembers = ["inputTensoriser", "torchDataSetProviderFactory", "dataFrameSplitter", "outputTensoriser"]
-        for m in newOptionalMembers:
-            if m not in state:
-                state[m] = None
-        if "outputMode" not in state:
-            state["outputMode"] = ClassificationOutputMode.PROBABILITIES
-        s = super()
-        if hasattr(s, '__setstate__'):
-            s.__setstate__(state)
-        else:
-            self.__dict__ = state
+        newDefaultProperties = {"outputMode": ClassificationOutputMode.PROBABILITIES}
+        setstate(TorchVectorClassificationModel, self, state, newOptionalProperties=newOptionalMembers,
+            newDefaultProperties=newDefaultProperties)
 
     def withInputTensoriser(self, tensoriser: Tensoriser) -> __qualname__:
+        """
+        :param tensoriser: tensoriser to use in order to convert input data frames to (one or more) tensors.
+            The default tensoriser directly converts the data frame's values (which is assumed to contain only scalars that
+            can be coerced to floats) to a float tensor.
+            The use of a custom tensoriser is necessary if a non-trivial conversion is necessary or if the data frame
+            is to be converted to more than one input tensor.
+        :return: self
+        """
         self.inputTensoriser = tensoriser
         return self
 
@@ -552,10 +571,23 @@ def withOutputTensoriser(self, tensoriser: RuleBasedTensoriser) -> __qualname__:
         return self
 
     def withTorchDataSetProviderFactory(self, torchDataSetProviderFactory: "TorchDataSetProviderFactory") -> __qualname__:
+        """
+        :param torchDataSetProviderFactory: the torch data set provider factory, which is used to instantiate the provider which
+            will provide the training and validation data sets from the input data frame that is passed in for learning.
+            By default, TorchDataSetProviderFactoryClassificationDefault is used.
+        :return: self
+        """
         self.torchDataSetProviderFactory = torchDataSetProviderFactory
         return self
 
     def withDataFrameSplitter(self, dataFrameSplitter: DataFrameSplitter) -> __qualname__:
+        """
+        :param dataFrameSplitter: the data frame splitter which is used to split the input/output data frames that are passed for
+            learning into a data frame that is used for training and a data frame that is used for validation.
+            The input data frame is the data frame that is passed as input to the splitter, and the returned indices
+            are used to split both the input and output data frames in the same way.
+        :return: self
+        """
         self.dataFrameSplitter = dataFrameSplitter
         return self
 
@@ -621,6 +653,10 @@ def createDataSetProvider(self, inputs: pd.DataFrame, outputs: pd.DataFrame,
 
 class TorchDataSetProviderFactoryClassificationDefault(TorchDataSetProviderFactory):
     def __init__(self, tensoriseDynamically=False):
+        """
+        :param tensoriseDynamically: whether tensorisation shall take place on the fly whenever the provided data sets are iterated;
+              if False, tensorisation takes place once in a precomputation stage (tensors must jointly fit into memory)
+        """
         self.tensoriseDynamically = tensoriseDynamically
 
     def createDataSetProvider(self, inputs: pd.DataFrame, outputs: pd.DataFrame, model: TorchVectorClassificationModel,
@@ -634,6 +670,10 @@ def createDataSetProvider(self, inputs: pd.DataFrame, outputs: pd.DataFrame, mod
 
 class TorchDataSetProviderFactoryRegressionDefault(TorchDataSetProviderFactory):
     def __init__(self, tensoriseDynamically=False):
+        """
+        :param tensoriseDynamically: whether tensorisation shall take place on the fly whenever the provided data sets are iterated;
+              if False, tensorisation takes place once in a precomputation stage (tensors must jointly fit into memory)
+        """
         self.tensoriseDynamically = tensoriseDynamically
 
     def createDataSetProvider(self, inputs: pd.DataFrame, outputs: pd.DataFrame, model: TorchVectorRegressionModel,
diff --git a/src/sensai/torch/torch_opt.py b/src/sensai/torch/torch_opt.py
index 3e155159..f1b6118e 100644
--- a/src/sensai/torch/torch_opt.py
+++ b/src/sensai/torch/torch_opt.py
@@ -41,13 +41,20 @@ class Optimiser(enum.Enum):
     LBFGS = ("lbfgs", optim.LBFGS)
 
     @classmethod
-    def fromName(cls, name: str):
+    def fromName(cls, name: str) -> "Optimiser":
         lname = name.lower()
         for o in cls:
             if o.value[0] == lname:
                 return o
         raise ValueError(f"Unknown optimiser name '{name}'; known names: {[o.value[0] for o in cls]}")
 
+    @classmethod
+    def fromNameOrInstance(cls, nameOrInstance: Union[str, "Optimiser"]) -> "Optimiser":
+        """Resolves a name (any str instance) via fromName; any other value is returned unchanged."""
+        if isinstance(nameOrInstance, str):
+            return cls.fromName(nameOrInstance)
+        return nameOrInstance
+
 
 class _Optimiser(object):
     """
@@ -61,10 +68,7 @@ def __init__(self, params, method: Union[str, Optimiser], lr, max_grad_norm, use
         :param max_grad_norm: gradient norm value beyond which to apply gradient shrinkage
         :param optimiserArgs: keyword arguments to be used in actual torch optimiser
         """
-        if type(method) == str:
-            self.method = Optimiser.fromName(method)
-        else:
-            self.method = method
+        self.method = Optimiser.fromNameOrInstance(method)
         self.params = list(params)  # careful: params may be a generator
         self.last_ppl = None
         self.lr = lr
@@ -553,7 +557,7 @@ def __init__(self, lossEvaluator: NNLossEvaluator = None, gpu=None, optimiser: U
         :param shuffle: whether to shuffle the training data
         :param optimiserArgs: keyword arguments to be passed on to the actual torch optimiser
         """
-        if optimiser == 'lbfgs':
+        if Optimiser.fromNameOrInstance(optimiser) == Optimiser.LBFGS:
             largeBatchSize = 1e12
             if batchSize is not None:
                 log.warning(f"LBFGS does not make use of batches, therefore using large batch size {largeBatchSize} to achieve use of a single batch")
diff --git a/src/sensai/util/datastruct.py b/src/sensai/util/datastruct.py
index 27ca13d2..1b0f22dc 100644
--- a/src/sensai/util/datastruct.py
+++ b/src/sensai/util/datastruct.py
@@ -229,10 +229,10 @@ def closestKeyAndValue(self, key) -> Optional[Tuple[TKey, TValue]]:
         return None if idx is None else (self.keys[idx], self.values[idx])
 
     def valueSliceInner(self, lowerBoundKey, upperBoundKey):
-        return array_util.valueSliceOuter(self.keys, lowerBoundKey, upperBoundKey, values=self.values)
+        return array_util.valueSliceInner(self.keys, lowerBoundKey, upperBoundKey, values=self.values)
 
-    def valueSliceOuter(self, lowerBoundKey, upperBoundKey):
-        return array_util.valueSliceOuter(self.keys, lowerBoundKey, upperBoundKey, values=self.values)
+    def valueSliceOuter(self, lowerBoundKey, upperBoundKey, fallback=False):
+        return array_util.valueSliceOuter(self.keys, lowerBoundKey, upperBoundKey, values=self.values, fallbackBounds=fallback)
 
 
 class SortedKeyValuePairs(Generic[TKey, TValue]):
diff --git a/src/sensai/util/logging.py b/src/sensai/util/logging.py
index b90e533b..324392b1 100644
--- a/src/sensai/util/logging.py
+++ b/src/sensai/util/logging.py
@@ -7,7 +7,6 @@
 
 import pandas as pd
 
-
 log = getLogger(__name__)
 
 LOG_DEFAULT_FORMAT = '%(levelname)-5s %(asctime)-15s %(name)s:%(funcName)s - %(message)s'
@@ -69,6 +68,16 @@ def restart(self):
     def getElapsedTimeSecs(self) -> float:
         return time.time() - self.startTime
 
+    def getElapsedTimedelta(self) -> pd.Timedelta:
+        return pd.Timedelta(self.getElapsedTimeSecs(), unit="s")
+
+    def getElapsedTimeString(self) -> str:
+        secs = self.getElapsedTimeSecs()
+        if secs < 60:
+            return f"{secs:.3f} seconds"
+        else:
+            return str(pd.Timedelta(secs, unit="s"))
+
 
 class StopWatchManager:
     """
@@ -93,7 +102,7 @@ def start(self, name):
 
     def stop(self, name) -> float:
         """
-        :param name: the name of the time
+        :param name: the name of the stopwatch
         :return: the time that has passed in seconds
         """
         timePassedSecs = time.time() - self._stopWatches[name]
@@ -105,18 +114,39 @@ def isRunning(self, name):
 
 
 class LogTime:
-    def __init__(self, name):
+    """
+    An execution time logger which can be conveniently applied using a with-statement - in order to log the execution time of the respective
+    with-block.
+    """
+
+    def __init__(self, name, enabled=True, logger: Logger = None):
+        """
+        :param name: the name of the event whose time is to be logged upon completion as "<name> completed in <time>"
+        :param enabled: whether the logging is actually enabled; can be set to False to disable logging without necessitating
+            changes to client code
+        :param logger: the logger to use; if None, use the logger of LogTime's module
+        """
         self.name = name
-        self.startTime = None
+        self.enabled = enabled
+        self.stopwatch = None
+        self.logger = logger if logger is not None else log
 
     def start(self):
-        self.startTime = time.time()
+        """
+        Starts the stopwatch
+        """
+        self.stopwatch = StopWatch()
 
     def stop(self):
-        log.info(f"{self.name} completed in {time.time()-self.startTime:.3f} seconds")
+        """
+        Stops the stopwatch and logs the time taken (if enabled)
+        """
+        if self.stopwatch is not None and self.enabled:
+            self.logger.info(f"{self.name} completed in {self.stopwatch.getElapsedTimeString()}")
 
     def __exit__(self, exc_type, exc_value, traceback):
         self.stop()
 
     def __enter__(self):
-        return self.start()
\ No newline at end of file
+        self.start()
+        return self
\ No newline at end of file
diff --git a/src/sensai/util/sequences.py b/src/sensai/util/sequences.py
index 1b617918..dfb4f4fe 100644
--- a/src/sensai/util/sequences.py
+++ b/src/sensai/util/sequences.py
@@ -163,21 +163,22 @@ def valueSliceInner(keys, lowerBoundKey, upperBoundKey, values=None):
     return values[firstIdx:lastIdx+1]
 
 
-def valueSliceOuter(keys, lowerBoundKey, upperBoundKey, values=None, fallbackBounds=True):
+def valueSliceOuter(keys, lowerBoundKey, upperBoundKey, values=None, fallbackBounds=False):
     """
     For a sorted array of keys and an array of corresponding values,
     finds indices i, j such that i is the largest key where keys[i] <= lowerBoundKey and
     j is the lowest key where keys[j] <= upperBoundKey,
     and returns the corresponding slice of values values[i:j+1].
     If such indices do not exists and fallbackBounds==True, the array bounds are used (i.e. 0 or len-1).
-    Given the indices i and j, the function returns values[i:j+1].
-    This is an outer slice which is the smallest slice that definitely contains two given bounds
+    If such indices do not exist and fallbackBounds==False, an exception is raised.
+    The returned slice is an outer slice, which is the smallest slice that definitely contains the two given bounds
     (for fallbackBounds==False).
 
     :param keys: the sorted array of key values
     :param lowerBoundKey: the key value defining the lower bound
     :param upperBoundKey: the key value defining the upper bound
     :param values: the sorted array of values; if None, use keys
+    :param fallbackBounds: whether to use the smallest/largest index (i.e. 0 or len-1) as a fallback in case no matching bounds exist
     :return: the corresponding slice of `values`
     """
     if values is None:
diff --git a/src/sensai/vectoriser.py b/src/sensai/vectoriser.py
index 0fa9ee0f..99b48ebf 100644
--- a/src/sensai/vectoriser.py
+++ b/src/sensai/vectoriser.py
@@ -4,6 +4,7 @@
 
 import numpy as np
 
+from .util import LogTime
 from .util.pickle import setstate
 from .util.string import listString, ToStringMixin
 
@@ -17,6 +18,9 @@ class Vectoriser(Generic[T], ToStringMixin):
     A vectoriser represents a method for the conversion of instances of some type T into
     vectors, i.e. one-dimensional (numeric) arrays, or (in the special case of a 1D vector) scalars
     """
+
+    log = log.getChild(__qualname__)
+
     def __init__(self, f: Callable[[T], Union[float, np.ndarray, list]], transformer=None):
         """
         :param f: the function which maps from an instance of T to an array/list/scalar
@@ -75,7 +79,7 @@ def apply(self, item: T, transform=True) -> np.array:
             value = self.transformer.transform([value])[0]
         return value
 
-    def applyMulti(self, items: Iterable[T], transform=True) -> List[np.array]:
+    def applyMulti(self, items: Iterable[T], transform=True, useCache=False, verbose=False) -> List[np.array]:
         """
         Applies this vectoriser to multiple items at once.
         Especially for cases where this vectoriser uses a transformer, this method is significantly faster than
@@ -83,12 +87,33 @@ def applyMulti(self, items: Iterable[T], transform=True) -> List[np.array]:
 
         :param items: the items to be vectorised
         :param transform: whether to apply this instance's transformer (if any)
+        :param useCache: whether to apply caching of the value function f given at construction (keeping track of outputs for
+            each input object id), which can significantly speed up computation in cases where an item appears more than
+            once in the collection of items
+        :param verbose: whether to generate log messages
         :return: a list of vectors
         """
-        values = [self._f(x) for x in items]
-        if self.transformer is not None and transform:
-            values = self.transformer.transform(values)
-        return values
+        if verbose:
+            self.log.info(f"Applying {self}")
+
+        with LogTime("Application", enabled=verbose, logger=self.log):
+            if not useCache:
+                computeValue = self._f
+            else:
+                cache = {}
+
+                def computeValue(x):
+                    key = id(x)
+                    entry = cache.get(key)  # entries keep x alive, so its id cannot be reused by another object
+                    if entry is None:
+                        entry = (x, self._f(x))
+                        cache[key] = entry
+                    return entry[1]
+
+            values = [computeValue(x) for x in items]
+            if self.transformer is not None and transform:
+                values = self.transformer.transform(values)
+            return values
 
     class ResultType(Enum):
         SCALAR = 0
@@ -124,6 +149,9 @@ class SequenceVectoriser(Generic[T], ToStringMixin):
     are used for training, we take into consideration the fact that the sequences of T may overlap and thus training
     is performed on the set of unique instances.
     """
+
+    log = log.getChild(__qualname__)
+
     class FittingMode(Enum):
         """
         Determines how the individual vectorisers are fitted based on several sequences of objects of type T that are given.
@@ -183,7 +211,7 @@ def apply(self, seq: Sequence[T], transform=True) -> List[np.array]:
             vectorsList.append(conc)
         return vectorsList
 
-    def applyMulti(self, sequences: Iterable[Sequence[T]]) -> Tuple[List[List[np.array]], List[int]]:
+    def applyMulti(self, sequences: Iterable[Sequence[T]], useCache=False, verbose=False) -> Tuple[List[List[np.array]], List[int]]:
         """
         Applies this vectoriser to multiple sequences of objects of type T, where each sequence is mapped to a sequence
         of 1D arrays.
@@ -191,16 +219,25 @@ def applyMulti(self, sequences: Iterable[Sequence[T]]) -> Tuple[List[List[np.arr
         use transformers.
 
         :param sequences: the sequences to vectorise
+        :param useCache: whether to apply caching of the value functions of contained vectorisers (keeping track of outputs for
+            each input object id), which can significantly speed up computation in cases where the given sequences contain individual
+            items more than once
+        :param verbose: whether to generate log messages
         :return: a pair (vl, l) where vl is a list of lists of vectors/arrays and l is a list of integers containing the lengths
             of the sequences
         """
+        if verbose:
+            self.log.info(f"Applying {self} (useCache={useCache})")
+
         lengths = [len(s) for s in sequences]
 
+        if verbose:
+            self.log.info("Generating combined sequence")
         combinedSeq = []
         for seq in sequences:
             combinedSeq.extend(seq)
 
-        individualVectoriserResults = [vectoriser.applyMulti(combinedSeq) for vectoriser in self.vectorisers]
+        individualVectoriserResults = [vectoriser.applyMulti(combinedSeq, useCache=useCache, verbose=verbose) for vectoriser in self.vectorisers]
         concVectors = [np.concatenate(x, axis=0) for x in zip(*individualVectoriserResults)]
 
         vectorSequences = []
@@ -211,7 +248,7 @@ def applyMulti(self, sequences: Iterable[Sequence[T]]) -> Tuple[List[List[np.arr
 
         return vectorSequences, lengths
 
-    def applyMultiWithPadding(self, sequences: Sequence[Sequence[T]]) -> Tuple[List[List[np.array]], List[int]]:
+    def applyMultiWithPadding(self, sequences: Sequence[Sequence[T]], useCache=False, verbose=False) -> Tuple[List[List[np.array]], List[int]]:
         """
         Applies this vectoriser to multiple sequences of objects of type T, where each sequence is mapped to a sequence
         of 1D arrays.
@@ -219,10 +256,16 @@ def applyMultiWithPadding(self, sequences: Sequence[Sequence[T]]) -> Tuple[List[
         is reached (padding).
 
         :param sequences: the sequences to vectorise
+        :param useCache: whether to apply caching of the value functions of contained vectorisers (keeping track of outputs for
+            each input object id), which can significantly speed up computation in cases where the given sequences contain individual
+            items more than once
+        :param verbose: whether to generate log messages
         :return: a pair (vl, l) where vl is a list of lists of vectors/arrays, each list having the same length, and l is a list of
             integers containing the original unpadded lengths of the sequences
         """
-        result, lengths = self.applyMulti(sequences)
+        result, lengths = self.applyMulti(sequences, useCache=useCache, verbose=verbose)
+        if verbose:
+            self.log.info("Applying padding")
         maxLength = max(lengths)
         dim = len(result[0][0])
         dummyVec = np.zeros((dim,))

From 26798a959f42c0fde9420f8fc3766a01833f96f5 Mon Sep 17 00:00:00 2001
From: Dominik Jain <dominik.jain@jambit.com>
Date: Tue, 26 Apr 2022 21:42:39 +0200
Subject: [PATCH 003/131] Sync pjm

  commit e87fb029d16c6cebf1815910318d4db76f799a89
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Tue Apr 26 21:34:12 2022 +0200

      Increase precision of normalised matrix display from 2 to 4 decimals

  sensai/util/plot.py

  commit 07eef5539a2b42461b04c523c9801d7b362e2cbe
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Mon Apr 25 20:41:25 2022 +0200

      MultiDataEvaluationUtil: Added support for provision of meta-data which is added to result data frames

  sensai/evaluation/eval_util.py

  commit 524af4d11c9fadbd2a75cd034d7faa6a40b70b06
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Mon Apr 25 20:40:06 2022 +0200

      Fixed error in docstring

  sensai/evaluation/crossval.py

  commit fe4cacd06a22081324de0fd3d6f0d0dc47c1c96c
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Mon Apr 25 20:39:51 2022 +0200

      Added DataSplitterFromSkLearnSplitter, DataSplitterStratifiedShuffleSplit

  sensai/data.py

  commit 30f93e6be4f8721bbb9137635a6dbf66aedabf54
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Mon Apr 25 17:02:37 2022 +0200

      MultiDataEvaluationUtil: Added more flexible model comparison (which can also use simple evaluation)

  sensai/evaluation/eval_util.py

  commit ab3e11d8dcfe185d42db7b0708883cbb3ddbf88a
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Mon Apr 25 16:33:12 2022 +0200

      RelativeFrequencyCounter: Explicitly handle case where the frequency does not exist, returning None

  sensai/util/aggregation.py

  commit ed209da1caccf187c588247148749237b6e30f01
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Fri Apr 8 11:35:53 2022 +0200

      Changed display name of accuracy metric from 'ACC' to 'Accuracy'

  sensai/evaluation/eval_stats/eval_stats_classification.py

  commit 2756e0d3ac0b536c8c4d44df56121f515e0cce92
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Fri Apr 8 11:32:00 2022 +0200

      Classifier evaluation: cater to binary classification case
        * EvalStats/EvaluatorParams: Allow to specify positive class (try to infer when not given)
        * Added metrics precision and recall (default for binary case)
        * Added precision-recall curve (generated by default when using util in binary case)

  sensai/evaluation/eval_stats/eval_stats_classification.py
  sensai/evaluation/eval_util.py
  sensai/evaluation/evaluator.py

  commit 972dd16868aab1a0ab9337af13540b074701964d
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Tue Apr 5 22:51:15 2022 +0200

      AbstractSkLearnVectorClassificationModel: Support weighting of data points based on
      inverse class frequency in training data (via constructor argument)

      SkLearnRandomForestVectorClassificationModel: Added constructor argument

  sensai/sklearn/sklearn_base.py
  sensai/sklearn/sklearn_classification.py

  commit bb69f54a79deef3769d5ba3b60646065acdd0805
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Tue Apr 5 22:33:07 2022 +0200

      Added docstring

  sensai/data.py
---
 src/sensai/data.py                            |  27 ++++-
 src/sensai/evaluation/crossval.py             |   2 +-
 .../eval_stats/eval_stats_classification.py   | 100 ++++++++++++++++--
 src/sensai/evaluation/eval_util.py            |  42 ++++++--
 src/sensai/evaluation/evaluator.py            |   5 +-
 src/sensai/sklearn/sklearn_base.py            |  29 ++++-
 src/sensai/sklearn/sklearn_classification.py  |   6 +-
 src/sensai/util/aggregation.py                |   9 +-
 src/sensai/util/plot.py                       |   2 +-
 9 files changed, 190 insertions(+), 32 deletions(-)

diff --git a/src/sensai/data.py b/src/sensai/data.py
index f9a6713a..d8166ccc 100644
--- a/src/sensai/data.py
+++ b/src/sensai/data.py
@@ -1,10 +1,13 @@
+import logging
 from abc import ABC, abstractmethod
 from typing import Tuple, Sequence, TypeVar, List, Generic
 
 import numpy as np
 import pandas as pd
 import scipy.stats
+from sklearn.model_selection import StratifiedShuffleSplit
 
+log = logging.getLogger(__name__)
 
 T = TypeVar("T")
 
@@ -47,8 +50,10 @@ def toTorchDataLoader(self, batchSize=64, shuffle=True):
         return DataLoader(dataSet, batch_size=batchSize, shuffle=shuffle)
 
 
-# TODO: Rename to InputOutputDataFrames when the time for breaking changes has come
 class InputOutputData(BaseInputOutputData[pd.DataFrame]):
+    """
+    Holds input and output data for learning problems
+    """
     def __init__(self, inputs: pd.DataFrame, outputs: pd.DataFrame):
         super().__init__(inputs, outputs)
 
@@ -134,6 +139,26 @@ def split(self, data: InputOutputData) -> Tuple[InputOutputData, InputOutputData
         return A, B
 
 
+class DataSplitterFromSkLearnSplitter(DataSplitter):
+    def __init__(self, skLearnSplitter):
+        """
+        :param skLearnSplitter: an instance of one of the splitter classes from sklearn.model_selection,
+            see https://scikit-learn.org/stable/modules/classes.html#module-sklearn.model_selection
+        """
+        self.skLearnSplitter = skLearnSplitter
+
+    def split(self, data: TInputOutputData) -> Tuple[TInputOutputData, TInputOutputData]:
+        splitterResult = self.skLearnSplitter.split(data.inputs, data.outputs)
+        split = next(iter(splitterResult))  # only the first split generated by the sklearn splitter is used
+        firstIndices, secondIndices = split
+        return data.filterIndices(firstIndices), data.filterIndices(secondIndices)
+
+
+class DataSplitterStratifiedShuffleSplit(DataSplitterFromSkLearnSplitter):
+    def __init__(self, fractionalSizeOfFirstSet: float, randomSeed=42):
+        super().__init__(StratifiedShuffleSplit(n_splits=1, train_size=fractionalSizeOfFirstSet, random_state=randomSeed))
+
+
 class DataFrameSplitter(ABC):
     @abstractmethod
     def computeSplitIndices(self, df: pd.DataFrame, fractionalSizeOfFirstSet: float) -> Tuple[Sequence[int], Sequence[int]]:
diff --git a/src/sensai/evaluation/crossval.py b/src/sensai/evaluation/crossval.py
index a2552b83..4fe251d9 100644
--- a/src/sensai/evaluation/crossval.py
+++ b/src/sensai/evaluation/crossval.py
@@ -68,7 +68,7 @@ def createFolds(self, data: InputOutputData, numFolds: int) -> List[Tuple[Sequen
         """
         :param data: the data from which to obtain the folds
         :param numFolds: the number of splits/folds
-        :return: a list containing numSplits tuples (t, e) where t and e are sequences of data point indices to use for training
+        :return: a list containing numFolds tuples (t, e) where t and e are sequences of data point indices to use for training
             and evaluation respectively
         """
         pass
diff --git a/src/sensai/evaluation/eval_stats/eval_stats_classification.py b/src/sensai/evaluation/eval_stats/eval_stats_classification.py
index f1c9be04..f5dd9a7e 100644
--- a/src/sensai/evaluation/eval_stats/eval_stats_classification.py
+++ b/src/sensai/evaluation/eval_stats/eval_stats_classification.py
@@ -1,14 +1,22 @@
+from abc import ABC, abstractmethod
+from typing import List, Sequence
+import logging
+
+from matplotlib import pyplot as plt
 import numpy as np
 import pandas as pd
 import sklearn
-from abc import ABC, abstractmethod
-from sklearn.metrics import confusion_matrix, accuracy_score
-from typing import List, Sequence
+from sklearn.metrics import confusion_matrix, accuracy_score, precision_score, recall_score, precision_recall_curve, PrecisionRecallDisplay
 
 from .eval_stats_base import PredictionArray, PredictionEvalStats, EvalStatsCollection, Metric
 from ...util.plot import plotMatrix
 
 
+log = logging.getLogger(__name__)
+
+BINARY_CLASSIFICATION_POSITIVE_LABEL_CANDIDATES = [1, True, "1", "True"]
+
+
 class ClassificationMetric(Metric["ClassificationEvalStats"], ABC):
     requiresProbabilities = False
 
@@ -26,7 +34,7 @@ def _computeValue(self, y_true, y_predicted, y_predictedClassProbabilities):
 
 
 class ClassificationMetricAccuracy(ClassificationMetric):
-    name = "ACC"
+    name = "Accuracy"
 
     def _computeValue(self, y_true, y_predicted, y_predictedClassProbabilities):
         return accuracy_score(y_true=y_true, y_pred=y_predicted)
@@ -66,13 +74,40 @@ def _computeValue(self, y_true, y_predicted, y_predictedClassProbabilities):
         return cnt / len(y_true)
 
 
+class BinaryClassificationMetric(ClassificationMetric, ABC):
+    def __init__(self, positiveClassLabel, name: str = None):
+        super().__init__(name)
+        self.positiveClassLabel = positiveClassLabel
+
+
+class BinaryClassificationMetricPrecision(BinaryClassificationMetric):
+    name = "Precision"
+
+    def __init__(self, positiveClassLabel):
+        super().__init__(positiveClassLabel)
+
+    def _computeValue(self, y_true, y_predicted, y_predictedClassProbabilities):
+        return precision_score(y_true, y_predicted, pos_label=self.positiveClassLabel)
+
+
+class BinaryClassificationMetricRecall(BinaryClassificationMetric):
+    name = "Recall"
+
+    def __init__(self, positiveClassLabel):
+        super().__init__(positiveClassLabel)
+
+    def _computeValue(self, y_true, y_predicted, y_predictedClassProbabilities):
+        return recall_score(y_true, y_predicted, pos_label=self.positiveClassLabel)
+
+
 class ClassificationEvalStats(PredictionEvalStats["ClassificationMetric"]):
     def __init__(self, y_predicted: PredictionArray = None,
-                 y_true: PredictionArray = None,
-                 y_predictedClassProbabilities: pd.DataFrame = None,
-                 labels: PredictionArray = None,
-                 metrics: Sequence["ClassificationMetric"] = None,
-                 additionalMetrics: Sequence["ClassificationMetric"] = None):
+            y_true: PredictionArray = None,
+            y_predictedClassProbabilities: pd.DataFrame = None,
+            labels: PredictionArray = None,
+            metrics: Sequence["ClassificationMetric"] = None,
+            additionalMetrics: Sequence["ClassificationMetric"] = None,
+            binaryPositiveLabel=None):
         """
         :param y_predicted: the predicted class labels
         :param y_true: the true class labels
@@ -80,6 +115,10 @@ def __init__(self, y_predicted: PredictionArray = None,
         :param labels: the list of class labels
         :param metrics: the metrics to compute for evaluation; if None, use default metrics
         :param additionalMetrics: the metrics to additionally compute
+        :param binaryPositiveLabel: the label of the positive class for the case where it is a binary classification;
+            if None, check `labels` for occurrence of one of BINARY_CLASSIFICATION_POSITIVE_LABEL_CANDIDATES in the respective
+            order, and if none of these appear in `labels`, the classification will not be treated as a binary classification and
+            a warning will be logged
         """
         self.labels = labels
         self.y_predictedClassProbabilities = y_predictedClassProbabilities
@@ -91,8 +130,29 @@ def __init__(self, y_predicted: PredictionArray = None,
             if len(y_predictedClassProbabilities) != len(y_true):
                 raise ValueError("Row count in class probabilities data frame does not match ground truth")
 
+        numLabels = len(labels)
+        if binaryPositiveLabel is not None:
+            if numLabels != 2:
+                raise ValueError(f"Passed binaryPositiveLabel for non-binary classification (labels={self.labels})")
+            if binaryPositiveLabel not in self.labels:
+                raise ValueError(f"The binary positive label {binaryPositiveLabel} does not appear in labels={labels}")
+        else:
+            if numLabels == 2:
+                # take the first candidate (in list order) that matches a label; use the label itself, because 1 == True in Python
+                binaryPositiveLabel = next(
+                    (label for c in BINARY_CLASSIFICATION_POSITIVE_LABEL_CANDIDATES for label in labels if label == c), None)
+        if numLabels == 2 and binaryPositiveLabel is None:
+            log.warning(f"Binary classification (labels={labels}) without specification of positive class label; binary classification metrics will not be considered")
+        self.binaryPositiveLabel = binaryPositiveLabel
+        self.isBinary = binaryPositiveLabel is not None
+
         if metrics is None:
             metrics = [ClassificationMetricAccuracy(), ClassificationMetricGeometricMeanOfTrueClassProbability()]
+            if self.isBinary:
+                metrics.extend([
+                    BinaryClassificationMetricPrecision(self.binaryPositiveLabel),
+                    BinaryClassificationMetricRecall(self.binaryPositiveLabel)])
+
         metrics = list(metrics)
         if additionalMetrics is not None:
             for m in additionalMetrics:
@@ -120,14 +180,31 @@ def plotConfusionMatrix(self, normalize=True, titleAdd: str = None):
         confusionMatrix = self.getConfusionMatrix()
         return confusionMatrix.plot(normalize=normalize, titleAdd=titleAdd)
 
+    def plotPrecisionRecallCurve(self, titleAdd: str = None):
+        """Plots the precision-recall curve of the positive class and returns the figure; requires binary labels and probabilities"""
+        if not self._probabilitiesAvailable:
+            raise Exception("Precision-recall curve requires probabilities")
+        if not self.isBinary:
+            raise Exception("Precision-recall curve is not applicable to non-binary classification")
+        probabilities = self.y_predictedClassProbabilities[self.binaryPositiveLabel]
+        precision, recall, _ = precision_recall_curve(y_true=self.y_true, probas_pred=probabilities,
+            pos_label=self.binaryPositiveLabel)
+        disp = PrecisionRecallDisplay(precision, recall)
+        disp.plot()
+        ax: plt.Axes = disp.ax_
+        # PrecisionRecallDisplay draws recall along the x-axis and precision along the y-axis
+        ax.set_xlabel("recall")
+        ax.set_ylabel("precision")
+        title = "Precision-Recall Curve" if titleAdd is None else "Precision-Recall Curve\n" + titleAdd
+        ax.set_title(title)
+        return disp.figure_
+
 
 class ClassificationEvalStatsCollection(EvalStatsCollection[ClassificationEvalStats]):
     def __init__(self, evalStatsList: List[ClassificationEvalStats]):
         super().__init__(evalStatsList)
         self.globalStats = None
 
-    # TODO once we moved to python 3.8: move to base class and use the new get_args method to infer the generic type at runtime
-    #  https://docs.python.org/3/library/typing.html#typing.get_args
     def getGlobalStats(self) -> ClassificationEvalStats:
         """
         Gets an evaluation statistics object that combines the data from all contained eval stats objects
@@ -148,3 +225,4 @@ def plot(self, normalize=True, titleAdd: str = None):
         title = 'Normalized Confusion Matrix' if normalize else 'Confusion Matrix (Counts)'
         return plotMatrix(self.confusionMatrix, title, self.labels, self.labels, 'true class', 'predicted class', normalize=normalize,
             titleAdd=titleAdd)
+
diff --git a/src/sensai/evaluation/eval_util.py b/src/sensai/evaluation/eval_util.py
index 5b29a77f..9309bf9f 100644
--- a/src/sensai/evaluation/eval_util.py
+++ b/src/sensai/evaluation/eval_util.py
@@ -353,30 +353,51 @@ def _createEvalStatsPlots(self, evalStats: RegressionEvalStats, resultCollector:
 class ClassificationEvaluationUtil(EvaluationUtil[VectorClassificationModel, VectorClassificationModelEvaluator, VectorClassificationModelEvaluationData, VectorClassificationModelCrossValidator, VectorClassificationModelCrossValidationData, ClassificationEvalStats]):
     def _createEvalStatsPlots(self, evalStats: ClassificationEvalStats, resultCollector: EvaluationUtil.ResultCollector, subtitle=None):
         resultCollector.addFigure("confusion-matrix", evalStats.plotConfusionMatrix(titleAdd=subtitle))
+        if evalStats.isBinary:
+            resultCollector.addFigure("precision-recall", evalStats.plotPrecisionRecallCurve(titleAdd=subtitle))
 
 
 class MultiDataEvaluationUtil:
-    def __init__(self, inputOutputDataDict: Dict[str, InputOutputData], keyName: str = "dataset"):
+    def __init__(self, inputOutputDataDict: Dict[str, InputOutputData], keyName: str = "dataset",
+            metaDataDict: Optional[Dict[str, Dict[str, Any]]] = None):
         """
         :param inputOutputDataDict: a dictionary mapping from names to the data sets with which to evaluate models
-        :param keyName: a name for the key value used in inputOutputDataDict
+        :param keyName: a name for the key value used in inputOutputDataDict, which will be used as a column name in result data frames
+        :param metaDataDict: a dictionary which maps from a name (same keys as in inputOutputDataDict) to a dictionary, which maps
+            from a column name to a value and which is to be used to extend the result data frames containing per-dataset results
         """
         self.inputOutputDataDict = inputOutputDataDict
         self.keyName = keyName
+        if metaDataDict is not None:
+            self.metaDF = pd.DataFrame(metaDataDict.values(), index=metaDataDict.keys())
+        else:
+            self.metaDF = None
 
     def compareModelsCrossValidation(self, modelFactories: Sequence[Callable[[], VectorModel]],
             resultWriter: Optional[ResultWriter] = None, writePerDatasetResults=True,
             crossValidatorParams: Optional[Dict[str, Any]] = None, columnNameForModelRanking: str = None, rankMax=True) -> Tuple[pd.DataFrame, pd.DataFrame]:
+        return self.compareModels(modelFactories, useCrossValidation=True, resultWriter=resultWriter, writePerDatasetResults=writePerDatasetResults,
+            crossValidatorParams=crossValidatorParams,
+            columnNameForModelRanking=columnNameForModelRanking, rankMax=rankMax)
+
+    def compareModels(self, modelFactories: Sequence[Callable[[], VectorModel]], useCrossValidation=False,
+            resultWriter: Optional[ResultWriter] = None, writePerDatasetResults=True,
+            evaluatorParams: Optional[Union[VectorRegressionModelEvaluatorParams, VectorClassificationModelEvaluatorParams, Dict[str, Any]]] = None,
+            crossValidatorParams: Optional[Union[VectorModelCrossValidatorParams, Dict[str, Any]]] = None,
+            columnNameForModelRanking: str = None, rankMax=True) -> Tuple[pd.DataFrame, pd.DataFrame]:
         """
-        :param modelFactories: a sequence of factory functions for the creation of models to evaluate
+        :param modelFactories: a sequence of factory functions for the creation of models to evaluate; every factory must result
+            in a model with a fixed model name (otherwise results cannot be correctly aggregated)
+        :param useCrossValidation: whether to use cross-validation (rather than a single split) for model evaluation
         :param resultWriter: a writer with which to store results
         :param writePerDatasetResults: whether to use resultWriter (if not None) in order to generate detailed results for each
             dataset in a subdirectory named according to the name of the dataset
-        :param crossValidatorParams: parameters to use for the instantiation of cross-validators
+        :param evaluatorParams: parameters to use for the instantiation of evaluators (relevant if useCrossValidation==False)
+        :param crossValidatorParams: parameters to use for the instantiation of cross-validators (relevant if useCrossValidation==True)
         :param columnNameForModelRanking: column name to use for ranking models
         :param rankMax: if true, use max for ranking, else min
-        :return: a pair of data frames (allDF, meanDF) where allDF contains all the individual cross-validation results
-            for every dataset and meanDF contains one row for each model with results averaged across datasets
+        :return: a pair of data frames (allDF, meanDF) where allDF contains all the individual evaluation results (one row per data set)
+            and meanDF contains one row for each model with results averaged across datasets
         """
         allResults = pd.DataFrame()
         for key, inputOutputData in self.inputOutputDataDict.items():
@@ -389,9 +410,10 @@ def compareModelsCrossValidation(self, modelFactories: Sequence[Callable[[], Vec
                 isRegression = False
             else:
                 raise ValueError("The models have to be either all regression models or all classification, not a mixture")
-            ev = createEvaluationUtil(inputOutputData, isRegression=isRegression, crossValidatorParams=crossValidatorParams)
-            childResultWriter = resultWriter.childForSubdirectory(key) if writePerDatasetResults else None
-            df = ev.compareModelsCrossValidation(models, resultWriter=childResultWriter)
+            ev = createEvaluationUtil(inputOutputData, isRegression=isRegression, evaluatorParams=evaluatorParams,
+                crossValidatorParams=crossValidatorParams)
+            childResultWriter = resultWriter.childForSubdirectory(key) if (writePerDatasetResults and resultWriter is not None) else None
+            df = ev.compareModels(models, useCrossValidation=useCrossValidation, resultWriter=childResultWriter)
             df[self.keyName] = key
             df["modelName"] = df.index
             if columnNameForModelRanking is not None:
@@ -404,6 +426,8 @@ def compareModelsCrossValidation(self, modelFactories: Sequence[Callable[[], Vec
                     df["bestModel"].loc[df[columnNameForModelRanking].idxmin()] = 1
             df = df.reset_index(drop=True)
             allResults = pd.concat((allResults, df))
+        if self.metaDF is not None:
+            allResults = allResults.join(self.metaDF, on=self.keyName, how="left")
         strAllResults = f"All results:\n{allResults.to_string()}"
         log.info(strAllResults)
         meanResults = allResults.groupby("modelName").mean()
diff --git a/src/sensai/evaluation/evaluator.py b/src/sensai/evaluation/evaluator.py
index 4f39d0e7..8ad78414 100644
--- a/src/sensai/evaluation/evaluator.py
+++ b/src/sensai/evaluation/evaluator.py
@@ -319,7 +319,7 @@ class VectorClassificationModelEvaluationData(VectorModelEvaluationData[Classifi
 class VectorClassificationModelEvaluatorParams(VectorModelEvaluatorParams):
     def __init__(self, dataSplitter: DataSplitter = None, fractionalSplitTestFraction: float = None, fractionalSplitRandomSeed=42,
             fractionalSplitShuffle=True, additionalMetrics: Sequence[ClassificationMetric] = None,
-            computeProbabilities: bool = False):
+            computeProbabilities: bool = False, binaryPositiveLabel=None):
         """
         :param dataSplitter: [if test data must be obtained via split] a splitter to use in order to obtain; if None, must specify
             fractionalSplitTestFraction for fractional split (default)
@@ -334,6 +334,7 @@ def __init__(self, dataSplitter: DataSplitter = None, fractionalSplitTestFractio
             fractionalSplitShuffle=fractionalSplitShuffle)
         self.additionalMetrics = additionalMetrics
         self.computeProbabilities = computeProbabilities
+        self.binaryPositiveLabel = binaryPositiveLabel
 
     @classmethod
     def fromOldKwArgs(cls, dataSplitter=None, testFraction=None,
@@ -382,7 +383,7 @@ def _evalModel(self, model: VectorClassificationModel, data: InputOutputData) ->
             raise ValueError(f"Expected a classification model, got {model}")
         predictions, predictions_proba, groundTruth = self._computeOutputs(model, data)
         evalStats = ClassificationEvalStats(y_predictedClassProbabilities=predictions_proba, y_predicted=predictions, y_true=groundTruth,
-            labels=model.getClassLabels(), additionalMetrics=self.params.additionalMetrics)
+            labels=model.getClassLabels(), additionalMetrics=self.params.additionalMetrics, binaryPositiveLabel=self.params.binaryPositiveLabel)
         predictedVarName = model.getPredictedVariableNames()[0]
         return VectorClassificationModelEvaluationData({predictedVarName: evalStats}, data.inputs, model)
 
diff --git a/src/sensai/sklearn/sklearn_base.py b/src/sensai/sklearn/sklearn_base.py
index 9c8023fe..d27f7df4 100644
--- a/src/sensai/sklearn/sklearn_base.py
+++ b/src/sensai/sklearn/sklearn_base.py
@@ -8,6 +8,7 @@
 import pandas as pd
 from sklearn import compose
 
+from ..util.pickle import setstate
 from ..vector_model import VectorRegressionModel, VectorClassificationModel
 
 log = logging.getLogger(__name__)
@@ -177,21 +178,27 @@ def _predictSkLearn(self, inputs: pd.DataFrame) -> pd.DataFrame:
 
 
 class AbstractSkLearnVectorClassificationModel(VectorClassificationModel, ABC):
-    def __init__(self, modelConstructor, **modelArgs):
+    def __init__(self, modelConstructor, useComputedClassWeights=False, **modelArgs):
         """
         :param modelConstructor: the sklearn model constructor
         :param modelArgs: arguments to be passed to the sklearn model constructor
+        :param useComputedClassWeights: whether to compute class weights from the training data that is given and pass it on to the
+            classifier's fit method; weighted data points may not be supported for all types of models
         """
         super().__init__()
         self.modelConstructor = modelConstructor
         self.sklearnInputTransformer = None
         self.sklearnOutputTransformer = None
         self.modelArgs = modelArgs
+        self.useComputedClassWeights = useComputedClassWeights
         self.model = None
 
+    def __setstate__(self, state):
+        setstate(AbstractSkLearnVectorClassificationModel, self, state, newDefaultProperties={"useComputedClassWeights": False})
+
     def _toStringExcludes(self) -> List[str]:
         return super()._toStringExcludes() + ["modelConstructor", "sklearnInputTransformer", "sklearnOutputTransformer",
-                                              "modelArgs", "model"]
+            "modelArgs", "model"]
 
     def _toStringAdditionalEntries(self) -> Dict[str, Any]:
         d = super()._toStringAdditionalEntries()
@@ -231,7 +238,13 @@ def _fitClassifier(self, inputs: pd.DataFrame, outputs: pd.DataFrame):
         self._updateModelArgs(inputs, outputs)
         self.model = createSkLearnModel(self.modelConstructor, self.modelArgs, self.sklearnOutputTransformer)
         log.info(f"Fitting sklearn classifier of type {self.model.__class__.__name__}")
-        self.model.fit(inputValues, np.ravel(outputs.values))
+        kwargs = {}
+        if self.useComputedClassWeights:
+            class2weight = self._computeClassWeights(outputs)
+            classes = outputs.iloc[:, 0]
+            weights = [class2weight[cls] for cls in classes]
+            kwargs["sample_weight"] = np.array(weights)
+        self.model.fit(inputValues, np.ravel(outputs.values), **kwargs)
 
     def _transformInput(self, inputs: pd.DataFrame, fit=False) -> np.ndarray:
         inputValues = inputs.values
@@ -258,3 +271,13 @@ def get_params(self, deep=True):
     def set_params(self, **params):
         self.model.set_params(**params)
 
+    def _computeClassWeights(self, outputs: pd.DataFrame):
+        """
+        :param outputs: the output data frame containing the class labels as the first column
+        :return: the dictionary of class weights mapping class to weight value
+        """
+        classes: pd.Series = outputs.iloc[:,0]
+        counts = classes.value_counts()
+        rfreqs = counts / counts.sum()
+        weights: pd.Series = 1.0 / rfreqs
+        return weights.to_dict()
\ No newline at end of file
diff --git a/src/sensai/sklearn/sklearn_classification.py b/src/sensai/sklearn/sklearn_classification.py
index 49e8c14f..e32d7d9d 100644
--- a/src/sensai/sklearn/sklearn_classification.py
+++ b/src/sensai/sklearn/sklearn_classification.py
@@ -19,9 +19,11 @@ def __init__(self, min_samples_leaf=8, random_state=42, **modelArgs):
 
 
 class SkLearnRandomForestVectorClassificationModel(AbstractSkLearnVectorClassificationModel):
-    def __init__(self, min_samples_leaf=8, random_state=42, **modelArgs):
+    def __init__(self, min_samples_leaf=8, random_state=42, useComputedClassWeights=False, **modelArgs):
         super().__init__(sklearn.ensemble.RandomForestClassifier,
-            random_state=random_state, min_samples_leaf=min_samples_leaf, **modelArgs)
+            random_state=random_state, min_samples_leaf=min_samples_leaf,
+            useComputedClassWeights=useComputedClassWeights,
+            **modelArgs)
 
 
 class SkLearnMLPVectorClassificationModel(AbstractSkLearnVectorClassificationModel):
diff --git a/src/sensai/util/aggregation.py b/src/sensai/util/aggregation.py
index 3abf4343..12cf1307 100644
--- a/src/sensai/util/aggregation.py
+++ b/src/sensai/util/aggregation.py
@@ -1,5 +1,5 @@
 import collections
-from typing import Hashable, Dict
+from typing import Hashable, Dict, Optional
 
 from .string import ToStringMixin
 
@@ -39,7 +39,12 @@ def add(self, relativeFrequencyCounter: __qualname__) -> None:
         self.numTotal += relativeFrequencyCounter.numTotal
         self.numRelevant += relativeFrequencyCounter.numRelevant
 
-    def getRelativeFrequency(self) -> float:
+    def getRelativeFrequency(self) -> Optional[float]:
+        """
+        :return: the relative frequency (between 0 and 1) or None if nothing was counted (0 events considered)
+        """
+        if self.numTotal == 0:
+            return None
         return self.numRelevant / self.numTotal
 
 
diff --git a/src/sensai/util/plot.py b/src/sensai/util/plot.py
index e8157667..ca097d65 100644
--- a/src/sensai/util/plot.py
+++ b/src/sensai/util/plot.py
@@ -48,7 +48,7 @@ def plotMatrix(matrix, title, xticklabels: Sequence[str], yticklabels: Sequence[
         rotation_mode="anchor")
 
     # Loop over data dimensions and create text annotations.
-    fmt = '.2f' if normalize else ('.2f' if matrix.dtype == np.float else 'd')
+    fmt = '.4f' if normalize else ('.2f' if matrix.dtype.kind == 'f' else 'd')  # dtype.kind avoids the np.float alias (removed in NumPy 1.24)
     thresh = matrix.max() / 2.
     for i in range(matrix.shape[0]):
         for j in range(matrix.shape[1]):

From 55ee94e0f889b12ca7dd686aa9bd6b5b3e0a556b Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Tue, 26 Apr 2022 22:51:49 +0200
Subject: [PATCH 004/131] Fixed non-relative import

---
 src/sensai/vectoriser.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/sensai/vectoriser.py b/src/sensai/vectoriser.py
index 99b48ebf..ce012fd1 100644
--- a/src/sensai/vectoriser.py
+++ b/src/sensai/vectoriser.py
@@ -4,7 +4,7 @@
 
 import numpy as np
 
-from dcs.sensai.util import LogTime
+from .util import LogTime
 from .util.pickle import setstate
 from .util.string import listString, ToStringMixin
 

From fa49f1336c88a0e9286fe518e01c855ac18e6f63 Mon Sep 17 00:00:00 2001
From: Dominik Jain <dominik.jain@jambit.com>
Date: Fri, 6 May 2022 21:43:50 +0200
Subject: [PATCH 005/131] Sync pjm

  commit eff7256df1582821aa40e70ea2b79ce14b7afe51
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Fri May 6 14:46:14 2022 +0200

      Plot: Added methods: title, ylim, xlim

  sensai/util/plot.py

  commit 37577fa16fe18fa819100a7477ab3e6482064843
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Fri May 6 13:21:49 2022 +0200

      SkLearnTransformerFactoryFactory: Added MinMaxScaler, added/improved docstrings

  sensai/data_transformation/sklearn_transformer.py

  commit 8f0401e36f70d2f131a41a09976f2b2e4169672b
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Fri May 6 13:21:13 2022 +0200

      FeatureCollector: Added convenience method getCategoricalFeatureNameRegex

  sensai/featuregen.py

  commit d708151fab258d4c32887e0f0e61be4542104d12
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Fri May 6 11:49:30 2022 +0200

      LightGBMVectorClassificationModel: Added parameters

  sensai/lightgbm.py

  commit 6415f7b5f285ade8c882a35489d54a677cb7c09e
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Fri May 6 11:24:18 2022 +0200

      MultiDataEvaluationUtil: Fixed ranking/sorting of results data frames

  sensai/evaluation/eval_util.py

  commit 55159e296d75973a31f4f6d198b78984721ba70c
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Thu May 5 11:26:56 2022 +0200

      MultiDataEvaluationUtil.compareModels: Added further aggregations (std, min, max)

  sensai/evaluation/eval_util.py

  commit acbb5c276425dcae7d52d2c028d2b582b7605afc
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Thu May 5 11:10:33 2022 +0200

       * EvaluationUtil.compareModels: Exclude evalStats column from reported text
       * MultiDataEvaluationUtil.compareModels: Report number of data sets being averaged

  sensai/evaluation/eval_util.py

  commit 269030665b52d2634cf2fea24e93138056b8605b
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Tue May 3 19:36:46 2022 +0200

      Added helper function checkNotNaNDict

  sensai/util/helper.py

  commit 2d49ac28f704838f48014bb9d62f38a1f5d8ec46
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Tue May 3 19:18:17 2022 +0200

      MultiDataEvaluationUtil.compareModels: Added parameter createCombinedEvalStatsPlots (default False), because combination
      of EvalStats objects not always possible (particularly classification without a fixed set of classes throughout)

  sensai/evaluation/eval_util.py

  commit 7295fddd8d802a7cd2f57a92e03275e27c570f00
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Mon May 2 20:05:29 2022 +0200

       * Added representation of true/false positive/negative counts in binary classification: BinaryClassificationCounts
       * Added BinaryClassificationProbabilityThresholdVariationData to capture the variation of counts with the probability threshold
       * Added plots that illustrate these variations (counts, precision-recall + F1)

  sensai/evaluation/eval_stats/eval_stats_classification.py
  sensai/evaluation/eval_util.py

  commit 330455f5e0bec337fa98ef706d83681ecdbaee53
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Mon May 2 17:13:18 2022 +0200

      Reified plots generated from EvalStats (EvalStatsPlot) in order to simplify plot collection
      in evaluation utils (EvalStatsPlotCollector)

  sensai/evaluation/eval_stats/eval_stats_base.py
  sensai/evaluation/eval_stats/eval_stats_classification.py
  sensai/evaluation/eval_stats/eval_stats_regression.py
  sensai/evaluation/eval_util.py

  commit 4feadafe63a14309cd8ff2496100728962db1ab5
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Mon May 2 11:27:00 2022 +0200

      MultiDataEvaluationUtil: Improved logging

  sensai/evaluation/eval_util.py

  commit a8243a37e1b46c83b963d9f6fc90169cba81b3ca
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Mon May 2 11:23:38 2022 +0200

      PickleCached, cached: Added option to not load persisted result (as alternative to deleting the cache file)

  sensai/util/cache.py

  commit 50d920f9f31a825fdad7c627647ee098631f7d90
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Fri Apr 29 17:26:19 2022 +0200

      Minor logging improvement

  sensai/evaluation/eval_util.py

  commit 5ff94e0db03ccd74a670f552fc6d3a4ac4d5f83b
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Fri Apr 29 16:46:11 2022 +0200

      Added function timeOfDay

  sensai/util/time.py

  commit a698981d4d211255369d8d55591f9a7d4a1d1399
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Fri Apr 29 16:44:35 2022 +0200

      featuregen:
        * MultiFeatureGenerator: Added check for duplicate feature generation
        * Added new base classes for feature generators that generate values from a
          single column:
                - FeatureGeneratorMapColumn (1:1 mapping)
                - FeatureGeneratorMapColumnDict (1:n mapping)

  sensai/featuregen.py

  commit 9512bbd4ef0cde503402f1682c44059ca3609885
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Fri Apr 29 15:10:37 2022 +0200

      EvalStatsCollection: Added check for consistency of set of metrics contained in eval stats list

  sensai/evaluation/eval_stats/eval_stats_base.py

  commit 2aa5e095f8542a529c391080346f41d6e7025819
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Fri Apr 29 12:35:35 2022 +0200

      BinaryClassificationMetricPrecision: Configured zero-division behaviour (assume 0 precision)

  sensai/evaluation/eval_stats/eval_stats_classification.py

  commit 67bd7d5f564b22a5283345b6fe5a9d916912772b
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Fri Apr 29 12:12:36 2022 +0200

      * EvaluationUtil.compareModels: Allow EvalStats objects to be returned

      * MultiDataEvaluationUtil.compareModels: Added generation of plots from combined
        EvalStats objects of all data sets per model type (for classification, to be
        generalised)

  sensai/evaluation/eval_util.py

  commit a8c2bbbec017adbc22f42af160c54d2905976e9a
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Fri Apr 29 12:08:30 2022 +0200

      ClassificationEvalStatsCollection.getGlobalStats: Fixed: Only predictions and ground truth values
      were aggregated, other parameters were not considered for construction of combined EvalStats

  sensai/evaluation/eval_stats/eval_stats_classification.py

  commit 887e30bbcbe8e145f870bc1b086a9140f1a8abdd
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Fri Apr 29 11:07:50 2022 +0200

      Classification metrics: Added balanced accuracy and F1 (both included by default)

  sensai/evaluation/eval_stats/eval_stats_classification.py

  commit dc6a7aea454761087e7073aa050ccf1718648f18
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Fri Apr 29 11:01:46 2022 +0200

      Classification metrics: Changed names to lower case

  sensai/evaluation/eval_stats/eval_stats_classification.py

  commit 39d96470f950753cc5473778e99e81552992e0e2
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Thu Apr 28 15:54:28 2022 +0200

      listString: Added option to quote list elements

  sensai/util/string.py

  commit 503eb940a11ff252e239097453bf1223da125c72
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Thu Apr 28 14:38:45 2022 +0200

      Added util functions for reading/writing line-based text files

  sensai/util/io.py

  commit 84fdf1f3b886309801cfdda02be02647a2319111
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Wed Apr 27 16:53:51 2022 +0200

      ClassificationEvaluationUtil: Added plot of regular confusion matrix (with abs. numbers)

  sensai/evaluation/eval_util.py

  commit 4e77ac41ac454a2904d70f2eda800b01f07a55a1
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Wed Apr 27 16:51:47 2022 +0200

      LightGBMVectorClassificationModel: Added useComputedClassWeights constructor parameter

  sensai/lightgbm.py

  commit 8ad1b7800fb2b63193f791fada21fbd32bccbff8
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Wed Apr 27 11:50:14 2022 +0200

      ToStringMixin: More flexible inclusion mechanism which now allows empty
      list of inclusions (user override of _toStringIncludes with empty list returned)

  sensai/util/string.py

  commit f13afae4a46bd304e0835e9e8cb3806575539729
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Wed Apr 27 11:09:19 2022 +0200

      Fixed precision-recall plot axis labels

  sensai/evaluation/eval_stats/eval_stats_classification.py
---
 .../sklearn_transformer.py                    |  15 +-
 .../evaluation/eval_stats/eval_stats_base.py  |  23 +-
 .../eval_stats/eval_stats_classification.py   | 190 ++++++++++++--
 .../eval_stats/eval_stats_regression.py       |  21 +-
 src/sensai/evaluation/eval_util.py            | 235 +++++++++++++-----
 src/sensai/featuregen.py                      |  70 +++++-
 src/sensai/lightgbm.py                        |  18 +-
 src/sensai/util/cache.py                      |  29 ++-
 src/sensai/util/helper.py                     |  13 +-
 src/sensai/util/io.py                         |  38 ++-
 src/sensai/util/plot.py                       |   9 +
 src/sensai/util/string.py                     |  33 ++-
 src/sensai/util/time.py                       |   8 +
 13 files changed, 598 insertions(+), 104 deletions(-)

diff --git a/src/sensai/data_transformation/sklearn_transformer.py b/src/sensai/data_transformation/sklearn_transformer.py
index f3d081a3..fe73033e 100644
--- a/src/sensai/data_transformation/sklearn_transformer.py
+++ b/src/sensai/data_transformation/sklearn_transformer.py
@@ -2,7 +2,7 @@
 import logging
 from typing import Optional, Sequence, Union, Any, Callable
 
-from sklearn.preprocessing import MaxAbsScaler, StandardScaler, RobustScaler
+from sklearn.preprocessing import MaxAbsScaler, StandardScaler, RobustScaler, MinMaxScaler
 import numpy as np
 from typing_extensions import Protocol
 
@@ -59,6 +59,10 @@ class SkLearnTransformerFactoryFactory:
     def MaxAbsScaler() -> Callable[[], MaxAbsScaler]:
         return MaxAbsScaler
 
+    @staticmethod
+    def MinMaxScaler() -> Callable[[], MinMaxScaler]:
+        return MinMaxScaler
+
     @staticmethod
     def StandardScaler(with_mean=True, with_std=True) -> Callable[[], StandardScaler]:
         return functools.partial(StandardScaler, with_mean=with_mean, with_std=with_std)
@@ -74,10 +78,15 @@ def RobustScaler(quantile_range=(25, 75), with_scaling=True, with_centering=True
             `min` being mapped to -1 and `max` being mapped to 1.
         :param with_scaling: whether to apply scaling based on quantile_range.
         :param with_centering: whether to apply centering by subtracting the median.
-        :return: a function, which when called without any arguments, produces the respective RobustScaler instace.
+        :return: a function, which when called without any arguments, produces the respective RobustScaler instance.
         """
         return functools.partial(RobustScaler, quantile_range=quantile_range, with_scaling=with_scaling, with_centering=with_centering)
 
     @staticmethod
-    def ManualScaler(centre: Optional[float] = None, scale: Optional[float] = None):
+    def ManualScaler(centre: Optional[float] = None, scale: Optional[float] = None) -> Callable[[], ManualScaler]:
+        """
+        :param centre: the value to subtract from all values (if any)
+        :param scale: the value with which to scale all values (after removing the centre)
+        :return: a function, which when called without any arguments, produces the respective scaler instance.
+        """
         return functools.partial(ManualScaler, centre=centre, scale=scale)
\ No newline at end of file
diff --git a/src/sensai/evaluation/eval_stats/eval_stats_base.py b/src/sensai/evaluation/eval_stats/eval_stats_base.py
index 48ee2cc9..af6d1080 100644
--- a/src/sensai/evaluation/eval_stats/eval_stats_base.py
+++ b/src/sensai/evaluation/eval_stats/eval_stats_base.py
@@ -72,7 +72,17 @@ def computeValueForEvalStats(self, evalStats: TEvalStats) -> float:
 class EvalStatsCollection(Generic[TEvalStats], ABC):
     def __init__(self, evalStatsList: List[TEvalStats]):
         self.statsList = evalStatsList
-        metricsList = [es.getAll() for es in evalStatsList]
+        metricNamesSet = None
+        metricsList = []
+        for es in evalStatsList:
+            metrics = es.getAll()
+            currentMetricNamesSet = set(metrics.keys())
+            if metricNamesSet is None:
+                metricNamesSet = currentMetricNamesSet
+            else:
+                if metricNamesSet != currentMetricNamesSet:
+                    raise Exception(f"Inconsistent set of metrics in evaluation stats collection: Got {metricNamesSet} for one instance, {currentMetricNamesSet} for another")
+            metricsList.append(metrics)
         metricNames = sorted(metricsList[0].keys())
         self.metrics = {metric: [d[metric] for d in metricsList] for metric in metricNames}
 
@@ -206,3 +216,14 @@ def meanStats(evalStatsList: Sequence[EvalStats]) -> Dict[str, float]:
     dicts = [s.getAll() for s in evalStatsList]
     metrics = dicts[0].keys()
     return {m: np.mean([d[m] for d in dicts]) for m in metrics}
+
+
+class EvalStatsPlot(Generic[TEvalStats], ABC):
+    @abstractmethod
+    def createFigure(self, evalStats: TEvalStats, subtitle: str) -> Optional[plt.Figure]:
+        """
+        :param evalStats: the evaluation stats from which to generate the plot
+        :param subtitle: the plot's subtitle
+        :return: the figure or None if this plot is not applicable/cannot be created
+        """
+        pass
diff --git a/src/sensai/evaluation/eval_stats/eval_stats_classification.py b/src/sensai/evaluation/eval_stats/eval_stats_classification.py
index f5dd9a7e..8db7806c 100644
--- a/src/sensai/evaluation/eval_stats/eval_stats_classification.py
+++ b/src/sensai/evaluation/eval_stats/eval_stats_classification.py
@@ -1,14 +1,17 @@
 from abc import ABC, abstractmethod
-from typing import List, Sequence
+from dataclasses import dataclass
+from typing import List, Sequence, Optional
 import logging
 
 from matplotlib import pyplot as plt
 import numpy as np
 import pandas as pd
 import sklearn
-from sklearn.metrics import confusion_matrix, accuracy_score, precision_score, recall_score, precision_recall_curve, PrecisionRecallDisplay
+from sklearn.metrics import confusion_matrix, accuracy_score, precision_score, recall_score, precision_recall_curve, PrecisionRecallDisplay, \
+    balanced_accuracy_score, f1_score
 
-from .eval_stats_base import PredictionArray, PredictionEvalStats, EvalStatsCollection, Metric
+from .eval_stats_base import PredictionArray, PredictionEvalStats, EvalStatsCollection, Metric, EvalStatsPlot, TEvalStats
+from ...util.pickle import getstate
 from ...util.plot import plotMatrix
 
 
@@ -34,14 +37,21 @@ def _computeValue(self, y_true, y_predicted, y_predictedClassProbabilities):
 
 
 class ClassificationMetricAccuracy(ClassificationMetric):
-    name = "Accuracy"
+    name = "accuracy"
 
     def _computeValue(self, y_true, y_predicted, y_predictedClassProbabilities):
         return accuracy_score(y_true=y_true, y_pred=y_predicted)
 
 
+class ClassificationMetricBalancedAccuracy(ClassificationMetric):
+    name = "balancedAccuracy"
+
+    def _computeValue(self, y_true, y_predicted, y_predictedClassProbabilities):
+        return balanced_accuracy_score(y_true=y_true, y_pred=y_predicted)
+
+
 class ClassificationMetricGeometricMeanOfTrueClassProbability(ClassificationMetric):
-    name = "GeoMeanTrueClassProb"
+    name = "geoMeanTrueClassProb"
     requiresProbabilities = True
 
     def _computeValue(self, y_true, y_predicted, y_predictedClassProbabilities):
@@ -62,7 +72,7 @@ class ClassificationMetricTopNAccuracy(ClassificationMetric):
 
     def __init__(self, n: int):
         self.n = n
-        super().__init__(name=f"Top{n}Accuracy")
+        super().__init__(name=f"top{n}Accuracy")
 
     def _computeValue(self, y_true, y_predicted, y_predictedClassProbabilities):
         labels = y_predictedClassProbabilities.columns
@@ -81,17 +91,17 @@ def __init__(self, positiveClassLabel, name: str = None):
 
 
 class BinaryClassificationMetricPrecision(BinaryClassificationMetric):
-    name = "Precision"
+    name = "precision"
 
     def __init__(self, positiveClassLabel):
         super().__init__(positiveClassLabel)
 
     def _computeValue(self, y_true, y_predicted, y_predictedClassProbabilities):
-        return precision_score(y_true, y_predicted, pos_label=self.positiveClassLabel)
+        return precision_score(y_true, y_predicted, pos_label=self.positiveClassLabel, zero_division=0)
 
 
 class BinaryClassificationMetricRecall(BinaryClassificationMetric):
-    name = "Recall"
+    name = "recall"
 
     def __init__(self, positiveClassLabel):
         super().__init__(positiveClassLabel)
@@ -100,6 +110,16 @@ def _computeValue(self, y_true, y_predicted, y_predictedClassProbabilities):
         return recall_score(y_true, y_predicted, pos_label=self.positiveClassLabel)
 
 
+class BinaryClassificationMetricF1Score(BinaryClassificationMetric):
+    name = "F1"
+
+    def __init__(self, positiveClassLabel):
+        super().__init__(positiveClassLabel)
+
+    def _computeValue(self, y_true, y_predicted, y_predictedClassProbabilities):
+        return f1_score(y_true, y_predicted, pos_label=self.positiveClassLabel)
+
+
 class ClassificationEvalStats(PredictionEvalStats["ClassificationMetric"]):
     def __init__(self, y_predicted: PredictionArray = None,
             y_true: PredictionArray = None,
@@ -147,11 +167,13 @@ def __init__(self, y_predicted: PredictionArray = None,
         self.isBinary = binaryPositiveLabel is not None
 
         if metrics is None:
-            metrics = [ClassificationMetricAccuracy(), ClassificationMetricGeometricMeanOfTrueClassProbability()]
+            metrics = [ClassificationMetricAccuracy(), ClassificationMetricBalancedAccuracy(),
+                ClassificationMetricGeometricMeanOfTrueClassProbability()]
             if self.isBinary:
                 metrics.extend([
                     BinaryClassificationMetricPrecision(self.binaryPositiveLabel),
-                    BinaryClassificationMetricRecall(self.binaryPositiveLabel)])
+                    BinaryClassificationMetricRecall(self.binaryPositiveLabel),
+                    BinaryClassificationMetricF1Score(self.binaryPositiveLabel)])
 
         metrics = list(metrics)
         if additionalMetrics is not None:
@@ -161,9 +183,20 @@ def __init__(self, y_predicted: PredictionArray = None,
 
         super().__init__(y_predicted, y_true, metrics, additionalMetrics=additionalMetrics)
 
+        # transient members
+        self._binaryClassificationProbabilityThresholdVariationData = None
+
+    def __getstate__(self):
+        return getstate(ClassificationEvalStats, self, transientProperties=["_binaryClassificationProbabilityThresholdVariationData"])
+
     def getConfusionMatrix(self) -> "ConfusionMatrix":
         return ConfusionMatrix(self.y_true, self.y_predicted)
 
+    def getBinaryClassificationProbabilityThresholdVariationData(self) -> "BinaryClassificationProbabilityThresholdVariationData":
+        if self._binaryClassificationProbabilityThresholdVariationData is None:
+            self._binaryClassificationProbabilityThresholdVariationData = BinaryClassificationProbabilityThresholdVariationData(self)
+        return self._binaryClassificationProbabilityThresholdVariationData
+
     def getAccuracy(self):
         return self.computeMetricValue(ClassificationMetricAccuracy())
 
@@ -191,8 +224,8 @@ def plotPrecisionRecallCurve(self, titleAdd: str = None):
         disp = PrecisionRecallDisplay(precision, recall)
         disp.plot()
         ax: plt.Axes = disp.ax_
-        ax.set_xlabel("precision")
-        ax.set_ylabel("recall")
+        ax.set_xlabel("recall")
+        ax.set_ylabel("precision")
         title = "Precision-Recall Curve"
         if titleAdd is not None:
             title += "\n" + titleAdd
@@ -212,7 +245,11 @@ def getGlobalStats(self) -> ClassificationEvalStats:
         if self.globalStats is None:
             y_true = np.concatenate([evalStats.y_true for evalStats in self.statsList])
             y_predicted = np.concatenate([evalStats.y_predicted for evalStats in self.statsList])
-            self.globalStats = ClassificationEvalStats(y_predicted, y_true)
+            es0 = self.statsList[0]
+            hasProbs = es0.y_predictedClassProbabilities is not None  # probabilities are optional; y_probs must be bound either way
+            y_probs = pd.concat([evalStats.y_predictedClassProbabilities for evalStats in self.statsList]) if hasProbs else None
+            self.globalStats = ClassificationEvalStats(y_predicted=y_predicted, y_true=y_true, y_predictedClassProbabilities=y_probs,
+                labels=es0.labels, binaryPositiveLabel=es0.binaryPositiveLabel, metrics=es0.metrics)
         return self.globalStats
 
 
@@ -226,3 +263,128 @@ def plot(self, normalize=True, titleAdd: str = None):
         return plotMatrix(self.confusionMatrix, title, self.labels, self.labels, 'true class', 'predicted class', normalize=normalize,
             titleAdd=titleAdd)
 
+
+class BinaryClassificationCounts:
+    def __init__(self, isPositivePrediction: Sequence[bool], isPositiveGroundTruth: Sequence[bool], zeroDenominatorMetricValue=0):
+        """
+        :param isPositivePrediction: the sequence of Booleans indicating whether the model predicted the positive class
+        :param isPositiveGroundTruth: the sequence of Booleans indicating whether the true class is the positive class
+        :param zeroDenominatorMetricValue: the result to return for metrics such as precision and recall in case the denominator
+            is zero (i.e. zero counted cases)
+        """
+        self.zeroDenominatorMetricValue = zeroDenominatorMetricValue
+        self.tp = 0
+        self.tn = 0
+        self.fp = 0
+        self.fn = 0
+        for predPositive, gtPositive in zip(isPositivePrediction, isPositiveGroundTruth):
+            if gtPositive:
+                if predPositive:
+                    self.tp += 1
+                else:
+                    self.fn += 1
+            else:
+                if predPositive:
+                    self.fp += 1
+                else:
+                    self.tn += 1
+
+    @classmethod
+    def fromProbabilityThreshold(cls, probabilities: Sequence[float], threshold: float, isPositiveGroundTruth: Sequence[bool]) -> "BinaryClassificationCounts":
+        return cls([p >= threshold for p in probabilities], isPositiveGroundTruth)
+
+    @classmethod
+    def fromEvalStats(cls, evalStats: ClassificationEvalStats, threshold=0.5) -> "BinaryClassificationCounts":
+        if not evalStats.isBinary:
+            raise ValueError("Probability threshold variation data can only be computed for binary classification problems")
+        if evalStats.y_predictedClassProbabilities is None:
+            raise ValueError("No probability data")
+        posClassLabel = evalStats.binaryPositiveLabel
+        probs = evalStats.y_predictedClassProbabilities[posClassLabel]
+        isPositiveGT = [gtLabel == posClassLabel for gtLabel in evalStats.y_true]
+        return cls.fromProbabilityThreshold(probabilities=probs, threshold=threshold, isPositiveGroundTruth=isPositiveGT)
+
+    def _frac(self, numerator, denominator):
+        if denominator == 0:
+            return self.zeroDenominatorMetricValue
+        return numerator / denominator
+
+    def getPrecision(self):
+        return self._frac(self.tp, self.tp + self.fp)
+
+    def getRecall(self):
+        return self._frac(self.tp, self.tp + self.fn)
+
+    def getF1(self):
+        return self._frac(self.tp, self.tp + 0.5 * (self.fp + self.fn))
+
+
+class BinaryClassificationProbabilityThresholdVariationData:
+    def __init__(self, evalStats: ClassificationEvalStats):
+        self.thresholds = np.linspace(0, 1, 101)
+        self.counts: List[BinaryClassificationCounts] = []
+        for threshold in self.thresholds:
+            self.counts.append(BinaryClassificationCounts.fromEvalStats(evalStats, threshold=threshold))
+
+    def plotPrecisionRecall(self, subtitle=None) -> plt.Figure:
+        fig = plt.figure()
+        title = "Probability Threshold-Dependent Precision & Recall"
+        if subtitle is not None:
+            title += "\n" + subtitle
+        plt.title(title)
+        plt.xlabel("probability threshold")
+        precision = [c.getPrecision() for c in self.counts]
+        recall = [c.getRecall() for c in self.counts]
+        f1 = [c.getF1() for c in self.counts]
+        plt.plot(self.thresholds, precision, label="precision")
+        plt.plot(self.thresholds, recall, label="recall")
+        plt.plot(self.thresholds, f1, label="F1-score")
+        plt.legend()
+        return fig
+
+    def plotCounts(self, subtitle=None):
+        fig = plt.figure()
+        title = "Probability Threshold-Dependent Counts"
+        if subtitle is not None:
+            title += "\n" + subtitle
+        plt.title(title)
+        plt.xlabel("probability threshold")
+        plt.stackplot(self.thresholds,
+            [c.tp for c in self.counts], [c.tn for c in self.counts], [c.fp for c in self.counts], [c.fn for c in self.counts],
+            labels=["true positives", "true negatives", "false positives", "false negatives"],
+            colors=["#4fa244", "#79c36f", "#a25344", "#c37d6f"])
+        plt.legend()
+        return fig
+
+
+class ClassificationEvalStatsPlot(EvalStatsPlot[ClassificationEvalStats], ABC):
+    pass
+
+
+class ClassificationEvalStatsPlotConfusionMatrix(ClassificationEvalStatsPlot):
+    def __init__(self, normalise=True):
+        self.normalise = normalise
+
+    def createFigure(self, evalStats: ClassificationEvalStats, subtitle: str) -> plt.Figure:
+        return evalStats.plotConfusionMatrix(normalize=self.normalise, titleAdd=subtitle)
+
+
+class ClassificationEvalStatsPlotPrecisionRecall(ClassificationEvalStatsPlot):
+    def createFigure(self, evalStats: ClassificationEvalStats, subtitle: str) -> Optional[plt.Figure]:
+        if not evalStats.isBinary:
+            return None
+        return evalStats.plotPrecisionRecallCurve(titleAdd=subtitle)
+
+
+class ClassificationEvalStatsPlotProbabilityThresholdPrecisionRecall(ClassificationEvalStatsPlot):
+    def createFigure(self, evalStats: ClassificationEvalStats, subtitle: str) -> Optional[plt.Figure]:
+        if not evalStats.isBinary:
+            return None
+        return evalStats.getBinaryClassificationProbabilityThresholdVariationData().plotPrecisionRecall(subtitle=subtitle)
+
+
+class ClassificationEvalStatsPlotProbabilityThresholdCounts(ClassificationEvalStatsPlot):
+    def createFigure(self, evalStats: ClassificationEvalStats, subtitle: str) -> Optional[plt.Figure]:
+        if not evalStats.isBinary:
+            return None
+        return evalStats.getBinaryClassificationProbabilityThresholdVariationData().plotCounts(subtitle=subtitle)
\ No newline at end of file
diff --git a/src/sensai/evaluation/eval_stats/eval_stats_regression.py b/src/sensai/evaluation/eval_stats/eval_stats_regression.py
index 9e8b7a2e..2a8732d9 100644
--- a/src/sensai/evaluation/eval_stats/eval_stats_regression.py
+++ b/src/sensai/evaluation/eval_stats/eval_stats_regression.py
@@ -6,7 +6,7 @@
 from matplotlib.colors import LinearSegmentedColormap
 from typing import List, Sequence, Optional
 
-from .eval_stats_base import PredictionEvalStats, Metric, EvalStatsCollection, PredictionArray
+from .eval_stats_base import PredictionEvalStats, Metric, EvalStatsCollection, PredictionArray, EvalStatsPlot
 
 log = logging.getLogger(__name__)
 
@@ -274,3 +274,22 @@ def getGlobalStats(self) -> RegressionEvalStats:
             y_predicted = np.concatenate([evalStats.y_predicted for evalStats in self.statsList])
             self.globalStats = RegressionEvalStats(y_predicted, y_true)
         return self.globalStats
+
+
+class RegressionEvalStatsPlot(EvalStatsPlot[RegressionEvalStats], ABC):
+    pass
+
+
+class RegressionEvalStatsPlotErrorDistribution(RegressionEvalStatsPlot):
+    def createFigure(self, evalStats: RegressionEvalStats, subtitle: str) -> plt.Figure:
+        return evalStats.plotErrorDistribution(titleAdd=subtitle)
+
+
+class RegressionEvalStatsPlotHeatmapGroundTruthPredictions(RegressionEvalStatsPlot):
+    def createFigure(self, evalStats: RegressionEvalStats, subtitle: str) -> plt.Figure:
+        return evalStats.plotHeatmapGroundTruthPredictions(titleAdd=subtitle)
+
+
+class RegressionEvalStatsPlotScatterGroundTruthPredictions(RegressionEvalStatsPlot):
+    def createFigure(self, evalStats: RegressionEvalStats, subtitle: str) -> plt.Figure:
+        return evalStats.plotScatterGroundTruthPredictions(titleAdd=subtitle)
diff --git a/src/sensai/evaluation/eval_util.py b/src/sensai/evaluation/eval_util.py
index 9309bf9f..79d0bfd8 100644
--- a/src/sensai/evaluation/eval_util.py
+++ b/src/sensai/evaluation/eval_util.py
@@ -5,10 +5,11 @@
 """
 # TODO: provide a notebook (and possibly an rst file) that illustrates standard evaluation scenarios and at the same
 #  time serves as an integration test
-
+import functools
 import logging
 from abc import ABC, abstractmethod
-from typing import Tuple, Dict, Any, Union, Generic, TypeVar, Optional, Sequence, Callable
+from collections import defaultdict
+from typing import Tuple, Dict, Any, Union, Generic, TypeVar, Optional, Sequence, Callable, Set
 
 import matplotlib.figure
 import matplotlib.pyplot as plt
@@ -18,7 +19,11 @@
 from .crossval import VectorModelCrossValidationData, VectorRegressionModelCrossValidationData, \
     VectorClassificationModelCrossValidationData, \
     VectorClassificationModelCrossValidator, VectorRegressionModelCrossValidator, VectorModelCrossValidator, VectorModelCrossValidatorParams
-from .eval_stats.eval_stats_base import EvalStats, EvalStatsCollection
+from .eval_stats import RegressionEvalStatsCollection, ClassificationEvalStatsCollection, RegressionEvalStatsPlotErrorDistribution, \
+    RegressionEvalStatsPlotHeatmapGroundTruthPredictions, RegressionEvalStatsPlotScatterGroundTruthPredictions, \
+    ClassificationEvalStatsPlotConfusionMatrix, ClassificationEvalStatsPlotPrecisionRecall, RegressionEvalStatsPlot, \
+    ClassificationEvalStatsPlotProbabilityThresholdPrecisionRecall, ClassificationEvalStatsPlotProbabilityThresholdCounts
+from .eval_stats.eval_stats_base import EvalStats, EvalStatsCollection, EvalStatsPlot
 from .eval_stats.eval_stats_classification import ClassificationEvalStats
 from .eval_stats.eval_stats_regression import RegressionEvalStats
 from .evaluator import VectorModelEvaluator, VectorModelEvaluationData, VectorRegressionModelEvaluator, \
@@ -33,6 +38,7 @@
 
 TModel = TypeVar("TModel", bound=VectorModel)
 TEvalStats = TypeVar("TEvalStats", bound=EvalStats)
+TEvalStatsPlot = TypeVar("TEvalStatsPlot", bound=EvalStatsPlot)
 TEvalStatsCollection = TypeVar("TEvalStatsCollection", bound=EvalStatsCollection)
 TEvaluator = TypeVar("TEvaluator", bound=VectorModelEvaluator)
 TCrossValidator = TypeVar("TCrossValidator", bound=VectorModelCrossValidator)
@@ -125,15 +131,75 @@ def evalModelViaEvaluator(model: TModel, inputOutputData: InputOutputData, testF
     return ev.performSimpleEvaluation(model, showPlots=True, logResults=True)
 
 
+class EvaluationResultCollector:
+    def __init__(self, showPlots: bool = True, resultWriter: Optional[ResultWriter] = None):
+        self.showPlots = showPlots
+        self.resultWriter = resultWriter
+
+    def addFigure(self, name, fig: matplotlib.figure.Figure):
+        if self.resultWriter is not None:
+            self.resultWriter.writeFigure(name, fig, closeFigure=not self.showPlots)
+
+    def child(self, addedFilenamePrefix):
+        resultWriter = self.resultWriter
+        if resultWriter:
+            resultWriter = resultWriter.childWithAddedPrefix(addedFilenamePrefix)
+        return self.__class__(showPlots=self.showPlots, resultWriter=resultWriter)
+
+
+class EvalStatsPlotCollector(Generic[TEvalStats, TEvalStatsPlot]):
+    def __init__(self):
+        self.plots: Dict[str, EvalStatsPlot] = {}
+        self.disabledPlots: Set[str] = set()
+
+    def addPlot(self, name: str, plot: EvalStatsPlot):
+        self.plots[name] = plot
+
+    def disablePlots(self, *names: str):
+        self.disabledPlots.update(names)
+
+    def createPlots(self, evalStats: EvalStats, subtitle: str, resultCollector: EvaluationResultCollector):
+        knownPlots = set(self.plots.keys())
+        unknownDisabledPlots = self.disabledPlots.difference(knownPlots)
+        if len(unknownDisabledPlots) > 0:
+            log.warning(f"Plots were disabled which are not registered: {unknownDisabledPlots}; known plots: {knownPlots}")
+        for name, plot in self.plots.items():
+            if name not in self.disabledPlots:
+                fig = plot.createFigure(evalStats, subtitle)
+                if fig is not None:
+                    resultCollector.addFigure(name, fig)
+
+
+class RegressionEvalStatsPlotCollector(EvalStatsPlotCollector[RegressionEvalStats, RegressionEvalStatsPlot]):
+    def __init__(self):
+        super().__init__()
+        self.addPlot("error-dist", RegressionEvalStatsPlotErrorDistribution())
+        self.addPlot("heatmap-gt-pred", RegressionEvalStatsPlotHeatmapGroundTruthPredictions())
+        self.addPlot("scatter-gt-pred", RegressionEvalStatsPlotScatterGroundTruthPredictions())
+
+
+class ClassificationEvalStatsPlotCollector(EvalStatsPlotCollector[ClassificationEvalStats, EvalStatsPlot[ClassificationEvalStats]]):
+    def __init__(self):
+        super().__init__()
+        self.addPlot("confusion-matrix-rel", ClassificationEvalStatsPlotConfusionMatrix(normalise=True))
+        self.addPlot("confusion-matrix-abs", ClassificationEvalStatsPlotConfusionMatrix(normalise=False))
+        # the plots below apply to the binary case only (skipped for non-binary case)
+        self.addPlot("precision-recall", ClassificationEvalStatsPlotPrecisionRecall())
+        self.addPlot("threshold-precision-recall", ClassificationEvalStatsPlotProbabilityThresholdPrecisionRecall())
+        self.addPlot("threshold-counts", ClassificationEvalStatsPlotProbabilityThresholdCounts())
+
+
 class EvaluationUtil(ABC, Generic[TModel, TEvaluator, TEvalData, TCrossValidator, TCrossValData, TEvalStats]):
     """
     Utility class for the evaluation of models based on a dataset
     """
     def __init__(self, inputOutputData: InputOutputData,
+            evalStatsPlotCollector: Union[RegressionEvalStatsPlotCollector, ClassificationEvalStatsPlotCollector],
             evaluatorParams: Optional[Union[VectorRegressionModelEvaluatorParams, VectorClassificationModelEvaluatorParams, Dict[str, Any]]] = None,
             crossValidatorParams: Optional[Union[VectorModelCrossValidatorParams, Dict[str, Any]]] = None):
         """
         :param inputOutputData: the data set to use for evaluation
+        :param evalStatsPlotCollector: a collector for plots generated from evaluation stats objects
         :param evaluatorParams: parameters with which to instantiate evaluators
         :param crossValidatorParams: parameters with which to instantiate cross-validators
         """
@@ -144,21 +210,7 @@ def __init__(self, inputOutputData: InputOutputData,
         self.evaluatorParams = evaluatorParams
         self.crossValidatorParams = crossValidatorParams
         self.inputOutputData = inputOutputData
-
-    class ResultCollector:
-        def __init__(self, showPlots: bool = True, resultWriter: Optional[ResultWriter] = None):
-            self.showPlots = showPlots
-            self.resultWriter = resultWriter
-
-        def addFigure(self, name, fig: matplotlib.figure.Figure):
-            if self.resultWriter is not None:
-                self.resultWriter.writeFigure(name, fig, closeFigure=not self.showPlots)
-
-        def child(self, addedFilenamePrefix):
-            resultWriter = self.resultWriter
-            if resultWriter:
-                resultWriter = resultWriter.childWithAddedPrefix(addedFilenamePrefix)
-            return self.__class__(showPlots=self.showPlots, resultWriter=resultWriter)
+        self.evalStatsPlotCollector = evalStatsPlotCollector
 
     def createEvaluator(self, model: TModel = None, isRegression: bool = None) -> TEvaluator:
         """
@@ -249,7 +301,8 @@ def performCrossValidation(self, model: TModel, showPlots=False, logResults=True
         return crossValidationData
 
     def compareModels(self, models: Sequence[TModel], resultWriter: Optional[ResultWriter] = None, useCrossValidation=False,
-            fitModels=True, writeIndividualResults=True, sortColumn: Optional[str] = None, sortAscending: bool = True) -> pd.DataFrame:
+            fitModels=True, writeIndividualResults=True, sortColumn: Optional[str] = None, sortAscending: bool = True,
+            includeEvalStatsObjects=False) -> pd.DataFrame:
         """
         Compares several models via simple evaluation or cross-validation
 
@@ -262,6 +315,8 @@ def compareModels(self, models: Sequence[TModel], resultWriter: Optional[ResultW
             summary)
         :param sortColumn: column/metric name by which to sort
         :param sortAscending: whether to sort in ascending order
+        :param includeEvalStatsObjects: whether to include, in addition to the metrics, a column "evalStats" (which holds
+            the classification or regression evaluation data object) in the result data frame
         :return: a data frame containing evaluation metrics on all models
         """
         statsList = []
@@ -270,11 +325,16 @@ def compareModels(self, models: Sequence[TModel], resultWriter: Optional[ResultW
                 if not fitModels:
                     raise ValueError("Cross-validation necessitates that models be retrained; got fitModels=False")
                 crossValidationResult = self.performCrossValidation(model, resultWriter=resultWriter if writeIndividualResults else None)
-                statsDict = crossValidationResult.getEvalStatsCollection().aggStats()
+                evalStatsCollection = crossValidationResult.getEvalStatsCollection()
+                statsDict = evalStatsCollection.aggStats()
+                if includeEvalStatsObjects:
+                    statsDict["evalStats"] = evalStatsCollection.getGlobalStats()
             else:
                 evalStats: EvalStats = self.performSimpleEvaluation(model, resultWriter=resultWriter if writeIndividualResults else None,
                     fitModel=fitModels).getEvalStats()
                 statsDict = evalStats.getAll()
+                if includeEvalStatsObjects:
+                    statsDict["evalStats"] = evalStats
             statsDict["modelName"] = model.getName()
             statsList.append(statsDict)
         resultsDF = pd.DataFrame(statsList).set_index("modelName")
@@ -283,7 +343,8 @@ def compareModels(self, models: Sequence[TModel], resultWriter: Optional[ResultW
                 log.warning(f"Requested sort column '{sortColumn}' not in list of columns {list(resultsDF.columns)}")
             else:
                 resultsDF.sort_values(sortColumn, ascending=sortAscending, inplace=True)
-        strResults = f"Model comparison results:\n{resultsDF.to_string()}"
+        resultsDFForReporting = resultsDF if not includeEvalStatsObjects else resultsDF.drop(columns="evalStats")
+        strResults = f"Model comparison results:\n{resultsDFForReporting.to_string()}"
         log.info(strResults)
         if resultWriter is not None:
             suffix = "crossval" if useCrossValidation else "simple-eval"
@@ -312,10 +373,10 @@ def createPlots(self, data: Union[TEvalData, TCrossValData], showPlots=True, res
         """
         if not showPlots and resultWriter is None:
             return
-        resultCollector = self.ResultCollector(showPlots=showPlots, resultWriter=resultWriter)
+        resultCollector = EvaluationResultCollector(showPlots=showPlots, resultWriter=resultWriter)
         self._createPlots(data, resultCollector, subtitle=subtitlePrefix + data.modelName)
 
-    def _createPlots(self, data: Union[TEvalData, TCrossValData], resultCollector: ResultCollector, subtitle=None):
+    def _createPlots(self, data: Union[TEvalData, TCrossValData], resultCollector: EvaluationResultCollector, subtitle=None):
 
         def createPlots(predVarName, rc, subt):
             if isinstance(data, VectorModelCrossValidationData):
@@ -333,28 +394,39 @@ def createPlots(predVarName, rc, subt):
             for predictedVarName in predictedVarNames:
                 createPlots(predictedVarName, resultCollector.child(predictedVarName+"-"), f"{predictedVarName}, {subtitle}")
 
-    @abstractmethod
-    def _createEvalStatsPlots(self, evalStats: TEvalStats, resultCollector: ResultCollector, subtitle=None):
+    def _createEvalStatsPlots(self, evalStats: TEvalStats, resultCollector: EvaluationResultCollector, subtitle=None):
         """
         :param evalStats: the evaluation results for which to create plots
         :param resultCollector: the collector to which all plots are to be passed
         :param subtitle: the subtitle to use for generated plots (if any)
         """
-        pass
+        self.evalStatsPlotCollector.createPlots(evalStats, subtitle, resultCollector)
 
 
 class RegressionEvaluationUtil(EvaluationUtil[VectorRegressionModel, VectorRegressionModelEvaluator, VectorRegressionModelEvaluationData, VectorRegressionModelCrossValidator, VectorRegressionModelCrossValidationData, RegressionEvalStats]):
-    def _createEvalStatsPlots(self, evalStats: RegressionEvalStats, resultCollector: EvaluationUtil.ResultCollector, subtitle=None):
-        resultCollector.addFigure("error-dist", evalStats.plotErrorDistribution(titleAdd=subtitle))
-        resultCollector.addFigure("heatmap-gt-pred", evalStats.plotHeatmapGroundTruthPredictions(titleAdd=subtitle))
-        resultCollector.addFigure("scatter-gt-pred", evalStats.plotScatterGroundTruthPredictions(titleAdd=subtitle))
+    def __init__(self, inputOutputData: InputOutputData,
+            evaluatorParams: Optional[Union[VectorRegressionModelEvaluatorParams, Dict[str, Any]]] = None,
+            crossValidatorParams: Optional[Union[VectorModelCrossValidatorParams, Dict[str, Any]]] = None):
+        """
+        :param inputOutputData: the data set to use for evaluation
+        :param evaluatorParams: parameters with which to instantiate evaluators
+        :param crossValidatorParams: parameters with which to instantiate cross-validators
+        """
+        super().__init__(inputOutputData, evalStatsPlotCollector=RegressionEvalStatsPlotCollector(), evaluatorParams=evaluatorParams,
+            crossValidatorParams=crossValidatorParams)
 
 
 class ClassificationEvaluationUtil(EvaluationUtil[VectorClassificationModel, VectorClassificationModelEvaluator, VectorClassificationModelEvaluationData, VectorClassificationModelCrossValidator, VectorClassificationModelCrossValidationData, ClassificationEvalStats]):
-    def _createEvalStatsPlots(self, evalStats: ClassificationEvalStats, resultCollector: EvaluationUtil.ResultCollector, subtitle=None):
-        resultCollector.addFigure("confusion-matrix", evalStats.plotConfusionMatrix(titleAdd=subtitle))
-        if evalStats.isBinary:
-            resultCollector.addFigure("precision-recall", evalStats.plotPrecisionRecallCurve(titleAdd=subtitle))
+    def __init__(self, inputOutputData: InputOutputData,
+            evaluatorParams: Optional[Union[VectorClassificationModelEvaluatorParams, Dict[str, Any]]] = None,
+            crossValidatorParams: Optional[Union[VectorModelCrossValidatorParams, Dict[str, Any]]] = None):
+        """
+        :param inputOutputData: the data set to use for evaluation
+        :param evaluatorParams: parameters with which to instantiate evaluators
+        :param crossValidatorParams: parameters with which to instantiate cross-validators
+        """
+        super().__init__(inputOutputData, evalStatsPlotCollector=ClassificationEvalStatsPlotCollector(), evaluatorParams=evaluatorParams,
+            crossValidatorParams=crossValidatorParams)
 
 
 class MultiDataEvaluationUtil:
@@ -384,7 +456,9 @@ def compareModels(self, modelFactories: Sequence[Callable[[], VectorModel]], use
             resultWriter: Optional[ResultWriter] = None, writePerDatasetResults=True,
             evaluatorParams: Optional[Union[VectorRegressionModelEvaluatorParams, VectorClassificationModelEvaluatorParams, Dict[str, Any]]] = None,
             crossValidatorParams: Optional[Union[VectorModelCrossValidatorParams, Dict[str, Any]]] = None,
-            columnNameForModelRanking: str = None, rankMax=True) -> Tuple[pd.DataFrame, pd.DataFrame]:
+            columnNameForModelRanking: str = None,
+            rankMax=True,
+            createCombinedEvalStatsPlots=False) -> Tuple[pd.DataFrame, pd.DataFrame]:
         """
         :param modelFactories: a sequence of factory functions for the creation of models to evaluate; every factory must result
             in a model with a fixed model name (otherwise results cannot be correctly aggregated)
@@ -396,43 +470,92 @@ def compareModels(self, modelFactories: Sequence[Callable[[], VectorModel]], use
         :param crossValidatorParams: parameters to use for the instantiation of cross-validators (relevant if useCrossValidation==True)
         :param columnNameForModelRanking: column name to use for ranking models
         :param rankMax: if true, use max for ranking, else min
+        :param createCombinedEvalStatsPlots: whether to combine, for each type of model, the EvalStats objects from the individual experiments
+            into a single object that holds all results and use it to create plots reflecting the overall result.
+            Note that for classification, this is only possible if all individual experiments use the same set of class labels.
         :return: a pair of data frames (allDF, meanDF) where allDF contains all the individual evaluation results (one row per data set)
             and meanDF contains one row for each model with results averaged across datasets
         """
         allResults = pd.DataFrame()
-        for key, inputOutputData in self.inputOutputDataDict.items():
-            log.info(f"Evaluating models for {key}")
+        evalStatsByModelName = defaultdict(list)
+        isRegression = None
+        plotCollector: Optional[EvalStatsPlotCollector] = None
+
+        for i, (key, inputOutputData) in enumerate(self.inputOutputDataDict.items(), start=1):
+            log.info(f"Evaluating models for data set #{i}/{len(self.inputOutputDataDict)}: {self.keyName}={key}")
             models = [f() for f in modelFactories]
-            modelsAreRegression = [model.isRegressionModel() for model in models]
-            if all(modelsAreRegression):
-                isRegression = True
-            elif not any(modelsAreRegression):
-                isRegression = False
-            else:
-                raise ValueError("The models have to be either all regression models or all classification, not a mixture")
+
+            if isRegression is None:
+                modelsAreRegression = [model.isRegressionModel() for model in models]
+                if all(modelsAreRegression):
+                    isRegression = True
+                elif not any(modelsAreRegression):
+                    isRegression = False
+                else:
+                    raise ValueError("The models have to be either all regression models or all classification, not a mixture")
+
             ev = createEvaluationUtil(inputOutputData, isRegression=isRegression, evaluatorParams=evaluatorParams,
                 crossValidatorParams=crossValidatorParams)
+
+            if plotCollector is None:
+                plotCollector = ev.evalStatsPlotCollector
+
+            # compute data frame with results for current data set
             childResultWriter = resultWriter.childForSubdirectory(key) if (writePerDatasetResults and resultWriter is not None) else None
-            df = ev.compareModels(models, useCrossValidation=useCrossValidation, resultWriter=childResultWriter)
+            df = ev.compareModels(models, useCrossValidation=useCrossValidation, resultWriter=childResultWriter, includeEvalStatsObjects=True)
+
+            # augment data frame
             df[self.keyName] = key
             df["modelName"] = df.index
-            if columnNameForModelRanking is not None:
-                if columnNameForModelRanking not in df.columns:
-                    raise ValueError(f"Rank metric {columnNameForModelRanking} not contained in columns {df.columns}")
-                df["bestModel"] = 0
-                if rankMax:
-                    df["bestModel"].loc[df[columnNameForModelRanking].idxmax()] = 1
-                else:
-                    df["bestModel"].loc[df[columnNameForModelRanking].idxmin()] = 1
             df = df.reset_index(drop=True)
+
+            # collect eval stats objects by model name and remove from data frame
+            for _, row in df.iterrows():
+                modelName = row.modelName
+                evalStats = row.evalStats
+                evalStatsByModelName[modelName].append(evalStats)
+            df = df.drop(columns="evalStats")
+
             allResults = pd.concat((allResults, df))
+
         if self.metaDF is not None:
             allResults = allResults.join(self.metaDF, on=self.keyName, how="left")
+
         strAllResults = f"All results:\n{allResults.to_string()}"
         log.info(strAllResults)
-        meanResults = allResults.groupby("modelName").mean()
-        strMeanResults = f"Mean results:\n{meanResults.to_string()}"
+
+        allResultsGrouped = allResults.groupby("modelName")
+        meanResults: pd.DataFrame = allResultsGrouped.mean()
+        if columnNameForModelRanking in meanResults:
+            meanResults.sort_values(columnNameForModelRanking, inplace=True, ascending=not rankMax)
+        strMeanResults = f"Mean results (averaged across {len(self.inputOutputDataDict)} data sets):\n{meanResults.to_string()}"
         log.info(strMeanResults)
+
+        # create further aggregations
+        aggDFs = []
+        for opName, aggFn in [("std", lambda x: x.std()), ("min", lambda x: x.min()), ("max", lambda x: x.max())]:
+            aggDF = aggFn(allResultsGrouped)
+            aggDF.columns = [f"{opName}[{c}]" for c in aggDF.columns]
+            aggDFs.append(aggDF)
+        furtherAggsDF = pd.concat(aggDFs, axis=1)
+        furtherAggsDF = furtherAggsDF.loc[meanResults.index]  # apply same sort order (index is modelName)
+        columnOrder = functools.reduce(lambda a, b: a + b, [list(t) for t in zip(*[df.columns for df in aggDFs])])
+        furtherAggsDF = furtherAggsDF[columnOrder]
+        strFurtherAggs = f"Further aggregations:\n{furtherAggsDF.to_string()}"
+        log.info(strFurtherAggs)
+
         if resultWriter is not None:
-            resultWriter.writeTextFile("model-comparison-results", strMeanResults + "\n\n" + strAllResults)
+            resultWriter.writeTextFile("model-comparison-results", strMeanResults + "\n\n" + strFurtherAggs + "\n\n" + strAllResults)
+
+        # create plots from combined data for each model
+        if createCombinedEvalStatsPlots:
+            for modelName, evalStatsList in evalStatsByModelName.items():
+                childResultWriter = resultWriter.childWithAddedPrefix(modelName + "_") if resultWriter is not None else None
+                resultCollector = EvaluationResultCollector(showPlots=False, resultWriter=childResultWriter)
+                if isRegression:
+                    evalStats = RegressionEvalStatsCollection(evalStatsList).getGlobalStats()
+                else:
+                    evalStats = ClassificationEvalStatsCollection(evalStatsList).getGlobalStats()
+                plotCollector.createPlots(evalStats, subtitle=modelName, resultCollector=resultCollector)
+
         return allResults, meanResults
diff --git a/src/sensai/featuregen.py b/src/sensai/featuregen.py
index 67d5c3da..22b86251 100644
--- a/src/sensai/featuregen.py
+++ b/src/sensai/featuregen.py
@@ -297,7 +297,10 @@ def _generateFromMultiple(self, generateFeatures: Callable[[FeatureGenerator], p
         if len(dfs) == 0:
             return pd.DataFrame(index=index)
         else:
-            return pd.concat(dfs, axis=1)
+            combinedDF = pd.concat(dfs, axis=1)
+            if len(combinedDF.columns) != len(set(combinedDF.columns)):
+                raise Exception(f"At least one column was generated more than once: {list(combinedDF.columns)}; check feature generators for correctness!")
+            return combinedDF
 
     def _generate(self, inputDF: pd.DataFrame, ctx=None):
         def generateFeatures(fg: FeatureGenerator):
@@ -736,8 +739,10 @@ def getMultiFeatureGenerator(self) -> MultiFeatureGenerator:
 
     def getNormalizationRules(self, includeGeneratedCategoricalRules=True):
         return self.getMultiFeatureGenerator().getNormalisationRules(
-            includeGeneratedCategoricalRules=includeGeneratedCategoricalRules
-        )
+            includeGeneratedCategoricalRules=includeGeneratedCategoricalRules)
+
+    def getCategoricalFeatureNameRegex(self) -> str:
+        return self.getMultiFeatureGenerator().getCategoricalFeatureNameRegex()
 
     def _createMultiFeatureGenerator(self):
         featureGenerators = []
@@ -802,6 +807,65 @@ def info(self):
         return info
 
 
+class FeatureGeneratorMapColumn(RuleBasedFeatureGenerator, ABC):
+    """
+    Creates a single feature from a single input column by applying a function to each element of the input column
+    """
+    def __init__(self, inputColName: str, featureColName: str, categoricalFeatureNames: Optional[Union[Sequence[str], str]] = None,
+            normalisationRules: Sequence[data_transformation.DFTNormalisation.Rule] = (),
+            normalisationRuleTemplate: data_transformation.DFTNormalisation.RuleTemplate = None, addCategoricalDefaultRules=True):
+        super().__init__(categoricalFeatureNames=categoricalFeatureNames, normalisationRules=normalisationRules,
+            normalisationRuleTemplate=normalisationRuleTemplate, addCategoricalDefaultRules=addCategoricalDefaultRules)
+        self._inputColName = inputColName
+        self._featureColName = featureColName
+
+    def _generate(self, df: pd.DataFrame, ctx=None) -> pd.DataFrame:
+        if self._inputColName not in df.columns:
+            raise ValueError(f"Column '{self._inputColName}' required by feature generator not found in list of columns: {list(df.columns)}")
+        inputSeries = df[self._inputColName]
+        values = inputSeries.apply(self._createValue)
+        return pd.DataFrame({self._featureColName: values}, index=df.index)
+
+    @abstractmethod
+    def _createValue(self, value):
+        """
+        Maps a value from the input column to a feature value
+
+        :param value: a value from the input column
+        :return: the feature value
+        """
+        pass
+
+
+class FeatureGeneratorMapColumnDict(RuleBasedFeatureGenerator, ABC):
+    """
+    Creates an arbitrary number of features from a single input column by applying a function to each element of the input column
+    """
+    def __init__(self, inputColName: str, categoricalFeatureNames: Optional[Union[Sequence[str], str]] = None,
+            normalisationRules: Sequence[data_transformation.DFTNormalisation.Rule] = (),
+            normalisationRuleTemplate: data_transformation.DFTNormalisation.RuleTemplate = None, addCategoricalDefaultRules=True):
+        super().__init__(categoricalFeatureNames=categoricalFeatureNames, normalisationRules=normalisationRules,
+            normalisationRuleTemplate=normalisationRuleTemplate, addCategoricalDefaultRules=addCategoricalDefaultRules)
+        self._inputColName = inputColName
+
+    def _generate(self, df: pd.DataFrame, ctx=None) -> pd.DataFrame:
+        if self._inputColName not in df.columns:
+            raise ValueError(f"Column '{self._inputColName}' required by feature generator not found in list of columns: {list(df.columns)}")
+        inputSeries = df[self._inputColName]
+        values = [self._createFeaturesDict(v) for v in inputSeries]
+        return pd.DataFrame(values, index=df.index)
+
+    @abstractmethod
+    def _createFeaturesDict(self, value) -> Dict[str, Any]:
+        """
+        Maps a value from the input column to a dictionary containing one or more features.
+
+        :param value: a value from the input column
+        :return: a dictionary mapping feature names to values
+        """
+        pass
+
+
 def flattenedFeatureGenerator(fgen: FeatureGenerator, columnsToFlatten: List[str] = None,
                             normalisationRules=(), normalisationRuleTemplate: data_transformation.DFTNormalisation.RuleTemplate = None):
     """
diff --git a/src/sensai/lightgbm.py b/src/sensai/lightgbm.py
index 2c9189aa..4dfb92b8 100644
--- a/src/sensai/lightgbm.py
+++ b/src/sensai/lightgbm.py
@@ -59,7 +59,9 @@ def getFeatureImportances(self) -> Dict[str, Dict[str, int]]:
 class LightGBMVectorClassificationModel(AbstractSkLearnVectorClassificationModel):
     log = log.getChild(__qualname__)
 
-    def __init__(self, categoricalFeatureNames: Sequence[str] = None, random_state=42, num_leaves=31, **modelArgs):
+    def __init__(self, categoricalFeatureNames: Sequence[str] = None, random_state=42, num_leaves=31,
+            max_depth=-1, n_estimators=100, min_child_samples=20, importance_type="gain", useComputedClassWeights=False,
+            **modelArgs):
         """
         :param categoricalFeatureNames: sequence of feature names in the input data that are categorical
             Columns that have dtype 'category' (as will be the case for categorical columns created via FeatureGenerators)
@@ -68,9 +70,19 @@ def __init__(self, categoricalFeatureNames: Sequence[str] = None, random_state=4
             In general, passing categorical features may be preferable to using one-hot encoding, for example.
         :param random_state: the random seed to use
         :param num_leaves: the maximum number of leaves in one tree (original lightgbm default is 31)
-        :param modelArgs: see https://lightgbm.readthedocs.io/en/latest/Parameters.html
+        :param max_depth: maximum tree depth for base learners, <=0 means no limit
+        :param n_estimators: number of boosted trees to fit
+        :param min_child_samples: minimum number of data points needed in a child (leaf)
+        :param importance_type: the type of feature importance to be set in the respective property of the wrapped model.
+            If ‘split’, result contains numbers of times the feature is used in a model.
+            If ‘gain’, result contains total gains of splits which use the feature.
+        :param useComputedClassWeights: whether to compute class weights from the training data that is given and pass them on to the
+            classifier's fit method; weighted data points may not be supported for all types of models
+        :param modelArgs: see https://lightgbm.readthedocs.io/en/latest/pythonapi/lightgbm.LGBMClassifier.html?highlight=LGBMClassifier
         """
-        super().__init__(lightgbm.sklearn.LGBMClassifier, random_state=random_state, num_leaves=num_leaves, **modelArgs)
+        super().__init__(lightgbm.sklearn.LGBMClassifier, random_state=random_state, num_leaves=num_leaves,
+            max_depth=max_depth, n_estimators=n_estimators, min_child_samples=min_child_samples, importance_type=importance_type,
+            useComputedClassWeights=useComputedClassWeights, **modelArgs)
 
         if type(categoricalFeatureNames) == str:
             categoricalFeatureNameRegex = categoricalFeatureNames
diff --git a/src/sensai/util/cache.py b/src/sensai/util/cache.py
index 50a7e100..64cde847 100644
--- a/src/sensai/util/cache.py
+++ b/src/sensai/util/cache.py
@@ -565,7 +565,7 @@ def _computeValue(self, key, data):
 
 
 def cached(fn: Callable[[], T], picklePath, functionName=None, validityCheckFn: Optional[Callable[[T], bool]] = None,
-        backend="pickle", protocol=pickle.HIGHEST_PROTOCOL) -> T:
+        backend="pickle", protocol=pickle.HIGHEST_PROTOCOL, load=True) -> T:
     """
     :param fn: the function whose result is to be cached
     :param picklePath: the path in which to store the cached result
@@ -576,7 +576,8 @@ def cached(fn: Callable[[], T], picklePath, functionName=None, validityCheckFn:
         the function fn is called to compute the result and the cached result is updated.
     :param backend: pickle or joblib
     :param protocol: the pickle protocol version
-    :return: the res (either obtained from the cache or the function)
+    :param load: whether to load a previously persisted result; if False, do not load an old result but store the newly computed result
+    :return: the result (either obtained from the cache or the function)
     """
     if functionName is None:
         functionName = fn.__name__
@@ -588,13 +589,17 @@ def callFnAndCacheResult():
         return res
 
     if os.path.exists(picklePath):
-        log.info(f"Loading cached result of function '{functionName}' from {picklePath}")
-        result = loadPickle(picklePath, backend=backend)
-        if validityCheckFn is not None:
-            if not validityCheckFn(result):
-                log.info(f"Cached result is no longer valid, recomputing ...")
-                result = callFnAndCacheResult()
-        return result
+        if load:
+            log.info(f"Loading cached result of function '{functionName}' from {picklePath}")
+            result = loadPickle(picklePath, backend=backend)
+            if validityCheckFn is not None:
+                if not validityCheckFn(result):
+                    log.info(f"Cached result is no longer valid, recomputing ...")
+                    result = callFnAndCacheResult()
+            return result
+        else:
+            log.info(f"Ignoring previously stored result in {picklePath}, calling function '{functionName}' ...")
+            return callFnAndCacheResult()
     else:
         log.info(f"No cached result found in {picklePath}, calling function '{functionName}' ...")
         return callFnAndCacheResult()
@@ -605,7 +610,7 @@ class PickleCached(object):
     Function decorator for caching function results via pickle
     """
     def __init__(self, cacheBasePath: str, filenamePrefix: str = None, filename: str = None, backend="pickle",
-            protocol=pickle.HIGHEST_PROTOCOL):
+            protocol=pickle.HIGHEST_PROTOCOL, load=True):
         """
         :param cacheBasePath: the directory where the pickle cache file will be stored
         :param filenamePrefix: a prefix of the name of the cache file to be created, to which the function name and, where applicable,
@@ -614,12 +619,14 @@ def __init__(self, cacheBasePath: str, filenamePrefix: str = None, filename: str
         :param filename: the full file name of the cache file to be created; this is admissible only if the function has no arguments
         :param backend: the serialisation backend to use (see dumpPickle)
         :param protocol: the pickle protocol version to use
+        :param load: whether to load a previously persisted result; if False, do not load an old result but store the newly computed result
         """
         self.filename = filename
         self.cacheBasePath = cacheBasePath
         self.filenamePrefix = filenamePrefix
         self.backend = backend
         self.protocol = protocol
+        self.load = load
 
         if self.filenamePrefix is None:
             self.filenamePrefix = ""
@@ -640,7 +647,7 @@ def wrapped(*args, **kwargs):
                     raise Exception("Function called with arguments but full cache filename specified: specify a cache filename prefix only to account for argument values")
                 filename = self.filename
             picklePath = os.path.join(self.cacheBasePath, filename)
-            return cached(lambda: fn(*args, **kwargs), picklePath, functionName=fn.__name__, backend=self.backend)
+            return cached(lambda: fn(*args, **kwargs), picklePath, functionName=fn.__name__, backend=self.backend, load=self.load)
 
         return wrapped
 
diff --git a/src/sensai/util/helper.py b/src/sensai/util/helper.py
index 076b71b0..e818c3e3 100644
--- a/src/sensai/util/helper.py
+++ b/src/sensai/util/helper.py
@@ -1,9 +1,9 @@
 """
 This module contains various helper functions.
 """
+import math
 from typing import Any, Sequence, Union, TypeVar, List
 
-
 T = TypeVar("T")
 
 
@@ -37,6 +37,17 @@ def allNone(*args: Any) -> bool:
     return countNone(*args) == len(args)
 
 
+def checkNotNaNDict(d: dict):
+    """
+    Raises ValueError if any of the values in the given dictionary are NaN, reporting the respective keys
+
+    :param d: a dictionary mapping to floats that are to be checked for NaN
+    """
+    invalidKeys = [k for k, v in d.items() if math.isnan(v)]
+    if len(invalidKeys) > 0:
+        raise ValueError(f"Got one or more NaN values: {invalidKeys}")
+
+
 def markUsed(*args):
     """
     Utility function to mark identifiers as used.
diff --git a/src/sensai/util/io.py b/src/sensai/util/io.py
index e6cf6a11..def4dcf0 100644
--- a/src/sensai/util/io.py
+++ b/src/sensai/util/io.py
@@ -1,6 +1,6 @@
 import logging
 import os
-from typing import Sequence, Optional, Tuple
+from typing import Sequence, Optional, Tuple, List
 
 import matplotlib.figure
 from matplotlib import pyplot as plt
@@ -64,6 +64,12 @@ def writeTextFile(self, filenameSuffix, content):
             f.write(content)
         return p
 
+    def writeTextFileLines(self, filenameSuffix, lines: List[str]):
+        p = self.path(filenameSuffix, extensionToAdd="txt")
+        self.log.info(f"Saving text file {p}")
+        writeTextFileLines(lines, p)
+        return p
+
     def writeDataFrameTextFile(self, filenameSuffix, df: pd.DataFrame):
         p = self.path(filenameSuffix, extensionToAdd="df.txt", validOtherExtensions="txt")
         self.log.info(f"Saving data frame text file {p}")
@@ -75,6 +81,7 @@ def writeDataFrameCsvFile(self, filenameSuffix, df: pd.DataFrame):
         p = self.path(filenameSuffix, extensionToAdd="csv")
         self.log.info(f"Saving data frame CSV file {p}")
         df.to_csv(p)
+        return p
 
     def writeFigure(self, filenameSuffix, fig, closeFigure=False):
         """
@@ -98,3 +105,32 @@ def writePickle(self, filenameSuffix, obj):
         p = self.path(filenameSuffix, extensionToAdd="pickle")
         self.log.info(f"Saving pickle {p}")
         dumpPickle(obj, p)
+        return p
+
+
+def writeTextFileLines(lines: List[str], path):
+    """
+    :param lines: the lines to write (without a trailing newline, which will be added)
+    :param path: the path of the text file to write to
+    """
+    with open(path, "w") as f:
+        for line in lines:
+            f.write(line)
+            f.write("\n")
+
+
+def readTextFileLines(path, strip=True, skipEmpty=True) -> List[str]:
+    """
+    :param path: the path of the text file to read from
+    :param strip: whether to strip each line, removing whitespace/newline characters
+    :param skipEmpty: whether to skip any lines that are empty (after stripping)
+    :return: the list of lines
+    """
+    lines = []
+    with open(path, "r") as f:
+        for line in f.readlines():
+            if strip:
+                line = line.strip()
+            if not skipEmpty or line != "":
+                lines.append(line)
+    return lines
\ No newline at end of file
diff --git a/src/sensai/util/plot.py b/src/sensai/util/plot.py
index ca097d65..8f50a4fa 100644
--- a/src/sensai/util/plot.py
+++ b/src/sensai/util/plot.py
@@ -78,6 +78,15 @@ def ylabel(self, label):
         plt.ylabel(label)
         return self
 
+    def title(self, title: str):
+        plt.title(title)
+
+    def xlim(self, minValue, maxValue):
+        plt.xlim(minValue, maxValue)
+
+    def ylim(self, minValue, maxValue):
+        plt.ylim(minValue, maxValue)
+
     def save(self, path):
         log.info(f"Saving figure in {path}")
         self.fig.savefig(path)
diff --git a/src/sensai/util/string.py b/src/sensai/util/string.py
index 5af10374..b7814508 100644
--- a/src/sensai/util/string.py
+++ b/src/sensai/util/string.py
@@ -13,8 +13,15 @@ def dictString(d: Dict, brackets: Optional[str] = None):
         return s
 
 
-def listString(l: Iterable[Any], brackets="[]"):
-    return brackets[:1] + ", ".join((toString(x) for x in l)) + brackets[-1:]
+def listString(l: Iterable[Any], brackets="[]", quote: Optional[str] = None):
+    def item(x):
+        x = toString(x)
+        if quote is not None:
+            return quote + x + quote
+        else:
+            return x
+
+    return brackets[:1] + ", ".join((item(x) for x in l)) + brackets[-1:]
 
 
 def toString(x):
@@ -53,6 +60,7 @@ class ToStringMixin:
     Provides default implementations for __str__ and __repr__ which contain all attribute names and their values. The
     latter also contains the object id.
     """
+    _TOSTRING_INCLUDE_ALL = "__all__"
 
     def _toStringClassName(self):
         return type(self).__qualname__
@@ -93,10 +101,10 @@ def isExcluded(k):
                 return False
 
         # determine relevant attribute dictionary
-        if len(include) == 0:  # exclude semantics (include everything by default)
+        if len(include) == 1 and include[0] == self._TOSTRING_INCLUDE_ALL:  # exclude semantics (include everything by default)
             attributeDict = self.__dict__
         else:  # include semantics (include only inclusions)
-            attributeDict = {k: getattr(self, k) for k in set(include + includeForced) if hasattr(self, k)}
+            attributeDict = {k: getattr(self, k) for k in set(include + includeForced) if hasattr(self, k) and k != self._TOSTRING_INCLUDE_ALL}
 
         # apply exclusions and remove underscores from attribute names
         d = {k.strip("_"): v for k, v in attributeDict.items() if not isExcluded(k)}
@@ -132,16 +140,21 @@ def _toStringExcludes(self) -> List[str]:
 
     def _toStringIncludes(self) -> List[str]:
         """
-        Makes the string representation include only the returned attributes (i.e. introduces inclusion semantics) - except
-        if the list is empty, in which case all attributes are included by default.
-        To add an included attribute in a sub-class, regardless of any super-classes using exclusion or inclusion semantics,
+        Makes the string representation include only the returned attributes (i.e. introduces inclusion semantics);
+        By default, the list contains only a marker element, which is interpreted as "all attributes included".
+
+        This method can be overridden by sub-classes, which can call super in order to extend the list.
+        If a list containing the aforementioned marker element (which stands for all attributes) is extended, the marker element will be ignored,
+        and only the user-added elements will be considered as included.
+
+        Note: To add an included attribute in a sub-class, regardless of any super-classes using exclusion or inclusion semantics,
         use _toStringIncludesForced instead.
-        This method can be overwritten by sub-classes which can call super and extend the list.
+
         This method will only have no effect if _toStringObjectInfo is overridden to not use its result.
 
-        :return: a list of attribute names; if empty, include all attributes (except the ones being excluded according to other methods)
+        :return: a list of attribute names to be included in the string representation
         """
-        return []
+        return [self._TOSTRING_INCLUDE_ALL]
 
     def _toStringIncludesForced(self) -> List[str]:
         """
diff --git a/src/sensai/util/time.py b/src/sensai/util/time.py
index 5ff90893..af187bab 100644
--- a/src/sensai/util/time.py
+++ b/src/sensai/util/time.py
@@ -7,3 +7,11 @@ def tsNextMonth(ts: pd.Timestamp) -> pd.Timestamp:
         return ts.replace(year=ts.year+1, month=1)
     else:
         return ts.replace(month=m+1)
+
+
+def timeOfDay(ts: pd.Timestamp) -> float:
+    """
+    :param ts: the timestamp
+    :return: the time of day as a floating point number in [0, 24)
+    """
+    return ts.hour + ts.minute / 60

From 374710af39c431322c4cd560252218973b9797e1 Mon Sep 17 00:00:00 2001
From: Dominik Jain <dominik.jain@jambit.com>
Date: Fri, 6 May 2022 22:03:10 +0200
Subject: [PATCH 006/131] Added/improved docstrings

---
 src/sensai/data_transformation/dft.py | 7 ++++++-
 1 file changed, 6 insertions(+), 1 deletion(-)

diff --git a/src/sensai/data_transformation/dft.py b/src/sensai/data_transformation/dft.py
index 95401b65..1a45d9cf 100644
--- a/src/sensai/data_transformation/dft.py
+++ b/src/sensai/data_transformation/dft.py
@@ -653,6 +653,9 @@ def findRule(self, colName: str) -> "DFTNormalisation.Rule":
 
 
 class DFTFromColumnGenerators(RuleBasedDataFrameTransformer):
+    """
+    Extends a data frame with columns generated from ColumnGenerator instances
+    """
     def __init__(self, columnGenerators: Sequence[ColumnGenerator], inplace=False):
         super().__init__()
         self.columnGenerators = columnGenerators
@@ -674,7 +677,9 @@ def info(self):
 
 class DFTCountEntries(RuleBasedDataFrameTransformer):
     """
-    Adds a new column with counts of the values on a selected column
+    Transforms a data frame, based on one of its columns, into a new data frame containing two columns that indicate the counts
+    of unique values in the input column. It is the "DataFrame output version" of pd.Series.value_counts.
+    Each row of the output data frame holds a unique value of the input column and the number of times it appears in the input column.
     """
     def __init__(self, columnForEntryCount: str, columnNameForResultingCounts: str = "counts"):
         super().__init__()

From 4eaab9e5c4e4969f65878430ee8bb26a5b98e900 Mon Sep 17 00:00:00 2001
From: Dominik Jain <dominik.jain@jambit.com>
Date: Fri, 6 May 2022 22:03:28 +0200
Subject: [PATCH 007/131] Added DFTFillNA and DFTDropNA

---
 src/sensai/data_transformation/dft.py | 38 +++++++++++++++++++++++++++
 1 file changed, 38 insertions(+)

diff --git a/src/sensai/data_transformation/dft.py b/src/sensai/data_transformation/dft.py
index 1a45d9cf..9e8b7aba 100644
--- a/src/sensai/data_transformation/dft.py
+++ b/src/sensai/data_transformation/dft.py
@@ -804,3 +804,41 @@ class DFTSortColumns(RuleBasedDataFrameTransformer):
     """
     def _apply(self, df: pd.DataFrame) -> pd.DataFrame:
         return df[sorted(df.columns)]
+
+
+class DFTFillNA(RuleBasedDataFrameTransformer):
+    """
+    Fills NA/NaN values with the given value
+    """
+    def __init__(self, fillValue, inplace: bool = False):
+        super().__init__()
+        self.fillValue = fillValue
+        self.inplace = inplace
+
+    def _apply(self, df: pd.DataFrame) -> pd.DataFrame:
+        if self.inplace:
+            df.fillna(value=self.fillValue, inplace=True)
+            return df
+        else:
+            return df.fillna(value=self.fillValue)
+
+
+class DFTDropNA(RuleBasedDataFrameTransformer):
+    """
+    Drops rows or columns containing NA/NaN values
+    """
+    def __init__(self, axis=0, inplace=False):
+        """
+        :param axis: 0 to drop rows, 1 to drop columns containing an N/A value
+        :param inplace: whether to perform the operation in-place on the input data frame
+        """
+        super().__init__()
+        self.axis = axis
+        self.inplace = inplace
+
+    def _apply(self, df: pd.DataFrame) -> pd.DataFrame:
+        if self.inplace:
+            df.dropna(axis=self.axis, inplace=True)
+            return df
+        else:
+            return df.dropna(axis=self.axis)
\ No newline at end of file

From 41f85149604f705c271704491697b1577d88d6cf Mon Sep 17 00:00:00 2001
From: Dominik Jain <dominik.jain@jambit.com>
Date: Fri, 6 May 2022 22:46:01 +0200
Subject: [PATCH 008/131] Added FeatureGeneratorNAMarker, which generates
 features which mark whether other features are N/A

---
 src/sensai/featuregen.py | 24 ++++++++++++++++++++++++
 1 file changed, 24 insertions(+)

diff --git a/src/sensai/featuregen.py b/src/sensai/featuregen.py
index 22b86251..22370794 100644
--- a/src/sensai/featuregen.py
+++ b/src/sensai/featuregen.py
@@ -866,6 +866,30 @@ def _createFeaturesDict(self, value) -> Dict[str, Any]:
         pass
 
 
+class FeatureGeneratorNAMarker(RuleBasedFeatureGenerator):
+    """
+    Creates features indicating whether another feature is N/A (not available).
+    It can be practical to use this feature generator in conjunction with DFTFillNA for models that cannot handle missing values.
+    """
+    def __init__(self, columns: List[str], valueA=0, valueNA=1):
+        """
+        :param columns: the columns for which to generate
+        :param valueA: the feature value if the input feature is available
+        :param valueNA: the feature value if the input feature is not available
+        """
+        super().__init__()
+        self.columns = columns
+        self.valueA = valueA
+        self.valueNA = valueNA
+
+    def _generate(self, df: pd.DataFrame, ctx=None) -> pd.DataFrame:
+        newCols = {}
+        valueMap = {True: self.valueNA, False: self.valueA}
+        for col in self.columns:
+            newCols[f"{col}_na"] = [valueMap[isNA] for isNA in df[col].isna()]
+        return pd.DataFrame(newCols, index=df.index)
+
+
 def flattenedFeatureGenerator(fgen: FeatureGenerator, columnsToFlatten: List[str] = None,
                             normalisationRules=(), normalisationRuleTemplate: data_transformation.DFTNormalisation.RuleTemplate = None):
     """

From 1b8a315163aa125832896b2259a0a6f7dee0531c Mon Sep 17 00:00:00 2001
From: Dominik Jain <dominik.jain@jambit.com>
Date: Fri, 6 May 2022 22:46:40 +0200
Subject: [PATCH 009/131] Added integration test using FeatureGeneratorNAMarker
 in conjunction with DFTFillNA with an MLP classifier

---
 tests/base/test_data_transformation.py | 35 +++++++++++++++++++++++++-
 1 file changed, 34 insertions(+), 1 deletion(-)

diff --git a/tests/base/test_data_transformation.py b/tests/base/test_data_transformation.py
index 74bbc7f3..36ff2904 100644
--- a/tests/base/test_data_transformation.py
+++ b/tests/base/test_data_transformation.py
@@ -1,8 +1,16 @@
+import random
+
 import numpy as np
 import pandas as pd
 import sklearn.preprocessing
+from sensai.evaluation import VectorClassificationModelEvaluator
+
+from sensai import InputOutputData
 
-from sensai.data_transformation import DataFrameTransformer, RuleBasedDataFrameTransformer, DataFrameTransformerChain, DFTNormalisation
+from sensai.data_transformation import DataFrameTransformer, RuleBasedDataFrameTransformer, DataFrameTransformerChain, DFTNormalisation, \
+    DFTFillNA
+from sensai.featuregen import MultiFeatureGenerator, FeatureGeneratorTakeColumns, FeatureGeneratorNAMarker
+from sensai.sklearn.sklearn_classification import SkLearnMLPVectorClassificationModel
 
 
 class TestDFTTransformerBasics:
@@ -74,3 +82,28 @@ def test_arrayValued(self):
         dft = DFTNormalisation([DFTNormalisation.Rule(r"foo|bar", transformer=sklearn.preprocessing.MaxAbsScaler(), arrayValued=True)])
         df2 = dft.fitApply(df)
         assert np.all(df2.foo.iloc[0] == arr/100) and np.all(df2.foo.iloc[-1] == arr/10)
+
+
+
+def test_NA_transformation(irisClassificationTestCase):
+    iodata = irisClassificationTestCase.data
+
+    # create some random N/A values in the data set
+    inputs = iodata.inputs.copy()
+    rand = random.Random(42)
+    fullIndices = list(range(len(inputs)))
+    for col in inputs.columns:
+        indices = rand.sample(fullIndices, 20)
+        inputs[col].iloc[indices] = np.nan
+    iodata = InputOutputData(inputs, iodata.outputs)
+
+    fg = MultiFeatureGenerator(FeatureGeneratorTakeColumns(), FeatureGeneratorNAMarker(inputs.columns))
+    model = SkLearnMLPVectorClassificationModel() \
+        .withFeatureGenerator(fg) \
+        .withInputTransformers(DFTFillNA(0))
+
+    ev = VectorClassificationModelEvaluator(iodata, testFraction=0.2)
+    ev.fitModel(model)
+    result = ev.evalModel(model)
+    accuracy = result.getEvalStats().getAccuracy()
+    assert accuracy > 0.85
\ No newline at end of file

From 15fd2371ada6e73e34bae355a43e7ca63955a2a7 Mon Sep 17 00:00:00 2001
From: Dominik Jain <dominik.jain@jambit.com>
Date: Fri, 6 May 2022 23:10:42 +0200
Subject: [PATCH 010/131] DFTNormalisation: Extended docstring to mention
 handling of N/A values

---
 src/sensai/data_transformation/dft.py | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/src/sensai/data_transformation/dft.py b/src/sensai/data_transformation/dft.py
index 9e8b7aba..8dfa9d66 100644
--- a/src/sensai/data_transformation/dft.py
+++ b/src/sensai/data_transformation/dft.py
@@ -437,7 +437,8 @@ class DFTNormalisation(DataFrameTransformer):
     """
     Applies normalisation/scaling to a data frame by applying a set of transformation rules, where each
     rule defines a set of columns to which it applies (learning a single transformer based on the values
-    of all applicable columns)
+    of all applicable columns).
+    DFTNormalisation ignores N/A values during fitting and application.
     """
 
     class RuleTemplate:

From bd8316a83b85ea3055f3a74ee57ba3070c347020 Mon Sep 17 00:00:00 2001
From: Dominik Jain <dominik.jain@jambit.com>
Date: Fri, 6 May 2022 23:14:35 +0200
Subject: [PATCH 011/131] FeatureGeneratorNAMarker: Added a normalisation rule
 template to enable use with DFTNormalisation

---
 src/sensai/featuregen.py | 9 +++++++--
 1 file changed, 7 insertions(+), 2 deletions(-)

diff --git a/src/sensai/featuregen.py b/src/sensai/featuregen.py
index 22370794..b93c535b 100644
--- a/src/sensai/featuregen.py
+++ b/src/sensai/featuregen.py
@@ -9,8 +9,9 @@
 
 from . import util, data_transformation
 from .columngen import ColumnGenerator
+from .data_transformation import DFTNormalisation
 from .util import flattenArguments
-from .util.string import orRegexGroup, ToStringMixin, dictString, listString
+from .util.string import orRegexGroup, ToStringMixin, listString
 
 if TYPE_CHECKING:
     from .vector_model import VectorModel
@@ -873,11 +874,15 @@ class FeatureGeneratorNAMarker(RuleBasedFeatureGenerator):
     """
     def __init__(self, columns: List[str], valueA=0, valueNA=1):
         """
+        Note: When changing the default values used, use only values that are considered to be normalised when using this
+        feature generator in a context where DFTNormalisation is used (no normalisation is applied to features generated
+        by this feature generator).
+
         :param columns: the columns for which to generate
         :param valueA: the feature value if the input feature is available
         :param valueNA: the feature value if the input feature is not available
         """
-        super().__init__()
+        super().__init__(normalisationRuleTemplate=DFTNormalisation.RuleTemplate(skip=True))
         self.columns = columns
         self.valueA = valueA
         self.valueNA = valueNA

From c2c8575f9de5a96f2bb3d453867e3c58d441b92a Mon Sep 17 00:00:00 2001
From: Dominik Jain <dominik.jain@jambit.com>
Date: Fri, 6 May 2022 23:15:34 +0200
Subject: [PATCH 012/131] Added normalisation to N/A transformation test

---
 tests/base/test_data_transformation.py | 16 ++++++++++++++--
 1 file changed, 14 insertions(+), 2 deletions(-)

diff --git a/tests/base/test_data_transformation.py b/tests/base/test_data_transformation.py
index 36ff2904..a401d83b 100644
--- a/tests/base/test_data_transformation.py
+++ b/tests/base/test_data_transformation.py
@@ -1,8 +1,11 @@
+import logging
 import random
 
 import numpy as np
 import pandas as pd
 import sklearn.preprocessing
+
+from sensai.data_transformation.sklearn_transformer import SkLearnTransformerFactoryFactory
 from sensai.evaluation import VectorClassificationModelEvaluator
 
 from sensai import InputOutputData
@@ -13,6 +16,9 @@
 from sensai.sklearn.sklearn_classification import SkLearnMLPVectorClassificationModel
 
 
+log = logging.getLogger(__name__)
+
+
 class TestDFTTransformerBasics:
     class TestDFT(DataFrameTransformer):
         def _fit(self, df: pd.DataFrame):
@@ -97,13 +103,19 @@ def test_NA_transformation(irisClassificationTestCase):
         inputs[col].iloc[indices] = np.nan
     iodata = InputOutputData(inputs, iodata.outputs)
 
-    fg = MultiFeatureGenerator(FeatureGeneratorTakeColumns(), FeatureGeneratorNAMarker(inputs.columns))
+    fg = MultiFeatureGenerator(FeatureGeneratorTakeColumns(normalisationRuleTemplate=DFTNormalisation.RuleTemplate(independentColumns=True)),
+        FeatureGeneratorNAMarker(inputs.columns))
     model = SkLearnMLPVectorClassificationModel() \
         .withFeatureGenerator(fg) \
-        .withInputTransformers(DFTFillNA(0))
+        .withInputTransformers(
+            DFTNormalisation(fg.getNormalisationRules(), defaultTransformerFactory=SkLearnTransformerFactoryFactory.StandardScaler()),
+            DFTFillNA(-3))
+    # NOTE: using -3 instead of 0 to fill N/A values in order to force the model to learn the purpose of the N/A markers,
+    # because 0 values are actually a reasonable fallback (which happens to work) when using StandardScaler
 
     ev = VectorClassificationModelEvaluator(iodata, testFraction=0.2)
     ev.fitModel(model)
     result = ev.evalModel(model)
     accuracy = result.getEvalStats().getAccuracy()
+    log.info(f"Accuracy = {accuracy}")
     assert accuracy > 0.85
\ No newline at end of file

From 0b3dcb0429ff2e5af2bd1bbb96110a3bfe436aa6 Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Sat, 7 May 2022 12:02:38 +0200
Subject: [PATCH 013/131] FeatureCollector: Renamed
 getNormalizationRules->getNormalisationRules, but keeping the old function as
 a wrapper for backward compatibility

---
 src/sensai/featuregen.py | 5 ++++-
 1 file changed, 4 insertions(+), 1 deletion(-)

diff --git a/src/sensai/featuregen.py b/src/sensai/featuregen.py
index b93c535b..f9889c1f 100644
--- a/src/sensai/featuregen.py
+++ b/src/sensai/featuregen.py
@@ -738,10 +738,13 @@ def __init__(self, *featureGeneratorsOrNames: Union[str, FeatureGenerator], regi
     def getMultiFeatureGenerator(self) -> MultiFeatureGenerator:
         return self._multiFeatureGenerator
 
-    def getNormalizationRules(self, includeGeneratedCategoricalRules=True):
+    def getNormalisationRules(self, includeGeneratedCategoricalRules=True):
         return self.getMultiFeatureGenerator().getNormalisationRules(
             includeGeneratedCategoricalRules=includeGeneratedCategoricalRules)
 
+    def getNormalizationRules(self, includeGeneratedCategoricalRules=True):  # for backward compatibility
+        return self.getNormalisationRules(includeGeneratedCategoricalRules=includeGeneratedCategoricalRules)
+
     def getCategoricalFeatureNameRegex(self) -> str:
         return self.getMultiFeatureGenerator().getCategoricalFeatureNameRegex()
 

From 0d6c6ebb051a5f26931441382aeefbd5b6c835c0 Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Sat, 7 May 2022 12:03:57 +0200
Subject: [PATCH 014/131] Moved N/A values test to test_featuregen, as it
 primarily tests the effect of the feature generator, adding a second test for
 the (negative) effect of not using the feature generator

---
 tests/base/test_data_transformation.py | 43 +--------------------
 tests/base/test_featuregen.py          | 53 +++++++++++++++++++++++++-
 2 files changed, 53 insertions(+), 43 deletions(-)

diff --git a/tests/base/test_data_transformation.py b/tests/base/test_data_transformation.py
index a401d83b..33ea6c62 100644
--- a/tests/base/test_data_transformation.py
+++ b/tests/base/test_data_transformation.py
@@ -1,20 +1,10 @@
 import logging
-import random
 
 import numpy as np
 import pandas as pd
 import sklearn.preprocessing
 
-from sensai.data_transformation.sklearn_transformer import SkLearnTransformerFactoryFactory
-from sensai.evaluation import VectorClassificationModelEvaluator
-
-from sensai import InputOutputData
-
-from sensai.data_transformation import DataFrameTransformer, RuleBasedDataFrameTransformer, DataFrameTransformerChain, DFTNormalisation, \
-    DFTFillNA
-from sensai.featuregen import MultiFeatureGenerator, FeatureGeneratorTakeColumns, FeatureGeneratorNAMarker
-from sensai.sklearn.sklearn_classification import SkLearnMLPVectorClassificationModel
-
+from sensai.data_transformation import DataFrameTransformer, RuleBasedDataFrameTransformer, DataFrameTransformerChain, DFTNormalisation
 
 log = logging.getLogger(__name__)
 
@@ -88,34 +78,3 @@ def test_arrayValued(self):
         dft = DFTNormalisation([DFTNormalisation.Rule(r"foo|bar", transformer=sklearn.preprocessing.MaxAbsScaler(), arrayValued=True)])
         df2 = dft.fitApply(df)
         assert np.all(df2.foo.iloc[0] == arr/100) and np.all(df2.foo.iloc[-1] == arr/10)
-
-
-
-def test_NA_transformation(irisClassificationTestCase):
-    iodata = irisClassificationTestCase.data
-
-    # create some random N/A values in the data set
-    inputs = iodata.inputs.copy()
-    rand = random.Random(42)
-    fullIndices = list(range(len(inputs)))
-    for col in inputs.columns:
-        indices = rand.sample(fullIndices, 20)
-        inputs[col].iloc[indices] = np.nan
-    iodata = InputOutputData(inputs, iodata.outputs)
-
-    fg = MultiFeatureGenerator(FeatureGeneratorTakeColumns(normalisationRuleTemplate=DFTNormalisation.RuleTemplate(independentColumns=True)),
-        FeatureGeneratorNAMarker(inputs.columns))
-    model = SkLearnMLPVectorClassificationModel() \
-        .withFeatureGenerator(fg) \
-        .withInputTransformers(
-            DFTNormalisation(fg.getNormalisationRules(), defaultTransformerFactory=SkLearnTransformerFactoryFactory.StandardScaler()),
-            DFTFillNA(-3))
-    # NOTE: using -3 instead of 0 to fill N/A values in order to force the model to learn the purpose of the N/A markers,
-    # because 0 values are actually a reasonable fallback (which happens to work) when using StandardScaler
-
-    ev = VectorClassificationModelEvaluator(iodata, testFraction=0.2)
-    ev.fitModel(model)
-    result = ev.evalModel(model)
-    accuracy = result.getEvalStats().getAccuracy()
-    log.info(f"Accuracy = {accuracy}")
-    assert accuracy > 0.85
\ No newline at end of file
diff --git a/tests/base/test_featuregen.py b/tests/base/test_featuregen.py
index 43f60675..f8766d11 100644
--- a/tests/base/test_featuregen.py
+++ b/tests/base/test_featuregen.py
@@ -1,9 +1,20 @@
+import logging
+import random
+
 import numpy as np
 import pandas as pd
 import pytest
 
+from sensai import InputOutputData
+from sensai.data_transformation import DFTNormalisation, DFTFillNA
+from sensai.data_transformation.sklearn_transformer import SkLearnTransformerFactoryFactory
+from sensai.evaluation import VectorClassificationModelEvaluator
 from sensai.featuregen import FeatureGeneratorFlattenColumns, FeatureGeneratorTakeColumns, flattenedFeatureGenerator, \
-    FeatureGenerator, RuleBasedFeatureGenerator, MultiFeatureGenerator, ChainedFeatureGenerator
+    FeatureGenerator, RuleBasedFeatureGenerator, MultiFeatureGenerator, ChainedFeatureGenerator, FeatureGeneratorNAMarker, FeatureCollector
+from sensai.sklearn.sklearn_classification import SkLearnMLPVectorClassificationModel
+
+
+log = logging.getLogger(__name__)
 
 
 def test_take_columns():
@@ -95,3 +106,43 @@ def test_combinationFittedIffEachMemberFitted(self):
         chainfgen = ChainedFeatureGenerator(RuleBasedTestFgen(), RuleBasedTestFgen())
         assert multifgen.isFitted() and chainfgen.isFitted()
 
+
+def test_FeatureGeneratorNAMarker(irisClassificationTestCase):
+    """
+    Integration test for handling of N/A values via marker features (using FeatureGeneratorNAMarker) in the context of models
+    that do not support N/A values, replacing them with a different value (using DFTFillNA)
+    """
+    iodata = irisClassificationTestCase.data
+
+    # create some random N/A values in the data set (20 randomly sampled rows per column, fixed seed for reproducibility)
+    inputs = iodata.inputs.copy()
+    rand = random.Random(42)
+    fullIndices = list(range(len(inputs)))
+    for colIdx in range(len(inputs.columns)):
+        indices = rand.sample(fullIndices, 20)
+        inputs.iloc[indices, colIdx] = np.nan  # one positional assignment; chained indexing could write to a temporary copy
+    iodata = InputOutputData(inputs, iodata.outputs)
+
+    for useFGNA in (True, False):
+        fgs = [FeatureGeneratorTakeColumns(normalisationRuleTemplate=DFTNormalisation.RuleTemplate(independentColumns=True))]
+        if useFGNA:
+            fgs.append(FeatureGeneratorNAMarker(inputs.columns))
+        fCollector = FeatureCollector(*fgs)
+        model = SkLearnMLPVectorClassificationModel() \
+            .withFeatureCollector(fCollector) \
+            .withInputTransformers(
+                DFTNormalisation(fCollector.getNormalisationRules(), defaultTransformerFactory=SkLearnTransformerFactoryFactory.StandardScaler()),
+                DFTFillNA(-3))
+        # NOTE: using -3 instead of 0 to fill N/A values in order to force the model to learn the purpose of the N/A markers,
+        # because 0 values are actually a reasonable fallback (which happens to work) when using StandardScaler
+        # NOTE: it is important to apply DFTNormalisation before DFTFillNA, because DFTNormalisation would learn using the filled values otherwise
+
+        ev = VectorClassificationModelEvaluator(iodata, testFraction=0.2)
+        ev.fitModel(model)
+        result = ev.evalModel(model)
+        accuracy = result.getEvalStats().getAccuracy()
+        log.info(f"Accuracy (for useFGNA={useFGNA}) = {accuracy}")
+        if useFGNA:
+            assert accuracy > 0.85  # with N/A markers, the model is expected to cope with the -3 fill values
+        else:
+            assert accuracy < 0.85  # without N/A markers, the -3 fill values are expected to degrade accuracy
\ No newline at end of file

From 22c66c7b82f25e19b70ac722a851134df4492ea1 Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Sat, 7 May 2022 12:27:47 +0200
Subject: [PATCH 015/131] VectorModel: Allow input computation (particularly
 DFTs) to filter the data points

---
 src/sensai/vector_model.py | 8 ++++++++
 1 file changed, 8 insertions(+)

diff --git a/src/sensai/vector_model.py b/src/sensai/vector_model.py
index cb852f3a..8a7995b4 100644
--- a/src/sensai/vector_model.py
+++ b/src/sensai/vector_model.py
@@ -313,8 +313,16 @@ def fit(self, X: pd.DataFrame, Y: Optional[pd.DataFrame], fitPreprocessors=True)
             else:
                 if Y is None:
                     raise Exception(f"The underlying model requires a data frame for fitting but Y=None was passed")
+                if len(X) != len(Y):
+                    raise ValueError(f"Length of input ({len(X)}) does not match length of output ({len(Y)})")
                 Y = self._computeModelOutputs(Y)
                 X = self._computeModelInputs(X, Y=Y, fit=fitPreprocessors)
+                if len(X) != len(Y):
+                    log.debug(f"Input computation changed number of data points ({len(self._trainingContext.originalInput)} -> {len(X)})")
+                    Y = Y.loc[X.index]
+                    if len(X) != len(Y):
+                        raise ValueError("Could not recover matching outputs for changed inputs. Only input filtering is admissible, "
+                            "indices of input & output data frames must match.")
                 self._modelInputVariableNames = list(X.columns)
                 inputsWithTypes = ', '.join([n + '/' + X[n].dtype.name for n in self._modelInputVariableNames])
                 log.info(f"Fitting with outputs[{len(Y.columns)}]={list(Y.columns)}, "

From 8ccf5b66eb5bce0d3f8cfee59e6b7de9cdae9747 Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Sat, 7 May 2022 12:29:18 +0200
Subject: [PATCH 016/131] Added test for VectorModel, where an input DFT
 removes input rows

---
 tests/base/test_vector_model.py | 35 ++++++++++++++++++++++++++++++---
 1 file changed, 32 insertions(+), 3 deletions(-)

diff --git a/tests/base/test_vector_model.py b/tests/base/test_vector_model.py
index c7e2a7db..2a196e0b 100644
--- a/tests/base/test_vector_model.py
+++ b/tests/base/test_vector_model.py
@@ -1,13 +1,16 @@
+import random
 from copy import copy
 from typing import Optional
 
+import numpy as np
 import pandas as pd
 import pytest
 
+from sensai import InputOutputData
 from sensai.data_transformation import DFTDRowFilterOnIndex, \
-    InvertibleDataFrameTransformer
+    InvertibleDataFrameTransformer, DFTDropNA
 from sensai.featuregen import FeatureGeneratorTakeColumns, FeatureGenerator
-from sensai.vector_model import RuleBasedVectorRegressionModel, VectorRegressionModel
+from sensai.vector_model import RuleBasedVectorRegressionModel, VectorRegressionModel, VectorClassificationModel
 
 
 class FittableFgen(FeatureGenerator):
@@ -146,4 +149,30 @@ def test_isFittedWithTargetTransformer(self, vectorModel, fittableDFT):
         assert vectorModel.getTargetTransformer().isFitted()
 
 
-
+def test_InputRowsRemovedByTransformer(irisClassificationTestCase):
+    """
+    Tests handling of the case where the input generation process removes rows from the data (outputs must be reduced to the remaining rows)
+    """
+    iodata = irisClassificationTestCase.data
+
+    # create some random N/A values in one of the columns (distinct rows, so exactly numNAValues rows contain an N/A value)
+    numNAValues = 20
+    inputs = iodata.inputs.copy()
+    rand = random.Random(42)
+    fullIndices = list(range(len(inputs)))
+    indices = rand.sample(fullIndices, numNAValues)
+    inputs.iloc[indices, 0] = np.nan  # one positional assignment; chained indexing could write to a temporary copy
+    iodata = InputOutputData(inputs, iodata.outputs)
+    expectedLength = len(iodata) - numNAValues
+
+    class MyModel(VectorClassificationModel):
+        def _fitClassifier(self, X: pd.DataFrame, y: pd.DataFrame):
+            assert len(X) == expectedLength  # rows with N/A values are expected to have been dropped by DFTDropNA
+            assert len(y) == expectedLength  # outputs must have been filtered accordingly
+            assert all(X.index.values == y.index.values)
+
+        def _predictClassProbabilities(self, X: pd.DataFrame) -> pd.DataFrame:
+            pass  # prediction is not exercised by this test
+
+    model = MyModel().withInputTransformers(DFTDropNA())
+    model.fit(iodata.inputs, iodata.outputs)

From 60e5066c353e374e6ccd00c799e128c06d657109 Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Sat, 7 May 2022 12:40:31 +0200
Subject: [PATCH 017/131] Try nbconvert 6.5.0 as a potential fix for build
 error: ImportError: cannot import name 'contextfilter' from 'jinja2'

---
 tox.ini | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/tox.ini b/tox.ini
index 1dd21ca4..51eba350 100644
--- a/tox.ini
+++ b/tox.ini
@@ -21,7 +21,7 @@ deps =
     pytest-cov
     pytest-xdist
     jupyter==1.0.0
-    nbconvert==6.1.0
+    nbconvert==6.5.0
     clearml==0.17.1
 ;   TODO: For some reason including this into setup.py makes things slow locally, fail silently on gitlab
 ;     and lead to non-ending builds (2.5h+) on github. This dependency should be installable with pip install sensai[torch] though...

From a285dee3546e07c6ddf2cd2f213bceae638a9c1e Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Sat, 7 May 2022 12:57:36 +0200
Subject: [PATCH 018/131] Fixed type annotations and a format string

---
 src/sensai/torch/torch_eval_util.py | 13 +++++++------
 1 file changed, 7 insertions(+), 6 deletions(-)

diff --git a/src/sensai/torch/torch_eval_util.py b/src/sensai/torch/torch_eval_util.py
index 5bfc152b..1cb59839 100644
--- a/src/sensai/torch/torch_eval_util.py
+++ b/src/sensai/torch/torch_eval_util.py
@@ -1,22 +1,23 @@
 from typing import Union
 
-from ..evaluation import RegressionEvaluationUtil
-from ..evaluation.crossval import VectorModelCrossValidationData
-from ..evaluation.eval_util import TEvalData, TCrossValData
-from ..evaluation.evaluator import VectorModelEvaluationData
 from . import TorchVectorRegressionModel
+from ..evaluation import RegressionEvaluationUtil
+from ..evaluation.crossval import VectorModelCrossValidationData, VectorRegressionModelCrossValidationData
+from ..evaluation.eval_util import EvaluationResultCollector
+from ..evaluation.evaluator import VectorModelEvaluationData, VectorRegressionModelEvaluationData
 
 
 class TorchVectorRegressionModelEvaluationUtil(RegressionEvaluationUtil):
 
-    def _createPlots(self, data: Union[TEvalData, TCrossValData], resultCollector: RegressionEvaluationUtil.ResultCollector, subtitle=None):
+    def _createPlots(self, data: Union[VectorRegressionModelEvaluationData, VectorRegressionModelCrossValidationData], resultCollector: EvaluationResultCollector,
+            subtitle=None):
         super()._createPlots(data, resultCollector, subtitle)
         if isinstance(data, VectorModelEvaluationData):
             self._addLossProgressionPlotIfTorchVectorRegressionModel(data.model, "loss-progression", resultCollector)
         elif isinstance(data, VectorModelCrossValidationData):
             if data.trainedModels is not None:
                 for i, model in enumerate(data.trainedModels, start=1):
-                    self._addLossProgressionPlotIfTorchVectorRegressionModel(model, "loss-progression-{i}", resultCollector)
+                    self._addLossProgressionPlotIfTorchVectorRegressionModel(model, f"loss-progression-{i}", resultCollector)
 
     @staticmethod
     def _addLossProgressionPlotIfTorchVectorRegressionModel(model, plotName, resultCollector):

From 5de96427f730a4b47f271969875efa407ba28ada Mon Sep 17 00:00:00 2001
From: Dominik Jain <dominik.jain@jambit.com>
Date: Sun, 8 May 2022 15:34:34 +0200
Subject: [PATCH 019/131] Moved package contents of sensai.geoanalytics to
 sensai.geoanalytics.geopandas to make room for other non-geopandas-dependent
 geoanalytics modules that shall be usable without requiring geopandas

---
 notebooks/Clustering Evaluation.ipynb         |   4 +-
 .../Intro to Coordinate Clustering.ipynb      | 144 ++++++++++++++----
 notebooks/Tracking Experiments.ipynb          |   4 +-
 src/sensai/geoanalytics/__init__.py           |   1 -
 src/sensai/geoanalytics/geopandas/__init__.py |   1 +
 .../{ => geopandas}/coordinate_clustering.py  |  10 +-
 .../coordinate_clustering_ground_truth.py     |   0
 .../{ => geopandas}/coordinates.py            |   2 +-
 .../geoanalytics/{ => geopandas}/geometry.py  |   0
 .../geoanalytics/{ => geopandas}/graph.py     |   0
 .../geoanalytics/test_geoanalytics.py         |   8 +-
 11 files changed, 135 insertions(+), 39 deletions(-)
 create mode 100644 src/sensai/geoanalytics/geopandas/__init__.py
 rename src/sensai/geoanalytics/{ => geopandas}/coordinate_clustering.py (96%)
 rename src/sensai/geoanalytics/{ => geopandas}/coordinate_clustering_ground_truth.py (100%)
 rename src/sensai/geoanalytics/{ => geopandas}/coordinates.py (97%)
 rename src/sensai/geoanalytics/{ => geopandas}/geometry.py (100%)
 rename src/sensai/geoanalytics/{ => geopandas}/graph.py (100%)

diff --git a/notebooks/Clustering Evaluation.ipynb b/notebooks/Clustering Evaluation.ipynb
index b2cd9d0a..2b718151 100644
--- a/notebooks/Clustering Evaluation.ipynb	
+++ b/notebooks/Clustering Evaluation.ipynb	
@@ -66,13 +66,13 @@
     "import matplotlib.pyplot as plt\n",
     "import logging\n",
     "\n",
-    "from sensai.geoanalytics.coordinate_clustering import SkLearnCoordinateClustering\n",
+    "from sensai.geoanalytics.geopandas.coordinate_clustering import SkLearnCoordinateClustering\n",
     "from sensai.hyperopt import GridSearch\n",
     "from sensai.evaluation.evaluator_clustering import ClusteringModelSupervisedEvaluator, \\\n",
     "    ClusteringModelUnsupervisedEvaluator\n",
     "from sensai.evaluation.eval_stats import ClusteringUnsupervisedEvalStats, ClusteringSupervisedEvalStats, \\\n",
     "    AdjustedMutualInfoScore\n",
-    "from sensai.geoanalytics.coordinate_clustering_ground_truth import PolygonAnnotatedCoordinates\n",
+    "from sensai.geoanalytics.geopandas.coordinate_clustering_ground_truth import PolygonAnnotatedCoordinates\n",
     "\n",
     "from config import get_config\n",
     "\n",
diff --git a/notebooks/Intro to Coordinate Clustering.ipynb b/notebooks/Intro to Coordinate Clustering.ipynb
index 0753b9bd..cc9ee369 100644
--- a/notebooks/Intro to Coordinate Clustering.ipynb	
+++ b/notebooks/Intro to Coordinate Clustering.ipynb	
@@ -2,7 +2,11 @@
  "cells": [
   {
    "cell_type": "markdown",
-   "metadata": {},
+   "metadata": {
+    "pycharm": {
+     "name": "#%% md\n"
+    }
+   },
    "source": [
     "# The Coordinate Clustering Module\n",
     "\n",
@@ -25,7 +29,11 @@
   {
    "cell_type": "code",
    "execution_count": null,
-   "metadata": {},
+   "metadata": {
+    "pycharm": {
+     "name": "#%%\n"
+    }
+   },
    "outputs": [],
    "source": [
     "# Note - this cell should be executed only once per session\n",
@@ -42,7 +50,11 @@
   {
    "cell_type": "code",
    "execution_count": null,
-   "metadata": {},
+   "metadata": {
+    "pycharm": {
+     "name": "#%%\n"
+    }
+   },
    "outputs": [],
    "source": [
     "import os\n",
@@ -53,9 +65,9 @@
     "from sklearn.cluster import DBSCAN\n",
     "\n",
     "import logging\n",
-    "from sensai.geoanalytics.graph import CoordinateSpanningTree\n",
-    "from sensai.geoanalytics.coordinate_clustering import SkLearnCoordinateClustering\n",
-    "from sensai.geoanalytics.geometry import alphaShape\n",
+    "from sensai.geoanalytics.geopandas.graph import CoordinateSpanningTree\n",
+    "from sensai.geoanalytics.geopandas.coordinate_clustering import SkLearnCoordinateClustering\n",
+    "from sensai.geoanalytics.geopandas.geometry import alphaShape\n",
     "from config import get_config\n",
     "\n",
     "logging.basicConfig(level=logging.INFO)\n",
@@ -64,7 +76,11 @@
   },
   {
    "cell_type": "markdown",
-   "metadata": {},
+   "metadata": {
+    "pycharm": {
+     "name": "#%% md\n"
+    }
+   },
    "source": [
     "## Loading and Fitting"
    ]
@@ -85,7 +101,11 @@
   {
    "cell_type": "code",
    "execution_count": null,
-   "metadata": {},
+   "metadata": {
+    "pycharm": {
+     "name": "#%%\n"
+    }
+   },
    "outputs": [],
    "source": [
     "sampleFile = c.datafile_path(\"sample\", stage=c.RAW) # this can point to a directory or a shp/geojson file\n",
@@ -96,7 +116,11 @@
   },
   {
    "cell_type": "markdown",
-   "metadata": {},
+   "metadata": {
+    "pycharm": {
+     "name": "#%% md\n"
+    }
+   },
    "source": [
     "The resulting `CoordinateClusteringAlgorithm` instance has many useful methods.\n",
     "You can retrieve clusters individually or via a generator. The noise cluster can be accessed individually"
@@ -105,7 +129,11 @@
   {
    "cell_type": "code",
    "execution_count": null,
-   "metadata": {},
+   "metadata": {
+    "pycharm": {
+     "name": "#%%\n"
+    }
+   },
    "outputs": [],
    "source": [
     "print(f\"Clusters found: {dbscan.numClusters}\")\n",
@@ -117,14 +145,22 @@
   },
   {
    "cell_type": "markdown",
-   "metadata": {},
+   "metadata": {
+    "pycharm": {
+     "name": "#%% md\n"
+    }
+   },
    "source": [
     "## Analysis and Visualization"
    ]
   },
   {
    "cell_type": "markdown",
-   "metadata": {},
+   "metadata": {
+    "pycharm": {
+     "name": "#%% md\n"
+    }
+   },
    "source": [
     "From the dbscan single clusters which are instances of `CoordinateClusteringAlgorithm.Cluster` \n",
     "can be retrieved and visualized. Most objects, including the dbscan itself, have an inbuilt plot method"
@@ -133,7 +169,11 @@
   {
    "cell_type": "code",
    "execution_count": null,
-   "metadata": {},
+   "metadata": {
+    "pycharm": {
+     "name": "#%%\n"
+    }
+   },
    "outputs": [],
    "source": [
     "dbscan.plot(markersize=0.2)"
@@ -141,7 +181,11 @@
   },
   {
    "cell_type": "markdown",
-   "metadata": {},
+   "metadata": {
+    "pycharm": {
+     "name": "#%% md\n"
+    }
+   },
    "source": [
     "We can condition before plotting as well as pass custom arguments"
    ]
@@ -149,7 +193,11 @@
   {
    "cell_type": "code",
    "execution_count": null,
-   "metadata": {},
+   "metadata": {
+    "pycharm": {
+     "name": "#%%\n"
+    }
+   },
    "outputs": [],
    "source": [
     "dbscan.plot(condition=lambda x: len(x) >= 50, cmap='plasma')"
@@ -157,7 +205,11 @@
   },
   {
    "cell_type": "markdown",
-   "metadata": {},
+   "metadata": {
+    "pycharm": {
+     "name": "#%% md\n"
+    }
+   },
    "source": [
     "### Properties of a single cluster\n",
     "\n",
@@ -167,7 +219,11 @@
   {
    "cell_type": "code",
    "execution_count": null,
-   "metadata": {},
+   "metadata": {
+    "pycharm": {
+     "name": "#%%\n"
+    }
+   },
    "outputs": [],
    "source": [
     "sampleCluster = dbscan.getCluster(0)\n",
@@ -177,7 +233,11 @@
   },
   {
    "cell_type": "markdown",
-   "metadata": {},
+   "metadata": {
+    "pycharm": {
+     "name": "#%% md\n"
+    }
+   },
    "source": [
     "Clusters have an identifier and coordinates. It is easy to extract additional information,\n",
     "e.g. via the summary method"
@@ -186,7 +246,11 @@
   {
    "cell_type": "code",
    "execution_count": null,
-   "metadata": {},
+   "metadata": {
+    "pycharm": {
+     "name": "#%%\n"
+    }
+   },
    "outputs": [],
    "source": [
     "pprint(sampleCluster.summaryDict())"
@@ -279,7 +343,11 @@
   {
    "cell_type": "code",
    "execution_count": null,
-   "metadata": {},
+   "metadata": {
+    "pycharm": {
+     "name": "#%%\n"
+    }
+   },
    "outputs": [],
    "source": [
     "print(\"cluster summary:\")\n",
@@ -289,7 +357,11 @@
   {
    "cell_type": "code",
    "execution_count": null,
-   "metadata": {},
+   "metadata": {
+    "pycharm": {
+     "name": "#%%\n"
+    }
+   },
    "outputs": [],
    "source": [
     "dbscan.summaryDF().head()"
@@ -297,14 +369,22 @@
   },
   {
    "cell_type": "markdown",
-   "metadata": {},
+   "metadata": {
+    "pycharm": {
+     "name": "#%% md\n"
+    }
+   },
    "source": [
     "## Saving and Loading"
    ]
   },
   {
    "cell_type": "markdown",
-   "metadata": {},
+   "metadata": {
+    "pycharm": {
+     "name": "#%% md\n"
+    }
+   },
    "source": [
     "All of the objects used above can be exported to a GeoDataFrame using the `toGeoDF` method. This geodataframe\n",
     "can then be persisted as usual.\n",
@@ -320,7 +400,11 @@
   {
    "cell_type": "code",
    "execution_count": null,
-   "metadata": {},
+   "metadata": {
+    "pycharm": {
+     "name": "#%%\n"
+    }
+   },
    "outputs": [],
    "source": [
     "dbscanGeoDF = dbscan.toGeoDF() # here again a condition for filtering clusters can be passed\n",
@@ -332,7 +416,11 @@
   {
    "cell_type": "code",
    "execution_count": null,
-   "metadata": {},
+   "metadata": {
+    "pycharm": {
+     "name": "#%%\n"
+    }
+   },
    "outputs": [],
    "source": [
     "dbscanSavedPath = os.path.join(c.temp, f\"{dbscan}_sample.pickle\")\n",
@@ -346,7 +434,11 @@
   {
    "cell_type": "code",
    "execution_count": null,
-   "metadata": {},
+   "metadata": {
+    "pycharm": {
+     "name": "#%%\n"
+    }
+   },
    "outputs": [],
    "source": [
     "loadedDBSCAN = SkLearnCoordinateClustering.load(dbscanSavedPath)\n",
diff --git a/notebooks/Tracking Experiments.ipynb b/notebooks/Tracking Experiments.ipynb
index fa8f0b95..c539a9de 100644
--- a/notebooks/Tracking Experiments.ipynb	
+++ b/notebooks/Tracking Experiments.ipynb	
@@ -51,9 +51,9 @@
     "from sklearn.cluster import DBSCAN\n",
     "import logging\n",
     "\n",
-    "from sensai.geoanalytics.coordinate_clustering import SkLearnCoordinateClustering\n",
+    "from sensai.geoanalytics.geopandas.coordinate_clustering import SkLearnCoordinateClustering\n",
     "from sensai.evaluation.evaluator_clustering import ClusteringModelSupervisedEvaluator\n",
-    "from sensai.geoanalytics.coordinate_clustering_ground_truth import PolygonAnnotatedCoordinates\n",
+    "from sensai.geoanalytics.geopandas.coordinate_clustering_ground_truth import PolygonAnnotatedCoordinates\n",
     "from sensai.tracking.clearml_tracking import ClearMLExperiment\n",
     "\n",
     "import matplotlib.pyplot as plt\n",
diff --git a/src/sensai/geoanalytics/__init__.py b/src/sensai/geoanalytics/__init__.py
index ee3ddaa4..e69de29b 100644
--- a/src/sensai/geoanalytics/__init__.py
+++ b/src/sensai/geoanalytics/__init__.py
@@ -1 +0,0 @@
-from . import coordinates, coordinate_clustering, coordinate_clustering_ground_truth, geometry
\ No newline at end of file
diff --git a/src/sensai/geoanalytics/geopandas/__init__.py b/src/sensai/geoanalytics/geopandas/__init__.py
new file mode 100644
index 00000000..ee3ddaa4
--- /dev/null
+++ b/src/sensai/geoanalytics/geopandas/__init__.py
@@ -0,0 +1 @@
+from . import coordinates, coordinate_clustering, coordinate_clustering_ground_truth, geometry
\ No newline at end of file
diff --git a/src/sensai/geoanalytics/coordinate_clustering.py b/src/sensai/geoanalytics/geopandas/coordinate_clustering.py
similarity index 96%
rename from src/sensai/geoanalytics/coordinate_clustering.py
rename to src/sensai/geoanalytics/geopandas/coordinate_clustering.py
index 229213e2..88f901b4 100644
--- a/src/sensai/geoanalytics/coordinate_clustering.py
+++ b/src/sensai/geoanalytics/geopandas/coordinate_clustering.py
@@ -4,12 +4,12 @@
 from shapely.geometry import MultiPoint
 from typing import Callable, Union, Iterable
 
-from ..clustering.clustering_base import EuclideanClusterer
-from ..clustering import SkLearnEuclideanClusterer
-from ..clustering.sklearn_clustering import SkLearnClustererProtocol
-from ..util.cache import LoadSaveInterface
+from ...clustering.clustering_base import EuclideanClusterer
+from ...clustering import SkLearnEuclideanClusterer
+from ...clustering.sklearn_clustering import SkLearnClustererProtocol
+from ...util.cache import LoadSaveInterface
 from .coordinates import validateCoordinates, extractCoordinatesArray, TCoordinates, GeoDataFrameWrapper
-from ..util.profiling import timed
+from ...util.profiling import timed
 
 log = logging.getLogger(__name__)
 
diff --git a/src/sensai/geoanalytics/coordinate_clustering_ground_truth.py b/src/sensai/geoanalytics/geopandas/coordinate_clustering_ground_truth.py
similarity index 100%
rename from src/sensai/geoanalytics/coordinate_clustering_ground_truth.py
rename to src/sensai/geoanalytics/geopandas/coordinate_clustering_ground_truth.py
diff --git a/src/sensai/geoanalytics/coordinates.py b/src/sensai/geoanalytics/geopandas/coordinates.py
similarity index 97%
rename from src/sensai/geoanalytics/coordinates.py
rename to src/sensai/geoanalytics/geopandas/coordinates.py
index 6867bfad..c2414b75 100644
--- a/src/sensai/geoanalytics/coordinates.py
+++ b/src/sensai/geoanalytics/geopandas/coordinates.py
@@ -4,7 +4,7 @@
 from shapely.geometry import MultiPoint
 from typing import Union
 
-from ..clustering import EuclideanClusterer
+from ...clustering import EuclideanClusterer
 
 TCoordinates = Union[np.ndarray, MultiPoint, gp.GeoDataFrame, EuclideanClusterer.Cluster]
 
diff --git a/src/sensai/geoanalytics/geometry.py b/src/sensai/geoanalytics/geopandas/geometry.py
similarity index 100%
rename from src/sensai/geoanalytics/geometry.py
rename to src/sensai/geoanalytics/geopandas/geometry.py
diff --git a/src/sensai/geoanalytics/graph.py b/src/sensai/geoanalytics/geopandas/graph.py
similarity index 100%
rename from src/sensai/geoanalytics/graph.py
rename to src/sensai/geoanalytics/geopandas/graph.py
diff --git a/tests/frameworks/geoanalytics/test_geoanalytics.py b/tests/frameworks/geoanalytics/test_geoanalytics.py
index 999d99f5..07ba6b2a 100644
--- a/tests/frameworks/geoanalytics/test_geoanalytics.py
+++ b/tests/frameworks/geoanalytics/test_geoanalytics.py
@@ -1,3 +1,7 @@
-def test_geoanalytics():
-    import sensai.geoanalytics
+from sensai.util import markUsed
+
+
+def test_geoanalytics_geopandas():
+    import sensai.geoanalytics.geopandas
+    markUsed(sensai.geoanalytics.geopandas)
     assert True
\ No newline at end of file

From 31ecb4781ae1248b5428c96424af8edae596b87b Mon Sep 17 00:00:00 2001
From: Dominik Jain <dominik.jain@jambit.com>
Date: Sun, 8 May 2022 16:50:48 +0200
Subject: [PATCH 020/131] Added comment indicating preferred use of conda

---
 requirements-dev.txt | 1 +
 1 file changed, 1 insertion(+)

diff --git a/requirements-dev.txt b/requirements-dev.txt
index fc4f6fcd..5d623e77 100644
--- a/requirements-dev.txt
+++ b/requirements-dev.txt
@@ -1,3 +1,4 @@
+# This file has been superseded by environment.yml; use conda to install a developer environment
 PyQt5==5.14.1
 psutil==5.6.7
 torch==1.4.0

From 92f20ef83ecc7450cdca8302801792fed0685085 Mon Sep 17 00:00:00 2001
From: Dominik Jain <dominik.jain@jambit.com>
Date: Sun, 8 May 2022 16:51:25 +0200
Subject: [PATCH 021/131] Added new modules for geoanalytics dealing with
 geographic coordinates, local coordinate systems and map tiles

---
 docs/conf.py                               |   3 +-
 environment.yml                            |   1 +
 setup.py                                   |   7 +-
 src/sensai/geoanalytics/_globalmaptiles.py | 359 +++++++++++++++++++++
 src/sensai/geoanalytics/geo_coords.py      | 183 +++++++++++
 src/sensai/geoanalytics/local_coords.py    | 181 +++++++++++
 src/sensai/geoanalytics/map_tiles.py       |  57 ++++
 7 files changed, 789 insertions(+), 2 deletions(-)
 create mode 100644 src/sensai/geoanalytics/_globalmaptiles.py
 create mode 100644 src/sensai/geoanalytics/geo_coords.py
 create mode 100644 src/sensai/geoanalytics/local_coords.py
 create mode 100644 src/sensai/geoanalytics/map_tiles.py

diff --git a/docs/conf.py b/docs/conf.py
index cc989b07..ae65ad76 100644
--- a/docs/conf.py
+++ b/docs/conf.py
@@ -121,7 +121,8 @@ def findLineFromObjectName(sourceFile, objectName):
     "azure",
     "geopandas",
     "shapely",
-    "networkx"
+    "networkx",
+    "utm"
 ]
 
 # Render docu of __init__ methods
diff --git a/environment.yml b/environment.yml
index a51d3e9e..8c68ebaf 100644
--- a/environment.yml
+++ b/environment.yml
@@ -20,6 +20,7 @@ dependencies:
   - pyyaml=5.3
   - lightgbm=3.1.1
   - sphinx_rtd_theme
+  - utm
   - pip
   - pip:
       - -r file:requirements.txt
diff --git a/setup.py b/setup.py
index 0a983c24..665a2b45 100644
--- a/setup.py
+++ b/setup.py
@@ -6,17 +6,22 @@
 tf_requirements = ['tensorflow==1.15.0']
 torch_requirements = ['torch==1.4.0', 'torchtext==0.5.0']
 lightgbm_requirements = ['lightgbm==2.3.0']
-geoanalytics_requirements = ['networkx==2.4', 'Shapely~=1.7.0', 'geopandas==0.7.0']
+geoanalytics_requirements = ['networkx==2.4', 'Shapely~=1.7.0', 'geopandas==0.7.0', 'utm==0.7.0']
 
 
 # list of dependencies where ==/~= dependencies (used by us, particularly in requirements.txt) are relaxed:
 # any later version is OK (as long as we are not aware of a concrete limitation - and once we are, we shall define
 # the respective upper bound below)
+# TODO: check if we can relax all of the optional requirements as well (above)
 DEPS_VERSION_LOWER_BOUND = ["pandas", "scipy", "numpy", "scikit-learn", "seaborn", "typing-extensions"]
 DEPS_VERSION_UPPER_BOUND_EXCLUSIVE: Dict[str, str] = {}
 
 
 def required_packages(deps: Iterable[str]):
+    """
+    :param deps: the set of requirements
+    :return: the set of updated requirements with the relaxations defined above applied
+    """
     updated_deps = []
     for dep in deps:
         dep = dep.strip()
diff --git a/src/sensai/geoanalytics/_globalmaptiles.py b/src/sensai/geoanalytics/_globalmaptiles.py
new file mode 100644
index 00000000..da3d20bb
--- /dev/null
+++ b/src/sensai/geoanalytics/_globalmaptiles.py
@@ -0,0 +1,359 @@
+#!/usr/bin/env python
+###############################################################################
+# $Id$
+#
+# Project:  GDAL2Tiles, Google Summer of Code 2007 & 2008
+#           Global Map Tiles Classes
+# Purpose:  Convert a raster into TMS tiles, create KML SuperOverlay EPSG:4326,
+#           generate a simple HTML viewers based on Google Maps and OpenLayers
+# Author:   Klokan Petr Pridal, klokan at klokan dot cz
+# Web:      http://www.klokan.cz/projects/gdal2tiles/
+#
+###############################################################################
+# Copyright (c) 2008 Klokan Petr Pridal. All rights reserved.
+#
+# Permission is hereby granted, free of charge, to any person obtaining a
+# copy of this software and associated documentation files (the "Software"),
+# to deal in the Software without restriction, including without limitation
+# the rights to use, copy, modify, merge, publish, distribute, sublicense,
+# and/or sell copies of the Software, and to permit persons to whom the
+# Software is furnished to do so, subject to the following conditions:
+#
+# The above copyright notice and this permission notice shall be included
+# in all copies or substantial portions of the Software.
+#
+# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
+# OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
+# THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+# LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+# FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
+# DEALINGS IN THE SOFTWARE.
+###############################################################################
+
+"""
+_globalmaptiles.py
+
+Global Map Tiles as defined in MapTile Map Service (TMS) Profiles
+==============================================================
+
+Functions necessary for generation of global tiles used on the web.
+It contains classes implementing coordinate conversions for:
+
+  - GlobalMercator (based on EPSG:900913 = EPSG:3785)
+       for Google Maps, Yahoo Maps, Microsoft Maps compatible tiles
+  - GlobalGeodetic (based on EPSG:4326)
+       for OpenLayers Base Map and Google Earth compatible tiles
+
+More info at:
+
+http://wiki.osgeo.org/wiki/Tile_Map_Service_Specification
+http://wiki.osgeo.org/wiki/WMS_Tiling_Client_Recommendation
+http://msdn.microsoft.com/en-us/library/bb259689.aspx
+http://code.google.com/apis/maps/documentation/overlays.html#Google_Maps_Coordinates
+
+Created by Klokan Petr Pridal on 2008-07-03.
+Google Summer of Code 2008, project GDAL2Tiles for OSGEO.
+
+In case you use this class in your product, translate it to another language
+or find it usefull for your project please let me know.
+My email: klokan at klokan dot cz.
+I would like to know where it was used.
+
+Class is available under the open-source GDAL license (www.gdal.org).
+"""
+
+import math
+from typing import Tuple
+
+
+class GlobalMercator(object):
+    """
+    TMS Global Mercator Profile
+    ---------------------------
+
+    Functions necessary for generation of tiles in Spherical Mercator projection,
+    EPSG:900913 (EPSG:gOOglE, Google Maps Global Mercator), EPSG:3785, OSGEO:41001.
+
+    Such tiles are compatible with Google Maps, Microsoft Virtual Earth, Yahoo Maps,
+    UK Ordnance Survey OpenSpace API, ...
+    and you can overlay them on top of base maps of those web mapping applications.
+
+    Pixel and tile coordinates are in TMS notation (origin [0,0] in bottom-left).
+
+    What coordinate conversions do we need for TMS Global Mercator tiles::
+
+         LatLon      <->       Meters      <->     Pixels    <->       MapTile
+
+     WGS84 coordinates   Spherical Mercator  Pixels in pyramid  Tiles in pyramid
+         lat/lon            XY in metres     XY pixels Z zoom      XYZ from TMS
+        EPSG:4326           EPSG:900913
+         .----.              ---------               --                TMS
+        /      \     <->     |       |     <->     /----/    <->      Google
+        \      /             |       |           /--------/          QuadTree
+         -----               ---------         /------------/
+       KML, public         WebMapService         Web Clients      TileMapService
+
+    What is the coordinate extent of Earth in EPSG:900913?
+
+      [-20037508.342789244, -20037508.342789244, 20037508.342789244, 20037508.342789244]
+      Constant 20037508.342789244 comes from the circumference of the Earth in meters,
+      which is 40 thousand kilometers, the coordinate origin is in the middle of extent.
+      In fact you can calculate the constant as: 2 * math.pi * 6378137 / 2.0
+      $ echo 180 85 | gdaltransform -s_srs EPSG:4326 -t_srs EPSG:900913
+      Polar areas with abs(latitude) bigger than 85.05112878 are clipped off.
+
+    What are zoom level constants (pixels/meter) for pyramid with EPSG:900913?
+
+      whole region is on top of pyramid (zoom=0) covered by 256x256 pixels tile,
+      every lower zoom level resolution is always divided by two
+      initialResolution = 20037508.342789244 * 2 / 256 = 156543.03392804062
+
+    What is the difference between TMS and Google Maps/QuadTree tile name convention?
+
+      The tile raster itself is the same (equal extent, projection, pixel size),
+      there is just different identification of the same raster tile.
+      Tiles in TMS are counted from [0,0] in the bottom-left corner, id is XYZ.
+      Google placed the origin [0,0] to the top-left corner, reference is XYZ.
+      Microsoft is referencing tiles by a QuadTree name, defined on the website:
+      http://msdn2.microsoft.com/en-us/library/bb259689.aspx
+
+    The lat/lon coordinates are using WGS84 datum, yeh?
+
+      Yes, all lat/lon we are mentioning should use WGS84 Geodetic Datum.
+      Well, the web clients like Google Maps are projecting those coordinates by
+      Spherical Mercator, so in fact lat/lon coordinates on sphere are treated as if
+      they were on the WGS84 ellipsoid.
+
+      From MSDN documentation:
+      To simplify the calculations, we use the spherical form of projection, not
+      the ellipsoidal form. Since the projection is used only for map display,
+      and not for displaying numeric coordinates, we don't need the extra precision
+      of an ellipsoidal projection. The spherical projection causes approximately
+      0.33 percent scale distortion in the Y direction, which is not visually noticeable.
+
+    How do I create a raster in EPSG:900913 and convert coordinates with PROJ.4?
+
+      You can use standard GIS tools like gdalwarp, cs2cs or gdaltransform.
+      All of the tools supports -t_srs 'epsg:900913'.
+
+      For other GIS programs check the exact definition of the projection:
+      More info at http://spatialreference.org/ref/user/google-projection/
+      The same projection is defined as EPSG:3785. WKT definition is in the official
+      EPSG database.
+
+      Proj4 Text:
+        +proj=merc +a=6378137 +b=6378137 +lat_ts=0.0 +lon_0=0.0 +x_0=0.0 +y_0=0
+        +k=1.0 +units=m +nadgrids=@null +no_defs
+
+      Human readable WKT format of EPSG:900913:
+         PROJCS["Google Maps Global Mercator",
+             GEOGCS["WGS 84",
+                 DATUM["WGS_1984",
+                     SPHEROID["WGS 84",6378137,298.2572235630016,
+                         AUTHORITY["EPSG","7030"]],
+                     AUTHORITY["EPSG","6326"]],
+                 PRIMEM["Greenwich",0],
+                 UNIT["degree",0.0174532925199433],
+                 AUTHORITY["EPSG","4326"]],
+             PROJECTION["Mercator_1SP"],
+             PARAMETER["central_meridian",0],
+             PARAMETER["scale_factor",1],
+             PARAMETER["false_easting",0],
+             PARAMETER["false_northing",0],
+             UNIT["metre",1,
+                 AUTHORITY["EPSG","9001"]]]
+    """
+
+    def __init__(self, tileSize=256):
+        """
+        Initialize the TMS Global Mercator pyramid
+
+        :param tileSize: the tile size in pixels
+        """
+        self.tileSize = tileSize
+        self.initialResolution = 2 * math.pi * 6378137 / self.tileSize
+        # 156543.03392804062 for tileSize 256 pixels
+        self.originShift = 2 * math.pi * 6378137 / 2.0
+        # 20037508.342789244
+
+    def LatLonToMeters(self, lat: float, lon: float):
+        """Converts given lat/lon in WGS84 Datum to XY (mx, my) in Spherical Mercator EPSG:900913"""
+
+        mx = lon * self.originShift / 180.0
+        my = math.log(math.tan((90 + lat) * math.pi / 360.0)) / (math.pi / 180.0)
+
+        my = my * self.originShift / 180.0
+        return mx, my
+
+    def MetersToLatLon(self, mx, my):
+        """Converts XY point from Spherical Mercator EPSG:900913 to lat/lon in WGS84 Datum"""
+
+        lon = (mx / self.originShift) * 180.0
+        lat = (my / self.originShift) * 180.0
+
+        lat = 180 / math.pi * (2 * math.atan(math.exp(lat * math.pi / 180.0)) - math.pi / 2.0)
+        return lat, lon
+
+    def PixelsToMeters(self, px, py, zoom):
+        """Converts pixel coordinates in given zoom level of pyramid to EPSG:900913"""
+
+        res = self.Resolution(zoom)
+        mx = px * res - self.originShift
+        my = py * res - self.originShift
+        return mx, my
+
+    def MetersToPixels(self, mx, my, zoom):
+        """Converts EPSG:900913 to pyramid pixel coordinates in given zoom level"""
+
+        res = self.Resolution(zoom)
+        px = (mx + self.originShift) / res
+        py = (my + self.originShift) / res
+        return px, py
+
+    def PixelsToTile(self, px, py):
+        """Returns a tile covering region in given pixel coordinates"""
+
+        tx = int(math.ceil(px / float(self.tileSize)) - 1)
+        ty = int(math.ceil(py / float(self.tileSize)) - 1)
+        return tx, ty
+
+    def PixelsToRaster(self, px, py, zoom):
+        """Move the origin of pixel coordinates to top-left corner"""
+
+        mapSize = self.tileSize << zoom
+        return px, mapSize - py
+
+    def MetersToTile(self, mx, my, zoom):
+        """Returns tile for given mercator coordinates"""
+
+        px, py = self.MetersToPixels(mx, my, zoom)
+        return self.PixelsToTile(px, py)
+
+    def LatLonToTile(self, lat, lon, zoom) -> Tuple[int, int]:
+        return self.MetersToTile(*self.LatLonToMeters(lat, lon), zoom)
+
+    def TileBounds(self, tx, ty, zoom):
+        """Returns bounds of the given tile in EPSG:900913 coordinates"""
+
+        minx, miny = self.PixelsToMeters(tx*self.tileSize, ty*self.tileSize, zoom)
+        maxx, maxy = self.PixelsToMeters((tx+1)*self.tileSize, (ty+1)*self.tileSize, zoom)
+        return minx, miny, maxx, maxy
+
+    def TileLatLonBounds(self, tx, ty, zoom):
+        """Returns bounds (minLat, minLon, maxLat, maxLon) of the given tile in latitude/longitude using WGS84 datum"""
+
+        bounds = self.TileBounds(tx, ty, zoom)
+        minLat, minLon = self.MetersToLatLon(bounds[0], bounds[1])
+        maxLat, maxLon = self.MetersToLatLon(bounds[2], bounds[3])
+
+        return minLat, minLon, maxLat, maxLon
+
+    def Resolution(self, zoom):
+        """Resolution (meters/pixel) for given zoom level (measured at Equator)"""
+
+        # return (2 * math.pi * 6378137) / (self.tileSize * 2**zoom)
+        return self.initialResolution / (2**zoom)
+
+    def ZoomForPixelSize(self, pixelSize):
+        """Maximal scaledown zoom of the pyramid closest to the pixelSize (29, the deepest level, if pixelSize is below every resolution)."""
+        for i in range(30):
+            if pixelSize > self.Resolution(i):
+                return max(0, i - 1)  # We don't want to scale up
+        return 29  # pixelSize is finer than every checked level: use the deepest zoom instead of implicitly returning None
+
+    @staticmethod
+    def GoogleTile(tx, ty, zoom):
+        """Converts TMS tile coordinates to Google MapTile coordinates"""
+
+        # coordinate origin is moved from bottom-left to top-left corner of the extent
+        return tx, (2**zoom - 1) - ty
+
+    @staticmethod
+    def QuadTree(tx, ty, zoom):
+        """Converts TMS tile coordinates to Microsoft QuadTree"""
+
+        quadKey = ""
+        ty = (2**zoom - 1) - ty
+        for i in range(zoom, 0, -1):
+            digit = 0
+            mask = 1 << (i-1)
+            if (tx & mask) != 0:
+                digit += 1
+            if (ty & mask) != 0:
+                digit += 2
+            quadKey += str(digit)
+
+        return quadKey
+
+
+class GlobalGeodetic(object):
+    """
+    TMS Global Geodetic Profile
+    ---------------------------
+
+    Functions necessary for generation of global tiles in Plate Carre projection,
+    EPSG:4326, "unprojected profile".
+
+    Such tiles are compatible with Google Earth (as any other EPSG:4326 rasters)
+    and you can overlay the tiles on top of OpenLayers base map.
+
+    Pixel and tile coordinates are in TMS notation (origin [0,0] in bottom-left).
+
+    What coordinate conversions do we need for TMS Global Geodetic tiles?
+
+      Global Geodetic tiles are using geodetic coordinates (latitude,longitude)
+      directly as planar coordinates XY (it is also called Unprojected or Plate
+      Carre). We need only scaling to pixel pyramid and cutting to tiles.
+      Pyramid has on top level two tiles, so it is not square but rectangle.
+      Area [-180,-90,180,90] is scaled to 512x256 pixels.
+      TMS has coordinate origin (for pixels and tiles) in bottom-left corner.
+      Rasters are in EPSG:4326 and therefore are compatible with Google Earth.
+
+         LatLon      <->      Pixels      <->     Tiles
+
+     WGS84 coordinates   Pixels in pyramid  Tiles in pyramid
+         lat/lon         XY pixels Z zoom      XYZ from TMS
+        EPSG:4326
+         .----.                ----
+        /      \     <->    /--------/    <->      TMS
+        \      /         /--------------/
+         -----        /--------------------/
+       WMS, KML    Web Clients, Google Earth  TileMapService
+    """
+
+    def __init__(self, tileSize=256):
+        self.tileSize = tileSize
+
+    @staticmethod
+    def LatLonToPixels(lat, lon, zoom):
+        """Converts lat/lon to pixel coordinates (px, py) in given zoom of the EPSG:4326 pyramid"""
+
+        res = 180 / 256.0 / 2**zoom
+        px = (180 + lon) / res  # x axis spans longitude [-180, 180], consistent with TileBounds
+        py = (90 + lat) / res  # y axis spans latitude [-90, 90], consistent with TileBounds
+        return px, py
+
+    def PixelsToTile(self, px, py):
+        """Returns coordinates of the tile covering region in pixel coordinates"""
+
+        tx = int(math.ceil(px / float(self.tileSize)) - 1)
+        ty = int(math.ceil(py / float(self.tileSize)) - 1)
+        return tx, ty
+
+    @staticmethod
+    def Resolution(zoom):
+        """Resolution (arc/pixel) for given zoom level (measured at Equator)"""
+
+        return 180 / 256.0 / 2**zoom
+        #return 180 / float(1 << (8+zoom))
+
+    @staticmethod
+    def TileBounds(tx, ty, zoom):
+        """Returns bounds of the given tile"""
+        res = 180 / 256.0 / 2**zoom
+        return (
+            tx*256*res - 180,
+            ty*256*res - 90,
+            (tx+1)*256*res - 180,
+            (ty+1)*256*res - 90)
diff --git a/src/sensai/geoanalytics/geo_coords.py b/src/sensai/geoanalytics/geo_coords.py
new file mode 100644
index 00000000..93b78398
--- /dev/null
+++ b/src/sensai/geoanalytics/geo_coords.py
@@ -0,0 +1,183 @@
+"""
+Utility functions and classes for geographic coordinates
+"""
+
+import math
+from typing import Tuple
+
+import pandas as pd
+
+from .local_coords import LocalCoordinateSystem
+from ..util.string import ToStringMixin
+
+
+EARTH_RADIUS = 6371000
+EARTH_CIRCUMFERENCE = 2 * math.pi * EARTH_RADIUS
+LATITUDE_PER_METRE = 360.0 / EARTH_CIRCUMFERENCE
+
+
+def longitudePerM(latitude):
+    return LATITUDE_PER_METRE / math.cos(math.radians(latitude))
+
+
+def latitudePerM():
+    return LATITUDE_PER_METRE
+
+
+def approximateSquaredDistance(p1: Tuple[float, float], p2: Tuple[float, float]):
+    """
+    :param p1: a tuple (latitude, longitude)
+    :param p2: a tuple (latitude, longitude)
+    :return: the approximate squared distance (in m²) between p1 and p2
+    """
+    latPerM = latitudePerM()
+    p1lat, p1lon = p1
+    p2lat, p2lon = p2
+    lonPerM = longitudePerM((p1lat + p2lat) / 2)
+    dx = (p2lon - p1lon) / lonPerM
+    dy = (p2lat - p1lat) / latPerM
+    return dx * dx + dy * dy
+
+
+def closestPointOnSegment(searchPos: Tuple[float, float], segPoint1: Tuple[float, float], segPoint2: Tuple[float, float]):
+    """
+    Gets the point on the line segment connecting segPoint1 and segPoint2 that is closest to searchPos
+
+    :param searchPos: the position for which to search for the closest point on the line segment
+    :param segPoint1: the first point defining the line segment on which to search
+    :param segPoint2: the second point defining the line segment on which to search
+    :return: the closest point, which is on the line connecting segPoint1 and segPoint2 (and may be one of the two points)
+    """
+    seg1lat, seg1lon = segPoint1
+    seg2lat, seg2lon = segPoint2
+    srchlat, srchlon = searchPos
+    latPerM = latitudePerM()
+    lonPerM = longitudePerM(srchlat)
+    sp1x = (seg1lon - srchlon) / lonPerM
+    sp1y = (seg1lat - srchlat) / latPerM
+    sp2x = (seg2lon - srchlon) / lonPerM
+    sp2y = (seg2lat - srchlat) / latPerM
+    vx = sp2x - sp1x
+    vy = sp2y - sp1y
+    c1 = -vx * sp1x - vy * sp1y
+    if c1 <= 0:
+        return segPoint1
+    c2 = vx * vx + vy * vy
+    if c2 <= c1:
+        return segPoint2
+    b = 0 if c2 == 0 else c1 / c2
+    lon = seg1lon + b * vx * lonPerM
+    lat = seg1lat + b * vy * latPerM
+    return [lat, lon]
+
+
+def orientation(p1: Tuple[float, float], p2: Tuple[float, float]) -> float:
+    """
+    Gets the orientation angle for the vector from p1 to p2
+
+    :param p1: a (lat, lon) pair
+    :param p2: a (lat, lon) pair
+    :return: the orientation angle in rad
+    """
+    p1Lat, p1Lon = p1
+    p2Lat, p2Lon = p2
+    centerLat = (p1Lat + p2Lat) / 2
+    dx = (p2Lon - p1Lon) / longitudePerM(centerLat)
+    dy = (p2Lat - p1Lat) / latitudePerM()
+    return math.atan2(dy, dx)
+
+
+def absAngleDifference(a1: float, a2: float) -> float:
+    """
+    Computes the absolute angle difference in [0, pi] between two angles
+
+    :param a1: an angle in rad
+    :param a2: an angle in rad
+    :return: the absolute difference in rad
+    """
+    d = a1 - a2  # signed difference, wrapped into ]-pi, pi] below before taking the absolute value
+    while d > math.pi:
+        d -= 2*math.pi
+    while d <= -math.pi:
+        d += 2*math.pi
+    return abs(d)
+
+
+def closestPointOnPolyline(searchPos, polyline, searchOrientationAngle=None, maxAngleDifference=0) -> Tuple[Tuple[float, float], float, int]:
+    """
+    Gets the point on the given polyline that is closest to the given search position along with the
+    distance (in metres) to the polyline
+
+    :param searchPos: a (lat, lon) pair indicating the position for which to find the closest match on the polyline
+    :param polyline: list of (lat, lon) pairs that make up the polyline on which to search
+    :param searchOrientationAngle: if not None, defines the orientation with which to compute angle differences (if maxAngleDifference > 0)
+    :param maxAngleDifference: the maximum absolute angle difference (in rad) that is admissible (between the orientation of the
+        respective line segment and the orientation given in searchOrientationAngle)
+    :return: a tuple (optPoint, optDist, optSegmentStartIdx) where
+        optPoint is the closest point (with admissible orientation - or None if there is none),
+        optDist is the approximate distance from searchPos to the closest point (None if there is no admissible point),
+        optSegmentStartIdx is the index of the first point of the segment on the polyline for which the closest point was found
+    """
+    if len(polyline) < 2:
+        raise Exception("Polyline must consist of at least two points")
+    optSegmentStartIdx = None
+    optPoint = None
+    optSqDist = None
+    for i in range(len(polyline)-1):
+        if maxAngleDifference > 0 and searchOrientationAngle is not None:  # without a reference orientation there is nothing to filter on
+            orientationAngle = orientation(polyline[i], polyline[i+1])
+            angDiff = absAngleDifference(orientationAngle, searchOrientationAngle)
+            if angDiff > maxAngleDifference:
+                continue
+        optSegPoint = closestPointOnSegment(searchPos, polyline[i], polyline[i + 1])
+        sqDist = approximateSquaredDistance(searchPos, optSegPoint)
+        if optSqDist is None or sqDist < optSqDist:
+            optPoint = optSegPoint
+            optSqDist = sqDist
+            optSegmentStartIdx = i
+    return optPoint, (None if optSqDist is None else math.sqrt(optSqDist)), optSegmentStartIdx  # all None if every segment was filtered out
+
+
+class GeoCoord(ToStringMixin):
+    """
+    Represents geographic coordinates (WGS84)
+    """
+    def __init__(self, lat: float, lon: float):
+        self.lat = lat
+        self.lon = lon
+
+    def latlon(self):
+        return self.lat, self.lon
+
+    def distanceTo(self, gpsPosition: 'GeoCoord'):
+        return math.sqrt(self.squaredDistanceTo(gpsPosition))
+
+    def squaredDistanceTo(self, gpsPosition: 'GeoCoord'):
+        return approximateSquaredDistance(self.latlon(), gpsPosition.latlon())
+
+    def localCoords(self, lcs):
+        return lcs.getLocalCoords(self.lat, self.lon)
+
+
+class GpsTracePoint(GeoCoord):
+    def __init__(self, lat, lon, time: pd.Timestamp):
+        super().__init__(lat, lon)
+        self.time = time
+
+
+class GeoRect:
+    def __init__(self, minLat: float, minLon: float, maxLat: float, maxLon: float):
+        if maxLat < minLat or maxLon < minLon:
+            raise ValueError()
+        self.minLat = minLat
+        self.minLon = minLon
+        self.maxLat = maxLat
+        self.maxLon = maxLon
+
+    @staticmethod
+    def fromCircle(centreLat, centreLon, radiusM):
+        """Creates the bounding rectangle for the given circular area"""
+        lcs = LocalCoordinateSystem(centreLat, centreLon)
+        minLat, minLon = lcs.getLatLon(-radiusM, -radiusM)
+        maxLat, maxLon = lcs.getLatLon(radiusM, radiusM)
+        return GeoRect(minLat, minLon, maxLat, maxLon)
diff --git a/src/sensai/geoanalytics/local_coords.py b/src/sensai/geoanalytics/local_coords.py
new file mode 100644
index 00000000..b0e69173
--- /dev/null
+++ b/src/sensai/geoanalytics/local_coords.py
@@ -0,0 +1,181 @@
+"""
+Local coordinate systems (for geographic data)
+"""
+import math
+from functools import reduce
+from typing import Tuple, Union, List
+
+import numpy as np
+import utm
+from shapely.geometry import polygon, multipolygon, point, LineString, mapping
+from shapely.ops import polygonize, unary_union
+
+
+class LocalCoordinateSystem(object):
+    """
+    Represents a local coordinate system for the conversion of geo-coordinates
+    (latitude, longitude) to a local Cartesian coordinate system (unit=metre) and vice versa
+    using the UTM transform
+    """
+
+    def __init__(self, lat, lon):
+        """
+        Parameters:
+            lat: the latitude of the origin of the coordinate system
+            lon: the longitude of the origin of the coordinate system
+        """
+        self.uRef = utm.from_latlon(lat, lon)
+        self.uRefE = self.uRef[0]
+        self.uRefN = self.uRef[1]
+        self.uRefPseudoN = self._pseudoNorthing(self.uRefN)
+
+    def getLocalCoords(self, lat, lon) -> Tuple[float, float]:
+        uE, uN, zM, zL = utm.from_latlon(lat, lon)
+        x = uE - self.uRefE
+        y = self._pseudoNorthing(uN) - self.uRefPseudoN
+        return x, y
+
+    def getLatLon(self, localX, localY) -> Tuple[float, float]:
+        easting = localX + self.uRefE
+        pseudoNorthing = localY + self.uRefPseudoN
+        return utm.to_latlon(easting, self._realNorthing(pseudoNorthing), self.uRef[2], self.uRef[3])
+
+    @staticmethod
+    def _pseudoNorthing(realNorthing):
+        if realNorthing >= 10000000:
+            return realNorthing - 10000000
+        else:
+            return realNorthing
+
+    @staticmethod
+    def _realNorthing(pseudoNorthing):
+        if pseudoNorthing < 0:
+            return pseudoNorthing + 10000000
+        else:
+            return pseudoNorthing
+
+
+class LocalHexagonalGrid:
+    """
+    A local hexagonal grid, where hex cells can be referenced by two integer coordinates relative to
+    the central grid cell, whose centre is at local coordinate (0, 0) and where positive x-coordinates/columns
+    are towards the east and positive y-coordinates/rows are towards the north.
+    Every odd row of cells is shifted half a hexagon to the right, i.e. column x for row 1 is half a grid cell
+    further to the right than column x for row 0.
+
+    For visualisation purposes, see https://www.redblobgames.com/grids/hexagons/
+    """
+    def __init__(self, radiusM):
+        """
+        :param radiusM: the radius, in metres, of each hex cell
+        """
+        self.radiusM = radiusM
+        startAngle = math.pi / 6
+        stepAngle = math.pi / 3
+        self.offsetVectors = []
+        for i in range(6):
+            angle = startAngle + i * stepAngle
+            x = math.cos(angle) * radiusM
+            y = math.sin(angle) * radiusM
+            self.offsetVectors.append(np.array([x, y]))
+        self.hexagonWidth = 2 * self.offsetVectors[0][0]
+        self.hexagonHeight = 2 * self.offsetVectors[1][1]
+        self.rowStep = 0.75 * self.hexagonHeight
+        self.polygonArea = 6 * self.hexagonHeight * self.hexagonWidth / 8
+
+    def getHexagon(self, xColumn: int, yRow: int) -> polygon.Polygon:
+        """
+        Gets the hexagon (polygon) for the given integer hex cell coordinates
+        :param xColumn: the column coordinate
+        :param yRow: the row coordinate
+        :return: the hexagon
+        """
+        centreX = xColumn * self.hexagonWidth
+        centreY = yRow * self.rowStep
+        if yRow % 2 == 1:
+            centreX += 0.5 * self.hexagonWidth
+        centre = np.array([centreX, centreY])
+        return polygon.Polygon([centre + o for o in self.offsetVectors])
+
+    def getMinHexagonColumn(self, x):
+        lowestXDefinitelyInColumn0 = 0
+        return math.floor((x - lowestXDefinitelyInColumn0) / self.hexagonWidth)
+
+    def getMaxHexagonColumn(self, x):
+        highestXDefinitelyInColumn0 = self.hexagonWidth / 2
+        return math.ceil((x - highestXDefinitelyInColumn0) / self.hexagonWidth)
+
+    def getMinHexagonRow(self, y):
+        lowestYDefinitelyInRow0 = -self.hexagonHeight / 4
+        return math.floor((y - lowestYDefinitelyInRow0) / self.rowStep)
+
+    def getMaxHexagonRow(self, y):
+        highestYDefinitelyInRow0 = self.hexagonHeight / 4
+        return math.ceil((y - highestYDefinitelyInRow0) / self.rowStep)
+
+    def getHexagonCoordSpanForBoundingBox(self, minX, minY, maxX, maxY) -> Tuple[Tuple[int, int], Tuple[int, int]]:
+        """
+        Gets the range of hex-cell coordinates that cover the given bounding box
+
+        :param minX: minimum x-coordinate of bounding box
+        :param minY: minimum y-coordinate of bounding box
+        :param maxX: maximum  x-coordinate of bounding box
+        :param maxY: maximum y-coordinate of bounding box
+        :return: a pair of pairs ((minCol, minRow), (maxCol, maxRow)) indicating the span of cell coordinates
+        """
+        if minX > maxX or minY > maxY:
+            raise ValueError()
+        minColumn = self.getMinHexagonColumn(minX)
+        maxColumn = self.getMaxHexagonColumn(maxX)
+        minRow = self.getMinHexagonRow(minY)
+        maxRow = self.getMaxHexagonRow(maxY)
+        return ((minColumn, minRow), (maxColumn, maxRow))
+
+    def getHexagonCoordsForPoint(self, x, y):
+        ((minColumn, minRow), (maxColumn, maxRow)) = self.getHexagonCoordSpanForBoundingBox(x, y, x, y)
+        for xCol in range(minColumn, maxColumn+1):
+            for yRow in range(minRow, maxRow+1):
+                if self.getHexagon(xCol, yRow).contains(point.Point(x, y)):
+                    return xCol, yRow
+        raise Exception("No Hexagon matched; possible edge case (point on hexagon boundary)")
+
+
+def fixPolygon(poly: Union[polygon.Polygon, multipolygon.MultiPolygon], maxAreaDiff=1e-2) -> Union[polygon.Polygon, multipolygon.MultiPolygon]:
+    """
+    Fix invalid shapely polygons or multipolygons.
+
+    Reference:
+    https://stackoverflow.com/questions/35110632/splitting-self-intersecting-polygon-only-returned-one-polygon-in-shapely
+
+    :param poly: the polygon to fix
+    :param maxAreaDiff: the maximum change in area
+    :return: the fixed polygon or None if it cannot be fixed given the area change constraint
+    """
+    def _fixPolygonComponent(coords: List[Tuple[float, float]]):
+        res = list(polygonize(unary_union(LineString(list(coords) + [coords[0]]))))
+        return reduce(lambda p1, p2: p1.union(p2), res)
+
+    if poly.is_valid:
+        return poly
+    else:
+        if isinstance(poly, polygon.Polygon):
+            exteriorCoords = poly.exterior.coords[:]
+            fixedExterior = _fixPolygonComponent(exteriorCoords)
+            fixedInterior = polygon.Polygon()
+            for interior in poly.interiors:
+                coords = interior.coords[:]
+                fixedInterior = fixedInterior.union(_fixPolygonComponent(coords))
+            fixedPolygon = fixedExterior.difference(fixedInterior)
+        elif isinstance(poly, multipolygon.MultiPolygon):
+            polys = list(poly)
+            fixedPolys = [fixPolygon(p, maxAreaDiff=maxAreaDiff) for p in polys]
+            fixedPolygon = reduce(lambda p1, p2: p1.union(p2), fixedPolys)
+        else:
+            raise Exception(f"Unsupported type {type(poly)}")
+        areaDiff = float('Inf') if poly.area == 0 else abs(poly.area - fixedPolygon.area) / poly.area
+        #log.info(f"Invalid polygon\n{poly}\nComputed fix:\n{fixedPolygon}.\nArea error: {areaDiff}")
+        if areaDiff > maxAreaDiff:
+            return None
+        else:
+            return fixedPolygon
+
diff --git a/src/sensai/geoanalytics/map_tiles.py b/src/sensai/geoanalytics/map_tiles.py
new file mode 100644
index 00000000..afb91fc9
--- /dev/null
+++ b/src/sensai/geoanalytics/map_tiles.py
@@ -0,0 +1,57 @@
+"""
+Utility functions and classes for map tiles
+"""
+
+import math
+from typing import Tuple, List, Generator
+
+from ._globalmaptiles import GlobalMercator
+from .geo_coords import GeoRect
+
+EARTH_RADIUS = 6371000
+EARTH_CIRCUMFERENCE = 2 * math.pi * EARTH_RADIUS
+LATITUDE_PER_METRE = 360.0 / EARTH_CIRCUMFERENCE
+
+
+
+class MapTile:
+    def __init__(self, tx: int, ty: int, rect: GeoRect, zoom: int):
+        self.tx = tx
+        self.ty = ty
+        self.rect = rect
+        self.zoom = zoom
+
+
+class MapTiles:
+    def __init__(self, zoom=13):
+        self.zoom = zoom
+        self._mercator = GlobalMercator()
+        self._tiles = {}
+
+    def _getTile(self, tx, ty):
+        key = (tx, ty)
+        tile = self._tiles.get(key)
+        if tile is None:
+            tile = MapTile(tx, ty, GeoRect(*self._mercator.TileLatLonBounds(tx, ty, self.zoom)), self.zoom)
+            self._tiles[key] = tile
+        return tile
+
+    def iterTileCoordinatesInRect(self, rect: GeoRect) -> Generator[Tuple[int, int], None, None]:
+        tx1, ty1 = self._mercator.LatLonToTile(rect.minLat, rect.minLon, self.zoom)
+        tx2, ty2 = self._mercator.LatLonToTile(rect.maxLat, rect.maxLon, self.zoom)
+        txMin = min(tx1, tx2)
+        txMax = max(tx1, tx2)
+        tyMin = min(ty1, ty2)
+        tyMax = max(ty1, ty2)
+        for tx in range(txMin, txMax+1):
+            for ty in range(tyMin, tyMax+1):
+                yield tx, ty
+
+    def getTilesInRect(self, rect: GeoRect) -> List[MapTile]:
+        return [self._getTile(tx, ty) for tx, ty in self.iterTileCoordinatesInRect(rect)]
+
+    def getTile(self, lat: float, lon: float) -> MapTile:
+        return self._getTile(*self.getTileCoordinates(lat, lon))
+
+    def getTileCoordinates(self, lat: float, lon: float) -> Tuple[int, int]:
+        return self._mercator.LatLonToTile(lat, lon, self.zoom)
\ No newline at end of file

From 293ac17be6cffc26e1676284340347f76b0b0a88 Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Mon, 9 May 2022 23:34:39 +0200
Subject: [PATCH 022/131] Fixed no longer supported syntax for inclusion of
 requirements.txt

Grouped dependencies by function, limiting build-related deps to tox
(excluding docs/sphinx-related deps, because once we add notebooks where
the installation of sensai in the environment is a requirement,
tox will be the preferred way of building the docs)
---
 environment.yml | 23 ++++++++++++++---------
 1 file changed, 14 insertions(+), 9 deletions(-)

diff --git a/environment.yml b/environment.yml
index 8c68ebaf..4ce2bfb4 100644
--- a/environment.yml
+++ b/environment.yml
@@ -5,7 +5,10 @@ channels:
   - anaconda
   - defaults
 dependencies:
+  # basics
   - python=3.7
+  - pip
+  # optional sensai dependencies for development
   - pytorch=1.4.0
   - tensorflow=1.14.0
   - pyqt=5.12
@@ -13,15 +16,17 @@ dependencies:
   - pytorch=1.4.0
   - catboost=0.23
   - xgboost=1.4.0
+  - lightgbm=3.1.1
+  - utm=0.7.0
+  # for notebook support
+  - jupyter
+  # for tests
   - pytest=5.4.1
-  - tox=3.14.6
+  # for release process
   - bump2version
-  - jupyter
-  - pyyaml=5.3
-  - lightgbm=3.1.1
-  - sphinx_rtd_theme
-  - utm
-  - pip
   - pip:
-      - -r file:requirements.txt
-      - nbsphinx
\ No newline at end of file
+      # non-optional sensai dependencies
+      - -r requirements.txt
+      # required for locally running the tox build
+      - tox
+      - virtualenv
\ No newline at end of file

From b46f2d02024f164bfb2201f8747c034e5cfe9bc3 Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Mon, 9 May 2022 23:38:24 +0200
Subject: [PATCH 023/131] Extended the section on the docs build, adding
 instructions for a manual build (e.g. under Windows, where the tox build has
 problems)

---
 README-dev.md | 27 +++++++++++++++++++++++++--
 1 file changed, 25 insertions(+), 2 deletions(-)

diff --git a/README-dev.md b/README-dev.md
index 384b11b5..599edc06 100644
--- a/README-dev.md
+++ b/README-dev.md
@@ -7,9 +7,32 @@ The tests and docs build are executed via **tox** in several environments:
 
 ## Docs Build
 
-Docs are automatically created, all .rst files are auto-generated; only `index.rst` is manually defined.
+Docs are automatically created during the GitHub build via tox.
 
-Make sure that any optional sensAI dependencies (which are not included in the `docs` tox environment) are added to `docs/conf.py` under `autodoc_mock_imports`.
+All .rst files are auto-generated, with the exception of the root index file  `index.rst`.
+
+### Dependency Handling
+
+**Attention**: Make sure that any optional sensAI dependencies (which are not included in the `docs` tox environment) are added to `docs/conf.py` under `autodoc_mock_imports`.
+
+### Manually Running the Docs Build
+
+The docs build is designed to be run by tox. As soon as a single iPython notebook is included, `sensai` must be available as an installed dependency in the environment in which the docs build is run, as the notebook execution takes place in a Jupyter environment.
+
+Under Linux, running tox should work fine. Under Windows, we are yet to succeed.
+
+To run the docs build without tox, first create an environment that has the additional requirements installed and, most importantly, sensai installed.
+
+    conda env create -n sensai-docs -f environment.yml
+    conda activate sensai-docs
+    pip install sphinx sphinx_rtd_theme nbsphinx
+    pip install .
+    
+The last command obviously needs to be repeated every time the library changes.
+In the new environment `sensai-docs`, we can then run the sphinx build
+
+    rm -rf docs-build; mkdir docs-build
+    sphinx-build -b html docs docs-build
 
 # Creating a New Release
 

From e348a7206b653831b1651a92f78626c40f8f57c9 Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Sun, 15 May 2022 17:15:04 +0200
Subject: [PATCH 024/131] Added default imports

---
 src/sensai/evaluation/__init__.py | 4 +++-
 1 file changed, 3 insertions(+), 1 deletion(-)

diff --git a/src/sensai/evaluation/__init__.py b/src/sensai/evaluation/__init__.py
index 868cea30..c3d11de9 100644
--- a/src/sensai/evaluation/__init__.py
+++ b/src/sensai/evaluation/__init__.py
@@ -1,8 +1,10 @@
 from .crossval import VectorClassificationModelCrossValidator, VectorRegressionModelCrossValidator, \
-    VectorClassificationModelCrossValidationData, VectorRegressionModelCrossValidationData
+    VectorClassificationModelCrossValidationData, VectorRegressionModelCrossValidationData, \
+    VectorModelCrossValidatorParams
 from .eval_util import RegressionEvaluationUtil, ClassificationEvaluationUtil, MultiDataEvaluationUtil, \
     evalModelViaEvaluator, createEvaluationUtil, createVectorModelEvaluator, createVectorModelCrossValidator
 from .evaluator import VectorClassificationModelEvaluator, VectorRegressionModelEvaluator, \
+    VectorRegressionModelEvaluatorParams, VectorClassificationModelEvaluatorParams, \
     VectorRegressionModelEvaluationData, VectorClassificationModelEvaluationData, \
     RuleBasedVectorClassificationModelEvaluator, RuleBasedVectorRegressionModelEvaluator
 

From 1aa72afed80e760c06541ef6151af0bc77a55c99 Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Sun, 15 May 2022 17:19:10 +0200
Subject: [PATCH 025/131] EvalStats: Renamed getAll -> getMetricsDict,
 retaining getAll as alias

EvalStatsCollection:
  * Renamed aggStats -> aggMetricsDict, adding option to specify aggregation functions
  * Renamed meanStats -> meanMetricsDict
---
 src/sensai/evaluation/crossval.py             |  2 +-
 .../evaluation/eval_stats/eval_stats_base.py  | 29 ++++++++++++-------
 .../eval_stats/eval_stats_classification.py   |  5 ++--
 .../eval_stats/eval_stats_clustering.py       |  4 +--
 src/sensai/evaluation/eval_util.py            |  6 ++--
 src/sensai/evaluation/evaluator.py            |  6 ++--
 src/sensai/evaluation/evaluator_clustering.py |  2 +-
 7 files changed, 30 insertions(+), 24 deletions(-)

diff --git a/src/sensai/evaluation/crossval.py b/src/sensai/evaluation/crossval.py
index 4fe251d9..1b339d3a 100644
--- a/src/sensai/evaluation/crossval.py
+++ b/src/sensai/evaluation/crossval.py
@@ -193,7 +193,7 @@ def _computeMetrics(self, model: VectorModel, **kwargs):
 
     def _computeMetricsForVarName(self, model, predictedVarName: Optional[str]):
         data = self.evalModel(model)
-        return data.getEvalStatsCollection(predictedVarName=predictedVarName).aggStats()
+        return data.getEvalStatsCollection(predictedVarName=predictedVarName).aggMetricsDict()
 
     def createMetricsDictProvider(self, predictedVarName: Optional[str]) -> MetricsDictProvider:
         """
diff --git a/src/sensai/evaluation/eval_stats/eval_stats_base.py b/src/sensai/evaluation/eval_stats/eval_stats_base.py
index af6d1080..2a135508 100644
--- a/src/sensai/evaluation/eval_stats/eval_stats_base.py
+++ b/src/sensai/evaluation/eval_stats/eval_stats_base.py
@@ -40,15 +40,23 @@ def addMetric(self, metric: TMetric):
     def computeMetricValue(self, metric: TMetric) -> float:
         return metric.computeValueForEvalStats(self)
 
-    def getAll(self) -> Dict[str, float]:
-        """Gets a dictionary with all metrics"""
+    def metricsDict(self) -> Dict[str, float]:
+        """
+        Computes all metrics
+
+        :return: a dictionary mapping metric names to values
+        """
         d = {}
         for metric in self.metrics:
             d[metric.name] = self.computeMetricValue(metric)
         return d
 
+    def getAll(self) -> Dict[str, float]:
+        """Alias for metricsDict; may be deprecated in the future"""
+        return self.metricsDict()
+
     def _toStringObjectInfo(self) -> str:
-        return dictString(self.getAll())
+        return dictString(self.metricsDict())
 
 
 TEvalStats = TypeVar("TEvalStats", bound=EvalStats)
@@ -75,7 +83,7 @@ def __init__(self, evalStatsList: List[TEvalStats]):
         metricNamesSet = None
         metricsList = []
         for es in evalStatsList:
-            metrics = es.getAll()
+            metrics = es.metricsDict()
             currentMetricNamesSet = set(metrics.keys())
             if metricNamesSet is None:
                 metricNamesSet = currentMetricNamesSet
@@ -89,16 +97,15 @@ def __init__(self, evalStatsList: List[TEvalStats]):
     def getValues(self, metric):
         return self.metrics[metric]
 
-    def aggStats(self):
+    def aggMetricsDict(self, aggFns=(np.mean, np.std)) -> Dict[str, float]:
         agg = {}
         for metric, values in self.metrics.items():
-            agg[f"mean[{metric}]"] = float(np.mean(values))
-            agg[f"std[{metric}]"] = float(np.std(values))
+            for aggFn in aggFns:
+                agg[f"{aggFn.__name__}[{metric}]"] = float(aggFn(values))
         return agg
 
-    def meanStats(self):
+    def meanMetricsDict(self) -> Dict[str, float]:
         metrics = {metric: np.mean(values) for (metric, values) in self.metrics.items()}
-        metrics.update({f"StdDev[{metric}]": np.std(values) for (metric, values) in self.metrics.items()})
         return metrics
 
     def plotDistribution(self, metric):
@@ -124,7 +131,7 @@ def getGlobalStats(self) -> TEvalStats:
 
     def __str__(self):
         return f"{self.__class__.__name__}[" + \
-               ", ".join([f"{key}={self.aggStats()[key]:.4f}" for key in self.metrics]) + "]"
+               ", ".join([f"{key}={self.aggMetricsDict()[key]:.4f}" for key in self.metrics]) + "]"
 
 
 class PredictionEvalStats(EvalStats[TMetric], ABC):
@@ -213,7 +220,7 @@ def meanStats(evalStatsList: Sequence[EvalStats]) -> Dict[str, float]:
     For a list of EvalStats objects compute the mean values of all metrics in a dictionary.
     Assumes that all provided EvalStats have the same metrics
     """
-    dicts = [s.getAll() for s in evalStatsList]
+    dicts = [s.metricsDict() for s in evalStatsList]
     metrics = dicts[0].keys()
     return {m: np.mean([d[m] for d in dicts]) for m in metrics}
 
diff --git a/src/sensai/evaluation/eval_stats/eval_stats_classification.py b/src/sensai/evaluation/eval_stats/eval_stats_classification.py
index 8db7806c..ed01dc37 100644
--- a/src/sensai/evaluation/eval_stats/eval_stats_classification.py
+++ b/src/sensai/evaluation/eval_stats/eval_stats_classification.py
@@ -1,6 +1,6 @@
 from abc import ABC, abstractmethod
 from dataclasses import dataclass
-from typing import List, Sequence, Optional
+from typing import List, Sequence, Optional, Dict
 import logging
 
 from matplotlib import pyplot as plt
@@ -200,8 +200,7 @@ def getBinaryClassificationProbabilityThresholdVariationData(self) -> "BinaryCla
     def getAccuracy(self):
         return self.computeMetricValue(ClassificationMetricAccuracy())
 
-    def getAll(self):
-        """Gets a dictionary with all metrics"""
+    def metricsDict(self) -> Dict[str, float]:
         d = {}
         for metric in self.metrics:
             if not metric.requiresProbabilities or self._probabilitiesAvailable:
diff --git a/src/sensai/evaluation/eval_stats/eval_stats_clustering.py b/src/sensai/evaluation/eval_stats/eval_stats_clustering.py
index 680fc848..0838fa22 100644
--- a/src/sensai/evaluation/eval_stats/eval_stats_clustering.py
+++ b/src/sensai/evaluation/eval_stats/eval_stats_clustering.py
@@ -47,8 +47,8 @@ def getDistributionSummary(self) -> Dict[str, float]:
             result[self.NOISE_SIZE] = int(self.noiseClusterSize)
         return result
 
-    def getAll(self) -> Dict[str, float]:
-        metricsDict = super().getAll()
+    def metricsDict(self) -> Dict[str, float]:
+        metricsDict = super().metricsDict()
         metricsDict.update(self.getDistributionSummary())
         return metricsDict
 
diff --git a/src/sensai/evaluation/eval_util.py b/src/sensai/evaluation/eval_util.py
index 79d0bfd8..cd14f4c5 100644
--- a/src/sensai/evaluation/eval_util.py
+++ b/src/sensai/evaluation/eval_util.py
@@ -289,7 +289,7 @@ def performCrossValidation(self, model: TModel, showPlots=False, logResults=True
         resultWriter = self._resultWriterForModel(resultWriter, model)
         crossValidator = self.createCrossValidator(model)
         crossValidationData = crossValidator.evalModel(model)
-        aggStatsByVar = {varName: crossValidationData.getEvalStatsCollection(predictedVarName=varName).aggStats()
+        aggStatsByVar = {varName: crossValidationData.getEvalStatsCollection(predictedVarName=varName).aggMetricsDict()
                 for varName in crossValidationData.predictedVarNames}
         df = pd.DataFrame.from_dict(aggStatsByVar, orient="index")
         strEvalResults = df.to_string()
@@ -326,13 +326,13 @@ def compareModels(self, models: Sequence[TModel], resultWriter: Optional[ResultW
                     raise ValueError("Cross-validation necessitates that models be retrained; got fitModels=False")
                 crossValidationResult = self.performCrossValidation(model, resultWriter=resultWriter if writeIndividualResults else None)
                 evalStatsCollection = crossValidationResult.getEvalStatsCollection()
-                statsDict = evalStatsCollection.aggStats()
+                statsDict = evalStatsCollection.aggMetricsDict()
                 if includeEvalStatsObjects:
                     statsDict["evalStats"] = evalStatsCollection.getGlobalStats()
             else:
                 evalStats: EvalStats = self.performSimpleEvaluation(model, resultWriter=resultWriter if writeIndividualResults else None,
                     fitModel=fitModels).getEvalStats()
-                statsDict = evalStats.getAll()
+                statsDict = evalStats.metricsDict()
                 if includeEvalStatsObjects:
                     statsDict["evalStats"] = evalStats
             statsDict["modelName"] = model.getName()
diff --git a/src/sensai/evaluation/evaluator.py b/src/sensai/evaluation/evaluator.py
index 8ad78414..b7754d04 100644
--- a/src/sensai/evaluation/evaluator.py
+++ b/src/sensai/evaluation/evaluator.py
@@ -96,7 +96,7 @@ def getDataFrame(self):
         statsDicts = []
         varNames = []
         for predictedVarName, evalStats in self.evalStatsByVarName.items():
-            statsDicts.append(evalStats.getAll())
+            statsDicts.append(evalStats.metricsDict())
             varNames.append(predictedVarName)
         df = pd.DataFrame(statsDicts, index=varNames)
         df.index.name = "predictedVar"
@@ -194,8 +194,8 @@ def _computeMetrics(self, model: VectorModel, onTrainingData=False) -> Dict[str,
 
     def _computeMetricsForVarName(self, model, predictedVarName: Optional[str], onTrainingData=False):
         self.fitModel(model)
-        evalData = self.evalModel(model, onTrainingData=onTrainingData)
-        return evalData.getEvalStats(predictedVarName=predictedVarName).getAll()
+        evalData: VectorModelEvaluationData = self.evalModel(model, onTrainingData=onTrainingData)
+        return evalData.getEvalStats(predictedVarName=predictedVarName).metricsDict()
 
     def createMetricsDictProvider(self, predictedVarName: Optional[str]) -> MetricsDictProvider:
         """
diff --git a/src/sensai/evaluation/evaluator_clustering.py b/src/sensai/evaluation/evaluator_clustering.py
index 704ceffe..b3b29525 100644
--- a/src/sensai/evaluation/evaluator_clustering.py
+++ b/src/sensai/evaluation/evaluator_clustering.py
@@ -21,7 +21,7 @@ def _computeMetrics(self, model: EuclideanClusterer, **kwargs) -> Dict[str, floa
         :return:
         """
         evalStats = self.evalModel(model, **kwargs)
-        return evalStats.getAll()
+        return evalStats.metricsDict()
 
     @abstractmethod
     def evalModel(self, model: EuclideanClusterer, **kwargs) -> TClusteringEvalStats:

From 61e9e4f2e9ade09c65b48e83ecdaa53537212bf4 Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Sun, 15 May 2022 17:19:35 +0200
Subject: [PATCH 026/131] EvalStatsPlotCollector: Added getEnabledPlots

---
 src/sensai/evaluation/eval_util.py | 5 ++++-
 1 file changed, 4 insertions(+), 1 deletion(-)

diff --git a/src/sensai/evaluation/eval_util.py b/src/sensai/evaluation/eval_util.py
index cd14f4c5..64c31675 100644
--- a/src/sensai/evaluation/eval_util.py
+++ b/src/sensai/evaluation/eval_util.py
@@ -9,7 +9,7 @@
 import logging
 from abc import ABC, abstractmethod
 from collections import defaultdict
-from typing import Tuple, Dict, Any, Union, Generic, TypeVar, Optional, Sequence, Callable, Set
+from typing import Tuple, Dict, Any, Union, Generic, TypeVar, Optional, Sequence, Callable, Set, List
 
 import matplotlib.figure
 import matplotlib.pyplot as plt
@@ -155,6 +155,9 @@ def __init__(self):
     def addPlot(self, name: str, plot: EvalStatsPlot):
         self.plots[name] = plot
 
+    def getEnabledPlots(self) -> List[str]:
+        return [p for p in self.plots if p not in self.disabledPlots]
+
     def disablePlots(self, *names: str):
         self.disabledPlots.update(names)
 

From 9cf38ace48c19451da5f72bbac9e4e134ed9ce6b Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Sun, 15 May 2022 17:19:56 +0200
Subject: [PATCH 027/131] VectorModel: Added convenience method
 fitInputOutputData

---
 src/sensai/vector_model.py | 3 +++
 1 file changed, 3 insertions(+)

diff --git a/src/sensai/vector_model.py b/src/sensai/vector_model.py
index 8a7995b4..878d1917 100644
--- a/src/sensai/vector_model.py
+++ b/src/sensai/vector_model.py
@@ -290,6 +290,9 @@ def _fitPreprocessors(self, X: pd.DataFrame, Y: pd.DataFrame = None):
                 X = self._featureGenerator.fitGenerate(X, Y, self)
         self._inputTransformerChain.fit(X)
 
+    def fitInputOutputData(self, ioData: InputOutputData, fitPreprocessors=True):
+        self.fit(ioData.inputs, ioData.outputs, fitPreprocessors=fitPreprocessors)
+
     def fit(self, X: pd.DataFrame, Y: Optional[pd.DataFrame], fitPreprocessors=True):
         """
         Fits the model using the given data

From 6ed0b7fb744e69a697387007da3d6c7589ac2c62 Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Sun, 15 May 2022 17:38:40 +0200
Subject: [PATCH 028/131] Do not ignore notebooks in docs

---
 docs/.gitignore | 1 -
 1 file changed, 1 deletion(-)

diff --git a/docs/.gitignore b/docs/.gitignore
index 9bc9e6c3..e69de29b 100644
--- a/docs/.gitignore
+++ b/docs/.gitignore
@@ -1 +0,0 @@
-*.ipynb
\ No newline at end of file

From 28557c36d39cb56dbefd816dacf09149f29f204d Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Sun, 15 May 2022 17:38:58 +0200
Subject: [PATCH 029/131] Ignore *.env

---
 .gitignore | 1 +
 1 file changed, 1 insertion(+)

diff --git a/.gitignore b/.gitignore
index aca3fcd8..d645cc3f 100644
--- a/.gitignore
+++ b/.gitignore
@@ -18,3 +18,4 @@ dist
 /.pytest_cache
 data
 .coverage
+/*.env
\ No newline at end of file

From 5f93a5509f2b073423bda17e3d562dcdd57fbea9 Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Sun, 15 May 2022 18:09:23 +0200
Subject: [PATCH 030/131] Ignore docs-build

---
 .gitignore | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/.gitignore b/.gitignore
index d645cc3f..901772ba 100644
--- a/.gitignore
+++ b/.gitignore
@@ -18,4 +18,5 @@ dist
 /.pytest_cache
 data
 .coverage
-/*.env
\ No newline at end of file
+/*.env
+/docs-build
\ No newline at end of file

From 93bc18a0e9a24dfe07365de7b4810373fda76c84 Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Sun, 15 May 2022 18:14:38 +0200
Subject: [PATCH 031/131] Added notebook 'Introduction to sensAI' for docs

---
 docs/intro.ipynb | 501 +++++++++++++++++++++++++++++++++++++++++++++++
 1 file changed, 501 insertions(+)
 create mode 100644 docs/intro.ipynb

diff --git a/docs/intro.ipynb b/docs/intro.ipynb
new file mode 100644
index 00000000..fa43e219
--- /dev/null
+++ b/docs/intro.ipynb
@@ -0,0 +1,501 @@
+{
+ "cells": [
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "import sys\n",
+    "sys.path.append(\"../src\")"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "# Introduction to sensAI"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "import sensai"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "## Logging\n",
+    "\n",
+    "sensAI will log relevant activities and inform you about ongoing processes as well as results via the log. It is therefore highly recommended that you enable logging when using sensAI.\n",
+    "\n",
+    "sensAI provides a `logging` module which includes Python's standard logging module and adds some additional functionality. To enable logging, simply use the `configureLogging` function.\n"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "from sensai.util import logging\n",
+    "\n",
+    "logging.configureLogging(level=logging.INFO)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "To additionally write log output to a file, use the function `logging.addFileLogger`."
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "## Training and Evaluating Models\n",
+    "\n",
+    "First, let us load a dataset with which we can experiment. sklearn provides, for example, the Iris classification dataset, where the task is to differentiate three different types of flowers based on measurements of their petals and sepals."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "import sklearn.datasets\n",
+    "import pandas as pd\n",
+    "\n",
+    "irisData = sklearn.datasets.load_iris()\n",
+    "irisInputDF = pd.DataFrame(irisData[\"data\"], columns=irisData[\"feature_names\"]).reset_index(drop=True)\n",
+    "irisOutputDF = pd.DataFrame({\"class\": [irisData[\"target_names\"][idx] for idx in irisData[\"target\"]]}).reset_index(drop=True)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "Here's a sample of the data, combining both the inputs and outputs:"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "irisCombinedDF = pd.concat((irisInputDF, irisOutputDF), axis=1)\n",
+    "irisCombinedDF.sample(10)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "When working with sensAI, we typically use a DataFrame such as this as the starting point. DataFrames are a good basis, because they provide much-needed meta-data in the form of column names and as such provide a more well-defined interface for learning and inference than raw numpy arrays.\n",
+    "\n",
+    "We create an instance of **InputOutputData** from the two data frames."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "irisInputOutputData = sensai.InputOutputData(irisInputDF, irisOutputDF)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "### Low-Level Training and Inference "
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "We use a **DataSplitter** (see subclasses) to split the data into a training and test set, specifically a **DataSplitterFractional**."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "dataSplitter = sensai.data.DataSplitterFractional(0.8, shuffle=True)\n",
+    "trainingIoData, testIoData = dataSplitter.split(irisInputOutputData)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "Now we are ready to train a model. Let us train a random forest classifier, which should work well for this sort of problem. sensAI provides models from various libraries, including scikit-learn, PyTorch, lightgbm, xgboost, catboost, and TensorFlow.\n",
+    "\n",
+    "In this case, let us use the random forest implementation from sklearn, which is provided via the wrapper class SkLearnRandomForestVectorClassificationModel.\n",
+    "\n",
+    "sensAI's **VectorModel** classes (specialised for classification and regression) provide a common interface with a lot of useful functionality, which we will see later."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "randomForestModel = sensai.sklearn.classification.SkLearnRandomForestVectorClassificationModel(min_samples_leaf=2)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "The class supports all the parameters supported by the original sklearn model. In this case, we only set the minimum number of samples that must end up in each leaf.\n",
+    "\n",
+    "We train the model using the `fitInputOutputData` method; we could also use the `fit` method, which is analogous to the sklearn interface and takes two arguments (input, output)."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "randomForestModel.fitInputOutputData(trainingIoData)\n",
+    "randomForestModel"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "We can now apply the trained model and predict the outputs for the test set we reserved."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "predictedOutputsDF = randomForestModel.predict(testIoData.inputs)\n",
+    "predictedOutputsDF.head(5)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "Let's compare some of the predictions to the ground truth."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "pd.concat((predictedOutputsDF.rename(columns={\"class\": \"predictedClass\"}), testIoData.outputs), axis=1).sample(10)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "Using the ground truth and predicted values, we could now compute the metrics we're interested in. We could, for example, use the metrics implemented in sklearn to analyse the result. Yet sensAI already provides abstractions that facilitate the generation of metrics and the collection of results. Read on!"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "### Using Evaluators\n",
+    "\n",
+    "sensAI provides evaluator abstractions which facilitate the training and evaluation of models.\n",
+    "\n",
+    "For a classification problem, we instantiate a VectorClassificationModelEvaluator. An evaluator serves to evaluate one or more models based on the same data, so we construct it with the data and instructions on how to handle/split the data for evaluation."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "evaluatorParams = sensai.evaluation.VectorClassificationModelEvaluatorParams(dataSplitter=dataSplitter, computeProbabilities=True)\n",
+    "evaluator = sensai.evaluation.VectorClassificationModelEvaluator(irisInputOutputData, params=evaluatorParams)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "We can use this evaluator to evaluate one or more models. Let us evaluate the random forest model from above."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "evaluator.fitModel(randomForestModel)\n",
+    "evalData = evaluator.evalModel(randomForestModel)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "The evaluation data holds, in particular, an **EvalStats** object, which can provide data on the quality of the results.\n",
+    "Depending on the type of problem, many metrics will already be computed by default."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "evalStats = evalData.getEvalStats()\n",
+    "evalStats"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "We can get the metrics in a dictionary as follows:"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "evalStats.metricsDict()"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "We can compute additional metrics by passing a metric to the `computeMetricValue` method, but we could also have added additional metrics to the `evaluatorParams` above and have the metric included in all results.\n",
+    "\n",
+    "Let's see how frequently the true class is among the top two most probable classes."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "evalStats.computeMetricValue(sensai.eval_stats_classification.ClassificationMetricTopNAccuracy(2))"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "The EvalStats object can also be used to generate plots, such as a confusion matrix or a precision-recall plot for binary classification."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "evalStats.plotConfusionMatrix(normalize=True);"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "### Using the Fully-Integrated Evaluation Utilities\n",
+    "\n",
+    "sensAI's evaluation utilities take things one step further and assist you in carrying out all the evaluation steps and results computations in a single call.\n",
+    "\n",
+    "You can perform evaluations based on a single split or cross-validation. We simply declare the necessary parameters for both types of computations (or the one type we seek to carry out)."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "evaluatorParams = sensai.evaluation.VectorClassificationModelEvaluatorParams(\n",
+    "    dataSplitter=dataSplitter, computeProbabilities=True, \n",
+    "    additionalMetrics=[sensai.eval_stats_classification.ClassificationMetricTopNAccuracy(2)])\n",
+    "crossValidatorParams = sensai.evaluation.crossval.VectorModelCrossValidatorParams(folds=10, \n",
+    "    evaluatorParams=evaluatorParams)\n",
+    "evalUtil = sensai.evaluation.ClassificationEvaluationUtil(irisInputOutputData, \n",
+    "    evaluatorParams=evaluatorParams, crossValidatorParams=crossValidatorParams)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "In practice, we will usually want to save evaluation results. The evaluation methods of `evalUtil` take a parameter `resultWriter` which allows us to define where results shall be written. Within this notebook, we shall simply inspect the resulting metrics in the log that is printed, and we shall configure plots to be shown directly.\n",
+    "\n",
+    "#### Simple Evaluation"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "We can perform the same evaluation as above (which uses a single split) like so:"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "evalUtil.performSimpleEvaluation(randomForestModel, showPlots=True)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "#### Customising the Set of Plots"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "If we decide that we don't really want to have the normalised confusion matrix, we can disable it for any further experiments."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "evalUtil.evalStatsPlotCollector.getEnabledPlots()"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "Some of these are only active for binary classification. The one we don't want is \"confusion-matrix-rel\"."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "evalUtil.evalStatsPlotCollector.disablePlots(\"confusion-matrix-rel\")"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "We could also define our own plot class (by creating a new subclass of `ClassificationEvalStatsPlot`) and add it to the `evalStatsPlotCollector` in order to have the plot auto-generated whenever we apply one of `evalUtil`'s methods."
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "#### Cross-Validation"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "We can similarly run cross-validation and produce the respective evaluation metrics with a single call."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "evalUtil.performCrossValidation(randomForestModel, showPlots=True)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "As you can see, the plot we disabled earlier is no longer being generated."
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "#### Comparing Models\n",
+    "\n",
+    "A most common use case is to compare the performance of several models. The evaluation utility makes it very simple to compare any number of models.\n",
+    "\n",
+    "Let's say we want to compare the random forest we have been using thus far to a simple decision tree."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "evalUtil.compareModels([\n",
+    "        randomForestModel.withName(\"RandomForest\"), \n",
+    "        sensai.sklearn.classification.SkLearnDecisionTreeVectorClassificationModel(min_samples_leaf=2).withName(\"DecisionTree\")], \n",
+    "    useCrossValidation=False);"
+   ]
+  }
+ ],
+ "metadata": {
+  "interpreter": {
+   "hash": "9b3442ae4bdb9561e722e28424c33a03c16d40b3aa50369b79d367cad7b1adea"
+  },
+  "kernelspec": {
+   "display_name": "Python 3.7.9 ('sensai')",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.7.9"
+  },
+  "orig_nbformat": 4
+ },
+ "nbformat": 4,
+ "nbformat_minor": 2
+}

From 58f58a1dc2d24f3ea058cc00ee6ab421b07e4d37 Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Sun, 15 May 2022 18:15:09 +0200
Subject: [PATCH 032/131] Added notebook to docs index, removing obsolete
 getting-started.rst

---
 docs/getting-started.rst | 9 ---------
 docs/index.rst           | 2 +-
 2 files changed, 1 insertion(+), 10 deletions(-)
 delete mode 100644 docs/getting-started.rst

diff --git a/docs/getting-started.rst b/docs/getting-started.rst
deleted file mode 100644
index 061f6114..00000000
--- a/docs/getting-started.rst
+++ /dev/null
@@ -1,9 +0,0 @@
-Getting started
-===============
-
-This library works with python>=3.7. Install it by executing \n
-``python setup.py install`` \n
-from the root directory.
-
-For developing the usage of tox is encouraged. Run ``tox`` from the root directory in order to build the package,
-these docs and perform several tests. You should not merge to master without tox having executed successfully!
diff --git a/docs/index.rst b/docs/index.rst
index 9ed3f2a6..78f90a25 100644
--- a/docs/index.rst
+++ b/docs/index.rst
@@ -5,7 +5,7 @@ sensAI - the Python library for sensible AI
    :caption: Guides and Tutorials
    :glob:
 
-   *
+   intro.ipynb
 
 
 .. toctree::

From ac0cef1f031cb2c6b155031c8f560060b74bf3b6 Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Sun, 15 May 2022 21:07:49 +0200
Subject: [PATCH 033/131] Moved intro notebook to notebooks folder

---
 {docs => notebooks}/intro.ipynb | 0
 1 file changed, 0 insertions(+), 0 deletions(-)
 rename {docs => notebooks}/intro.ipynb (100%)

diff --git a/docs/intro.ipynb b/notebooks/intro.ipynb
similarity index 100%
rename from docs/intro.ipynb
rename to notebooks/intro.ipynb

From d4ef28c8825e485946124a43c30e1aacf1555fa6 Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Sun, 15 May 2022 21:07:58 +0200
Subject: [PATCH 034/131] Revert "Do not ignore notebooks in docs"

This reverts commit 6ed0b7fb744e69a697387007da3d6c7589ac2c62.

Notebooks need to be ignored because the notebooks stored in the
notebooks/ folder are copied to the docs/ folder during test_notebooks
---
 docs/.gitignore | 1 +
 1 file changed, 1 insertion(+)

diff --git a/docs/.gitignore b/docs/.gitignore
index e69de29b..9bc9e6c3 100644
--- a/docs/.gitignore
+++ b/docs/.gitignore
@@ -0,0 +1 @@
+*.ipynb
\ No newline at end of file

From 32d3e22bb87756fdc2d93ed6bd07121ca7003325 Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Sun, 15 May 2022 21:11:31 +0200
Subject: [PATCH 035/131] Include all notebooks in index.rst

---
 docs/index.rst | 5 ++++-
 1 file changed, 4 insertions(+), 1 deletion(-)

diff --git a/docs/index.rst b/docs/index.rst
index 78f90a25..58e1ffec 100644
--- a/docs/index.rst
+++ b/docs/index.rst
@@ -5,7 +5,10 @@ sensAI - the Python library for sensible AI
    :caption: Guides and Tutorials
    :glob:
 
-   intro.ipynb
+..
+  Comment: include all notebooks (copied to docs/ by test_notebooks)
+  
+   *
 
 
 .. toctree::

From c52f251152cd25d61ca5087cbc3ff173be61456d Mon Sep 17 00:00:00 2001
From: Dominik Jain <dominik.jain@jambit.com>
Date: Sun, 15 May 2022 21:41:54 +0200
Subject: [PATCH 036/131] Fixed comment

---
 docs/index.rst | 5 ++---
 1 file changed, 2 insertions(+), 3 deletions(-)

diff --git a/docs/index.rst b/docs/index.rst
index 58e1ffec..fc5272ea 100644
--- a/docs/index.rst
+++ b/docs/index.rst
@@ -5,11 +5,10 @@ sensAI - the Python library for sensible AI
    :caption: Guides and Tutorials
    :glob:
 
-..
-  Comment: include all notebooks (copied to docs/ by test_notebooks)
-  
    *
 
+..
+  Above, we include notebooks, copied here by test_notebooks
 
 .. toctree::
    :caption: Modules

From 596ae0ca1826244c63f53acd6b31e466ccdf7a0c Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Sun, 15 May 2022 21:34:01 +0200
Subject: [PATCH 037/131] README:   * Moved details source-level inclusion of
 sensAI to README-dev.   * More details on handling of notebooks in docs
 build.   * Changed docs URL to github.io (readthedocs now deleted)   *
 Mention appliedAI

---
 README-dev.md | 69 +++++++++++++++++++++++++++++++++++++++++++++------
 README.md     | 54 +++-------------------------------------
 2 files changed, 65 insertions(+), 58 deletions(-)

diff --git a/README-dev.md b/README-dev.md
index 599edc06..601f50ae 100644
--- a/README-dev.md
+++ b/README-dev.md
@@ -15,24 +15,29 @@ All .rst files are auto-generated, with the exception of the root index file  `i
 
 **Attention**: Make sure that any optional sensAI dependencies (which are not included in the `docs` tox environment) are added to `docs/conf.py` under `autodoc_mock_imports`.
 
+### Notebooks
+
+Notebooks in the `notebooks/` folder are executed and saved with outputs to the `docs/` folder by a test in `notebooks/test_notebooks.py`.
+
+Notebooks are included in the documentation in `docs/index.rst`.
+
 ### Manually Running the Docs Build
 
-The docs build is designed to be run by tox. As soon as a single iPython notebook is included, `sensai` must be available as an installed dependency in the environment in which the docs build is run, as the notebook executions takes place in a Jupyter environment. 
+The docs build is designed to be run by tox. As soon as a single iPython notebook is included in index.rst, `sensai` must be available as an installed dependency in the environment in which the docs build is run, as the notebook executions take place in a Jupyter environment where we can't simply extend sys.path. 
 
 Under Linux, running tox should work fine. Under Windows, we are yet to succeed.
 
-To run the docs build without tox, first create an environment that has the additional requirements installed and, most importantly, sensai installed.
+To run the docs build without tox (under Windows), first create an environment that has the additional requirements installed.
 
     conda env create -n sensai-docs -f environment.yml
     conda activate sensai-docs
     pip install sphinx sphinx_rtd_theme nbsphinx
-    pip install .
-    
-The last command obviously needs to be repeated every time the library changes.
-In the new environment `sensai-docs`, we can then run the sphinx build
 
+Then, to build the docs, we need to perform the following steps with the new environment `sensai-docs` activated. The first command installs the current source version of  `sensai` itself.
+
+    pip install .
     rm -rf docs-build; mkdir docs-build
-    sphinx -b html docs docs-build
+    sphinx-build -b html docs docs-build
 
 # Creating a New Release
 
@@ -65,3 +70,53 @@ In the new environment `sensai-docs`, we can then run the sphinx build
      `bumpversion build --commit`
    * Continue with step 3.
 
+# Source-Level Directory Sync
+
+#### Details on the Synchronisation of a Source Directory within Your Project with the sensAI Repository
+
+We support the synchronisation of a branch in the sensAI repository with a directory within the git repository of your project which is to contain the sensAI source code (i.e. alternative #2 under "Integrating sensAI into a Project" in README.md) via a convenient scripting solution.
+
+We consider two local repositories: the sensAI repository in directory `sensAI/` and your project in, for instance, directory `sensAI/../myprj/`. Let us assume that we want to synchronise branch `myprj-branch` in the sensAI repository with directory `myprj/src/sensai`.
+
+##### Synchronisation Script
+
+To perform the synchronisation, please create a script as follows, which you should save to `sensAI/sync.py`:
+
+```python
+import os
+from repo_dir_sync import LibRepo, OtherRepo
+
+r = LibRepo()
+r.add(OtherRepo("myprj", "myprj-branch", os.path.join("..", "myprj", "src", "sensai")))
+r.runMain()
+```
+
+You can add multiple other repositories if you so desire in the future.
+
+From directory `sensAI/` you can use the script in order to 
+
+* ***Push***: Update your project (i.e. `myprj/src/sensai`) with changes that were made in other projects by running `python sync.py myprj push`
+* ***Pull***: Update `myprj-branch` in the sensAI repository with changes made in your project by running `python sync.py myprj pull`
+
+##### Initialisation
+
+To initialise the synchronisation, proceed as follows:
+
+1. Create the branch `myprj-branch` in the sensAI repository, i.e. in `sensAI/` run this command:
+   `git branch myprj-branch master`
+2. Create the directory `myprj/src/sensai`.
+3. Make sure you have a `.gitignore` file in `myprj/` with at least the following entries:
+
+       *.pyc
+       __pycache__
+       *.bak
+       *.orig
+
+   Otherwise you may end up with unwanted tracked files after a synchronisation.
+4. Perform the initial *push*, i.e. in `sensAI/` run this command:
+   `python sync.py myprj push`
+
+##### Things to Keep in Mind
+
+* Both *push* and *pull* operations are always performed based on the branch that is currently checked out in `myprj/`. The best practice is to only use one branch for synchronisation, e.g. master.
+* *Push* and *pull* operations will make git commits in both repositories. Should an operation ever go wrong/not do what you intended, use `git reset --hard` to go back to the commits before the operation in both repositories.
\ No newline at end of file
diff --git a/README.md b/README.md
index f2e4ad3c..c517b870 100644
--- a/README.md
+++ b/README.md
@@ -24,7 +24,7 @@ In particular, sensAI provides ...
 
 ## Documentation
 
-Source code documentation and tutorials can be found [here](https://sensai.readthedocs.io/)
+Reference documentation and tutorials can be found [here](https://jambit.github.io/sensAI/docs/).
 
 ### Integrating sensAI into a Project
 
@@ -34,62 +34,14 @@ sensAI may be integrated into your project in several ways:
    Choose this option if you do not intend to make changes to sensAI in the context of your project.
 2. **Include sensAI's source code as a package within your project** (e.g. in `src/sensai`), which you synchronise with a sensAI branch.
    Choose this option if you intend to make changes to sensAI as you develop your project. When using this option, you (and others) may even make changes to sensAI in several branches of your project and even several projects using the same inclusion mechanism at the same time.
-   See below for details on how synchronisation works.
+   See developer documentation in README-dev.md for details on how synchronisation works.
 3. **Clone sensAI and add its source directory to your `PYTHONPATH`**.
    Choose this option if you potentially intend to make changes to sensAI but no one else working on your project will do the same and you will be modifying sensAI's source in no more than one branch at a time.
 
-#### Details on the Synchonisation of a Source Directory within Your Project with the sensAI Repository
-
-We support the synchronisation of a branch in the sensAI repository with a directory within the git repository of your project which is to contain the sensAI source code (i.e. alternative #2 from above) via a convenient scripting solution.
-
-We consider two local repositories: the sensAI repository in directory `sensAI/` and your project in, for instance, directory `sensAI/../myprj/`. Let us assume that we want to synchronise branch `myprj-branch` in the sensAI repository with directory `myprj/src/sensai`.
-
-##### Synchronisation Script
-
-To perform the synchronisation, please create a script as follows, which you should save to `sensAI/sync.py`:
-
-```python
-import os
-from repo_dir_sync import LibRepo, OtherRepo
-
-r = LibRepo()
-r.add(OtherRepo("myprj", "myprj-branch", os.path.join("..", "myprj", "src", "sensai")))
-r.runMain()
-```
-
-You can add multiple other repositories if you so desire in the future.
-
-From directory `sensAI/` you can use the script in order to 
-
-* ***Push***: Update your project (i.e. `myprj/src/sensai`) with changes that were made in other projects by running `python sync.py myprj push`
-* ***Pull***: Update `myprj-branch` in the sensAI repository with changes made in your project by running `python sync.py myprj pull`
-
-##### Initialisation
-
-To initialise the synchronisation, proceed as follows:
-
-1. Create the branch `myprj-branch` in the sensAI repository, i.e. in `sensAI/` run this command:
-   `git branch myprj-branch master`
-2. Create the directory `myprj/src/sensai`.
-3. Make sure you have a `.gitignore` file in `myprj/` with at least the following entries:
-
-       *.pyc
-       __pycache__
-       *.bak
-       *.orig
-  
-   Otherwise you may end up with unwanted tracked files after a synchronisation.
-4. Perform the initial *push*, i.e. in `sensAI/` run this command:
-   `python sync.py myprj push`
-
-##### Things to Keep in Mind
-
-* Both *push* and *pull* operations are always performed based on the branch that is currently checked out in `myprj/`. The best practice is to only use one branch for synchronisation, e.g. master.
-* *Push* and *pull* operations will make git commits in both repositories. Should an operation ever go wrong/not do what you intended, use `git reset --hard` to go back to the commits before the operation in both repositories.
 
 ## Contributors
 
-sensAI is being developed by the artificial intelligence group at jambit GmbH.
+sensAI is being developed by the artificial intelligence group at [jambit GmbH](http://www.jambit.com) and by members of [appliedAI](https://www.appliedai.de).
 
 The main contributors are Dominik Jain, Michael Panchenko, Kristof Schröder and Magnus Winter.
 

From ca4d099dfd4e89a701f35eafbfedce383b022314 Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Mon, 16 May 2022 02:30:51 +0200
Subject: [PATCH 038/131] Updated development environment specification
 (solvable!), now including all dependencies (except catboost) of the actual
 library as well as packages required for testing/the build pipeline

---
 environment.yml          | 42 ++++++++++++++++++++++++++--------------
 requirements-relaxed.txt |  7 +++++++
 2 files changed, 35 insertions(+), 14 deletions(-)
 create mode 100644 requirements-relaxed.txt

diff --git a/environment.yml b/environment.yml
index 4ce2bfb4..ebb44c8d 100644
--- a/environment.yml
+++ b/environment.yml
@@ -1,32 +1,46 @@
+# environment definition for development
+# NOTE: versions are mostly unpinned, because this facilitates conda dependency resolution. Also,
+# sensAI should be compatible to all (newer) versions of the dependencies. If it isn't, we need to specify 
+# an upper version bound in setup.py (where it matters the most) as well as here.
+# Compatibility with old (pinned) versions and the latest versions is tested in the tox build.
 name: sensai
 channels:
   - pytorch
-  - conda-forge
-  - anaconda
   - defaults
+  - conda-forge
 dependencies:
   # basics
-  - python=3.7
+  # we use Python 3.8 because it has better conda dependency support; the code must still be compatible to 3.7 (which is tested by the github build)
+  - python=3.8
   - pip
   # optional sensai dependencies for development
-  - pytorch=1.4.0
-  - tensorflow=1.14.0
-  - pyqt=5.12
-  - psutil=5.6.7
-  - pytorch=1.4.0
-  - catboost=0.23
-  - xgboost=1.4.0
-  - lightgbm=3.1.1
+  # NOTE: catboost is disabled, because it causes conflicts
+  #- catboost
+  - pytorch
+  - pyqt
+  - psutil
+  - xgboost
+  - lightgbm
   - utm=0.7.0
+  - geopandas
   # for notebook support
   - jupyter
   # for tests
-  - pytest=5.4.1
+  - pytest
+  # for docs build
+  - sphinx 
+  - sphinx_rtd_theme 
+  - nbsphinx
   # for release process
   - bump2version
   - pip:
       # non-optional sensai dependencies
-      - -r requirements.txt
-      # required for locally running the tox build
+      - -r requirements-relaxed.txt
+      # optional sensai pip dependencies
+      # clearml is only available through pip, and pulling tensorflow from conda causes dependency issues
+      - clearml
+      - tensorflow-cpu
+      - pytorch-lightning
+      # required for locally running the tox build (which will work on Linux only at this time)
       - tox
       - virtualenv
\ No newline at end of file
diff --git a/requirements-relaxed.txt b/requirements-relaxed.txt
new file mode 100644
index 00000000..1f97947c
--- /dev/null
+++ b/requirements-relaxed.txt
@@ -0,0 +1,7 @@
+# this is a relaxed version of requirements.txt where newer versions are allowed
+pandas>=1.0.0
+scipy>=1.4
+numpy>=1.18.0
+scikit-learn>=0.22.0
+seaborn>=0.10.0
+typing-extensions>=3.7

From a7d14879f27e7e77f2d03267c0bb5f6d2ffd47da Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Mon, 16 May 2022 02:35:13 +0200
Subject: [PATCH 039/131] Added notes on development environment setup

---
 README-dev.md | 26 ++++++++++++++++++++++++--
 1 file changed, 24 insertions(+), 2 deletions(-)

diff --git a/README-dev.md b/README-dev.md
index 601f50ae..25ceb3bd 100644
--- a/README-dev.md
+++ b/README-dev.md
@@ -1,15 +1,37 @@
+# Development Environment
+
+This section explains the steps required to set up an environment in order to develop sensAI further.
+
+## Clone Large Files
+
+Clone the full repo, including large files using [git large file storage](https://git-lfs.github.com):
+
+    git lfs pull
+
+This adds, in particular, data that is used in notebooks.
+
+## Create the Python Virtual Environment
+
+Use conda to set up the Python environment:
+
+    conda env create -f environment.yml
+
+Solving the environment may take several minutes (but should ultimately work).
+
+NOTE: versions are mostly unpinned in the environment specification, because this facilitates conda dependency resolution. Also, sensAI is intended to be compatible with all (newer) versions of the dependencies. If it isn't, we need to specify an upper version bound in `setup.py` (where it matters the most) as well as in `environment.yml`. Compatibility with old (pinned) versions and the latest versions is tested in the tox build (see below).
+
 # Build and Test Pipeline
 
 The tests and docs build are executed via **tox** in several environments:
 * `py`: the "regular" test environment, where we test against the pinned dependencies which we also use for development (by explicitly including `requirements.txt` with the pinned versions; this is also the environment in which we test the execution of notebooks
 * `py_latest_dependencies`: the environment where we use the latest versions of all dependencies (except where we have identified an incompatibility; see `setup.py` definitions `DEPS_VERSION_LOWER_BOUND` and `DEPS_VERSION_UPPER_BOUND_EXCLUSIVE`); by not including `requirements.txt`, we depend on the latest admissible versions according to `setup.py`
-* `docs`: the environment in which docs are built via sphinx (by executing `build_scripts/update_docs.py`)
+* `docs`: the environment in which docs are built via sphinx 
 
 ## Docs Build
 
 Docs are automatically created during the GitHub build via tox.
 
-All .rst files are auto-generated, with the exception of the root index file  `index.rst`.
+All .rst files are auto-generated (by `build_scripts/update_docs.py`), with the exception of the root index file  `index.rst`.
 
 ### Dependency Handling
 

From ac49c64aae5425666e615c700c1ed23782d39a0c Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Mon, 16 May 2022 02:50:39 +0200
Subject: [PATCH 040/131] Mark import used

---
 tests/frameworks/tensorflow/test_tf.py | 4 ++++
 1 file changed, 4 insertions(+)

diff --git a/tests/frameworks/tensorflow/test_tf.py b/tests/frameworks/tensorflow/test_tf.py
index 59304cad..2f520b83 100644
--- a/tests/frameworks/tensorflow/test_tf.py
+++ b/tests/frameworks/tensorflow/test_tf.py
@@ -1,3 +1,7 @@
+from sensai.util import markUsed
+
+
 def test_tf():
     import sensai.tensorflow
+    markUsed(sensai.tensorflow)
     assert True

From 70c8e50cb1f64a527927e321bae3f8a06d6593f2 Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Mon, 16 May 2022 03:17:28 +0200
Subject: [PATCH 041/131] Added run scripts for pytest

---
 run_pytest_notebooks.sh | 6 ++++++
 run_pytest_tests.sh     | 2 ++
 2 files changed, 8 insertions(+)
 create mode 100644 run_pytest_notebooks.sh
 create mode 100644 run_pytest_tests.sh

diff --git a/run_pytest_notebooks.sh b/run_pytest_notebooks.sh
new file mode 100644
index 00000000..f1895b65
--- /dev/null
+++ b/run_pytest_notebooks.sh
@@ -0,0 +1,6 @@
+if ! git lfs pull; then
+  printf "\n\nERROR: git lfs pull failed\n\n"
+  exit
+fi
+export PYTHONPATH="`realpath src`"
+pytest notebooks
\ No newline at end of file
diff --git a/run_pytest_tests.sh b/run_pytest_tests.sh
new file mode 100644
index 00000000..ed02adaa
--- /dev/null
+++ b/run_pytest_tests.sh
@@ -0,0 +1,2 @@
+export PYTHONPATH=src
+pytest tests
\ No newline at end of file

From 1f1252554cc1ef087e4271cb13e7a1d0bc3a322d Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Mon, 16 May 2022 03:17:58 +0200
Subject: [PATCH 042/131] Allow the docs build to run without sensai being
 installed

---
 docs/conf.py | 12 ++++++++----
 1 file changed, 8 insertions(+), 4 deletions(-)

diff --git a/docs/conf.py b/docs/conf.py
index ae65ad76..fff3c2e4 100644
--- a/docs/conf.py
+++ b/docs/conf.py
@@ -156,10 +156,14 @@ def findLineFromObjectName(sourceFile, objectName):
 # built documents.
 #
 # The full version, including alpha/beta/rc tags.
-release = pkg_resources.get_distribution(project).version
-# The short X.Y version.
-major_v, minor_v = release.split(".")[:2]
-version = f"{major_v}.{minor_v}"
+try:
+    version = pkg_resources.get_distribution(project).version
+    # The short X.Y version.
+    #major_v, minor_v = release.split(".")[:2]
+    #version = f"{major_v}.{minor_v}"
+except:
+    version = "dev"
+    log.warning(f"The {project} distribution was not found; using dummy version string '{version}'")
 
 # The language for content autogenerated by Sphinx. Refer to documentation
 # for a list of supported languages.

From 3fe7f1bf67b76b5beccc2b63cac63c13b5519a55 Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Mon, 16 May 2022 22:57:16 +0200
Subject: [PATCH 043/131] extractArray: Fixed pandas apply causing dtypes to be
 changed (int64 -> int32),   added option to specify target dtype

---
 src/sensai/util/pandas.py | 19 +++++++++++++++++--
 1 file changed, 17 insertions(+), 2 deletions(-)

diff --git a/src/sensai/util/pandas.py b/src/sensai/util/pandas.py
index 0892812b..d05a7dae 100644
--- a/src/sensai/util/pandas.py
+++ b/src/sensai/util/pandas.py
@@ -63,7 +63,7 @@ def assertChangeWasTracked(self):
                             f"Did you forget to call trackChange on the resulting data frame?")
 
 
-def extractArray(df: pd.DataFrame):
+def extractArray(df: pd.DataFrame, dtype=None):
     """
     Extracts array from data frame. It is expected that each row corresponds to a data point and
     each column corresponds to a "channel". Moreover, all entries are expected to be arrays of the same shape
@@ -101,11 +101,26 @@ def extractArray(df: pd.DataFrame):
     In both cases the returned array will have shape `(N_images, 3, width, height)`
 
     :param df: data frame where each entry is an array of shape tensorShape
+    :param dtype: if not None, convert the array's data type to this type (string or numpy dtype)
     :return: array of shape `(N_rows, N_columns, *tensorShape)` with stripped empty dimensions
     """
     log.debug(f"Stacking tensors of shape {np.array(df.iloc[0, 0]).shape}")
     try:
-        return np.stack(df.apply(np.stack, axis=1)).squeeze()
+        # This compact way of extracting the array causes dtypes to be modified,
+        #    arr = np.stack(df.apply(np.stack, axis=1)).squeeze()
+        # so we use this numpy-only alternative:
+        arr = df.values
+        if arr.shape[1] > 1:
+            arr = np.stack([np.stack(arr[i]) for i in range(arr.shape[0])])
+        else:
+            arr = np.stack(arr[:, 0])
+        # For the case where there is only one row, the old implementation above removed the first dimension,
+        # so we do the same, even though it seems odd to do so (potential problem for batch size 1)
+        if arr.shape[0] == 1:
+            arr = arr[0]
     except ValueError:
         raise ValueError(f"No array can be extracted from frame of length {len(df)} with columns {list(df.columns)}. "
                          f"Make sure that all entries have the same shape")
+    if dtype is not None:
+        arr = arr.astype(dtype, copy=False)
+    return arr

From f8d831952d77e6759c61d936f1321b3a87c3300d Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Mon, 16 May 2022 22:58:09 +0200
Subject: [PATCH 044/131] Fixed incompatibility with new torch versions where
 class indices must be longs (int64)

Added workaround to make the notebook runnable without sensai being installed
---
 .../Tensor Models with Torchlightning.ipynb   | 247 ++++++++++--------
 1 file changed, 133 insertions(+), 114 deletions(-)

diff --git a/notebooks/Tensor Models with Torchlightning.ipynb b/notebooks/Tensor Models with Torchlightning.ipynb
index 1dd3071f..daf1260b 100644
--- a/notebooks/Tensor Models with Torchlightning.ipynb	
+++ b/notebooks/Tensor Models with Torchlightning.ipynb	
@@ -2,21 +2,24 @@
  "cells": [
   {
    "cell_type": "markdown",
-   "source": [
-    "# Tensor Models with PyTorch-Lightning\n",
-    "\n",
-    "In this notebook we show how sensAI's TensorModel wrappers can be used together with pytorch-lightning models\n",
-    "and trainers for even faster development and experimentation."
-   ],
    "metadata": {
     "collapsed": false,
     "pycharm": {
      "name": "#%% md\n"
     }
-   }
+   },
+   "source": [
+    "# Tensor Models with PyTorch-Lightning\n",
+    "\n",
+    "In this notebook we show how sensAI's TensorModel wrappers can be used together with pytorch-lightning models\n",
+    "and trainers for even faster development and experimentation."
+   ]
   },
   {
    "cell_type": "markdown",
+   "metadata": {
+    "collapsed": false
+   },
    "source": [
     "### Before running the notebook\n",
     "\n",
@@ -26,10 +29,7 @@
     "```\n",
     "from the root directory. You can also execute this command directly in the notebook but will need to reload the\n",
     "kernel afterwards\n"
-   ],
-   "metadata": {
-    "collapsed": false
-   }
+   ]
   },
   {
    "cell_type": "code",
@@ -46,7 +46,12 @@
     "\n",
     "# in order to get the top level modules; they are not part of the package\n",
     "os.chdir(\"..\")\n",
-    "sys.path.append(os.path.abspath(\".\"))"
+    "sys.path.append(os.path.abspath(\".\"))\n",
+    "try:\n",
+    "    import sensai\n",
+    "except:\n",
+    "    sys.path.append(os.path.abspath(\"src\"))\n",
+    "    import sensai"
    ]
   },
   {
@@ -60,6 +65,7 @@
     "from torch.nn import functional as F\n",
     "import pytorch_lightning as pl\n",
     "import matplotlib.pyplot as plt\n",
+    "import numpy as np\n",
     "import pandas as pd\n",
     "from sensai.data import InputOutputArrays, DataSplitterFractional\n",
     "\n",
@@ -76,18 +82,18 @@
   },
   {
    "cell_type": "markdown",
-   "source": [
-    "## Loading the Data\n",
-    "\n",
-    "Unlike in the mnist-based torch-lightning tutorial, here we will load the data in a more \"realistic\" way,\n",
-    "namely with pandas from disc."
-   ],
    "metadata": {
     "collapsed": false,
     "pycharm": {
      "name": "#%% md\n"
     }
-   }
+   },
+   "source": [
+    "## Loading the Data\n",
+    "\n",
+    "Unlike in the mnist-based torch-lightning tutorial, here we will load the data in a more \"realistic\" way,\n",
+    "namely with pandas from disc."
+   ]
   },
   {
    "cell_type": "code",
@@ -100,7 +106,7 @@
    "outputs": [],
    "source": [
     "X = pd.read_csv(c.datafile_path(\"mnist_train.csv.zip\"))\n",
-    "labels = pd.DataFrame(X.pop(\"label\"))\n",
+    "labels = pd.DataFrame(X.pop(\"label\")).astype(np.int64)\n",
     "X = X.values.reshape(len(X), 28, 28) / 2 ** 8\n",
     "X = pd.DataFrame({\"mnist_image\": list(X)}, index=labels.index)\n",
     "\n",
@@ -115,6 +121,12 @@
   },
   {
    "cell_type": "markdown",
+   "metadata": {
+    "collapsed": false,
+    "pycharm": {
+     "name": "#%% md\n"
+    }
+   },
    "source": [
     "## Using Data Loaders in pure PyTorch Lightning\n",
     "\n",
@@ -122,16 +134,18 @@
     "\n",
     "We will use sensaAI only for obtaining torch data loaders (which otherwise would require a few more lines of code)\n",
     "by transforming the data frames to arrays, splitting them and converting them to loaders."
-   ],
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
    "metadata": {
     "collapsed": false,
     "pycharm": {
-     "name": "#%% md\n"
+     "name": "#%%\n"
     }
-   }
-  },
-  {
-   "cell_type": "code",
+   },
+   "outputs": [],
    "source": [
     "VALIDATION_FRACTION = 0.1\n",
     "\n",
@@ -141,31 +155,31 @@
     "train_ds, val_ds = splitter.split(full_ds)\n",
     "train_dataloader = train_ds.toTorchDataLoader()\n",
     "val_dataloader = val_ds.toTorchDataLoader()"
-   ],
+   ]
+  },
+  {
+   "cell_type": "markdown",
    "metadata": {
     "collapsed": false,
     "pycharm": {
-     "name": "#%%\n"
+     "name": "#%% md\n"
     }
    },
-   "execution_count": null,
-   "outputs": []
-  },
-  {
-   "cell_type": "markdown",
    "source": [
     "Now that we have the data loaders, let us forget about sensAI for the moment. We create the model declaration and\n",
     "trainer with pytorch-lightning and fit on the MNIST data"
-   ],
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
    "metadata": {
     "collapsed": false,
     "pycharm": {
-     "name": "#%% md\n"
+     "name": "#%%\n"
     }
-   }
-  },
-  {
-   "cell_type": "code",
+   },
+   "outputs": [],
    "source": [
     "class MNISTModel(pl.LightningModule):\n",
     "\n",
@@ -190,65 +204,63 @@
     "\n",
     "    def configure_optimizers(self):\n",
     "        return torch.optim.Adam(self.parameters(), lr=0.02)"
-   ],
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
    "metadata": {
     "collapsed": false,
     "pycharm": {
      "name": "#%%\n"
     }
    },
-   "execution_count": null,
-   "outputs": []
-  },
-  {
-   "cell_type": "code",
+   "outputs": [],
    "source": [
     "mnist_model = MNISTModel()\n",
     "\n",
     "trainer = pl.Trainer(max_epochs=3, progress_bar_refresh_rate=20)\n",
     "trainer.fit(mnist_model, train_dataloader, val_dataloader)"
-   ],
-   "metadata": {
-    "collapsed": false,
-    "pycharm": {
-     "name": "#%%\n"
-    }
-   },
-   "execution_count": null,
-   "outputs": []
+   ]
   },
   {
    "cell_type": "markdown",
-   "source": [
-    "Let us pick some images from the validation set and look at the results"
-   ],
    "metadata": {
     "collapsed": false,
     "pycharm": {
      "name": "#%% md\n"
     }
-   }
+   },
+   "source": [
+    "Let us pick some images from the validation set and look at the results"
+   ]
   },
   {
    "cell_type": "code",
+   "execution_count": null,
+   "metadata": {
+    "collapsed": false,
+    "pycharm": {
+     "name": "#%%\n"
+    }
+   },
+   "outputs": [],
    "source": [
     "mini_test_set = val_dataloader.dataset[10:20]\n",
     "test_images, test_labels = mini_test_set\n",
     "\n",
     "display(mnist_model(test_images).argmax(axis=1))\n",
     "display(test_labels)"
-   ],
+   ]
+  },
+  {
+   "cell_type": "markdown",
    "metadata": {
     "collapsed": false,
     "pycharm": {
-     "name": "#%%\n"
+     "name": "#%% md\n"
     }
    },
-   "execution_count": null,
-   "outputs": []
-  },
-  {
-   "cell_type": "markdown",
    "source": [
     "## Wrapping the Model with sensAI\n",
     "\n",
@@ -257,122 +269,129 @@
     "\n",
     "This model maps a tensor to a single label, so the correct class to wrap it with is `PLTensorToScalarClassificationModel`,\n",
     "where the `PL` prefix stands for pytorch-lightning."
-   ],
-   "metadata": {
-    "collapsed": false,
-    "pycharm": {
-     "name": "#%% md\n"
-    }
-   }
+   ]
   },
   {
    "cell_type": "code",
    "execution_count": null,
+   "metadata": {
+    "collapsed": false,
+    "pycharm": {
+     "name": "#%%\n"
+    }
+   },
    "outputs": [],
    "source": [
     "mnist_model = MNISTModel()\n",
     "trainer = pl.Trainer(max_epochs=3, progress_bar_refresh_rate=20)\n",
     "sensaiMnistModel = PLTensorToScalarClassificationModel(mnist_model, trainer, validationFraction=VALIDATION_FRACTION)"
-   ],
+   ]
+  },
+  {
+   "cell_type": "markdown",
    "metadata": {
     "collapsed": false,
     "pycharm": {
-     "name": "#%%\n"
+     "name": "#%% md\n"
     }
-   }
-  },
-  {
-   "cell_type": "markdown",
+   },
    "source": [
     "NB: Even without dedicated wrappers, it would require only a few more lines of code to get a custom implementation of\n",
     "a suitable sensAI base class that wraps one's model."
-   ],
+   ]
+  },
+  {
+   "cell_type": "markdown",
    "metadata": {
     "collapsed": false,
     "pycharm": {
      "name": "#%% md\n"
     }
-   }
-  },
-  {
-   "cell_type": "markdown",
+   },
    "source": [
     "With the wrapped model, we can fit directly on the data frames. We don't lose any of the niceties that pytorch-lightning\n",
     "brings to the game (both the original model and the trainer are available in `sensaiMnistModel`). By wrapping the\n",
     "model and trainer we gain all the safety, transparency, flexibility in feature engineering as well\n",
     "as extensive support for model evaluation that sensAI is all about."
-   ],
-   "metadata": {
-    "collapsed": false,
-    "pycharm": {
-     "name": "#%% md\n"
-    }
-   }
+   ]
   },
   {
    "cell_type": "code",
    "execution_count": null,
+   "metadata": {},
    "outputs": [],
    "source": [
-    "sensaiMnistModel.fit(X, labels)"
-   ],
+    "display(labels.dtypes)\n",
+    "np.stack(np.stack(labels.values, axis=1).squeeze(), axis=0).shape"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
    "metadata": {
     "collapsed": false,
     "pycharm": {
      "name": "#%%\n"
     }
-   }
+   },
+   "outputs": [],
+   "source": [
+    "sensaiMnistModel.fit(X, labels)"
+   ]
   },
   {
    "cell_type": "markdown",
-   "source": [
-    "The wrapped model performs predictions on data frames. Let us take some points from the training set,\n",
-    "perform a prediction on them and have a look at the true labels"
-   ],
    "metadata": {
     "collapsed": false,
     "pycharm": {
      "name": "#%% md\n"
     }
-   }
+   },
+   "source": [
+    "The wrapped model performs predictions on data frames. Let us take some points from the training set,\n",
+    "perform a prediction on them and have a look at the true labels"
+   ]
   },
   {
    "cell_type": "code",
    "execution_count": null,
+   "metadata": {
+    "collapsed": false,
+    "pycharm": {
+     "name": "#%%\n"
+    }
+   },
    "outputs": [],
    "source": [
     "display(\"Predicted data frame\")\n",
     "display(sensaiMnistModel.predict(X.iloc[:10]))\n",
     "display(\"True labels data frame\")\n",
     "display(labels.iloc[:10])"
-   ],
+   ]
+  },
+  {
+   "cell_type": "markdown",
    "metadata": {
     "collapsed": false,
     "pycharm": {
-     "name": "#%%\n"
+     "name": "#%% md\n"
     }
-   }
-  },
-  {
-   "cell_type": "markdown",
+   },
    "source": [
     "## Evaluating Tensor Models\n",
     "\n",
     "TODO - the evaluation part is unfinished yet (although we could already the above classifier with the standard\n",
     "vector model evaluators).\n",
     "We should also include TensorToTensor models here and show how to evaluate them\n"
-   ],
-   "metadata": {
-    "collapsed": false,
-    "pycharm": {
-     "name": "#%% md\n"
-    }
-   }
+   ]
   }
  ],
  "metadata": {
+  "interpreter": {
+   "hash": "9b3442ae4bdb9561e722e28424c33a03c16d40b3aa50369b79d367cad7b1adea"
+  },
   "kernelspec": {
-   "display_name": "Python 3",
+   "display_name": "Python 3.7.9 ('sensai')",
    "language": "python",
    "name": "python3"
   },
@@ -386,9 +405,9 @@
    "name": "python",
    "nbconvert_exporter": "python",
    "pygments_lexer": "ipython3",
-   "version": "3.7.7"
+   "version": "3.8.13"
   }
  },
  "nbformat": 4,
  "nbformat_minor": 1
-}
\ No newline at end of file
+}

From aff0809962ce53a667f29a96d5a38e8668b8fc1b Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Mon, 16 May 2022 23:02:23 +0200
Subject: [PATCH 045/131] Renamed notebooks to use all lower-case and no spaces

---
 .../{Clustering Evaluation.ipynb => clustering_evaluation.ipynb}  | 0
 ...to Coordinate Clustering.ipynb => coordinate_clustering.ipynb} | 0
 notebooks/{Intro to sensAI.ipynb => intro_old.ipynb}              | 0
 ...Torchlightning.ipynb => tensor_models_pytorch_lightning.ipynb} | 0
 .../{Tracking Experiments.ipynb => tracking_experiments.ipynb}    | 0
 5 files changed, 0 insertions(+), 0 deletions(-)
 rename notebooks/{Clustering Evaluation.ipynb => clustering_evaluation.ipynb} (100%)
 rename notebooks/{Intro to Coordinate Clustering.ipynb => coordinate_clustering.ipynb} (100%)
 rename notebooks/{Intro to sensAI.ipynb => intro_old.ipynb} (100%)
 rename notebooks/{Tensor Models with Torchlightning.ipynb => tensor_models_pytorch_lightning.ipynb} (100%)
 rename notebooks/{Tracking Experiments.ipynb => tracking_experiments.ipynb} (100%)

diff --git a/notebooks/Clustering Evaluation.ipynb b/notebooks/clustering_evaluation.ipynb
similarity index 100%
rename from notebooks/Clustering Evaluation.ipynb
rename to notebooks/clustering_evaluation.ipynb
diff --git a/notebooks/Intro to Coordinate Clustering.ipynb b/notebooks/coordinate_clustering.ipynb
similarity index 100%
rename from notebooks/Intro to Coordinate Clustering.ipynb
rename to notebooks/coordinate_clustering.ipynb
diff --git a/notebooks/Intro to sensAI.ipynb b/notebooks/intro_old.ipynb
similarity index 100%
rename from notebooks/Intro to sensAI.ipynb
rename to notebooks/intro_old.ipynb
diff --git a/notebooks/Tensor Models with Torchlightning.ipynb b/notebooks/tensor_models_pytorch_lightning.ipynb
similarity index 100%
rename from notebooks/Tensor Models with Torchlightning.ipynb
rename to notebooks/tensor_models_pytorch_lightning.ipynb
diff --git a/notebooks/Tracking Experiments.ipynb b/notebooks/tracking_experiments.ipynb
similarity index 100%
rename from notebooks/Tracking Experiments.ipynb
rename to notebooks/tracking_experiments.ipynb

From 53abc9112b4ac8657fe3b71ac3bb2bd7dd0cf483 Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Mon, 16 May 2022 23:12:04 +0200
Subject: [PATCH 046/131] Fixed link to other notebook

---
 notebooks/tracking_experiments.ipynb | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/notebooks/tracking_experiments.ipynb b/notebooks/tracking_experiments.ipynb
index c539a9de..7ee4b0ff 100644
--- a/notebooks/tracking_experiments.ipynb
+++ b/notebooks/tracking_experiments.ipynb
@@ -77,7 +77,7 @@
     "\n",
     "The main entrypoint to reproducible experiments is the evaluator api. We will use clustering evaluation for\n",
     "demonstration purposes. We load the data and create a SupervisedClusteringEvaluator, see\n",
-    "[intro to evaluation](Clustering%20Evaluation.ipynb) for more details.\n",
+    "[intro to evaluation](clustering_evaluation.ipynb) for more details.\n",
     "\n",
     "[comment]: <> (TODO - use some VectorModel with an sklearn dataset instead, move the notebook to sensAI repo)"
    ],

From b6c349ea75c9ce52731753ef40f68b1ca372344a Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Wed, 18 May 2022 00:07:42 +0200
Subject: [PATCH 047/131] Relaxed requirements of all extras, storing all
 extras dependencies in files (requirements_<extra>.txt)

---
 requirements-relaxed.txt      |  3 ++-
 requirements.txt              |  2 ++
 requirements_geoanalytics.txt |  6 +++++
 requirements_lightgbm.txt     |  3 +++
 requirements_tensorflow.txt   |  3 +++
 requirements_torch.txt        |  4 +++
 setup.py                      | 49 +++++++++++++++++++++++++----------
 tox.ini                       | 16 +++++++-----
 8 files changed, 66 insertions(+), 20 deletions(-)
 create mode 100644 requirements_geoanalytics.txt
 create mode 100644 requirements_lightgbm.txt
 create mode 100644 requirements_tensorflow.txt
 create mode 100644 requirements_torch.txt

diff --git a/requirements-relaxed.txt b/requirements-relaxed.txt
index 1f97947c..645eba2e 100644
--- a/requirements-relaxed.txt
+++ b/requirements-relaxed.txt
@@ -1,4 +1,5 @@
-# this is a relaxed version of requirements.txt where newer versions are allowed
+# sensAI main requirements
+# This is a relaxed version with lower bounds, which exists only for inclusion in environment.yml (developer environment)
 pandas>=1.0.0
 scipy>=1.4
 numpy>=1.18.0
diff --git a/requirements.txt b/requirements.txt
index 9cd84cbe..965c93f6 100644
--- a/requirements.txt
+++ b/requirements.txt
@@ -1,3 +1,5 @@
+# sensAI main requirements
+# These are the pinned lowest versions we test; setup.py relaxes them, changing them to lower bounds
 pandas~=1.0.0
 scipy~=1.4
 numpy~=1.18.0
diff --git a/requirements_geoanalytics.txt b/requirements_geoanalytics.txt
new file mode 100644
index 00000000..6395d261
--- /dev/null
+++ b/requirements_geoanalytics.txt
@@ -0,0 +1,6 @@
+# Requirements for extra 'geoanalytics'
+# These are the pinned lowest versions we test; setup.py relaxes them, changing them to lower bounds
+networkx==2.4
+Shapely~=1.7.0
+geopandas==0.7.0
+utm==0.7.0
diff --git a/requirements_lightgbm.txt b/requirements_lightgbm.txt
new file mode 100644
index 00000000..cbe441d5
--- /dev/null
+++ b/requirements_lightgbm.txt
@@ -0,0 +1,3 @@
+# Requirements for extra 'lightgbm'
+# These are the pinned lowest versions we test; setup.py relaxes them, changing them to lower bounds
+lightgbm==2.3.0
diff --git a/requirements_tensorflow.txt b/requirements_tensorflow.txt
new file mode 100644
index 00000000..52ab1364
--- /dev/null
+++ b/requirements_tensorflow.txt
@@ -0,0 +1,3 @@
+# Requirements for extra 'tensorflow'
+# These are the pinned lowest versions we test; setup.py relaxes them, changing them to lower bounds
+tensorflow==1.15.0
diff --git a/requirements_torch.txt b/requirements_torch.txt
new file mode 100644
index 00000000..cf3fedf3
--- /dev/null
+++ b/requirements_torch.txt
@@ -0,0 +1,4 @@
+# Requirements for extra 'torch'
+# These are the pinned lowest versions we test; setup.py relaxes them, changing them to lower bounds
+torch==1.4.0
+torchtext==0.5.0
diff --git a/setup.py b/setup.py
index 665a2b45..e6caad2e 100644
--- a/setup.py
+++ b/setup.py
@@ -1,5 +1,7 @@
+import functools
 import re
 from typing import Iterable, Dict
+from glob import glob
 
 from setuptools import setup, find_namespace_packages
 
@@ -9,15 +11,26 @@
 geoanalytics_requirements = ['networkx==2.4', 'Shapely~=1.7.0', 'geopandas==0.7.0', 'utm==0.7.0']
 
 
-# list of dependencies where ==/~= dependencies (used by us, particularly in requirements.txt) are relaxed:
+# list of dependencies where ==/~= dependencies (used in requirements.txt and for the extras in requirements_*.txt) are relaxed:
 # any later version is OK (as long as we are not aware of a concrete limitation - and once we are, we shall define
 # the respective upper bound below)
-# TODO: check if we can relax all of the optional requirements as well (above)
-DEPS_VERSION_LOWER_BOUND = ["pandas", "scipy", "numpy", "scikit-learn", "seaborn", "typing-extensions"]
+DEPS_VERSION_LOWER_BOUND = [
+    # main
+    "pandas", "scipy", "numpy", "scikit-learn", "seaborn", "typing-extensions",
+    # extra "torch"
+    "torch", "torchtext",
+    # extra "tensorflow"
+    "tensorflow",
+    # extra "lightgbm"
+    "lightgbm",
+    # extra "geoanalytics"
+    "networkx", "Shapely", "geopandas", "utm",
+]
+# upper bound: map dependency name to lowest excluded version
 DEPS_VERSION_UPPER_BOUND_EXCLUSIVE: Dict[str, str] = {}
 
 
-def required_packages(deps: Iterable[str]):
+def relaxed_requirements(deps: Iterable[str]):
     """
     :param deps: the set of requirements
     :return: the set of updated requirements with the relaxations defined above applied
@@ -25,6 +38,8 @@ def required_packages(deps: Iterable[str]):
     updated_deps = []
     for dep in deps:
         dep = dep.strip()
+        if dep.startswith("#"):
+            continue
         m = re.match(r'([\w-]+)[=~]=', dep)  # match package with == or ~= version spec
         if m:
             package = m.group(1)
@@ -37,6 +52,20 @@ def required_packages(deps: Iterable[str]):
     return updated_deps
 
 
+def relaxed_requirements_from_file(path):
+    with open(path, "r") as f:
+        return relaxed_requirements(f.readlines())
+
+
+# create extras requirements from requirements_*.txt, and add "full" extras which combines them all
+extras_require = {}
+for extras_requirements_file in glob("requirements_*.txt"):
+    m = re.match(r"requirements_(\w+).txt", extras_requirements_file)
+    extra_name = m.group(1)
+    extras_require[extra_name] = relaxed_requirements_from_file(extras_requirements_file)
+extras_require["full"] = functools.reduce(lambda x, y: x + y, list(extras_require.values()))
+
+
 setup(
     name='sensai',
     package_dir={"": "src"},
@@ -46,15 +75,9 @@ def required_packages(deps: Iterable[str]):
     include_package_data=True,
     version='0.1.6',
     description='Library for sensible AI',
-    install_requires=required_packages(open("requirements.txt").readlines()),
+    install_requires=relaxed_requirements_from_file("requirements.txt"),
     dependency_links=["https://download.pytorch.org/whl/torch_stable.html"],
     setup_requires=["wheel"],
-    extras_require={
-        "torch": torch_requirements,
-        "tensorflow": tf_requirements,
-        "lightgbm": lightgbm_requirements,
-        "geoanalytics": geoanalytics_requirements,
-        "full": tf_requirements + torch_requirements + lightgbm_requirements + geoanalytics_requirements
-    },
+    extras_require=extras_require,
     author='jambit GmbH'
-)
\ No newline at end of file
+)
diff --git a/tox.ini b/tox.ini
index 51eba350..4d0187d2 100644
--- a/tox.ini
+++ b/tox.ini
@@ -23,23 +23,27 @@ deps =
     jupyter==1.0.0
     nbconvert==6.5.0
     clearml==0.17.1
-;   TODO: For some reason including this into setup.py makes things slow locally, fail silently on gitlab
-;     and lead to non-ending builds (2.5h+) on github. This dependency should be installable with pip install sensai[torch] though...
+; NOTE: For some reason including this into setup.py makes things slow locally, fail silently on gitlab
+;     and lead to non-ending builds (2.5h+) on github. We might want to add it to extra "torch" though (sensai[torch])
     pytorch-lightning~=1.1.0
+; pin all versions to the lowest tested ones from the requirements files
     -rrequirements.txt
-extras =
-    full
+    -rrequirements_torch.txt
+    -rrequirements_lightgbm.txt
+    -rrequirements_geoanalytics.txt
+    -rrequirements_tensorflow.txt
 
-# TODO or not TODO: notebooks are not executed here again (the build would become very slow) so they are not tested with
+# NOTE: notebooks are not executed here again (the build would become very slow) so they are not tested with
 #   latest dependencies. Hopefully, this is not a problem
 [testenv:py_latest_dependencies]
 commands =
     pytest
 deps =
     pytest
-;   TODO: For some reason including this into setup.py makes things slow locally, fail silently on gitlab
+;   NOTE: For some reason including this into setup.py makes things slow locally, fail silently on gitlab
 ;     and lead to non-ending builds (2.5h+) on github. This dependency should be installable with pip install sensai[torch] though...
     pytorch-lightning>=1.1
+; no pinned requirements included, so relaxed versions created by setup.py apply
 extras =
     full
 

From 3b286d1d97c8861b6058195fbf0b06a9c7cab222 Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Wed, 18 May 2022 00:55:50 +0200
Subject: [PATCH 048/131] Raised tensorflow version to ~2.0

---
 requirements_tensorflow.txt | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/requirements_tensorflow.txt b/requirements_tensorflow.txt
index 52ab1364..dc5d55bb 100644
--- a/requirements_tensorflow.txt
+++ b/requirements_tensorflow.txt
@@ -1,3 +1,3 @@
 # Requirements for extra 'tensorflow'
 # These are the pinned lowest versions we test; setup.py relaxes them, changing them to lower bounds
-tensorflow==1.15.0
+tensorflow~=2.0

From cdadb9f54ddee0dfecc268d88e09e7c9859d5e77 Mon Sep 17 00:00:00 2001
From: Dominik Jain <dominik.jain@jambit.com>
Date: Wed, 18 May 2022 18:32:53 +0200
Subject: [PATCH 049/131] Sync pjm

  commit 854a4464debc16ae2b537603b915a784c0caf394
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Wed May 18 18:27:42 2022 +0200

      EvalStatsCollection.plotDistribution: More flexibility, added docstring, changed stat to 'percent'

  sensai/evaluation/eval_stats/eval_stats_base.py

  commit a3b24423e07edf1f89b5e3a419ed3e208beed5e9
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Tue May 17 21:03:36 2022 +0200

      Improved docstrings

  sensai/evaluation/eval_stats/eval_stats_base.py
  sensai/evaluation/eval_stats/eval_stats_classification.py
  sensai/evaluation/eval_stats/eval_stats_regression.py

  commit 4017596698553d572fd9374d100165fe28ec0c85
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Tue May 17 21:01:08 2022 +0200

      EvalStatsCollection: Added getMetricNames; made plotDistribution more flexible and return figure

  sensai/evaluation/eval_stats/eval_stats_base.py

  commit 90c6e1440cfe23cac6ee1218ffec567e942521de
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Tue May 17 21:00:13 2022 +0200

      MultiDataEvaluationUtil.compareModels: Return a results object with all EvalStats objects

  sensai/evaluation/eval_util.py

  commit 9d74ef709ad1e5e68c944c6cfce5f10fbde205b8
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Mon May 16 20:26:05 2022 +0200

      WeightedMean: Added toString and default for weight (1)

  sensai/util/aggregation.py

  commit 2f28506291b7dd38c470c57189037c76853d590c
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Mon May 16 20:25:30 2022 +0200

      TimeInterval: Added methods midTimestamp and intersection

  sensai/util/time.py

  commit 3c0a683cba63235b9a107a66a00344884241f090
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Fri May 13 10:46:31 2022 +0200

      MultiDataEvaluationUtil.compareModels: Exclude columns with NaN values from aggregations

  sensai/evaluation/eval_util.py

  commit db09a71baeef9352d00fcd391172b3fb5b5abdd2
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Thu May 12 16:47:01 2022 +0200

      Added BinaryClassificationMetricRecallForPrecision

  sensai/evaluation/eval_stats/eval_stats_classification.py

  commit 00bf3fec5ef0940235ceaae85576bdf8a417eab3
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Thu May 12 15:32:59 2022 +0200

      Improved handling of positive label for binary classification, differentiating 'guess' from 'none';
      Add class label to metric names (if not one of obvious positive candidates)

  sensai/evaluation/eval_stats/eval_stats_classification.py
  sensai/evaluation/evaluator.py

  commit fa6730ed1b51a3bf7636ba1279fad2ce7d024498
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Thu May 12 11:33:29 2022 +0200

      * EvaluationUtil.compareModels: Changed interface to return a result object (ModelComparisonData)
        that contains all the model-specific evaluation data, removing the old mechanism
        of returning EvalStats in the data frame
      * Introduced ModelComparisonVisitor for custom data collection during
        model comparisons
      * Added ModelComparisonVisitorAggregatedFeatureImportances

  sensai/evaluation/eval_util.py

  commit daafa582daeea3995aff3d61807b5e4f30a88d49
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Thu May 12 11:31:52 2022 +0200

      Added module sklearn_util with class AggregatedFeatureImportances

  sensai/sklearn/sklearn_util.py

  commit bc54e1cc01b2df7b9a324fd5c0efe7f4ebdfd12a
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Thu May 12 11:28:54 2022 +0200

      SkLearnRandomForestVectorClassificationModel: Added getFeatureImportances

  sensai/sklearn/sklearn_classification.py

  commit 6eeef3f2f5408225bedb21087039195e9af6a657
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Tue May 10 20:29:59 2022 +0200

      dictString: More general type annotation

  sensai/util/string.py

  commit 7610be3fbc9bcaf0cb6d3fd68d9f01025b6fe08a
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Tue May 10 10:39:34 2022 +0200

      Added TimeInterval.timeDelta

  sensai/util/time.py

  commit 1b62c6300785734c05e1041cb00f59e745726896
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Mon May 9 16:42:51 2022 +0200

      Added util.time.TimeInterval

  sensai/util/time.py

  commit 6b2bdfbb3bbe0c0fd4cbf6c0d4a1589d6fc647f6
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Sun May 8 19:19:45 2022 +0200

      Fixed log levels, removed obsolete TODO

  sensai/clustering/greedy_clustering.py

  commit a1dd70be7ca57bc1b9872ef0c73851046229a65e
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Sun May 8 19:12:59 2022 +0200

      Added module geoanalytics.geo_clustering with GreedyAgglomerativeGeoCoordClusterer

  sensai/geoanalytics/geo_clustering.py

  commit 89815d24fa689b67b6fc2091d52ac1f67da7f3df
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Sun May 8 19:09:50 2022 +0200

      Improved docstring

  sensai/featuregen.py

  commit 0fc4f67c752a4642dfd01f86c2b82ea79c8e30cc
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Sun May 8 19:07:55 2022 +0200

       * Added GeoCoord.meanCoord
       * Module geo_coords: Moved local_coord import into the only function that uses it
         to minimise transitive external dependencies of geo_coords

  sensai/geoanalytics/geo_coords.py
---
 src/sensai/clustering/greedy_clustering.py    |   3 +-
 .../evaluation/eval_stats/eval_stats_base.py  |  32 ++-
 .../eval_stats/eval_stats_classification.py   |  60 ++++--
 .../eval_stats/eval_stats_regression.py       |   3 -
 src/sensai/evaluation/eval_util.py            | 184 ++++++++++++++----
 src/sensai/evaluation/evaluator.py            |   5 +-
 src/sensai/featuregen.py                      |   4 +-
 src/sensai/geoanalytics/geo_clustering.py     |  80 ++++++++
 src/sensai/geoanalytics/geo_coords.py         |  13 +-
 src/sensai/sklearn/sklearn_classification.py  |   5 +-
 src/sensai/sklearn/sklearn_util.py            |  44 +++++
 src/sensai/util/aggregation.py                |   9 +-
 src/sensai/util/string.py                     |   4 +-
 src/sensai/util/time.py                       |  24 +++
 14 files changed, 394 insertions(+), 76 deletions(-)
 create mode 100644 src/sensai/geoanalytics/geo_clustering.py
 create mode 100644 src/sensai/sklearn/sklearn_util.py

diff --git a/src/sensai/clustering/greedy_clustering.py b/src/sensai/clustering/greedy_clustering.py
index cfb43165..475f0ae7 100644
--- a/src/sensai/clustering/greedy_clustering.py
+++ b/src/sensai/clustering/greedy_clustering.py
@@ -8,7 +8,6 @@
 log = logging.getLogger(__name__)
 
 
-# TODO: implement an adapter or wrapper such that we get a GreedyAgglomerativeClusteringModel class
 class GreedyAgglomerativeClustering(object):
     """
     An implementation of greedy agglomerative clustering which avoids unnecessary 
@@ -69,7 +68,7 @@ def applyClustering(self) -> List[Cluster]:
             clusters merged into them)
         """
         # compute all possible merges, adding them to the priority queue
-        self.log.info("Computing initial merges")
+        self.log.debug("Computing initial merges")
         for idx, wc in enumerate(self.wrappedClusters):
             self.log.debug("Computing potential merges for cluster index %d" % idx)
             wc.computeMerges(False)
diff --git a/src/sensai/evaluation/eval_stats/eval_stats_base.py b/src/sensai/evaluation/eval_stats/eval_stats_base.py
index af6d1080..57bd34a6 100644
--- a/src/sensai/evaluation/eval_stats/eval_stats_base.py
+++ b/src/sensai/evaluation/eval_stats/eval_stats_base.py
@@ -89,6 +89,9 @@ def __init__(self, evalStatsList: List[TEvalStats]):
     def getValues(self, metric):
         return self.metrics[metric]
 
+    def getMetricNames(self) -> List[str]:
+        return list(self.metrics.keys())
+
     def aggStats(self):
         agg = {}
         for metric, values in self.metrics.items():
@@ -101,11 +104,27 @@ def meanStats(self):
         metrics.update({f"StdDev[{metric}]": np.std(values) for (metric, values) in self.metrics.items()})
         return metrics
 
-    def plotDistribution(self, metric):
-        values = self.metrics[metric]
-        plt.figure()
-        plt.title(metric)
-        sns.distplot(values)
+    def plotDistribution(self, metricName: str, subtitle: Optional[str] = None, bins=None, kde=True, stat="percent",
+            **kwargs) -> plt.Figure:
+        """
+        Plots the distribution of a metric as a histogram
+
+        :param metricName: the name of the metric for which to plot the distribution (histogram) across evaluations
+        :param subtitle: the subtitle to add, if any
+        :param bins: the histogram bins (number of bins or boundaries); if None, auto
+        :param kde: whether to add a kernel density estimator plot
+        :param stat: the statistic to compute for each bin ('percent', 'probability', 'count', 'frequency' or 'density'), y-axis value
+        :param kwargs: additional parameters to pass to seaborn.histplot (see https://seaborn.pydata.org/generated/seaborn.histplot.html)
+        :return: the figure in which the histogram was plotted
+        """
+        values = self.metrics[metricName]
+        fig = plt.figure()
+        title = metricName
+        if subtitle is not None:
+            title += "\n" + subtitle
+        plt.title(title)
+        sns.histplot(values, kde=kde, bins=bins, stat=stat, **kwargs)
+        return fig
 
     def toDataFrame(self) -> pd.DataFrame:
         """
@@ -120,6 +139,9 @@ def toDataFrame(self) -> pd.DataFrame:
 
     @abstractmethod
     def getGlobalStats(self) -> TEvalStats:
+        """
+        :return: an EvalStats object that combines the data from all contained EvalStats objects
+        """
         pass
 
     def __str__(self):
diff --git a/src/sensai/evaluation/eval_stats/eval_stats_classification.py b/src/sensai/evaluation/eval_stats/eval_stats_classification.py
index 8db7806c..0b383168 100644
--- a/src/sensai/evaluation/eval_stats/eval_stats_classification.py
+++ b/src/sensai/evaluation/eval_stats/eval_stats_classification.py
@@ -17,6 +17,8 @@
 
 log = logging.getLogger(__name__)
 
+
+GUESS = ("__guess",)
 BINARY_CLASSIFICATION_POSITIVE_LABEL_CANDIDATES = [1, True, "1", "True"]
 
 
@@ -86,6 +88,9 @@ def _computeValue(self, y_true, y_predicted, y_predictedClassProbabilities):
 
 class BinaryClassificationMetric(ClassificationMetric, ABC):
     def __init__(self, positiveClassLabel, name: str = None):
+        name = name if name is not None else self.__class__.name
+        if positiveClassLabel not in BINARY_CLASSIFICATION_POSITIVE_LABEL_CANDIDATES:
+            name = f"{name}[{positiveClassLabel}]"
         super().__init__(name)
         self.positiveClassLabel = positiveClassLabel
 
@@ -120,6 +125,30 @@ def _computeValue(self, y_true, y_predicted, y_predictedClassProbabilities):
         return f1_score(y_true, y_predicted, pos_label=self.positiveClassLabel)
 
 
+class BinaryClassificationMetricRecallForPrecision(BinaryClassificationMetric):
+    """
+    Computes the maximum recall that can be achieved in cases where at least the given precision is reached.
+    The given precision may not be achievable at all, in which case the metric value is NaN.
+    """
+    def __init__(self, precision: float, positiveClassLabel):
+        self.minPrecision = precision
+        super().__init__(positiveClassLabel, name=f"recallForPrecision[{precision}]")
+
+    def computeValueForEvalStats(self, evalStats: "ClassificationEvalStats"):
+        varData = evalStats.getBinaryClassificationProbabilityThresholdVariationData()
+        result = np.nan
+        for c in varData.counts:
+            precision = c.getPrecision()
+            if precision >= self.minPrecision:
+                recall = c.getRecall()
+                if np.isnan(result) or result < recall:
+                    result = recall
+        return result
+
+    def _computeValue(self, y_true, y_predicted, y_predictedClassProbabilities):
+        raise NotImplementedError(f"{self.__class__.__qualname__} only supports computeValueForEvalStats")
+
+
 class ClassificationEvalStats(PredictionEvalStats["ClassificationMetric"]):
     def __init__(self, y_predicted: PredictionArray = None,
             y_true: PredictionArray = None,
@@ -127,7 +156,7 @@ def __init__(self, y_predicted: PredictionArray = None,
             labels: PredictionArray = None,
             metrics: Sequence["ClassificationMetric"] = None,
             additionalMetrics: Sequence["ClassificationMetric"] = None,
-            binaryPositiveLabel=None):
+            binaryPositiveLabel=GUESS):
         """
         :param y_predicted: the predicted class labels
         :param y_true: the true class labels
@@ -135,10 +164,11 @@ def __init__(self, y_predicted: PredictionArray = None,
         :param labels: the list of class labels
         :param metrics: the metrics to compute for evaluation; if None, use default metrics
         :param additionalMetrics: the metrics to additionally compute
-        :param binaryPositiveLabel: the label of the positive class for the case where it is a binary classification;
-            if None, check `labels` for occurrence of one of BINARY_CLASSIFICATION_POSITIVE_LABEL_CANDIDATES in the respective
-            order, and if none of these appear in `labels`, the classification will not be treated as a binary classification and
-            a warning will be logged
+        :param binaryPositiveLabel: the label of the positive class for the case where it is a binary classification, adding further
+            binary metrics by default;
+            if GUESS (default), check `labels` (if length 2) for occurrence of one of BINARY_CLASSIFICATION_POSITIVE_LABEL_CANDIDATES in
+            the respective order and use the first one found (if any);
+            if None, treat the problem as non-binary, regardless of the labels being used.
         """
         self.labels = labels
         self.y_predictedClassProbabilities = y_predictedClassProbabilities
@@ -151,16 +181,21 @@ def __init__(self, y_predicted: PredictionArray = None,
                 raise ValueError("Row count in class probabilities data frame does not match ground truth")
 
         numLabels = len(labels)
-        if binaryPositiveLabel is not None:
-            if numLabels != 2:
-                raise ValueError(f"Passed binaryPositiveLabel for non-binary classification (labels={self.labels})")
-            if binaryPositiveLabel not in self.labels:
-                raise ValueError(f"The binary positive label {binaryPositiveLabel} does not appear in labels={labels}")
-        else:
+        if binaryPositiveLabel == GUESS:
+            foundCandidateLabel = False
             if numLabels == 2:
                 for c in BINARY_CLASSIFICATION_POSITIVE_LABEL_CANDIDATES:
                     if c in labels:
                         binaryPositiveLabel = c
+                        foundCandidateLabel = True
+                        break
+            if not foundCandidateLabel:
+                binaryPositiveLabel = None
+        elif binaryPositiveLabel is not None:
+            if numLabels != 2:
+                log.warning(f"Passed binaryPositiveLabel for non-binary classification (labels={self.labels})")
+            if binaryPositiveLabel not in self.labels:
+                log.warning(f"The binary positive label {binaryPositiveLabel} does not appear in labels={labels}")
         if numLabels == 2 and binaryPositiveLabel is None:
             log.warning(f"Binary classification (labels={labels}) without specification of positive class label; binary classification metrics will not be considered")
         self.binaryPositiveLabel = binaryPositiveLabel
@@ -239,9 +274,6 @@ def __init__(self, evalStatsList: List[ClassificationEvalStats]):
         self.globalStats = None
 
     def getGlobalStats(self) -> ClassificationEvalStats:
-        """
-        Gets an evaluation statistics object that combines the data from all contained eval stats objects
-        """
         if self.globalStats is None:
             y_true = np.concatenate([evalStats.y_true for evalStats in self.statsList])
             y_predicted = np.concatenate([evalStats.y_predicted for evalStats in self.statsList])
diff --git a/src/sensai/evaluation/eval_stats/eval_stats_regression.py b/src/sensai/evaluation/eval_stats/eval_stats_regression.py
index 2a8732d9..16e557e1 100644
--- a/src/sensai/evaluation/eval_stats/eval_stats_regression.py
+++ b/src/sensai/evaluation/eval_stats/eval_stats_regression.py
@@ -266,9 +266,6 @@ def __init__(self, evalStatsList: List[RegressionEvalStats]):
         self.globalStats = None
 
     def getGlobalStats(self) -> RegressionEvalStats:
-        """
-        Gets an evaluation statistics object that combines the data from all contained eval stats objects
-        """
         if self.globalStats is None:
             y_true = np.concatenate([evalStats.y_true for evalStats in self.statsList])
             y_predicted = np.concatenate([evalStats.y_predicted for evalStats in self.statsList])
diff --git a/src/sensai/evaluation/eval_util.py b/src/sensai/evaluation/eval_util.py
index 79d0bfd8..5294365f 100644
--- a/src/sensai/evaluation/eval_util.py
+++ b/src/sensai/evaluation/eval_util.py
@@ -9,7 +9,8 @@
 import logging
 from abc import ABC, abstractmethod
 from collections import defaultdict
-from typing import Tuple, Dict, Any, Union, Generic, TypeVar, Optional, Sequence, Callable, Set
+from dataclasses import dataclass
+from typing import Tuple, Dict, Any, Union, Generic, TypeVar, Optional, Sequence, Callable, Set, Iterable, List
 
 import matplotlib.figure
 import matplotlib.pyplot as plt
@@ -30,6 +31,7 @@
     VectorRegressionModelEvaluationData, VectorClassificationModelEvaluator, VectorClassificationModelEvaluationData, \
     VectorRegressionModelEvaluatorParams, VectorClassificationModelEvaluatorParams, VectorModelEvaluatorParams
 from ..data import InputOutputData
+from ..sklearn.sklearn_util import AggregatedFeatureImportances
 from ..util.io import ResultWriter
 from ..util.string import prettyStringRepr
 from ..vector_model import VectorClassificationModel, VectorRegressionModel, VectorModel
@@ -302,7 +304,7 @@ def performCrossValidation(self, model: TModel, showPlots=False, logResults=True
 
     def compareModels(self, models: Sequence[TModel], resultWriter: Optional[ResultWriter] = None, useCrossValidation=False,
             fitModels=True, writeIndividualResults=True, sortColumn: Optional[str] = None, sortAscending: bool = True,
-            includeEvalStatsObjects=False) -> pd.DataFrame:
+            visitors: Optional[Iterable["ModelComparisonVisitor"]] = None) -> "ModelComparisonData":
         """
         Compares several models via simple evaluation or cross-validation
 
@@ -315,50 +317,54 @@ def compareModels(self, models: Sequence[TModel], resultWriter: Optional[ResultW
             summary)
         :param sortColumn: column/metric name by which to sort
         :param sortAscending: whether to sort in ascending order
-        :param includeEvalStatsObjects: whether to include, in addition to the metrics, a column "evalStats" (which holds
-            the classification or regression evaluation data object) in the result data frame
-        :return: a data frame containing evaluation metrics on all models
+        :param visitors: visitors which may process individual results
+        :return: the comparison results
         """
         statsList = []
+        resultByModelName = {}
         for model in models:
+            modelName = model.getName()
             if useCrossValidation:
                 if not fitModels:
                     raise ValueError("Cross-validation necessitates that models be retrained; got fitModels=False")
-                crossValidationResult = self.performCrossValidation(model, resultWriter=resultWriter if writeIndividualResults else None)
-                evalStatsCollection = crossValidationResult.getEvalStatsCollection()
+                crossValData = self.performCrossValidation(model, resultWriter=resultWriter if writeIndividualResults else None)
+                modelResult = ModelComparisonData.Result(crossValData=crossValData)
+                resultByModelName[modelName] = modelResult
+                evalStatsCollection = crossValData.getEvalStatsCollection()
                 statsDict = evalStatsCollection.aggStats()
-                if includeEvalStatsObjects:
-                    statsDict["evalStats"] = evalStatsCollection.getGlobalStats()
             else:
-                evalStats: EvalStats = self.performSimpleEvaluation(model, resultWriter=resultWriter if writeIndividualResults else None,
-                    fitModel=fitModels).getEvalStats()
+                evalData = self.performSimpleEvaluation(model, resultWriter=resultWriter if writeIndividualResults else None,
+                    fitModel=fitModels)
+                modelResult = ModelComparisonData.Result(evalData=evalData)
+                resultByModelName[modelName] = modelResult
+                evalStats = evalData.getEvalStats()
                 statsDict = evalStats.getAll()
-                if includeEvalStatsObjects:
-                    statsDict["evalStats"] = evalStats
-            statsDict["modelName"] = model.getName()
+            statsDict["modelName"] = modelName
             statsList.append(statsDict)
+            if visitors is not None:
+                for visitor in visitors:
+                    visitor.visit(modelName, modelResult)
         resultsDF = pd.DataFrame(statsList).set_index("modelName")
         if sortColumn is not None:
             if sortColumn not in resultsDF.columns:
                 log.warning(f"Requested sort column '{sortColumn}' not in list of columns {list(resultsDF.columns)}")
             else:
                 resultsDF.sort_values(sortColumn, ascending=sortAscending, inplace=True)
-        resultsDFForReporting = resultsDF if not includeEvalStatsObjects else resultsDF.drop(columns="evalStats")
-        strResults = f"Model comparison results:\n{resultsDFForReporting.to_string()}"
+        strResults = f"Model comparison results:\n{resultsDF.to_string()}"
         log.info(strResults)
         if resultWriter is not None:
             suffix = "crossval" if useCrossValidation else "simple-eval"
             strResults += "\n\n" + "\n\n".join([f"{model.getName()} = {str(model)}" for model in models])
             resultWriter.writeTextFile(f"model-comparison-results-{suffix}", strResults)
-        return resultsDF
+        return ModelComparisonData(resultsDF, resultByModelName)
 
-    def compareModelsCrossValidation(self, models: Sequence[TModel], resultWriter: Optional[ResultWriter] = None) -> pd.DataFrame:
+    def compareModelsCrossValidation(self, models: Sequence[TModel], resultWriter: Optional[ResultWriter] = None) -> "ModelComparisonData":
         """
         Compares several models via cross-validation
 
         :param models: the models to compare
         :param resultWriter: a writer with which to store results of the comparison
-        :return: a data frame containing evaluation metrics on all models
+        :return: the comparison results
         """
         return self.compareModels(models, resultWriter=resultWriter, useCrossValidation=True)
 
@@ -445,20 +451,26 @@ def __init__(self, inputOutputDataDict: Dict[str, InputOutputData], keyName: str
         else:
             self.metaDF = None
 
-    def compareModelsCrossValidation(self, modelFactories: Sequence[Callable[[], VectorModel]],
+    def compareModelsCrossValidation(self, modelFactories: Sequence[Callable[[], Union[VectorRegressionModel, VectorClassificationModel]]],
             resultWriter: Optional[ResultWriter] = None, writePerDatasetResults=True,
-            crossValidatorParams: Optional[Dict[str, Any]] = None, columnNameForModelRanking: str = None, rankMax=True) -> Tuple[pd.DataFrame, pd.DataFrame]:
+            crossValidatorParams: Optional[Dict[str, Any]] = None, columnNameForModelRanking: str = None, rankMax=True) -> "MultiDataModelComparisonData":
+        """
+        Deprecated. Use compareModels instead.
+        """
         return self.compareModels(modelFactories, useCrossValidation=True, resultWriter=resultWriter, writePerDatasetResults=writePerDatasetResults,
             crossValidatorParams=crossValidatorParams,
             columnNameForModelRanking=columnNameForModelRanking, rankMax=rankMax)
 
-    def compareModels(self, modelFactories: Sequence[Callable[[], VectorModel]], useCrossValidation=False,
-            resultWriter: Optional[ResultWriter] = None, writePerDatasetResults=True,
+    def compareModels(self, modelFactories: Sequence[Callable[[], Union[VectorRegressionModel, VectorClassificationModel]]],
+            useCrossValidation=False,
+            resultWriter: Optional[ResultWriter] = None,
+            writePerDatasetResults=True,
             evaluatorParams: Optional[Union[VectorRegressionModelEvaluatorParams, VectorClassificationModelEvaluatorParams, Dict[str, Any]]] = None,
             crossValidatorParams: Optional[Union[VectorModelCrossValidatorParams, Dict[str, Any]]] = None,
             columnNameForModelRanking: str = None,
             rankMax=True,
-            createCombinedEvalStatsPlots=False) -> Tuple[pd.DataFrame, pd.DataFrame]:
+            createCombinedEvalStatsPlots=False,
+            visitors: Optional[Iterable["ModelComparisonVisitor"]] = None) -> Union["RegressionMultiDataModelComparisonData", "ClassificationMultiDataModelComparisonData"]:
         """
         :param modelFactories: a sequence of factory functions for the creation of models to evaluate; every factory must result
             in a model with a fixed model name (otherwise results cannot be correctly aggregated)
@@ -473,18 +485,26 @@ def compareModels(self, modelFactories: Sequence[Callable[[], VectorModel]], use
         :param createCombinedEvalStatsPlots: whether to combine, for each type of model, the EvalStats objects from the individual experiments
             into a single objects that holds all results and use it to create plots reflecting the overall result.
             Note that for classification, this is only possible if all individual experiments use the same set of class labels.
+        :param visitors: visitors which may process individual results
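-        :return: a pair of data frames (allDF, meanDF) where allDF contains all the individual evaluation results (one row per data set)
-            and meanDF contains one row for each model with results averaged across datasets
+        :return: an object holding the comparison results, where allResultsDF contains all the individual evaluation results
+            and meanResultsDF contains one row for each model with results averaged across datasets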
         """
-        allResults = pd.DataFrame()
+        allResultsDF = pd.DataFrame()
         evalStatsByModelName = defaultdict(list)
         isRegression = None
         plotCollector: Optional[EvalStatsPlotCollector] = None
+        modelNames = None
 
         for i, (key, inputOutputData) in enumerate(self.inputOutputDataDict.items(), start=1):
             log.info(f"Evaluating models for data set #{i}/{len(self.inputOutputDataDict)}: {self.keyName}={key}")
             models = [f() for f in modelFactories]
 
+            currentModelNames = [model.getName() for model in models]
+            if modelNames is None:
+                modelNames = currentModelNames
+            elif modelNames != currentModelNames:
+                log.warning(f"Model factories do not produce fixed names; use model.withName to name your models. Got {currentModelNames}, previously got {modelNames}")
+
             if isRegression is None:
                 modelsAreRegression = [model.isRegressionModel() for model in models]
                 if all(modelsAreRegression):
@@ -502,7 +522,8 @@ def compareModels(self, modelFactories: Sequence[Callable[[], VectorModel]], use
 
             # compute data frame with results for current data set
             childResultWriter = resultWriter.childForSubdirectory(key) if (writePerDatasetResults and resultWriter is not None) else None
-            df = ev.compareModels(models, useCrossValidation=useCrossValidation, resultWriter=childResultWriter, includeEvalStatsObjects=True)
+            comparisonData = ev.compareModels(models, useCrossValidation=useCrossValidation, resultWriter=childResultWriter, visitors=visitors)
+            df = comparisonData.resultsDF
 
             # augment data frame
             df[self.keyName] = key
@@ -510,35 +531,38 @@ def compareModels(self, modelFactories: Sequence[Callable[[], VectorModel]], use
             df = df.reset_index(drop=True)
 
             # collect eval stats objects by model name and remove from data frame
-            for _, row in df.iterrows():
-                modelName = row.modelName
-                evalStats = row.evalStats
+            for modelName, result in comparisonData.resultByModelName.items():
+                if useCrossValidation:
+                    evalStats = result.crossValData.getEvalStatsCollection().getGlobalStats()
+                else:
+                    evalStats = result.evalData.getEvalStats()
                 evalStatsByModelName[modelName].append(evalStats)
-            df = df.drop(columns="evalStats")
 
-            allResults = pd.concat((allResults, df))
+            allResultsDF = pd.concat((allResultsDF, df))
 
         if self.metaDF is not None:
-            allResults = allResults.join(self.metaDF, on=self.keyName, how="left")
+            allResultsDF = allResultsDF.join(self.metaDF, on=self.keyName, how="left")
 
-        strAllResults = f"All results:\n{allResults.to_string()}"
+        strAllResults = f"All results:\n{allResultsDF.to_string()}"
         log.info(strAllResults)
 
-        allResultsGrouped = allResults.groupby("modelName")
-        meanResults: pd.DataFrame = allResultsGrouped.mean()
-        if columnNameForModelRanking in meanResults:
-            meanResults.sort_values(columnNameForModelRanking, inplace=True, ascending=not rankMax)
-        strMeanResults = f"Mean results (averaged across {len(self.inputOutputDataDict)} data sets):\n{meanResults.to_string()}"
+        # create mean result by model, removing any metrics/columns that produced NaN values
+        # (because the mean would be computed without them, skipna parameter unsupported)
+        allResultsGrouped = allResultsDF.dropna(axis=1).groupby("modelName")
+        meanResultsDF: pd.DataFrame = allResultsGrouped.mean()
+        if columnNameForModelRanking in meanResultsDF:
+            meanResultsDF.sort_values(columnNameForModelRanking, inplace=True, ascending=not rankMax)
+        strMeanResults = f"Mean results (averaged across {len(self.inputOutputDataDict)} data sets):\n{meanResultsDF.to_string()}"
         log.info(strMeanResults)
 
         # create further aggregations
         aggDFs = []
-        for opName, aggFn in [("std", lambda x: x.std()), ("min", lambda x: x.min()), ("max", lambda x: x.max())]:
+        for opName, aggFn in [("mean", lambda x: x.mean()), ("std", lambda x: x.std()), ("min", lambda x: x.min()), ("max", lambda x: x.max())]:
             aggDF = aggFn(allResultsGrouped)
             aggDF.columns = [f"{opName}[{c}]" for c in aggDF.columns]
             aggDFs.append(aggDF)
         furtherAggsDF = pd.concat(aggDFs, axis=1)
-        furtherAggsDF = furtherAggsDF.loc[meanResults.index]  # apply same sort order (index is modelName)
+        furtherAggsDF = furtherAggsDF.loc[meanResultsDF.index]  # apply same sort order (index is modelName)
         columnOrder = functools.reduce(lambda a, b: a + b, [list(t) for t in zip(*[df.columns for df in aggDFs])])
         furtherAggsDF = furtherAggsDF[columnOrder]
         strFurtherAggs = f"Further aggregations:\n{furtherAggsDF.to_string()}"
@@ -558,4 +582,115 @@ def compareModels(self, modelFactories: Sequence[Callable[[], VectorModel]], use
                     evalStats = ClassificationEvalStatsCollection(evalStatsList).getGlobalStats()
                 plotCollector.createPlots(evalStats, subtitle=modelName, resultCollector=resultCollector)
 
-        return allResults, meanResults
+        if isRegression:
+            return RegressionMultiDataModelComparisonData(allResultsDF, meanResultsDF, furtherAggsDF, evalStatsByModelName)
+        else:
+            return ClassificationMultiDataModelComparisonData(allResultsDF, meanResultsDF, furtherAggsDF, evalStatsByModelName)
+
+
+class ModelComparisonData:
+    """
+    Holds the results of a model comparison: a data frame with the metrics of all models and the per-model result objects
+    """
+    @dataclass
+    class Result:
+        """
+        The result for a single model; compareModels sets evalData for simple evaluation and crossValData for cross-validation
+        """
+        evalData: Optional[Union[VectorClassificationModelEvaluationData, VectorRegressionModelEvaluationData]] = None
+        crossValData: Optional[Union[VectorClassificationModelCrossValidationData, VectorRegressionModelCrossValidationData]] = None
+
+    def __init__(self, resultsDF: pd.DataFrame, resultsByModelName: Dict[str, Result]):
+        """
+        :param resultsDF: a data frame containing the evaluation metrics of all models
+        :param resultsByModelName: a dictionary mapping each model name to the result object obtained for the model
+        """
+        self.resultsDF = resultsDF
+        self.resultByModelName = resultsByModelName
+
+
+class ModelComparisonVisitor(ABC):
+    """
+    Base class for visitors which may process the individual results of a model comparison
+    """
+    @abstractmethod
+    def visit(self, modelName: str, result: ModelComparisonData.Result):
+        """
+        Processes the result that was obtained for a single model
+
+        :param modelName: the name of the model
+        :param result: the result that was obtained for the model
+        """
+        pass
+
+
+class ModelComparisonVisitorAggregatedFeatureImportances(ModelComparisonVisitor):
+    """
+    During a model comparison, computes aggregated feature importance values for the model with the given name
+    """
+    def __init__(self, modelName: str):
+        """
+        :param modelName: the name of the model for which to compute the aggregated feature importance values
+        """
+        self.modelName = modelName
+        self.aggFeatureImportance = AggregatedFeatureImportances()
+
+    def visit(self, modelName: str, result: ModelComparisonData.Result):
+        if modelName == self.modelName:
+            if result.crossValData is not None:
+                models = result.crossValData.trainedModels
+                if models is not None:
+                    for model in models:
+                        self._collect(model)
+                else:
+                    raise ValueError("Models were not returned in cross-validation results")
+            elif result.evalData is not None:
+                self._collect(result.evalData.model)
+
+    def _collect(self, model):
+        if not hasattr(model, "getFeatureImportances"):
+            raise ValueError(f"Got model which does not have method 'getFeatureImportances': {model}")
+        self.aggFeatureImportance.add(model.getFeatureImportances())
+
+
+class MultiDataModelComparisonData(Generic[TEvalStats, TEvalStatsCollection], ABC):
+    """
+    Holds the results of a comparison of models across several data sets
+    """
+    def __init__(self, allResultsDF: pd.DataFrame, meanResultsDF: pd.DataFrame, aggResultsDF: pd.DataFrame,
+            evalStatsByModelName: Dict[str, List[TEvalStats]]):
+        """
+        :param allResultsDF: a data frame containing all the individual evaluation results
+        :param meanResultsDF: a data frame containing one row for each model with results averaged across data sets
+        :param aggResultsDF: a data frame containing further aggregations of the results for each model
+        :param evalStatsByModelName: a dictionary mapping each model name to the list of eval stats objects
+            that were collected for the model
+        """
+        self.allResultsDF = allResultsDF
+        self.meanResultsDF = meanResultsDF
+        self.aggResultsDF = aggResultsDF
+        self.evalStatsByModelName = evalStatsByModelName
+
+    def getModelNames(self) -> List[str]:
+        return list(self.evalStatsByModelName.keys())
+
+    def getEvalStatsList(self, modelName: str) -> List[TEvalStats]:
+        return self.evalStatsByModelName[modelName]
+
+    @abstractmethod
+    def getEvalStatsCollection(self, modelName: str) -> TEvalStatsCollection:
+        """
+        :param modelName: the name of the model
+        :return: a collection created from the eval stats objects that were collected for the given model
+        """
+        pass
+
+
+class ClassificationMultiDataModelComparisonData(MultiDataModelComparisonData[ClassificationEvalStats, ClassificationEvalStatsCollection]):
+    def getEvalStatsCollection(self, modelName: str) -> ClassificationEvalStatsCollection:
+        return ClassificationEvalStatsCollection(self.getEvalStatsList(modelName))
+
+
+class RegressionMultiDataModelComparisonData(MultiDataModelComparisonData[RegressionEvalStats, RegressionEvalStatsCollection]):
+    def getEvalStatsCollection(self, modelName: str) -> RegressionEvalStatsCollection:
+        return RegressionEvalStatsCollection(self.getEvalStatsList(modelName))
\ No newline at end of file
diff --git a/src/sensai/evaluation/evaluator.py b/src/sensai/evaluation/evaluator.py
index 8ad78414..38ebc67a 100644
--- a/src/sensai/evaluation/evaluator.py
+++ b/src/sensai/evaluation/evaluator.py
@@ -5,6 +5,7 @@
 
 import pandas as pd
 
+from .eval_stats import GUESS
 from .eval_stats.eval_stats_base import EvalStats, EvalStatsCollection
 from .eval_stats.eval_stats_classification import ClassificationEvalStats, ClassificationMetric
 from .eval_stats.eval_stats_regression import RegressionEvalStats, RegressionEvalStatsCollection, RegressionMetric
@@ -319,7 +320,7 @@ class VectorClassificationModelEvaluationData(VectorModelEvaluationData[Classifi
 class VectorClassificationModelEvaluatorParams(VectorModelEvaluatorParams):
     def __init__(self, dataSplitter: DataSplitter = None, fractionalSplitTestFraction: float = None, fractionalSplitRandomSeed=42,
             fractionalSplitShuffle=True, additionalMetrics: Sequence[ClassificationMetric] = None,
-            computeProbabilities: bool = False, binaryPositiveLabel=None):
+            computeProbabilities: bool = False, binaryPositiveLabel=GUESS):
         """
         :param dataSplitter: [if test data must be obtained via split] a splitter to use in order to obtain; if None, must specify
             fractionalSplitTestFraction for fractional split (default)
@@ -329,6 +330,8 @@ def __init__(self, dataSplitter: DataSplitter = None, fractionalSplitTestFractio
             splitting it
         :param additionalMetrics: additional metrics to apply
         :param computeProbabilities: whether to compute class probabilities
+        :param binaryPositiveLabel: the positive class label for binary classification; if GUESS, try to detect from labels;
+            if None, no detection (non-binary classification)
         """
         super().__init__(dataSplitter, fractionalSplitTestFraction=fractionalSplitTestFraction, fractionalSplitRandomSeed=fractionalSplitRandomSeed,
             fractionalSplitShuffle=fractionalSplitShuffle)
diff --git a/src/sensai/featuregen.py b/src/sensai/featuregen.py
index f9889c1f..009be4fd 100644
--- a/src/sensai/featuregen.py
+++ b/src/sensai/featuregen.py
@@ -32,7 +32,9 @@ def __init__(self, categoricalFeatureNames: Optional[Union[Sequence[str], str]]
                  normalisationRules: Sequence[data_transformation.DFTNormalisation.Rule] = (),
                  normalisationRuleTemplate: data_transformation.DFTNormalisation.RuleTemplate = None, addCategoricalDefaultRules=True):
         """
-        :param categoricalFeatureNames: either a sequence of column names or a regex that is to match all categorical feature names.
+        :param categoricalFeatureNames: either a sequence of column names or a regex that is to match all categorical feature names
+            (which must work only for the features generated by this feature generator, i.e. it should not match feature names
+            generated by other feature generators).
             It will be ensured that the respective columns in the generated data frames will have dtype 'category'.
             Furthermore, presence of meta-information can later be leveraged for further transformations, e.g. one-hot encoding.
         :param normalisationRules: Rules to be used by DFTNormalisation (e.g. for constructing an input transformer for a model).
diff --git a/src/sensai/geoanalytics/geo_clustering.py b/src/sensai/geoanalytics/geo_clustering.py
new file mode 100644
index 00000000..3a397bdb
--- /dev/null
+++ b/src/sensai/geoanalytics/geo_clustering.py
@@ -0,0 +1,93 @@
+import itertools
+import math
+from typing import List, Tuple
+
+import numpy as np
+
+from .geo_coords import GeoCoord
+from .local_coords import LocalCoordinateSystem
+from ..clustering import GreedyAgglomerativeClustering
+
+
+class GreedyAgglomerativeGeoCoordClusterer:
+    """
+    Clusters geographic coordinates by transforming them to a local coordinate system and applying
+    GreedyAgglomerativeClustering with merge costs that are based on squared distances between the local points
+    """
+    def __init__(self, maxMinDistanceForMergeM: float, maxDistanceM: float, minClusterSize: int):
+        """
+        :param maxMinDistanceForMergeM: the maximum distance, in metres, for the minimum distance between two existing clusters for a merge
+            to be admissible
+        :param maxDistanceM: the maximum distance, in metres, between any two points for the points to be allowed to be in the same cluster
+        :param minClusterSize: the minimum number of points any valid cluster must ultimately contain; the points in any smaller clusters
+            shall be considered as outliers
+        """
+        self.minClusterSize = minClusterSize
+        self.maxMinDistanceForMerge = maxMinDistanceForMergeM
+        self.squaredMaxMinDistanceForMerge = maxMinDistanceForMergeM * maxMinDistanceForMergeM
+        self.squaredMaxDistance = maxDistanceM * maxDistanceM
+        self.localPoints = None
+        self.clusters = None  # set by fitGeoCoords
+
+    class LocalPoint:
+        def __init__(self, xy: np.ndarray, idx: int):
+            self.idx = idx
+            self.xy = xy
+
+    class Cluster(GreedyAgglomerativeClustering.Cluster):
+        def __init__(self, point: "GreedyAgglomerativeGeoCoordClusterer.LocalPoint", clusterer: 'GreedyAgglomerativeGeoCoordClusterer'):
+            self.clusterer = clusterer
+            self.points = [point]
+
+        def mergeCost(self, other):
+            """
+            :param other: the cluster with which this cluster could be merged
+            :return: the minimum squared distance between the points of the two clusters if the merge is admissible, infinity otherwise
+            """
+            cartesianProduct = itertools.product(self.points, other.points)
+            minSquaredDistance = math.inf
+            for p1, p2 in cartesianProduct:
+                diff = p1.xy - p2.xy
+                squaredDistance = np.dot(diff, diff)
+                # a single pair of points that is too far apart rules out the merge
+                if squaredDistance > self.clusterer.squaredMaxDistance:
+                    return math.inf
+                else:
+                    minSquaredDistance = min(squaredDistance, minSquaredDistance)
+            if minSquaredDistance <= self.clusterer.squaredMaxMinDistanceForMerge:
+                return minSquaredDistance
+            return math.inf
+
+        def merge(self, other):
+            self.points += other.points
+
+    def fitGeoCoords(self, geoCoords: List[GeoCoord], lcs: LocalCoordinateSystem = None) -> None:
+        """
+        :param geoCoords: the coordinates to be clustered
+        :param lcs: the local coordinate system to use for clustering; if None, compute based on mean coordinates
+        """
+        if lcs is None:
+            meanCoord = GeoCoord.meanCoord(geoCoords)
+            lcs = LocalCoordinateSystem(meanCoord.lat, meanCoord.lon)
+        self.localPoints = [self.LocalPoint(np.array(lcs.getLocalCoords(p.lat, p.lon)), idx) for idx, p in enumerate(geoCoords)]
+        clusters = [self.Cluster(lp, self) for lp in self.localPoints]
+        clusters = GreedyAgglomerativeClustering(clusters).applyClustering()
+        self.clusters = clusters
+
+    def clustersIndices(self) -> Tuple[List[List[int]], List[int]]:
+        """
+        :return: a tuple (clusters, outliers), where clusters is a list of lists of original point indices where each inner list forms
+         a cluster and outliers is the list of indices of points not within a cluster
+        :raises RuntimeError: if fitGeoCoords has not been called beforehand
+        """
+        if self.clusters is None:
+            raise RuntimeError("No clusters available; call fitGeoCoords first")
+        outliers = []
+        clusters = []
+        for c in self.clusters:
+            indices = [p.idx for p in c.points]
+            if len(c.points) < self.minClusterSize:
+                outliers.extend(indices)
+            else:
+                clusters.append(indices)
+        return clusters, outliers
diff --git a/src/sensai/geoanalytics/geo_coords.py b/src/sensai/geoanalytics/geo_coords.py
index 93b78398..6878583b 100644
--- a/src/sensai/geoanalytics/geo_coords.py
+++ b/src/sensai/geoanalytics/geo_coords.py
@@ -3,14 +3,13 @@
 """
 
 import math
-from typing import Tuple
+from typing import Tuple, Iterable
 
+import numpy as np
 import pandas as pd
 
-from .local_coords import LocalCoordinateSystem
 from ..util.string import ToStringMixin
 
-
 EARTH_RADIUS = 6371000
 EARTH_CIRCUMFERENCE = 2 * math.pi * EARTH_RADIUS
 LATITUDE_PER_METRE = 360.0 / EARTH_CIRCUMFERENCE
@@ -158,6 +157,13 @@ def squaredDistanceTo(self, gpsPosition: 'GeoCoord'):
     def localCoords(self, lcs):
         return lcs.getLocalCoords(self.lat, self.lon)
 
+    @classmethod
+    def meanCoord(cls, geoCoords: Iterable["GeoCoord"]):
+        """Creates the coordinate whose latitude and longitude are the means of the given coordinates' latitudes and longitudes"""
+        coords = list(geoCoords)  # materialise once, as a one-shot iterable (e.g. a generator) cannot be traversed twice
+        # noinspection PyTypeChecker
+        return GeoCoord(np.mean([c.lat for c in coords]), np.mean([c.lon for c in coords]))
+
 
 class GpsTracePoint(GeoCoord):
     def __init__(self, lat, lon, time: pd.Timestamp):
@@ -177,6 +183,7 @@ def __init__(self, minLat: float, minLon: float, maxLat: float, maxLon: float):
     @staticmethod
     def fromCircle(centreLat, centreLon, radiusM):
         """Creates the bounding rectangle for the given circular area"""
+        from .local_coords import LocalCoordinateSystem
         lcs = LocalCoordinateSystem(centreLat, centreLon)
         minLat, minLon = lcs.getLatLon(-radiusM, -radiusM)
         maxLat, maxLon = lcs.getLatLon(radiusM, radiusM)
diff --git a/src/sensai/sklearn/sklearn_classification.py b/src/sensai/sklearn/sklearn_classification.py
index e32d7d9d..a57b80ae 100644
--- a/src/sensai/sklearn/sklearn_classification.py
+++ b/src/sensai/sklearn/sklearn_classification.py
@@ -1,5 +1,5 @@
 import logging
-from typing import Union, Optional
+from typing import Union, Optional, Dict
 
 import sklearn.ensemble
 import sklearn.naive_bayes
@@ -25,6 +25,9 @@ def __init__(self, min_samples_leaf=8, random_state=42, useComputedClassWeights=
             useComputedClassWeights=useComputedClassWeights,
             **modelArgs)
 
+    def getFeatureImportances(self) -> Dict[str, float]:
+        return {name: importance for name, importance in zip(self._modelInputVariableNames, self.model.feature_importances_)}
+
 
 class SkLearnMLPVectorClassificationModel(AbstractSkLearnVectorClassificationModel):
     def __init__(self, hidden_layer_sizes=(100,), activation: str = "relu",
diff --git a/src/sensai/sklearn/sklearn_util.py b/src/sensai/sklearn/sklearn_util.py
new file mode 100644
index 00000000..9fef82fd
--- /dev/null
+++ b/src/sensai/sklearn/sklearn_util.py
@@ -0,0 +1,55 @@
+import collections
+from typing import Dict, Union
+
+
+class AggregatedFeatureImportances:
+    """
+    Aggregates feature importance values from models that support method getFeatureImportances
+    (e.g. sklearn's RandomForest models and compatible models from lightgbm, etc.)
+
+    The dictionaries may either be flat (feature name -> value) or nested (target name -> feature name -> value);
+    which of the two applies is determined from the first dictionary that is added.
+    """
+    def __init__(self, *featureImportanceDicts: Union[Dict[str, float], Dict[str, Dict[str, float]]]):
+        """
+        :param featureImportanceDicts: dictionaries to add right away (each one is passed to method add)
+        """
+        self.aggDict = None
+        self._isNested = None
+        self._numDictsAdded = 0
+        for d in featureImportanceDicts:
+            self.add(d)
+
+    @staticmethod
+    def _isDict(x):
+        # duck-typed check: any object that has an attribute 'get' is treated as a dictionary
+        return hasattr(x, "get")
+
+    def add(self, featureImportance: Union[Dict[str, float], Dict[str, Dict[str, float]]]):
+        """
+        Adds the feature importance values from the given dictionary
+
+        :param featureImportance: the dictionary obtained via a model's getFeatureImportances method
+        """
+        if self._isNested is None:
+            self._isNested = self._isDict(next(iter(featureImportance.values())))
+        if self._isNested:
+            if self.aggDict is None:
+                self.aggDict = collections.defaultdict(lambda: collections.defaultdict(lambda: 0))
+            # the values must be accumulated for every dictionary added, not only for the first one
+            for targetName, d in featureImportance.items():
+                d: dict
+                for featureName, value in d.items():
+                    self.aggDict[targetName][featureName] += value
+        else:
+            if self.aggDict is None:
+                self.aggDict = collections.defaultdict(lambda: 0)
+            for featureName, value in featureImportance.items():
+                self.aggDict[featureName] += value
+        self._numDictsAdded += 1
+
+    def getFeatureImportanceSum(self) -> Union[Dict[str, float], Dict[str, Dict[str, float]]]:
+        """
+        :return: the dictionary containing the sums of the values that were added (None if no dictionary was added)
+        """
+        return self.aggDict
diff --git a/src/sensai/util/aggregation.py b/src/sensai/util/aggregation.py
index 12cf1307..e875a6d2 100644
--- a/src/sensai/util/aggregation.py
+++ b/src/sensai/util/aggregation.py
@@ -75,7 +75,7 @@ def _toStringObjectInfo(self):
         return ", ".join([f"{str(k)}: {v} ({v/self.totalCount:.3f})" for k, v in self.counts.items()])
 
 
-class WeightedMean:
+class WeightedMean(ToStringMixin):
     """
     Computes a weighted mean of values
     """
@@ -83,12 +83,15 @@ def __init__(self):
         self.weightedValueSum = 0
         self.weightSum = 0
 
-    def add(self, value, weight) -> None:
+    def _toStringObjectInfo(self) -> str:
+        return f"{self.weightedValueSum/self.weightSum}" if self.weightSum != 0 else "undefined"  # mean is undefined for zero weight sum
+
+    def add(self, value, weight=1) -> None:
         """
         Adds the given value with the the given weight to the calculation
 
         :param value: the value
-        :param weight: the weight with which to consider tha value
+        :param weight: the weight with which to consider the value
         """
         self.weightedValueSum += value * weight
         self.weightSum += weight
diff --git a/src/sensai/util/string.py b/src/sensai/util/string.py
index b7814508..ecebaa93 100644
--- a/src/sensai/util/string.py
+++ b/src/sensai/util/string.py
@@ -1,11 +1,11 @@
-from typing import Union, List, Dict, Any, Sequence, Iterable, Optional
+from typing import Union, List, Dict, Any, Sequence, Iterable, Optional, Mapping
 import re
 
 
 reCommaWhitespacePotentiallyBreaks = re.compile(r",\s+")
 
 
-def dictString(d: Dict, brackets: Optional[str] = None):
+def dictString(d: Mapping, brackets: Optional[str] = None):
     s = ', '.join([f'{k}={toString(v)}' for k, v in d.items()])
     if brackets is not None:
         return brackets[:1] + s + brackets[-1:]
diff --git a/src/sensai/util/time.py b/src/sensai/util/time.py
index af187bab..339a8c81 100644
--- a/src/sensai/util/time.py
+++ b/src/sensai/util/time.py
@@ -15,3 +15,27 @@ def timeOfDay(ts: pd.Timestamp) -> float:
     :return: the time of day as a floating point number in [0, 24)
     """
     return ts.hour + ts.minute / 60
+
+
+class TimeInterval:
+    def __init__(self, start: pd.Timestamp, end: pd.Timestamp):
+        self.start = start
+        self.end = end
+
+    def contains(self, t: pd.Timestamp):
+        return self.start <= t <= self.end
+
+    def overlapsWith(self, other: "TimeInterval") -> bool:
+        otherEndsBefore = other.end <= self.start
+        otherStartsAfter = other.start >= self.end
+        return not (otherEndsBefore or otherStartsAfter)
+
+    def intersection(self, other: "TimeInterval") -> "TimeInterval":
+        return TimeInterval(max(self.start, other.start), min(self.end, other.end))
+
+    def timeDelta(self) -> pd.Timedelta:
+        return self.end - self.start
+
+    def midTimestamp(self) -> pd.Timestamp:
+        midTime: pd.Timestamp = self.start + 0.5 * self.timeDelta()
+        return midTime
\ No newline at end of file

From 9952fec3a3b70fc03d1558b2c784a885fc022196 Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Wed, 18 May 2022 22:28:40 +0200
Subject: [PATCH 050/131] Order notebooks in index.rst by specifying inclusions
 explicitly, changed test_notebooks to only copy files included in index.rst

---
 docs/index.rst              | 10 ++++++++--
 notebooks/test_notebooks.py | 32 +++++++++++++++++++++++---------
 2 files changed, 31 insertions(+), 11 deletions(-)

diff --git a/docs/index.rst b/docs/index.rst
index fc5272ea..6d03c3a3 100644
--- a/docs/index.rst
+++ b/docs/index.rst
@@ -5,10 +5,16 @@ sensAI - the Python library for sensible AI
    :caption: Guides and Tutorials
    :glob:
 
-   *
+   intro.ipynb
+   intro_old.ipynb
+   tracking_experiments.ipynb
+   tensor_models_pytorch_lightning.ipynb
+   coordinate_clustering.ipynb
+   clustering_evaluation.ipynb
 
 ..
-  Above, we include notebooks, copied here by test_notebooks
+  Above, we can include any notebooks from ../notebooks; Within the build process, they will be copied
+  here by test_notebooks if they are referenced in this file.
 
 .. toctree::
    :caption: Modules
diff --git a/notebooks/test_notebooks.py b/notebooks/test_notebooks.py
index 52948be9..af304e51 100644
--- a/notebooks/test_notebooks.py
+++ b/notebooks/test_notebooks.py
@@ -1,17 +1,28 @@
 import logging
 import os
+import pathlib
+import re
 
 import nbformat
 import pytest
 from nbconvert.preprocessors import ExecutePreprocessor
 
-NOTEBOOKS_DIR = "notebooks"
-DOCS_DIR = "docs"
-resources = {"metadata": {"path": NOTEBOOKS_DIR}}
 
+ROOT_DIR = pathlib.Path(__file__).parent.parent.absolute()
+DOCS_DIR = ROOT_DIR / "docs"
+NOTEBOOKS_DIR = ROOT_DIR / "notebooks"
 log = logging.getLogger(__name__)
 
 
+def notebooksUsedInDocs():
+    with open(ROOT_DIR / "docs/index.rst", "r") as f:
+        content = f.read()
+    return re.findall(r"\s(\w+\.ipynb)", content)
+
+
+NOTEBOOKS_TO_COPY = notebooksUsedInDocs()
+
+
 class LoggingExecutePreprocessor(ExecutePreprocessor):
     def __init__(self, notebookName, **kw):
         self._notebookName = notebookName
@@ -26,15 +37,18 @@ def preprocess_cell(self, cell, resources, index):
     "notebook", [file for file in os.listdir(NOTEBOOKS_DIR) if file.endswith(".ipynb")]
 )
 def test_notebook(notebook):
-    notebook_path = os.path.join(NOTEBOOKS_DIR, notebook)
+    notebook_path = NOTEBOOKS_DIR / notebook
     log.info(f"Reading jupyter notebook from {notebook_path}")
     with open(notebook_path) as f:
         nb = nbformat.read(f, as_version=4)
     ep = LoggingExecutePreprocessor(notebook, timeout=600)
-    ep.preprocess(nb, resources=resources)
+    ep.preprocess(nb, resources={"metadata": {"path": str(NOTEBOOKS_DIR)}})
 
     # saving the executed notebook to docs
-    output_path = os.path.join(DOCS_DIR, notebook)
-    log.info(f"Saving executed notebook to {output_path} for documentation purposes")
-    with open(output_path, "w", encoding="utf-8") as f:
-        nbformat.write(nb, f)
+    if notebook in NOTEBOOKS_TO_COPY:
+        output_path = os.path.join(DOCS_DIR, notebook)
+        log.info(f"Saving executed notebook to {output_path} for documentation purposes")
+        with open(output_path, "w", encoding="utf-8") as f:
+            nbformat.write(nb, f)
+    else:
+        log.info(f"Notebook {notebook} is not used in docs; not copied")
\ No newline at end of file

From 1d6fa1d4e3c4d1eb56074adaa4d9b6804703f8e2 Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Wed, 18 May 2022 23:08:39 +0200
Subject: [PATCH 051/131] Fixed reference to renamed function (aggStats ->
 aggMetricsDict)

---
 src/sensai/evaluation/eval_util.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/sensai/evaluation/eval_util.py b/src/sensai/evaluation/eval_util.py
index 83827a4d..5e7a812c 100644
--- a/src/sensai/evaluation/eval_util.py
+++ b/src/sensai/evaluation/eval_util.py
@@ -334,7 +334,7 @@ def compareModels(self, models: Sequence[TModel], resultWriter: Optional[ResultW
                 modelResult = ModelComparisonData.Result(crossValData=crossValData)
                 resultByModelName[modelName] = modelResult
                 evalStatsCollection = crossValData.getEvalStatsCollection()
-                statsDict = evalStatsCollection.aggStats()
+                statsDict = evalStatsCollection.aggMetricsDict()
             else:
                 evalData = self.performSimpleEvaluation(model, resultWriter=resultWriter if writeIndividualResults else None,
                     fitModel=fitModels)

From bc9ad45c4bb43185555fa8567d7c65d1b828017a Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Wed, 18 May 2022 23:12:14 +0200
Subject: [PATCH 052/131] Extended intro notebook

---
 notebooks/intro.ipynb | 60 ++++++++++++++++++++++++++++++++++++++-----
 1 file changed, 53 insertions(+), 7 deletions(-)

diff --git a/notebooks/intro.ipynb b/notebooks/intro.ipynb
index fa43e219..a7d63d90 100644
--- a/notebooks/intro.ipynb
+++ b/notebooks/intro.ipynb
@@ -23,7 +23,8 @@
    "metadata": {},
    "outputs": [],
    "source": [
-    "import sensai"
+    "import sensai\n",
+    "import numpy as np"
    ]
   },
   {
@@ -32,9 +33,9 @@
    "source": [
     "## Logging\n",
     "\n",
-    "sensAI will log relevant activies and inform you about ongoing processes as well as results via the log. It is therefore highly recommended that you enable logging when using sensAI.\n",
+    "sensAI will log relevant activities and inform about ongoing processes as well as results via the log. It is therefore highly recommended that logging be enabled when using sensAI.\n",
     "\n",
-    "sensAI provides a `logging` module which includes Python's standard logging module and adds some additional functionality. To enable logging, simply use the `configureLogging` function.\n"
+    "sensAI provides a `logging` module which includes Python's standard logging module and adds some additional functionality. To enable logging, simply use its `configureLogging` function.\n"
    ]
   },
   {
@@ -154,7 +155,8 @@
    "metadata": {},
    "outputs": [],
    "source": [
-    "randomForestModel = sensai.sklearn.classification.SkLearnRandomForestVectorClassificationModel(min_samples_leaf=2)"
+    "randomForestModel = sensai.sklearn.classification.SkLearnRandomForestVectorClassificationModel(\n",
+    "    min_samples_leaf=2).withName(\"RandomForest\")"
    ]
   },
   {
@@ -466,10 +468,54 @@
    "metadata": {},
    "outputs": [],
    "source": [
-    "evalUtil.compareModels([\n",
-    "        randomForestModel.withName(\"RandomForest\"), \n",
+    "results = evalUtil.compareModels([\n",
+    "        randomForestModel, \n",
     "        sensai.sklearn.classification.SkLearnDecisionTreeVectorClassificationModel(min_samples_leaf=2).withName(\"DecisionTree\")], \n",
-    "    useCrossValidation=False);"
+    "    useCrossValidation=True)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "In addition to the data frame with the aggregated metrics, which was already printed to the log, the results object contains all the data that was generated during the evaluation. We can, for example, use it to plot the distribution of one of the metrics across all the folds for one of our models."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "display(results.resultsDF)\n",
+    "\n",
+    "escRandomForest = results.resultByModelName[\"RandomForest\"].crossValData.getEvalStatsCollection()\n",
+    "escRandomForest.plotDistribution(\"accuracy\", bins=np.linspace(0,1,21), stat=\"count\", kde=False);\n"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "We can also compute additional aggregations or inspect the full list of metrics."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "escRandomForest.aggMetricsDict(aggFns=[np.max, np.min])"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "escRandomForest.getValues(\"accuracy\")"
    ]
   }
  ],

From 2a6cdd3732830e44568e3f5df6c225f90ae6cc4b Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Wed, 18 May 2022 23:40:15 +0200
Subject: [PATCH 053/131] Raised minimum seaborn version to 0.11 (for histplot,
 new displot)

---
 requirements-relaxed.txt | 5 ++---
 requirements.txt         | 2 +-
 2 files changed, 3 insertions(+), 4 deletions(-)

diff --git a/requirements-relaxed.txt b/requirements-relaxed.txt
index 645eba2e..b496490c 100644
--- a/requirements-relaxed.txt
+++ b/requirements-relaxed.txt
@@ -1,8 +1,7 @@
-# sensAI main requirements
-# This is a relaxed version with lower bounds, which exists only for inclusion in environment.yml (developer environment)
+# this is a relaxed version of requirements.txt where newer versions are allowed
 pandas>=1.0.0
 scipy>=1.4
 numpy>=1.18.0
 scikit-learn>=0.22.0
-seaborn>=0.10.0
+seaborn>=0.11.0
 typing-extensions>=3.7
diff --git a/requirements.txt b/requirements.txt
index 965c93f6..86cccaa9 100644
--- a/requirements.txt
+++ b/requirements.txt
@@ -4,5 +4,5 @@ pandas~=1.0.0
 scipy~=1.4
 numpy~=1.18.0
 scikit-learn~=0.22.0
-seaborn~=0.10.0
+seaborn~=0.11.0
 typing-extensions~=3.7

From d9fa1bb56fec554471c0eab4442ace5c45e0b385 Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Thu, 19 May 2022 21:46:46 +0200
Subject: [PATCH 054/131] Added section on VectorModel

---
 notebooks/intro.ipynb | 14 ++++++++++++--
 1 file changed, 12 insertions(+), 2 deletions(-)

diff --git a/notebooks/intro.ipynb b/notebooks/intro.ipynb
index a7d63d90..cdc8dd6f 100644
--- a/notebooks/intro.ipynb
+++ b/notebooks/intro.ipynb
@@ -53,7 +53,17 @@
    "cell_type": "markdown",
    "metadata": {},
    "source": [
-    "To additionally write log output to a file, use the function `logging.addFileLogger`."
+    "To additionally write log output to a file, use the function `logging.addFileLogger`.\n",
+    "\n",
+    "## VectorModels\n",
+    "\n",
+    "The central base class for supervised learning problems in sensAI is `VectorModel`. A VectorModel is any model which operates on data points that can be represented as vectors of data. Here, vector is to be understood not in the mathematical sense but in the computer science sense, where a vector is simply an array of (potentially arbitrarily complex) data. (The mathematical equivalent is a tuple.) Models are typically expected to be able to process more than one data point at a time and thus should be able to process a sequence of vectors. \n",
+    "\n",
+    "We use pandas DataFrames to represent such sequences of data points. Note that pandas DataFrames are not limited to primitive data types but can hold arbitrary objects in every cell. When dealing with a large number of inputs, DataFrames also provide at least limited meta-information in the form of column names, so we do not lose track of what is contained in which element of a data point (vector).\n",
+    "\n",
+    "VectorModel itself is an abstract base class, which provides a lot of useful functionality that all its specialisations inherit (as we will see later, particularly in the more advanced tutorials). The class is specialised in `VectorClassificationModel` and `VectorRegressionModel`, which in turn are specialised for various machine learning frameworks (such as sklearn and PyTorch) or can be directly subclassed to create your own model. \n",
+    "\n",
+    "In this tutorial, we will be dealing with a classification problem. Therefore, we will apply subclasses of `VectorClassificationModel` such as `SkLearnRandomForestVectorClassificationModel`. As an sklearn classification model which uses a well-defined training and inference interface, the implementation of the class is essentially just a few lines of code (given the intermediate abstraction `AbstractSkLearnVectorClassificationModel` for all classification models that use the sklearn protocol)."
    ]
   },
   {
@@ -100,7 +110,7 @@
    "cell_type": "markdown",
    "metadata": {},
    "source": [
-    "When working with sensAI, we typically use a DataFrame such as this as the starting point. DataFrames are a good basis, because they provide much-needed meta-data in the form of column names and as such provide a more well-defined interface for learning and inference than raw numpy arrays.\n",
+    "When working with sensAI, we typically use DataFrames such as this as the starting point.\n",
     "\n",
     "We create an instance of **InputOutputData** from the two data frames."
    ]

From 4a5db6aadabfc0dacd330c30f614642df736010e Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Thu, 19 May 2022 23:13:33 +0200
Subject: [PATCH 055/131] Added InputOutputData.fromDataFrame

---
 src/sensai/data.py | 11 +++++++++++
 1 file changed, 11 insertions(+)

diff --git a/src/sensai/data.py b/src/sensai/data.py
index d8166ccc..635438e9 100644
--- a/src/sensai/data.py
+++ b/src/sensai/data.py
@@ -57,6 +57,17 @@ class InputOutputData(BaseInputOutputData[pd.DataFrame]):
     def __init__(self, inputs: pd.DataFrame, outputs: pd.DataFrame):
         super().__init__(inputs, outputs)
 
+    @classmethod
+    def fromDataFrame(cls, df: pd.DataFrame, *outputColumns: str) -> "InputOutputData":
+        """
+        :param df: a data frame containing both input and output columns
+        :param outputColumns: the output column name(s)
+        :return: an InputOutputData instance with inputs and outputs separated
+        """
+        inputs = df[[c for c in df.columns if c not in outputColumns]]
+        outputs = df[list(outputColumns)]
+        return cls(inputs, outputs)
+
     def filterIndices(self, indices: Sequence[int]) -> __qualname__:
         inputs = self.inputs.iloc[indices]
         outputs = self.outputs.iloc[indices]

From eed896316d97f35dcb7aae580a9e92bd7cfc7bfa Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Thu, 19 May 2022 23:29:10 +0200
Subject: [PATCH 056/131] MultiLayerPerceptronTorchModel: Allow to override
 inputDim determined from data frame

MultiLayerPerceptronVector*Model:
  * Use NormalisationMode.NONE as default
  * Added inputDim as optional parameter
  * Fixed warning pertaining to log_softmax usage without specifying dim by using
    ActivationFunction enum
---
 .../torch/torch_models/mlp/mlp_models.py      | 28 ++++++++++++++-----
 1 file changed, 21 insertions(+), 7 deletions(-)

diff --git a/src/sensai/torch/torch_models/mlp/mlp_models.py b/src/sensai/torch/torch_models/mlp/mlp_models.py
index dae5bf73..f1caec26 100644
--- a/src/sensai/torch/torch_models/mlp/mlp_models.py
+++ b/src/sensai/torch/torch_models/mlp/mlp_models.py
@@ -14,15 +14,25 @@
 
 class MultiLayerPerceptronTorchModel(VectorTorchModel):
     def __init__(self, cuda: bool, hiddenDims: Sequence[int], hidActivationFunction: Callable[[torch.Tensor], torch.Tensor],
-            outputActivationFunction: Optional[Callable[[torch.Tensor], torch.Tensor]], pDropout: Optional[float] = None) -> None:
+            outputActivationFunction: Optional[Callable[[torch.Tensor], torch.Tensor]], pDropout: Optional[float] = None,
+            inputDim: Optional[int] = None) -> None:
+        """
+        :param cuda: whether to enable CUDA
+        :param hiddenDims: the sequence of hidden layer dimensions
+        :param hidActivationFunction: the activation function for hidden layers
+        :param outputActivationFunction: the output activation function
+        :param pDropout: the dropout probability for training
+        :param inputDim: the input dimension; if None, use dimensions determined by the input data (number of columns in data frame)
+        """
         super().__init__(cuda=cuda)
         self.hidActivationFunction = ActivationFunction.torchFunctionFromAny(hidActivationFunction)
         self.outputActivationFunction = ActivationFunction.torchFunctionFromAny(outputActivationFunction)
         self.hiddenDims = hiddenDims
         self.pDropout = pDropout
+        self.overrideInputDim = inputDim
 
     def createTorchModuleForDims(self, inputDim: int, outputDim: int) -> torch.nn.Module:
-        return MultiLayerPerceptron(inputDim, outputDim, self.hiddenDims,
+        return MultiLayerPerceptron(inputDim if self.overrideInputDim is None else self.overrideInputDim, outputDim, self.hiddenDims,
             hidActivationFn=self.hidActivationFunction, outputActivationFn=self.outputActivationFunction,
             pDropout=self.pDropout)
 
@@ -30,13 +40,15 @@ def createTorchModuleForDims(self, inputDim: int, outputDim: int) -> torch.nn.Mo
 class MultiLayerPerceptronVectorRegressionModel(TorchVectorRegressionModel):
     def __init__(self, hiddenDims: Sequence[int] = (5, 5), hidActivationFunction: Callable[[torch.Tensor], torch.Tensor] = torch.sigmoid,
             outputActivationFunction: Optional[Callable[[torch.Tensor], torch.Tensor]] = None,
-            normalisationMode: NormalisationMode = NormalisationMode.MAX_BY_COLUMN,
+            inputDim: Optional[int] = None,
+            normalisationMode: NormalisationMode = NormalisationMode.NONE,
             cuda: bool = True, pDropout: Optional[float] = None, nnOptimiserParams: Optional[NNOptimiserParams] = None,
             **nnOptimiserDictParams) -> None:
         """
         :param hiddenDims: sequence containing the number of neurons to use in hidden layers
         :param hidActivationFunction: the activation function (torch.nn.functional.* or torch.*) to use for all hidden layers
         :param outputActivationFunction: the output activation function (torch.nn.functional.* or torch.* or None)
+        :param inputDim: the input dimension; if None, use dimensions determined by the input data (number of columns in data frame)
         :param normalisationMode: the normalisation mode to apply to input and output data
         :param cuda: whether to use CUDA (GPU acceleration)
         :param pDropout: the probability with which to apply dropouts after each hidden layer
@@ -45,19 +57,21 @@ def __init__(self, hiddenDims: Sequence[int] = (5, 5), hidActivationFunction: Ca
         """
         nnOptimiserParams = NNOptimiserParams.fromEitherDictOrInstance(nnOptimiserDictParams, nnOptimiserParams)
         super().__init__(MultiLayerPerceptronTorchModel, [cuda, hiddenDims, hidActivationFunction, outputActivationFunction],
-                dict(pDropout=pDropout), normalisationMode, nnOptimiserParams)
+                dict(pDropout=pDropout, inputDim=inputDim), normalisationMode, nnOptimiserParams)
 
 
 class MultiLayerPerceptronVectorClassificationModel(TorchVectorClassificationModel):
     def __init__(self, hiddenDims: Sequence[int] = (5, 5),
             hidActivationFunction: Callable[[torch.Tensor], torch.Tensor] = torch.sigmoid,
-            outputActivationFunction: Optional[Union[Callable[[torch.Tensor], torch.Tensor], str, ActivationFunction]] = torch.nn.functional.log_softmax,
-            normalisationMode: NormalisationMode = NormalisationMode.MAX_BY_COLUMN, cuda: bool = True, pDropout: Optional[float] = None,
+            outputActivationFunction: Optional[Union[Callable[[torch.Tensor], torch.Tensor], str, ActivationFunction]] = ActivationFunction.LOG_SOFTMAX,
+            inputDim: Optional[int] = None,
+            normalisationMode: NormalisationMode = NormalisationMode.NONE, cuda: bool = True, pDropout: Optional[float] = None,
             nnOptimiserParams: Optional[NNOptimiserParams] = None, **nnOptimiserDictParams) -> None:
         """
         :param hiddenDims: sequence containing the number of neurons to use in hidden layers
         :param hidActivationFunction: the activation function (torch.nn.functional.* or torch.*) to use for all hidden layers
         :param outputActivationFunction: the output activation function (function from torch.nn.functional.*, function name, enum instance or None)
+        :param inputDim: the input dimension; if None, use dimensions determined by the input data (number of columns in data frame)
         :param normalisationMode: the normalisation mode to apply to input and output data
         :param cuda: whether to use CUDA (GPU acceleration)
         :param pDropout: the probability with which to apply dropouts after each hidden layer
@@ -67,4 +81,4 @@ def __init__(self, hiddenDims: Sequence[int] = (5, 5),
         nnOptimiserParams = NNOptimiserParams.fromEitherDictOrInstance(nnOptimiserDictParams, nnOptimiserParams)
         outputMode = ClassificationOutputMode.forActivationFn(ActivationFunction.torchFunctionFromAny(outputActivationFunction))
         super().__init__(outputMode, MultiLayerPerceptronTorchModel, [cuda, hiddenDims, hidActivationFunction, outputActivationFunction],
-            dict(pDropout=pDropout), normalisationMode, nnOptimiserParams)
+            dict(pDropout=pDropout, inputDim=inputDim), normalisationMode, nnOptimiserParams)

From ae99cf7b1977124b7f9827a0dd04932fdf6ec31f Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Thu, 19 May 2022 23:31:35 +0200
Subject: [PATCH 057/131] Ignore temp*.py

---
 .gitignore | 1 +
 1 file changed, 1 insertion(+)

diff --git a/.gitignore b/.gitignore
index 901772ba..83eac1fa 100644
--- a/.gitignore
+++ b/.gitignore
@@ -12,6 +12,7 @@ docs/sensai
 dist
 *.egg-info*
 /temp
+/temp*.py
 /default_console.py
 /build
 /git-split.sh

From 0da490b017dc53927119aab65ab3604bc93d9105 Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Fri, 20 May 2022 01:58:57 +0200
Subject: [PATCH 058/131] TorchModel: Exclude private members from toString;
 improved docstrings

---
 src/sensai/torch/torch_base.py | 12 +++++++++++-
 1 file changed, 11 insertions(+), 1 deletion(-)

diff --git a/src/sensai/torch/torch_base.py b/src/sensai/torch/torch_base.py
index fabb16af..c845a97e 100644
--- a/src/sensai/torch/torch_base.py
+++ b/src/sensai/torch/torch_base.py
@@ -109,6 +109,9 @@ def __init__(self, cuda=True) -> None:
         self.trainingInfo: Optional[TrainingInfo] = None
         self._gpu: Optional[int] = None
 
+    def _toStringExcludePrivate(self) -> bool:
+        return True
+
     def setTorchModule(self, module: torch.nn.Module) -> None:
         self.module = module
 
@@ -352,6 +355,13 @@ def createTorchModule(self) -> torch.nn.Module:
 
     @abstractmethod
     def createTorchModuleForDims(self, inputDim: int, outputDim: int) -> torch.nn.Module:
+        """
+        :param inputDim: the number of input dimensions as reported by the data set provider (number of columns
+            in input data frame for default providers)
+        :param outputDim: the number of output dimensions as reported by the data set provider (number of columns
+            in output data frame for default providers)
+        :return: the torch module
+        """
         pass
 
 
@@ -510,7 +520,7 @@ def __init__(self, outputMode: ClassificationOutputMode,
             nnOptimiserParams: Union[dict, NNOptimiserParams, None] = None) -> None:
         """
         :param outputMode: specifies the nature of the output of the underlying neural network model
-        :param modelClass: the constructor with which to create the wrapped torch vector model
+        :param modelClass: the constructor with which to create the wrapped torch model
         :param modelArgs: the constructor argument list to pass to modelClass
         :param modelKwArgs: the dictionary of constructor keyword arguments to pass to modelClass
         :param normalisationMode: the normalisation mode to apply to input data frames

From 619cab86b6edb45cb1dce4a325aefee31aa866ce Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Fri, 20 May 2022 01:59:58 +0200
Subject: [PATCH 059/131] ClassificationOutputMode.forActivationFn: Support
 ActivationFunction enum argument; Improved type annotation

---
 src/sensai/torch/torch_enums.py | 8 ++++++--
 1 file changed, 6 insertions(+), 2 deletions(-)

diff --git a/src/sensai/torch/torch_enums.py b/src/sensai/torch/torch_enums.py
index 3025b725..c8f6b899 100644
--- a/src/sensai/torch/torch_enums.py
+++ b/src/sensai/torch/torch_enums.py
@@ -20,7 +20,7 @@ def fromName(cls, name) -> "ActivationFunction":
                 return item
         raise ValueError(f"No function found for name '{name}'")
 
-    def getTorchFunction(self) -> Callable:
+    def getTorchFunction(self) -> Optional[Callable]:
         return {
                 ActivationFunction.NONE: None,
                 ActivationFunction.SIGMOID: F.sigmoid,
@@ -62,9 +62,13 @@ class ClassificationOutputMode(Enum):
     UNNORMALISED_LOG_PROBABILITIES = "unnormalised_log_probabilities"
 
     @classmethod
-    def forActivationFn(cls, fn: Optional[Callable]):
+    def forActivationFn(cls, fn: Optional[Union[Callable, ActivationFunction]]):
+        if isinstance(fn, ActivationFunction):
+            fn = fn.getTorchFunction()
         if fn is None:
             return cls.UNNORMALISED_LOG_PROBABILITIES
+        if not callable(fn):
+            raise ValueError(fn)
         if isinstance(fn, functools.partial):
             fn = fn.func
         name = fn.__name__

From 54ffb39e0e0e78f2e4d356895e7131dbad2c4b25 Mon Sep 17 00:00:00 2001
From: Dominik Jain <dominik.jain@jambit.com>
Date: Tue, 24 May 2022 14:15:23 +0200
Subject: [PATCH 060/131] Sync pjm

  commit 378ba01d67c0337dc70b701f6c0090ec5c8a8c00
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Tue May 24 14:12:03 2022 +0200

      ModelComparisonVisitorAggregatedFeatureImportances.plotFeatureImportance: Account for
        * long feature names (-> horizontal bars, tight layout)
        * large number of features (-> dynamic height)

  sensai/evaluation/eval_util.py

  commit f0ff85ab9d249234a6b8e3434984a66b7870a5c2
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Tue May 24 14:10:27 2022 +0200

      Added default figure size constant

  sensai/util/plot.py

  commit c58b7e32db447b1785e7da998c6255e8dfcc2366
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Tue May 24 13:26:06 2022 +0200

      Added plot collection to ModelComparisonVisitor, implemented it in subclasses
      and applied in MultiDataEvaluationUtil

  sensai/evaluation/eval_util.py

  commit f2c043e63f90239861e69ff139eac4ad1e386ffc
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Tue May 24 12:18:33 2022 +0200

      Added interface FeatureImportanceProvider

  sensai/evaluation/eval_util.py
  sensai/feature_importance.py
  sensai/lightgbm.py
  sensai/sklearn/sklearn_classification.py
  sensai/sklearn/sklearn_regression.py

  commit adbc2a886e87508234069677b8f856b0a626a49f
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Tue May 24 12:04:01 2022 +0200

      Moved module sklearn_util, which deals only with feature importance, to root as feature_importance

  sensai/evaluation/eval_util.py
  sensai/feature_importance.py

  commit 6483ed12abe748dc228ebabe6ed25edaf5d261cd
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Tue May 24 12:01:55 2022 +0200

      MultiDataEvaluationUtil: Take into account that the metric column name used for sorting may not include the aggregation 'mean[*]'

  sensai/evaluation/eval_util.py

  commit 99e6b12739a7cad39950a8cb938f6918561369f1
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Tue May 24 11:07:28 2022 +0200

      Added metrics:
        * ClassificationMetricAccuracyMaxProbabilityBeyondThreshold
        * ClassificationMetricRelFreqMaxProbabilityBeyondThreshold

  sensai/evaluation/eval_stats/eval_stats_classification.py

  commit 961a58ada9ad52390d99c800a66c7aaf2e250536
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Tue May 24 09:37:33 2022 +0200

      ClassificationEvalStatsCollection: Fixed problem combining EvalStats instances with different set of classes

  sensai/evaluation/eval_stats/eval_stats_classification.py

  commit 6622c2c78d533b1e0bf10d6f5364d3e150eed187
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Mon May 23 14:29:21 2022 +0200

      LightGBM: Fixed categorical features now being required to be specified as
      an argument to the fit method (when using the sklearn-style interface) as
      the model argument is overridden by a default value in the sklearn interface

  sensai/lightgbm.py
  sensai/sklearn/sklearn_base.py

  commit c565bd8dea8bd94f2e34c2f396b6356d6237e8ad
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Mon May 23 14:13:35 2022 +0200

      AbstractSkLearnVectorClassificationModel: Fixed _transformInput losing all data frame meta-data
      (e.g. category columns) even if no sklearn input transformer was specified

  sensai/sklearn/sklearn_base.py

  commit 561d321bceb96795b5cabdd0e7723956a52f5c73
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Mon May 23 14:00:37 2022 +0200

      Improved type annotations and docstrings

  sensai/lightgbm.py

  commit eabb5dffb33d7b0bda41f30994156c7402386f01
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Mon May 23 13:18:46 2022 +0200

      PickleCached: Avoid substring '<locals>' in filenames (not supported under Windows)

  sensai/util/cache.py

  commit 5b0f753251201f6db57fe74e80efd20a3964b58c
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Mon May 23 12:06:38 2022 +0200

      Improved docstrings

  sensai/featuregen.py

  commit eaedda59abfe842911f426fc0d1e040f91a14ff0
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Mon May 23 10:51:24 2022 +0200

      Extracted abstraction GeoCoordClusterer from agglomerative clusterer,
      adding new specialisations SkLearnGeoCoordClusterer (abstract) and
      DBSCANGeoCoordClusterer (concrete)

  sensai/geoanalytics/geo_clustering.py

  commit 02c2a534a79ea5eaaf2e33dd1abb5fbd68cfc072
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Mon May 23 10:35:34 2022 +0200

      Fixed spelling in xgboost classifier class names (breaking change)

  sensai/xgboost.py

  commit 4afa40cd48316014cf8f2ebcd1ed75c0cbccbaa0
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Fri May 20 17:54:50 2022 +0200

      PickleCached: Allow full filename specification for case with arguments

  sensai/util/cache.py
---
 .../eval_stats/eval_stats_classification.py   | 69 +++++++++++--
 src/sensai/evaluation/eval_util.py            | 50 ++++++++--
 .../sklearn_util.py => feature_importance.py} | 24 ++++-
 src/sensai/featuregen.py                      | 23 +++--
 src/sensai/geoanalytics/geo_clustering.py     | 97 ++++++++++++++++---
 src/sensai/lightgbm.py                        | 51 +++++-----
 src/sensai/sklearn/sklearn_base.py            | 77 +++++++++------
 src/sensai/sklearn/sklearn_classification.py  |  6 +-
 src/sensai/sklearn/sklearn_regression.py      |  6 +-
 src/sensai/util/cache.py                      | 23 +++--
 src/sensai/util/plot.py                       |  3 +
 src/sensai/xgboost.py                         |  4 +-
 12 files changed, 327 insertions(+), 106 deletions(-)
 rename src/sensai/{sklearn/sklearn_util.py => feature_importance.py} (60%)

diff --git a/src/sensai/evaluation/eval_stats/eval_stats_classification.py b/src/sensai/evaluation/eval_stats/eval_stats_classification.py
index 9497b9f4..f81db0ad 100644
--- a/src/sensai/evaluation/eval_stats/eval_stats_classification.py
+++ b/src/sensai/evaluation/eval_stats/eval_stats_classification.py
@@ -1,20 +1,19 @@
+import logging
 from abc import ABC, abstractmethod
-from dataclasses import dataclass
 from typing import List, Sequence, Optional, Dict
-import logging
 
-from matplotlib import pyplot as plt
 import numpy as np
 import pandas as pd
 import sklearn
+from matplotlib import pyplot as plt
 from sklearn.metrics import confusion_matrix, accuracy_score, precision_score, recall_score, precision_recall_curve, PrecisionRecallDisplay, \
     balanced_accuracy_score, f1_score
 
-from .eval_stats_base import PredictionArray, PredictionEvalStats, EvalStatsCollection, Metric, EvalStatsPlot, TEvalStats
+from .eval_stats_base import PredictionArray, PredictionEvalStats, EvalStatsCollection, Metric, EvalStatsPlot
+from ...util.aggregation import RelativeFrequencyCounter
 from ...util.pickle import getstate
 from ...util.plot import plotMatrix
 
-
 log = logging.getLogger(__name__)
 
 
@@ -86,6 +85,58 @@ def _computeValue(self, y_true, y_predicted, y_predictedClassProbabilities):
         return cnt / len(y_true)
 
 
+class ClassificationMetricAccuracyMaxProbabilityBeyondThreshold(ClassificationMetric):
+    """
+    Accuracy limited to cases where the probability of the most likely class is at least a given threshold
+    """
+    requiresProbabilities = True
+
+    def __init__(self, threshold: float, zeroValue=0.0):
+        """
+        :param threshold: minimum probability of the most likely class
+        :param zeroValue: the value of the metric for the case where the probability of the most likely class never reaches the threshold
+        """
+        self.threshold = threshold
+        self.zeroValue = zeroValue
+        super().__init__(name=f"accuracy[p_max >= {threshold}]")
+
+    def _computeValue(self, y_true, y_predicted, y_predictedClassProbabilities):
+        labels = y_predictedClassProbabilities.columns
+        labelToColIdx = {l: i for i, l in enumerate(labels)}
+        relFreq = RelativeFrequencyCounter()
+        for i, probabilities in enumerate(y_predictedClassProbabilities.values.tolist()):
+            classIdx_predicted = np.argmax(probabilities)
+            prob_predicted = probabilities[classIdx_predicted]
+            if prob_predicted >= self.threshold:
+                classIdx_true = labelToColIdx[y_true[i]]
+                relFreq.count(classIdx_predicted == classIdx_true)
+        if relFreq.numTotal == 0:
+            return self.zeroValue
+        else:
+            return relFreq.getRelativeFrequency()
+
+
+class ClassificationMetricRelFreqMaxProbabilityBeyondThreshold(ClassificationMetric):
+    """
+    Relative frequency of cases where the probability of the most likely class is at least a given threshold
+    """
+    requiresProbabilities = True
+
+    def __init__(self, threshold: float):
+        """
+        :param threshold: minimum probability of the most likely class
+        """
+        self.threshold = threshold
+        super().__init__(name=f"relFreq[p_max >= {threshold}]")
+
+    def _computeValue(self, y_true, y_predicted, y_predictedClassProbabilities):
+        relFreq = RelativeFrequencyCounter()
+        for probabilities in y_predictedClassProbabilities.values.tolist():
+            pMax = np.max(probabilities)  # probability of the most likely class for this data point
+            relFreq.count(pMax >= self.threshold)
+        return relFreq.getRelativeFrequency()
+
+
 class BinaryClassificationMetric(ClassificationMetric, ABC):
     def __init__(self, positiveClassLabel, name: str = None):
         name = name if name is not None else self.__class__.name
@@ -176,7 +227,7 @@ def __init__(self, y_predicted: PredictionArray = None,
         if self._probabilitiesAvailable:
             colSet = set(y_predictedClassProbabilities.columns)
             if colSet != set(labels):
-                raise ValueError(f"Set of columns in class probabilities data frame ({colSet}) does not correspond to labels ({labels}")
+                raise ValueError(f"Columns in class probabilities data frame ({y_predictedClassProbabilities.columns}) do not correspond to labels ({labels})")
             if len(y_predictedClassProbabilities) != len(y_true):
                 raise ValueError("Row count in class probabilities data frame does not match ground truth")
 
@@ -279,8 +330,12 @@ def getGlobalStats(self) -> ClassificationEvalStats:
             es0 = self.statsList[0]
             if es0.y_predictedClassProbabilities is not None:
                 y_probs = pd.concat([evalStats.y_predictedClassProbabilities for evalStats in self.statsList])
+                labels = list(y_probs.columns)
+            else:
+                y_probs = None
+                labels = es0.labels
             self.globalStats = ClassificationEvalStats(y_predicted=y_predicted, y_true=y_true, y_predictedClassProbabilities=y_probs,
-                labels=es0.labels, binaryPositiveLabel=es0.binaryPositiveLabel, metrics=es0.metrics)
+                labels=labels, binaryPositiveLabel=es0.binaryPositiveLabel, metrics=es0.metrics)
         return self.globalStats
 
 
diff --git a/src/sensai/evaluation/eval_util.py b/src/sensai/evaluation/eval_util.py
index 5e7a812c..68e30710 100644
--- a/src/sensai/evaluation/eval_util.py
+++ b/src/sensai/evaluation/eval_util.py
@@ -10,7 +10,7 @@
 from abc import ABC, abstractmethod
 from collections import defaultdict
 from dataclasses import dataclass
-from typing import Tuple, Dict, Any, Union, Generic, TypeVar, Optional, Sequence, Callable, Set, Iterable, List
+from typing import Dict, Any, Union, Generic, TypeVar, Optional, Sequence, Callable, Set, Iterable, List
 
 import matplotlib.figure
 import matplotlib.pyplot as plt
@@ -31,10 +31,11 @@
     VectorRegressionModelEvaluationData, VectorClassificationModelEvaluator, VectorClassificationModelEvaluationData, \
     VectorRegressionModelEvaluatorParams, VectorClassificationModelEvaluatorParams, VectorModelEvaluatorParams
 from ..data import InputOutputData
-from ..sklearn.sklearn_util import AggregatedFeatureImportances
+from ..feature_importance import AggregatedFeatureImportances, FeatureImportanceProvider
 from ..util.io import ResultWriter
+from ..util.plot import MATPLOTLIB_DEFAULT_FIGURE_SIZE
 from ..util.string import prettyStringRepr
-from ..vector_model import VectorClassificationModel, VectorRegressionModel, VectorModel
+from ..vector_model import VectorClassificationModel, VectorRegressionModel, VectorModel, VectorModelBase
 
 log = logging.getLogger(__name__)
 
@@ -488,7 +489,8 @@ def compareModels(self, modelFactories: Sequence[Callable[[], Union[VectorRegres
         :param createCombinedEvalStatsPlots: whether to combine, for each type of model, the EvalStats objects from the individual experiments
             into a single objects that holds all results and use it to create plots reflecting the overall result.
             Note that for classification, this is only possible if all individual experiments use the same set of class labels.
-        :param visitors: visitors which may process individual results
+        :param visitors: visitors which may process individual results. Plots generated by visitors are created/collected at the end of the
+            comparison.
         :return: a pair of data frames (allDF, meanDF) where allDF contains all the individual evaluation results (one row per data set)
             and meanDF contains one row for each model with results averaged across datasets
         """
@@ -553,8 +555,10 @@ def compareModels(self, modelFactories: Sequence[Callable[[], Union[VectorRegres
         # (because the mean would be computed without them, skipna parameter unsupported)
         allResultsGrouped = allResultsDF.dropna(axis=1).groupby("modelName")
         meanResultsDF: pd.DataFrame = allResultsGrouped.mean()
-        if columnNameForModelRanking in meanResultsDF:
-            meanResultsDF.sort_values(columnNameForModelRanking, inplace=True, ascending=not rankMax)
+        for colName in [columnNameForModelRanking, f"mean[{columnNameForModelRanking}]"]:
+            if colName in meanResultsDF:
+                meanResultsDF.sort_values(colName, inplace=True, ascending=not rankMax)
+                break
         strMeanResults = f"Mean results (averaged across {len(self.inputOutputDataDict)} data sets):\n{meanResultsDF.to_string()}"
         log.info(strMeanResults)
 
@@ -585,6 +589,11 @@ def compareModels(self, modelFactories: Sequence[Callable[[], Union[VectorRegres
                     evalStats = ClassificationEvalStatsCollection(evalStatsList).getGlobalStats()
                 plotCollector.createPlots(evalStats, subtitle=modelName, resultCollector=resultCollector)
 
+        # create plots from visitors (if any)
+        resultCollector = EvaluationResultCollector(showPlots=False, resultWriter=resultWriter)
+        for visitor in visitors:
+            visitor.collectPlots(resultCollector)
+
         if isRegression:
             return RegressionMultiDataModelComparisonData(allResultsDF, meanResultsDF, furtherAggsDF, evalStatsByModelName)
         else:
@@ -607,6 +616,15 @@ class ModelComparisonVisitor(ABC):
     def visit(self, modelName: str, result: ModelComparisonData.Result):
         pass
 
+    @abstractmethod
+    def collectPlots(self, resultCollector: EvaluationResultCollector) -> None:
+        """
+        Collects figures at the end of the model comparison, based on the results collected
+
+        :param resultCollector: the collector to which figures are to be added
+        """
+        pass
+
 
 class ModelComparisonVisitorAggregatedFeatureImportances(ModelComparisonVisitor):
     """
@@ -631,11 +649,25 @@ def visit(self, modelName: str, result: ModelComparisonData.Result):
             elif result.evalData is not None:
                 self._collect(result.evalData.model)
 
-    def _collect(self, model):
-        if not hasattr(model, "getFeatureImportances"):
-            raise ValueError(f"Got model which does not have method 'getFeatureImportances': {model}")
+    def _collect(self, model: Union[FeatureImportanceProvider, VectorModelBase]):
+        if not isinstance(model, FeatureImportanceProvider):
+            raise ValueError(f"Got model which does not inherit from {FeatureImportanceProvider.__qualname__}: {model}")
         self.aggFeatureImportance.add(model.getFeatureImportances())
 
+    def plotFeatureImportance(self) -> plt.Figure:
+        """:return: a figure containing a bar plot of the aggregated feature importance values (one bar per entry)"""
+        featureImportanceDict = self.aggFeatureImportance.aggDict
+        defaultWidth, defaultHeight = MATPLOTLIB_DEFAULT_FIGURE_SIZE
+        height = max(defaultHeight, defaultHeight * len(featureImportanceDict) / 20)  # grow figure beyond 20 entries
+        fig, ax = plt.subplots(figsize=(defaultWidth, height))
+        sns.barplot(x=list(featureImportanceDict.values()), y=list(featureImportanceDict.keys()), ax=ax)
+        plt.title(f"Feature Importance\n{self.modelName}")
+        plt.tight_layout()
+        return fig
+
+    def collectPlots(self, resultCollector: EvaluationResultCollector):
+        resultCollector.addFigure(f"{self.modelName}_feature-importance", self.plotFeatureImportance())
+
 
 class MultiDataModelComparisonData(Generic[TEvalStats, TEvalStatsCollection], ABC):
     def __init__(self, allResultsDF: pd.DataFrame, meanResultsDF: pd.DataFrame, aggResultsDF: pd.DataFrame,
diff --git a/src/sensai/sklearn/sklearn_util.py b/src/sensai/feature_importance.py
similarity index 60%
rename from src/sensai/sklearn/sklearn_util.py
rename to src/sensai/feature_importance.py
index 9fef82fd..f752c139 100644
--- a/src/sensai/sklearn/sklearn_util.py
+++ b/src/sensai/feature_importance.py
@@ -1,29 +1,47 @@
 import collections
+from abc import ABC, abstractmethod
 from typing import Dict, Union
 
 
+class FeatureImportanceProvider(ABC):
+    """
+    Interface for models that can provide feature importance values
+    """
+    @abstractmethod
+    def getFeatureImportances(self) -> Union[Dict[str, float], Dict[str, Dict[str, float]]]:
+        """
+        Gets the feature importance values
+
+        :return: either a dictionary mapping feature names to importance values or (for models predicting multiple
+            variables (independently)) a dictionary which maps predicted variable names to such dictionaries
+        """
+        pass
+
+
 class AggregatedFeatureImportances:
     """
     Aggregates feature importance values from models that suppurt method getFeatureImportances
     (e.g. sklearn's RandomForest models and compatible models from lightgbm, etc.)
     """
-    def __init__(self, *featureImportanceDicts: Union[Dict[str, float], Dict[str, Dict[str, float]]]):
+    def __init__(self, *featureImportances: Union[FeatureImportanceProvider, Dict[str, float], Dict[str, Dict[str, float]]]):
         self.aggDict = None
         self._isNested = None
         self._numDictsAdded = 0
-        for d in featureImportanceDicts:
+        for d in featureImportances:
             self.add(d)
 
     @staticmethod
     def _isDict(x):
         return hasattr(x, "get")
 
-    def add(self, featureImportance: Union[Dict[str, float], Dict[str, Dict[str, float]]]):
+    def add(self, featureImportance: Union[FeatureImportanceProvider, Dict[str, float], Dict[str, Dict[str, float]]]):
         """
         Adds the feature importance values from the given dictionary
 
         :param featureImportance: the dictionary obtained via a model's getFeatureImportances method
         """
+        if isinstance(featureImportance, FeatureImportanceProvider):
+            featureImportance = featureImportance.getFeatureImportances()
         if self._isNested is None:
             self._isNested = self._isDict(next(iter(featureImportance.values())))
         if self._isNested:
diff --git a/src/sensai/featuregen.py b/src/sensai/featuregen.py
index 009be4fd..688f0183 100644
--- a/src/sensai/featuregen.py
+++ b/src/sensai/featuregen.py
@@ -33,7 +33,7 @@ def __init__(self, categoricalFeatureNames: Optional[Union[Sequence[str], str]]
                  normalisationRuleTemplate: data_transformation.DFTNormalisation.RuleTemplate = None, addCategoricalDefaultRules=True):
         """
         :param categoricalFeatureNames: either a sequence of column names or a regex that is to match all categorical feature names
-            (which must not only work for the feature generated by this feature, i.e. it should not match feature names generated
+            (which must not only work for the feature generated by this feature generator, i.e. it should not match feature names generated
             by other feature generators).
             It will be ensured that the respective columns in the generated data frames will have dtype 'category'.
             Furthermore, presence of meta-information can later be leveraged for further transformations, e.g. one-hot encoding.
@@ -372,16 +372,23 @@ def _generateFeatureDict(self, namedTuple) -> Dict[str, Any]:
 
 
 class FeatureGeneratorTakeColumns(RuleBasedFeatureGenerator):
-    def __init__(self, columns: Union[str, List[str]] = None, exceptColumns: Sequence[str] = (), categoricalFeatureNames: Sequence[str] = (),
-                 normalisationRules: Sequence[data_transformation.DFTNormalisation.Rule] = (),
-                 normalisationRuleTemplate: data_transformation.DFTNormalisation.RuleTemplate = None):
+    def __init__(self, columns: Union[str, List[str]] = None, exceptColumns: Sequence[str] = (),
+            categoricalFeatureNames: Optional[Union[Sequence[str], str]] = (),
+            normalisationRules: Sequence[data_transformation.DFTNormalisation.Rule] = (),
+            normalisationRuleTemplate: data_transformation.DFTNormalisation.RuleTemplate = None):
         """
-
         :param columns: name of the column or list of names of columns to be taken. If None, all columns will be taken.
         :param exceptColumns: list of names of columns to not take if present in the input df
-        :param categoricalFeatureNames:
-        :param normalisationRules:
-        :param normalisationRuleTemplate:
+        :param categoricalFeatureNames: either a sequence of column names or a regex that is to match all categorical feature names
+            (which must not only work for the feature generated by this feature generator, i.e. it should not match feature names generated
+            by other feature generators).
+            It will be ensured that the respective columns in the generated data frames will have dtype 'category'.
+            Furthermore, presence of meta-information can later be leveraged for further transformations, e.g. one-hot encoding.
+        :param normalisationRules: Rules to be used by DFTNormalisation (e.g. for constructing an input transformer for a model).
+            These rules are only relevant if a DFTNormalisation object consuming them is instantiated and used
+            within a data processing pipeline. They do not affect feature generation.
+        :param normalisationRuleTemplate: This parameter can be supplied instead of normalisationRules for the case where
+            there shall be a single rule that applies to all columns generated by this feature generator that were not labeled as categorical.
         """
         super().__init__(categoricalFeatureNames=categoricalFeatureNames, normalisationRules=normalisationRules, normalisationRuleTemplate=normalisationRuleTemplate)
         if isinstance(columns, str):
diff --git a/src/sensai/geoanalytics/geo_clustering.py b/src/sensai/geoanalytics/geo_clustering.py
index 3a397bdb..2f351cef 100644
--- a/src/sensai/geoanalytics/geo_clustering.py
+++ b/src/sensai/geoanalytics/geo_clustering.py
@@ -1,23 +1,46 @@
+import collections
 import itertools
 import math
+from abc import abstractmethod, ABC
 from typing import List, Tuple
 
 import numpy as np
+import sklearn.cluster
 
 from .geo_coords import GeoCoord
 from .local_coords import LocalCoordinateSystem
 from ..clustering import GreedyAgglomerativeClustering
 
 
+class GeoCoordClusterer(ABC):
+    @abstractmethod
+    def fitGeoCoords(self, geoCoords: List[GeoCoord]):
+        """
+        :param geoCoords: the coordinates to be clustered
+        """
+        pass
+
+    @abstractmethod
+    def clustersIndices(self) -> Tuple[List[List[int]], List[int]]:
+        """
+        :return: a tuple (clusters, outliers), where clusters is a list of lists of original point indices
+            (each inner list forming one cluster) and outliers is the list of indices of points not within
+            any cluster
+        """
+        pass
+
+
 class GreedyAgglomerativeGeoCoordClusterer:
-    def __init__(self, maxMinDistanceForMergeM: float, maxDistanceM: float, minClusterSize: int):
+    def __init__(self, maxMinDistanceForMergeM: float, maxDistanceM: float, minClusterSize: int, lcs: LocalCoordinateSystem = None):
         """
         :param maxMinDistanceForMergeM: the maximum distance, in metres, for the minimum distance between two existing clusters for a merge
             to be admissible
         :param maxDistanceM: the maximum distance, in metres, between any two points for the points to be allowed to be in the same cluster
         :param minClusterSize: the minimum number of points any valid cluster must ultimately contain; the points in any smaller clusters
             shall be considered as outliers
+        :param lcs: the local coordinate system to use for clustering; if None, compute based on mean coordinates passed when fitting
         """
+        self.lcs = lcs
         self.minClusterSize = minClusterSize
         self.maxMinDistanceForMerge = maxMinDistanceForMergeM
         self.squaredMaxMinDistanceForMerge = maxMinDistanceForMergeM * maxMinDistanceForMergeM
@@ -51,24 +74,16 @@ def mergeCost(self, other):
         def merge(self, other):
             self.points += other.points
 
-    def fitGeoCoords(self, geoCoords: List[GeoCoord], lcs: LocalCoordinateSystem = None) -> None:
-        """
-        :param geoCoords: the coordinates to be clustered
-        :param lcs: the local coordinate system to use for clustering; if None, compute based on mean coordinates
-        """
-        if lcs is None:
+    def fitGeoCoords(self, geoCoords: List[GeoCoord]) -> None:
+        if self.lcs is None:
             meanCoord = GeoCoord.meanCoord(geoCoords)
-            lcs = LocalCoordinateSystem(meanCoord.lat, meanCoord.lon)
-        self.localPoints = [self.LocalPoint(np.array(lcs.getLocalCoords(p.lat, p.lon)), idx) for idx, p in enumerate(geoCoords)]
+            self.lcs = LocalCoordinateSystem(meanCoord.lat, meanCoord.lon)
+        self.localPoints = [self.LocalPoint(np.array(self.lcs.getLocalCoords(p.lat, p.lon)), idx) for idx, p in enumerate(geoCoords)]
         clusters = [self.Cluster(lp, self) for lp in self.localPoints]
         clusters = GreedyAgglomerativeClustering(clusters).applyClustering()
         self.clusters = clusters
 
     def clustersIndices(self) -> Tuple[List[List[int]], List[int]]:
-        """
-        :return: a tuple (clusters, outliers), where clusters is a list of lists of original point indices where each inner list forms
-         a cluster and outliers is the list of indices of points not within a cluster
-        """
         outliers = []
         clusters = []
         for c in self.clusters:
@@ -78,3 +93,59 @@ def clustersIndices(self) -> Tuple[List[List[int]], List[int]]:
             else:
                 clusters.append(indices)
         return clusters, outliers
+
+
+class SkLearnGeoCoordClusterer(GeoCoordClusterer):
+    def __init__(self, clusterer, lcs: LocalCoordinateSystem = None):
+        """
+        :param clusterer: a clusterer from sklearn.cluster
+        :param lcs: the local coordinate system to use for Euclidean conversion; if None, determine from data (using mean coordinate as centre)
+        """
+        self.lcs = lcs
+        self.clusterer = clusterer
+        self.localPoints = None
+
+    def fitGeoCoords(self, geoCoords: List[GeoCoord]):
+        if self.lcs is None:
+            meanCoord = GeoCoord.meanCoord(geoCoords)
+            self.lcs = LocalCoordinateSystem(meanCoord.lat, meanCoord.lon)
+        self.localPoints = [self.lcs.getLocalCoords(p.lat, p.lon) for p in geoCoords]
+        self.clusterer.fit(self.localPoints)
+
+    def _clusters(self, mode):
+        clusters = collections.defaultdict(list)
+        outliers = []
+        for idxPoint, idxCluster in enumerate(self.clusterer.labels_):
+            if mode == "localPoints":
+                item = self.localPoints[idxPoint]
+            elif mode == "indices":
+                item = idxPoint
+            else:
+                raise ValueError()
+            if idxCluster >= 0:
+                clusters[idxCluster].append(item)
+            else:
+                outliers.append(item)
+        return list(clusters.values()), outliers
+
+    def clustersLocalPoints(self) -> Tuple[List[List[Tuple[float, float]]], List[Tuple[float, float]]]:
+        """
+        :return: a tuple (clusters, outliers), where clusters is a list of lists of local points
+            (each inner list forming one cluster) and outliers is the list of local points not within
+            any cluster
+        """
+        return self._clusters("localPoints")
+
+    def clustersIndices(self) -> Tuple[List[List[int]], List[int]]:
+        return self._clusters("indices")
+
+
+class DBSCANGeoCoordClusterer(SkLearnGeoCoordClusterer):
+    def __init__(self, eps, min_samples, lcs: LocalCoordinateSystem = None, **kwargs):
+        """
+        :param eps: the maximum distance between two samples for one to be considered as in the neighbourhood of the other
+        :param min_samples: the minimum number of samples that must be within a neighbourhood for a cluster to be formed
+        :param lcs: the local coordinate system for conversion to a Euclidean space
+        :param kwargs: additional arguments to pass to DBSCAN (see https://scikit-learn.org/stable/modules/generated/sklearn.cluster.DBSCAN.html)
+        """
+        super().__init__(sklearn.cluster.DBSCAN(eps=eps, min_samples=min_samples, **kwargs), lcs)
\ No newline at end of file
diff --git a/src/sensai/lightgbm.py b/src/sensai/lightgbm.py
index 4dfb92b8..c354b931 100644
--- a/src/sensai/lightgbm.py
+++ b/src/sensai/lightgbm.py
@@ -4,21 +4,36 @@
 import pandas as pd
 import re
 
+from .feature_importance import FeatureImportanceProvider
 from .util.string import orRegexGroup
 from .sklearn.sklearn_base import AbstractSkLearnMultipleOneDimVectorRegressionModel, AbstractSkLearnVectorClassificationModel
 
 log = logging.getLogger(__name__)
 
 
-class LightGBMVectorRegressionModel(AbstractSkLearnMultipleOneDimVectorRegressionModel):
+# noinspection PyUnusedLocal
+def _updateFitArgs(fitArgs: dict, inputs: pd.DataFrame, outputs: pd.DataFrame, categoricalFeatureNameRegex: Optional[str]):
+    if categoricalFeatureNameRegex is not None:
+        cols = list(inputs.columns)
+        categoricalFeatureNames = [col for col in cols if re.match(categoricalFeatureNameRegex, col)]
+        colIndices = [cols.index(f) for f in categoricalFeatureNames]
+        args = {"categorical_feature": colIndices}
+        log.info(f"Updating fit parameters with {args}")
+        fitArgs.update(args)
+    else:
+        fitArgs.pop("categorical_feature", None)
+
+
+class LightGBMVectorRegressionModel(AbstractSkLearnMultipleOneDimVectorRegressionModel, FeatureImportanceProvider):
     log = log.getChild(__qualname__)
 
     def __init__(self, categoricalFeatureNames: Optional[Union[Sequence[str], str]] = None, random_state=42, num_leaves=31,
             max_depth=-1, n_estimators=100, min_child_samples=20, importance_type="gain", **modelArgs):
         """
-        :param categoricalFeatureNames: sequence of feature names in the input data that are categorical.
+        :param categoricalFeatureNames: sequence of feature names in the input data that are categorical or a single string containing
+            a regex matching the categorical feature names.
             Columns that have dtype 'category' (as will be the case for categorical columns created via FeatureGenerators)
-            need not be specified (should be inferred automatically).
+            need not be specified (will be inferred automatically).
             In general, passing categorical features is preferable to using one-hot encoding, for example.
         :param random_state: the random seed to use
         :param num_leaves: the maximum number of leaves in one tree (original lightgbm default is 31)
@@ -43,30 +58,24 @@ def __init__(self, categoricalFeatureNames: Optional[Union[Sequence[str], str]]
                 categoricalFeatureNameRegex = None
         self._categoricalFeatureNameRegex: str = categoricalFeatureNameRegex
 
-    def _updateModelArgs(self, inputs: pd.DataFrame, outputs: pd.DataFrame):
-        if self._categoricalFeatureNameRegex is not None:
-            cols = list(inputs.columns)
-            categoricalFeatureNames = [col for col in cols if re.match(self._categoricalFeatureNameRegex, col)]
-            colIndices = [cols.index(f) for f in categoricalFeatureNames]
-            args = {"cat_column": colIndices}
-            self.log.info(f"Updating model parameters with {args}")
-            self.modelArgs.update(args)
+    def _updateFitArgs(self, inputs: pd.DataFrame, outputs: pd.DataFrame):
+        _updateFitArgs(self.fitArgs, inputs, outputs, self._categoricalFeatureNameRegex)
 
     def getFeatureImportances(self) -> Dict[str, Dict[str, int]]:
         return {targetFeature: dict(zip(model.feature_name_, model.feature_importances_)) for targetFeature, model in self.models.items()}
 
 
-class LightGBMVectorClassificationModel(AbstractSkLearnVectorClassificationModel):
+class LightGBMVectorClassificationModel(AbstractSkLearnVectorClassificationModel, FeatureImportanceProvider):
     log = log.getChild(__qualname__)
 
-    def __init__(self, categoricalFeatureNames: Sequence[str] = None, random_state=42, num_leaves=31,
+    def __init__(self, categoricalFeatureNames: Optional[Union[Sequence[str], str]] = None, random_state=42, num_leaves=31,
             max_depth=-1, n_estimators=100, min_child_samples=20, importance_type="gain", useComputedClassWeights=False,
             **modelArgs):
         """
-        :param categoricalFeatureNames: sequence of feature names in the input data that are categorical
+        :param categoricalFeatureNames: sequence of feature names in the input data that are categorical or a single string containing
+            a regex matching the categorical feature names.
             Columns that have dtype 'category' (as will be the case for categorical columns created via FeatureGenerators)
-            need not be specified (should be inferred automatically, but we have never actually tested this behaviour
-            successfully for a classification model).
+            need not be specified (will be inferred automatically).
             In general, passing categorical features may be preferable to using one-hot encoding, for example.
         :param random_state: the random seed to use
         :param num_leaves: the maximum number of leaves in one tree (original lightgbm default is 31)
@@ -93,14 +102,8 @@ def __init__(self, categoricalFeatureNames: Sequence[str] = None, random_state=4
                 categoricalFeatureNameRegex = None
         self._categoricalFeatureNameRegex: str = categoricalFeatureNameRegex
 
-    def _updateModelArgs(self, inputs: pd.DataFrame, outputs: pd.DataFrame):
-        if self._categoricalFeatureNameRegex is not None:
-            cols = list(inputs.columns)
-            categoricalFeatureNames = [col for col in cols if re.match(self._categoricalFeatureNameRegex, col)]
-            colIndices = [cols.index(f) for f in categoricalFeatureNames]
-            args = {"cat_column": colIndices}
-            self.log.info(f"Updating model parameters with {args}")
-            self.modelArgs.update(args)
+    def _updateFitArgs(self, inputs: pd.DataFrame, outputs: pd.DataFrame):
+        _updateFitArgs(self.fitArgs, inputs, outputs, self._categoricalFeatureNameRegex)
 
     def getFeatureImportances(self) -> Dict[str, Dict[str, int]]:
         return dict(zip(self.model.feature_name_, self.model.feature_importances_))
diff --git a/src/sensai/sklearn/sklearn_base.py b/src/sensai/sklearn/sklearn_base.py
index d27f7df4..38f7859a 100644
--- a/src/sensai/sklearn/sklearn_base.py
+++ b/src/sensai/sklearn/sklearn_base.py
@@ -1,8 +1,8 @@
 import copy
 import logging
-from abc import ABC, abstractmethod
-from typing import List, Any, Dict
 import re
+from abc import ABC, abstractmethod
+from typing import List, Any, Dict, Optional
 
 import numpy as np
 import pandas as pd
@@ -31,6 +31,21 @@ def strSkLearnModel(model):
     return re.sub(r",\s*", ", ", str(model))
 
 
+def _applySkLearnInputTransformer(inputs: pd.DataFrame, sklearnInputTransformer: Optional, fit: bool) -> pd.DataFrame:
+    """
+    Applies the given sklearn transformer (if not None) to the data frame's values, fitting it first if `fit` is True
+    """
+    if sklearnInputTransformer is None:
+        return inputs
+    inputValues = inputs.values
+    shapeBefore = inputValues.shape
+    transform = sklearnInputTransformer.fit_transform if fit else sklearnInputTransformer.transform
+    inputValues = transform(inputValues)
+    if inputValues.shape != shapeBefore:
+        raise Exception("sklearnInputTransformer changed the shape of the input, which is unsupported. Consider using a DFTSkLearnTransformer in inputTransformers instead.")
+    return pd.DataFrame(inputValues, index=inputs.index, columns=inputs.columns)
+
+
 class AbstractSkLearnVectorRegressionModel(VectorRegressionModel, ABC):
     """
     Base class for models built upon scikit-learn's model implementations
@@ -47,6 +62,7 @@ def __init__(self, modelConstructor, **modelArgs):
         self.sklearnOutputTransformer = None
         self.modelConstructor = modelConstructor
         self.modelArgs = modelArgs
+        self.fitArgs = {}
 
     def _toStringExcludes(self) -> List[str]:
         return super()._toStringExcludes() + ["sklearnInputTransformer", "sklearnOutputTransformer", "modelConstructor", "modelArgs"]
@@ -68,18 +84,7 @@ def withSkLearnOutputTransformer(self, sklearnOutputTransformer):
         return self
 
     def _transformInput(self, inputs: pd.DataFrame, fit=False) -> pd.DataFrame:
-        if self.sklearnInputTransformer is None:
-            return inputs
-        else:
-            inputValues = inputs.values
-            shapeBefore = inputValues.shape
-            if fit:
-                inputValues = self.sklearnInputTransformer.fit_transform(inputValues)
-            else:
-                inputValues = self.sklearnInputTransformer.transform(inputValues)
-            if inputValues.shape != shapeBefore:
-                raise Exception("sklearnInputTransformer changed the shape of the input, which is unsupported. Consider using an a DFTSkLearnTransformer in inputTransformers instead.")
-            return pd.DataFrame(inputValues, index=inputs.index, columns=inputs.columns)
+        return _applySkLearnInputTransformer(inputs, self.sklearnInputTransformer, fit)
 
     def _updateModelArgs(self, inputs: pd.DataFrame, outputs: pd.DataFrame):
         """
@@ -90,9 +95,20 @@ def _updateModelArgs(self, inputs: pd.DataFrame, outputs: pd.DataFrame):
         """
         pass
 
+    def _updateFitArgs(self, inputs: pd.DataFrame, outputs: pd.DataFrame):
+        """
+        Designed to be overridden in order to make input data-specific changes to fitArgs (arguments to be passed to the
+        underlying model's fit method)
+
+        :param inputs: the training input data
+        :param outputs: the training output data
+        """
+        pass
+
     def _fit(self, inputs: pd.DataFrame, outputs: pd.DataFrame):
         inputs = self._transformInput(inputs, fit=True)
         self._updateModelArgs(inputs, outputs)
+        self._updateFitArgs(inputs, outputs)
         self._fitSkLearn(inputs, outputs)
 
     @abstractmethod
@@ -134,7 +150,7 @@ def _fitSkLearn(self, inputs: pd.DataFrame, outputs: pd.DataFrame):
             model = createSkLearnModel(self.modelConstructor,
                     self.modelArgs,
                     outputTransformer=copy.deepcopy(self.sklearnOutputTransformer))
-            model.fit(inputs, outputs[predictedVarName])
+            model.fit(inputs, outputs[predictedVarName], **self.fitArgs)
             self.models[predictedVarName] = model
 
     def _predictSkLearn(self, inputs: pd.DataFrame) -> pd.DataFrame:
@@ -170,7 +186,7 @@ def _fitSkLearn(self, inputs: pd.DataFrame, outputs: pd.DataFrame):
         outputValues = outputs.values
         if outputValues.shape[1] == 1:  # for 1D output, shape must be (numSamples,) rather than (numSamples, 1)
             outputValues = np.ravel(outputValues)
-        self.model.fit(inputs, outputValues)
+        self.model.fit(inputs, outputValues, **self.fitArgs)
 
     def _predictSkLearn(self, inputs: pd.DataFrame) -> pd.DataFrame:
         Y = self.model.predict(inputs)
@@ -190,6 +206,7 @@ def __init__(self, modelConstructor, useComputedClassWeights=False, **modelArgs)
         self.sklearnInputTransformer = None
         self.sklearnOutputTransformer = None
         self.modelArgs = modelArgs
+        self.fitArgs = {}
         self.useComputedClassWeights = useComputedClassWeights
         self.model = None
 
@@ -233,27 +250,33 @@ def _updateModelArgs(self, inputs: pd.DataFrame, outputs: pd.DataFrame):
         """
         pass
 
+    def _updateFitArgs(self, inputs: pd.DataFrame, outputs: pd.DataFrame):
+        """
+        Designed to be overridden in order to make input data-specific changes to fitArgs (arguments to be passed to the
+        underlying model's fit method)
+
+        :param inputs: the training input data
+        :param outputs: the training output data
+        """
+        pass
+
     def _fitClassifier(self, inputs: pd.DataFrame, outputs: pd.DataFrame):
-        inputValues = self._transformInput(inputs, fit=True)
+        inputs = self._transformInput(inputs, fit=True)
         self._updateModelArgs(inputs, outputs)
+        self._updateFitArgs(inputs, outputs)
         self.model = createSkLearnModel(self.modelConstructor, self.modelArgs, self.sklearnOutputTransformer)
         log.info(f"Fitting sklearn classifier of type {self.model.__class__.__name__}")
-        kwargs = {}
+        kwargs = dict(self.fitArgs)
         if self.useComputedClassWeights:
             class2weight = self._computeClassWeights(outputs)
             classes = outputs.iloc[:, 0]
             weights = [class2weight[cls] for cls in classes]
             kwargs["sample_weight"] = np.array(weights)
-        self.model.fit(inputValues, np.ravel(outputs.values), **kwargs)
+        outputValues = np.ravel(outputs.values)
+        self.model.fit(inputs, outputValues, **kwargs)
 
-    def _transformInput(self, inputs: pd.DataFrame, fit=False) -> np.ndarray:
-        inputValues = inputs.values
-        if self.sklearnInputTransformer is not None:
-            if fit:
-                inputValues = self.sklearnInputTransformer.fit_transform(inputValues)
-            else:
-                inputValues = self.sklearnInputTransformer.transform(inputValues)
-        return inputValues
+    def _transformInput(self, inputs: pd.DataFrame, fit=False) -> pd.DataFrame:
+        return _applySkLearnInputTransformer(inputs, self.sklearnInputTransformer, fit)
 
     def _predict(self, x: pd.DataFrame):
         inputValues = self._transformInput(x)
diff --git a/src/sensai/sklearn/sklearn_classification.py b/src/sensai/sklearn/sklearn_classification.py
index a57b80ae..e1349aea 100644
--- a/src/sensai/sklearn/sklearn_classification.py
+++ b/src/sensai/sklearn/sklearn_classification.py
@@ -7,7 +7,7 @@
 import sklearn.tree
 
 from .sklearn_base import AbstractSkLearnVectorClassificationModel
-
+from ..feature_importance import FeatureImportanceProvider
 
 log = logging.getLogger(__name__)
 
@@ -18,7 +18,7 @@ def __init__(self, min_samples_leaf=8, random_state=42, **modelArgs):
             min_samples_leaf=min_samples_leaf, random_state=random_state, **modelArgs)
 
 
-class SkLearnRandomForestVectorClassificationModel(AbstractSkLearnVectorClassificationModel):
+class SkLearnRandomForestVectorClassificationModel(AbstractSkLearnVectorClassificationModel, FeatureImportanceProvider):
     def __init__(self, min_samples_leaf=8, random_state=42, useComputedClassWeights=False, **modelArgs):
         super().__init__(sklearn.ensemble.RandomForestClassifier,
             random_state=random_state, min_samples_leaf=min_samples_leaf,
@@ -26,7 +26,7 @@ def __init__(self, min_samples_leaf=8, random_state=42, useComputedClassWeights=
             **modelArgs)
 
     def getFeatureImportances(self) -> Dict[str, float]:
-        return  dict(zip(self._modelInputVariableNames, self.model.feature_importances_))
+        return dict(zip(self._modelInputVariableNames, self.model.feature_importances_))
 
 
 class SkLearnMLPVectorClassificationModel(AbstractSkLearnVectorClassificationModel):
diff --git a/src/sensai/sklearn/sklearn_regression.py b/src/sensai/sklearn/sklearn_regression.py
index 9072c2a6..a1ec644f 100644
--- a/src/sensai/sklearn/sklearn_regression.py
+++ b/src/sensai/sklearn/sklearn_regression.py
@@ -8,12 +8,12 @@
 import sklearn.svm
 
 from .sklearn_base import AbstractSkLearnMultipleOneDimVectorRegressionModel, AbstractSkLearnMultiDimVectorRegressionModel
-
+from ..feature_importance import FeatureImportanceProvider
 
 log = logging.getLogger(__name__)
 
 
-class SkLearnRandomForestVectorRegressionModel(AbstractSkLearnMultipleOneDimVectorRegressionModel):
+class SkLearnRandomForestVectorRegressionModel(AbstractSkLearnMultipleOneDimVectorRegressionModel, FeatureImportanceProvider):
     def __init__(self, n_estimators=100, min_samples_leaf=10, random_state=42, **modelArgs):
         super().__init__(sklearn.ensemble.RandomForestRegressor,
             n_estimators=n_estimators, min_samples_leaf=min_samples_leaf, random_state=random_state, **modelArgs)
@@ -22,7 +22,7 @@ def getFeatureImportances(self) -> Dict[str, Dict[str, float]]:
         return {targetFeature: dict(zip(self._modelInputVariableNames, model.feature_importances_)) for targetFeature, model in self.models.items()}
 
 
-class SkLearnLinearRegressionVectorRegressionModel(AbstractSkLearnMultiDimVectorRegressionModel):
+class SkLearnLinearRegressionVectorRegressionModel(AbstractSkLearnMultiDimVectorRegressionModel, FeatureImportanceProvider):
     def __init__(self, **modelArgs):
         super().__init__(sklearn.linear_model.LinearRegression, **modelArgs)
 
diff --git a/src/sensai/util/cache.py b/src/sensai/util/cache.py
index 64cde847..5271c55e 100644
--- a/src/sensai/util/cache.py
+++ b/src/sensai/util/cache.py
@@ -616,7 +616,8 @@ def __init__(self, cacheBasePath: str, filenamePrefix: str = None, filename: str
         :param filenamePrefix: a prefix of the name of the cache file to be created, to which the function name and, where applicable,
             a hash code of the function arguments will be appended and ".cache.pickle" will be appended; if None, use "" (if filename
             has not been provided)
-        :param filename: the full file name of the cache file to be created; this is admissible only if the function has no arguments
+        :param filename: the full file name of the cache file to be created; if the function takes arguments, the filename must
+            contain a placeholder '%s' for the argument hash
         :param backend: the serialisation backend to use (see dumpPickle)
         :param protocol: the pickle protocol version to use
         :param load: whether to load a previously persisted result; if False, do not load an old result but store the newly computed result
@@ -636,16 +637,24 @@ def __init__(self, cacheBasePath: str, filenamePrefix: str = None, filename: str
     def __call__(self, fn: Callable, *_args, **_kwargs):
 
         def wrapped(*args, **kwargs):
+            hashCodeStr = None
             haveArgs = len(args) > 0 or len(kwargs) > 0
+            if haveArgs:
+                hashCodeStr = pickleHash((args, kwargs))
             if self.filename is None:
-                filename = self.filenamePrefix + fn.__qualname__
-                if haveArgs:
-                    filename += "-" + pickleHash((args, kwargs))
+                filename = self.filenamePrefix + fn.__qualname__.replace(".<locals>.", ".")
+                if hashCodeStr is not None:
+                    filename += "-" + hashCodeStr
                 filename += ".cache.pickle"
             else:
-                if haveArgs:
-                    raise Exception("Function called with arguments but full cache filename specified: specify a cache filename prefix only to account for argument values")
-                filename = self.filename
+                if hashCodeStr is not None:
+                    if not "%s" in self.filename:
+                        raise Exception("Function called with arguments but full cache filename contains no placeholder (%s) for argument hash")
+                    filename = self.filename % hashCodeStr
+                else:
+                    if "%s" in self.filename:
+                        raise Exception("Function without arguments but full cache filename with placeholder (%s) was specified")
+                    filename = self.filename
             picklePath = os.path.join(self.cacheBasePath, filename)
             return cached(lambda: fn(*args, **kwargs), picklePath, functionName=fn.__name__, backend=self.backend, load=self.load)
 
diff --git a/src/sensai/util/plot.py b/src/sensai/util/plot.py
index 8f50a4fa..225de905 100644
--- a/src/sensai/util/plot.py
+++ b/src/sensai/util/plot.py
@@ -10,6 +10,9 @@
 log = logging.getLogger(__name__)
 
 
+MATPLOTLIB_DEFAULT_FIGURE_SIZE = (6.4, 4.8)
+
+
 def plotMatrix(matrix, title, xticklabels: Sequence[str], yticklabels: Sequence[str], xlabel: str, ylabel: str, normalize=True, figsize=(9,9),
         titleAdd: str = None) -> matplotlib.figure.Figure:
     """
diff --git a/src/sensai/xgboost.py b/src/sensai/xgboost.py
index 0ebba8ef..e6716af6 100644
--- a/src/sensai/xgboost.py
+++ b/src/sensai/xgboost.py
@@ -25,7 +25,7 @@ def __init__(self, random_state=42, **modelArgs):
         super().__init__(xgboost.XGBRFRegressor, random_state=random_state, **modelArgs)
 
 
-class XGBGradientBoostedVectorClassifictionModel(AbstractSkLearnVectorClassificationModel):
+class XGBGradientBoostedVectorClassificationModel(AbstractSkLearnVectorClassificationModel):
     """
     XGBoost's classification model using gradient boosted trees
     """
@@ -36,7 +36,7 @@ def __init__(self, random_state=42, **modelArgs):
         super().__init__(xgboost.XGBClassifier, random_state=random_state, **modelArgs)
 
 
-class XGBRandomForestVectorClassifictionModel(AbstractSkLearnVectorClassificationModel):
+class XGBRandomForestVectorClassificationModel(AbstractSkLearnVectorClassificationModel):
     """
     XGBoost's random forest classification model
     """

From 2306086d852741176246114358dff38d839e324a Mon Sep 17 00:00:00 2001
From: Dominik Jain <dominik.jain@jambit.com>
Date: Tue, 24 May 2022 14:16:36 +0200
Subject: [PATCH 061/131] Sync dcs

  commit 39b9b38a25d02dfe3242869e3e279add74e67477
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Mon May 23 19:28:10 2022 +0200

      Import PrecisionRecallDisplay locally, because it is not supported in older versions of sklearn

  dcs/sensai/evaluation/eval_stats/eval_stats_classification.py
---
 src/sensai/evaluation/eval_stats/eval_stats_classification.py | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/src/sensai/evaluation/eval_stats/eval_stats_classification.py b/src/sensai/evaluation/eval_stats/eval_stats_classification.py
index 9497b9f4..4a2d533c 100644
--- a/src/sensai/evaluation/eval_stats/eval_stats_classification.py
+++ b/src/sensai/evaluation/eval_stats/eval_stats_classification.py
@@ -7,7 +7,7 @@
 import numpy as np
 import pandas as pd
 import sklearn
-from sklearn.metrics import confusion_matrix, accuracy_score, precision_score, recall_score, precision_recall_curve, PrecisionRecallDisplay, \
+from sklearn.metrics import confusion_matrix, accuracy_score, precision_score, recall_score, precision_recall_curve, \
     balanced_accuracy_score, f1_score
 
 from .eval_stats_base import PredictionArray, PredictionEvalStats, EvalStatsCollection, Metric, EvalStatsPlot, TEvalStats
@@ -248,6 +248,7 @@ def plotConfusionMatrix(self, normalize=True, titleAdd: str = None):
         return confusionMatrix.plot(normalize=normalize, titleAdd=titleAdd)
 
     def plotPrecisionRecallCurve(self, titleAdd: str = None):
+        from sklearn.metrics import PrecisionRecallDisplay  # only supported by newer versions of sklearn
         if not self._probabilitiesAvailable:
             raise Exception("Precision-recall curve requires probabilities")
         if not self.isBinary:

From edcd94d3518cb3d98a5d2519784490431770776b Mon Sep 17 00:00:00 2001
From: Dominik Jain <dominik.jain@jambit.com>
Date: Wed, 25 May 2022 13:48:05 +0200
Subject: [PATCH 062/131] Sync pjm
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

  commit 7be6e5b76c51b287d9903cd0f59bee2618acd862
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Wed May 25 13:28:53 2022 +0200

      DataFrameSplitter: Added method split, renaming existing static method to splitWithIndices

  sensai/data.py

  commit 76972f0d5a25afd2ccc45b6982cc8d52bde66ac8
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Wed May 25 13:26:27 2022 +0200

      LightGBMVectorClassificationModel: Fixed prediction of class probabilities for case where only one class exists
      (as LGBMClassifier will return values for a second class with near-0 probabilities regardless)

  sensai/lightgbm.py

  commit 9596c32859333d5dbb1e2627b1abe5014af649ab
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Wed May 25 13:24:28 2022 +0200

      VectorClassificationModel.predictClassProbabilities: Ensure index of output data frame matches input

  sensai/vector_model.py

  commit b09e09d229a7de62c6f4c781d253605c41776b0b
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Tue May 24 19:00:12 2022 +0200

      ModelComparisonData: Added methods getBestModel, getBestModelName

  sensai/evaluation/eval_util.py

  commit 407b42586d1bf1a673cdab42a67a9cce0865965a
  Author: Julian Übelacker <julian.uebelacker@jambit.com>
  Date:   Thu May 19 10:36:12 2022 +0200

      Add deprecation decorator in new module util.deprecation

  sensai/util/deprecation.py
---
 src/sensai/data.py                 |  5 ++++-
 src/sensai/evaluation/eval_util.py | 11 +++++++++++
 src/sensai/lightgbm.py             |  9 +++++++++
 src/sensai/util/deprecation.py     | 13 +++++++++++++
 src/sensai/vector_model.py         |  4 +++-
 5 files changed, 40 insertions(+), 2 deletions(-)
 create mode 100644 src/sensai/util/deprecation.py

diff --git a/src/sensai/data.py b/src/sensai/data.py
index 635438e9..263ba8bc 100644
--- a/src/sensai/data.py
+++ b/src/sensai/data.py
@@ -176,12 +176,15 @@ def computeSplitIndices(self, df: pd.DataFrame, fractionalSizeOfFirstSet: float)
         pass
 
     @staticmethod
-    def split(df: pd.DataFrame, indicesPair: Tuple[Sequence[int], Sequence[int]]) -> Tuple[pd.DataFrame, pd.DataFrame]:
+    def splitWithIndices(df: pd.DataFrame, indicesPair: Tuple[Sequence[int], Sequence[int]]) -> Tuple[pd.DataFrame, pd.DataFrame]:
         indicesA, indicesB = indicesPair
         A = df.iloc[indicesA]
         B = df.iloc[indicesB]
         return A, B
 
+    def split(self, df: pd.DataFrame, fractionalSizeOfFirstSet: float) -> Tuple[pd.DataFrame, pd.DataFrame]:
+        return self.splitWithIndices(df, self.computeSplitIndices(df, fractionalSizeOfFirstSet))
+
 
 class DataFrameSplitterFractional(DataFrameSplitter):
     def __init__(self, shuffle=False, randomSeed=42):
diff --git a/src/sensai/evaluation/eval_util.py b/src/sensai/evaluation/eval_util.py
index 68e30710..95d93050 100644
--- a/src/sensai/evaluation/eval_util.py
+++ b/src/sensai/evaluation/eval_util.py
@@ -14,6 +14,7 @@
 
 import matplotlib.figure
 import matplotlib.pyplot as plt
+import numpy as np
 import pandas as pd
 import seaborn as sns
 
@@ -610,6 +611,16 @@ def __init__(self, resultsDF: pd.DataFrame, resultsByModelName: Dict[str, Result
         self.resultsDF = resultsDF
         self.resultByModelName = resultsByModelName
 
+    def getBestModelName(self, metricName: str) -> str:
+        idx = np.argmax(self.resultsDF[metricName])
+        return self.resultsDF.index[idx]
+
+    def getBestModel(self, metricName: str) -> Union[VectorClassificationModel, VectorRegressionModel, VectorModelBase]:
+        result = self.resultByModelName[self.getBestModelName(metricName)]
+        if result.evalData is None:
+            raise ValueError("The best model is not well-defined when using cross-validation")
+        return result.evalData.model
+
 
 class ModelComparisonVisitor(ABC):
     @abstractmethod
diff --git a/src/sensai/lightgbm.py b/src/sensai/lightgbm.py
index c354b931..e9c51421 100644
--- a/src/sensai/lightgbm.py
+++ b/src/sensai/lightgbm.py
@@ -107,3 +107,12 @@ def _updateFitArgs(self, inputs: pd.DataFrame, outputs: pd.DataFrame):
 
     def getFeatureImportances(self) -> Dict[str, Dict[str, int]]:
         return dict(zip(self.model.feature_name_, self.model.feature_importances_))
+
+    def _predictClassProbabilities(self, x: pd.DataFrame):
+        if len(self._labels) == 1:
+            # special handling required because LGBMClassifier will return values for two classes even if there is only one
+            Y = self.model.predict_proba(self._transformInput(x))
+            Y = Y[:, 0]
+            return pd.DataFrame(Y, columns=self._labels)
+        else:
+            return super()._predictClassProbabilities(x)
\ No newline at end of file
diff --git a/src/sensai/util/deprecation.py b/src/sensai/util/deprecation.py
new file mode 100644
index 00000000..9cfe6907
--- /dev/null
+++ b/src/sensai/util/deprecation.py
@@ -0,0 +1,13 @@
+import warnings
+
+
+def deprecated(message):
+    def deprecated_decorator(func):
+        def deprecated_func(*args, **kwargs):
+            warnings.warn("{} is a deprecated function. {}".format(func.__name__, message),
+                category=DeprecationWarning,
+                stacklevel=2)
+            warnings.simplefilter('default', DeprecationWarning)
+            return func(*args, **kwargs)
+        return deprecated_func
+    return deprecated_decorator
diff --git a/src/sensai/vector_model.py b/src/sensai/vector_model.py
index 878d1917..9dd63c97 100644
--- a/src/sensai/vector_model.py
+++ b/src/sensai/vector_model.py
@@ -539,7 +539,8 @@ def convertClassProbabilitiesToPredictions(self, df: pd.DataFrame):
     def predictClassProbabilities(self, x: pd.DataFrame) -> pd.DataFrame:
         """
         :param x: the input data
-        :return: a data frame where the list of columns is the list of class labels and the values are probabilities.
+        :return: a data frame where the list of columns is the list of class labels and the values are probabilities, with the same
+            index as the input data frame.
             Raises an exception if the classifier cannot predict probabilities.
         """
         if not self.isFitted():
@@ -547,6 +548,7 @@ def predictClassProbabilities(self, x: pd.DataFrame) -> pd.DataFrame:
                             f"This might lead to errors down the line, especially if input/output checks are enabled")
         x = self._computeModelInputs(x)
         result = self._predictClassProbabilities(x)
+        result.index = x.index
         self._checkPrediction(result)
         return result
 

From 8c88712ca6c5f73dc1aa21c72025a79adefab321 Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Thu, 26 May 2022 18:03:12 +0200
Subject: [PATCH 063/131] Fixed spelling error

---
 README-dev.md | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/README-dev.md b/README-dev.md
index 25ceb3bd..4921b646 100644
--- a/README-dev.md
+++ b/README-dev.md
@@ -4,7 +4,7 @@ This section explains the steps required to set up an environment in order to de
 
 ## Clone Large Files
 
-Clone the full repo, including large files using [git large file storage](https://git-lfs.github.com):
+Clone the full repo, including large files using [git LFS](https://git-lfs.github.com):
 
     git lfs pull
 
@@ -18,7 +18,7 @@ Use conda to set up the Python environment:
 
 Solving the environment may take several minutes (but should ultimately work).
 
-NOTE: versions are mostly unpinned in the environment specification, because this facilitates conda dependency resolution. Also, sensAI is intended to be compatible with all (newer) versions of the dependencies. If it isn't, we need to specify  an upper version bound in `setup.py` (where it matters the most) as well as in `environment.yml`. Compatibility with old (pinned) versions and the latest versions is tested in the tox build (see blow).
+NOTE: versions are mostly unpinned in the environment specification, because this facilitates conda dependency resolution. Also, sensAI is intended to be compatible with all (newer) versions of the dependencies. If it isn't, we need to specify  an upper version bound in `setup.py` (where it matters the most) as well as in `environment.yml`. Compatibility with old (pinned) versions and the latest versions is tested in the tox build (see below).
 
 # Build and Test Pipeline
 

From 33f1ad4cec9d9ee8fd2f098a4abec2890c4775df Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Thu, 26 May 2022 18:03:50 +0200
Subject: [PATCH 064/131] Use top-level directory (which is now absolute) to
 produce paths

---
 config.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/config.py b/config.py
index 5681406d..3cf4b891 100644
--- a/config.py
+++ b/config.py
@@ -9,7 +9,7 @@
 
 __config_instance = None
 
-topLevelDirectory = os.path.dirname(__file__)
+topLevelDirectory = os.path.abspath(os.path.dirname(__file__))
 
 
 class __Configuration:
@@ -66,7 +66,7 @@ def _get_path(self, key: Union[str, List[str]], create=False) -> str:
         :return: the queried path
         """
         path_string = self._get_non_empty_entry(key)
-        path = os.path.abspath(path_string)
+        path = os.path.abspath(os.path.join(topLevelDirectory, path_string))
         if not os.path.exists(path):
             if isinstance(key, list):
                 key = ".".join(key)  # purely for logging

From 4f441a73e5217feec0074e9bef7ee47be5f65c5b Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Thu, 26 May 2022 18:04:31 +0200
Subject: [PATCH 065/131] Changed title, fixed typo

---
 notebooks/intro.ipynb | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/notebooks/intro.ipynb b/notebooks/intro.ipynb
index cdc8dd6f..dcba1db8 100644
--- a/notebooks/intro.ipynb
+++ b/notebooks/intro.ipynb
@@ -14,7 +14,7 @@
    "cell_type": "markdown",
    "metadata": {},
    "source": [
-    "# Introduction to sensAI"
+    "# Introduction to sensAI: Supervised Learning with VectorModels"
    ]
   },
   {
@@ -412,7 +412,7 @@
    "cell_type": "markdown",
    "metadata": {},
    "source": [
-    "Some of these are only active for binary classification. The one we don't want is \"confusion-matrx-rel\"."
+    "Some of these are only active for binary classification. The one we don't want is \"confusion-matrix-rel\"."
    ]
   },
   {
@@ -548,7 +548,7 @@
    "name": "python",
    "nbconvert_exporter": "python",
    "pygments_lexer": "ipython3",
-   "version": "3.7.9"
+   "version": "3.8.13"
   },
   "orig_nbformat": 4
  },

From 40dc4fefeed4aa186a2a1b5307ce2540c09e1057 Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Thu, 26 May 2022 18:05:25 +0200
Subject: [PATCH 066/131] Extended package-level imports to improve usability
 without auto-imports

---
 src/sensai/data_transformation/__init__.py | 3 ++-
 src/sensai/torch/__init__.py               | 8 ++++----
 2 files changed, 6 insertions(+), 5 deletions(-)

diff --git a/src/sensai/data_transformation/__init__.py b/src/sensai/data_transformation/__init__.py
index ab73e9be..fc9bc42f 100644
--- a/src/sensai/data_transformation/__init__.py
+++ b/src/sensai/data_transformation/__init__.py
@@ -1,2 +1,3 @@
 from .dft import *
-from . import sklearn_transformer
\ No newline at end of file
+from .sklearn_transformer import *
+from .value_transformation import *
diff --git a/src/sensai/torch/__init__.py b/src/sensai/torch/__init__.py
index 153c6431..a08a8031 100644
--- a/src/sensai/torch/__init__.py
+++ b/src/sensai/torch/__init__.py
@@ -1,5 +1,5 @@
 from . import torch_modules as modules, torch_models as models
-from .torch_data import TensorScaler, DataUtil, VectorDataUtil
-from .torch_opt import NNLossEvaluatorRegression, NNLossEvaluator, NNOptimiser
-from .torch_base import TorchModel, VectorTorchModel, TorchVectorRegressionModel, \
-    TorchVectorClassificationModel
+from .torch_data import *
+from .torch_opt import *
+from .torch_base import *
+from .torch_enums import *
\ No newline at end of file

From 29392e9e60b0d4f02d7819ebe62ce007229eb15a Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Thu, 26 May 2022 18:07:05 +0200
Subject: [PATCH 067/131] Added functions to support inspection of
 misclassifications

---
 .../eval_stats/eval_stats_classification.py         |  3 +++
 src/sensai/evaluation/evaluator.py                  | 13 +++++++++++--
 2 files changed, 14 insertions(+), 2 deletions(-)

diff --git a/src/sensai/evaluation/eval_stats/eval_stats_classification.py b/src/sensai/evaluation/eval_stats/eval_stats_classification.py
index 76f5d8f7..937fdfe9 100644
--- a/src/sensai/evaluation/eval_stats/eval_stats_classification.py
+++ b/src/sensai/evaluation/eval_stats/eval_stats_classification.py
@@ -293,6 +293,9 @@ def metricsDict(self) -> Dict[str, float]:
                 d[metric.name] = self.computeMetricValue(metric)
         return d
 
+    def getMisclassifiedIndices(self) -> List[int]:
+        return [i for i, (predClass, trueClass) in enumerate(zip(self.y_predicted, self.y_true)) if predClass != trueClass]
+
     def plotConfusionMatrix(self, normalize=True, titleAdd: str = None):
         # based on https://scikit-learn.org/0.20/auto_examples/model_selection/plot_confusion_matrix.html
         confusionMatrix = self.getConfusionMatrix()
diff --git a/src/sensai/evaluation/evaluator.py b/src/sensai/evaluation/evaluator.py
index a4481bb9..d0e6859f 100644
--- a/src/sensai/evaluation/evaluator.py
+++ b/src/sensai/evaluation/evaluator.py
@@ -1,7 +1,7 @@
 import functools
 import logging
 from abc import ABC, abstractmethod
-from typing import Tuple, Dict, Any, Generator, Generic, TypeVar, Sequence, Optional, List, Union, Callable
+from typing import Tuple, Dict, Any, Generator, Generic, TypeVar, Sequence, Optional, List, Union, Callable, Iterator
 
 import pandas as pd
 
@@ -314,7 +314,16 @@ def _computeOutputs(self, model: VectorModelBase, inputOutputData: InputOutputDa
 
 
 class VectorClassificationModelEvaluationData(VectorModelEvaluationData[ClassificationEvalStats]):
-    pass
+    def getMisclassifiedInputsDataFrame(self) -> pd.DataFrame:
+        return self.inputData.iloc[self.getEvalStats().getMisclassifiedIndices()]
+
+    def getMisclassifiedTriplesPredTrueInput(self) -> List[Tuple[Any, Any, pd.Series]]:
+        """
+        :return: a list containing a triple (predicted class, true class, input series) for each misclassified data point
+        """
+        evalStats = self.getEvalStats()
+        indices = evalStats.getMisclassifiedIndices()
+        return [(evalStats.y_predicted[i], evalStats.y_true[i], self.inputData.iloc[i]) for i in indices]
 
 
 class VectorClassificationModelEvaluatorParams(VectorModelEvaluatorParams):

From ebee943a9c938dad3bb6373b66fa734d8a4fbfc2 Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Thu, 26 May 2022 18:07:29 +0200
Subject: [PATCH 068/131] Added
 SkLearnLogisticRegressionVectorClassificationModel

---
 src/sensai/sklearn/sklearn_classification.py | 5 +++++
 1 file changed, 5 insertions(+)

diff --git a/src/sensai/sklearn/sklearn_classification.py b/src/sensai/sklearn/sklearn_classification.py
index e1349aea..9365446a 100644
--- a/src/sensai/sklearn/sklearn_classification.py
+++ b/src/sensai/sklearn/sklearn_classification.py
@@ -56,3 +56,8 @@ def __init__(self, **modelArgs):
 class SkLearnSVCVectorClassificationModel(AbstractSkLearnVectorClassificationModel):
     def __init__(self, random_state=42, **modelArgs):
         super().__init__(sklearn.svm.SVC, random_state=random_state, **modelArgs)
+
+
+class SkLearnLogisticRegressionVectorClassificationModel(AbstractSkLearnVectorClassificationModel):
+    def __init__(self, random_state=42, **modelArgs):
+        super().__init__(sklearn.linear_model.LogisticRegression, random_state=random_state, **modelArgs)
\ No newline at end of file

From 6f66212bf5b778f37d3f68bd6d0eeeaeeaf6dcd9 Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Thu, 26 May 2022 18:08:11 +0200
Subject: [PATCH 069/131] Improved docstring

---
 src/sensai/torch/torch_base.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/src/sensai/torch/torch_base.py b/src/sensai/torch/torch_base.py
index c845a97e..820f8b18 100644
--- a/src/sensai/torch/torch_base.py
+++ b/src/sensai/torch/torch_base.py
@@ -358,8 +358,8 @@ def createTorchModuleForDims(self, inputDim: int, outputDim: int) -> torch.nn.Mo
         """
         :param inputDim: the number of input dimensions as reported by the data set provider (number of columns
             in input data frame for default providers)
-        :param outputDim: the number of output dimensions as reported by the data set provider (number of columns
-            in output data frame for default providers)
+        :param outputDim: the number of output dimensions as reported by the data set provider (for default providers,
+            this will be the number of columns in the output data frame or, for classification, the number of classes)
         :return: the torch module
         """
         pass

From 754896061d3564eb12b79939ddf7efc60e8724c5 Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Thu, 26 May 2022 18:10:10 +0200
Subject: [PATCH 070/131] Extended ignored files

---
 .gitignore | 7 ++++++-
 1 file changed, 6 insertions(+), 1 deletion(-)

diff --git a/.gitignore b/.gitignore
index 83eac1fa..7a7b9f94 100644
--- a/.gitignore
+++ b/.gitignore
@@ -20,4 +20,9 @@ dist
 data
 .coverage
 /*.env
-/docs-build
\ No newline at end of file
+/docs-build
+/code.sh
+/lightning_logs
+*.code-workspace
+/TODO.txt
+notebooks/temp.ipynb
\ No newline at end of file

From 5c858b7b4119865f3ffd053e08aa8ac4e6c39317 Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Thu, 26 May 2022 18:12:12 +0200
Subject: [PATCH 071/131] Added notebook on neural networks

---
 docs/index.rst                  |   1 +
 notebooks/neural_networks.ipynb | 321 ++++++++++++++++++++++++++++++++
 2 files changed, 322 insertions(+)
 create mode 100644 notebooks/neural_networks.ipynb

diff --git a/docs/index.rst b/docs/index.rst
index 6d03c3a3..a4dcc249 100644
--- a/docs/index.rst
+++ b/docs/index.rst
@@ -6,6 +6,7 @@ sensAI - the Python library for sensible AI
    :glob:
 
    intro.ipynb
+   neural_networks.ipynb
    intro_old.ipynb
    tracking_experiments.ipynb
    tensor_models_pytorch_lightning.ipynb
diff --git a/notebooks/neural_networks.ipynb b/notebooks/neural_networks.ipynb
new file mode 100644
index 00000000..9d6fa278
--- /dev/null
+++ b/notebooks/neural_networks.ipynb
@@ -0,0 +1,321 @@
+{
+ "cells": [
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "import sys; sys.path.extend([\"../src\", \"..\"])\n",
+    "import sensai\n",
+    "import pandas as pd\n",
+    "import numpy as np\n",
+    "from typing import *\n",
+    "import config\n",
+    "\n",
+    "cfg = config.get_config()\n",
+    "sensai.util.logging.configureLogging()"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "# Neural Networks\n",
+    "\n",
+    "Neural networks being a very powerful class of models, especially in cases where the learning of representations from low-level information (such as pixels, audio samples or text) is key, sensAI provides many useful abstractions for dealing with this class of models, facilitating data handling, learning and evaluation.\n",
+    "\n",
+    "sensAI mainly provides abstractions for PyTorch, but there is also rudimentary support for TensorFlow.\n",
+    "\n",
+    "## Image Classification\n",
+    "\n",
+    "As an example use case, let us solve the classification problem of classifying digits in pixel images from the MNIST dataset. Images are greyscale (no colour information) and 28x28 pixels in size."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "mnistDF = pd.read_csv(cfg.datafile_path(\"mnist_train.csv.zip\"))"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "The data frame contains one column for every pixel, each pixel being represented by a 8-bit integer (0 to 255)."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "mnistDF.head(5)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "Let's create the I/O data for our experiments."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "mnistIoData = sensai.InputOutputData.fromDataFrame(mnistDF, \"label\")"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "Now that we have the image data separated from the labels, let's write a function to restore the 2D image array and take a look at some of the images."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "import matplotlib.pyplot as plt\n",
+    "\n",
+    "def reshape2DImage(series):\n",
+    "    return series.values.reshape(28, 28)\n",
+    "\n",
+    "fig, axs = plt.subplots(nrows=1, ncols=5, figsize=(10, 5))\n",
+    "for i in range(5):\n",
+    "    axs[i].imshow(reshape2DImage(mnistIoData.inputs.iloc[i]), cmap=\"binary\")"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "### Applying Predefined Models\n",
+    "\n"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "We create an evaluator in order to test the performance of our models, randomly splitting the data."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "evaluatorParams = sensai.evaluation.VectorClassificationModelEvaluatorParams(fractionalSplitTestFraction=0.2)\n",
+    "evalUtil = sensai.evaluation.ClassificationEvaluationUtil(mnistIoData, evaluatorParams=evaluatorParams)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "One pre-defined model we could try is a simple multi-layer perceptron. A PyTorch-based implementation is provided via class `sensai.torch.models.MultiLayerPerceptronVectorClassificationModel`. This implementation supports CUDA-accelerated computations (on Nvidia GPUs), but we shall stick to CPU-based computation in the following."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "import sensai.torch\n",
+    "\n",
+    "nnOptimiserParams = sensai.torch.NNOptimiserParams(earlyStoppingEpochs=10, batchSize=54)\n",
+    "torchMLPModel = sensai.torch.models.MultiLayerPerceptronVectorClassificationModel(hiddenDims=(50, 20), cuda=False,\n",
+    "        normalisationMode=sensai.torch.NormalisationMode.MAX_ALL, nnOptimiserParams=nnOptimiserParams, pDropout=0.0).withName(\"MLP\")\n"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "Neural networks work best on **normalised inputs**, so we have opted to apply basic normalisation by specifying a normalisation mode which will normalise by dividing by the maximum value found across all columns in the training data. For more elaborate normalisation options, we could have used a data frame transformer (DFT), particularly `DFTNormalisation` or `DFTSkLearnTransformer`.\n",
+    "\n",
+    "sensAI's default **neural network training algorithm** is based on early stopping, which involves checking, in regular intervals, the performance of the model on a validation set (which is split from the training set) and ultimately selecting the model that performed best on the validation set. You have full control over the loss evaluation method used to select the best model (by passing a respective `NNLossEvaluator` instance to NNOptimiserParams) as well as the method that is used to split the training set into the actual training set and the validation set (by adding a `DataFrameSplitter` to the model or using a custom `TorchDataSetProvider`).\n",
+    "\n",
+    "Given the vectorised nature of the dataset, we can apply any type of model which can accept the numeric inputs. Let's compare the above neural network against another pre-defined model."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "randomForestModel = sensai.sklearn.classification.SkLearnRandomForestVectorClassificationModel(min_samples_leaf=1, n_estimators=10) \\\n",
+    "    .withName(\"RandomForest\")\n",
+    "\n",
+    "evalUtil.compareModels([randomForestModel, torchMLPModel])"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "Both models perform reasonably well, and the random forest could reach the performance of the MLP by adding more trees."
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "### Creating a Custom CNN Model\n",
+    "\n",
+    "Given that this is an image recognition problem, it can be sensible to apply convolutional neural networks (CNNs), which can analyse smaller patches of the image in order to generate more high-level features from them.\n",
+    "\n",
+    "To define a custom neural network model that uses PyTorch, we need to implement a new model class. For classification and regression, sensAI provides the base classes `TorchVectorClassificationModel` and `TorchVectorRegressionModel` respectively. Ultimately, these classes will wrap an instance of `torch.nn.Module`, the base class for neural networks in PyTorch.\n",
+    "\n",
+    "In the following, we shall define a model which uses multiple convolutions, a max-pooling layer and a multi-layer perceptron at the end in order to produce the classification."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "import torch\n",
+    "\n",
+    "class CnnModel(sensai.torch.TorchVectorClassificationModel):\n",
+    "    def __init__(self, cuda: bool, kernelSize: int, numConv: int, poolingKernelSize: int, mlpHiddenDims: Sequence[int], \n",
+    "            nnOptimiserParams: sensai.torch.NNOptimiserParams, pDropout=0.0):\n",
+    "        self.cuda = cuda\n",
+    "        self.outputActivationFn = sensai.torch.ActivationFunction.LOG_SOFTMAX\n",
+    "        self.kernelSize = kernelSize\n",
+    "        self.numConv = numConv\n",
+    "        self.poolingKernelSize = poolingKernelSize\n",
+    "        self.mlpHiddenDims = mlpHiddenDims\n",
+    "        self.pDropout = pDropout\n",
+    "        super().__init__(sensai.torch.ClassificationOutputMode.forActivationFn(self.outputActivationFn),\n",
+    "            modelClass=self.VectorTorchModel, modelArgs=[self], nnOptimiserParams=nnOptimiserParams)\n",
+    "        self.withInputTensoriser(self.InputTensoriser())\n",
+    "\n",
+    "    class InputTensoriser(sensai.torch.RuleBasedTensoriser):\n",
+    "        def _tensorise(self, df: pd.DataFrame) -> Union[torch.Tensor, List[torch.Tensor]]:\n",
+    "            images = [reshape2DImage(row) for _, row in df.iterrows()]\n",
+    "            return torch.tensor(np.stack(images)).float() / 255\n",
+    "\n",
+    "    class VectorTorchModel(sensai.torch.VectorTorchModel):\n",
+    "        def __init__(self, vecModel: \"CnnModel\"):\n",
+    "            super().__init__(vecModel.cuda)\n",
+    "            self._vecModel = vecModel\n",
+    "\n",
+    "        def createTorchModuleForDims(self, inputDim: int, outputDim: int) -> torch.nn.Module:\n",
+    "            return self.Module(int(np.sqrt(inputDim)), outputDim, self._vecModel)\n",
+    "\n",
+    "        class Module(torch.nn.Module):\n",
+    "            def __init__(self, imageDim, outputDim, vecModel: \"CnnModel\"):\n",
+    "                super().__init__()\n",
+    "                k = vecModel.kernelSize\n",
+    "                p = vecModel.poolingKernelSize\n",
+    "                self.cnn = torch.nn.Conv2d(1, vecModel.numConv, (k, k))\n",
+    "                self.pool = torch.nn.MaxPool2d((p, p))\n",
+    "                self.dropout = torch.nn.Dropout(p=vecModel.pDropout)\n",
+    "                reducedDim = (imageDim-k+1)/p\n",
+    "                if int(reducedDim) != reducedDim:\n",
+    "                    raise ValueError(f\"Pooling kernel size {p} is not a divisor of post-convolution dimension {imageDim-k+1}\")\n",
+    "                self.mlp = sensai.torch.models.MultiLayerPerceptron(vecModel.numConv * int(reducedDim)**2, outputDim, vecModel.mlpHiddenDims,\n",
+    "                    outputActivationFn=vecModel.outputActivationFn.getTorchFunction(),\n",
+    "                    hidActivationFn=sensai.torch.ActivationFunction.RELU.getTorchFunction(),\n",
+    "                    pDropout=vecModel.pDropout)\n",
+    "\n",
+    "            def forward(self, x):\n",
+    "                x = self.cnn(x.unsqueeze(1))\n",
+    "                x = self.pool(x)\n",
+    "                x = x.view(x.shape[0], -1)\n",
+    "                x = self.dropout(x)\n",
+    "                return self.mlp(x)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "As you can see, very little code is required in addition to the actual torch module.\n",
+    "The outer class, which provides the sensAI `VectorModel` features, serves mainly to hold the parameters, and the inner class inheriting from `VectorTorchModel` serves a factory for the `torch.nn.Module`, providing us with the input and output dimensions (number of input columns and number of classes respectively). Because we take the dimensions directly from the input, this model could easily process other image sizes than 28x28 and we end up with fewer magic numbers in the code.\n",
+    "\n",
+    "The inner class `InputTensoriser`, which is instantiated and passed as the input tensoriser for the model, serves to convert the input data frame into a tensor. It could perform arbitrary computations in order to produce, from a data frame with N rows, one or more tensors of length N (first dimension equal to N) that will ultimately be fed to the neural network.\n",
+    "\n",
+    "Let's instantiate our model and see how it performs."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "nnOptimiserParams = sensai.torch.NNOptimiserParams(optimiser=sensai.torch.Optimiser.ADAMW, optimiserLR=0.01, batchSize=1024, \n",
+    "    earlyStoppingEpochs=3)\n",
+    "cnnModel = CnnModel(cuda=False, kernelSize=5, numConv=32, poolingKernelSize=2, mlpHiddenDims=(200,20),\n",
+    "    nnOptimiserParams=nnOptimiserParams).withName(\"CNN\")\n",
+    "\n",
+    "evalData = evalUtil.performSimpleEvaluation(cnnModel)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "The model does slightly improve upon the MLP model we evaluated earlier.\n",
+    "\n",
+    "Let's take a look at some examples where the model went wrong."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "misclassified = evalData.getMisclassifiedTriplesPredTrueInput()\n",
+    "fig, axs = plt.subplots(nrows=3, ncols=3, figsize=(9,9))\n",
+    "for i, (predClass, trueClass, input) in enumerate(misclassified[:9]):\n",
+    "    axs[i//3][i%3].imshow(reshape2DImage(input), cmap=\"binary\")\n",
+    "    axs[i//3][i%3].set_title(f\"{trueClass} misclassified as {predClass}\")\n",
+    "plt.tight_layout()"
+   ]
+  }
+ ],
+ "metadata": {
+  "interpreter": {
+   "hash": "9b3442ae4bdb9561e722e28424c33a03c16d40b3aa50369b79d367cad7b1adea"
+  },
+  "kernelspec": {
+   "display_name": "Python 3.8.13 ('sensai')",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.8.13"
+  },
+  "orig_nbformat": 4
+ },
+ "nbformat": 4,
+ "nbformat_minor": 2
+}

From 740524fe3e1b6144b9bac6123d77055e96bb87e9 Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Thu, 26 May 2022 18:53:07 +0200
Subject: [PATCH 072/131] Fixed spelling errors, minor improvements

---
 notebooks/neural_networks.ipynb | 44 ++++++++++++++++++++++++---------
 1 file changed, 33 insertions(+), 11 deletions(-)

diff --git a/notebooks/neural_networks.ipynb b/notebooks/neural_networks.ipynb
index 9d6fa278..5f27e802 100644
--- a/notebooks/neural_networks.ipynb
+++ b/notebooks/neural_networks.ipynb
@@ -45,7 +45,7 @@
    "cell_type": "markdown",
    "metadata": {},
    "source": [
-    "The data frame contains one column for every pixel, each pixel being represented by a 8-bit integer (0 to 255)."
+    "The data frame contains one column for every pixel, each pixel being represented by an 8-bit integer (0 to 255)."
    ]
   },
   {
@@ -77,7 +77,7 @@
    "cell_type": "markdown",
    "metadata": {},
    "source": [
-    "Now that we have the image data separated from the labels, let's write a function to restore the 2D image array and take a look at some of the images."
+    "Now that we have the image data separated from the labels, let's write a function to restore the 2D image arrays and take a look at some of the images."
    ]
   },
   {
@@ -125,7 +125,7 @@
    "cell_type": "markdown",
    "metadata": {},
    "source": [
-    "One pre-defined model we could try is a simple multi-layer perceptron. A PyTorch-based implementation is provided via class `sensai.torch.models.MultiLayerPerceptronVectorClassificationModel`. This implementation supports CUDA-accelerated computations (on Nvidia GPUs), but we shall stick to CPU-based computation in the following."
+    "One pre-defined model we could try is a simple multi-layer perceptron. A PyTorch-based implementation is provided via class `MultiLayerPerceptronVectorClassificationModel`. This implementation supports CUDA-accelerated computations (on Nvidia GPUs), yet we shall stick to CPU-based computation (cuda=False) in this tutorial."
    ]
   },
   {
@@ -145,11 +145,11 @@
    "cell_type": "markdown",
    "metadata": {},
    "source": [
-    "Neural networks work best on **normalised inputs**, so we have opted to apply basic normalisation by specifying a normalisation mode which will normalise by dividing by the maximum value found across all columns in the training data. For more elaborate normalisation options, we could have used a data frame transformer (DFT), particularly `DFTNormalisation` or `DFTSkLearnTransformer`.\n",
+    "Neural networks work best on **normalised inputs**, so we have opted to apply basic normalisation by specifying a normalisation mode which will transform inputs by dividing by the maximum value found across all columns in the training data. For more elaborate normalisation options, we could have used a data frame transformer (DFT), particularly `DFTNormalisation` or `DFTSkLearnTransformer`.\n",
     "\n",
     "sensAI's default **neural network training algorithm** is based on early stopping, which involves checking, in regular intervals, the performance of the model on a validation set (which is split from the training set) and ultimately selecting the model that performed best on the validation set. You have full control over the loss evaluation method used to select the best model (by passing a respective `NNLossEvaluator` instance to NNOptimiserParams) as well as the method that is used to split the training set into the actual training set and the validation set (by adding a `DataFrameSplitter` to the model or using a custom `TorchDataSetProvider`).\n",
     "\n",
-    "Given the vectorised nature of the dataset, we can apply any type of model which can accept the numeric inputs. Let's compare the above neural network against another pre-defined model."
+    "Given the vectorised nature of our MNIST dataset, we can apply any type of model which can accept the numeric inputs. Let's compare the neural network we defined above against another pre-defined model, which is based on a scikit-learn implementation and uses decision trees rather than neural networks."
    ]
   },
   {
@@ -168,7 +168,7 @@
    "cell_type": "markdown",
    "metadata": {},
    "source": [
-    "Both models perform reasonably well, and the random forest could reach the performance of the MLP by adding more trees."
+    "Both models perform reasonably well."
    ]
   },
   {
@@ -247,8 +247,8 @@
    "cell_type": "markdown",
    "metadata": {},
    "source": [
-    "As you can see, very little code is required in addition to the actual torch module.\n",
-    "The outer class, which provides the sensAI `VectorModel` features, serves mainly to hold the parameters, and the inner class inheriting from `VectorTorchModel` serves a factory for the `torch.nn.Module`, providing us with the input and output dimensions (number of input columns and number of classes respectively). Because we take the dimensions directly from the input, this model could easily process other image sizes than 28x28 and we end up with fewer magic numbers in the code.\n",
+    "Very little code is required in addition to the actual torch module.\n",
+    "The outer class, which provides the sensAI `VectorModel` features, serves mainly to hold the parameters, and the inner class inheriting from `VectorTorchModel` serves as a factory for the `torch.nn.Module`, providing us with the input and output dimensions (number of input columns and number of classes respectively) based on the data. Because we take the dimensions directly from the input, this model could easily process other image sizes than 28x28 and we furthermore end up with fewer magic numbers in the code.\n",
     "\n",
     "The inner class `InputTensoriser`, which is instantiated and passed as the input tensoriser for the model, serves to convert the input data frame into a tensor. It could perform arbitrary computations in order to produce, from a data frame with N rows, one or more tensors of length N (first dimension equal to N) that will ultimately be fed to the neural network.\n",
     "\n",
@@ -273,9 +273,24 @@
    "cell_type": "markdown",
    "metadata": {},
    "source": [
-    "The model does slightly improve upon the MLP model we evaluated earlier.\n",
-    "\n",
-    "Let's take a look at some examples where the model went wrong."
+    "The model does slightly improve upon the MLP model we evaluated earlier."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "comparisonData = evalUtil.compareModels([torchMLPModel, cnnModel, randomForestModel], fitModels=False)\n",
+    "comparisonData.resultsDF"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "Could the CNN model have produced even better results? Let's take a look at some examples where the CNN model went wrong."
    ]
   },
   {
@@ -291,6 +306,13 @@
     "    axs[i//3][i%3].set_title(f\"{trueClass} misclassified as {predClass}\")\n",
     "plt.tight_layout()"
    ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "While some of these examples are indeed ambiguous, there still is room for improvement."
+   ]
   }
  ],
  "metadata": {

From 71ba15761d030c0820c5a519bb8ef8b21e8b878a Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Thu, 26 May 2022 21:51:33 +0200
Subject: [PATCH 073/131] Fixed deprecation warning concerning pandas append
 function

---
 .../geopandas/coordinate_clustering.py             | 14 ++++++++------
 1 file changed, 8 insertions(+), 6 deletions(-)

diff --git a/src/sensai/geoanalytics/geopandas/coordinate_clustering.py b/src/sensai/geoanalytics/geopandas/coordinate_clustering.py
index 88f901b4..7a877396 100644
--- a/src/sensai/geoanalytics/geopandas/coordinate_clustering.py
+++ b/src/sensai/geoanalytics/geopandas/coordinate_clustering.py
@@ -1,14 +1,16 @@
-import geopandas as gp
 import logging
+from typing import Callable, Union, Iterable
+
+import geopandas as gp
 import numpy as np
+import pandas as pd
 from shapely.geometry import MultiPoint
-from typing import Callable, Union, Iterable
 
-from ...clustering.clustering_base import EuclideanClusterer
+from .coordinates import validateCoordinates, extractCoordinatesArray, TCoordinates, GeoDataFrameWrapper
 from ...clustering import SkLearnEuclideanClusterer
+from ...clustering.clustering_base import EuclideanClusterer
 from ...clustering.sklearn_clustering import SkLearnClustererProtocol
 from ...util.cache import LoadSaveInterface
-from .coordinates import validateCoordinates, extractCoordinatesArray, TCoordinates, GeoDataFrameWrapper
 from ...util.profiling import timed
 
 log = logging.getLogger(__name__)
@@ -114,9 +116,9 @@ def toGeoDF(self, condition: Callable[[Cluster], bool] = None, crs='epsg:3857',
         geodf.crs = crs
         # TODO or not TODO: parallelize this or improve performance some another way
         for cluster in self.clusters(condition):
-            geodf = geodf.append(cluster.toGeoDF(crs=crs))
+            geodf = pd.concat((geodf, cluster.toGeoDF(crs=crs)))
         if includeNoise:
-            geodf = geodf.append(self.noiseCluster().toGeoDF(crs=crs))
+            geodf = pd.concat((geodf, self.noiseCluster().toGeoDF(crs=crs)))
         return geodf
 
     def plot(self, includeNoise=False, condition=None, **kwargs):

From b54496eae01d9987db68cbcadd257c13fe893101 Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Thu, 26 May 2022 21:53:12 +0200
Subject: [PATCH 074/131] Updated to reflect class name changes, improved text,
 changed preamble to support VSCode

---
 notebooks/coordinate_clustering.ipynb | 172 +++++++++++++-------------
 1 file changed, 87 insertions(+), 85 deletions(-)

diff --git a/notebooks/coordinate_clustering.ipynb b/notebooks/coordinate_clustering.ipynb
index cc9ee369..6cd5843e 100644
--- a/notebooks/coordinate_clustering.ipynb
+++ b/notebooks/coordinate_clustering.ipynb
@@ -1,50 +1,45 @@
 {
  "cells": [
   {
-   "cell_type": "markdown",
-   "metadata": {
-    "pycharm": {
-     "name": "#%% md\n"
-    }
-   },
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
    "source": [
-    "# The Coordinate Clustering Module\n",
-    "\n",
-    "On top of support for different clustering algorithms, sensAI provides useful methods specific to\n",
-    "clustering of geospatial data. They include utilities for wrangling geometrical data, spanning trees and for persisting and\n",
-    "visualizing the results. It seamlessly interoperates with geopandas and shapely.\n",
-    "This notebook gives an overview of the coordinate clustering's main functions\n",
-    "\n",
-    "\n",
-    "## Before running the notebook\n",
-    "\n",
-    "Install the library and its dependencies with, if you haven't done so already\n",
-    "```\n",
-    "pip install -e .\n",
-    "```\n",
-    "from the root directory. You can also execute this command directly in the notebook but will need to reload the\n",
-    "kernel afterwards"
+    "%load_ext autoreload\n",
+    "%autoreload 2"
    ]
   },
   {
    "cell_type": "code",
    "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "import sys; sys.path.extend([\"../src\", \"..\"])\n",
+    "import os\n",
+    "import config\n",
+    "import sensai\n",
+    "import logging\n",
+    "\n",
+    "c = config.get_config(reload=True)\n",
+    "sensai.util.logging.configureLogging(level=logging.INFO)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
    "metadata": {
     "pycharm": {
-     "name": "#%%\n"
+     "name": "#%% md\n"
     }
    },
-   "outputs": [],
    "source": [
-    "# Note - this cell should be executed only once per session\n",
-    "%load_ext autoreload\n",
-    "%autoreload 2\n",
-    "\n",
-    "import sys, os\n",
+    "# Coordinate Clustering\n",
     "\n",
-    "# in order to get the config, it is not part of the library\n",
-    "os.chdir(\"..\")\n",
-    "sys.path.append(os.path.abspath(\".\"))"
+    "On top of support for different clustering algorithms, sensAI provides useful methods specific to\n",
+    "clustering of geospatial data. They include utilities for wrangling geometrical data, spanning trees and for persisting and\n",
+    "visualizing the results. It seamlessly interoperates with geopandas and shapely.\n",
+    "This notebook gives an overview of the coordinate clustering's main functions."
    ]
   },
   {
@@ -57,7 +52,6 @@
    },
    "outputs": [],
    "source": [
-    "import os\n",
     "import geopandas as gp\n",
     "from pprint import pprint\n",
     "import numpy as np\n",
@@ -67,11 +61,7 @@
     "import logging\n",
     "from sensai.geoanalytics.geopandas.graph import CoordinateSpanningTree\n",
     "from sensai.geoanalytics.geopandas.coordinate_clustering import SkLearnCoordinateClustering\n",
-    "from sensai.geoanalytics.geopandas.geometry import alphaShape\n",
-    "from config import get_config\n",
-    "\n",
-    "logging.basicConfig(level=logging.INFO)\n",
-    "c = get_config(reload=True)"
+    "from sensai.geoanalytics.geopandas.geometry import alphaShape"
    ]
   },
   {
@@ -82,7 +72,7 @@
     }
    },
    "source": [
-    "## Loading and Fitting"
+    "## Loading Data and Fitting a Clusterer"
    ]
   },
   {
@@ -93,9 +83,9 @@
     }
    },
    "source": [
-    "The library contains utils for loading coordinates from files and for wrapping arbitrary scikit-learn compatible\n",
-    "clustering algorithms. Custom clustering algorithms can be implemented easily buy inheriting from the baseclass\n",
-    "`ClusteringModel`\n"
+    "The library contains utilities for loading coordinates from files and for wrapping arbitrary scikit-learn-compatible\n",
+    "clustering algorithms. Custom clustering algorithms can be implemented by inheriting from the base class\n",
+    "`EuclideanClusterer`."
    ]
   },
   {
@@ -110,6 +100,15 @@
    "source": [
     "sampleFile = c.datafile_path(\"sample\", stage=c.RAW) # this can point to a directory or a shp/geojson file\n",
     "sampleGeoDF = gp.read_file(sampleFile)\n",
+    "sampleGeoDF"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
     "dbscan = SkLearnCoordinateClustering(DBSCAN(eps=150, min_samples=20))\n",
     "dbscan.fit(sampleGeoDF)"
    ]
@@ -122,8 +121,8 @@
     }
    },
    "source": [
-    "The resulting `CoordinateClusteringAlgorithm` instance has many useful methods.\n",
-    "You can retrieve clusters individually or via a generator. The noise cluster can be accessed individually"
+    "The instance has many useful methods.\n",
+    "You can retrieve clusters individually or via a generator. The noise cluster can be accessed individually."
    ]
   },
   {
@@ -162,8 +161,8 @@
     }
    },
    "source": [
-    "From the dbscan single clusters which are instances of `CoordinateClusteringAlgorithm.Cluster` \n",
-    "can be retrieved and visualized. Most objects, including the dbscan itself, have an inbuilt plot method"
+    "From the instance, individual clusters, which are instances of `EuclideanClusterer.Cluster`,\n",
+    "can be retrieved and visualized. Most objects, including the clusterer itself, have a built-in plot method."
    ]
   },
   {
@@ -187,7 +186,7 @@
     }
    },
    "source": [
-    "We can condition before plotting as well as pass custom arguments"
+    "We can apply a condition to the clusters to be plotted and pass additional arguments affecting the display."
    ]
   },
   {
@@ -211,9 +210,9 @@
     }
    },
    "source": [
-    "### Properties of a single cluster\n",
+    "### Properties of Individual Clusters\n",
     "\n",
-    "Single clusters can be plotted too"
+    "Individual clusters can be plotted, too."
    ]
   },
   {
@@ -258,87 +257,87 @@
   },
   {
    "cell_type": "markdown",
-   "source": [
-    "A single cluster is just a wrapper around its coordinates. They can be\n",
-    "retrieved either as a numpy array, a geodataframe or a MultiPoint object.\n",
-    "The latter is useful for geometric operations, e.g. computing hulls"
-   ],
    "metadata": {
     "collapsed": false,
     "pycharm": {
      "name": "#%% md\n"
     }
-   }
+   },
+   "source": [
+    "A single cluster is just a wrapper around its coordinates. They can be\n",
+    "retrieved either as a numpy array, a geodataframe or a MultiPoint object.\n",
+    "The latter is useful for geometric operations, e.g. computing hulls."
+   ]
   },
   {
    "cell_type": "code",
    "execution_count": null,
-   "outputs": [],
-   "source": [
-    "clusterMultipoint = sampleCluster.asMultipoint()\n",
-    "clusterMultipoint.convex_hull"
-   ],
    "metadata": {
     "collapsed": false,
     "pycharm": {
      "name": "#%%\n"
     }
-   }
+   },
+   "outputs": [],
+   "source": [
+    "clusterMultipoint = sampleCluster.asMultipoint()\n",
+    "clusterMultipoint.convex_hull"
+   ]
   },
   {
    "cell_type": "code",
    "execution_count": null,
-   "outputs": [],
-   "source": [
-    "# we also provide a utility for computing alpha shapes for such objects\n",
-    "\n",
-    "alphaShape(clusterMultipoint)"
-   ],
    "metadata": {
     "collapsed": false,
     "pycharm": {
      "name": "#%%\n"
     }
-   }
+   },
+   "outputs": [],
+   "source": [
+    "# we also provide a utility for computing alpha shapes for such objects\n",
+    "\n",
+    "alphaShape(clusterMultipoint)"
+   ]
   },
   {
    "cell_type": "markdown",
-   "source": [
-    "sensAI also provides utilities for computing trees, e.g. here for the minimal spanning tree"
-   ],
    "metadata": {
     "collapsed": false,
     "pycharm": {
      "name": "#%% md\n"
     }
-   }
+   },
+   "source": [
+    "sensAI also provides utilities for computing trees, e.g. here for the minimum spanning tree."
+   ]
   },
   {
    "cell_type": "code",
    "execution_count": null,
-   "outputs": [],
-   "source": [
-    "sampleTree = CoordinateSpanningTree(sampleCluster)\n",
-    "sampleTree.plot()"
-   ],
    "metadata": {
     "collapsed": false,
     "pycharm": {
      "name": "#%%\n"
     }
-   }
+   },
+   "outputs": [],
+   "source": [
+    "sampleTree = CoordinateSpanningTree(sampleCluster)\n",
+    "sampleTree.plot()"
+   ]
   },
   {
    "cell_type": "markdown",
-   "source": [
-    "Most objects provide a way for extracting a summary from them, either as a dict or as a data frame"
-   ],
    "metadata": {
     "collapsed": false,
     "pycharm": {
      "name": "#%% md\n"
     }
-   }
+   },
+   "source": [
+    "Most objects provide a way to extract a summary from them, either as a dict or as a data frame."
+   ]
   },
   {
    "cell_type": "code",
@@ -469,8 +468,11 @@
   }
  ],
  "metadata": {
+  "interpreter": {
+   "hash": "9b3442ae4bdb9561e722e28424c33a03c16d40b3aa50369b79d367cad7b1adea"
+  },
   "kernelspec": {
-   "display_name": "Python 3",
+   "display_name": "Python 3.8.13 ('sensai')",
    "language": "python",
    "name": "python3"
   },
@@ -484,9 +486,9 @@
    "name": "python",
    "nbconvert_exporter": "python",
    "pygments_lexer": "ipython3",
-   "version": "3.8.2"
+   "version": "3.8.13"
   }
  },
  "nbformat": 4,
  "nbformat_minor": 4
-}
\ No newline at end of file
+}

From 6d15ba851caffd7901588391cf527124b16cc57c Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Thu, 26 May 2022 22:37:37 +0200
Subject: [PATCH 075/131] Improved text & structure, changed preamble

---
 notebooks/clustering_evaluation.ipynb | 177 ++++++++++++++------------
 1 file changed, 94 insertions(+), 83 deletions(-)

diff --git a/notebooks/clustering_evaluation.ipynb b/notebooks/clustering_evaluation.ipynb
index 2b718151..ca9ec965 100644
--- a/notebooks/clustering_evaluation.ipynb
+++ b/notebooks/clustering_evaluation.ipynb
@@ -1,50 +1,44 @@
 {
  "cells": [
   {
-   "cell_type": "markdown",
-   "metadata": {
-    "collapsed": true,
-    "pycharm": {
-     "name": "#%% md\n"
-    }
-   },
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
    "source": [
-    "# Evaluating clustering algorithms\n",
-    "\n",
-    "The present library contains utilities for evaluating different clustering algorithms\n",
-    "(with or without ground truth labels). On top of the evaluation utilities there are classes for\n",
-    "performing parameters sweeps and model selection. Here we give an overview of the most important functionality\n",
-    "\n",
-    "\n",
-    "## Before running the notebook\n",
-    "\n",
-    "Install the library and its dependencies with, if you haven't done so already\n",
-    "```\n",
-    "pip install -e .\n",
-    "```\n",
-    "from the root directory. You can also execute this command directly in the notebook but will need to reload the\n",
-    "kernel afterwards"
+    "%load_ext autoreload\n",
+    "%autoreload 2"
    ]
   },
   {
    "cell_type": "code",
    "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "import sys; sys.path.extend([\"../src\", \"..\"])\n",
+    "import sensai\n",
+    "import logging\n",
+    "import config\n",
+    "\n",
+    "cfg = config.get_config(reload=True)\n",
+    "sensai.util.logging.configureLogging(level=logging.INFO)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
    "metadata": {
+    "collapsed": true,
     "pycharm": {
-     "name": "#%%\n"
+     "name": "#%% md\n"
     }
    },
-   "outputs": [],
    "source": [
-    "# Note - this cell should be executed only once per session\n",
-    "%load_ext autoreload\n",
-    "%autoreload 2\n",
-    "\n",
-    "import sys, os\n",
+    "# Evaluating Clustering Algorithms\n",
     "\n",
-    "# in order to get the config, it is not part of the library\n",
-    "os.chdir(\"..\")\n",
-    "sys.path.append(os.path.abspath(\".\"))"
+    "The present library contains utilities for evaluating different clustering algorithms\n",
+    "(with or without ground truth labels). On top of the evaluation utilities there are classes for\n",
+    "performing parameter sweeps and model selection. Here we give an overview of the most important functionality."
    ]
   },
   {
@@ -63,6 +57,7 @@
     "from sklearn.cluster import DBSCAN\n",
     "import seaborn as sns\n",
     "import geopandas as gp\n",
+    "import pandas as pd\n",
     "import matplotlib.pyplot as plt\n",
     "import logging\n",
     "\n",
@@ -72,11 +67,7 @@
     "    ClusteringModelUnsupervisedEvaluator\n",
     "from sensai.evaluation.eval_stats import ClusteringUnsupervisedEvalStats, ClusteringSupervisedEvalStats, \\\n",
     "    AdjustedMutualInfoScore\n",
-    "from sensai.geoanalytics.geopandas.coordinate_clustering_ground_truth import PolygonAnnotatedCoordinates\n",
-    "\n",
-    "from config import get_config\n",
-    "\n",
-    "logging.basicConfig(level=logging.INFO)"
+    "from sensai.geoanalytics.geopandas.coordinate_clustering_ground_truth import PolygonAnnotatedCoordinates"
    ]
   },
   {
@@ -89,9 +80,8 @@
    },
    "outputs": [],
    "source": [
-    "# loading data and config\n",
-    "c  = get_config(reload=True)\n",
-    "sampleFile = c.datafile_path(\"sample\", stage=c.RAW) # this can point to a directory or a shp/geojson file\n",
+    "# loading data \n",
+    "sampleFile = cfg.datafile_path(\"sample\", stage=cfg.RAW) # this can point to a directory or a shp/geojson file\n",
     "coordinatesDF = gp.read_file(sampleFile)"
    ]
   },
@@ -103,7 +93,7 @@
     }
    },
    "source": [
-    "## Evaluating a single model\n",
+    "## Evaluating a Single Model\n",
     "\n",
     "For a single model that was already fitted, evaluation statistics can be extracted with `ClusteringEvalStats`, see the\n",
     "example below (the eval_stats object can also be used to retrieve evaluation results one by one)\n"
@@ -121,8 +111,11 @@
    "source": [
     "dbscan = SkLearnCoordinateClustering(DBSCAN(eps=150, min_samples=20))\n",
     "dbscan.fit(coordinatesDF)\n",
+    "\n",
     "evalStats = ClusteringUnsupervisedEvalStats.fromModel(dbscan)\n",
+    "\n",
     "pprint(evalStats.getAll())\n",
+    "\n",
     "plt.hist(evalStats.clusterSizeDistribution)\n",
     "plt.show()"
    ]
@@ -135,13 +128,13 @@
     }
    },
    "source": [
-    "## Model selection\n",
+    "## Unsupervised Model Selection\n",
     "\n",
     "For model selection we need to compare different (or differently parametrized) models that were\n",
     "trained on the same dataset. The `ClusteringEvaluator` abstraction was designed with this goal in mind.\n",
     "The evaluator can be used to obtain evaluation statistics for different models that are guaranteed\n",
-    "to be comparable with each other (always computed by the same object in the same way). Here an example evaluating\n",
-    "a dbscan performance on metrics that don't necessitate ground truth labels"
+    "to be comparable with each other (always computed by the same object in the same way). Here is an example evaluating\n",
+    "DBSCAN's performance on metrics that don't necessitate ground truth labels."
    ]
   },
   {
@@ -182,8 +175,8 @@
    },
    "source": [
     "One of the main purposes of evaluators is to be used within classes that perform a parameter sweep, e.g.\n",
-    "a `GridSearch`. All such objects return a data frame and (optionally but recommended!) persist all evaluation results\n",
-    "in a csv."
+    "a `GridSearch`. All such objects return a data frame and (optionally) persist all evaluation results\n",
+    "in a CSV file."
    ]
   },
   {
@@ -206,7 +199,7 @@
     "def dbscanFactory(**kwargs):\n",
     "    return SkLearnCoordinateClustering(DBSCAN(**kwargs))\n",
     "\n",
-    "dbscanGridSearch = GridSearch(dbscanFactory, parameterOptions, csvResultsPath=os.path.join(c.temp, \"dbscanGridSearchCsv\"))"
+    "dbscanGridSearch = GridSearch(dbscanFactory, parameterOptions, csvResultsPath=os.path.join(cfg.temp, \"dbscanGridSearchCsv\"))"
    ]
   },
   {
@@ -219,7 +212,7 @@
    },
    "outputs": [],
    "source": [
-    "# the results of the grid-search are saved as csv under the path provided above\n",
+    "# the results of the grid-search are saved as a CSV file under the path provided above\n",
     "resultDf = dbscanGridSearch.run(modelEvaluator, sortColumnName=\"numClusters\", ascending=False)\n",
     "resultDf.head()"
    ]
@@ -292,7 +285,9 @@
     }
    },
    "source": [
-    "## Dealing with ground truth labels\n",
+    "## Supervised Model Selection\n",
+    "\n",
+    "### Obtaining Ground Truth Labels\n",
     "\n",
     "\n",
     "The evaluation classes can take ground truth labels for all coordinates and use them for calculating related metrics.\n",
@@ -313,7 +308,7 @@
    "outputs": [],
    "source": [
     "# The polygons can be read directly from a file, see the documentation for more details\n",
-    "groundTruthClusters = PolygonAnnotatedCoordinates(coordinatesDF, c.datafile_path(\"sample\", stage=c.GROUND_TRUTH))"
+    "groundTruthClusters = PolygonAnnotatedCoordinates(coordinatesDF, cfg.datafile_path(\"sample\", stage=cfg.GROUND_TRUTH))"
    ]
   },
   {
@@ -344,6 +339,13 @@
     "groundTruthClusters.toGeoDF().head()"
    ]
   },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "### Supervised Evaluation Metrics"
+   ]
+  },
   {
    "cell_type": "markdown",
    "metadata": {
@@ -352,9 +354,9 @@
     }
    },
    "source": [
-    "We can extract the coordinates and labels for the annotated region and use them in evaluation. In the following\n",
-    "we will train our own adaption of DBSCAN, namely `boundedDBSCAN` on datapoints in the ground truth region and\n",
-    "evaluate the results against the true labels"
+    "We can extract the coordinates and labels for the annotated region and use them in evaluation. In the following,\n",
+    "we will evaluate a slight adaptation of DBSCAN which uses an additional bound, i.e. it will ultimately reject clusters that do not reach a minimum size.\n",
+    "We will train it on datapoints in the ground truth region and evaluate the results against the true labels."
    ]
   },
   {
@@ -368,7 +370,9 @@
    "outputs": [],
    "source": [
     "boundedDbscan = SkLearnCoordinateClustering(DBSCAN(eps=150, min_samples=20), minClusterSize=100)\n",
+    "\n",
     "groundTruthCoordinates, groundTruthLabels = groundTruthClusters.getCoordinatesLabels()\n",
+    "\n",
     "supervisedEvaluator = ClusteringModelSupervisedEvaluator(groundTruthCoordinates, trueLabels=groundTruthLabels)\n",
     "supervisedEvalStats = supervisedEvaluator.evalModel(boundedDbscan)\n",
     "\n",
@@ -376,6 +380,20 @@
     "pprint(supervisedEvalStats.getAll())"
    ]
   },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "### Comparing Unsupervised Evaluation Metrics"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "It can also be instructive to compare the unsupervised evaluation metrics of the model's clustering with those of the ground truth labels."
+   ]
+  },
   {
    "cell_type": "code",
    "execution_count": null,
@@ -386,11 +404,11 @@
    },
    "outputs": [],
    "source": [
-    "print(\"Unsupervised evaluation metrics of bounded dbscan:\")\n",
-    "pprint(ClusteringUnsupervisedEvalStats(groundTruthCoordinates, groundTruthLabels).getAll())\n",
-    "print(\"\")\n",
-    "print(\"Unsupervised evaluation metrics of annotated data\")\n",
-    "pprint(ClusteringUnsupervisedEvalStats.fromModel(boundedDbscan).getAll())"
+    "groundTruthUnsupervisedMetrics = ClusteringUnsupervisedEvalStats(groundTruthCoordinates, groundTruthLabels).metricsDict()\n",
+    "boundedDbscanUnsupervisedMetrics = ClusteringUnsupervisedEvalStats.fromModel(boundedDbscan).metricsDict()\n",
+    "\n",
+    "pd.DataFrame({\"bounded DBSCAN\": boundedDbscanUnsupervisedMetrics, \"ground truth\": groundTruthUnsupervisedMetrics}, \n",
+    "    index=groundTruthUnsupervisedMetrics.keys())"
    ]
   },
   {
@@ -401,9 +419,9 @@
     }
    },
    "source": [
-    "The bounded dbscan is performing quite OK with the given parameters, although we see that it segregates clusters too\n",
+    "The bounded DBSCAN is already performing quite well with the given parameters, although we see that it segregates clusters too\n",
     "much and has a general tendency towards smaller clusters. These tendencies can be seen visually by comparing the ground\n",
-    "truth and the bounded dbscan cluster plots"
+    "truth and the bounded DBSCAN cluster plots."
    ]
   },
   {
@@ -429,10 +447,10 @@
     }
    },
    "source": [
-    "## Supervised parameter estimation\n",
+    "### Parameter Search\n",
     "\n",
     "We can now bring everything together by running a grid search and evaluating against ground truth. Very little code\n",
-    "is needed for that, so we will write it entirely in the cell below"
+    "is needed for that:"
    ]
   },
   {
@@ -451,22 +469,9 @@
     "}\n",
     "\n",
     "supervisedGridSearch = GridSearch(dbscanFactory, parameterOptions,\n",
-    "                                           csvResultsPath=os.path.join(c.temp, \"bounded_dbscan_grid_search.csv\"))"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {
-    "pycharm": {
-     "name": "#%%\n"
-    }
-   },
-   "outputs": [],
-   "source": [
-    "# we will sort the results by mutual information store\n",
+    "    csvResultsPath=os.path.join(cfg.temp, \"bounded_dbscan_grid_search.csv\"))\n",
     "supervisedResultDf = supervisedGridSearch.run(supervisedEvaluator, sortColumnName=AdjustedMutualInfoScore.name,\n",
-    "                                              ascending=False)\n",
+    "    ascending=False)\n",
     "supervisedResultDf"
    ]
   },
@@ -478,15 +483,21 @@
     }
    },
    "source": [
-    "It seems like we were lucky to already have picked the optimal parameters for the dbscan above.\n",
-    "It is also interesting to notice that the supervised scores are in\n",
-    "stark disagreement with the unsupervised ones"
+    "According to the adjusted mutual information score, we have now found a new parameter combination (see rightmost columns of first row) which yields results even closer to the ground truth."
    ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": []
   }
  ],
  "metadata": {
+  "interpreter": {
+   "hash": "9b3442ae4bdb9561e722e28424c33a03c16d40b3aa50369b79d367cad7b1adea"
+  },
   "kernelspec": {
-   "display_name": "Python 3",
+   "display_name": "Python 3.8.13 ('sensai')",
    "language": "python",
    "name": "python3"
   },
@@ -500,9 +511,9 @@
    "name": "python",
    "nbconvert_exporter": "python",
    "pygments_lexer": "ipython3",
-   "version": "3.7.7"
+   "version": "3.8.13"
   }
  },
  "nbformat": 4,
  "nbformat_minor": 1
-}
\ No newline at end of file
+}

From a9de9807f6a1679877d088e8f6edda1264ee09f0 Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Thu, 26 May 2022 23:26:39 +0200
Subject: [PATCH 076/131] Improved exception message

---
 src/sensai/evaluation/evaluator.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/src/sensai/evaluation/evaluator.py b/src/sensai/evaluation/evaluator.py
index d0e6859f..a2f81490 100644
--- a/src/sensai/evaluation/evaluator.py
+++ b/src/sensai/evaluation/evaluator.py
@@ -241,10 +241,10 @@ def fromDictOrInstance(cls, params: Optional[Union[Dict[str, Any], "VectorRegres
             return VectorRegressionModelEvaluatorParams()
         elif type(params) == dict:
             return cls.fromOldKwArgs(**params)
-        elif isinstance(params, VectorRegressionModelEvaluatorParams):
+        elif isinstance(params, cls):
             return params
         else:
-            raise ValueError(f"Must provide dictionary or instance, got {params}")
+            raise ValueError(f"Must provide dictionary or {cls} instance, got {params}, type {type(params)}")
 
     @classmethod
     def fromOldKwArgs(cls, dataSplitter=None, testFraction=None, randomSeed=42, shuffle=True, additionalMetrics: Sequence[RegressionMetric] = None,

From 384d06a5329d5c3d5af5b78994483f7627cf8371 Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Thu, 26 May 2022 23:27:15 +0200
Subject: [PATCH 077/131] EvaluationUtil: Support tracked experiments

---
 src/sensai/evaluation/eval_util.py | 12 ++++++++++--
 1 file changed, 10 insertions(+), 2 deletions(-)

diff --git a/src/sensai/evaluation/eval_util.py b/src/sensai/evaluation/eval_util.py
index 95d93050..73292156 100644
--- a/src/sensai/evaluation/eval_util.py
+++ b/src/sensai/evaluation/eval_util.py
@@ -33,6 +33,7 @@
     VectorRegressionModelEvaluatorParams, VectorClassificationModelEvaluatorParams, VectorModelEvaluatorParams
 from ..data import InputOutputData
 from ..feature_importance import AggregatedFeatureImportances, FeatureImportanceProvider
+from ..tracking import TrackedExperiment
 from ..util.io import ResultWriter
 from ..util.plot import MATPLOTLIB_DEFAULT_FIGURE_SIZE
 from ..util.string import prettyStringRepr
@@ -242,11 +243,14 @@ def createCrossValidator(self, model: TModel = None, isRegression: bool = None)
         return createVectorModelCrossValidator(self.inputOutputData, model=model, isRegression=isRegression, params=self.crossValidatorParams)
 
     def performSimpleEvaluation(self, model: TModel, createPlots=True, showPlots=False, logResults=True, resultWriter: ResultWriter = None,
-            additionalEvaluationOnTrainingData=False, fitModel=True, writeEvalStats=False) -> TEvalData:
+            additionalEvaluationOnTrainingData=False, fitModel=True, writeEvalStats=False,
+            trackedExperiment: TrackedExperiment = None) -> TEvalData:
         if showPlots and not createPlots:
             raise ValueError("showPlots=True requires createPlots=True")
         resultWriter = self._resultWriterForModel(resultWriter, model)
         evaluator = self.createEvaluator(model)
+        if trackedExperiment is not None:
+            evaluator.setTrackedExperiment(trackedExperiment)
         log.info(f"Evaluating {model} via {evaluator}")
         if fitModel:
             evaluator.fitModel(model)
@@ -282,7 +286,8 @@ def _resultWriterForModel(resultWriter: Optional[ResultWriter], model: TModel) -
             return None
         return resultWriter.childWithAddedPrefix(model.getName() + "-")
 
-    def performCrossValidation(self, model: TModel, showPlots=False, logResults=True, resultWriter: Optional[ResultWriter] = None) -> TCrossValData:
+    def performCrossValidation(self, model: TModel, showPlots=False, logResults=True, resultWriter: Optional[ResultWriter] = None,
+            trackedExperiment: TrackedExperiment = None) -> TCrossValData:
         """
         Evaluates the given model via cross-validation
 
@@ -291,10 +296,13 @@ def performCrossValidation(self, model: TModel, showPlots=False, logResults=True
         :param logResults: whether to log evaluation results
         :param resultWriter: a writer with which to store text files and plots. The evaluated model's name is added to each filename
             automatically
+        :param trackedExperiment: a tracked experiment with which results shall be associated
         :return: cross-validation result data
         """
         resultWriter = self._resultWriterForModel(resultWriter, model)
         crossValidator = self.createCrossValidator(model)
+        if trackedExperiment is not None:
+            crossValidator.setTrackedExperiment(trackedExperiment)
         crossValidationData = crossValidator.evalModel(model)
         aggStatsByVar = {varName: crossValidationData.getEvalStatsCollection(predictedVarName=varName).aggMetricsDict()
                 for varName in crossValidationData.predictedVarNames}

From 40b66fe3c75050fb9623313a5e491e2ac2f28007 Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Thu, 26 May 2022 23:27:45 +0200
Subject: [PATCH 078/131] Changed title and improved heading structure, updated
 evaluation part and removed sections already covered by intro

---
 notebooks/intro_old.ipynb | 450 +++++++++++++-------------------------
 1 file changed, 154 insertions(+), 296 deletions(-)

diff --git a/notebooks/intro_old.ipynb b/notebooks/intro_old.ipynb
index cd72b13a..42ef6d73 100644
--- a/notebooks/intro_old.ipynb
+++ b/notebooks/intro_old.ipynb
@@ -1,5 +1,27 @@
 {
  "cells": [
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "%load_ext autoreload\n",
+    "%autoreload 2"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "import sys; sys.path.extend([\"../src\", \"..\"])\n",
+    "from sensai.util import logging\n",
+    "\n",
+    "logging.configureLogging(level=logging.INFO)"
+   ]
+  },
   {
    "cell_type": "markdown",
    "metadata": {
@@ -9,57 +31,25 @@
     }
    },
    "source": [
-    "# Lightning intro to sensAI\n",
+    "# Custom Models and Feature Generators\n",
     "\n",
     "In this notebook we will demonstrate some of sensAI's main features by training a model together\n",
     "with feature extractors and custom normalization rules. This will also demonstrate how easy it is to wrap one's\n",
     "own model declaration into a sensAI model."
    ]
   },
-  {
-   "cell_type": "markdown",
-   "source": [
-    "### Before running the notebook\n",
-    "\n",
-    "Install the package and its dependencies, if you haven't done so already. E.g. for an editable install call\n",
-    "```\n",
-    "pip install -e .\n",
-    "```\n",
-    "from the root directory. You can also execute this command directly in the notebook but will need to reload the\n",
-    "kernel afterwards"
-   ],
-   "metadata": {
-    "collapsed": false
-   }
-  },
   {
    "cell_type": "code",
    "execution_count": null,
-   "outputs": [],
-   "source": [
-    "# Note - this cell should be executed only once per session\n",
-    "\n",
-    "%load_ext autoreload\n",
-    "%autoreload 2\n",
-    "\n",
-    "import sys, os\n",
-    "\n",
-    "# in order to get the top level modules; they are not part of the package\n",
-    "os.chdir(\"..\")\n",
-    "sys.path.append(os.path.abspath(\".\"))"
-   ],
    "metadata": {
     "collapsed": false,
     "pycharm": {
      "name": "#%%\n"
     }
-   }
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
+   },
    "outputs": [],
    "source": [
+    "import sensai\n",
     "import pandas as pd\n",
     "import numpy as np\n",
     "import sensai as sn\n",
@@ -72,95 +62,78 @@
     "from sensai.tracking.clearml_tracking import ClearMLExperiment\n",
     "import sensai.featuregen as fgen\n",
     "import matplotlib.pyplot as plt\n",
-    "\n",
-    "\n",
-    "import logging\n",
-    "logging.basicConfig(level=logging.INFO)"
-   ],
-   "metadata": {
-    "collapsed": false,
-    "pycharm": {
-     "name": "#%%\n"
-    }
-   }
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "outputs": [],
-   "source": [
     "from config import get_config\n",
     "\n",
-    "c  = get_config(reload=True)"
-   ],
-   "metadata": {
-    "collapsed": false,
-    "pycharm": {
-     "name": "#%%\n"
-    }
-   }
+    "cfg = get_config(reload=True)"
+   ]
   },
   {
    "cell_type": "markdown",
-   "source": [
-    "## Loading the dataset"
-   ],
    "metadata": {
     "collapsed": false,
     "pycharm": {
      "name": "#%% md\n"
     }
-   }
+   },
+   "source": [
+    "First, let us load a dataset."
+   ]
   },
   {
    "cell_type": "code",
    "execution_count": null,
+   "metadata": {
+    "collapsed": false,
+    "pycharm": {
+     "name": "#%%\n"
+    }
+   },
    "outputs": [],
    "source": [
-    "housing_data = c.datafile_path(\"boston_housing.csv\", stage=c.RAW)\n",
+    "housing_data = cfg.datafile_path(\"boston_housing.csv\", stage=cfg.RAW)\n",
     "housing_df = pd.read_csv(housing_data)\n",
     "\n",
     "housing_df.head()"
-   ],
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
    "metadata": {
     "collapsed": false,
     "pycharm": {
      "name": "#%%\n"
     }
-   }
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
+   },
    "outputs": [],
    "source": [
     "X = housing_df.copy()\n",
     "y = pd.DataFrame({\"nox\": X.pop(\"nox\")})"
-   ],
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
    "metadata": {
     "collapsed": false,
     "pycharm": {
      "name": "#%%\n"
     }
-   }
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
+   },
    "outputs": [],
    "source": [
     "print(\"We will use this as target\")\n",
     "y.head()"
-   ],
+   ]
+  },
+  {
+   "cell_type": "markdown",
    "metadata": {
     "collapsed": false,
     "pycharm": {
-     "name": "#%%\n"
+     "name": "#%% md\n"
     }
-   }
-  },
-  {
-   "cell_type": "markdown",
+   },
    "source": [
     "## Creating a Custom Model\n",
     "\n",
@@ -172,17 +145,17 @@
     "tutorial in TBA.\n",
     "\n",
     "We will use VectorModel to wrap scikit-learn's implementation of a multi layer perceptron."
-   ],
-   "metadata": {
-    "collapsed": false,
-    "pycharm": {
-     "name": "#%% md\n"
-    }
-   }
+   ]
   },
   {
    "cell_type": "code",
    "execution_count": null,
+   "metadata": {
+    "collapsed": false,
+    "pycharm": {
+     "name": "#%%\n"
+    }
+   },
    "outputs": [],
    "source": [
     "class CustomModel(VectorRegressionModel):\n",
@@ -196,16 +169,16 @@
     "\n",
     "    def _fit(self, X: pd.DataFrame, Y: pd.DataFrame):\n",
     "        self.model.fit(X, Y.values.ravel())"
-   ],
+   ]
+  },
+  {
+   "cell_type": "markdown",
    "metadata": {
     "collapsed": false,
     "pycharm": {
-     "name": "#%%\n"
+     "name": "#%% md\n"
     }
-   }
-  },
-  {
-   "cell_type": "markdown",
+   },
    "source": [
     "## Feature Generation and Normalization\n",
     "\n",
@@ -227,16 +200,16 @@
     "explaining exactly what they do and what the intended use case looks like.\n",
     "\n",
     "Below we will show an example of feature engineering.\n"
-   ],
+   ]
+  },
+  {
+   "cell_type": "markdown",
    "metadata": {
     "collapsed": false,
     "pycharm": {
      "name": "#%% md\n"
     }
-   }
-  },
-  {
-   "cell_type": "markdown",
+   },
    "source": [
     "### Defining Feature Generators\n",
     "\n",
@@ -245,17 +218,17 @@
     "is extracted from the dataframe when the feature generator is fit.\n",
     "\n",
     "The second feature generator simply takes the columns \"crim\" and \"age\" as is and marks that they should be normalized."
-   ],
-   "metadata": {
-    "collapsed": false,
-    "pycharm": {
-     "name": "#%% md\n"
-    }
-   }
+   ]
   },
   {
    "cell_type": "code",
    "execution_count": null,
+   "metadata": {
+    "collapsed": false,
+    "pycharm": {
+     "name": "#%%\n"
+    }
+   },
    "outputs": [],
    "source": [
     "class TaxFraudFeaturegen(fgen.FeatureGenerator):\n",
@@ -287,18 +260,15 @@
     "    columns=[\"crim\", \"age\"],\n",
     "    normalisationRuleTemplate=DFTNormalisation.RuleTemplate(skip=True),\n",
     ")"
-   ],
-   "metadata": {
-    "collapsed": false,
-    "pycharm": {
-     "name": "#%%\n"
-    }
-   }
+   ]
   },
   {
    "cell_type": "markdown",
+   "metadata": {
+    "collapsed": false
+   },
    "source": [
-    "### The Feature Registry\n",
+    "### The Feature Generator Registry\n",
     "\n",
     "We could simply take the feature generators as they are and plug them into our model but instead we demonstrate\n",
     "one more class in sensAI: the feature registry. Creating a registry is convenient for rapid experimentation\n",
@@ -311,14 +281,17 @@
     "The collector is pinned to a registry and allows to call the registered features by name (if desired).\n",
     "This might not make much sense in a notebook but imagine having a central feature registry somewhere in you code. This\n",
     "way you can combine the registered features with some features that you cooked up in a script, all in a few lines of code."
-   ],
-   "metadata": {
-    "collapsed": false
-   }
+   ]
   },
   {
    "cell_type": "code",
    "execution_count": null,
+   "metadata": {
+    "collapsed": false,
+    "pycharm": {
+     "name": "#%%\n"
+    }
+   },
    "outputs": [],
    "source": [
     "housing_feature_registry = fgen.FeatureGeneratorRegistry(useSingletons=True)\n",
@@ -326,16 +299,16 @@
     "housing_feature_registry.tax = TaxFraudFeaturegen\n",
     "\n",
     "feature_collector = fgen.FeatureCollector(\"tax\", crime_age_featuregen, registry=housing_feature_registry)"
-   ],
+   ]
+  },
+  {
+   "cell_type": "markdown",
    "metadata": {
     "collapsed": false,
     "pycharm": {
-     "name": "#%%\n"
+     "name": "#%% md\n"
     }
-   }
-  },
-  {
-   "cell_type": "markdown",
+   },
    "source": [
     "### Normalization of Input and Target\n",
     "\n",
@@ -347,52 +320,51 @@
     "all normalization rules to the feature generators themselves, just to be sure that nothing is missing.\n",
     "\n",
     "For normalizing the target we have to use an invertible transformer, we will take the MaxAbsScaler here."
-   ],
-   "metadata": {
-    "collapsed": false,
-    "pycharm": {
-     "name": "#%% md\n"
-    }
-   }
+   ]
   },
   {
    "cell_type": "code",
    "execution_count": null,
+   "metadata": {
+    "collapsed": false,
+    "pycharm": {
+     "name": "#%%\n"
+    }
+   },
    "outputs": [],
    "source": [
     "dft_normalisation = sn.data_transformation.DFTNormalisation(\n",
     "    feature_collector.getNormalizationRules(),\n",
-    "    requireAllHandled=True,\n",
-    ")\n",
+    "    requireAllHandled=True)\n",
     "\n",
     "target_transformer = sn.data_transformation.DFTSkLearnTransformer(MaxAbsScaler())\n"
-   ],
+   ]
+  },
+  {
+   "cell_type": "markdown",
    "metadata": {
     "collapsed": false,
     "pycharm": {
-     "name": "#%%\n"
+     "name": "#%% md\n"
     }
-   }
-  },
-  {
-   "cell_type": "markdown",
+   },
    "source": [
-    "### Combining Everything with the Model\n",
+    "## Combining Everything with the Model\n",
     "\n",
     "Now we can plug all these components into our vector model and enjoy a safe and robust that will\n",
     "work during training and inference. The model already has methods for saving and loading and is ready to\n",
     "be deployed."
-   ],
-   "metadata": {
-    "collapsed": false,
-    "pycharm": {
-     "name": "#%% md\n"
-    }
-   }
+   ]
   },
   {
    "cell_type": "code",
    "execution_count": null,
+   "metadata": {
+    "collapsed": false,
+    "pycharm": {
+     "name": "#%%\n"
+    }
+   },
    "outputs": [],
    "source": [
     "custom_model = CustomModel()\n",
@@ -402,193 +374,79 @@
     "    .withInputTransformers(dft_normalisation) \\\n",
     "    .withTargetTransformer(target_transformer) \\\n",
     "    .withName(\"housing_predictor\")"
-   ],
-   "metadata": {
-    "collapsed": false,
-    "pycharm": {
-     "name": "#%%\n"
-    }
-   }
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "outputs": [],
-   "source": [
-    "custom_model.fit(X, y)\n",
-    "custom_model.predict(X).head()"
-   ],
-   "metadata": {
-    "collapsed": false,
-    "pycharm": {
-     "name": "#%%\n"
-    }
-   }
+   ]
   },
   {
    "cell_type": "markdown",
+   "metadata": {},
    "source": [
-    "## SensAI Featuregen vs. Sklearn Pipelines\n",
-    "\n",
-    "TBA"
-   ],
-   "metadata": {
-    "collapsed": false,
-    "pycharm": {
-     "name": "#%% md\n"
-    }
-   }
+    "### Evaluating the Model, Tracking Results Online"
+   ]
   },
   {
    "cell_type": "markdown",
+   "metadata": {},
    "source": [
-    "## Model Evaluation\n",
-    "\n",
-    "sensAI has extensive support for evaluating different types of models with different methods, including\n",
-    "cross validation. The evaluation has native support for experiment tracking frameworks, like clearML or MLflow.\n",
-    "Here we will use clearML, so after running this notebook you will be able to see the result in the\n",
-    "clearML demo-server.\n",
-    "\n",
-    "The evaluation is generally based on the following structure: an `Evaluator` object holds a dataset.\n",
-    "An `Evaluator` can evaluate multiple models by calling `Evaluator.evalModel(model)`,\n",
-    "this ensures that the same kind of evaluation is performed and thus the results can be compared in meaningful way\n",
-    "(the latter is crucial for model selection). This `.evalModel(model)` call returns an EvalData object, h\n",
-    "olding the evaluation data and containing methods for computing metrics and visualization.\n",
-    "\n",
-    "Similarly, a `CrossValidator` holds data and can perform cross validation,\n",
-    "\n",
-    "Below we will show a simple example for that, using the lower-level evaluation interfaces. There is also\n",
-    "a higher level evaluation interfaces in the eval_util module, we will leave that to a separate intro."
-   ],
-   "metadata": {
-    "collapsed": false
-   }
+    "We evaluate the model using an evaluation util as usual, but this time we will additionally track the results online using ClearML."
+   ]
   },
   {
    "cell_type": "code",
    "execution_count": null,
+   "metadata": {},
    "outputs": [],
    "source": [
-    "io_data = InputOutputData(X, y)\n",
-    "\n",
-    "clearml_experiment = ClearMLExperiment(projectName=\"sensai_demo\", taskName=\"custom_model\")\n",
-    "evaluator = createVectorModelEvaluator(io_data, isRegression=custom_model.isRegressionModel(),\n",
-    "                                       testFraction=0.2)\n",
-    "evaluator.setTrackedExperiment(clearml_experiment)"
-   ],
-   "metadata": {
-    "collapsed": false,
-    "pycharm": {
-     "name": "#%%\n"
-    }
-   }
+    "try: \n",
+    "    clearmlExperiment = ClearMLExperiment(projectName=\"sensai_demo\", taskName=\"custom_model\")\n",
+    "except:\n",
+    "    # allow to run without ClearML credentials being present\n",
+    "    clearmlExperiment = None\n",
+    "\n",
+    "evalUtil = sensai.evaluation.RegressionEvaluationUtil(InputOutputData(X, y))\n",
+    "evalData = evalUtil.performSimpleEvaluation(custom_model, showPlots=True, trackedExperiment=clearmlExperiment)"
+   ]
   },
   {
-   "cell_type": "code",
-   "execution_count": null,
-   "outputs": [],
+   "cell_type": "markdown",
+   "metadata": {},
    "source": [
-    "new_custom_model = CustomModel() \\\n",
-    "    .withFeatureCollector(feature_collector) \\\n",
-    "    .withInputTransformers(dft_normalisation) \\\n",
-    "    .withTargetTransformer(target_transformer) \\\n",
-    "    .withName(\"housing_predictor\")\n",
+    "You will find the URL under which the results are stored online in the log.\n",
     "\n",
-    "evaluator.fitModel(new_custom_model)\n",
-    "eval_stats = evaluator.evalModel(new_custom_model).getEvalStats()"
-   ],
-   "metadata": {
-    "collapsed": false,
-    "pycharm": {
-     "name": "#%%\n"
-    }
-   }
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "outputs": [],
-   "source": [
-    "print(eval_stats.getAll())"
-   ],
-   "metadata": {
-    "collapsed": false,
-    "pycharm": {
-     "name": "#%%\n"
-    }
-   }
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "outputs": [],
-   "source": [
-    "eval_stats.plotScatterGroundTruthPredictions()\n",
-    "eval_stats.plotErrorDistribution()\n",
-    "eval_stats.plotHeatmapGroundTruthPredictions()\n",
-    "plt.show()\n",
-    "print(\"Demonstrating plotting capabilities\")"
-   ],
-   "metadata": {
-    "collapsed": false,
-    "pycharm": {
-     "name": "#%%\n"
-    }
-   }
+    "If you missed the evaluation metrics in the log output, here they are:"
+   ]
   },
   {
    "cell_type": "code",
    "execution_count": null,
+   "metadata": {},
    "outputs": [],
    "source": [
-    "eval_stats.plotScatterGroundTruthPredictions()\n",
-    "plt.show()"
-   ],
-   "metadata": {
-    "collapsed": false,
-    "pycharm": {
-     "name": "#%%\n"
-    }
-   }
-  },
-  {
-   "cell_type": "markdown",
-   "source": [
-    "## Things we left out in this intro\n",
-    "\n",
-    " - Already implemented models and feature generators\n",
-    " - Caching (this is actually one of the central features)\n",
-    " - Support for ensembling and parallelization\n",
-    " - The local search and hyperopt modules, including grid-search, simulated-annealing and other stuff\n",
-    " - kNN and clustering implementations\n"
-   ],
-   "metadata": {
-    "collapsed": false,
-    "pycharm": {
-     "name": "#%% md\n"
-    }
-   }
+    "evalData.getEvalStats().metricsDict()"
+   ]
   }
  ],
  "metadata": {
+  "interpreter": {
+   "hash": "9b3442ae4bdb9561e722e28424c33a03c16d40b3aa50369b79d367cad7b1adea"
+  },
   "kernelspec": {
-   "display_name": "Python 3",
+   "display_name": "Python 3.8.13 ('sensai')",
    "language": "python",
    "name": "python3"
   },
   "language_info": {
    "codemirror_mode": {
     "name": "ipython",
-    "version": 2
+    "version": 3
    },
    "file_extension": ".py",
    "mimetype": "text/x-python",
    "name": "python",
    "nbconvert_exporter": "python",
-   "pygments_lexer": "ipython2",
-   "version": "2.7.6"
+   "pygments_lexer": "ipython3",
+   "version": "3.8.13"
   }
  },
  "nbformat": 4,
  "nbformat_minor": 0
-}
\ No newline at end of file
+}

From 3a9c14308fc10f391cd539bc43f65c5d18f9456c Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Thu, 26 May 2022 23:29:12 +0200
Subject: [PATCH 079/131] Changed order of notebooks

---
 docs/index.rst | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/docs/index.rst b/docs/index.rst
index a4dcc249..41d07053 100644
--- a/docs/index.rst
+++ b/docs/index.rst
@@ -6,12 +6,12 @@ sensAI - the Python library for sensible AI
    :glob:
 
    intro.ipynb
-   neural_networks.ipynb
    intro_old.ipynb
-   tracking_experiments.ipynb
+   neural_networks.ipynb
    tensor_models_pytorch_lightning.ipynb
    coordinate_clustering.ipynb
    clustering_evaluation.ipynb
+   tracking_experiments.ipynb
 
 ..
   Above, we can include any notebooks from ../notebooks; Within the build process, they will be copied

From f98e29a3d95eef40f05c92aab6452f04b23fa6a3 Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Fri, 27 May 2022 00:25:16 +0200
Subject: [PATCH 080/131] VectorModelEvaluator: Support tracking of metrics
 upon calls to evalModel

---
 src/sensai/evaluation/evaluator.py   | 42 +++++++++++++++++++---------
 src/sensai/tracking/tracking_base.py |  6 ++--
 2 files changed, 33 insertions(+), 15 deletions(-)

diff --git a/src/sensai/evaluation/evaluator.py b/src/sensai/evaluation/evaluator.py
index a2f81490..927795cf 100644
--- a/src/sensai/evaluation/evaluator.py
+++ b/src/sensai/evaluation/evaluator.py
@@ -11,7 +11,7 @@
 from .eval_stats.eval_stats_regression import RegressionEvalStats, RegressionEvalStatsCollection, RegressionMetric
 from ..data_transformation import DataFrameTransformer
 from ..data import DataSplitter, DataSplitterFractional, InputOutputData
-from ..tracking import TrackingMixin
+from ..tracking import TrackingMixin, TrackedExperiment
 from ..util.string import ToStringMixin
 from ..util.typing import PandasNamedTuple
 from ..vector_model import VectorClassificationModel, VectorModel, VectorModelBase, VectorModelFittableBase
@@ -47,9 +47,7 @@ def computeMetrics(self, model, **kwargs) -> Optional[Dict[str, float]]:
         """
         valuesDict = self._computeMetrics(model, **kwargs)
         if self.trackedExperiment is not None:
-            trackedDict = valuesDict.copy()
-            trackedDict["str(model)"] = str(model)
-            self.trackedExperiment.trackValues(trackedDict)
+            self.trackedExperiment.trackValues(valuesDict, addValuesDict={"str(model)": str(model)})
         return valuesDict
 
 
@@ -175,16 +173,31 @@ def __init__(self, data: Optional[InputOutputData], testData: InputOutputData =
             self.trainingData = data
             self.testData = testData
 
-    def evalModel(self, model: VectorModelBase, onTrainingData=False) -> TEvalData:
+    def setTrackedExperiment(self, trackedExperiment: TrackedExperiment):
+        """
+        Sets a tracked experiment which will result in metrics being saved whenever computeMetrics is called
+        or evalModel is called with track=True.
+
+        :param trackedExperiment: the experiment in which to track evaluation metrics.
+        """
+        super().setTrackedExperiment(trackedExperiment)
+
+    def evalModel(self, model: VectorModelBase, onTrainingData=False, track=True) -> TEvalData:
         """
         Evaluates the given model
 
         :param model: the model to evaluate
         :param onTrainingData: if True, evaluate on this evaluator's training data rather than the held-out test data
+        :param track: whether to track the evaluation metrics for the case where a tracked experiment was set on this object
         :return: the evaluation result
         """
         data = self.trainingData if onTrainingData else self.testData
-        return self._evalModel(model, data)
+        result: VectorModelEvaluationData = self._evalModel(model, data)
+        if track and self.trackedExperiment is not None:
+            for predVarName in result.predictedVarNames:
+                addValuesDict = {"str(model)": str(model), "predVarName": predVarName}
+                self.trackedExperiment.trackValues(result.getEvalStats(predVarName).metricsDict(), addValuesDict=addValuesDict)
+        return result
 
     @abstractmethod
     def _evalModel(self, model: VectorModelBase, data: InputOutputData) -> TEvalData:
@@ -195,7 +208,8 @@ def _computeMetrics(self, model: VectorModel, onTrainingData=False) -> Dict[str,
 
     def _computeMetricsForVarName(self, model, predictedVarName: Optional[str], onTrainingData=False):
         self.fitModel(model)
-        evalData: VectorModelEvaluationData = self.evalModel(model, onTrainingData=onTrainingData)
+        track = False  # avoid duplicate tracking (as this function is only called by computeMetrics, which already tracks)
+        evalData: VectorModelEvaluationData = self.evalModel(model, onTrainingData=onTrainingData, track=track)
         return evalData.getEvalStats(predictedVarName=predictedVarName).metricsDict()
 
     def createMetricsDictProvider(self, predictedVarName: Optional[str]) -> MetricsDictProvider:
@@ -430,16 +444,17 @@ class RuleBasedVectorClassificationModelEvaluator(VectorClassificationModelEvalu
     def __init__(self, data: InputOutputData):
         super().__init__(data, testData=data)
 
-    def evalModel(self, model: VectorModelBase, onTrainingData=False) -> VectorClassificationModelEvaluationData:
+    def evalModel(self, model: VectorModelBase, onTrainingData=False, track=True) -> VectorClassificationModelEvaluationData:
         """
         Evaluate the rule based model. The training data and test data coincide, thus fitting the model
         will fit the model's preprocessors on the full data set and evaluating it will evaluate the model on the
         same data set.
 
-        :param model:
+        :param model: the model to evaluate
         :param onTrainingData: has to be False here. Setting to True is not supported and will lead to an
             exception
-        :return:
+        :param track: whether to track the evaluation metrics for the case where a tracked experiment was set on this object
+        :return: the evaluation result
         """
         if onTrainingData:
             raise Exception("Evaluating rule based models on training data is not supported. In this evaluator"
@@ -451,16 +466,17 @@ class RuleBasedVectorRegressionModelEvaluator(VectorRegressionModelEvaluator):
     def __init__(self, data: InputOutputData):
         super().__init__(data, testData=data)
 
-    def evalModel(self, model: VectorModelBase, onTrainingData=False) -> VectorRegressionModelEvaluationData:
+    def evalModel(self, model: VectorModelBase, onTrainingData=False, track=True) -> VectorRegressionModelEvaluationData:
         """
         Evaluate the rule based model. The training data and test data coincide, thus fitting the model
         will fit the model's preprocessors on the full data set and evaluating it will evaluate the model on the
         same data set.
 
-        :param model:
+        :param model: the model to evaluate
         :param onTrainingData: has to be False here. Setting to True is not supported and will lead to an
             exception
-        :return:
+        :param track: whether to track the evaluation metrics for the case where a tracked experiment was set on this object
+        :return: the evaluation result
         """
         if onTrainingData:
             raise Exception("Evaluating rule based models on training data is not supported. In this evaluator"
diff --git a/src/sensai/tracking/tracking_base.py b/src/sensai/tracking/tracking_base.py
index 314b5a9a..fcea5f5a 100644
--- a/src/sensai/tracking/tracking_base.py
+++ b/src/sensai/tracking/tracking_base.py
@@ -10,8 +10,10 @@ def __init__(self, additionalLoggingValuesDict=None):
         """
         self.additionalLoggingValuesDict = additionalLoggingValuesDict
 
-    def trackValues(self, valuesDict: Dict[str, Any]):
+    def trackValues(self, valuesDict: Dict[str, Any], addValuesDict: Dict[str, Any] = None):
         valuesDict = dict(valuesDict)
+        if addValuesDict is not None:
+            valuesDict.update(addValuesDict)
         if self.additionalLoggingValuesDict is not None:
             valuesDict.update(self.additionalLoggingValuesDict)
         self._trackValues(valuesDict)
@@ -32,5 +34,5 @@ def unsetTrackedExperiment(self):
         setattr(self, self._trackedExperimentAttributeName, None)
 
     @property
-    def trackedExperiment(self):
+    def trackedExperiment(self) -> TrackedExperiment:
         return getattr(self, self._trackedExperimentAttributeName, None)

From 88a6060c3f5a67a25aec28b776eedd9359e37a30 Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Fri, 27 May 2022 01:03:19 +0200
Subject: [PATCH 081/131] TrackingMixin: Store tracked experiments outside of
 instances in static dictionary

---
 src/sensai/tracking/tracking_base.py | 15 +++++++--------
 1 file changed, 7 insertions(+), 8 deletions(-)

diff --git a/src/sensai/tracking/tracking_base.py b/src/sensai/tracking/tracking_base.py
index fcea5f5a..dcb97a7b 100644
--- a/src/sensai/tracking/tracking_base.py
+++ b/src/sensai/tracking/tracking_base.py
@@ -1,5 +1,5 @@
 from abc import ABC, abstractmethod
-from typing import Dict, Any
+from typing import Dict, Any, Optional
 
 
 class TrackedExperiment(ABC):
@@ -24,15 +24,14 @@ def _trackValues(self, valuesDict):
 
 
 class TrackingMixin(ABC):
-    # hackidy hack
-    _trackedExperimentAttributeName = "_trackedExperiment"
+    _objectId2trackedExperiment = {}
 
-    def setTrackedExperiment(self, trackedExperiment: TrackedExperiment):
-        setattr(self, self._trackedExperimentAttributeName, trackedExperiment)
+    def setTrackedExperiment(self, trackedExperiment: Optional[TrackedExperiment]):
+        self._objectId2trackedExperiment[id(self)] = trackedExperiment
 
     def unsetTrackedExperiment(self):
-        setattr(self, self._trackedExperimentAttributeName, None)
+        self.setTrackedExperiment(None)
 
     @property
-    def trackedExperiment(self) -> TrackedExperiment:
-        return getattr(self, self._trackedExperimentAttributeName, None)
+    def trackedExperiment(self) -> Optional[TrackedExperiment]:
+        return self._objectId2trackedExperiment.get(id(self))

From 29dd4e8001abf36acb5a999c27f04e514b98145b Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Fri, 27 May 2022 05:09:57 +0200
Subject: [PATCH 082/131] Removed duplicate class RelativeFrequencyCounter

---
 src/sensai/local_search.py | 19 ++-----------------
 1 file changed, 2 insertions(+), 17 deletions(-)

diff --git a/src/sensai/local_search.py b/src/sensai/local_search.py
index 622a94c4..eaafc052 100644
--- a/src/sensai/local_search.py
+++ b/src/sensai/local_search.py
@@ -10,6 +10,8 @@
 import pandas as pd
 from matplotlib import pyplot as plt
 
+from sensai.util.aggregation import RelativeFrequencyCounter
+
 log = logging.getLogger(__name__)
 
 
@@ -389,23 +391,6 @@ def chooseParams(self) -> Optional[Tuple[Tuple, Optional[SACostValue]]]:
         pass
 
 
-class RelativeFrequencyCounter:
-    def __init__(self):
-        self.numTotal = 0
-        self.numRelevant = 0
-
-    def count(self, isRelevantEvent):
-        self.numTotal += 1
-        if isRelevantEvent:
-            self.numRelevant += 1
-
-    def __str__(self):
-        info = f"{self.numRelevant}/{self.numTotal}"
-        if self.numTotal > 0:
-            info += f", {100 * self.numRelevant / self.numTotal:.2f}%"
-        return f"RelativeFrequencyCounter[{info}]"
-
-
 class SAChain(Generic[TSAState]):
     """Manages the progression of one state during simulated annealing"""
 

From da9dfca3e694adf4a64d419d065914a4ad44c78b Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Fri, 27 May 2022 05:10:12 +0200
Subject: [PATCH 083/131] Removed TODO (done)

---
 src/sensai/evaluation/eval_util.py | 2 --
 1 file changed, 2 deletions(-)

diff --git a/src/sensai/evaluation/eval_util.py b/src/sensai/evaluation/eval_util.py
index 73292156..7a496cfd 100644
--- a/src/sensai/evaluation/eval_util.py
+++ b/src/sensai/evaluation/eval_util.py
@@ -3,8 +3,6 @@
 workflow for evaluation is to use these higher-level functionalities instead of instantiating
 the evaluation classes directly.
 """
-# TODO: provide a notebook (and possibly an rst file) that illustrates standard evaluation scenarios and at the same
-#  time serves as an integration test
 import functools
 import logging
 from abc import ABC, abstractmethod

From d31cef903d27c338821cfe62fa9cd33debc336dd Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Fri, 27 May 2022 05:11:07 +0200
Subject: [PATCH 084/131] Fixed typo in class name:
 XGBGradientBoostedVectorRegressionModel (contained "Bossted")

---
 src/sensai/xgboost.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/sensai/xgboost.py b/src/sensai/xgboost.py
index e6716af6..202199ce 100644
--- a/src/sensai/xgboost.py
+++ b/src/sensai/xgboost.py
@@ -3,7 +3,7 @@
 from .sklearn.sklearn_base import AbstractSkLearnMultipleOneDimVectorRegressionModel, AbstractSkLearnVectorClassificationModel
 
 
-class XGBGradientBosstedVectorRegressionModel(AbstractSkLearnMultipleOneDimVectorRegressionModel):
+class XGBGradientBoostedVectorRegressionModel(AbstractSkLearnMultipleOneDimVectorRegressionModel):
     """
     XGBoost's regression model using gradient boosted trees
     """

From a4f8b1f9be0be59d7db1a933656057f319cd1056 Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Fri, 27 May 2022 21:50:09 +0200
Subject: [PATCH 085/131] ToStringMixin: Prevent infinite recursion caused by
 any ToStringMixin   recursively containing itself via newly introduced
 StringConverter   abstraction

---
 src/sensai/util/string.py | 108 ++++++++++++++++++++++++++++++++------
 1 file changed, 93 insertions(+), 15 deletions(-)

diff --git a/src/sensai/util/string.py b/src/sensai/util/string.py
index ecebaa93..68d5cf1a 100644
--- a/src/sensai/util/string.py
+++ b/src/sensai/util/string.py
@@ -1,21 +1,27 @@
-from typing import Union, List, Dict, Any, Sequence, Iterable, Optional, Mapping
 import re
-
+from abc import ABC, abstractmethod
+from typing import Union, List, Dict, Any, Sequence, Iterable, Optional, Mapping
 
 reCommaWhitespacePotentiallyBreaks = re.compile(r",\s+")
 
 
-def dictString(d: Mapping, brackets: Optional[str] = None):
-    s = ', '.join([f'{k}={toString(v)}' for k, v in d.items()])
+class StringConverter(ABC):
+    @abstractmethod
+    def toString(self, x) -> str:
+        pass
+
+
+def dictString(d: Mapping, brackets: Optional[str] = None, converter: StringConverter = None):
+    s = ', '.join([f'{k}={toString(v, converter=converter)}' for k, v in d.items()])
     if brackets is not None:
         return brackets[:1] + s + brackets[-1:]
     else:
         return s
 
 
-def listString(l: Iterable[Any], brackets="[]", quote: Optional[str] = None):
+def listString(l: Iterable[Any], brackets="[]", quote: Optional[str] = None, converter: StringConverter = None):
     def item(x):
-        x = toString(x)
+        x = toString(x, converter=converter)
         if quote is not None:
             return quote + x + quote
         else:
@@ -24,15 +30,29 @@ def item(x):
     return brackets[:1] + ", ".join((item(x) for x in l)) + brackets[-1:]
 
 
-def toString(x):
+def toString(x, converter: StringConverter = None, applyConverterToNonComplexObjects=True):
+    """
+    Converts the given object to a string, with proper handling of lists, tuples and dictionaries, optionally using a converter.
+    The conversion also removes unwanted line breaks (as present, in particular, in sklearn's string representations).
+
+    :param x: the object to convert
+    :param converter: the converter with which to convert objects to strings
+    :param applyConverterToNonComplexObjects: whether to apply/pass on the converter (if any) not only when converting complex objects but also
+        non-complex, primitive objects; use of this flag enables converters to implement their conversion functionality using this function
+        for complex objects without causing an infinite recursion.
+    :return: the string representation
+    """
     if type(x) == list:
-        return listString(x)
+        return listString(x, converter=converter)
     elif type(x) == tuple:
-        return listString(x, brackets="()")
+        return listString(x, brackets="()", converter=converter)
     elif type(x) == dict:
-        return dictString(x, brackets="{}")
+        return dictString(x, brackets="{}", converter=converter)
     else:
-        s = str(x)
+        if converter and applyConverterToNonComplexObjects:
+            s = converter.toString(x)
+        else:
+            s = str(x)
         s = reCommaWhitespacePotentiallyBreaks.sub(", ", s)  # remove any unwanted line breaks and indentation after commas (as generated, for example, by sklearn objects)
         return s
 
@@ -57,7 +77,7 @@ def orRegexGroup(allowedNames: Sequence[str]):
 
 class ToStringMixin:
     """
-    Provides default implementations for __str__ and __repr__ which contain all attribute names and their values. The
+    Provides implementations for __str__ and __repr__ which contain all attribute names and their values. The
     latter also contains the object id.
     """
     _TOSTRING_INCLUDE_ALL = "__all__"
@@ -67,7 +87,7 @@ def _toStringClassName(self):
 
     def _toStringProperties(self, exclude: Optional[Union[str, Iterable[str]]] = None, include: Optional[Union[str, Iterable[str]]] = None,
             excludeExceptions: Optional[List[str]] = None, includeForced: Optional[List[str]] = None,
-            additionalEntries: Dict[str, Any] = None) -> str:
+            additionalEntries: Dict[str, Any] = None, converter: StringConverter = None) -> str:
         """
         Creates a string of the class attributes, with optional exclusions/inclusions/additions.
         Exclusions take precedence over inclusions.
@@ -75,6 +95,7 @@ def _toStringProperties(self, exclude: Optional[Union[str, Iterable[str]]] = Non
         :param exclude: attributes to be excluded
         :param include: attributes to be included; if None/empty, include all that are not excluded
         :param additionalEntries: additional key-value-pairs which are added to the string just like the other attributes
+        :param converter: the string converter to use; if None, use default
         :return: a string containing attribute names and values
         """
         def mklist(x):
@@ -112,7 +133,9 @@ def isExcluded(k):
         if additionalEntries is not None:
             d.update(additionalEntries)
 
-        return dictString(d)
+        if converter is None:
+            converter = self._StringConverterAvoidToStringMixinRecursion(self)
+        return dictString(d, converter=converter)
 
     def _toStringObjectInfo(self) -> str:
         """
@@ -156,6 +179,7 @@ def _toStringIncludes(self) -> List[str]:
         """
         return [self._TOSTRING_INCLUDE_ALL]
 
+    # noinspection PyMethodMayBeStatic
     def _toStringIncludesForced(self) -> List[str]:
         """
         Defines a list of attribute names that are required to be present in the string representation, regardless of the
@@ -194,6 +218,60 @@ def __repr__(self):
             info += ", " + propertyInfo
         return f"{self._toStringClassName()}[{info}]"
 
+    def pprint(self):
+        print(prettyStringRepr(self))
+
+    class _StringConverterAvoidToStringMixinRecursion(StringConverter):
+        """
+        Avoids recursions when converting objects implementing ToStringMixin which may contain themselves to strings.
+        Use of this object prevents infinite recursions caused by a ToStringMixin instance recursively containing itself in
+        either a property of another ToStringMixin, a list or a tuple.
+        It handles all ToStringMixin instances recursively encountered.
+        A previously handled instance is converted to a string of the form "<class name>[<<]"
+        """
+        def __init__(self, *handledObjects: "ToStringMixin"):
+            """
+            :param handledObjects: objects which are initially assumed to have been handled already
+            """
+            self._handledToStringMixinIds = set([id(o) for o in handledObjects])
+
+        def toString(self, x) -> str:
+            if isinstance(x, ToStringMixin):
+                oid = id(x)
+                if oid in self._handledToStringMixinIds:
+                    return f"{x._toStringClassName()}[<<]"
+                self._handledToStringMixinIds.add(oid)
+                return str(self._ToStringMixinProxy(x, self))
+            else:
+                return toString(x, converter=self, applyConverterToNonComplexObjects=False)
+
+        class _ToStringMixinProxy:
+            """
+            A proxy object which wraps a ToStringMixin to ensure that the converter is applied when creating the properties string.
+            The proxy is to achieve that all ToStringMixin methods that aren't explicitly overwritten are bound to this proxy
+            (rather than the original object), such that the transitive call to _toStringProperties will call the new
+            implementation.
+            """
+            def __init__(self, x: "ToStringMixin", converter):
+                self.x = x
+                self.converter = converter
+
+            def _toStringProperties(self, *args, **kwargs):
+                return self.x._toStringProperties(*args, **kwargs, converter=self.converter)
+
+            def _toStringClassName(self):
+                return self.x._toStringClassName()
+
+            def __getattr__(self, attr: str):
+                if attr.startswith("_toString"):  # ToStringMixin method which we bind to use this proxy
+                    method = getattr(ToStringMixin, attr)
+                    return lambda *args, **kwargs: method(self, *args, **kwargs)
+                else:
+                    return getattr(self.x, attr)
+
+            def __str__(self: "ToStringMixin"):
+                return ToStringMixin.__str__(self)
+
 
 def prettyStringRepr(s: Any, initialIndentationLevel=0, indentationString="    "):
     """
@@ -203,7 +281,7 @@ def prettyStringRepr(s: Any, initialIndentationLevel=0, indentationString="    "
     :param s: an object or object string representation
     :param initialIndentationLevel: the initial indentation level
     :param indentationString: the string which corresponds to a single indentation level
-    :return: a reformatted version of the input string with added indentations and line break
+    :return: a reformatted version of the input string with added indentations and line breaks
     """
     if type(s) != str:
         s = str(s)

From 61d9fd80278ed8aea7c9f218d398f686fab68869 Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Fri, 27 May 2022 22:52:36 +0200
Subject: [PATCH 086/131] Use sphinx_rtd_theme>=0.5.1 to fix bullet item
 rendering issue
 https://stackoverflow.com/questions/67542699/readthedocs-sphinx-not-rendering-bullet-list-from-rst-file

---
 environment.yml | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/environment.yml b/environment.yml
index ebb44c8d..bc0220b9 100644
--- a/environment.yml
+++ b/environment.yml
@@ -29,7 +29,7 @@ dependencies:
   - pytest
   # for docs build
   - sphinx 
-  - sphinx_rtd_theme 
+  - sphinx_rtd_theme>=0.5.1
   - nbsphinx
   # for release process
   - bump2version

From 4e046735730aaadc4eec90440564b3088c56c22c Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Fri, 27 May 2022 22:55:18 +0200
Subject: [PATCH 087/131] Clean output folder before build

---
 build-docs.sh | 1 +
 1 file changed, 1 insertion(+)

diff --git a/build-docs.sh b/build-docs.sh
index 4662b9d0..d9e69328 100644
--- a/build-docs.sh
+++ b/build-docs.sh
@@ -1,3 +1,4 @@
+rm -rf docs/build
 python build_scripts/update_docs.py
 sphinx-build -W -b html docs docs/build
 

From de3110be607664a65ee1d5546d25921513be69be Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Fri, 27 May 2022 22:55:49 +0200
Subject: [PATCH 088/131] Extended documentation

---
 src/sensai/util/string.py | 143 ++++++++++++++++++++++++++++++--------
 1 file changed, 113 insertions(+), 30 deletions(-)

diff --git a/src/sensai/util/string.py b/src/sensai/util/string.py
index 68d5cf1a..d4ae219d 100644
--- a/src/sensai/util/string.py
+++ b/src/sensai/util/string.py
@@ -1,4 +1,5 @@
 import re
+import sys
 from abc import ABC, abstractmethod
 from typing import Union, List, Dict, Any, Sequence, Iterable, Optional, Mapping
 
@@ -6,12 +7,25 @@
 
 
 class StringConverter(ABC):
+    """
+    Abstraction for a string conversion mechanism
+    """
     @abstractmethod
     def toString(self, x) -> str:
         pass
 
 
 def dictString(d: Mapping, brackets: Optional[str] = None, converter: StringConverter = None):
+    """
+    Converts a dictionary to a string of the form "<key>=<value>, <key>=<value>, ...", optionally enclosed
+    by brackets
+
+    :param d: the dictionary
+    :param brackets: a two-character string containing the opening and closing bracket to use, e.g. ``"{}"``;
+        if None, do not use enclosing brackets
+    :param converter: the string converter to use for values
+    :return: the string representation
+    """
     s = ', '.join([f'{k}={toString(v, converter=converter)}' for k, v in d.items()])
     if brackets is not None:
         return brackets[:1] + s + brackets[-1:]
@@ -20,6 +34,17 @@ def dictString(d: Mapping, brackets: Optional[str] = None, converter: StringConv
 
 
 def listString(l: Iterable[Any], brackets="[]", quote: Optional[str] = None, converter: StringConverter = None):
+    """
+    Converts a list or any other iterable to a string of the form "[<value>, <value>, ...]", optionally enclosed
+    by different brackets or with the values quoted.
+
+    :param l: the list or other iterable whose elements are to be converted
+    :param brackets: a two-character string containing the opening and closing bracket to use, e.g. ``"[]"``;
+        if None, do not use enclosing brackets
+    :param quote: a 1-character string defining the quote to use around each value, e.g. ``"'"``.
+    :param converter: the string converter to use for values
+    :return: the string representation
+    """
     def item(x):
         x = toString(x, converter=converter)
         if quote is not None:
@@ -69,7 +94,7 @@ def orRegexGroup(allowedNames: Sequence[str]):
     """
 
     :param allowedNames: strings to include as literals in the regex
-    :return: raw string of the type (<name1>| ...|<nameN>), where special characters in the names have been escaped
+    :return: a regular expression string of the form (<name1>| ...|<nameN>), which matches any of the given names (special characters in the names are escaped)
     """
     allowedNames = [re.escape(name) for name in allowedNames]
     return r"(%s)" % "|".join(allowedNames)
@@ -77,12 +102,49 @@ def orRegexGroup(allowedNames: Sequence[str]):
 
 class ToStringMixin:
     """
-    Provides implementations for __str__ and __repr__ which contain all attribute names and their values. The
-    latter also contains the object id.
+    Provides implementations for ``__str__`` and ``__repr__`` which are based on the format ``"<class name>[<object info>]"`` and
+    ``"<class name>[id=<object id>, <object info>]"`` respectively, where ``<object info>`` is usually a list of entries of the
+    form ``"<name>=<value>, ..."``.
+
+    By default, ``<class name>`` will be the qualified name of the class, and ``<object info>`` will include all properties
+    of the class, including private ones starting with an underscore (though the underscore will be dropped in the string
+    representation).
+
+        * To exclude private properties, override :meth:`_toStringExcludePrivate` to return True. If there are exceptions
+          (and some private properties shall be retained), additionally override :meth:`_toStringExcludeExceptions`.
+        * To exclude a particular set of properties, override :meth:`_toStringExcludes`.
+        * To include only select properties (introducing inclusion semantics), override :meth:`_toStringIncludes`.
+        * To add values to the properties list that aren't actually properties of the object (i.e. derived properties),
+          override :meth:`_toStringAdditionalEntries`.
+        * To define a fully custom representation for <object info> which is not based on the above principles, override
+          :meth:`_toStringObjectInfo`.
+
+    For well-defined string conversions within a class hierarchy, it can be good practice to define additional
+    inclusions/exclusions by overriding the respective method once more and basing the return value on an extended
+    version of the value returned by the superclass.
+    In some cases, the requirements of a subclass can be at odds with the definitions in the superclass: The superclass
+    may make use of exclusion semantics, but the subclass may want to use inclusion semantics (and include
+    only some of the many properties it adds). If the subclass used :meth:`_toStringIncludes`, the exclusion semantics
+    of the superclass would be void and none of its properties would be included.
+    In this case, override :meth:`_toStringIncludesForced` to add inclusions regardless of the semantics otherwise used along
+    the class hierarchy.
+
+    .. document private functions
+    .. automethod:: _toStringClassName
+    .. automethod:: _toStringObjectInfo
+    .. automethod:: _toStringExcludes
+    .. automethod:: _toStringExcludeExceptions
+    .. automethod:: _toStringIncludes
+    .. automethod:: _toStringIncludesForced
+    .. automethod:: _toStringAdditionalEntries
+    .. automethod:: _toStringExcludePrivate
     """
     _TOSTRING_INCLUDE_ALL = "__all__"
 
     def _toStringClassName(self):
+        """
+        :return: the string to use for ``<class name>`` in the string representation ``"<class name>[<object info>]"``
+        """
         return type(self).__qualname__
 
     def _toStringProperties(self, exclude: Optional[Union[str, Iterable[str]]] = None, include: Optional[Union[str, Iterable[str]]] = None,
@@ -93,10 +155,12 @@ def _toStringProperties(self, exclude: Optional[Union[str, Iterable[str]]] = Non
         Exclusions take precedence over inclusions.
 
         :param exclude: attributes to be excluded
-        :param include: attributes to be included; if None/empty, include all that are not excluded
-        :param additionalEntries: additional key-value-pairs which are added to the string just like the other attributes
-        :param converter: the string converter to use; if None, use default
-        :return: a string containing attribute names and values
+        :param include: attributes to be included; if non-empty, only the specified attributes will be printed (bar the ones
+            excluded by ``exclude``)
+        :param includeForced: additional attributes to be included
+        :param additionalEntries: additional key-value entries to be added
+        :param converter: the string converter to use; if None, use default (which avoids infinite recursions)
+        :return: a string containing entry/property names and values
         """
         def mklist(x):
             if x is None:
@@ -139,12 +203,13 @@ def isExcluded(k):
 
     def _toStringObjectInfo(self) -> str:
         """
-        Creates a string containing information on the object instance which is to appear between the square brackets in the string
-        representation, i.e. if the class name is Foo, then it is the asterisk in "Foo[*]".
-        By default will make use of all the exclusions/inclusions that are specified by other member functions.
-        This method can be overwritten by sub-classes to provide a custom string.
+        Override this method to use a fully custom definition of the ``<object info>`` part in the full string
+        representation ``"<class name>[<object info>]"`` to be generated.
+        As soon as this method is overridden, any property-based exclusions, inclusions, etc. will have no effect
+        (unless the implementation is specifically designed to make use of them - as is the default
+        implementation).
 
-        :return: a string containing the desired content
+        :return: the string to use for ``<object info>``
         """
         return self._toStringProperties(exclude=self._toStringExcludes(), include=self._toStringIncludes(),
             excludeExceptions=self._toStringExcludeExceptions(), includeForced=self._toStringIncludesForced(),
@@ -153,9 +218,9 @@ def _toStringObjectInfo(self) -> str:
     def _toStringExcludes(self) -> List[str]:
         """
         Makes the string representation exclude the returned attributes.
-        Returns a list of attribute names to be excluded from __str__ and __repr__. This method can be overwritten by
-        sub-classes which can call super and extend the list returned.
-        This method will only have no effect if _toStringObjectInfo is overridden to not use its result.
+        This method can be conveniently overridden by subclasses which can call super and extend the list returned.
+
+        This method will have no effect if :meth:`_toStringObjectInfo` is overridden to not use its result.
 
         :return: a list of attribute names
         """
@@ -166,14 +231,14 @@ def _toStringIncludes(self) -> List[str]:
         Makes the string representation include only the returned attributes (i.e. introduces inclusion semantics);
         By default, the list contains only a marker element, which is interpreted as "all attributes included".
 
-        This method can be overridden by sub-classes, which can call super in order to extend the list.
-        If a list containing the aforementioned marker element (which stands for all attributes) is extended, the marker element will be ignored,
-        and only the user-added elements will be considered as included.
+        This method can be conveniently overridden by sub-classes which can call super and extend the list returned.
+        Note that it is not a problem for a list containing the aforementioned marker element (which stands for all attributes)
+        to be extended; the marker element will be ignored and only the user-added elements will be considered as included.
 
         Note: To add an included attribute in a sub-class, regardless of any super-classes using exclusion or inclusion semantics,
         use _toStringIncludesForced instead.
 
-        This method will only have no effect if _toStringObjectInfo is overridden to not use its result.
+        This method will have no effect if :meth:`_toStringObjectInfo` is overridden to not use its result.
 
         :return: a list of attribute names to be included in the string representation
         """
@@ -185,24 +250,29 @@ def _toStringIncludesForced(self) -> List[str]:
         Defines a list of attribute names that are required to be present in the string representation, regardless of the
         instance using include semantics or exclude semantics, thus facilitating added inclusions in sub-classes.
 
+        This method will have no effect if :meth:`_toStringObjectInfo` is overridden to not use its result.
+
         :return: a list of attribute names
         """
         return []
 
     def _toStringAdditionalEntries(self) -> Dict[str, Any]:
+        """
+        :return: a dictionary of entries to be included in the ``<object info>`` part of the string representation
+        """
         return {}
 
     def _toStringExcludePrivate(self) -> bool:
         """
-        :return: whether to exclude properties that are private, i.e. start with an underscore; explicitly included attributes
-            will still be considered
+        :return: whether to exclude properties that are private (start with an underscore); explicitly included attributes
+            will still be considered - as will properties exempt from the rule via :meth:`_toStringExcludeExceptions`.
         """
         return False
 
     def _toStringExcludeExceptions(self) -> List[str]:
         """
-        Defines attribute names which should not be excluded even though other rules (e.g. the exclusion of private members
-        via _toStringExcludePrivate) would otherwise exclude them.
+        Defines attribute names which should not be excluded even though other rules (particularly the exclusion of private members
+        via :meth:`_toStringExcludePrivate`) would otherwise exclude them.
 
         :return: a list of attribute names
         """
@@ -218,16 +288,29 @@ def __repr__(self):
             info += ", " + propertyInfo
         return f"{self._toStringClassName()}[{info}]"
 
-    def pprint(self):
-        print(prettyStringRepr(self))
+    def pprint(self, file=sys.stdout):
+        """
+        Prints a prettily formatted string representation of the object (with line breaks and indentations)
+        to ``stdout`` or the given file.
+
+        :param file: the file to print to
+        """
+        print(self.pprints(), file=file)
+
+    def pprints(self) -> str:
+        """
+        :return: a prettily formatted string representation with line breaks and indentations
+        """
+        return prettyStringRepr(self)
 
     class _StringConverterAvoidToStringMixinRecursion(StringConverter):
         """
-        Avoids recursions when converting objects implementing ToStringMixin which may contain themselves to strings.
-        Use of this object prevents infinite recursions caused by a ToStringMixin instance recursively containing itself in
-        either a property of another ToStringMixin, a list or a tuple.
-        It handles all ToStringMixin instances recursively encountered.
-        A previously handled instance is converted to a string of the form "<class name>[<<]"
+        Avoids recursions when converting objects implementing :class:`ToStringMixin` which may contain themselves to strings.
+        Use of this object prevents infinite recursions caused by a :class:`ToStringMixin` instance recursively containing itself in
+        either a property of another :class:`ToStringMixin`, a list or a tuple.
+        It handles all :class:`ToStringMixin` instances recursively encountered.
+
+        A previously handled instance is converted to a string of the form "<class name>[<<]".
         """
         def __init__(self, *handledObjects: "ToStringMixin"):
             """

From 0da3e1806a1bc4a0ec37c027264b5bba7d08d477 Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Fri, 27 May 2022 22:56:20 +0200
Subject: [PATCH 089/131] Ignore docs/build

---
 .gitignore | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/.gitignore b/.gitignore
index 7a7b9f94..5c5766d2 100644
--- a/.gitignore
+++ b/.gitignore
@@ -25,4 +25,5 @@ data
 /lightning_logs
 *.code-workspace
 /TODO.txt
-notebooks/temp.ipynb
\ No newline at end of file
+notebooks/temp.ipynb
+/docs/build
\ No newline at end of file

From b8672c47b1a961736579a7d59a31c6c5367fda92 Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Fri, 27 May 2022 23:27:26 +0200
Subject: [PATCH 090/131] Added util.string.functionName and applied in
 MultiLayerPerceptron.__str__

---
 src/sensai/torch/torch_models/mlp/mlp_modules.py |  6 +++---
 src/sensai/util/string.py                        | 12 +++++++++++-
 2 files changed, 14 insertions(+), 4 deletions(-)

diff --git a/src/sensai/torch/torch_models/mlp/mlp_modules.py b/src/sensai/torch/torch_models/mlp/mlp_modules.py
index 52c5eaf5..7f46d692 100644
--- a/src/sensai/torch/torch_models/mlp/mlp_modules.py
+++ b/src/sensai/torch/torch_models/mlp/mlp_modules.py
@@ -4,7 +4,7 @@
 from torch import nn
 
 from ...torch_base import MCDropoutCapableNNModule
-from ....util.string import objectRepr
+from ....util.string import objectRepr, functionName
 
 
 class MultiLayerPerceptron(MCDropoutCapableNNModule):
@@ -31,8 +31,8 @@ def __init__(self, inputDim: float, outputDim: float, hiddenDims: Sequence[int],
 
     def __str__(self):
         return objectRepr(self, dict(inputDim=self.inputDim, outputDim=self.outputDim, hiddenDims=self.hiddenDims,
-            hidActivationFn=self.hidActivationFn.__name__ if self.hidActivationFn is not None else None,
-            outputActivationFn=self.outputActivationFn.__name__ if self.outputActivationFn is not None else None,
+            hidActivationFn=functionName(self.hidActivationFn) if self.hidActivationFn is not None else None,
+            outputActivationFn=functionName(self.outputActivationFn) if self.outputActivationFn is not None else None,
             pDropout=self.pDropout))
 
     def forward(self, x):
diff --git a/src/sensai/util/string.py b/src/sensai/util/string.py
index d4ae219d..47716fe4 100644
--- a/src/sensai/util/string.py
+++ b/src/sensai/util/string.py
@@ -1,7 +1,8 @@
+import functools
 import re
 import sys
 from abc import ABC, abstractmethod
-from typing import Union, List, Dict, Any, Sequence, Iterable, Optional, Mapping
+from typing import Union, List, Dict, Any, Sequence, Iterable, Optional, Mapping, Callable
 
 reCommaWhitespacePotentiallyBreaks = re.compile(r",\s+")
 
@@ -100,6 +101,15 @@ def orRegexGroup(allowedNames: Sequence[str]):
     return r"(%s)" % "|".join(allowedNames)
 
 
+def functionName(x: Callable) -> str:
+    if isinstance(x, functools.partial):
+        return functionName(x.func)
+    elif hasattr(x, "__name__"):
+        return x.__name__
+    else:
+        return str(x)
+
+
 class ToStringMixin:
     """
     Provides implementations for ``__str__`` and ``__repr__`` which are based on the format ``"<class name>[<object info>]"`` and

From 8ab3013f2d802c8aef78d0696a2f724de7f152eb Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Sat, 28 May 2022 00:10:55 +0200
Subject: [PATCH 091/131] Improved docstrings

---
 src/sensai/vector_model.py | 107 ++++++++++++++++++++++++-------------
 1 file changed, 69 insertions(+), 38 deletions(-)

diff --git a/src/sensai/vector_model.py b/src/sensai/vector_model.py
index 9dd63c97..9be1f4ee 100644
--- a/src/sensai/vector_model.py
+++ b/src/sensai/vector_model.py
@@ -1,7 +1,7 @@
 """
 This module defines base classes for models that use pandas.DataFrames for inputs and outputs, where each data frame row represents
 a single model input or output. Since every row contains a vector of data (one-dimensional array), we refer to them as vector-based
-models. Hence the name of the module and of the central base class VectorModel.
+models. Hence the name of the module and of the central base class :class:`VectorModel`.
 """
 
 import logging
@@ -11,19 +11,17 @@
 import numpy as np
 import pandas as pd
 
+from .data import InputOutputData
 from .data_transformation import DataFrameTransformer, DataFrameTransformerChain, InvertibleDataFrameTransformer
 from .featuregen import FeatureGenerator, FeatureCollector
+from .util import markUsed
 from .util.cache import PickleLoadSaveMixin
 from .util.logging import StopWatch
 from .util.pickle import setstate, getstate
 from .util.sequences import getFirstDuplicate
 from .util.string import ToStringMixin
 
-# imports for backward compatibility (and mark as used)
-from .data import InputOutputData
-
-if InputOutputData:
-    pass
+markUsed(InputOutputData)  # for backward compatibility
 
 log = logging.getLogger(__name__)
 
@@ -103,10 +101,10 @@ class VectorModel(VectorModelFittableBase, PickleLoadSaveMixin, ToStringMixin, A
 
     def __init__(self, checkInputColumns=True):
         """
-        :param checkInputColumns: Whether to check if the input column list (after feature generation)
-            during inference coincides with the input column list during fit.
-            This should be disabled if feature generation is not performed by the model itself,
-            e.g. in ensemble models.
+        :param checkInputColumns: whether to check if the input column list (that is fed to the underlying model, i.e. after feature generation)
+            during inference coincides with the input column list that was observed during training.
+            This should be disabled if feature generation is not performed by the model itself, e.g. in meta-models
+            such as ensemble models.
         """
         super().__init__()
         self._featureGenerator: Optional[FeatureGenerator] = None
@@ -154,9 +152,9 @@ def _toStringAdditionalEntries(self) -> Dict[str, Any]:
 
     def withInputTransformers(self, *inputTransformers: Union[DataFrameTransformer, List[DataFrameTransformer]]) -> __qualname__:
         """
-        Makes the model use the given input transformers. Call with empty input to remove existing input transformers.
+        Makes the model use the given input transformers (removing previously set transformers, if any).
 
-        :param inputTransformers: DataFrameTransformers for the transformation of inputs
+        :param inputTransformers: :class:`DataFrameTransformer` instances to use (in sequence) for the transformation of inputs
         :return: self
         """
         self._inputTransformerChain = DataFrameTransformerChain(*inputTransformers)
@@ -164,9 +162,9 @@ def withInputTransformers(self, *inputTransformers: Union[DataFrameTransformer,
 
     def withFeatureGenerator(self, featureGenerator: Optional[FeatureGenerator]) -> __qualname__:
         """
-        Makes the model use the given feature generator, which shall be used to compute
-        the actual inputs of the model from the data frame that is given.
-        Cannot be used in conjunction with withFeatureCollector
+        Makes the model use the given feature generator in order to obtain the model inputs.
+        If the model shall use more than one feature generator, pass a :class:`MultiFeatureGenerator` which combines them or
+        use the perhaps more convenient :class:`FeatureCollector` in conjunction with :meth:`withFeatureCollector`.
 
         Note: Feature computation takes place before input transformation.
 
@@ -179,8 +177,8 @@ def withFeatureGenerator(self, featureGenerator: Optional[FeatureGenerator]) ->
     def withFeatureCollector(self, featureCollector: FeatureCollector) -> __qualname__:
         """
         Makes the model use the given feature collector's multi-feature generator
-        in order compute the actual inputs of the model from the data frame that is given.
-        Cannot be used in conjunction with withFeatureGenerator.
+        in order to compute the underlying model's input from the data frame that is given.
+        Overrides any feature generator previously passed to :meth:`withFeatureGenerator` (if any).
 
         Note: Feature computation takes place before input transformation.
 
@@ -197,6 +195,9 @@ def _preProcessorsAreFitted(self):
         return result
 
     def isFitted(self):
+        """
+        :return: True if the model has been fitted, False otherwise
+        """
         if not self._isUnderlyingModelFitted():
             return False
         if not self._preProcessorsAreFitted():
@@ -212,17 +213,21 @@ def _checkModelInputColumns(self, modelInput: pd.DataFrame):
             raise Exception(f"Inadmissible input data frame: "
                             f"expected columns {self._modelInputVariableNames}, got {list(modelInput.columns)}")
 
-    def computeModelInputs(self, X):
+    def computeModelInputs(self, X: pd.DataFrame):
         """
-        Returns the dataframe that is passed to the model, i.e. the result of applying preprocessors to X.
+        Applies feature generators and input transformers (if any) to generate from an input data frame the input for the
+        underlying model
+
+        :param X: the input data frame, to which input preprocessing is to be applied
+        :return: the input data frame that serves as input for the underlying model
         """
         return self._computeModelInputs(X)
 
     def _computeModelInputs(self, X: pd.DataFrame, Y: pd.DataFrame = None, fit=False) -> pd.DataFrame:
         """
-        :param X:
-        :param Y: Only has to be provided if fit is True and preprocessors require Y for fitting
-        :param fit: if True, preprocessors will be fitted before being applied to X
+        :param X: the input data frame
+        :param Y: the output data frame (when training); only has to be provided if ``fit=True`` and preprocessors require outputs for fitting
+        :param fit: if True, preprocessors will be fitted before being applied to ``X``
         :return:
         """
         if fit:
@@ -240,10 +245,10 @@ def _computeModelOutputs(self, Y: pd.DataFrame) -> pd.DataFrame:
 
     def predict(self, x: pd.DataFrame) -> pd.DataFrame:
         """
-        Performs a prediction for the given input data frame
+        Applies the model to the given input data frame
 
-        :param x: the input data
-        :return: a DataFrame with the same index as the input
+        :param x: the input data frame
+        :return: the model outputs in the form of a data frame whose index corresponds to the index of ``x``
         """
         if not self.isFitted():
             raise Exception(f"Calling predict with unfitted model {self} "
@@ -291,6 +296,12 @@ def _fitPreprocessors(self, X: pd.DataFrame, Y: pd.DataFrame = None):
         self._inputTransformerChain.fit(X)
 
     def fitInputOutputData(self, ioData: InputOutputData, fitPreprocessors=True):
+        """
+        Fits the model using the given data
+
+        :param ioData: the input/output data
+        :param fitPreprocessors: whether the model's preprocessors (feature generators and data frame transformers) shall also be fitted
+        """
         self.fit(ioData.inputs, ioData.outputs, fitPreprocessors=fitPreprocessors)
 
     def fit(self, X: pd.DataFrame, Y: Optional[pd.DataFrame], fitPreprocessors=True):
@@ -298,11 +309,9 @@ def fit(self, X: pd.DataFrame, Y: Optional[pd.DataFrame], fitPreprocessors=True)
         Fits the model using the given data
 
         :param X: a data frame containing input data
-        :param Y: a data frame containing output data. None may be passed if the underlying model does not require
-            fitting, e.g. with rule-based models
-        :param fitPreprocessors: if False, the model's feature generator and input transformers will not be fitted.
-            If a preprocessor requires fitting, was not separately fit before and this option is set to False,
-            an exception will be raised.
+        :param Y: a data frame containing output data; may be None if the underlying model does not actually require
+            fitting, e.g. in the case of rule-based models, but fitting is still necessary for preprocessors
+        :param fitPreprocessors: whether the model's preprocessors (feature generators and data frame transformers) shall also be fitted
         """
         self._trainingContext = TrainingContext(X, Y)
         try:
@@ -337,6 +346,9 @@ def fit(self, X: pd.DataFrame, Y: Optional[pd.DataFrame], fitPreprocessors=True)
             self._trainingContext = None
 
     def isBeingFitted(self) -> bool:
+        """
+        :return: True if the model is currently in the process of being fitted, False otherwise
+        """
         return self._trainingContext is not None
 
     @abstractmethod
@@ -344,6 +356,9 @@ def _fit(self, X: pd.DataFrame, Y: pd.DataFrame):
         pass
 
     def getPredictedVariableNames(self):
+        """
+        :return: the list of variable names that are ultimately output by this model (i.e. the columns of the data frame output by :meth:`predict`)
+        """
         return self._predictedVariableNames
 
     def getModelInputVariableNames(self) -> Optional[List[str]]:
@@ -354,18 +369,30 @@ def getModelInputVariableNames(self) -> Optional[List[str]]:
         return self._modelInputVariableNames
 
     def getInputTransformer(self, cls: Type[DataFrameTransformer]):
+        """
+        Gets the (first) input transformer of the given type (if any) within this model's input transformer chain
+
+        :param cls: the type of transformer to look for
+        :return: the first matching transformer or None
+        """
         for it in self._inputTransformerChain.dataFrameTransformers:
             if isinstance(it, cls):
                 return it
         return None
 
-    def getInputTransformerChain(self):
+    def getInputTransformerChain(self) -> DataFrameTransformerChain:
+        """
+        :return: the model's input transformer chain (which may be empty and contain no actual transformers)
+        """
         return self._inputTransformerChain
 
     def setFeatureGenerator(self, featureGenerator: Optional[FeatureGenerator]):
         self.withFeatureGenerator(featureGenerator)
 
     def getFeatureGenerator(self) -> Optional[FeatureGenerator]:
+        """
+        :return: the model's feature generator (if any)
+        """
         return self._featureGenerator
 
 
@@ -397,8 +424,7 @@ def withOutputTransformers(self, *outputTransformers: Union[DataFrameTransformer
         The transformers are ignored during the fit phase. Not supported for rule-based models.
 
         **Important**: The output columns names of the last output transformer should be the same
-        as the first one's input column names. If this fails to hold, an exception will be raised when .predict() is called
-        (fit will run through without problems, though).
+        as the first one's input column names. If this fails to hold, an exception will be raised when :meth:`predict` is called.
 
         **Note**: Output transformers perform post-processing after the actual predictions have been made. Contrary
         to invertible target transformers, they are not invoked during the fit phase. Therefore, any losses computed there,
@@ -423,14 +449,19 @@ def withOutputTransformers(self, *outputTransformers: Union[DataFrameTransformer
 
     def withTargetTransformer(self, targetTransformer: Optional[InvertibleDataFrameTransformer]) -> __qualname__:
         """
-        Makes the model use the given target transformers. Not supported for rule-based models.
+        Makes the model use the given target transformer such that the underlying low-level model is trained on the transformed
+        targets, but this high-level model still outputs the original (untransformed) values, i.e. the transformation is applied
+        to targets during training and the inverse transformation is applied to the underlying model's predictions during inference.
+        Hence the requirement of the transformer being invertible.
+
+        This method is not supported for rule-based models, because they are not trained and therefore the transformation
+        would serve no purpose.
 
-        NOTE: all feature generators and data frame transformers will be fit on the untransformed target.
-        The targetTransformer only affects the fit of the internal model.
+        NOTE: All feature generators and data frame transformers - should they make use of outputs - will be fit on the untransformed target.
+        The targetTransformer only affects the fitting of the underlying model.
 
         :param targetTransformer: a transformer which transforms the targets (training data outputs) prior to learning the model, such
-            that the model learns to predict the transformed outputs. When predicting, the inverse transformer is applied after applying
-            the model, i.e. the transformation is completely transparent when applying the model.
+            that the model learns to predict the transformed outputs
         :return: self
         """
         # Disabled for rule-based models which do not apply fitting and therefore cannot make use of transformed targets

From a69c3c91f5da2d0e903345adb03859609e92b006 Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Sat, 28 May 2022 00:32:54 +0200
Subject: [PATCH 092/131] Flattening feature generators: Allow to control what
 happens to additional columns

---
 src/sensai/featuregen.py | 21 +++++++++++++--------
 1 file changed, 13 insertions(+), 8 deletions(-)

diff --git a/src/sensai/featuregen.py b/src/sensai/featuregen.py
index 688f0183..55a006c1 100644
--- a/src/sensai/featuregen.py
+++ b/src/sensai/featuregen.py
@@ -243,18 +243,21 @@ def fitGenerate(self, X: pd.DataFrame, Y: pd.DataFrame = None, ctx=None) -> pd.D
 
     def flattened(self, columnsToFlatten: List[str] = None,
             normalisationRules=(),
-            normalisationRuleTemplate: data_transformation.DFTNormalisation.RuleTemplate = None) -> "ChainedFeatureGenerator":
+            normalisationRuleTemplate: data_transformation.DFTNormalisation.RuleTemplate = None,
+            keepOtherColumns=True) -> "ChainedFeatureGenerator":
         """
         Returns a new feature generator which returns flattened versions of one or more of the vector-valued columns generated
-        by this feature generator
+        by this feature generator.
 
         :param columnsToFlatten: the list of columns to flatten; if None, flatten all columns
         :param normalisationRules: a list of normalisation rules which apply to the flattened columns
         :param normalisationRuleTemplate: a normalisation rule template which applies to all generated flattened columns
+        :param keepOtherColumns: if True, any additional columns that are not to be flattened are to be retained
+            by the returned feature generator; if False, additional columns are to be discarded
         :return: a feature generator which generates the flattened columns
         """
         return flattenedFeatureGenerator(self, columnsToFlatten=columnsToFlatten, normalisationRules=normalisationRules,
-            normalisationRuleTemplate=normalisationRuleTemplate)
+            keepOtherColumns=keepOtherColumns, normalisationRuleTemplate=normalisationRuleTemplate)
 
 
 class RuleBasedFeatureGenerator(FeatureGenerator, ABC):
@@ -907,15 +910,17 @@ def _generate(self, df: pd.DataFrame, ctx=None) -> pd.DataFrame:
         return pd.DataFrame(newCols, index=df.index)
 
 
-def flattenedFeatureGenerator(fgen: FeatureGenerator, columnsToFlatten: List[str] = None,
-                            normalisationRules=(), normalisationRuleTemplate: data_transformation.DFTNormalisation.RuleTemplate = None):
+def flattenedFeatureGenerator(fgen: FeatureGenerator, columnsToFlatten: List[str] = None, keepOtherColumns=False,
+        normalisationRules: Sequence[DFTNormalisation.Rule] = (),
+        normalisationRuleTemplate: data_transformation.DFTNormalisation.RuleTemplate = None):
     """
     Return a flattening version of the input feature generator, leaving additional columns (if any) that are not to be flattened
     but are also generated by the input feature generator untouched.
 
     :param fgen: the feature generator which generates columns that are to be flattened
-    :param columnsToFlatten: list of names of output columns to be flattened.
-        If None, all output columns will be flattened.
+    :param columnsToFlatten: list of names of output columns to be flattened; if None, flatten all columns
+    :param keepOtherColumns: whether any additional columns that are not to be flattened are to be retained
+        by the returned feature generator
     :param normalisationRules: additional normalisation rules for the flattened output columns
     :param normalisationRuleTemplate: This parameter can be supplied instead of normalisationRules for the case where
         there shall be a single rule that applies to all flattened output columns
@@ -935,7 +940,7 @@ def flattenedFeatureGenerator(fgen: FeatureGenerator, columnsToFlatten: List[str
     """
     flatteningGenerator = FeatureGeneratorFlattenColumns(columns=columnsToFlatten, normalisationRules=normalisationRules,
         normalisationRuleTemplate=normalisationRuleTemplate)
-    if columnsToFlatten is None:
+    if columnsToFlatten is None or not keepOtherColumns:
         return ChainedFeatureGenerator(fgen, flatteningGenerator)
     else:
         return ChainedFeatureGenerator(fgen,

From a9aea1edc36919442d6b7d32388dbf1ab9276c9c Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Sat, 28 May 2022 00:42:27 +0200
Subject: [PATCH 093/131] FeatureGenerator: Added convenience methods `concat`
 and `chain` for   the construction of MultiFeatureGenerators and
 ChainedFeatureGenerators

---
 src/sensai/featuregen.py | 31 +++++++++++++++++++++++++++++++
 1 file changed, 31 insertions(+)

diff --git a/src/sensai/featuregen.py b/src/sensai/featuregen.py
index 55a006c1..e5c0586a 100644
--- a/src/sensai/featuregen.py
+++ b/src/sensai/featuregen.py
@@ -259,6 +259,37 @@ def flattened(self, columnsToFlatten: List[str] = None,
         return flattenedFeatureGenerator(self, columnsToFlatten=columnsToFlatten, normalisationRules=normalisationRules,
             keepOtherColumns=keepOtherColumns, normalisationRuleTemplate=normalisationRuleTemplate)
 
+    def concat(self, *others: "FeatureGenerator") -> "MultiFeatureGenerator":
+        """
+        Concatenates this feature generator with one or more other feature generators in order to produce a feature generator that
+        jointly generates all features. If this is already a :class:`MultiFeatureGenerator`, its members are reused; it is not modified.
+
+        :param others: other feature generators
+        :return: a :class:`MultiFeatureGenerator`
+        """
+        if isinstance(self, MultiFeatureGenerator):
+            fgens = list(self.featureGenerators)
+        else:
+            fgens = [self]
+        fgens.extend(others)
+        return MultiFeatureGenerator(fgens)
+
+    def chain(self, *others: "FeatureGenerator") -> "ChainedFeatureGenerator":
+        """
+        Chains this feature generator with one or more other feature generators such that each feature generator
+        receives as input the output of the preceding feature generator. The resulting feature generator
+        produces the features of the last element in the chain. This feature generator itself is not modified.
+
+        :param others: other feature generators
+        :return: a :class:`ChainedFeatureGenerator`
+        """
+        if isinstance(self, ChainedFeatureGenerator):
+            fgens = list(self.featureGenerators)  # copy: extending below must not mutate this chain's own list
+        else:
+            fgens = [self]
+        fgens.extend(others)
+        return ChainedFeatureGenerator(fgens)
+
 
 class RuleBasedFeatureGenerator(FeatureGenerator, ABC):
     """

From 3218d1bc3b5ed0f364bdcb40104e6b8b61a87eab Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Sat, 28 May 2022 00:49:34 +0200
Subject: [PATCH 094/131] Improved docstring

---
 src/sensai/featuregen.py | 9 ++++++---
 1 file changed, 6 insertions(+), 3 deletions(-)

diff --git a/src/sensai/featuregen.py b/src/sensai/featuregen.py
index e5c0586a..ae5e9890 100644
--- a/src/sensai/featuregen.py
+++ b/src/sensai/featuregen.py
@@ -12,6 +12,7 @@
 from .data_transformation import DFTNormalisation
 from .util import flattenArguments
 from .util.string import orRegexGroup, ToStringMixin, listString
+from .util.typing import PandasNamedTuple
 
 if TYPE_CHECKING:
     from .vector_model import VectorModel
@@ -221,9 +222,10 @@ def _generate(self, df: pd.DataFrame, ctx=None) -> pd.DataFrame:
         :param df: the input data frame for which to generate features
         :param ctx: a context object whose functionality may be required for feature generation;
             this is typically the model instance that this feature generator is to generate inputs for
-        :return: a data frame containing the generated features, which uses the same index as X (and Y).
-            The data frame's columns holding categorical columns are not required to have dtype 'category';
-            this will be ensured by the encapsulating call.
+        :return: a data frame containing the generated features, which uses the same index as ``df``.
+            The data frame's columns holding categorical columns are not required to have dtype ``category``;
+            this will be ensured by the encapsulating call as long as the respective columns' names
+            were appropriately provided at construction.
         """
         pass
 
@@ -382,6 +384,7 @@ def __init__(self, cache: util.cache.PersistentKeyValueCache = None, categorical
     def _generate(self, df: pd.DataFrame, ctx=None):
         dicts = []
         for idx, nt in enumerate(df.itertuples()):
+            nt: PandasNamedTuple
             if idx % 100 == 0:
                 log.debug(f"Generating feature via {self.__class__.__name__} for index {idx}")
             value = None

From 1013d17e562c624564508e420f4f3d70255e3963 Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Sat, 28 May 2022 01:37:39 +0200
Subject: [PATCH 095/131] Added countNotNone

---
 src/sensai/util/helper.py | 10 ++++++++++
 1 file changed, 10 insertions(+)

diff --git a/src/sensai/util/helper.py b/src/sensai/util/helper.py
index e818c3e3..03cf0f78 100644
--- a/src/sensai/util/helper.py
+++ b/src/sensai/util/helper.py
@@ -21,6 +21,16 @@ def countNone(*args: Any) -> int:
     return c
 
 
+def countNotNone(*args: Any) -> int:
+    """
+    Counts the number of arguments that are not None (total number of arguments minus the result of :func:`countNone`)
+
+    :param args: various arguments
+    :return: the number of arguments that are not None
+    """
+    return len(args) - countNone(*args)
+
+
 def anyNone(*args: Any) -> bool:
     """
     :param args: various arguments

From 20dbb503fa450a34dbc42099c4056d3397f17b45 Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Sat, 28 May 2022 01:38:30 +0200
Subject: [PATCH 096/131] DFTNormalisation: Improved docstrings, particularly
 in RuleTemplate, adding input checks

---
 src/sensai/data_transformation/dft.py | 28 +++++++++++++++++++++------
 1 file changed, 22 insertions(+), 6 deletions(-)

diff --git a/src/sensai/data_transformation/dft.py b/src/sensai/data_transformation/dft.py
index 8dfa9d66..3909f408 100644
--- a/src/sensai/data_transformation/dft.py
+++ b/src/sensai/data_transformation/dft.py
@@ -10,7 +10,7 @@
 
 from .sklearn_transformer import SkLearnTransformerProtocol
 from ..columngen import ColumnGenerator
-from ..util import flattenArguments
+from ..util import flattenArguments, countNotNone
 from ..util.pandas import DataFrameColumnChangeTracker
 from ..util.pickle import setstate
 from ..util.string import orRegexGroup, ToStringMixin
@@ -445,6 +445,20 @@ class RuleTemplate:
         def __init__(self, skip=False, unsupported=False, transformer: SkLearnTransformerProtocol = None,
                 transformerFactory: Callable[[], SkLearnTransformerProtocol] = None, independentColumns=False):
             """
+            Creates a rule template which applies to one or more features/columns (depending on context).
+            Use parameters as follows:
+
+                * If the relevant features are already normalised, pass ``skip=True``
+                * If the relevant features cannot be normalised (e.g. because they are categorical), pass ``unsupported=True``
+                * If the relevant features shall be normalised, the other parameters apply.
+                  No parameters, i.e. ``RuleTemplate()``, are an option if ...
+
+                    * a default transformer factory is specified in the :class:`DFTNormalisation` instance and its application
+                      is suitable for the relevant set of features.
+                      Otherwise, specify either ``transformerFactory`` or ``transformer``.
+                    * all relevant features are to be normalised in the same way.
+                      Otherwise, specify ``independentColumns=True``.
+
             :param skip: flag indicating whether no transformation shall be performed on all of the columns
             :param unsupported: flag indicating whether normalisation of all columns is unsupported (shall trigger an exception if attempted)
             :param transformer: a transformer instance (from sklearn.preprocessing, e.g. StandardScaler) to apply to the matching column(s)
@@ -454,12 +468,12 @@ def __init__(self, skip=False, unsupported=False, transformer: SkLearnTransforme
                 feature with associated rule/rule template (disabling `fit` where appropriate). Otherwise, use a factory.
             :param transformerFactory: a factory for the generation of the transformer instance, which will only be applied if `transformer`
                 is not given; if neither `transformer` nor `transformerInstance` are given, the containing instance's default factory will
-                be used. See `SkLearnTransformerFactoryFactory` for convenient construction options.
+                be used. See :class:`SkLearnTransformerFactoryFactory` for convenient construction options.
             :param independentColumns: whether a separate transformation is to be learned for each of the columns for the case where the
                 rule matches multiple columns.
             """
-            if skip and transformer is not None:
-                raise ValueError("skip==True while transformer is not None")
+            if (skip or unsupported) and countNotNone(transformer, transformerFactory) > 0:
+                raise ValueError("Passed transformer or transformerFactory while skip=True or unsupported=True")
             self.skip = skip
             self.unsupported = unsupported
             self.transformer = transformer
@@ -497,7 +511,7 @@ def __init__(self, regex: Optional[str], skip=False, unsupported=False, transfor
                 feature with associated rule/rule template (disabling `fit` where appropriate). Otherwise, use a factory.
             :param transformerFactory: a factory for the generation of the transformer instance, which will only be applied if `transformer`
                 is not given; if neither `transformer` nor `transformerInstance` are given, the containing instance's default factory will
-                be used. See `SkLearnTransformerFactoryFactory` for convenient construction options.
+                be used. See :class:`SkLearnTransformerFactoryFactory` for convenient construction options.
             :param arrayValued: whether the column values are not scalars but arrays (of arbitrary lengths).
                 It is assumed that all entries in such arrays are to be normalised in the same way.
                 If arrayValued is True, only a single matching column is supported, i.e. the regex must match at most one column.
@@ -542,7 +556,9 @@ def matchingColumns(self, columns: Sequence[str]):
 
     def __init__(self, rules: Sequence[Rule], defaultTransformerFactory=None, requireAllHandled=True, inplace=False):
         """
-        :param rules: the set of rules; rules are always fitted and applied in the given order
+        :param rules: the set of rules; rules are always fitted and applied in the given order.
+            A convenient way to obtain a set of rules in the :class:`sensai.vector_model.VectorModel` context is from a
+            :class:`sensai.featuregen.FeatureCollector` or :class:`sensai.featuregen.MultiFeatureGenerator`.
         :param defaultTransformerFactory: a factory for the creation of transformer instances (from sklearn.preprocessing, e.g. StandardScaler)
             that shall be used to create a transformer for all rules that don't specify a particular transformer.
             The default transformer will only be applied to columns matched by such rules, unmatched columns will

From e165db9c0a581c0ce5dba0ab603a6249e425d0f9 Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Sat, 28 May 2022 01:57:03 +0200
Subject: [PATCH 097/131] Updated information on the docs build

---
 README-dev.md | 26 ++++++++++----------------
 1 file changed, 10 insertions(+), 16 deletions(-)

diff --git a/README-dev.md b/README-dev.md
index 4921b646..7a1b89c4 100644
--- a/README-dev.md
+++ b/README-dev.md
@@ -33,33 +33,27 @@ Docs are automatically created during the GitHub build via tox.
 
 All .rst files are auto-generated (by `build_scripts/update_docs.py`), with the exception of the root index file  `index.rst`.
 
-### Dependency Handling
+### Declaring Optional Dependencies
 
-**Attention**: Make sure that any optional sensAI dependencies (which are not included in the `docs` tox environment) are added to `docs/conf.py` under `autodoc_mock_imports`.
+**Attention**: Make sure that any optional sensAI dependencies (which are not included in the `docs` tox environment) are added to `docs/conf.py` under `autodoc_mock_imports`. Otherwise the tox build will fail.
 
 ### Notebooks
 
-Notebooks in the `notebooks/` folder are executed and saved with outputs to the `docs/` folder by a test in `notebooks/test_notebooks.py`.
+`docs/index.rst` includes the names of notebooks which reside in the `notebooks/` folder. They are not initially present in the `docs/` folder, but any notebooks whose names are referenced in `index.rst` will be executed and saved with outputs to the `docs/` folder by a test in `notebooks/test_notebooks.py`.
 
-Notebooks are included in the documentation in `docs/index.rst`.
+Therefore, in order for the docs build to work (without temporarily removing the notebook inclusions), it is necessary to run the aforementioned test at least once via
 
-### Manually Running the Docs Build
-
-The docs build is designed to be run by tox. As soon as a single iPython notebook is included in index.rst, `sensai` must be available as an installed dependency in the environment in which the docs build is run, as the notebook executions take place in a Jupyter environment where we can't simply extend sys.path. 
+    sh run_pytest_notebooks.sh
 
-Under Linux, running tox should work fine. Under Windows, we are yet to succeed.
+For changes in notebooks to be reflected in the docs build, the test needs to be rerun.
 
-To run the docs build without tox (under Windows), first create an environment that has the additional requirements installed.
+### Manually Running the Docs Build
 
-    conda env create -n sensai-docs -f environment.yml
-    conda activate sensai-docs
-    pip install sphinx sphinx_rtd_theme nbsphinx
+The docs build can be run without tox via 
 
-Then, to build the docs, we need to perform the following steps with the new environment `sensai-docs` activated. The first command installs the current source version of  `sensai` itself.
+    sh build-docs.sh
 
-    pip install .
-    rm -rf docs-build; mkdir docs-build
-    sphinx-build -b html docs docs-build
+Results will be stored in `docs/build/`.
 
 # Creating a New Release
 

From 884b713c623f757a04c15cc01283bf4440bd41be Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Sat, 28 May 2022 02:25:45 +0200
Subject: [PATCH 098/131] flattenedFeatureGenerator: Fixed default of new
 parameter keepOtherColumns

---
 src/sensai/featuregen.py | 5 ++---
 1 file changed, 2 insertions(+), 3 deletions(-)

diff --git a/src/sensai/featuregen.py b/src/sensai/featuregen.py
index ae5e9890..3eae6385 100644
--- a/src/sensai/featuregen.py
+++ b/src/sensai/featuregen.py
@@ -944,12 +944,11 @@ def _generate(self, df: pd.DataFrame, ctx=None) -> pd.DataFrame:
         return pd.DataFrame(newCols, index=df.index)
 
 
-def flattenedFeatureGenerator(fgen: FeatureGenerator, columnsToFlatten: List[str] = None, keepOtherColumns=False,
+def flattenedFeatureGenerator(fgen: FeatureGenerator, columnsToFlatten: List[str] = None, keepOtherColumns=True,
         normalisationRules: Sequence[DFTNormalisation.Rule] = (),
         normalisationRuleTemplate: data_transformation.DFTNormalisation.RuleTemplate = None):
     """
-    Return a flattening version of the input feature generator, leaving additional columns (if any) that are not to be flattened
-    but are also generated by the input feature generator untouched.
+    Return a flattening version of the input feature generator.
 
     :param fgen: the feature generator which generates columns that are to be flattened
     :param columnsToFlatten: list of names of output columns to be flattened; if None, flatten all columns

From 2dfc687f5739449bf50ee6fb4d31b9a3bf838af7 Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Sat, 28 May 2022 02:43:10 +0200
Subject: [PATCH 099/131] Made notebook runnable without ClearML credentials
 and in VSCode context

---
 notebooks/tracking_experiments.ipynb | 276 ++++++++++++++-------------
 1 file changed, 143 insertions(+), 133 deletions(-)

diff --git a/notebooks/tracking_experiments.ipynb b/notebooks/tracking_experiments.ipynb
index 7ee4b0ff..d5855071 100644
--- a/notebooks/tracking_experiments.ipynb
+++ b/notebooks/tracking_experiments.ipynb
@@ -1,5 +1,30 @@
 {
  "cells": [
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "%load_ext autoreload\n",
+    "%autoreload 2"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "import sys; sys.path.extend([\"../src\", \"..\"])\n",
+    "import sensai\n",
+    "import logging\n",
+    "import config\n",
+    "\n",
+    "c = config.get_config(reload=True)\n",
+    "sensai.util.logging.configureLogging(level=logging.INFO)"
+   ]
+  },
   {
    "cell_type": "markdown",
    "metadata": {
@@ -9,7 +34,7 @@
     }
    },
    "source": [
-    "# Tracking sensAI experiments\n",
+    "# Tracking Experiments\n",
     "\n",
     "In this notebook we will demonstrate how to use sensAI's tracking utilities with evaluators\n",
     "and parameter sweeps. Several backends are supported and it is very easy to write a new custom adapter\n",
@@ -21,57 +46,36 @@
   {
    "cell_type": "code",
    "execution_count": null,
-   "outputs": [],
-   "source": [
-    "# Note - this cell should be executed only once per session\n",
-    "%load_ext autoreload\n",
-    "%autoreload 2\n",
-    "\n",
-    "import sys, os\n",
-    "\n",
-    "# in order to get the config, it is not part of the library\n",
-    "os.chdir(\"..\")\n",
-    "sys.path.append(os.path.abspath(\".\"))"
-   ],
    "metadata": {
     "collapsed": false,
     "pycharm": {
      "name": "#%%\n"
     }
-   }
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
+   },
    "outputs": [],
    "source": [
-    "import geopandas as gp\n",
+    "import os\n",
     "\n",
-    "from sensai.hyperopt import GridSearch\n",
+    "import geopandas as gp\n",
     "from sklearn.cluster import DBSCAN\n",
-    "import logging\n",
     "\n",
+    "from sensai.hyperopt import GridSearch\n",
     "from sensai.geoanalytics.geopandas.coordinate_clustering import SkLearnCoordinateClustering\n",
     "from sensai.evaluation.evaluator_clustering import ClusteringModelSupervisedEvaluator\n",
     "from sensai.geoanalytics.geopandas.coordinate_clustering_ground_truth import PolygonAnnotatedCoordinates\n",
     "from sensai.tracking.clearml_tracking import ClearMLExperiment\n",
     "\n",
-    "import matplotlib.pyplot as plt\n",
-    "\n",
-    "from config import get_config\n",
-    "\n",
-    "logging.basicConfig(level=logging.INFO)\n",
-    "c = get_config(reload=True)"
-   ],
+    "import matplotlib.pyplot as plt"
+   ]
+  },
+  {
+   "cell_type": "markdown",
    "metadata": {
     "collapsed": false,
     "pycharm": {
-     "name": "#%%\n"
+     "name": "#%% md\n"
     }
-   }
-  },
-  {
-   "cell_type": "markdown",
+   },
    "source": [
     "### Evaluators\n",
     "\n",
@@ -80,108 +84,114 @@
     "[intro to evaluation](clustering_evaluation.ipynb) for more details.\n",
     "\n",
     "[comment]: <> (TODO - use some VectorModel with an sklearn dataset instead, move the notebook to sensAI repo)"
-   ],
-   "metadata": {
-    "collapsed": false,
-    "pycharm": {
-     "name": "#%% md\n"
-    }
-   }
+   ]
   },
   {
    "cell_type": "code",
    "execution_count": null,
+   "metadata": {
+    "collapsed": false,
+    "pycharm": {
+     "name": "#%%\n"
+    }
+   },
    "outputs": [],
    "source": [
     "# loading the data and ground truth labels\n",
     "sampleFile = c.datafile_path(\"sample\", stage=c.RAW) # this can point to a directory or a shp/geojson file\n",
     "sampleGeoDF = gp.read_file(sampleFile)\n",
     "groundTruthClusters = PolygonAnnotatedCoordinates(sampleGeoDF, c.datafile_path(\"sample\", stage=c.GROUND_TRUTH))"
-   ],
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
    "metadata": {
     "collapsed": false,
     "pycharm": {
      "name": "#%%\n"
     }
-   }
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
+   },
    "outputs": [],
    "source": [
     "# creating the evaluator\n",
     "groundTruthCoordinates, groundTruthLabels = groundTruthClusters.getCoordinatesLabels()\n",
     "supervisedEvaluator = ClusteringModelSupervisedEvaluator(groundTruthCoordinates, trueLabels=groundTruthLabels)"
-   ],
-   "metadata": {
-    "collapsed": false,
-    "pycharm": {
-     "name": "#%%\n"
-    }
-   }
+   ]
   },
   {
    "cell_type": "markdown",
-   "source": [
-    "### Setup tracking\n",
-    "\n",
-    "Now comes the new part - we create a tracking experiment and set it in the evaluator"
-   ],
    "metadata": {
     "collapsed": false,
     "pycharm": {
      "name": "#%% md\n"
     }
-   }
+   },
+   "source": [
+    "### Setup tracking\n",
+    "\n",
+    "Now comes the new part - we create a tracking experiment and set it in the evaluator"
+   ]
   },
   {
    "cell_type": "code",
    "execution_count": null,
-   "outputs": [],
-   "source": [
-    "experiment = ClearMLExperiment(projectName=\"Demos\", taskName=\"notebook_experiment\")\n",
-    "supervisedEvaluator.setTrackedExperiment(experiment)"
-   ],
    "metadata": {
     "collapsed": false,
     "pycharm": {
      "name": "#%%\n"
     }
-   }
+   },
+   "outputs": [],
+   "source": [
+    "def createExperiment(projectName, taskName):\n",
+    "    try:\n",
+    "        return ClearMLExperiment(projectName=projectName, taskName=taskName)\n",
+    "    except:  # allow to run in contexts without ClearML credentials\n",
+    "        return None\n",
+    "\n",
+    "experiment = createExperiment(projectName=\"Demos\", taskName=\"notebook_experiment\")\n",
+    "supervisedEvaluator.setTrackedExperiment(experiment)"
+   ]
   },
   {
    "cell_type": "markdown",
-   "source": [
-    "As simple as that! Whenever we perform an evaluation, the results will be tracked. Depending on\n",
-    "the backend and the particular implementation of the experiment, the code and other information\n",
-    "like images will get tracked as well. We will demonstrated the tracking of the evaluation of a dbscan."
-   ],
    "metadata": {
     "collapsed": false,
     "pycharm": {
      "name": "#%% md\n"
     }
-   }
+   },
+   "source": [
+    "As simple as that! Whenever we perform an evaluation, the results will be tracked. Depending on\n",
+    "the backend and the particular implementation of the experiment, the code and other information\n",
+    "like images will get tracked as well. We will demonstrate the tracking of the evaluation of a dbscan."
+   ]
   },
   {
    "cell_type": "code",
-   "source": [
-    "boundedDbscan = SkLearnCoordinateClustering(DBSCAN(eps=150, min_samples=20), minClusterSize=100)\n",
-    "supervisedEvaluator.computeMetrics(boundedDbscan)"
-   ],
+   "execution_count": null,
    "metadata": {
     "collapsed": false,
     "pycharm": {
      "name": "#%%\n"
     }
    },
-   "execution_count": null,
-   "outputs": []
+   "outputs": [],
+   "source": [
+    "boundedDbscan = SkLearnCoordinateClustering(DBSCAN(eps=150, min_samples=20), minClusterSize=100)\n",
+    "supervisedEvaluator.computeMetrics(boundedDbscan)"
+   ]
   },
   {
    "cell_type": "code",
    "execution_count": null,
+   "metadata": {
+    "collapsed": false,
+    "pycharm": {
+     "name": "#%%\n"
+    }
+   },
    "outputs": [],
    "source": [
     "# plots are tracked automatically on creation.\n",
@@ -191,67 +201,68 @@
     "ax.set_title(\"Sample Ground Truth clusters\")\n",
     "groundTruthClusters.plot(includeNoise=False, markersize=0.2, cmap=\"plasma\", ax=ax)\n",
     "fig.show()"
-   ],
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
    "metadata": {
     "collapsed": false,
     "pycharm": {
      "name": "#%%\n"
     }
-   }
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
+   },
    "outputs": [],
    "source": [
     "fig, ax = plt.subplots(figsize=[6, 8])\n",
     "ax.set_title(\"Predicted clusters\")\n",
     "boundedDbscan.plot(includeNoise=False, markersize=0.2, cmap=\"plasma\", ax=ax, figsize=10)\n",
     "fig.show()\n"
-   ],
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
    "metadata": {
     "collapsed": false,
     "pycharm": {
      "name": "#%%\n"
     }
-   }
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
+   },
    "outputs": [],
    "source": [
     "# We can also add the summaries df to the experiment through explicit tracking\n",
     "\n",
-    "logger  = supervisedEvaluator.trackedExperiment.logger\n",
+    "if supervisedEvaluator.trackedExperiment:\n",
+    "    logger  = supervisedEvaluator.trackedExperiment.logger\n",
     "\n",
-    "logger.report_table(title=\"Clusters Summaries\", series=\"pandas DataFrame\", iteration=0,\n",
-    "                    table_plot=boundedDbscan.summaryDF().sort_values(\"numMembers\"))"
-   ],
-   "metadata": {
-    "collapsed": false,
-    "pycharm": {
-     "name": "#%%\n"
-    }
-   }
+    "    logger.report_table(title=\"Clusters Summaries\", series=\"pandas DataFrame\", iteration=0,\n",
+    "                        table_plot=boundedDbscan.summaryDF().sort_values(\"numMembers\"))"
+   ]
   },
   {
    "cell_type": "markdown",
-   "source": [
-    "The same mechanism works in the hyperopts module. The experiment can be set for GridSearch\n",
-    "or simulated annealing. One can also set the experiment in the evaluator that is passed to\n",
-    "the hyperopt objects and use that one for tracking instead. Here an example\n"
-   ],
    "metadata": {
     "collapsed": false,
     "pycharm": {
      "name": "#%% md\n"
     }
-   }
+   },
+   "source": [
+    "The same mechanism works in the hyperopts module. The experiment can be set for GridSearch\n",
+    "or simulated annealing. One can also set the experiment in the evaluator that is passed to\n",
+    "the hyperopt objects and use that one for tracking instead. Here is an example:\n"
+   ]
   },
   {
    "cell_type": "code",
    "execution_count": null,
+   "metadata": {
+    "collapsed": false,
+    "pycharm": {
+     "name": "#%%\n"
+    }
+   },
    "outputs": [],
    "source": [
     "# because of how trains works and because we are using it in jupyter, we need to manually close the existing task\n",
@@ -259,8 +270,9 @@
     "# this step is unnecessary if one has one experiment per script execution\n",
     "# we also unset the tracked experiment in the evaluator and prepare a new one for the grid search\n",
     "\n",
-    "supervisedEvaluator.trackedExperiment.task.close()\n",
-    "supervisedEvaluator.unsetTrackedExperiment()\n",
+    "if supervisedEvaluator.trackedExperiment:\n",
+    "    supervisedEvaluator.trackedExperiment.task.close()\n",
+    "    supervisedEvaluator.unsetTrackedExperiment()\n",
     "\n",
     "\n",
     "def dbscanFactory(**kwargs):\n",
@@ -271,70 +283,68 @@
     "    \"eps\": [50, 150]\n",
     "}\n",
     "\n",
+    "gridExperiment = createExperiment(projectName=\"Demos\", taskName=\"notebook_grid_search\")\n",
     "dbscanGridSearch = GridSearch(dbscanFactory, parameterOptions,\n",
     "                              csvResultsPath=os.path.join(c.temp, \"dbscanGridSearchCsv\"))\n",
-    "gridExperiment = ClearMLExperiment(projectName=\"Demos\", taskName=\"notebook_grid_search\")\n",
     "dbscanGridSearch.setTrackedExperiment(gridExperiment)"
-   ],
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
    "metadata": {
     "collapsed": false,
     "pycharm": {
      "name": "#%%\n"
     }
-   }
+   },
+   "outputs": [],
+   "source": [
+    "searchResults = dbscanGridSearch.run(supervisedEvaluator, sortColumnName=\"numClusters\")"
+   ]
   },
   {
    "cell_type": "code",
    "execution_count": null,
-   "outputs": [],
-   "source": [
-    "searchResults = dbscanGridSearch.run(supervisedEvaluator, sortColumnName=\"numClusters\")"
-   ],
    "metadata": {
     "collapsed": false,
     "pycharm": {
      "name": "#%%\n"
     }
-   }
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
+   },
    "outputs": [],
    "source": [
     "# unfortunately, the trains experiment interface is at conflict with the grid search\n",
     "# the most pragmatic solution is to simply attach the dataframe to the experiment and to use it for further evaluation\n",
     "\n",
-    "dbscanGridSearch.trackedExperiment.logger.report_table(title=\"Results\", series=\"pandas DataFrame\", iteration=0,\n",
-    "                    table_plot=searchResults)\n"
-   ],
-   "metadata": {
-    "collapsed": false,
-    "pycharm": {
-     "name": "#%%\n"
-    }
-   }
+    "if dbscanGridSearch.trackedExperiment:\n",
+    "    dbscanGridSearch.trackedExperiment.logger.report_table(title=\"Results\", series=\"pandas DataFrame\", iteration=0,\n",
+    "        table_plot=searchResults)\n"
+   ]
   }
  ],
  "metadata": {
+  "interpreter": {
+   "hash": "9b3442ae4bdb9561e722e28424c33a03c16d40b3aa50369b79d367cad7b1adea"
+  },
   "kernelspec": {
-   "display_name": "Python 3",
+   "display_name": "Python 3.8.13 ('sensai')",
    "language": "python",
    "name": "python3"
   },
   "language_info": {
    "codemirror_mode": {
     "name": "ipython",
-    "version": 2
+    "version": 3
    },
    "file_extension": ".py",
    "mimetype": "text/x-python",
    "name": "python",
    "nbconvert_exporter": "python",
-   "pygments_lexer": "ipython2",
-   "version": "2.7.6"
+   "pygments_lexer": "ipython3",
+   "version": "3.8.13"
   }
  },
  "nbformat": 4,
  "nbformat_minor": 0
-}
\ No newline at end of file
+}

From 604c42fd7a79143423dd2223115ba7cf59e4d2ba Mon Sep 17 00:00:00 2001
From: Dominik Jain <dominik.jain@jambit.com>
Date: Sat, 28 May 2022 16:02:55 +0200
Subject: [PATCH 100/131] Sync pjm

  commit e240e5f7e8f8305c967ece100d44966a5941202f
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Sat May 28 13:50:22 2022 +0200

      MultiDataEvaluationUtil: Fixed missing None check for visitors

  sensai/evaluation/eval_util.py

  commit b010379b3f7a7e72998e10af4374d39711301fc5
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Sat May 28 13:19:38 2022 +0200

      GreedyAgglomerativeGeoCoordClusterer: Fixed superclass not being specified

  sensai/geoanalytics/geo_clustering.py

  commit 75f713a7bca40c433c889c46673709bbd6ee5d3f
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Sat May 28 13:18:40 2022 +0200

      Added HistogramPlot

  sensai/util/plot.py

  commit b21eebc411e719529100c50c978bef7103bfc0dd
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Wed May 25 20:47:34 2022 +0200

      Moved feature importance plotting functionality from visitor to module feature_importance

  sensai/evaluation/eval_util.py
  sensai/feature_importance.py

  commit 36c688d45d27df120c599a854b2ca108e79af68b
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Wed May 25 20:37:15 2022 +0200

      AggregatedFeatureImportances: Support aggregation of features via regex

  sensai/evaluation/eval_util.py
  sensai/feature_importance.py
---
 src/sensai/evaluation/eval_util.py        | 25 +++++------
 src/sensai/feature_importance.py          | 55 +++++++++++++++++++----
 src/sensai/geoanalytics/geo_clustering.py |  2 +-
 src/sensai/util/plot.py                   | 13 +++++-
 4 files changed, 70 insertions(+), 25 deletions(-)

diff --git a/src/sensai/evaluation/eval_util.py b/src/sensai/evaluation/eval_util.py
index 95d93050..77b91903 100644
--- a/src/sensai/evaluation/eval_util.py
+++ b/src/sensai/evaluation/eval_util.py
@@ -32,7 +32,7 @@
     VectorRegressionModelEvaluationData, VectorClassificationModelEvaluator, VectorClassificationModelEvaluationData, \
     VectorRegressionModelEvaluatorParams, VectorClassificationModelEvaluatorParams, VectorModelEvaluatorParams
 from ..data import InputOutputData
-from ..feature_importance import AggregatedFeatureImportances, FeatureImportanceProvider
+from ..feature_importance import AggregatedFeatureImportances, FeatureImportanceProvider, plotFeatureImportance
 from ..util.io import ResultWriter
 from ..util.plot import MATPLOTLIB_DEFAULT_FIGURE_SIZE
 from ..util.string import prettyStringRepr
@@ -592,8 +592,9 @@ def compareModels(self, modelFactories: Sequence[Callable[[], Union[VectorRegres
 
         # create plots from visitors (if any)
         resultCollector = EvaluationResultCollector(showPlots=False, resultWriter=resultWriter)
-        for visitor in visitors:
-            visitor.collectPlots(resultCollector)
+        if visitors is not None:
+            for visitor in visitors:
+                visitor.collectPlots(resultCollector)
 
         if isRegression:
             return RegressionMultiDataModelComparisonData(allResultsDF, meanResultsDF, furtherAggsDF, evalStatsByModelName)
@@ -641,12 +642,16 @@ class ModelComparisonVisitorAggregatedFeatureImportances(ModelComparisonVisitor)
     """
     During a model comparison, computes aggregated feature importance values for the model with the given name
     """
-    def __init__(self, modelName: str):
+    def __init__(self, modelName: str, featureAggRegEx: Sequence[str] = ()):
         """
         :param modelName: the name of the model for which to compute the aggregated feature importance values
+        :param featureAggRegEx: a sequence of regular expressions describing which feature names to sum as one. Each regex must
+            contain exactly one group. If a regex matches a feature name, the feature importance will be summed under the key
+            of the matched group instead of the full feature name. For example, the regex r"(\\w+)_\\d+$" will cause "foo_1" and "foo_2"
+            to be summed under "foo" and similarly "bar_1" and "bar_2" to be summed under "bar".
         """
         self.modelName = modelName
-        self.aggFeatureImportance = AggregatedFeatureImportances()
+        self.aggFeatureImportance = AggregatedFeatureImportances(featureAggRegEx=featureAggRegEx)
 
     def visit(self, modelName: str, result: ModelComparisonData.Result):
         if modelName == self.modelName:
@@ -666,15 +671,7 @@ def _collect(self, model: Union[FeatureImportanceProvider, VectorModelBase]):
         self.aggFeatureImportance.add(model.getFeatureImportances())
 
     def plotFeatureImportance(self) -> plt.Figure:
-        featureImportanceDict = self.aggFeatureImportance.aggDict
-        numFeatures = len(featureImportanceDict)
-        defaultWidth, defaultHeight = MATPLOTLIB_DEFAULT_FIGURE_SIZE
-        height = max(defaultHeight, defaultHeight * numFeatures / 20)
-        fig, ax = plt.subplots(figsize=(defaultWidth, height))
-        sns.barplot(list(featureImportanceDict.values()), list(featureImportanceDict.keys()), ax=ax)
-        plt.title(f"Feature Importance\n{self.modelName}")
-        plt.tight_layout()
-        return fig
+        return plotFeatureImportance(self.aggFeatureImportance.getFeatureImportanceSum(), subtitle=self.modelName)
 
     def collectPlots(self, resultCollector: EvaluationResultCollector):
         resultCollector.addFigure(f"{self.modelName}_feature-importance", self.plotFeatureImportance())
diff --git a/src/sensai/feature_importance.py b/src/sensai/feature_importance.py
index f752c139..7da122e1 100644
--- a/src/sensai/feature_importance.py
+++ b/src/sensai/feature_importance.py
@@ -1,6 +1,12 @@
 import collections
+import re
 from abc import ABC, abstractmethod
-from typing import Dict, Union
+from typing import Dict, Union, Sequence
+
+import seaborn as sns
+from matplotlib import pyplot as plt
+
+from .util.plot import MATPLOTLIB_DEFAULT_FIGURE_SIZE
 
 
 class FeatureImportanceProvider(ABC):
@@ -18,15 +24,39 @@ def getFeatureImportances(self) -> Union[Dict[str, float], Dict[str, Dict[str, f
         pass
 
 
+def plotFeatureImportance(featureImportanceDict: Dict[str, float], subtitle: str = None) -> plt.Figure:
+    numFeatures = len(featureImportanceDict)
+    defaultWidth, defaultHeight = MATPLOTLIB_DEFAULT_FIGURE_SIZE
+    height = max(defaultHeight, defaultHeight * numFeatures / 20)
+    fig, ax = plt.subplots(figsize=(defaultWidth, height))
+    sns.barplot(x=list(featureImportanceDict.values()), y=list(featureImportanceDict.keys()), ax=ax)
+    title = "Feature Importance"
+    if subtitle is not None:
+        title += "\n" + subtitle
+    plt.title(title)
+    plt.tight_layout()
+    return fig
+
+
 class AggregatedFeatureImportances:
     """
-    Aggregates feature importance values from models that suppurt method getFeatureImportances
-    (e.g. sklearn's RandomForest models and compatible models from lightgbm, etc.)
+    Aggregates feature importance values (e.g. from models implementing FeatureImportanceProvider, such as sklearn's RandomForest
+    models and compatible models from lightgbm, etc.)
     """
-    def __init__(self, *featureImportances: Union[FeatureImportanceProvider, Dict[str, float], Dict[str, Dict[str, float]]]):
+    def __init__(self, *featureImportances: Union[FeatureImportanceProvider, Dict[str, float], Dict[str, Dict[str, float]]],
+            featureAggRegEx: Sequence[str] = ()):
+        r"""
+        :param featureImportances: (optional) initial list of feature importance providers or dictionaries to aggregate; further
+            values can be added via method add
+        :param featureAggRegEx: a sequence of regular expressions describing which feature names to sum as one. Each regex must
+            contain exactly one group. If a regex matches a feature name, the feature importance will be summed under the key
+            of the matched group instead of the full feature name. For example, the regex r"(\w+)_\d+$" will cause "foo_1" and "foo_2"
+            to be summed under "foo" and similarly "bar_1" and "bar_2" to be summed under "bar".
+        """
         self.aggDict = None
         self._isNested = None
         self._numDictsAdded = 0
+        self._featureAggRegEx = [re.compile(p) for p in featureAggRegEx]
         for d in featureImportances:
             self.add(d)
 
@@ -47,16 +77,23 @@ def add(self, featureImportance: Union[FeatureImportanceProvider, Dict[str, floa
         if self._isNested:
             if self.aggDict is None:
                 self.aggDict = collections.defaultdict(lambda: collections.defaultdict(lambda: 0))
-                for targetName, d in featureImportance.items():
-                    d: dict
-                    for featureName, value in d.items():
-                        self.aggDict[targetName][featureName] += value
+            for targetName, d in featureImportance.items():
+                d: dict
+                for featureName, value in d.items():
+                    self.aggDict[targetName][self._aggFeatureName(featureName)] += value
         else:
             if self.aggDict is None:
                 self.aggDict = collections.defaultdict(lambda: 0)
             for featureName, value in featureImportance.items():
-                self.aggDict[featureName] += value
+                self.aggDict[self._aggFeatureName(featureName)] += value
         self._numDictsAdded += 1
 
+    def _aggFeatureName(self, featureName: str):
+        for regex in self._featureAggRegEx:
+            m = regex.match(featureName)
+            if m is not None:
+                return m.group(1)
+        return featureName
+
     def getFeatureImportanceSum(self) -> Union[Dict[str, float], Dict[str, Dict[str, float]]]:
         return self.aggDict
diff --git a/src/sensai/geoanalytics/geo_clustering.py b/src/sensai/geoanalytics/geo_clustering.py
index 2f351cef..1094a315 100644
--- a/src/sensai/geoanalytics/geo_clustering.py
+++ b/src/sensai/geoanalytics/geo_clustering.py
@@ -30,7 +30,7 @@ def clustersIndices(self) -> Tuple[List[List[int]], List[int]]:
         pass
 
 
-class GreedyAgglomerativeGeoCoordClusterer:
+class GreedyAgglomerativeGeoCoordClusterer(GeoCoordClusterer):
     def __init__(self, maxMinDistanceForMergeM: float, maxDistanceM: float, minClusterSize: int, lcs: LocalCoordinateSystem = None):
         """
         :param maxMinDistanceForMergeM: the maximum distance, in metres, for the minimum distance between two existing clusters for a merge
diff --git a/src/sensai/util/plot.py b/src/sensai/util/plot.py
index 225de905..6adcde78 100644
--- a/src/sensai/util/plot.py
+++ b/src/sensai/util/plot.py
@@ -5,11 +5,11 @@
 import matplotlib.figure
 from matplotlib import pyplot as plt
 import numpy as np
+import seaborn as sns
 
 
 log = logging.getLogger(__name__)
 
-
 MATPLOTLIB_DEFAULT_FIGURE_SIZE = (6.4, 4.8)
 
 
@@ -143,4 +143,15 @@ def draw():
                 plt.ylabel(yLabel)
             return plt.imshow(heatmap.T, extent=extent, origin='lower', interpolation="none", cmap=cmap, zorder=1, aspect="auto", **kwargs)
 
+        super().__init__(draw)
+
+
+class HistogramPlot(Plot):
+    def __init__(self, values, bins="auto", kde=False, binwidth=None, stat="percent", xlabel=None, **kwargs):
+        def draw():
+            ax = sns.histplot(values, bins=bins, kde=kde, binwidth=binwidth, stat=stat, **kwargs)
+            if xlabel is not None:
+                plt.xlabel(xlabel)
+            return ax
+
         super().__init__(draw)
\ No newline at end of file

From 4fcc088c0e3aac6e120b3d3b7bd98abff8543f48 Mon Sep 17 00:00:00 2001
From: Mischa Panchenko <michael.panchenko@unternehmertum.de>
Date: Sun, 29 May 2022 15:27:36 +0200
Subject: [PATCH 101/131] Added possibility to construct DFT from
 FeatureGenerator

---
 src/sensai/data_transformation/dft.py | 24 +++++++++++++++++++++++-
 src/sensai/featuregen.py              |  5 ++++-
 src/sensai/util/pandas.py             |  1 +
 src/sensai/util/string.py             |  1 +
 4 files changed, 29 insertions(+), 2 deletions(-)

diff --git a/src/sensai/data_transformation/dft.py b/src/sensai/data_transformation/dft.py
index 3909f408..72e2c4e7 100644
--- a/src/sensai/data_transformation/dft.py
+++ b/src/sensai/data_transformation/dft.py
@@ -15,6 +15,11 @@
 from ..util.pickle import setstate
 from ..util.string import orRegexGroup, ToStringMixin
 
+from typing import TYPE_CHECKING
+
+if TYPE_CHECKING:
+    from ..featuregen import FeatureGenerator
+
 log = logging.getLogger(__name__)
 
 
@@ -48,9 +53,13 @@ def getName(self) -> str:
         """
         return self._name
 
-    def setName(self, name):
+    def setName(self, name: str):
         self._name = name
 
+    def withName(self, name: str):
+        self.setName(name)
+        return self
+
     @abstractmethod
     def _fit(self, df: pd.DataFrame):
         pass
@@ -87,6 +96,19 @@ def fitApply(self, df: pd.DataFrame) -> pd.DataFrame:
         return self.apply(df)
 
 
+class DFTFromFeatureGenerator(DataFrameTransformer):  # adapter: exposes a FeatureGenerator through the DataFrameTransformer interface
+    def _fit(self, df: pd.DataFrame):  # fits the wrapped feature generator on df only (no context is passed)
+        self.fgen.fit(df, ctx=None)
+
+    def _apply(self, df: pd.DataFrame) -> pd.DataFrame:  # returns whatever the wrapped feature generator generates for df
+        return self.fgen.generate(df)
+
+    def __init__(self, fgen: "FeatureGenerator"):  # annotation is quoted: FeatureGenerator is imported under TYPE_CHECKING only
+        super().__init__()
+        self.fgen = fgen
+        self.setName(f"{self.__class__.__name__}[{self.fgen.getName()}]")
+
+
 class InvertibleDataFrameTransformer(DataFrameTransformer, ABC):
     @abstractmethod
     def applyInverse(self, df: pd.DataFrame) -> pd.DataFrame:
diff --git a/src/sensai/featuregen.py b/src/sensai/featuregen.py
index 3eae6385..c2e7b354 100644
--- a/src/sensai/featuregen.py
+++ b/src/sensai/featuregen.py
@@ -9,7 +9,7 @@
 
 from . import util, data_transformation
 from .columngen import ColumnGenerator
-from .data_transformation import DFTNormalisation
+from .data_transformation import DFTNormalisation, DFTFromFeatureGenerator
 from .util import flattenArguments
 from .util.string import orRegexGroup, ToStringMixin, listString
 from .util.typing import PandasNamedTuple
@@ -138,6 +138,9 @@ def getGeneratedColumnNames(self) -> Optional[List[str]]:
         """
         return self._generatedColumnNames
 
+    def toDFT(self):
+        return DFTFromFeatureGenerator(self)
+
     @abstractmethod
     def _fit(self, X: pd.DataFrame, Y: pd.DataFrame = None, ctx=None):
         """
diff --git a/src/sensai/util/pandas.py b/src/sensai/util/pandas.py
index d05a7dae..06b42751 100644
--- a/src/sensai/util/pandas.py
+++ b/src/sensai/util/pandas.py
@@ -116,6 +116,7 @@ def extractArray(df: pd.DataFrame, dtype=None):
             arr = np.stack(arr[:, 0])
         # For the case where there is only one row, the old implementation above removed the first dimension,
         # so we do the same, even though it seems odd to do so (potential problem for batch size 1)
+        # TODO: remove this behavior
         if arr.shape[0] == 1:
             arr = arr[0]
     except ValueError:
diff --git a/src/sensai/util/string.py b/src/sensai/util/string.py
index 47716fe4..684f0627 100644
--- a/src/sensai/util/string.py
+++ b/src/sensai/util/string.py
@@ -110,6 +110,7 @@ def functionName(x: Callable) -> str:
         return str(x)
 
 
+# TODO: allow returning a JSON string for easier parsing/printing
 class ToStringMixin:
     """
     Provides implementations for ``__str__`` and ``__repr__`` which are based on the format ``"<class name>[<object info>]"`` and

From ab7a7875bbdc5b50989e1b3e8b9ed3fc86b385a9 Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Sun, 29 May 2022 15:22:23 +0200
Subject: [PATCH 102/131] Added FeatureGeneratorFromDataFrameTransformer; added
 comment on FeatureGenerator.__init__

---
 src/sensai/featuregen.py | 22 ++++++++++++++++++++++
 1 file changed, 22 insertions(+)

diff --git a/src/sensai/featuregen.py b/src/sensai/featuregen.py
index c2e7b354..ace07141 100644
--- a/src/sensai/featuregen.py
+++ b/src/sensai/featuregen.py
@@ -16,6 +16,7 @@
 
 if TYPE_CHECKING:
     from .vector_model import VectorModel
+    from .data_transformation import DataFrameTransformer
 
 log = logging.getLogger(__name__)
 
@@ -47,6 +48,11 @@ def __init__(self, categoricalFeatureNames: Optional[Union[Sequence[str], str]]
             If True, normalisation rules for categorical features (which are unsupported by normalisation) and their corresponding one-hot
             encoded features (with "_<index>" appended) will be added.
         """
+        # NOTE: While it would be more elegant to not have all of the above constructor arguments and instead provide
+        # them later using "with*" methods, this would have the significant drawback that it would enable
+        # all such attributes to be provided in all subclasses, even in ones where we know settings exactly
+        # and can provide them directly in the subclass constructor implementation. Thus it would enable
+        # nonsensical settings, which should be avoided.
         if len(normalisationRules) > 0 and normalisationRuleTemplate is not None:
             raise ValueError(f"normalisationRules should be empty when a normalisationRuleTemplate is provided")
 
@@ -981,3 +987,19 @@ def flattenedFeatureGenerator(fgen: FeatureGenerator, columnsToFlatten: List[str
     else:
         return ChainedFeatureGenerator(fgen,
             MultiFeatureGenerator(flatteningGenerator, FeatureGeneratorTakeColumns(exceptColumns=columnsToFlatten)))
+
+
+class FeatureGeneratorFromDataFrameTransformer(FeatureGenerator):  # adapter: exposes a DataFrameTransformer through the FeatureGenerator interface
+    def __init__(self, dft: "DataFrameTransformer", categoricalFeatureNames: Optional[Union[Sequence[str], str]] = None,
+            normalisationRules: Sequence[data_transformation.DFTNormalisation.Rule] = (),
+            normalisationRuleTemplate: data_transformation.DFTNormalisation.RuleTemplate = None,
+            addCategoricalDefaultRules=True):  # dft annotation is quoted: DataFrameTransformer is imported under TYPE_CHECKING only
+        super().__init__(categoricalFeatureNames=categoricalFeatureNames, normalisationRules=normalisationRules,
+            normalisationRuleTemplate=normalisationRuleTemplate, addCategoricalDefaultRules=addCategoricalDefaultRules)
+        self.dft = dft
+
+    def _fit(self, X: pd.DataFrame, Y: pd.DataFrame = None, ctx=None):  # only X is used; Y and ctx are ignored
+        self.dft.fit(X)
+
+    def _generate(self, df: pd.DataFrame, ctx=None) -> pd.DataFrame:  # applies the wrapped transformer; ctx is ignored
+        return self.dft.apply(df)

From e67ff6232e6ee2401f1beb4e182a0fff92999673 Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Sun, 29 May 2022 15:37:12 +0200
Subject: [PATCH 103/131] VectorModel:   * Added withRawInputTransformers   *
 Renamed withInputTransformers to withFeatureTransformers, retaining     the
 old method (but marked as deprecated)

---
 src/sensai/vector_model.py | 69 ++++++++++++++++++++++++++------------
 1 file changed, 47 insertions(+), 22 deletions(-)

diff --git a/src/sensai/vector_model.py b/src/sensai/vector_model.py
index 9be1f4ee..09849075 100644
--- a/src/sensai/vector_model.py
+++ b/src/sensai/vector_model.py
@@ -11,6 +11,7 @@
 import numpy as np
 import pandas as pd
 
+from sensai.util.deprecation import deprecated
 from .data import InputOutputData
 from .data_transformation import DataFrameTransformer, DataFrameTransformerChain, InvertibleDataFrameTransformer
 from .featuregen import FeatureGenerator, FeatureCollector
@@ -97,7 +98,10 @@ class VectorModel(VectorModelFittableBase, PickleLoadSaveMixin, ToStringMixin, A
     """
     TOSTRING_INCLUDE_PREPROCESSORS = False
     _TRANSIENT_MEMBERS = ["_trainingContext"]
-    _RENAMED_MEMBERS = {"checkInputColumns": "_checkInputColumns"}
+    _RENAMED_MEMBERS = {
+        "checkInputColumns": "_checkInputColumns",
+        "_inputTransformerChain": "_featureTransformerChain"
+    }
 
     def __init__(self, checkInputColumns=True):
         """
@@ -108,7 +112,8 @@ def __init__(self, checkInputColumns=True):
         """
         super().__init__()
         self._featureGenerator: Optional[FeatureGenerator] = None
-        self._inputTransformerChain = DataFrameTransformerChain()
+        self._rawInputTransformerChain = DataFrameTransformerChain()
+        self._featureTransformerChain = DataFrameTransformerChain()
         self._isFitted = False  # Note: this keeps track only of the actual model being fitted, not the pre/postprocessors
         self._predictedVariableNames: Optional[list] = None
         self._modelInputVariableNames: Optional[list] = None
@@ -118,20 +123,12 @@ def __init__(self, checkInputColumns=True):
         self._trainingContext: Optional[TrainingContext] = None
 
     def __getstate__(self):
-        state = getstate(VectorModel, self)
-        for m in VectorModel._TRANSIENT_MEMBERS:
-            if m in state:
-                del state[m]
-        return state
+        return getstate(VectorModel, self, transientProperties=self._TRANSIENT_MEMBERS)
 
     def __setstate__(self, state):
         for m in VectorModel._TRANSIENT_MEMBERS:
             state[m] = None
-        for mOld, mNew in VectorModel._RENAMED_MEMBERS.items():
-            if mOld in state:
-                state[mNew] = state[mOld]
-                del state[mOld]
-        setstate(VectorModel, self, state)
+        setstate(VectorModel, self, state, renamedProperties=self._RENAMED_MEMBERS)
 
     def _toStringExcludePrivate(self) -> bool:
         return True
@@ -150,16 +147,42 @@ def _toStringAdditionalEntries(self) -> Dict[str, Any]:
             d["name"] = self._name
         return d
 
-    def withInputTransformers(self, *inputTransformers: Union[DataFrameTransformer, List[DataFrameTransformer]]) -> __qualname__:
+    def withRawInputTransformers(self, *transformers: Union[DataFrameTransformer, List[DataFrameTransformer]]):
         """
-        Makes the model use the given input transformers (removing previously set transformers, if any).
+        Makes the model use the given transformers (removing previously set transformers, if any), which
+        are to be applied to the raw input data frame (prior to feature generation).
 
         :param inputTransformers: :class:`DataFrameTransformer` instances to use (in sequence) for the transformation of inputs
         :return: self
         """
-        self._inputTransformerChain = DataFrameTransformerChain(*inputTransformers)
+        self._rawInputTransformerChain = DataFrameTransformerChain(*transformers)
+        return self
+
+    def withFeatureTransformers(self, *inputTransformers: Union[DataFrameTransformer, List[DataFrameTransformer]]) -> __qualname__:
+        """
+        Makes the model use the given transformers (removing previously set transformers, if any),
+        which are to be applied to the data frames generated by feature generators.
+        (If the model does not use feature generators, the transformers will be applied to
+        whatever is produced by the raw input transformers or, if there are none, the original raw
+        input data frame).
+
+        :param inputTransformers: :class:`DataFrameTransformer` instances to use (in sequence) for the transformation of features
+        :return: self
+        """
+        self._featureTransformerChain = DataFrameTransformerChain(*inputTransformers)
         return self
 
+    @deprecated("Use withFeatureTransformers instead; this method will be removed in a future sensAI release.")
+    def withInputTransformers(self, *inputTransformers: Union[DataFrameTransformer, List[DataFrameTransformer]]) -> __qualname__:
+        """
+        Makes the model use the given feature transformers (removing previously set transformers, if any),
+        i.e. it transforms the data frame that is generated by the feature generators (if any).
+
+        :param inputTransformers: :class:`DataFrameTransformer` instances to use (in sequence) for the transformation of inputs
+        :return: self
+        """
+        return self.withFeatureTransformers(*inputTransformers)
+
     def withFeatureGenerator(self, featureGenerator: Optional[FeatureGenerator]) -> __qualname__:
         """
         Makes the model use the given feature generator in order to obtain the model inputs.
@@ -189,7 +212,7 @@ def withFeatureCollector(self, featureCollector: FeatureCollector) -> __qualname
         return self
 
     def _preProcessorsAreFitted(self):
-        result = self._inputTransformerChain.isFitted()
+        result = self._rawInputTransformerChain.isFitted() and self._featureTransformerChain.isFitted()  # both chains are applied in _computeModelInputs
         if self.getFeatureGenerator() is not None:
             result = result and self.getFeatureGenerator().isFitted()
         return result
@@ -231,13 +254,15 @@ def _computeModelInputs(self, X: pd.DataFrame, Y: pd.DataFrame = None, fit=False
         :return:
         """
         if fit:
+            X = self._rawInputTransformerChain.fitApply(X)
             if self._featureGenerator is not None:
                 X = self._featureGenerator.fitGenerate(X, Y, self)
-            X = self._inputTransformerChain.fitApply(X)
+            X = self._featureTransformerChain.fitApply(X)
         else:
+            X = self._rawInputTransformerChain.apply(X)
             if self._featureGenerator is not None:
                 X = self._featureGenerator.generate(X, self)
-            X = self._inputTransformerChain.apply(X)
+            X = self._featureTransformerChain.apply(X)
         return X
 
     def _computeModelOutputs(self, Y: pd.DataFrame) -> pd.DataFrame:
@@ -289,11 +314,11 @@ def _underlyingModelRequiresFitting(self) -> bool:
     def _fitPreprocessors(self, X: pd.DataFrame, Y: pd.DataFrame = None):
         # no need for fitGenerate if chain is empty
         if self._featureGenerator is not None:
-            if len(self._inputTransformerChain) == 0:
+            if len(self._featureTransformerChain) == 0:
                 self._featureGenerator.fit(X, Y)
             else:
                 X = self._featureGenerator.fitGenerate(X, Y, self)
-        self._inputTransformerChain.fit(X)
+        self._featureTransformerChain.fit(X)
 
     def fitInputOutputData(self, ioData: InputOutputData, fitPreprocessors=True):
         """
@@ -375,7 +400,7 @@ def getInputTransformer(self, cls: Type[DataFrameTransformer]):
         :param cls: the type of transformer to look for
         :return: the first matching transformer or None
         """
-        for it in self._inputTransformerChain.dataFrameTransformers:
+        for it in self._featureTransformerChain.dataFrameTransformers:
             if isinstance(it, cls):
                 return it
         return None
@@ -384,7 +409,7 @@ def getInputTransformerChain(self) -> DataFrameTransformerChain:
         """
         :return: the model's input transformer chain (which may be empty and contain no actual transformers)
         """
-        return self._inputTransformerChain
+        return self._featureTransformerChain
 
     def setFeatureGenerator(self, featureGenerator: Optional[FeatureGenerator]):
         self.withFeatureGenerator(featureGenerator)

From 1a18405b8347d190c2b8b9a131d30b07dcc07ec5 Mon Sep 17 00:00:00 2001
From: Mischa Panchenko <michael.panchenko@unternehmertum.de>
Date: Sun, 29 May 2022 16:05:51 +0200
Subject: [PATCH 104/131] FgenTakeColumns: allowed to not raise errors on
 missing columns

---
 src/sensai/featuregen.py | 19 ++++++++++++++-----
 1 file changed, 14 insertions(+), 5 deletions(-)

diff --git a/src/sensai/featuregen.py b/src/sensai/featuregen.py
index ace07141..3a59354c 100644
--- a/src/sensai/featuregen.py
+++ b/src/sensai/featuregen.py
@@ -421,7 +421,8 @@ class FeatureGeneratorTakeColumns(RuleBasedFeatureGenerator):
     def __init__(self, columns: Union[str, List[str]] = None, exceptColumns: Sequence[str] = (),
             categoricalFeatureNames: Optional[Union[Sequence[str], str]] = (),
             normalisationRules: Sequence[data_transformation.DFTNormalisation.Rule] = (),
-            normalisationRuleTemplate: data_transformation.DFTNormalisation.RuleTemplate = None):
+            normalisationRuleTemplate: data_transformation.DFTNormalisation.RuleTemplate = None,
+            verifyColumnNames=True):
         """
         :param columns: name of the column or list of names of columns to be taken. If None, all columns will be taken.
         :param exceptColumns: list of names of columns to not take if present in the input df
@@ -435,21 +436,29 @@ def __init__(self, columns: Union[str, List[str]] = None, exceptColumns: Sequenc
             within a data processing pipeline. They do not affect feature generation.
         :param normalisationRuleTemplate: This parameter can be supplied instead of normalisationRules for the case where
             there shall be a single rule that applies to all columns generated by this feature generator that were not labeled as categorical.
+        :param verifyColumnNames: if True and columns to take were specified, will raise an error in case said columns
+            are missing during feature generation. If False, will log on info level instead
         """
         super().__init__(categoricalFeatureNames=categoricalFeatureNames, normalisationRules=normalisationRules, normalisationRuleTemplate=normalisationRuleTemplate)
         if isinstance(columns, str):
             columns = [columns]
         self.columns = columns
         self.exceptColumns = exceptColumns
+        self.verifyColumnNames = verifyColumnNames
 
     def _generate(self, df: pd.DataFrame, ctx=None) -> pd.DataFrame:
         columnsToTake = self.columns if self.columns is not None else df.columns
         columnsToTake = [col for col in columnsToTake if col not in self.exceptColumns]
 
-        missingCols = set(columnsToTake).difference(df.columns)
-        if len(missingCols) > 0:
-            raise Exception(f"Columns {missingCols} not present in data frame; available columns: {list(df.columns)}")
-
+        if self.columns is not None:
+            missingCols = set(columnsToTake).difference(df.columns)
+            if len(missingCols) > 0:
+                missing_cols_notification = f"Columns {missingCols} were specified but are not present in data frame. " \
+                               f"verifyColumnNames was set to {self.verifyColumnNames}; " \
+                               f"available columns: {list(df.columns)}"
+                if self.verifyColumnNames:
+                    raise RuntimeError(missing_cols_notification)
+                log.info(missing_cols_notification)
         return df[columnsToTake]
 
     def info(self):

From 281a76fefb5aa41492a049e820d6f50e3400751c Mon Sep 17 00:00:00 2001
From: Mischa Panchenko <michael.panchenko@unternehmertum.de>
Date: Sun, 29 May 2022 16:11:00 +0200
Subject: [PATCH 105/131] Minor improvement in docstrings

---
 src/sensai/vector_model.py | 12 ++++++------
 1 file changed, 6 insertions(+), 6 deletions(-)

diff --git a/src/sensai/vector_model.py b/src/sensai/vector_model.py
index 09849075..8ed3652e 100644
--- a/src/sensai/vector_model.py
+++ b/src/sensai/vector_model.py
@@ -149,27 +149,27 @@ def _toStringAdditionalEntries(self) -> Dict[str, Any]:
 
     def withRawInputTransformers(self, *transformers: Union[DataFrameTransformer, List[DataFrameTransformer]]):
         """
-        Makes the model use the given transformers (removing previously set transformers, if any), which
+        Makes the model use the given transformers (removing previously set raw input transformers, if any), which
         are to be applied to the raw input data frame (prior to feature generation).
 
-        :param inputTransformers: :class:`DataFrameTransformer` instances to use (in sequence) for the transformation of inputs
+        :param transformers: :class:`DataFrameTransformer` instances to use (in sequence) for the transformation of inputs
         :return: self
         """
         self._rawInputTransformerChain = DataFrameTransformerChain(*transformers)
         return self
 
-    def withFeatureTransformers(self, *inputTransformers: Union[DataFrameTransformer, List[DataFrameTransformer]]) -> __qualname__:
+    def withFeatureTransformers(self, *transformers: Union[DataFrameTransformer, List[DataFrameTransformer]]) -> __qualname__:
         """
-        Makes the model use the given transformers (removing previously set transformers, if any),
+        Makes the model use the given transformers (removing previously set feature transformers, if any),
         which are to be applied to the data frames generated by feature generators.
         (If the model does not use feature generators, the transformers will be applied to
         whatever is produced by the raw input transformers or, if there are none, the original raw
         input data frame).
 
-        :param inputTransformers: :class:`DataFrameTransformer` instances to use (in sequence) for the transformation of features
+        :param transformers: :class:`DataFrameTransformer` instances to use (in sequence) for the transformation of features
         :return: self
         """
-        self._featureTransformerChain = DataFrameTransformerChain(*inputTransformers)
+        self._featureTransformerChain = DataFrameTransformerChain(*transformers)
         return self
 
     @deprecated("Use withFeatureTransformers instead; this method will be removed in a future sensAI release.")

From be272746b9261adb67ec028963dca437fb1d8e17 Mon Sep 17 00:00:00 2001
From: Mischa Panchenko <michael.panchenko@unternehmertum.de>
Date: Sun, 29 May 2022 16:22:17 +0200
Subject: [PATCH 106/131] VectorModel: adjusted getters to new transformer
 structure

Also deprecated old getters
---
 src/sensai/vector_model.py | 48 +++++++++++++++++++++++++++++++++++---
 1 file changed, 45 insertions(+), 3 deletions(-)

diff --git a/src/sensai/vector_model.py b/src/sensai/vector_model.py
index 8ed3652e..4731039d 100644
--- a/src/sensai/vector_model.py
+++ b/src/sensai/vector_model.py
@@ -393,21 +393,63 @@ def getModelInputVariableNames(self) -> Optional[List[str]]:
         """
         return self._modelInputVariableNames
 
+    @deprecated("Use getFeatureTransformer instead, this method will be removed in a future release")
     def getInputTransformer(self, cls: Type[DataFrameTransformer]):
         """
-        Gets the (first) input transformer of the given type (if any) within this models input transformer chain
+        Gets the (first) feature transformer of the given type (if any) within this model's feature transformer chain
 
         :param cls: the type of transformer to look for
-        :return: the first matching transformer or None
+        :return: the first matching feature transformer or None
         """
         for it in self._featureTransformerChain.dataFrameTransformers:
             if isinstance(it, cls):
                 return it
         return None
 
+    def getFeatureTransformer(self, cls: Type[DataFrameTransformer]):
+        """
+        Gets the (first) feature transformer of the given type (if any) within this model's feature transformer chain
+
+        :param cls: the type of transformer to look for
+        :return: the first matching feature transformer or None
+        """
+        for it in self._featureTransformerChain.dataFrameTransformers:
+            if isinstance(it, cls):
+                return it
+        return None
+
+    def getRawInputTransformer(self, cls: Type[DataFrameTransformer]):
+        """
+        Gets the (first) raw input transformer of the given type (if any) within this model's raw input transformer chain
+
+        :param cls: the type of transformer to look for
+        :return: the first matching raw input transformer or None
+        """
+        for it in self._rawInputTransformerChain.dataFrameTransformers:
+            if isinstance(it, cls):
+                return it
+        return None
+
+    @deprecated("Use getFeatureTransformerChain instead, this method will be removed in a future release")
     def getInputTransformerChain(self) -> DataFrameTransformerChain:
         """
-        :return: the model's input transformer chain (which may be empty and contain no actual transformers)
+        :return: the model's feature transformer chain (which may be empty and contain no actual transformers),
+            i.e. the transformers that are applied after feature generation
+        """
+        return self._featureTransformerChain
+
+
+    def getRawInputTransformerChain(self) -> DataFrameTransformerChain:
+        """
+        :return: the model's raw input transformer chain (which may be empty and contain no actual transformers),
+            i.e. the transformers that are applied before feature generation
+        """
+        return self._rawInputTransformerChain
+
+    def getFeatureTransformerChain(self) -> DataFrameTransformerChain:
+        """
+        :return: the model's feature transformer chain (which may be empty and contain no actual transformers),
+            i.e. the transformers that are applied after feature generation
         """
         return self._featureTransformerChain
 

From b8d550a21f367f92240510e8c451487fe43a358d Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Sun, 29 May 2022 20:29:30 +0200
Subject: [PATCH 107/131] listString: Support brackets=None

Improved docstrings
---
 src/sensai/util/string.py | 19 +++++++++++--------
 1 file changed, 11 insertions(+), 8 deletions(-)

diff --git a/src/sensai/util/string.py b/src/sensai/util/string.py
index 47716fe4..81428f28 100644
--- a/src/sensai/util/string.py
+++ b/src/sensai/util/string.py
@@ -52,8 +52,11 @@ def item(x):
             return quote + x + quote
         else:
             return x
-
-    return brackets[:1] + ", ".join((item(x) for x in l)) + brackets[-1:]
+    s = ", ".join((item(x) for x in l))
+    if brackets is not None:
+        return brackets[:1] + s + brackets[-1:]
+    else:
+        return s
 
 
 def toString(x, converter: StringConverter = None, applyConverterToNonComplexObjects=True):
@@ -121,22 +124,22 @@ class ToStringMixin:
     representation).
 
         * To exclude private properties, override :meth:`_toStringExcludePrivate` to return True. If there are exceptions
-          (and some private properties shall be retained), additionally override :meth:`__toStringExcludeExceptions`.
+          (and some private properties shall be retained), additionally override :meth:`_toStringExcludeExceptions`.
         * To exclude a particular set of properties, override :meth:`_toStringExcludes`.
         * To include only select properties (introducing inclusion semantics), override :meth:`_toStringIncludes`.
         * To add values to the properties list that aren't actually properties of the object (i.e. derived properties),
           override :meth:`_toStringAdditionalEntries`.
-        * To define a fully custom representation for <object info> which is not based on the above principles, override
+        * To define a fully custom representation for ``<object info>`` which is not based on the above principles, override
           :meth:`_toStringObjectInfo`.
 
-    For well-defined string conversions within a class hierarchy, it can be good practice to define additional
+    For well-defined string conversions within a class hierarchy, it can be a good practice to define additional
     inclusions/exclusions by overriding the respective method once more and basing the return value on an extended
     version of the value returned by superclass.
     In some cases, the requirements of a subclass can be at odds with the definitions in the superclass: The superclass
     may make use of exclusion semantics, but the subclass may want to use inclusion semantics (and include
-    only some of the many properties it adds). If the subclass used :meth:`_toStringInclude` the exclusion semantics
-    of the superclass would be void and none of its properties would be included.
-    In this case, override :meth:`_toStringIncludesForced` to add inclusions regardless of the semantics otherwise used along
+    only some of the many properties it adds). In this case, if the subclass used :meth:`_toStringIncludes`, the exclusion semantics
+    of the superclass would be void and none of its properties would actually be included.
+    In such cases, override :meth:`_toStringIncludesForced` to add inclusions regardless of the semantics otherwise used along
     the class hierarchy.
 
     .. document private functions

From 8db72617f78776ebb6fc6048e28a5cbe390468ef Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Sun, 29 May 2022 20:31:20 +0200
Subject: [PATCH 108/131] Added class TorchModelFromModule

Added factory methods:
  * TorchVectorRegressionModel.fromModule
  * TorchVectorClassificationModel.fromModule
---
 src/sensai/torch/torch_base.py | 28 +++++++++++++++++++++++++---
 1 file changed, 25 insertions(+), 3 deletions(-)

diff --git a/src/sensai/torch/torch_base.py b/src/sensai/torch/torch_base.py
index 820f8b18..ef136b6f 100644
--- a/src/sensai/torch/torch_base.py
+++ b/src/sensai/torch/torch_base.py
@@ -335,6 +335,15 @@ def createTorchModule(self) -> torch.nn.Module:
         return self.moduleFactory(*self.args, **self.kwargs)
 
 
+class TorchModelFromModule(TorchModel):
+    def __init__(self, module: torch.nn.Module, cuda: bool = True):
+        super().__init__(cuda=cuda)
+        self.module = module
+
+    def createTorchModule(self) -> torch.nn.Module:
+        return self.module
+
+
 class VectorTorchModel(TorchModel, ABC):
     """
     Base class for TorchModels that can be used within VectorModels, where the input and output dimensions
@@ -375,9 +384,9 @@ def __init__(self, modelClass: Callable[..., TorchModel], modelArgs: Sequence =
             normalisationMode: NormalisationMode = NormalisationMode.NONE,
             nnOptimiserParams: Union[dict, NNOptimiserParams, None] = None) -> None:
         """
-        :param modelClass: the constructor with which to create the wrapped torch vector model
-        :param modelArgs: the constructor argument list to pass to modelClass
-        :param modelKwArgs: the dictionary of constructor keyword arguments to pass to modelClass
+        :param modelClass: the constructor/factory function with which to create the contained TorchModel instance
+        :param modelArgs: the constructor argument list to pass to ``modelClass``
+        :param modelKwArgs: the dictionary of constructor keyword arguments to pass to ``modelClass``
         :param normalisationMode: the normalisation mode to apply to input data frames
         :param nnOptimiserParams: the parameters to apply in NNOptimiser during training
         """
@@ -410,6 +419,12 @@ def __setstate__(self, state) -> None:
             "outputTensorToArrayConverter"]
         setstate(TorchVectorRegressionModel, self, state, newOptionalProperties=newOptionalMembers)
 
+    @classmethod
+    def fromModule(cls, module: torch.nn.Module, cuda=True, normalisationMode: NormalisationMode = NormalisationMode.NONE,
+            nnOptimiserParams: Optional[NNOptimiserParams] = None) -> "TorchVectorRegressionModel":
+        return cls(TorchModelFromModule, modelKwArgs=dict(module=module, cuda=cuda), normalisationMode=normalisationMode,
+            nnOptimiserParams=nnOptimiserParams)
+
     def withInputTensoriser(self, tensoriser: Tensoriser) -> __qualname__:
         """
         :param tensoriser: tensoriser to use in order to convert input data frames to (one or more) tensors.
@@ -557,6 +572,13 @@ def __setstate__(self, state) -> None:
         setstate(TorchVectorClassificationModel, self, state, newOptionalProperties=newOptionalMembers,
             newDefaultProperties=newDefaultProperties)
 
+    @classmethod
+    def fromModule(cls, outputMode: ClassificationOutputMode, module: torch.nn.Module, cuda=True,
+            normalisationMode: NormalisationMode = NormalisationMode.NONE,
+            nnOptimiserParams: Optional[NNOptimiserParams] = None) -> "TorchVectorRegressionModel":
+        return cls(outputMode, TorchModelFromModule, modelKwArgs=dict(module=module, cuda=cuda),
+            normalisationMode=normalisationMode, nnOptimiserParams=nnOptimiserParams)
+
     def withInputTensoriser(self, tensoriser: Tensoriser) -> __qualname__:
         """
         :param tensoriser: tensoriser to use in order to convert input data frames to (one or more) tensors.

From 98ef634b9d548ea63a8ea9bf1173a2bbbb15a8e2 Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Sun, 29 May 2022 20:36:00 +0200
Subject: [PATCH 109/131] Added second CNN example (from module), motivating
 the input/output adaptiveness of the original model

---
 notebooks/neural_networks.ipynb | 210 ++++++++++++++++++++++++++------
 1 file changed, 173 insertions(+), 37 deletions(-)

diff --git a/notebooks/neural_networks.ipynb b/notebooks/neural_networks.ipynb
index 5f27e802..7b3def36 100644
--- a/notebooks/neural_networks.ipynb
+++ b/notebooks/neural_networks.ipynb
@@ -1,5 +1,15 @@
 {
  "cells": [
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "%load_ext autoreload\n",
+    "%autoreload 2"
+   ]
+  },
   {
    "cell_type": "code",
    "execution_count": null,
@@ -136,9 +146,11 @@
    "source": [
     "import sensai.torch\n",
     "\n",
-    "nnOptimiserParams = sensai.torch.NNOptimiserParams(earlyStoppingEpochs=10, batchSize=54)\n",
-    "torchMLPModel = sensai.torch.models.MultiLayerPerceptronVectorClassificationModel(hiddenDims=(50, 20), cuda=False,\n",
-    "        normalisationMode=sensai.torch.NormalisationMode.MAX_ALL, nnOptimiserParams=nnOptimiserParams, pDropout=0.0).withName(\"MLP\")\n"
+    "nnOptimiserParams = sensai.torch.NNOptimiserParams(earlyStoppingEpochs=2, batchSize=54)\n",
+    "torchMLPModel = sensai.torch.models.MultiLayerPerceptronVectorClassificationModel(hiddenDims=(50, 20), \n",
+    "        cuda=False, normalisationMode=sensai.torch.NormalisationMode.MAX_ALL, \n",
+    "        nnOptimiserParams=nnOptimiserParams, pDropout=0.0) \\\n",
+    "    .withName(\"MLP\")"
    ]
   },
   {
@@ -159,8 +171,22 @@
    "outputs": [],
    "source": [
     "randomForestModel = sensai.sklearn.classification.SkLearnRandomForestVectorClassificationModel(min_samples_leaf=1, n_estimators=10) \\\n",
-    "    .withName(\"RandomForest\")\n",
-    "\n",
+    "    .withName(\"RandomForest\")"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "Let's compare the two models using our evaluation utility."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
     "evalUtil.compareModels([randomForestModel, torchMLPModel])"
    ]
   },
@@ -177,11 +203,127 @@
    "source": [
     "### Creating a Custom CNN Model\n",
     "\n",
-    "Given that this is an image recognition problem, it can be sensible to apply convolutional neural networks (CNNs), which can analyse smaller patches of the image in order to generate more high-level features from them.\n",
+    "Given that this is an image recognition problem, it can be sensible to apply convolutional neural networks (CNNs), which can analyse patches of the image in order to generate more high-level features from them.\n",
+    "Specifically, we shall apply a neural network model which uses multiple convolutions, a max-pooling layer and a multi-layer perceptron at the end in order to produce the classification.\n",
+    "\n",
+    "For classification and regression, sensAI provides the fundamental classes `TorchVectorClassificationModel` and `TorchVectorRegressionModel` respectively. Ultimately, these classes will wrap an instance of `torch.nn.Module`, the base class for neural networks in PyTorch.\n",
+    "\n",
+    "#### Wrapping a Custom torch.nn.Module Instance\n",
     "\n",
-    "To define a custom neural network model that uses PyTorch, we need to implement a new model class. For classification and regression, sensAI provides the base classes `TorchVectorClassificationModel` and `TorchVectorRegressionModel` respectively. Ultimately, these classes will wrap an instance of `torch.nn.Module`, the base class for neural networks in PyTorch.\n",
+    "If we already have an implementation of a ``torch.nn.Module``, it can be straightforwardly adapted to a sensAI model.\n",
     "\n",
-    "In the following, we shall define a model which uses multiple convolutions, a max-pooling layer and a multi-layer perceptron at the end in order to produce the classification."
+    "Let's say we had the following implementation of a torch module, which performs the steps described above.\n"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "import torch\n",
+    "\n",
+    "class MnistCnnModule(torch.nn.Module):\n",
+    "    def __init__(self, imageDim: int, outputDim: int, numConv: int, kernelSize: int, poolingKernelSize: int, \n",
+    "            mlpHiddenDims: Sequence[int], outputActivationFn: sensai.torch.ActivationFunction, pDropout=0.0):\n",
+    "        super().__init__()\n",
+    "        k = kernelSize\n",
+    "        p = poolingKernelSize\n",
+    "        self.cnn = torch.nn.Conv2d(1, numConv, (k, k))\n",
+    "        self.pool = torch.nn.MaxPool2d((p, p))\n",
+    "        self.dropout = torch.nn.Dropout(p=pDropout)\n",
+    "        reducedDim = (imageDim-k+1)/p\n",
+    "        if int(reducedDim) != reducedDim:\n",
+    "            raise ValueError(f\"Pooling kernel size {p} is not a divisor of post-convolution dimension {imageDim-k+1}\")\n",
+    "        self.mlp = sensai.torch.models.MultiLayerPerceptron(numConv * int(reducedDim)**2, outputDim, mlpHiddenDims,\n",
+    "            outputActivationFn=outputActivationFn.getTorchFunction(),\n",
+    "            hidActivationFn=sensai.torch.ActivationFunction.RELU.getTorchFunction(),\n",
+    "            pDropout=pDropout)\n",
+    "\n",
+    "    def forward(self, x):\n",
+    "        x = self.cnn(x.unsqueeze(1))\n",
+    "        x = self.pool(x)\n",
+    "        x = x.view(x.shape[0], -1)\n",
+    "        x = self.dropout(x)\n",
+    "        return self.mlp(x)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "Since this module requires 2D images as input, we will need a component that transforms the vector input that is given in our data frame into a tensor that will serve as input to the module.\n",
+    "In sensAI, the abstraction for this purpose is a ``sensai.torch.Tensoriser``. A **Tensoriser** can, in principle, perform arbitrary computations in order to produce, from a data frame with N rows, one or more tensors of length N (first dimension equal to N) that will ultimately be fed to the neural network.\n",
+    "\n",
+    "Luckily, for the case at hand, we already have the function ``reshape2DImage`` from above to assist in the implementation of the tensoriser."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "class ImageReshapingInputTensoriser(sensai.torch.RuleBasedTensoriser):\n",
+    "    def _tensorise(self, df: pd.DataFrame) -> Union[torch.Tensor, List[torch.Tensor]]:\n",
+    "        images = [reshape2DImage(row) for _, row in df.iterrows()]\n",
+    "        return torch.tensor(np.stack(images)).float() / 255"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "In this case, we derived the class from ``RuleBasedTensoriser`` rather than ``Tensoriser``, because it does not require fitting. We additionally took care of the normalisation within the tensoriser.\n",
+    "\n",
+    "Now we have all we need to create a sensAI ``TorchVectorClassificationModel`` that will work on the input/output data we loaded earlier."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "cnnModule = MnistCnnModule(28, 10, 32, 5, 2, (200, 20), sensai.torch.ActivationFunction.LOG_SOFTMAX)\n",
+    "nnOptimiserParams = sensai.torch.NNOptimiserParams(optimiser=sensai.torch.Optimiser.ADAMW, optimiserLR=0.01, batchSize=1024, \n",
+    "    earlyStoppingEpochs=3)\n",
+    "cnnModelFromModule = sensai.torch.TorchVectorClassificationModel.fromModule(\n",
+    "        sensai.torch.ClassificationOutputMode.LOG_PROBABILITIES, \n",
+    "        cnnModule, cuda=False, nnOptimiserParams=nnOptimiserParams) \\\n",
+    "    .withInputTensoriser(ImageReshapingInputTensoriser()) \\\n",
+    "    .withName(\"CNN\")"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "We have now fully defined all the necessary parameters, including parameters controlling the training of the model.\n",
+    "\n",
+    "We are now ready to evaluate the model."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "evalUtil.performSimpleEvaluation(cnnModelFromModule);"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "#### Creating an Input-/Output-Adaptive Custom Model\n",
+    "\n",
+    "While the above approach allows us to straightforwardly encapsulate a ``torch.nn.Module``, it really doesn't follow sensAI's principle of adapting model hyperparameters based on the inputs and outputs we receive during training - whenever possible. Notice that in the above example, we had to hard-code the image dimension (``28``) as well as the number of classes (``10``), even though these parameters could have been easily determined from the data. Especially in other domains where feature engineering is possible, we might want to experiment with different combinations of features, and therefore automatically adapting to inputs is key if we want to avoid editing the model hyperparameters time and time again; similarly, we might change the set of target labels in our classification problem and the model should simply adapt to a changed output dimension.\n",
+    "\n",
+    "To design a model that can fully adapt to the inputs and outputs, we can simply subclass ``TorchVectorClassificationModel``, where the late instantiation of the underlying model is catered for. Naturally, delayed construction of the underlying model necessitates the use of factories and thus results in some indirections. \n",
+    "\n",
+    "If we had designed the above model to be within the sensAI ``VectorModel`` realm from the beginning, here's what we might have written:"
    ]
   },
   {
@@ -204,36 +346,30 @@
     "        self.pDropout = pDropout\n",
     "        super().__init__(sensai.torch.ClassificationOutputMode.forActivationFn(self.outputActivationFn),\n",
     "            modelClass=self.VectorTorchModel, modelArgs=[self], nnOptimiserParams=nnOptimiserParams)\n",
-    "        self.withInputTensoriser(self.InputTensoriser())\n",
-    "\n",
-    "    class InputTensoriser(sensai.torch.RuleBasedTensoriser):\n",
-    "        def _tensorise(self, df: pd.DataFrame) -> Union[torch.Tensor, List[torch.Tensor]]:\n",
-    "            images = [reshape2DImage(row) for _, row in df.iterrows()]\n",
-    "            return torch.tensor(np.stack(images)).float() / 255\n",
     "\n",
     "    class VectorTorchModel(sensai.torch.VectorTorchModel):\n",
-    "        def __init__(self, vecModel: \"CnnModel\"):\n",
-    "            super().__init__(vecModel.cuda)\n",
-    "            self._vecModel = vecModel\n",
+    "        def __init__(self, parent: \"CnnModel\"):\n",
+    "            super().__init__(parent.cuda)\n",
+    "            self._parent = parent\n",
     "\n",
     "        def createTorchModuleForDims(self, inputDim: int, outputDim: int) -> torch.nn.Module:\n",
-    "            return self.Module(int(np.sqrt(inputDim)), outputDim, self._vecModel)\n",
+    "            return self.Module(int(np.sqrt(inputDim)), outputDim, self._parent)\n",
     "\n",
     "        class Module(torch.nn.Module):\n",
-    "            def __init__(self, imageDim, outputDim, vecModel: \"CnnModel\"):\n",
+    "            def __init__(self, imageDim, outputDim, parent: \"CnnModel\"):\n",
     "                super().__init__()\n",
-    "                k = vecModel.kernelSize\n",
-    "                p = vecModel.poolingKernelSize\n",
-    "                self.cnn = torch.nn.Conv2d(1, vecModel.numConv, (k, k))\n",
+    "                k = parent.kernelSize\n",
+    "                p = parent.poolingKernelSize\n",
+    "                self.cnn = torch.nn.Conv2d(1, parent.numConv, (k, k))\n",
     "                self.pool = torch.nn.MaxPool2d((p, p))\n",
-    "                self.dropout = torch.nn.Dropout(p=vecModel.pDropout)\n",
+    "                self.dropout = torch.nn.Dropout(p=parent.pDropout)\n",
     "                reducedDim = (imageDim-k+1)/p\n",
     "                if int(reducedDim) != reducedDim:\n",
     "                    raise ValueError(f\"Pooling kernel size {p} is not a divisor of post-convolution dimension {imageDim-k+1}\")\n",
-    "                self.mlp = sensai.torch.models.MultiLayerPerceptron(vecModel.numConv * int(reducedDim)**2, outputDim, vecModel.mlpHiddenDims,\n",
-    "                    outputActivationFn=vecModel.outputActivationFn.getTorchFunction(),\n",
+    "                self.mlp = sensai.torch.models.MultiLayerPerceptron(parent.numConv * int(reducedDim)**2, outputDim, parent.mlpHiddenDims,\n",
+    "                    outputActivationFn=parent.outputActivationFn.getTorchFunction(),\n",
     "                    hidActivationFn=sensai.torch.ActivationFunction.RELU.getTorchFunction(),\n",
-    "                    pDropout=vecModel.pDropout)\n",
+    "                    pDropout=parent.pDropout)\n",
     "\n",
     "            def forward(self, x):\n",
     "                x = self.cnn(x.unsqueeze(1))\n",
@@ -247,12 +383,10 @@
    "cell_type": "markdown",
    "metadata": {},
    "source": [
-    "Very little code is required in addition to the actual torch module.\n",
-    "The outer class, which provides the sensAI `VectorModel` features, serves mainly to hold the parameters, and the inner class inheriting from `VectorTorchModel` serves as a factory for the `torch.nn.Module`, providing us with the input and output dimensions (number of input columns and number of classes respectively) based on the data. Because we take the dimensions directly from the input, this model could easily process other image sizes than 28x28 and we furthermore end up with fewer magic numbers in the code.\n",
-    "\n",
-    "The inner class `InputTensoriser`, which is instantiated and passed as the input tensoriser for the model, serves to convert the input data frame into a tensor. It could perform arbitrary computations in order to produce, from a data frame with N rows, one or more tensors of length N (first dimension equal to N) that will ultimately be fed to the neural network.\n",
+    "It is only insignificantly more code than in the previous implementation.\n",
+    "The outer class, which provides the sensAI `VectorModel` features, serves mainly to hold the parameters, and the inner class inheriting from `VectorTorchModel` serves as a factory for the `torch.nn.Module`, providing us with the input and output dimensions (number of input columns and number of classes respectively) based on the data, thus enabling the model to adapt. If we had required even more adaptiveness, we could have learnt more about the data from within the fitting process of a custom input tensoriser (i.e. we could have added an inner ``Tensoriser`` class, which could have derived further hyperparameters from the data in its implementation of the fitting method.)\n",
     "\n",
-    "Let's instantiate our model and see how it performs."
+    "Let's instantiate our model and evaluate it."
    ]
   },
   {
@@ -261,10 +395,10 @@
    "metadata": {},
    "outputs": [],
    "source": [
-    "nnOptimiserParams = sensai.torch.NNOptimiserParams(optimiser=sensai.torch.Optimiser.ADAMW, optimiserLR=0.01, batchSize=1024, \n",
-    "    earlyStoppingEpochs=3)\n",
     "cnnModel = CnnModel(cuda=False, kernelSize=5, numConv=32, poolingKernelSize=2, mlpHiddenDims=(200,20),\n",
-    "    nnOptimiserParams=nnOptimiserParams).withName(\"CNN\")\n",
+    "        nnOptimiserParams=nnOptimiserParams) \\\n",
+    "    .withName(\"CNN'\") \\\n",
+    "    .withInputTensoriser(ImageReshapingInputTensoriser())\n",
     "\n",
     "evalData = evalUtil.performSimpleEvaluation(cnnModel)"
    ]
@@ -273,7 +407,7 @@
    "cell_type": "markdown",
    "metadata": {},
    "source": [
-    "The model does slightly improve upon the MLP model we evaluated earlier."
+    "Our CNN models does slightly improve upon the MLP model we evaluated earlier. Let's do another comparison, so we get all the metrics in one place."
    ]
   },
   {
@@ -282,7 +416,7 @@
    "metadata": {},
    "outputs": [],
    "source": [
-    "comparisonData = evalUtil.compareModels([torchMLPModel, cnnModel, randomForestModel], fitModels=False)\n",
+    "comparisonData = evalUtil.compareModels([torchMLPModel, cnnModelFromModule, cnnModel, randomForestModel], fitModels=False)\n",
     "comparisonData.resultsDF"
    ]
   },
@@ -290,7 +424,9 @@
    "cell_type": "markdown",
    "metadata": {},
    "source": [
-    "Could the CNN model have produced even better results? Let's take a look at some examples where the CNN model went wrong."
+    "Note that any differences between the two CNN models are due only to randomness in the parameter initialisation; they are functionally identical.\n",
+    "\n",
+    "Could the CNN model have produced even better results? Let's take a look at some examples where the CNN model went wrong by inspecting the evaluation data that was returned earlier."
    ]
   },
   {

From d41788c1eb90253d2f42155a32612a7e29cccbf3 Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Sun, 29 May 2022 21:21:24 +0200
Subject: [PATCH 110/131] Disable warnings

---
 notebooks/neural_networks.ipynb | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/notebooks/neural_networks.ipynb b/notebooks/neural_networks.ipynb
index 7b3def36..eccfc796 100644
--- a/notebooks/neural_networks.ipynb
+++ b/notebooks/neural_networks.ipynb
@@ -22,8 +22,10 @@
     "import numpy as np\n",
     "from typing import *\n",
     "import config\n",
+    "import warnings\n",
     "\n",
     "cfg = config.get_config()\n",
+    "warnings.filterwarnings(\"ignore\")\n",
     "sensai.util.logging.configureLogging()"
    ]
   },

From dc37c655823c904c7f9c51ee31253b2129519274 Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Sun, 29 May 2022 21:27:47 +0200
Subject: [PATCH 111/131] TorchVectorClassificationModel.fromModule: Changed
 parameter order

---
 notebooks/neural_networks.ipynb | 6 +++---
 src/sensai/torch/torch_base.py  | 2 +-
 2 files changed, 4 insertions(+), 4 deletions(-)

diff --git a/notebooks/neural_networks.ipynb b/notebooks/neural_networks.ipynb
index eccfc796..2cfa23ad 100644
--- a/notebooks/neural_networks.ipynb
+++ b/notebooks/neural_networks.ipynb
@@ -276,7 +276,7 @@
    "cell_type": "markdown",
    "metadata": {},
    "source": [
-    "In this case, we derived the class from ``RuleBasedTensorised`` rather than ``Tensoriser``, because it does not require fitting. We additionally took care of the normalisation within the tensoriser.\n",
+    "In this case, we derived the class from ``RuleBasedTensoriser`` rather than ``Tensoriser``, because our tensoriser does not require fitting. We additionally took care of the normalisation.\n",
     "\n",
     "Now we have all we need to create a sensAI ``TorchVectorClassificationModel`` that will work on the input/output data we loaded earlier."
    ]
@@ -291,8 +291,8 @@
     "nnOptimiserParams = sensai.torch.NNOptimiserParams(optimiser=sensai.torch.Optimiser.ADAMW, optimiserLR=0.01, batchSize=1024, \n",
     "    earlyStoppingEpochs=3)\n",
     "cnnModelFromModule = sensai.torch.TorchVectorClassificationModel.fromModule(\n",
-    "        sensai.torch.ClassificationOutputMode.LOG_PROBABILITIES, \n",
-    "        cnnModule, cuda=False, nnOptimiserParams=nnOptimiserParams) \\\n",
+    "        cnnModule, sensai.torch.ClassificationOutputMode.LOG_PROBABILITIES, \n",
+    "        cuda=False, nnOptimiserParams=nnOptimiserParams) \\\n",
     "    .withInputTensoriser(ImageReshapingInputTensoriser()) \\\n",
     "    .withName(\"CNN\")"
    ]
diff --git a/src/sensai/torch/torch_base.py b/src/sensai/torch/torch_base.py
index ef136b6f..0f96ec9d 100644
--- a/src/sensai/torch/torch_base.py
+++ b/src/sensai/torch/torch_base.py
@@ -573,7 +573,7 @@ def __setstate__(self, state) -> None:
             newDefaultProperties=newDefaultProperties)
 
     @classmethod
-    def fromModule(cls, outputMode: ClassificationOutputMode, module: torch.nn.Module, cuda=True,
+    def fromModule(cls, module: torch.nn.Module, outputMode: ClassificationOutputMode, cuda=True,
             normalisationMode: NormalisationMode = NormalisationMode.NONE,
             nnOptimiserParams: Optional[NNOptimiserParams] = None) -> "TorchVectorRegressionModel":
         return cls(outputMode, TorchModelFromModule, modelKwArgs=dict(module=module, cuda=cuda),

From fdc998ae342ebb9b00301892c7c640c031a9af90 Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Sun, 29 May 2022 21:33:59 +0200
Subject: [PATCH 112/131] Fixed typos, minor improvements

---
 notebooks/neural_networks.ipynb | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/notebooks/neural_networks.ipynb b/notebooks/neural_networks.ipynb
index 2cfa23ad..6461bba1 100644
--- a/notebooks/neural_networks.ipynb
+++ b/notebooks/neural_networks.ipynb
@@ -212,7 +212,7 @@
     "\n",
     "#### Wrapping a Custom torch.nn.Module Instance\n",
     "\n",
-    "If we already had an implementation of a ``torch.nn.Module`, it can be straightforwardly adapted to a sensAI model.\n",
+    "If we already had an implementation of a `torch.nn.Module`, it can be straightforwardly adapted to become a sensAI ``VectorModel``.\n",
     "\n",
     "Let's say we had the following implementation of a torch module, which performs the steps described above.\n"
    ]
@@ -409,7 +409,7 @@
    "cell_type": "markdown",
    "metadata": {},
    "source": [
-    "Our CNN models does slightly improve upon the MLP model we evaluated earlier. Let's do another comparison, so we get all the metrics in one place."
+    "Our CNN models do improve upon the MLP model we evaluated earlier. Let's do a comparison of all the models we trained thus far:"
    ]
   },
   {

From 9a0efcdf5f996e6ae81286870c4c4a495c077f02 Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Mon, 30 May 2022 00:18:00 +0200
Subject: [PATCH 113/131] Fixed type annotation

---
 src/sensai/torch/torch_base.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/sensai/torch/torch_base.py b/src/sensai/torch/torch_base.py
index 0f96ec9d..7aa37c99 100644
--- a/src/sensai/torch/torch_base.py
+++ b/src/sensai/torch/torch_base.py
@@ -575,7 +575,7 @@ def __setstate__(self, state) -> None:
     @classmethod
     def fromModule(cls, module: torch.nn.Module, outputMode: ClassificationOutputMode, cuda=True,
             normalisationMode: NormalisationMode = NormalisationMode.NONE,
-            nnOptimiserParams: Optional[NNOptimiserParams] = None) -> "TorchVectorRegressionModel":
+            nnOptimiserParams: Optional[NNOptimiserParams] = None) -> "TorchVectorClassificationModel":
         return cls(outputMode, TorchModelFromModule, modelKwArgs=dict(module=module, cuda=cuda),
             normalisationMode=normalisationMode, nnOptimiserParams=nnOptimiserParams)
 

From 297bb5eed5f45851f4b2c6395636fb28ca0b08ae Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Mon, 30 May 2022 01:26:41 +0200
Subject: [PATCH 114/131] Fixed choice of loss function & activation (was
 mismatch), added proper evaluation and adapted preamble

---
 .../tensor_models_pytorch_lightning.ipynb     | 120 ++++++++++--------
 1 file changed, 64 insertions(+), 56 deletions(-)

diff --git a/notebooks/tensor_models_pytorch_lightning.ipynb b/notebooks/tensor_models_pytorch_lightning.ipynb
index daf1260b..8b5fb9dc 100644
--- a/notebooks/tensor_models_pytorch_lightning.ipynb
+++ b/notebooks/tensor_models_pytorch_lightning.ipynb
@@ -1,5 +1,30 @@
 {
  "cells": [
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "%load_ext autoreload\n",
+    "%autoreload 2"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "import sys; sys.path.extend([\"../src\", \"..\"])\n",
+    "import sensai\n",
+    "import logging\n",
+    "import config\n",
+    "\n",
+    "c = config.get_config(reload=True)\n",
+    "sensai.util.logging.configureLogging(level=logging.INFO)"
+   ]
+  },
   {
    "cell_type": "markdown",
    "metadata": {
@@ -15,45 +40,6 @@
     "and trainers for even faster development and experimentation."
    ]
   },
-  {
-   "cell_type": "markdown",
-   "metadata": {
-    "collapsed": false
-   },
-   "source": [
-    "### Before running the notebook\n",
-    "\n",
-    "Install the package and its dependencies, if you haven't done so already. E.g. for an editable install call\n",
-    "```\n",
-    "pip install -e .\n",
-    "```\n",
-    "from the root directory. You can also execute this command directly in the notebook but will need to reload the\n",
-    "kernel afterwards\n"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Note - this cell should be executed only once per session\n",
-    "\n",
-    "%load_ext autoreload\n",
-    "%autoreload 2\n",
-    "\n",
-    "import sys, os\n",
-    "\n",
-    "# in order to get the top level modules; they are not part of the package\n",
-    "os.chdir(\"..\")\n",
-    "sys.path.append(os.path.abspath(\".\"))\n",
-    "try:\n",
-    "    import sensai\n",
-    "except:\n",
-    "    sys.path.append(os.path.abspath(\"src\"))\n",
-    "    import sensai"
-   ]
-  },
   {
    "cell_type": "code",
    "execution_count": null,
@@ -128,7 +114,7 @@
     }
    },
    "source": [
-    "## Using Data Loaders in pure PyTorch Lightning\n",
+    "## Using Data Loaders in Pure PyTorch Lightning\n",
     "\n",
     "First, let us see how training would proceed in pure pytorch-lightning.\n",
     "\n",
@@ -147,14 +133,16 @@
    },
    "outputs": [],
    "source": [
+    "TEST_FRACTION = 0.2\n",
     "VALIDATION_FRACTION = 0.1\n",
     "\n",
     "full_ds = InputOutputArrays(extractArray(X), extractArray(labels))\n",
-    "splitter = DataSplitterFractional(1-VALIDATION_FRACTION)\n",
     "\n",
-    "train_ds, val_ds = splitter.split(full_ds)\n",
+    "full_train_ds, test_ds = DataSplitterFractional(1-TEST_FRACTION).split(full_ds)  # hold out the test set first\n",
+    "train_ds, val_ds = DataSplitterFractional(1-VALIDATION_FRACTION).split(full_train_ds)  # then split the remainder into train/validation\n",
     "train_dataloader = train_ds.toTorchDataLoader()\n",
-    "val_dataloader = val_ds.toTorchDataLoader()"
+    "val_dataloader = val_ds.toTorchDataLoader()\n",
+    "test_dataloader = test_ds.toTorchDataLoader()"
    ]
   },
   {
@@ -190,16 +178,16 @@
     "    def forward(self, x: torch.Tensor):\n",
     "        x = x.float()\n",
     "        x = torch.relu(self.l1(x.view(x.size(0), -1)))\n",
-    "        return F.softmax(x, dim=1)\n",
+    "        return F.log_softmax(x, dim=1)\n",
     "\n",
     "    def training_step(self, batch, *args):\n",
     "        x, y = batch\n",
-    "        loss = F.cross_entropy(self(x), y)\n",
+    "        loss = F.nll_loss(self(x), y)\n",
     "        return loss\n",
     "\n",
     "    def validation_step(self, batch, *args):\n",
     "        x, y = batch\n",
-    "        loss = F.cross_entropy(self(x), y)\n",
+    "        loss = F.nll_loss(self(x), y)\n",
     "        return loss\n",
     "\n",
     "    def configure_optimizers(self):\n",
@@ -219,7 +207,7 @@
    "source": [
     "mnist_model = MNISTModel()\n",
     "\n",
-    "trainer = pl.Trainer(max_epochs=3, progress_bar_refresh_rate=20)\n",
+    "trainer = pl.Trainer(max_epochs=5, progress_bar_refresh_rate=20)\n",
     "trainer.fit(mnist_model, train_dataloader, val_dataloader)"
    ]
   },
@@ -246,13 +234,24 @@
    },
    "outputs": [],
    "source": [
-    "mini_test_set = val_dataloader.dataset[10:20]\n",
+    "mini_test_set = test_dataloader.dataset[10:20]\n",
     "test_images, test_labels = mini_test_set\n",
     "\n",
     "display(mnist_model(test_images).argmax(axis=1))\n",
     "display(test_labels)"
    ]
   },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "import sklearn\n",
+    "\n",
+    "sklearn.metrics.accuracy_score(test_ds.outputs, mnist_model(test_dataloader.dataset[:][0]).argmax(axis=1))"
+   ]
+  },
   {
    "cell_type": "markdown",
    "metadata": {
@@ -336,7 +335,10 @@
    },
    "outputs": [],
    "source": [
-    "sensaiMnistModel.fit(X, labels)"
+    "ioData = sensai.InputOutputData(X, labels)\n",
+    "trainData, testData = DataSplitterFractional(0.8).split(ioData)\n",
+    "\n",
+    "sensaiMnistModel.fitInputOutputData(trainData)"
    ]
   },
   {
@@ -364,9 +366,9 @@
    "outputs": [],
    "source": [
     "display(\"Predicted data frame\")\n",
-    "display(sensaiMnistModel.predict(X.iloc[:10]))\n",
+    "display(sensaiMnistModel.predict(testData.inputs.iloc[:10]))\n",
     "display(\"True labels data frame\")\n",
-    "display(labels.iloc[:10])"
+    "display(testData.outputs.iloc[:10])"
    ]
   },
   {
@@ -378,11 +380,17 @@
     }
    },
    "source": [
-    "## Evaluating Tensor Models\n",
-    "\n",
-    "TODO - the evaluation part is unfinished yet (although we could already the above classifier with the standard\n",
-    "vector model evaluators).\n",
-    "We should also include TensorToTensor models here and show how to evaluate them\n"
+    "## Evaluating the Model"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "evaluator = sensai.evaluation.VectorClassificationModelEvaluator(trainData, testData)\n",
+    "evaluator.evalModel(sensaiMnistModel).getEvalStats().metricsDict()"
    ]
   }
  ],

From 09aa519493ee72dd992a36c568d6d42cf6f7cd28 Mon Sep 17 00:00:00 2001
From: Dominik Jain <dominik.jain@jambit.com>
Date: Thu, 2 Jun 2022 19:18:48 +0200
Subject: [PATCH 115/131] Sync pjm

  commit 8e57a6dc02463c84a8be0c35cf224299cf0a1cb2
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Thu Jun 2 19:07:40 2022 +0200

      Fixed plot titles: 'y vs. x' instead of 'x vs. y'

  sensai/evaluation/eval_stats/eval_stats_regression.py

  commit ed32bff53491e518f1a886e0e4112811a0ccf613
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Thu Jun 2 19:06:50 2022 +0200

      MultiDataEvaluationUtil: Moved distribution & x-y plot generation to MultiDataModelComparisonData

  sensai/evaluation/eval_util.py

  commit 21735748b1e428fc24a91d861ef4a2ca2ca64b8a
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Thu Jun 2 19:05:12 2022 +0200

      EvalStatsCollection: Improved metric plots:
        * Set axis bounds with room to spare for x-y metric plots
        * Support complementary cdf for metric distribution plots and improved axis ticks

  sensai/evaluation/eval_stats/eval_stats_base.py

  commit dbd47dd8288554c6cba44fc9434c7828292d2d8d
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Thu Jun 2 18:57:37 2022 +0200

      Added ClassificationMetricAccuracyWithoutLabels

  sensai/evaluation/eval_stats/eval_stats_classification.py

  commit f9e1490f763fe4ea3d11c4f7c3cd4d580d0d0bac
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Thu Jun 2 18:48:45 2022 +0200

      ScatterPlot: Adjusted transparency function

      HistogramPlot: Support complementary cdf, configure y-axis ticks depending on stat

  sensai/util/plot.py

  commit f2226e86c15f86e6fca53f5f9624e2178b965881
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Thu Jun 2 18:27:08 2022 +0200

      PickleCached, cached: Added versioning of cached results

  sensai/util/cache.py

  commit f9b6b10a14e385c33d4cdb413d749e70af48476f
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Wed Jun 1 17:43:01 2022 +0200

      MultiDataEvaluationUtil: Enable cdf by default in distribution plots

  sensai/evaluation/eval_util.py

  commit 162120f82f630cbd040ef2c57207a3dd6a59a54a
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Wed Jun 1 17:42:26 2022 +0200

      ClassificationMetricAccuracyMaxProbabilityBeyondThreshold: Added paired metric

  sensai/evaluation/eval_stats/eval_stats_classification.py

  commit b2d58ad4741df2b3500fd4f0333afb24672b668d
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Wed Jun 1 17:42:03 2022 +0200

      EvalStatsCollection.plotDistribution: Disable kde by default, added option to add cdf

  sensai/evaluation/eval_stats/eval_stats_base.py

  commit 02f9f17d42cf35821216e26d42945e7e2b131669
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Tue May 31 22:26:23 2022 +0200

      MultiDataEvaluationUtil: Added model string representations to comparison results text file

  sensai/evaluation/eval_util.py

  commit 7171f23f583e772caee804477807177c368b0787
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Tue May 31 22:24:38 2022 +0200

      HistogramPlot: Added option to add cdf

  sensai/util/plot.py

  commit b7047166a9d14a5a291bab5fa0b421f22b8627e9
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Tue May 31 21:05:39 2022 +0200

      ScatterPlot: Determine point transparency based on number of data points

  sensai/util/plot.py

  commit 90060f2c65d8f8f3a48192f1ace4cc034e7541a5
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Tue May 31 21:03:37 2022 +0200

      * Added concept of paired metrics (e.g. precision and recall)
      * EvalStatsCollection, MultiDataEvaluationUtil: Added scatter plots of paired metrics

  sensai/evaluation/eval_stats/eval_stats_base.py
  sensai/evaluation/eval_stats/eval_stats_classification.py
  sensai/evaluation/eval_util.py

  commit 909e8c8c2c383c3c5b222362657bd84ba497849b
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Tue May 31 20:52:28 2022 +0200

      Plot: Fixed ax not always being an Axes object; allow chaining of attribute setters

  sensai/util/plot.py

  commit b43edafe3e80a90d6f6c8c1d0d51342794ec07d0
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Tue May 31 20:00:03 2022 +0200

      MultiDataEvaluationUtil: Added option to plot metric distributions

  sensai/evaluation/eval_util.py

  commit 17866e261b9b35882314259139d7d2437dc40085
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Tue May 31 19:23:01 2022 +0200

      Metrics:
        * Metric: Added bounds member
        * EvalStatsCollection:
            - Allow to retrieve Metric objects, adding second type parameter
            - Use Metric.bounds in plotDistribution
        * Added new classification metrics:
            - BinaryClassificationMetricPrecisionThreshold
            - BinaryClassificationMetricRecallThreshold
        * BinaryClassificationMetricRecallForPrecision: Added zeroValue fallback to

  sensai/evaluation/eval_stats/eval_stats_base.py
  sensai/evaluation/eval_stats/eval_stats_classification.py
  sensai/evaluation/eval_stats/eval_stats_regression.py
---
 .../evaluation/eval_stats/eval_stats_base.py  | 112 +++++++++++---
 .../eval_stats/eval_stats_classification.py   | 140 ++++++++++++++++--
 .../eval_stats/eval_stats_regression.py       |   6 +-
 src/sensai/evaluation/eval_util.py            |  48 +++++-
 src/sensai/util/cache.py                      |  27 +++-
 src/sensai/util/plot.py                       | 105 ++++++++++---
 6 files changed, 375 insertions(+), 63 deletions(-)

diff --git a/src/sensai/evaluation/eval_stats/eval_stats_base.py b/src/sensai/evaluation/eval_stats/eval_stats_base.py
index e085273b..07f542f0 100644
--- a/src/sensai/evaluation/eval_stats/eval_stats_base.py
+++ b/src/sensai/evaluation/eval_stats/eval_stats_base.py
@@ -3,8 +3,9 @@
 import seaborn as sns
 from abc import ABC, abstractmethod
 from matplotlib import pyplot as plt
-from typing import Generic, TypeVar, List, Union, Dict, Sequence, Optional
+from typing import Generic, TypeVar, List, Union, Dict, Sequence, Optional, Tuple, Callable
 
+from ...util.plot import ScatterPlot, HistogramPlot, Plot, HeatMapPlot
 from ...util.string import ToStringMixin, dictString
 from ...vector_model import VectorModel
 
@@ -65,19 +66,33 @@ def _toStringObjectInfo(self) -> str:
 class Metric(Generic[TEvalStats], ABC):
     name: str
 
-    def __init__(self, name: str = None):
+    def __init__(self, name: str = None, bounds: Optional[Tuple[float, float]] = None):
         """
         :param name: the name of the metric; if None use the class' name attribute
+        :param bounds: the minimum and maximum values the metric can take on (or None if the bounds are not specified)
         """
         # this raises an attribute error if a subclass does not specify a name as a static attribute nor as parameter
         self.name = name if name is not None else self.__class__.name
+        self.bounds = bounds
 
     @abstractmethod
     def computeValueForEvalStats(self, evalStats: TEvalStats) -> float:
         pass
 
+    def getPairedMetrics(self) -> List[TMetric]:
+        """
+        Gets a list of metrics that should be considered together with this metric (e.g. for paired visualisations/plots).
+        The direction of the pairing should be such that if this metric is "x", the other is "y" for x-y type visualisations.
+
+        :return: a list of metrics
+        """
+        return []
+
+    def hasFiniteBounds(self) -> bool:
+        return self.bounds is not None and not any((np.isinf(x) for x in self.bounds))
+
 
-class EvalStatsCollection(Generic[TEvalStats], ABC):
+class EvalStatsCollection(Generic[TEvalStats, TMetric], ABC):
     def __init__(self, evalStatsList: List[TEvalStats]):
         self.statsList = evalStatsList
         metricNamesSet = None
@@ -92,53 +107,108 @@ def __init__(self, evalStatsList: List[TEvalStats]):
                     raise Exception(f"Inconsistent set of metrics in evaluation stats collection: Got {metricNamesSet} for one instance, {currentMetricNamesSet} for another")
             metricsList.append(metrics)
         metricNames = sorted(metricsList[0].keys())
-        self.metrics = {metric: [d[metric] for d in metricsList] for metric in metricNames}
+        self._valuesByMetricName = {metric: [d[metric] for d in metricsList] for metric in metricNames}
+        self._metrics: List[TMetric] = evalStatsList[0].metrics
 
-    def getValues(self, metric):
-        return self.metrics[metric]
+    def getValues(self, metricName: str):
+        return self._valuesByMetricName[metricName]
 
     def getMetricNames(self) -> List[str]:
-        return list(self.metrics.keys())
+        return list(self._valuesByMetricName.keys())
+
+    def getMetrics(self) -> List[TMetric]:
+        return self._metrics
+
+    def getMetricByName(self, name: str) -> Optional[TMetric]:
+        for m in self._metrics:
+            if m.name == name:
+                return m
+        return None
+
+    def hasMetric(self, metric: Union[Metric, str]) -> bool:
+        if type(metric) != str:
+            metric = metric.name
+        return metric in self._valuesByMetricName
 
     def aggMetricsDict(self, aggFns=(np.mean, np.std)) -> Dict[str, float]:
         agg = {}
-        for metric, values in self.metrics.items():
+        for metric, values in self._valuesByMetricName.items():
             for aggFn in aggFns:
                 agg[f"{aggFn.__name__}[{metric}]"] = float(aggFn(values))
         return agg
 
     def meanMetricsDict(self) -> Dict[str, float]:
-        metrics = {metric: np.mean(values) for (metric, values) in self.metrics.items()}
+        metrics = {metric: np.mean(values) for (metric, values) in self._valuesByMetricName.items()}
         return metrics
 
-    def plotDistribution(self, metricName: str, subtitle: Optional[str] = None, bins=None, kde=True, stat="percent",
-            **kwargs) -> plt.Figure:
+    def plotDistribution(self, metricName: str, subtitle: Optional[str] = None, bins=None, kde=False, cdf=False,
+            cdfComplementary=False, stat="proportion", **kwargs) -> plt.Figure:
         """
         Plots the distribution of a metric as a histogram
 
-        :param metricName: the name of the metric for which to plot the distribution (histogram) across evaluations
+        :param metricName: name of the metric for which to plot the distribution (histogram) across evaluations
         :param subtitle: the subtitle to add, if any
-        :param bins: the histogram bins (number of bins or boundaries); if None, auto
+        :param bins: the histogram bins (number of bins or boundaries); metrics bounds will be used to define the x limits.
+            If None, use 'auto' bins
         :param kde: whether to add a kernel density estimator plot
-        :param stat: the statistic to compute for each bin ('percent', 'probability', 'count', 'frequency' or 'density'), y-axis value
+        :param cdf: whether to add the cumulative distribution function (cdf)
+        :param cdfComplementary: whether to plot, if ``cdf`` is True, the complementary cdf instead of the regular cdf
+        :param stat: the statistic to compute for each bin ('percent', 'probability'='proportion', 'count', 'frequency' or 'density'), y-axis value
         :param kwargs: additional parameters to pass to seaborn.histplot (see https://seaborn.pydata.org/generated/seaborn.histplot.html)
         :return:
         """
-        values = self.metrics[metricName]
-        fig = plt.figure()
+        # define bins based on metric bounds where available
+        xTick = None
+        if bins is None or type(bins) == int:
+            metric = self.getMetricByName(metricName)
+            if metric.bounds == (0, 1):
+                xTick = 0.1
+                if bins is None:
+                    numBins = 10 if cdf else 20
+                else:
+                    numBins = bins
+                bins = np.linspace(0, 1, numBins+1)
+
+        values = self._valuesByMetricName[metricName]
         title = metricName
         if subtitle is not None:
             title += "\n" + subtitle
-        plt.title(title)
-        sns.histplot(values, kde=kde, bins=bins, stat=stat, **kwargs)
-        return fig
+        plot = HistogramPlot(values, bins=bins, stat=stat, kde=kde, cdf=cdf, cdfComplementary=cdfComplementary, **kwargs).title(title)
+        if xTick is not None:
+            plot.xtickMajor(xTick)
+        return plot.fig
+
+    def _plotXY(self, metricNameX, metricNameY, plotFactory: Callable[[Sequence, Sequence], Plot], adjustBounds: bool) -> plt.Figure:
+        def axlim(bounds):
+            minValue, maxValue = bounds
+            diff = maxValue - minValue
+            return (minValue - 0.05 * diff, maxValue + 0.05 * diff)
+
+        x = self._valuesByMetricName[metricNameX]
+        y = self._valuesByMetricName[metricNameY]
+        plot = plotFactory(x, y)
+        plot.xlabel(metricNameX)
+        plot.ylabel(metricNameY)
+        mx = self.getMetricByName(metricNameX)
+        if adjustBounds and mx.hasFiniteBounds():
+            plot.xlim(*axlim(mx.bounds))
+        my = self.getMetricByName(metricNameY)
+        if adjustBounds and my.hasFiniteBounds():
+            plot.ylim(*axlim(my.bounds))
+        return plot.fig
+
+    def plotScatter(self, metricNameX: str, metricNameY: str) -> plt.Figure:
+        return self._plotXY(metricNameX, metricNameY, ScatterPlot, adjustBounds=True)
+
+    def plotHeatMap(self, metricNameX: str, metricNameY: str) -> plt.Figure:
+        return self._plotXY(metricNameX, metricNameY, HeatMapPlot, adjustBounds=False)
 
     def toDataFrame(self) -> pd.DataFrame:
         """
         :return: a DataFrame with the evaluation metrics from all contained EvalStats objects;
             the EvalStats' name field being used as the index if it is set
         """
-        data = dict(self.metrics)
+        data = dict(self._valuesByMetricName)
         index = [stats.name for stats in self.statsList]
         if len([n for n in index if n is not None]) == 0:
             index = None
@@ -153,7 +223,7 @@ def getGlobalStats(self) -> TEvalStats:
 
     def __str__(self):
         return f"{self.__class__.__name__}[" + \
-               ", ".join([f"{key}={self.aggMetricsDict()[key]:.4f}" for key in self.metrics]) + "]"
+               ", ".join([f"{key}={self.aggMetricsDict()[key]:.4f}" for key in self._valuesByMetricName]) + "]"
 
 
 class PredictionEvalStats(EvalStats[TMetric], ABC):
diff --git a/src/sensai/evaluation/eval_stats/eval_stats_classification.py b/src/sensai/evaluation/eval_stats/eval_stats_classification.py
index 937fdfe9..988981f1 100644
--- a/src/sensai/evaluation/eval_stats/eval_stats_classification.py
+++ b/src/sensai/evaluation/eval_stats/eval_stats_classification.py
@@ -1,7 +1,8 @@
 import logging
 from abc import ABC, abstractmethod
-from typing import List, Sequence, Optional, Dict
+from typing import List, Sequence, Optional, Dict, Any, Tuple
 
+import matplotlib.ticker as plticker
 import numpy as np
 import pandas as pd
 import sklearn
@@ -9,7 +10,7 @@
 from sklearn.metrics import confusion_matrix, accuracy_score, precision_score, recall_score, precision_recall_curve, \
     balanced_accuracy_score, f1_score
 
-from .eval_stats_base import PredictionArray, PredictionEvalStats, EvalStatsCollection, Metric, EvalStatsPlot
+from .eval_stats_base import PredictionArray, PredictionEvalStats, EvalStatsCollection, Metric, EvalStatsPlot, TMetric
 from ...util.aggregation import RelativeFrequencyCounter
 from ...util.pickle import getstate
 from ...util.plot import plotMatrix
@@ -24,6 +25,14 @@
 class ClassificationMetric(Metric["ClassificationEvalStats"], ABC):
     requiresProbabilities = False
 
+    def __init__(self, name=None, bounds: Tuple[float, float] = (0, 1), requiresProbabilities=None):
+        """
+        :param name: the name of the metric; if None use the class' name attribute
+        :param bounds: the minimum and maximum values the metric can take on
+        """
+        super().__init__(name=name, bounds=bounds)
+        self.requiresProbabilities = requiresProbabilities if requiresProbabilities is not None else self.__class__.requiresProbabilities
+
     def computeValueForEvalStats(self, evalStats: "ClassificationEvalStats"):
         return self.computeValue(evalStats.y_true, evalStats.y_predicted, evalStats.y_predictedClassProbabilities)
 
@@ -51,6 +60,45 @@ def _computeValue(self, y_true, y_predicted, y_predictedClassProbabilities):
         return balanced_accuracy_score(y_true=y_true, y_pred=y_predicted)
 
 
+class ClassificationMetricAccuracyWithoutLabels(ClassificationMetric):
+    """
+    Accuracy score with set of data points limited to the ones where the ground truth label is not one of the given labels
+    """
+    def __init__(self, *labels: Any, probabilityThreshold=None):
+        """
+        :param labels: one or more labels which are not to be considered (all data points where the ground truth is
+            one of these labels will be ignored)
+        :param probabilityThreshold: a probability threshold: the probability of the most likely class must be at least this value for a data point
+            to be considered in the metric computation (analogous to :class:`ClassificationMetricAccuracyMaxProbabilityBeyondThreshold`)
+        """
+        if probabilityThreshold is not None:
+            nameAdd = f", p_max >= {probabilityThreshold}"
+        else:
+            nameAdd = ""
+        name = f"{ClassificationMetricAccuracy.name}Without[{','.join(map(str, labels))}{nameAdd}]"
+        super().__init__(name, requiresProbabilities=probabilityThreshold is not None)
+        self.labels = set(labels)
+        self.probabilityThreshold = probabilityThreshold
+
+    def _computeValue(self, y_true, y_predicted, y_predictedClassProbabilities):
+        y_true = np.array(y_true)
+        y_predicted = np.array(y_predicted)
+        indices = []
+        for i, (trueLabel, predictedLabel) in enumerate(zip(y_true, y_predicted)):
+            if trueLabel not in self.labels:
+                if self.probabilityThreshold is not None:
+                    if y_predictedClassProbabilities[predictedLabel].iloc[i] < self.probabilityThreshold:
+                        continue
+                indices.append(i)
+        return accuracy_score(y_true=y_true[indices], y_pred=y_predicted[indices])
+
+    def getPairedMetrics(self) -> List[TMetric]:
+        if self.probabilityThreshold is not None:
+            return [ClassificationMetricRelFreqMaxProbabilityBeyondThreshold(self.probabilityThreshold)]
+        else:
+            return []
+
+
 class ClassificationMetricGeometricMeanOfTrueClassProbability(ClassificationMetric):
     name = "geoMeanTrueClassProb"
     requiresProbabilities = True
@@ -115,6 +163,9 @@ def _computeValue(self, y_true, y_predicted, y_predictedClassProbabilities):
         else:
             return relFreq.getRelativeFrequency()
 
+    def getPairedMetrics(self) -> List[TMetric]:
+        return [ClassificationMetricRelFreqMaxProbabilityBeyondThreshold(self.threshold)]
+
 
 class ClassificationMetricRelFreqMaxProbabilityBeyondThreshold(ClassificationMetric):
     """
@@ -155,6 +206,9 @@ def __init__(self, positiveClassLabel):
     def _computeValue(self, y_true, y_predicted, y_predictedClassProbabilities):
         return precision_score(y_true, y_predicted, pos_label=self.positiveClassLabel, zero_division=0)
 
+    def getPairedMetrics(self) -> List[BinaryClassificationMetric]:
+        return [BinaryClassificationMetricRecall(self.positiveClassLabel)]
+
 
 class BinaryClassificationMetricRecall(BinaryClassificationMetric):
     name = "recall"
@@ -178,28 +232,92 @@ def _computeValue(self, y_true, y_predicted, y_predictedClassProbabilities):
 
 class BinaryClassificationMetricRecallForPrecision(BinaryClassificationMetric):
     """
-    Computes the maximum recall that can be achieved in cases where at least the given precision is reached.
-    The given precision may not be achievable at all, in which case the metric value is NaN.
+    Computes the maximum recall that can be achieved (by varying the decision threshold) in cases where at least the given precision
+    is reached. The given precision may not be achievable at all, in which case the metric value is ``zeroValue``.
     """
-    def __init__(self, precision: float, positiveClassLabel):
+    def __init__(self, precision: float, positiveClassLabel, zeroValue=0.0):
+        """
+        :param precision: the minimum precision value that must be reached
+        :param positiveClassLabel: the positive class label
+        :param zeroValue: the value to return for the case where the minimum precision is never reached
+        """
         self.minPrecision = precision
+        self.zeroValue = zeroValue
         super().__init__(positiveClassLabel, name=f"recallForPrecision[{precision}]")
 
     def computeValueForEvalStats(self, evalStats: "ClassificationEvalStats"):
         varData = evalStats.getBinaryClassificationProbabilityThresholdVariationData()
-        result = np.nan
+        bestRecall = None
         for c in varData.counts:
             precision = c.getPrecision()
             if precision >= self.minPrecision:
                 recall = c.getRecall()
-                if np.isnan(result) or result < recall:
-                    result = recall
-        return result
+                if bestRecall is None or recall > bestRecall:
+                    bestRecall = recall
+        return self.zeroValue if bestRecall is None else bestRecall
 
     def _computeValue(self, y_true, y_predicted, y_predictedClassProbabilities):
         raise NotImplementedError(f"{self.__class__.__qualname__} only supports computeValueForEvalStats")
 
 
+class BinaryClassificationMetricPrecisionThreshold(BinaryClassificationMetric):
+    """
+    Precision for the case where predictions are considered "positive" if predicted probability of the positive class is beyond the
+    given threshold
+    """
+    requiresProbabilities = True
+
+    def __init__(self, threshold: float, positiveClassLabel: Any, zeroValue=0.0):
+        """
+        :param threshold: the minimum predicted probability of the positive class for the prediction to be considered "positive"
+        :param zeroValue: the value of the metric for the case where a positive class probability beyond the threshold is never predicted
+            (denominator = 0)
+        """
+        self.threshold = threshold
+        self.zeroValue = zeroValue
+        super().__init__(positiveClassLabel, name=f"precision[{threshold}]")
+
+    def _computeValue(self, y_true, y_predicted, y_predictedClassProbabilities):
+        relFreqCorrect = RelativeFrequencyCounter()
+        classIdx_positive = list(y_predictedClassProbabilities.columns).index(self.positiveClassLabel)
+        for probabilities, classLabel_true in zip(y_predictedClassProbabilities.values.tolist(), y_true):
+            prob_predicted = probabilities[classIdx_positive]
+            if prob_predicted >= self.threshold:
+                relFreqCorrect.count(classLabel_true == self.positiveClassLabel)
+        f = relFreqCorrect.getRelativeFrequency()
+        return f if f is not None else self.zeroValue
+
+    def getPairedMetrics(self) -> List[BinaryClassificationMetric]:
+        return [BinaryClassificationMetricRecallThreshold(self.threshold, self.positiveClassLabel)]
+
+
+class BinaryClassificationMetricRecallThreshold(BinaryClassificationMetric):
+    """
+    Recall for the case where predictions are considered "positive" if predicted probability of the positive class is beyond the
+    given threshold
+    """
+    requiresProbabilities = True
+
+    def __init__(self, threshold: float, positiveClassLabel: Any, zeroValue=0.0):
+        """
+        :param threshold: the minimum predicted probability of the positive class for the prediction to be considered "positive"
+        :param zeroValue: the value of the metric for the case where there are no positive instances in the data set (denominator = 0)
+        """
+        self.threshold = threshold
+        self.zeroValue = zeroValue
+        super().__init__(positiveClassLabel, name=f"recall[{threshold}]")
+
+    def _computeValue(self, y_true, y_predicted, y_predictedClassProbabilities):
+        relFreqRecalled = RelativeFrequencyCounter()
+        classIdx_positive = list(y_predictedClassProbabilities.columns).index(self.positiveClassLabel)
+        for probabilities, classLabel_true in zip(y_predictedClassProbabilities.values.tolist(), y_true):
+            if self.positiveClassLabel == classLabel_true:
+                prob_predicted = probabilities[classIdx_positive]
+                relFreqRecalled.count(prob_predicted >= self.threshold)
+        f = relFreqRecalled.getRelativeFrequency()
+        return f if f is not None else self.zeroValue
+
+
 class ClassificationEvalStats(PredictionEvalStats["ClassificationMetric"]):
     def __init__(self, y_predicted: PredictionArray = None,
             y_true: PredictionArray = None,
@@ -319,10 +437,12 @@ def plotPrecisionRecallCurve(self, titleAdd: str = None):
         if titleAdd is not None:
             title += "\n" + titleAdd
         ax.set_title(title)
+        ax.xaxis.set_major_locator(plticker.MultipleLocator(base=0.1))
+        ax.yaxis.set_major_locator(plticker.MultipleLocator(base=0.1))
         return disp.figure_
 
 
-class ClassificationEvalStatsCollection(EvalStatsCollection[ClassificationEvalStats]):
+class ClassificationEvalStatsCollection(EvalStatsCollection[ClassificationEvalStats, ClassificationMetric]):
     def __init__(self, evalStatsList: List[ClassificationEvalStats]):
         super().__init__(evalStatsList)
         self.globalStats = None
diff --git a/src/sensai/evaluation/eval_stats/eval_stats_regression.py b/src/sensai/evaluation/eval_stats/eval_stats_regression.py
index 16e557e1..89f5b0ae 100644
--- a/src/sensai/evaluation/eval_stats/eval_stats_regression.py
+++ b/src/sensai/evaluation/eval_stats/eval_stats_regression.py
@@ -198,7 +198,7 @@ def plotScatterGroundTruthPredictions(self, figure=True, titleAdd=None, **kwargs
         :return:  the resulting figure object or None
         """
         fig = None
-        title = "Scatter Plot of Ground Truth vs. Predicted Values"
+        title = "Scatter Plot of Predicted Values vs. Ground Truth"
         if titleAdd is not None:
             title += "\n" + titleAdd
         if figure:
@@ -228,7 +228,7 @@ def plotHeatmapGroundTruthPredictions(self, figure=True, cmap=None, bins=60, tit
         :return:  the resulting figure object or None
         """
         fig = None
-        title = "Heat Map of Ground Truth vs. Predicted Values"
+        title = "Heat Map of Predicted Values vs. Ground Truth"
         if titleAdd:
             title += "\n" + titleAdd
         if figure:
@@ -260,7 +260,7 @@ def plotHeatmapGroundTruthPredictions(self, figure=True, cmap=None, bins=60, tit
         return fig
 
 
-class RegressionEvalStatsCollection(EvalStatsCollection):
+class RegressionEvalStatsCollection(EvalStatsCollection[RegressionEvalStats, RegressionMetric]):
     def __init__(self, evalStatsList: List[RegressionEvalStats]):
         super().__init__(evalStatsList)
         self.globalStats = None
diff --git a/src/sensai/evaluation/eval_util.py b/src/sensai/evaluation/eval_util.py
index d5e93db3..69394eb9 100644
--- a/src/sensai/evaluation/eval_util.py
+++ b/src/sensai/evaluation/eval_util.py
@@ -480,7 +480,10 @@ def compareModels(self, modelFactories: Sequence[Callable[[], Union[VectorRegres
             crossValidatorParams: Optional[Union[VectorModelCrossValidatorParams, Dict[str, Any]]] = None,
             columnNameForModelRanking: str = None,
             rankMax=True,
+            createMetricDistributionPlots=True,
             createCombinedEvalStatsPlots=False,
+            distributionPlots_cdf = True,
+            distributionPlots_cdfComplementary = False,
             visitors: Optional[Iterable["ModelComparisonVisitor"]] = None) -> Union["RegressionMultiDataModelComparisonData", "ClassificationMultiDataModelComparisonData"]:
         """
         :param modelFactories: a sequence of factory functions for the creation of models to evaluate; every factory must result
@@ -493,6 +496,7 @@ def compareModels(self, modelFactories: Sequence[Callable[[], Union[VectorRegres
         :param crossValidatorParams: parameters to use for the instantiation of cross-validators (relevant if useCrossValidation==True)
         :param columnNameForModelRanking: column name to use for ranking models
         :param rankMax: if true, use max for ranking, else min
+        :param createMetricDistributionPlots: whether to create, for each model, plots of the distribution of each metric across the datasets
         :param createCombinedEvalStatsPlots: whether to combine, for each type of model, the EvalStats objects from the individual experiments
             into a single objects that holds all results and use it to create plots reflecting the overall result.
             Note that for classification, this is only possible if all individual experiments use the same set of class labels.
@@ -506,6 +510,7 @@ def compareModels(self, modelFactories: Sequence[Callable[[], Union[VectorRegres
         isRegression = None
         plotCollector: Optional[EvalStatsPlotCollector] = None
         modelNames = None
+        modelName2StringRepr = None
 
         for i, (key, inputOutputData) in enumerate(self.inputOutputDataDict.items(), start=1):
             log.info(f"Evaluating models for data set #{i}/{len(self.inputOutputDataDict)}: {self.keyName}={key}")
@@ -552,6 +557,9 @@ def compareModels(self, modelFactories: Sequence[Callable[[], Union[VectorRegres
 
             allResultsDF = pd.concat((allResultsDF, df))
 
+            if modelName2StringRepr is None:
+                modelName2StringRepr = {model.getName(): model.pprints() for model in models}
+
         if self.metaDF is not None:
             allResultsDF = allResultsDF.join(self.metaDF, on=self.keyName, how="left")
 
@@ -583,7 +591,10 @@ def compareModels(self, modelFactories: Sequence[Callable[[], Union[VectorRegres
         log.info(strFurtherAggs)
 
         if resultWriter is not None:
-            resultWriter.writeTextFile("model-comparison-results", strMeanResults + "\n\n" + strFurtherAggs + "\n\n" + strAllResults)
+            comparisonContent = strMeanResults + "\n\n" + strFurtherAggs + "\n\n" + strAllResults
+            comparisonContent += "\n\nModels [example instance]:\n\n"
+            comparisonContent += "\n\n".join(f"{name} = {s}" for name, s in modelName2StringRepr.items())
+            resultWriter.writeTextFile("model-comparison-results", comparisonContent)
 
         # create plots from combined data for each model
         if createCombinedEvalStatsPlots:
@@ -602,10 +613,17 @@ def compareModels(self, modelFactories: Sequence[Callable[[], Union[VectorRegres
             for visitor in visitors:
                 visitor.collectPlots(resultCollector)
 
+        # create result
         if isRegression:
-            return RegressionMultiDataModelComparisonData(allResultsDF, meanResultsDF, furtherAggsDF, evalStatsByModelName)
+            mdmcData = RegressionMultiDataModelComparisonData(allResultsDF, meanResultsDF, furtherAggsDF, evalStatsByModelName)
         else:
-            return ClassificationMultiDataModelComparisonData(allResultsDF, meanResultsDF, furtherAggsDF, evalStatsByModelName)
+            mdmcData = ClassificationMultiDataModelComparisonData(allResultsDF, meanResultsDF, furtherAggsDF, evalStatsByModelName)
+
+        # plot distributions
+        if createMetricDistributionPlots and resultWriter is not None:
+            mdmcData.createDistributionPlots(resultWriter, cdf=distributionPlots_cdf, cdfComplementary=distributionPlots_cdfComplementary)
+
+        return mdmcData
 
 
 class ModelComparisonData:
@@ -701,6 +719,30 @@ def getEvalStatsList(self, modelName: str) -> List[TEvalStats]:
     def getEvalStatsCollection(self, modelName: str) -> TEvalStatsCollection:
         pass
 
+    def createDistributionPlots(self, resultWriter: ResultWriter, cdf=True, cdfComplementary=False):
+        """
+        Creates plots of distributions of metrics across datasets for each model as a histogram, and additionally
+        any x-y plots (scatter plots & heat maps) for metrics that have associated paired metrics that were also computed
+
+        :param resultWriter: the result writer
+        :param cdf: whether to additionally plot, for each distribution, the cumulative distribution function
+        :param cdfComplementary: whether to plot the complementary cdf, provided that ``cdf`` is True
+        """
+        for modelName in self.getModelNames():
+            evalStatsCollection = self.getEvalStatsCollection(modelName)
+            for metricName in evalStatsCollection.getMetricNames():
+                # plot distribution
+                fig = evalStatsCollection.plotDistribution(metricName, cdf=cdf, cdfComplementary=cdfComplementary)
+                resultWriter.writeFigure(f"{modelName}_dist-{metricName}", fig)
+                # scatter plot with paired metrics
+                metric = evalStatsCollection.getMetricByName(metricName)
+                for pairedMetric in metric.getPairedMetrics():
+                    if evalStatsCollection.hasMetric(pairedMetric):
+                        fig = evalStatsCollection.plotScatter(metric.name, pairedMetric.name)
+                        resultWriter.writeFigure(f"{modelName}_scatter-{metric.name}-{pairedMetric.name}", fig)
+                        fig = evalStatsCollection.plotHeatMap(metric.name, pairedMetric.name)
+                        resultWriter.writeFigure(f"{modelName}_heatmap-{metric.name}-{pairedMetric.name}", fig)
+
 
 class ClassificationMultiDataModelComparisonData(MultiDataModelComparisonData[ClassificationEvalStats, ClassificationEvalStatsCollection]):
     def getEvalStatsCollection(self, modelName: str):
diff --git a/src/sensai/util/cache.py b/src/sensai/util/cache.py
index 5271c55e..c0542e11 100644
--- a/src/sensai/util/cache.py
+++ b/src/sensai/util/cache.py
@@ -565,18 +565,19 @@ def _computeValue(self, key, data):
 
 
 def cached(fn: Callable[[], T], picklePath, functionName=None, validityCheckFn: Optional[Callable[[T], bool]] = None,
-        backend="pickle", protocol=pickle.HIGHEST_PROTOCOL, load=True) -> T:
+        backend="pickle", protocol=pickle.HIGHEST_PROTOCOL, load=True, version=None) -> T:
     """
     :param fn: the function whose result is to be cached
     :param picklePath: the path in which to store the cached result
     :param functionName: the name of the function fn (for the case where its __name__ attribute is not
         informative)
     :param validityCheckFn: an optional function to call in order to check whether a cached result is still valid;
-        the function shall return True if the res is still valid and false otherwise. If a cached result is invalid,
+        the function shall return True if the result is still valid and false otherwise. If a cached result is invalid,
         the function fn is called to compute the result and the cached result is updated.
     :param backend: pickle or joblib
     :param protocol: the pickle protocol version
     :param load: whether to load a previously persisted result; if False, do not load an old result but store the newly computed result
+    :param version: if not None, previously persisted data will only be returned if it was stored with the same version
     :return: the result (either obtained from the cache or the function)
     """
     if functionName is None:
@@ -585,7 +586,11 @@ def cached(fn: Callable[[], T], picklePath, functionName=None, validityCheckFn:
     def callFnAndCacheResult():
         res = fn()
         log.info(f"Saving cached result in {picklePath}")
-        dumpPickle(res, picklePath, backend=backend, protocol=protocol)
+        if version is not None:
+            persistedRes = {"__cacheVersion": version, "obj": res}
+        else:
+            persistedRes = res
+        dumpPickle(persistedRes, picklePath, backend=backend, protocol=protocol)
         return res
 
     if os.path.exists(picklePath):
@@ -596,6 +601,15 @@ def callFnAndCacheResult():
                 if not validityCheckFn(result):
                     log.info(f"Cached result is no longer valid, recomputing ...")
                     result = callFnAndCacheResult()
+            if version is not None:
+                cachedVersion = None
+                if type(result) == dict:
+                    cachedVersion = result.get("__cacheVersion")
+                if cachedVersion != version:
+                    log.info(f"Cached result has incorrect version ({cachedVersion}, expected {version}), recomputing ...")
+                    result = callFnAndCacheResult()
+                else:
+                    result = result["obj"]
             return result
         else:
             log.info(f"Ignoring previously stored result in {picklePath}, calling function '{functionName}' ...")
@@ -610,7 +624,7 @@ class PickleCached(object):
     Function decorator for caching function results via pickle
     """
     def __init__(self, cacheBasePath: str, filenamePrefix: str = None, filename: str = None, backend="pickle",
-            protocol=pickle.HIGHEST_PROTOCOL, load=True):
+            protocol=pickle.HIGHEST_PROTOCOL, load=True, version=None):
         """
         :param cacheBasePath: the directory where the pickle cache file will be stored
         :param filenamePrefix: a prefix of the name of the cache file to be created, to which the function name and, where applicable,
@@ -621,6 +635,7 @@ def __init__(self, cacheBasePath: str, filenamePrefix: str = None, filename: str
         :param backend: the serialisation backend to use (see dumpPickle)
         :param protocol: the pickle protocol version to use
         :param load: whether to load a previously persisted result; if False, do not load an old result but store the newly computed result
+        :param version: if not None, previously persisted data will only be returned if it was stored with the same version
         """
         self.filename = filename
         self.cacheBasePath = cacheBasePath
@@ -628,6 +643,7 @@ def __init__(self, cacheBasePath: str, filenamePrefix: str = None, filename: str
         self.backend = backend
         self.protocol = protocol
         self.load = load
+        self.version = version
 
         if self.filenamePrefix is None:
             self.filenamePrefix = ""
@@ -656,7 +672,8 @@ def wrapped(*args, **kwargs):
                         raise Exception("Function without arguments but full cache filename with placeholder (%s) was specified")
                     filename = self.filename
             picklePath = os.path.join(self.cacheBasePath, filename)
-            return cached(lambda: fn(*args, **kwargs), picklePath, functionName=fn.__name__, backend=self.backend, load=self.load)
+            return cached(lambda: fn(*args, **kwargs), picklePath, functionName=fn.__name__, backend=self.backend, load=self.load,
+                version=self.version)
 
         return wrapped
 
diff --git a/src/sensai/util/plot.py b/src/sensai/util/plot.py
index 6adcde78..ceb18ff6 100644
--- a/src/sensai/util/plot.py
+++ b/src/sensai/util/plot.py
@@ -1,7 +1,8 @@
 import logging
 from matplotlib.colors import LinearSegmentedColormap
-from typing import Sequence, Callable
+from typing import Sequence, Callable, TypeVar, Type, Tuple
 
+import matplotlib.ticker as plticker
 import matplotlib.figure
 from matplotlib import pyplot as plt
 import numpy as np
@@ -62,41 +63,85 @@ def plotMatrix(matrix, title, xticklabels: Sequence[str], yticklabels: Sequence[
     return fig
 
 
+TPlot = TypeVar("TPlot", bound="Plot")
+
+
 class Plot:
-    def __init__(self, draw: Callable[[], plt.Axes] = None, name=None):
+    def __init__(self, draw: Callable[[], None] = None, name=None):
         """
         :param draw: function which returns a matplotlib.Axes object to show
         :param name: name/number of the figure, which determines the window caption; it should be unique, as any plot
             with the same name will have its contents rendered in the same window. By default, figures are number
             sequentially.
         """
-        self.fig: matplotlib.figure.Figure = plt.figure(name)
-        self.ax = draw()
+        fig, ax = plt.subplots(num=name)
+        self.fig: plt.Figure = fig
+        self.ax: plt.Axes = ax
+        draw()
 
-    def xlabel(self, label):
-        plt.xlabel(label)
+    def xlabel(self: TPlot, label) -> TPlot:
+        self.ax.set_xlabel(label)
         return self
 
-    def ylabel(self, label):
-        plt.ylabel(label)
+    def ylabel(self: TPlot, label) -> TPlot:
+        self.ax.set_ylabel(label)
         return self
 
-    def title(self, title: str):
-        plt.title(title)
+    def title(self: TPlot, title: str) -> TPlot:
+        self.ax.set_title(title)
+        return self
 
-    def xlim(self, minValue, maxValue):
-        plt.xlim(minValue, maxValue)
+    def xlim(self: TPlot, minValue, maxValue) -> TPlot:
+        self.ax.set_xlim(minValue, maxValue)
+        return self
 
-    def ylim(self, minValue, maxValue):
-        plt.ylim(minValue, maxValue)
+    def ylim(self: TPlot, minValue, maxValue) -> TPlot:
+        self.ax.set_ylim(minValue, maxValue)
+        return self
 
     def save(self, path):
         log.info(f"Saving figure in {path}")
         self.fig.savefig(path)
 
+    def xtickMajor(self, base):
+        self.ax.xaxis.set_major_locator(plticker.MultipleLocator(base=base))
+
+    def ytickMajor(self, base):
+        self.ax.yaxis.set_major_locator(plticker.MultipleLocator(base=base))
+
+
 
 class ScatterPlot(Plot):
-    def __init__(self, x, y, c=((0, 0, 1, 0.05),), x_label=None, y_label=None, **kwargs):
+    N_MAX_TRANSPARENCY = 1000
+    N_MIN_TRANSPARENCY = 100
+    MAX_OPACITY = 0.5
+    MIN_OPACITY = 0.05
+
+    def __init__(self, x, y, c=None, c_base: Tuple[float, float, float]=(0, 0, 1), c_opacity=None, x_label=None, y_label=None, **kwargs):
+        """
+        :param x: the x values; if has name (e.g. pd.Series), will be used as axis label
+        :param y: the y values; if has name (e.g. pd.Series), will be used as axis label
+        :param c: the colour specification; if None, compose from ``c_base`` and ``c_opacity``
+        :param c_base: the base colour as (R, G, B) floats
+        :param c_opacity: the opacity; if None, automatically determine from number of data points
+        :param x_label:
+        :param y_label:
+        :param kwargs:
+        """
+        if c is None:
+            if c_base is None:
+                c_base = (0, 0, 1)
+            if c_opacity is None:
+                n = len(x)
+                if n > self.N_MAX_TRANSPARENCY:
+                    transparency = 1
+                elif n < self.N_MIN_TRANSPARENCY:
+                    transparency = 0
+                else:
+                    transparency = (n - self.N_MIN_TRANSPARENCY) / (self.N_MAX_TRANSPARENCY - self.N_MIN_TRANSPARENCY)
+                c_opacity = self.MIN_OPACITY + (self.MAX_OPACITY - self.MIN_OPACITY) * (1-transparency)
+            c = ((*c_base, c_opacity),)
+
         assert len(x) == len(y)
         if x_label is None and hasattr(x, "name"):
             x_label = x.name
@@ -108,7 +153,7 @@ def draw():
                 plt.xlabel(x_label)
             if x_label is not None:
                 plt.ylabel(y_label)
-            return plt.scatter(x, y, c=c, **kwargs)
+            plt.scatter(x, y, c=c, **kwargs)
 
         super().__init__(draw)
 
@@ -141,17 +186,35 @@ def draw():
                 plt.xlabel(xLabel)
             if yLabel is not None:
                 plt.ylabel(yLabel)
-            return plt.imshow(heatmap.T, extent=extent, origin='lower', interpolation="none", cmap=cmap, zorder=1, aspect="auto", **kwargs)
+            plt.imshow(heatmap.T, extent=extent, origin='lower', interpolation="none", cmap=cmap, zorder=1, aspect="auto", **kwargs)
 
         super().__init__(draw)
 
 
 class HistogramPlot(Plot):
-    def __init__(self, values, bins="auto", kde=False, binwidth=None, stat="percent", xlabel=None, **kwargs):
+    def __init__(self, values, bins="auto", kde=False, cdf=False, cdfComplementary=False, binwidth=None, stat="probability", xlabel=None,
+            **kwargs):
+        # normalise only "probability"; every other value of stat is honoured exactly as passed by the caller
+        if stat == "probability":
+            stat = "proportion"  # same semantics but "probability" not understood by ecdfplot
+
         def draw():
-            ax = sns.histplot(values, bins=bins, kde=kde, binwidth=binwidth, stat=stat, **kwargs)
+            sns.histplot(values, bins=bins, kde=kde, binwidth=binwidth, stat=stat, **kwargs)
+            if cdf:
+                if cdfComplementary or stat not in ("count", "proportion"):
+                    sns.ecdfplot(values, stat=stat, complementary=cdfComplementary, color="orange")
+                else:
+                    sns.histplot(values, bins=100, stat=stat, element="poly", fill=False, cumulative=True, color="orange")
             if xlabel is not None:
                 plt.xlabel(xlabel)
-            return ax
 
-        super().__init__(draw)
\ No newline at end of file
+        super().__init__(draw)
+
+        if stat in ("proportion", "probability"):
+            yTick = 0.1
+        elif stat == "percent":
+            yTick = 10
+        else:
+            yTick = None
+        if yTick is not None:
+            self.ytickMajor(yTick)

From 66734af9044c401a90ad2263da3c76d5808e76d8 Mon Sep 17 00:00:00 2001
From: Dominik Jain <dominik.jain@jambit.com>
Date: Fri, 3 Jun 2022 14:36:34 +0200
Subject: [PATCH 116/131] Sync avancis

  commit 2651412e8ad006d9ccc86f000e4946b2325b089a
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Fri Jun 3 14:23:08 2022 +0200

      Added SkLearnDummyVectorRegressionModel

  sensai/sklearn/sklearn_regression.py

  commit fe9c2c982c059faf369b55d4e8ea161c7495523b
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Fri Jun 3 14:22:54 2022 +0200

      Fixed typo in docstring

  sensai/data_transformation/dft.py

  commit 115c4d6112500944d1b3167ce9e0ad843ba14b31
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Fri Jun 3 13:13:40 2022 +0200

      Improved logging

  sensai/evaluation/eval_util.py

  commit e5e0c4b9148b11869ab228af7d143e22b5ebb985
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Fri Jun 3 13:13:21 2022 +0200

      EvalStatsRegression.plotErrorDistribution: Use HistogramPlot

  sensai/evaluation/eval_stats/eval_stats_regression.py
---
 src/sensai/data_transformation/dft.py           |  2 +-
 .../eval_stats/eval_stats_regression.py         | 17 +++++++----------
 src/sensai/evaluation/eval_util.py              |  3 ++-
 src/sensai/sklearn/sklearn_regression.py        |  6 ++++++
 4 files changed, 16 insertions(+), 12 deletions(-)

diff --git a/src/sensai/data_transformation/dft.py b/src/sensai/data_transformation/dft.py
index 3909f408..cf873ad8 100644
--- a/src/sensai/data_transformation/dft.py
+++ b/src/sensai/data_transformation/dft.py
@@ -842,7 +842,7 @@ def _apply(self, df: pd.DataFrame) -> pd.DataFrame:
 
 class DFTDropNA(RuleBasedDataFrameTransformer):
     """
-    Drops rows or columns containin NA/NaN values
+    Drops rows or columns containing NA/NaN values
     """
     def __init__(self, axis=0, inplace=False):
         """
diff --git a/src/sensai/evaluation/eval_stats/eval_stats_regression.py b/src/sensai/evaluation/eval_stats/eval_stats_regression.py
index 16e557e1..50208f80 100644
--- a/src/sensai/evaluation/eval_stats/eval_stats_regression.py
+++ b/src/sensai/evaluation/eval_stats/eval_stats_regression.py
@@ -7,6 +7,7 @@
 from typing import List, Sequence, Optional
 
 from .eval_stats_base import PredictionEvalStats, Metric, EvalStatsCollection, PredictionArray, EvalStatsPlot
+from ...util.plot import HistogramPlot
 
 log = logging.getLogger(__name__)
 
@@ -168,26 +169,22 @@ def getEvalStatsCollection(self) -> "RegressionEvalStatsCollection":
             statsList.append(stats)
         return RegressionEvalStatsCollection(statsList)
 
-    def plotErrorDistribution(self, bins=None, figure=True, titleAdd=None) -> Optional[plt.Figure]:
+    def plotErrorDistribution(self, bins="auto", titleAdd=None) -> Optional[plt.Figure]:
         """
-        :param bins: if None, seaborns default binning will be used
+        :param bins: bin specification (see :class:`HistogramPlot`)
         :param figure: whether to plot in a separate figure and return that figure
         :param titleAdd: a string to add to the title (on a second line)
 
         :return: the resulting figure object or None
         """
         errors = np.array(self.y_predicted) - np.array(self.y_true)
-        fig = None
         title = "Prediction Error Distribution"
         if titleAdd is not None:
             title += "\n" + titleAdd
-        if figure:
-            fig = plt.figure(title.replace("\n", " "))
-        sns.distplot(errors, bins=bins)
-        plt.title(title)
-        plt.xlabel("error (prediction - ground truth)")
-        plt.ylabel("probability density")
-        return fig
+        plot = HistogramPlot(errors, bins=bins, kde=True).title(title)
+        plot.xlabel("error (prediction - ground truth)")
+        plot.ylabel("probability density")
+        return plot.fig
 
     def plotScatterGroundTruthPredictions(self, figure=True, titleAdd=None, **kwargs) -> Optional[plt.Figure]:
         """
diff --git a/src/sensai/evaluation/eval_util.py b/src/sensai/evaluation/eval_util.py
index d5e93db3..8dec7683 100644
--- a/src/sensai/evaluation/eval_util.py
+++ b/src/sensai/evaluation/eval_util.py
@@ -333,8 +333,9 @@ def compareModels(self, models: Sequence[TModel], resultWriter: Optional[ResultW
         """
         statsList = []
         resultByModelName = {}
-        for model in models:
+        for i, model in enumerate(models, start=1):
             modelName = model.getName()
+            log.info(f"Evaluating model {i}/{len(models)} named '{modelName}' ...")
             if useCrossValidation:
                 if not fitModels:
                     raise ValueError("Cross-validation necessitates that models be retrained; got fitModels=False")
diff --git a/src/sensai/sklearn/sklearn_regression.py b/src/sensai/sklearn/sklearn_regression.py
index a1ec644f..31e617c7 100644
--- a/src/sensai/sklearn/sklearn_regression.py
+++ b/src/sensai/sklearn/sklearn_regression.py
@@ -75,3 +75,9 @@ class SkLearnExtraTreesVectorRegressionModel(AbstractSkLearnMultipleOneDimVector
     def __init__(self, n_estimators=100, min_samples_leaf=10, random_state=42, **modelArgs):
         super().__init__(sklearn.ensemble.ExtraTreesRegressor,
             n_estimators=n_estimators, min_samples_leaf=min_samples_leaf, random_state=random_state, **modelArgs)
+
+
+class SkLearnDummyVectorRegressionModel(AbstractSkLearnMultipleOneDimVectorRegressionModel):
+    def __init__(self, strategy='mean', constant=None, quantile=None):
+        super().__init__(sklearn.dummy.DummyRegressor,
+            strategy=strategy, constant=constant, quantile=quantile)

From 0c876cede9b615f2f7df98f2e2acf1c3e1c34924 Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Fri, 3 Jun 2022 19:52:29 +0200
Subject: [PATCH 117/131] Improved docstrings

---
 src/sensai/torch/torch_opt.py | 23 +++++------------------
 1 file changed, 5 insertions(+), 18 deletions(-)

diff --git a/src/sensai/torch/torch_opt.py b/src/sensai/torch/torch_opt.py
index f1b6118e..168d41ce 100644
--- a/src/sensai/torch/torch_opt.py
+++ b/src/sensai/torch/torch_opt.py
@@ -123,7 +123,7 @@ def startEpoch(self) -> None:
         def computeTrainBatchLoss(self, modelOutput, groundTruth, X, Y) -> torch.Tensor:
             """
             Computes the loss for the given model outputs and ground truth values for a batch
-            and aggregates the computed loss values such that getEpochLoss can return an appropriate
+            and aggregates the computed loss values such that :meth:``getEpochTrainLoss`` can return an appropriate
             result for the entire epoch.
             The original batch tensors X and Y are provided as meta-information only.
 
@@ -542,7 +542,7 @@ def __init__(self, lossEvaluator: NNLossEvaluator = None, gpu=None, optimiser: U
         """
         :param lossEvaluator: the loss evaluator to use
         :param gpu: the index of the GPU to be used (if CUDA is enabled for the model to be trained); if None, default to first GPU
-        :param optimiser: the name of the optimizer to be used; defaults to "adam"
+        :param optimiser: the optimiser to use
         :param optimiserLR: the optimiser's learning rate
         :param earlyStoppingEpochs: the number of epochs without validation score improvement after which to abort training and
             use the best epoch's model (early stopping); if None, never abort training before all epochs are completed
@@ -552,8 +552,8 @@ def __init__(self, lossEvaluator: NNLossEvaluator = None, gpu=None, optimiser: U
             If no validation is to be performed, pass 1.0.
         :param scaledOutputs: whether to scale all outputs, resulting in computations of the loss function based on scaled values rather than normalised values.
             Enabling scaling may not be appropriate in cases where there are multiple outputs on different scales/with completely different units.
-        :param useShrinkage: whether to apply shrinkage to gradients whose norm exceeds optimiserClip
-        :param shrinkageClip: the maximum gradient norm beyond which to apply shrinkage (if useShrinkage is True)
+        :param useShrinkage: whether to apply shrinkage to gradients whose norm exceeds ``shrinkageClip``, scaling the gradient down to ``shrinkageClip``
+        :param shrinkageClip: the maximum gradient norm beyond which to apply shrinkage (if ``useShrinkage`` is True)
         :param shuffle: whether to shuffle the training data
         :param optimiserArgs: keyword arguments to be passed on to the actual torch optimiser
         """
@@ -618,20 +618,7 @@ class NNOptimiser:
 
     def __init__(self, params: NNOptimiserParams):
         """
-        :param cuda: whether to use CUDA
-        :param lossEvaluator: the loss evaluator to use
-        :param gpu: index of the gpu to be used (if CUDA is enabled in the model to be trained)
-        :param optimiser: the optimizer to be used; defaults to "adam"
-        :param optimiserClip: the maximum gradient norm beyond which to apply shrinkage (if useShrinkage is True)
-        :param optimiserLR: the optimiser's learning rate
-        :param batchSize: the batch size to use; for algorithms L-BFGS (optimiser='lbfgs'), which do not use batches, leave this at None.
-            If the algorithm uses batches and None is specified, batch size 64 will be used by default.
-        :param trainFraction: the fraction of the data used for training (with the remainder being used for validation).
-            If no validation is to be performed, pass 1.0.
-        :param scaledOutputs: whether to scale all outputs, resulting in computations of the loss function based on scaled values rather than normalised values.
-            Enabling scaling may not be appropriate in cases where there are multiple outputs on different scales/with completely different units.
-        :param useShrinkage: whether to apply shrinkage to gradients whose norm exceeds optimiserClip
-        :param optimiserArgs: keyword arguments to be passed on to the actual torch optimiser
+        :param params: parameters
         """
         if params.lossEvaluator is None:
             raise ValueError("Must provide a loss evaluator")

From 4b04f3485a030aec3c8ac9be079be60053331f76 Mon Sep 17 00:00:00 2001
From: Mischa Panchenko <michael.panchenko@unternehmertum.de>
Date: Tue, 7 Jun 2022 16:46:10 +0200
Subject: [PATCH 118/131] DFT and Featuregen: added toFeatureGenerator method

Also minor renaming and improvement in imports
---
 src/sensai/data_transformation/dft.py | 13 ++++++++++++-
 src/sensai/featuregen.py              |  5 ++---
 2 files changed, 14 insertions(+), 4 deletions(-)

diff --git a/src/sensai/data_transformation/dft.py b/src/sensai/data_transformation/dft.py
index 72e2c4e7..03a2c348 100644
--- a/src/sensai/data_transformation/dft.py
+++ b/src/sensai/data_transformation/dft.py
@@ -95,6 +95,17 @@ def fitApply(self, df: pd.DataFrame) -> pd.DataFrame:
         self.fit(df)
         return self.apply(df)
 
+    def toFeatureGenerator(self, categoricalFeatureNames: Optional[Union[Sequence[str], str]] = None,
+            normalisationRules: Sequence['DFTNormalisation.Rule'] = (),
+            normalisationRuleTemplate: 'DFTNormalisation.RuleTemplate' = None,
+            addCategoricalDefaultRules=True):
+        # need to import here to prevent circular imports
+        from ..featuregen import FeatureGeneratorFromDFT
+        return FeatureGeneratorFromDFT(
+            self, categoricalFeatureNames=categoricalFeatureNames, normalisationRules=normalisationRules,
+            normalisationRuleTemplate=normalisationRuleTemplate, addCategoricalDefaultRules=addCategoricalDefaultRules
+        )
+
 
 class DFTFromFeatureGenerator(DataFrameTransformer):
     def _fit(self, df: pd.DataFrame):
@@ -103,7 +114,7 @@ def _fit(self, df: pd.DataFrame):
     def _apply(self, df: pd.DataFrame) -> pd.DataFrame:
         return self.fgen.generate(df)
 
-    def __init__(self, fgen: FeatureGenerator):
+    def __init__(self, fgen: "FeatureGenerator"):
         super().__init__()
         self.fgen = fgen
         self.setName(f"{self.__class__.__name__}[{self.fgen.getName()}]")
diff --git a/src/sensai/featuregen.py b/src/sensai/featuregen.py
index 3a59354c..48df2618 100644
--- a/src/sensai/featuregen.py
+++ b/src/sensai/featuregen.py
@@ -9,14 +9,13 @@
 
 from . import util, data_transformation
 from .columngen import ColumnGenerator
-from .data_transformation import DFTNormalisation, DFTFromFeatureGenerator
+from .data_transformation import DFTNormalisation, DFTFromFeatureGenerator, DataFrameTransformer
 from .util import flattenArguments
 from .util.string import orRegexGroup, ToStringMixin, listString
 from .util.typing import PandasNamedTuple
 
 if TYPE_CHECKING:
     from .vector_model import VectorModel
-    from .data_transformation import DataFrameTransformer
 
 log = logging.getLogger(__name__)
 
@@ -998,7 +997,7 @@ def flattenedFeatureGenerator(fgen: FeatureGenerator, columnsToFlatten: List[str
             MultiFeatureGenerator(flatteningGenerator, FeatureGeneratorTakeColumns(exceptColumns=columnsToFlatten)))
 
 
-class FeatureGeneratorFromDataFrameTransformer(FeatureGenerator):
+class FeatureGeneratorFromDFT(FeatureGenerator):
     def __init__(self, dft: DataFrameTransformer, categoricalFeatureNames: Optional[Union[Sequence[str], str]] = None,
             normalisationRules: Sequence[data_transformation.DFTNormalisation.Rule] = (),
             normalisationRuleTemplate: data_transformation.DFTNormalisation.RuleTemplate = None,

From 21bdd341b837a1a8af704690429dd0ea7020334c Mon Sep 17 00:00:00 2001
From: Mischa Panchenko <michael.panchenko@unternehmertum.de>
Date: Tue, 7 Jun 2022 16:46:52 +0200
Subject: [PATCH 119/131] VectorModel: fixes in fitting of rawInputTransformers

---
 src/sensai/vector_model.py | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/src/sensai/vector_model.py b/src/sensai/vector_model.py
index 4731039d..05d0633e 100644
--- a/src/sensai/vector_model.py
+++ b/src/sensai/vector_model.py
@@ -212,7 +212,7 @@ def withFeatureCollector(self, featureCollector: FeatureCollector) -> __qualname
         return self
 
     def _preProcessorsAreFitted(self):
-        result = self._featureTransformerChain.isFitted()
+        result = self._rawInputTransformerChain.isFitted() and self._featureTransformerChain.isFitted()
         if self.getFeatureGenerator() is not None:
             result = result and self.getFeatureGenerator().isFitted()
         return result
@@ -312,6 +312,7 @@ def _underlyingModelRequiresFitting(self) -> bool:
         return True
 
     def _fitPreprocessors(self, X: pd.DataFrame, Y: pd.DataFrame = None):
+        self._rawInputTransformerChain.fit(X)
         # no need for fitGenerate if chain is empty
         if self._featureGenerator is not None:
             if len(self._featureTransformerChain) == 0:

From 1404a2e72dbd6d66caf1c77c88e431ccefe855f7 Mon Sep 17 00:00:00 2001
From: Mischa Panchenko <michael.panchenko@unternehmertum.de>
Date: Tue, 7 Jun 2022 16:47:52 +0200
Subject: [PATCH 120/131] Tests: adjusted to new structure and minor
 enhancement of test cases

I found out that pytest simply ignores test classes that have an init
without even showing an error...
---
 tests/base/test_data_transformation.py | 14 +++++++++++---
 tests/base/test_featuregen.py          | 20 +++++++++++++-------
 tests/base/test_vector_model.py        |  8 ++++----
 3 files changed, 28 insertions(+), 14 deletions(-)

diff --git a/tests/base/test_data_transformation.py b/tests/base/test_data_transformation.py
index 33ea6c62..794855c1 100644
--- a/tests/base/test_data_transformation.py
+++ b/tests/base/test_data_transformation.py
@@ -2,9 +2,11 @@
 
 import numpy as np
 import pandas as pd
+import pytest
 import sklearn.preprocessing
 
 from sensai.data_transformation import DataFrameTransformer, RuleBasedDataFrameTransformer, DataFrameTransformerChain, DFTNormalisation
+from sensai.featuregen import FeatureGenerator
 
 log = logging.getLogger(__name__)
 
@@ -21,11 +23,17 @@ class RuleBasedTestDFT(RuleBasedDataFrameTransformer):
         def _apply(self, df: pd.DataFrame) -> pd.DataFrame:
             return df
 
-    testdf = pd.DataFrame({"foo": [1, 2], "bar": [1, 2]})
+    class TestFgen(FeatureGenerator):
+        def _fit(self, X: pd.DataFrame, Y: pd.DataFrame = None, ctx=None):
+            pass
 
-    def test_basicProperties(self):
-        testdft = self.TestDFT()
+        def _generate(self, df: pd.DataFrame, ctx=None) -> pd.DataFrame:
+            return pd.DataFrame({"foo": [1, 2], "baz": [1, 2]})
+
+    testdf = pd.DataFrame({"foo": [1, 2], "bar": [1, 2]})
 
+    @pytest.mark.parametrize("testdft", [TestDFT(), TestFgen().toDFT()])
+    def test_basicProperties(self, testdft):
         assert not testdft.isFitted()
         assert testdft.info()["changeInColumnNames"] is None
         testdft.fit(self.testdf)
diff --git a/tests/base/test_featuregen.py b/tests/base/test_featuregen.py
index f8766d11..adc55c4c 100644
--- a/tests/base/test_featuregen.py
+++ b/tests/base/test_featuregen.py
@@ -6,7 +6,7 @@
 import pytest
 
 from sensai import InputOutputData
-from sensai.data_transformation import DFTNormalisation, DFTFillNA
+from sensai.data_transformation import DFTNormalisation, DFTFillNA, DataFrameTransformer
 from sensai.data_transformation.sklearn_transformer import SkLearnTransformerFactoryFactory
 from sensai.evaluation import VectorClassificationModelEvaluator
 from sensai.featuregen import FeatureGeneratorFlattenColumns, FeatureGeneratorTakeColumns, flattenedFeatureGenerator, \
@@ -57,18 +57,24 @@ def _generate(self, df: pd.DataFrame, ctx=None) -> pd.DataFrame:
         return df
 
 
+class TestDFT(DataFrameTransformer):
+    def _fit(self, df: pd.DataFrame):
+        pass
+
+    def _apply(self, df: pd.DataFrame) -> pd.DataFrame:
+        return df
+
+
 class RuleBasedTestFgen(RuleBasedFeatureGenerator):
     def _generate(self, df: pd.DataFrame, ctx=None) -> pd.DataFrame:
         return df
 
 
 class TestFgenBasics:
-    def __init__(self):
-        self.testdf = pd.DataFrame({"foo": [1, 2], "bar": [1, 2]})
-
-    def test_basicProperties(self):
-        testfgen = TestFgen()
+    testdf = pd.DataFrame({"foo": [1, 2], "bar": [1, 2]})
 
+    @pytest.mark.parametrize("testfgen", [TestFgen(), TestDFT().toFeatureGenerator()])
+    def test_basicProperties(self, testfgen):
         assert not testfgen.isFitted()
         assert testfgen.getGeneratedColumnNames() is None
         testfgen.fit(self.testdf)
@@ -76,7 +82,7 @@ def test_basicProperties(self):
         testfgen.generate(self.testdf)
         assert set(testfgen.getGeneratedColumnNames()) == {"foo", "bar"}
     
-    @pytest.mark.parametrize("fgen", [TestFgen(), RuleBasedTestFgen(), MultiFeatureGenerator(TestFgen()),
+    @pytest.mark.parametrize("fgen", [TestFgen(), TestDFT().toFeatureGenerator(), RuleBasedTestFgen(), MultiFeatureGenerator(TestFgen()),
         ChainedFeatureGenerator(TestFgen())])
     def test_Naming(self, fgen):
         assert isinstance(fgen.getName(), str)
diff --git a/tests/base/test_vector_model.py b/tests/base/test_vector_model.py
index 2a196e0b..9de23912 100644
--- a/tests/base/test_vector_model.py
+++ b/tests/base/test_vector_model.py
@@ -108,7 +108,7 @@ def test_isFittedWhenPreprocessorsRuleBased(self, model, ruleBasedDFT, ruleBased
     @pytest.mark.parametrize("modelConstructor", [SampleRuleBasedVectorModel, fittedVectorModel])
     def test_isFittedWithFittableProcessors(self, modelConstructor, fittableDFT, fittableFgen):
         # is fitted after fit with model
-        model = modelConstructor().withInputTransformers(fittableDFT)
+        model = modelConstructor().withRawInputTransformers(fittableDFT)
         assert not model.isFitted()
         model.fit(testX, testY)
         assert model.isFitted()
@@ -116,7 +116,7 @@ def test_isFittedWithFittableProcessors(self, modelConstructor, fittableDFT, fit
         # is fitted if DFT is fitted
         fittedDFT = copy(fittableDFT)
         fittedDFT.fit(testX)
-        model = modelConstructor().withInputTransformers(fittedDFT)
+        model = modelConstructor().withRawInputTransformers(fittedDFT)
         assert model.isFitted()
 
         # same for fgen
@@ -151,7 +151,7 @@ def test_isFittedWithTargetTransformer(self, vectorModel, fittableDFT):
 
 def test_InputRowsRemovedByTransformer(irisClassificationTestCase):
     """
-    Tests handling of case where the input generation process removes rows from the data
+    Tests handling of case where the input generation process removes rows from the raw data
     """
     iodata = irisClassificationTestCase.data
 
@@ -174,5 +174,5 @@ def _fitClassifier(self, X: pd.DataFrame, y: pd.DataFrame):
         def _predictClassProbabilities(self, X: pd.DataFrame) -> pd.DataFrame:
             pass
 
-    model = MyModel().withInputTransformers(DFTDropNA())
+    model = MyModel().withRawInputTransformers(DFTDropNA())
     model.fit(iodata.inputs, iodata.outputs)

From 5308b6c6e95c0385fe9f165469cdee4aea3aa4cf Mon Sep 17 00:00:00 2001
From: Dominik Jain <dominik.jain@jambit.com>
Date: Tue, 21 Jun 2022 11:14:24 +0200
Subject: [PATCH 121/131] Sync avancis

  commit 5d24078ced7d96bf3ca70f781b5442fd64e7769d
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Tue Jun 21 11:06:08 2022 +0200

      Added DFTCastCategoricalColumns

  sensai/data_transformation/dft.py

  commit 1a36188107daf7f7620ca7dfa225f54701608e60
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Tue Jun 21 10:58:41 2022 +0200

      Added module feature_selection.rfe with class RecursiveFeatureEliminationCV

  sensai/feature_selection/rfe.py

  commit 1a15aeb932ecb6acc0f97be985e4dab7fcbd206c
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Tue Jun 21 10:55:43 2022 +0200

      VectorModels: Added parameter fitModel to fit methods; added method removeInputPreprocessors

  sensai/tensor_model.py
  sensai/vector_model.py

  commit 84859e9b7ac56d4064a2b98fc43fe90c754dcf5d
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Tue Jun 21 10:55:25 2022 +0200

      Implement FeatureImportanceProvider in xgboost models

  sensai/xgboost.py

  commit 86dd2119157ef3fe079043d4175e4eed43f9c89a
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Tue Jun 21 10:42:57 2022 +0200

      Added class FeatureImportance as a proper representation for feature importance

      FeatureImportanceProvider: Added method getFeatureImportance returning FeatureImportance instance

      AggregatedFeatureImportances: Renamed method getFeatureImportanceSum -> getAggregatedFeatureImportanceDict;
        added method getAggregatedFeatureImportance returning FeatureImportance instance

  sensai/evaluation/eval_util.py
  sensai/feature_importance.py

  commit 7895a0eec1daa2ce8b039f2dbaac3246b1708cfe
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Mon Jun 20 14:45:55 2022 +0200

      LogTime: Added log message when starting

  sensai/util/logging.py

  commit c75ef3a43e8206a70add4f39d2c2968e60103722
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Mon Jun 20 14:17:38 2022 +0200

      VectorModel._computeModelOutputs: Store _modelOutputVariableNames only if model is being fitted

  sensai/vector_model.py

  commit b8ce50b0b952feef6d2f2e966fa5b41b41da9993
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Mon Jun 20 11:32:58 2022 +0200

      RegressionEvalStats.plotErrorDistribution: Address seaborn issue with low number of data points and bins='auto'

  sensai/evaluation/eval_stats/eval_stats_regression.py

  commit 24b678e5091b02ac4c87e1957f4c8b0a68926308
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Fri Jun 3 15:52:45 2022 +0200

      Added sklearn linear model variants: ridge & lasso regression

  sensai/sklearn/sklearn_regression.py
---
 src/sensai/data_transformation/dft.py         |  27 +++-
 .../eval_stats/eval_stats_regression.py       |  11 +-
 src/sensai/evaluation/eval_util.py            |   2 +-
 src/sensai/feature_importance.py              |  39 ++++-
 src/sensai/feature_selection/rfe.py           | 137 ++++++++++++++++++
 src/sensai/sklearn/sklearn_regression.py      |  44 +++++-
 src/sensai/tensor_model.py                    |   8 +-
 src/sensai/util/logging.py                    |   2 +
 src/sensai/vector_model.py                    |  35 +++--
 src/sensai/xgboost.py                         |  23 ++-
 10 files changed, 299 insertions(+), 29 deletions(-)
 create mode 100644 src/sensai/feature_selection/rfe.py

diff --git a/src/sensai/data_transformation/dft.py b/src/sensai/data_transformation/dft.py
index cf873ad8..f7698bb6 100644
--- a/src/sensai/data_transformation/dft.py
+++ b/src/sensai/data_transformation/dft.py
@@ -840,6 +840,31 @@ def _apply(self, df: pd.DataFrame) -> pd.DataFrame:
             return df.fillna(value=self.fillValue)
 
 
+class DFTCastCategoricalColumns(RuleBasedDataFrameTransformer):
+    """
+    Casts columns with dtype category to the given type.
+    This can be useful in cases where categorical columns are not accepted by the model but the column values are actually numeric,
+    in which case the cast to a numeric value yields an acceptable label encoding.
+    """
+    def __init__(self, columns: Optional[List[str]] = None, dtype=float):
+        """
+        :param columns: the columns to convert; if None, convert all that have dtype category
+        :param dtype: the data type to which categorical columns are to be converted
+        """
+        super().__init__()
+        self.columns = columns
+        self.dtype = dtype
+
+    def _apply(self, df: pd.DataFrame) -> pd.DataFrame:
+        df = df.copy()
+        columns = self.columns if self.columns is not None else df.columns
+        for col in columns:
+            s = df[col]
+            if s.dtype.name == "category":
+                df[col] = s.astype(self.dtype)
+        return df
+    
+
 class DFTDropNA(RuleBasedDataFrameTransformer):
     """
     Drops rows or columns containing NA/NaN values
@@ -858,4 +883,4 @@ def _apply(self, df: pd.DataFrame) -> pd.DataFrame:
             df.dropna(axis=self.axis, inplace=True)
             return df
         else:
-            return df.dropna(axis=self.axis)
\ No newline at end of file
+            return df.dropna(axis=self.axis)
diff --git a/src/sensai/evaluation/eval_stats/eval_stats_regression.py b/src/sensai/evaluation/eval_stats/eval_stats_regression.py
index c9844767..f121d4eb 100644
--- a/src/sensai/evaluation/eval_stats/eval_stats_regression.py
+++ b/src/sensai/evaluation/eval_stats/eval_stats_regression.py
@@ -1,10 +1,10 @@
 import logging
-import numpy as np
-import seaborn as sns
 from abc import abstractmethod, ABC
+from typing import List, Sequence, Optional
+
+import numpy as np
 from matplotlib import pyplot as plt
 from matplotlib.colors import LinearSegmentedColormap
-from typing import List, Sequence, Optional
 
 from .eval_stats_base import PredictionEvalStats, Metric, EvalStatsCollection, PredictionArray, EvalStatsPlot
 from ...util.plot import HistogramPlot
@@ -181,7 +181,10 @@ def plotErrorDistribution(self, bins="auto", titleAdd=None) -> Optional[plt.Figu
         title = "Prediction Error Distribution"
         if titleAdd is not None:
             title += "\n" + titleAdd
-        plot = HistogramPlot(errors, bins=bins, kde=True).title(title)
+        if bins == "auto" and len(errors) < 100:
+            bins = 10  # seaborn can crash with low number of data points and bins="auto" (tries to allocate vast amounts of memory)
+        plot = HistogramPlot(errors, bins=bins, kde=True)
+        plot.title(title)
         plot.xlabel("error (prediction - ground truth)")
         plot.ylabel("probability density")
         return plot.fig
diff --git a/src/sensai/evaluation/eval_util.py b/src/sensai/evaluation/eval_util.py
index 8a02d316..0d533e93 100644
--- a/src/sensai/evaluation/eval_util.py
+++ b/src/sensai/evaluation/eval_util.py
@@ -696,7 +696,7 @@ def _collect(self, model: Union[FeatureImportanceProvider, VectorModelBase]):
         self.aggFeatureImportance.add(model.getFeatureImportances())
 
     def plotFeatureImportance(self) -> plt.Figure:
-        return plotFeatureImportance(self.aggFeatureImportance.getFeatureImportanceSum(), subtitle=self.modelName)
+        return plotFeatureImportance(self.aggFeatureImportance.getAggregatedFeatureImportanceDict(), subtitle=self.modelName)
 
     def collectPlots(self, resultCollector: EvaluationResultCollector):
         resultCollector.addFigure(f"{self.modelName}_feature-importance", self.plotFeatureImportance())
diff --git a/src/sensai/feature_importance.py b/src/sensai/feature_importance.py
index 7da122e1..f8fafada 100644
--- a/src/sensai/feature_importance.py
+++ b/src/sensai/feature_importance.py
@@ -1,7 +1,7 @@
 import collections
 import re
 from abc import ABC, abstractmethod
-from typing import Dict, Union, Sequence
+from typing import Dict, Union, Sequence, List, Tuple
 
 import seaborn as sns
 from matplotlib import pyplot as plt
@@ -9,6 +9,35 @@
 from .util.plot import MATPLOTLIB_DEFAULT_FIGURE_SIZE
 
 
+class FeatureImportance:
+    """Feature importance values: feature -> value, or predicted variable -> (feature -> value)."""
+    def __init__(self, featureImportances: Union[Dict[str, float], Dict[str, Dict[str, float]]]):
+        self.featureImportances = featureImportances
+        # multi-variable iff the values are dict-like; an empty dict counts as single-variable instead of raising StopIteration
+        self._isMultiVar = self._isDict(next(iter(featureImportances.values()), None))
+
+    @staticmethod
+    def _isDict(x):
+        return hasattr(x, "get")  # duck-typed check for dict-like objects
+
+    def getFeatureImportanceDict(self, predictedVarName=None) -> Dict[str, float]:
+        """
+        :param predictedVarName: the predicted variable to select; ignored for single-variable data, optional if there is only one
+        :return: the mapping from feature name to importance (ValueError if the predicted variable is ambiguous)
+        """
+        if not self._isMultiVar:
+            return self.featureImportances
+        if predictedVarName is not None:
+            return self.featureImportances[predictedVarName]
+        if len(self.featureImportances) > 1:
+            raise ValueError("Must provide predicted variable name (multiple output variables)")
+        return next(iter(self.featureImportances.values()))
+
+    def getSortedTuples(self, predictedVarName=None) -> List[Tuple[str, float]]:
+        """:return: (feature name, importance) pairs in ascending order of importance"""
+        return sorted(self.getFeatureImportanceDict(predictedVarName).items(), key=lambda t: t[1])
+
+
 class FeatureImportanceProvider(ABC):
     """
     Interface for models that can provide feature importance values
@@ -23,6 +52,9 @@ def getFeatureImportances(self) -> Union[Dict[str, float], Dict[str, Dict[str, f
         """
         pass
 
+    def getFeatureImportance(self) -> FeatureImportance:
+        return FeatureImportance(self.getFeatureImportances())
+
 
 def plotFeatureImportance(featureImportanceDict: Dict[str, float], subtitle: str = None) -> plt.Figure:
     numFeatures = len(featureImportanceDict)
@@ -95,5 +127,8 @@ def _aggFeatureName(self, featureName: str):
                 return m.group(1)
         return featureName
 
-    def getFeatureImportanceSum(self) -> Union[Dict[str, float], Dict[str, Dict[str, float]]]:
+    def getAggregatedFeatureImportanceDict(self) -> Union[Dict[str, float], Dict[str, Dict[str, float]]]:
         return self.aggDict
+
+    def getAggregatedFeatureImportance(self) -> FeatureImportance:
+        return FeatureImportance(self.aggDict)
diff --git a/src/sensai/feature_selection/rfe.py b/src/sensai/feature_selection/rfe.py
new file mode 100644
index 00000000..c404c4c0
--- /dev/null
+++ b/src/sensai/feature_selection/rfe.py
@@ -0,0 +1,137 @@
+import logging
+from copy import copy
+from dataclasses import dataclass
+from typing import Union, List
+
+import matplotlib.pyplot as plt
+import numpy as np
+
+from sensai import VectorModel, InputOutputData
+from sensai.evaluation import VectorModelCrossValidatorParams, createVectorModelCrossValidator
+from sensai.feature_importance import FeatureImportanceProvider, AggregatedFeatureImportances
+from sensai.util.plot import ScatterPlot
+
+log = logging.getLogger(__name__)
+
+
+class RecursiveFeatureEliminationCV:
+    """
+    Recursive feature elimination, using cross-validation to select the best set of features:
+    In each step, the model is first evaluated using cross-validation.
+    Then the feature importance values are aggregated across the models that were trained during cross-validation,
+    and the least important feature is discarded. For the case where the lowest feature importance is 0, all
+    features with 0 importance are discarded.
+    This process is repeated until fewer than `minFeatures` features remain.
+    The selected set of features is the one from the step where cross-validation yielded the best evaluation metric value.
+
+    Feature importance is computed at the level of model input features, i.e. after feature generation and transformation.
+
+    NOTE: This implementation differs markedly from sklearn's RFECV, which performs an independent RFE for each fold.
+    RFECV determines the number of features to use by determining the elimination step in each fold that yielded the best
+    metric value on average. Because the eliminations are independent, the actual features that were being used in those steps
+    could have been completely different. Using the selected number of features n, RFECV then performs another RFE, eliminating features
+    until n features remain and returns these features as the result.
+    """
+    def __init__(self, crossValidatorParams: VectorModelCrossValidatorParams, minFeatures=1):
+        """
+        :param crossValidatorParams: the parameters for cross-validation
+        :param minFeatures: the minimum number of features to evaluate
+        """
+        self.crossValidatorParams = crossValidatorParams
+        self.minFeatures = minFeatures
+
+    @dataclass
+    class Step:
+        metricValue: float
+        features: List[str]
+
+    class Result:
+        def __init__(self, steps: List["RecursiveFeatureEliminationCV.Step"], metricName: str, minimise: bool):
+            self.steps = steps
+            self.metricName = metricName
+            self.minimise = minimise
+
+        def getSortedSteps(self) -> List["RecursiveFeatureEliminationCV.Step"]:
+            """
+            :return: the elimination step results, sorted from best to worst
+            """
+            return sorted(self.steps, key=lambda s: s.metricValue, reverse=not self.minimise)
+
+        def getSelectedFeatures(self) -> List[str]:
+            return self.getSortedSteps()[0].features
+
+        def getNumFeaturesArray(self) -> np.ndarray:
+            """
+            :return: array containing the number of features that was considered in each step
+            """
+            return np.array([len(s.features) for s in self.steps])
+
+        def getMetricValuesArray(self) -> np.ndarray:
+            """
+            :return: array containing the metric value that resulted in each step
+            """
+            return np.array([s.metricValue for s in self.steps])
+
+        def plotMetricValues(self) -> plt.Figure:
+            """
+            Plots the metric values vs. the number of features for each step of the elimination
+
+            :return: the figure
+            """
+            return ScatterPlot(self.getNumFeaturesArray(), self.getMetricValuesArray(), c_opacity=1, x_label="number of features",
+                y_label=f"cross-validation mean metric value ({self.metricName})").fig
+
+    def run(self, model: Union[VectorModel, FeatureImportanceProvider], ioData: InputOutputData, metricName: str, minimise: bool) -> Result:
+        """
+        Runs the optimisation for the given model and data.
+
+        :param model: the model
+        :param ioData: the data
+        :param metricName: the metric to optimise
+        :param minimise: whether the metric shall be minimised; if False, maximise.
+        :return: a result object, which provides access to the selected features and data on all elimination steps
+        """
+        metricKey = f"mean[{metricName}]"
+
+        model = copy(model)
+        model.fitInputOutputData(ioData, fitPreprocessors=True, fitModel=False)
+        inputs = model.computeModelInputs(ioData.inputs)
+        model.removeInputPreprocessors()
+        ioData = InputOutputData(inputs, ioData.outputs)
+
+        features = list(inputs.columns)
+        steps = []
+        while True:
+            # evaluate model
+            crossValidator = createVectorModelCrossValidator(ioData, model=model, params=self.crossValidatorParams)
+            crossValData = crossValidator.evalModel(model)
+            aggMetricsDict = crossValData.getEvalStatsCollection().aggMetricsDict()
+            metricValue = aggMetricsDict[metricKey]
+
+            steps.append(self.Step(metricValue=metricValue, features=features))
+
+            # eliminate feature(s)
+            log.info(f"Model performance with {len(features)} features: {metricKey}={metricValue}")
+            aggImportance = AggregatedFeatureImportances(*crossValData.trainedModels)
+            fi = aggImportance.getAggregatedFeatureImportance()
+            tuples = fi.getSortedTuples()
+            minImportance = tuples[0][1]
+            if minImportance == 0:
+                eliminatedFeatures = []
+                for i, (fname, importance) in enumerate(tuples):
+                    if importance > 0:
+                        break
+                    eliminatedFeatures.append(fname)
+                log.info(f"Eliminating {len(eliminatedFeatures)} features with 0 importance: {eliminatedFeatures}")
+            else:
+                eliminatedFeatures = [tuples[0][0]]
+                log.info(f"Eliminating feature {eliminatedFeatures[0]}")
+            features = [f for f in features if f not in eliminatedFeatures]
+            ioData.inputs = ioData.inputs[features]
+            log.info(f"{len(features)} features remain")
+
+            if len(features) < self.minFeatures:
+                log.info("Minimum number of features reached/exceeded")
+                break
+
+        return self.Result(steps, metricName, minimise)
\ No newline at end of file
diff --git a/src/sensai/sklearn/sklearn_regression.py b/src/sensai/sklearn/sklearn_regression.py
index 31e617c7..49bdd1cd 100644
--- a/src/sensai/sklearn/sklearn_regression.py
+++ b/src/sensai/sklearn/sklearn_regression.py
@@ -23,8 +23,48 @@ def getFeatureImportances(self) -> Dict[str, Dict[str, float]]:
 
 
 class SkLearnLinearRegressionVectorRegressionModel(AbstractSkLearnMultiDimVectorRegressionModel, FeatureImportanceProvider):
-    def __init__(self, **modelArgs):
-        super().__init__(sklearn.linear_model.LinearRegression, **modelArgs)
+    def __init__(self, fit_intercept=True, **modelArgs):
+        """
+        :param fit_intercept: whether to determine the intercept, i.e. the constant term which is not scaled with an input feature value;
+            set to False if the data is already centred
+        :param modelArgs: see https://scikit-learn.org/stable/modules/generated/sklearn.linear_model.LinearRegression.html
+        """
+        super().__init__(sklearn.linear_model.LinearRegression, fit_intercept=fit_intercept, **modelArgs)
+
+    def getFeatureImportances(self) -> Dict[str, float]:
+        return dict(zip(self._modelInputVariableNames, self.model.feature_importances_))
+
+
+class SkLearnLinearRidgeRegressionVectorRegressionModel(AbstractSkLearnMultiDimVectorRegressionModel, FeatureImportanceProvider):
+    """
+    Linear least squares with L2 regularisation
+    """
+    def __init__(self, alpha=1.0, fit_intercept=True, solver="auto", max_iter=None, tol=1e-3, **modelArgs):
+        """
+        :param alpha: multiplies the L2 term, controlling regularisation strength
+        :param fit_intercept: whether to determine the intercept, i.e. the constant term which is not scaled with an input feature value;
+            set to False if the data is already centred
+        :param modelArgs: see https://scikit-learn.org/stable/modules/generated/sklearn.linear_model.Ridge.html#sklearn.linear_model.Ridge
+        """
+        super().__init__(sklearn.linear_model.Ridge, alpha=alpha, fit_intercept=fit_intercept, max_iter=max_iter, tol=tol,
+            solver=solver, **modelArgs)
+
+    def getFeatureImportances(self) -> Dict[str, float]:
+        return dict(zip(self._modelInputVariableNames, self.model.feature_importances_))
+
+
+class SkLearnLinearLassoRegressionVectorRegressionModel(AbstractSkLearnMultiDimVectorRegressionModel, FeatureImportanceProvider):
+    """
+    Linear least squares with L1 regularisation, a.k.a. the lasso
+    """
+    def __init__(self, alpha=1.0, fit_intercept=True, max_iter=1000, tol=0.0001, **modelArgs):
+        """
+        :param alpha: multiplies the L1 term, controlling regularisation strength
+        :param fit_intercept: whether to determine the intercept, i.e. the constant term which is not scaled with an input feature value;
+            set to False if the data is already centred
+        :param modelArgs: see https://scikit-learn.org/stable/modules/generated/sklearn.linear_model.Lasso.html#sklearn.linear_model.Lasso
+        """
+        super().__init__(sklearn.linear_model.Lasso, alpha=alpha, fit_intercept=fit_intercept, max_iter=max_iter, tol=tol, **modelArgs)
 
     def getFeatureImportances(self) -> Dict[str, float]:
         return dict(zip(self._modelInputVariableNames, self.model.feature_importances_))
diff --git a/src/sensai/tensor_model.py b/src/sensai/tensor_model.py
index c853ec8f..77f858f2 100644
--- a/src/sensai/tensor_model.py
+++ b/src/sensai/tensor_model.py
@@ -262,15 +262,15 @@ def isRegressionModel(self) -> bool:
     def getNumPredictedClasses(self):
         return self._numPredictedClasses
 
-    def fit(self, X: pd.DataFrame, Y: pd.DataFrame, fitPreprocessors=True):
+    def fit(self, X: pd.DataFrame, Y: pd.DataFrame, fitPreprocessors=True, fitModel=True):
         """
 
         :param X: data frame containing input tensors on which to train
         :param Y: ground truth has to be an array containing only zeroes and ones (one-hot-encoded labels) of the shape
             `(*predictionShape, numLabels)`
 
-        :param fitPreprocessors:
-        :return:
+        :param fitPreprocessors: whether the model's preprocessors (feature generators and data frame transformers) shall be fitted
+        :param fitModel: whether the model itself shall be fitted
         """
         if len(Y.columns) != 1:
             raise ValueError(f"{self.__class__.__name__} requires exactly one output "
@@ -290,7 +290,7 @@ def fit(self, X: pd.DataFrame, Y: pd.DataFrame, fitPreprocessors=True):
                                     f"predictionShape. If the predictions are scalars, a TensorToScalarClassificationModel "
                                     f"should be used instead of {self.__class__.__name__}")
         self._numPredictedClasses = dfYToCheck.shape[-1]
-        super().fit(X, Y, fitPreprocessors=fitPreprocessors)
+        super().fit(X, Y, fitPreprocessors=fitPreprocessors, fitModel=fitModel)
 
     def getModelOutputShape(self):
         # The ground truth contains one-hot-encoded labels in the last dimension
diff --git a/src/sensai/util/logging.py b/src/sensai/util/logging.py
index 324392b1..adad5ce6 100644
--- a/src/sensai/util/logging.py
+++ b/src/sensai/util/logging.py
@@ -136,6 +136,8 @@ def start(self):
         Starts the stopwatch
         """
         self.stopwatch = StopWatch()
+        if self.enabled:
+            self.logger.info(f"{self.name} starting ...")
 
     def stop(self):
         """
diff --git a/src/sensai/vector_model.py b/src/sensai/vector_model.py
index 9be1f4ee..d35b1aff 100644
--- a/src/sensai/vector_model.py
+++ b/src/sensai/vector_model.py
@@ -243,6 +243,9 @@ def _computeModelInputs(self, X: pd.DataFrame, Y: pd.DataFrame = None, fit=False
     def _computeModelOutputs(self, Y: pd.DataFrame) -> pd.DataFrame:
         return Y
 
+    def computeModelOutputs(self, Y: pd.DataFrame) -> pd.DataFrame:
+        return self._computeModelOutputs(Y)
+
     def predict(self, x: pd.DataFrame) -> pd.DataFrame:
         """
         Applies the model to the given input data frame
@@ -295,23 +298,25 @@ def _fitPreprocessors(self, X: pd.DataFrame, Y: pd.DataFrame = None):
                 X = self._featureGenerator.fitGenerate(X, Y, self)
         self._inputTransformerChain.fit(X)
 
-    def fitInputOutputData(self, ioData: InputOutputData, fitPreprocessors=True):
+    def fitInputOutputData(self, ioData: InputOutputData, fitPreprocessors=True, fitModel=True):
         """
         Fits the model using the given data
 
         :param ioData: the input/output data
-        :param fitPreprocessors: whether the model's preprocessors (feature generators and data frame transformers) shall also be fitted
+        :param fitPreprocessors: whether the model's preprocessors (feature generators and data frame transformers) shall be fitted
+        :param fitModel: whether the model itself shall be fitted
         """
-        self.fit(ioData.inputs, ioData.outputs, fitPreprocessors=fitPreprocessors)
+        self.fit(ioData.inputs, ioData.outputs, fitPreprocessors=fitPreprocessors, fitModel=fitModel)
 
-    def fit(self, X: pd.DataFrame, Y: Optional[pd.DataFrame], fitPreprocessors=True):
+    def fit(self, X: pd.DataFrame, Y: Optional[pd.DataFrame], fitPreprocessors=True, fitModel=True):
         """
         Fits the model using the given data
 
         :param X: a data frame containing input data
         :param Y: a data frame containing output data; may be None if the underlying model does not actually require
             fitting, e.g. in the case of a rule-based models, but fitting is still necessary for preprocessors
-        :param fitPreprocessors: whether the model's preprocessors (feature generators and data frame transformers) shall also be fitted
+        :param fitPreprocessors: whether the model's preprocessors (feature generators and data frame transformers) shall be fitted
+        :param fitModel: whether the model itself shall be fitted
         """
         self._trainingContext = TrainingContext(X, Y)
         try:
@@ -336,11 +341,14 @@ def fit(self, X: pd.DataFrame, Y: Optional[pd.DataFrame], fitPreprocessors=True)
                         raise ValueError("Could not recover matching outputs for changed inputs. Only input filtering is admissible, "
                             "indices of input & ouput data frames must match.")
                 self._modelInputVariableNames = list(X.columns)
-                inputsWithTypes = ', '.join([n + '/' + X[n].dtype.name for n in self._modelInputVariableNames])
-                log.info(f"Fitting with outputs[{len(Y.columns)}]={list(Y.columns)}, "
-                    f"inputs[{len(self._modelInputVariableNames)}]=[{inputsWithTypes}]; N={len(X)} data points")
-                self._fit(X, Y)
-                self._isFitted = True
+                if fitModel:
+                    inputsWithTypes = ', '.join([n + '/' + X[n].dtype.name for n in self._modelInputVariableNames])
+                    log.info(f"Fitting with outputs[{len(Y.columns)}]={list(Y.columns)}, "
+                             f"inputs[{len(self._modelInputVariableNames)}]=[{inputsWithTypes}]; N={len(X)} data points")
+                    self._fit(X, Y)
+                    self._isFitted = True
+                else:
+                    log.info("Fitting of underlying model skipped")
             log.info(f"Fitting completed in {sw.getElapsedTimeSecs():.2f} seconds: {self}")
         finally:
             self._trainingContext = None
@@ -395,6 +403,10 @@ def getFeatureGenerator(self) -> Optional[FeatureGenerator]:
         """
         return self._featureGenerator
 
+    def removeInputPreprocessors(self):
+        self.withFeatureGenerator(None)
+        self.withInputTransformers()
+
 
 class VectorRegressionModel(VectorModel, ABC):
     def __init__(self, checkInputColumns=True):
@@ -496,7 +508,8 @@ def _applyPostProcessing(self, y: pd.DataFrame):
     def _computeModelOutputs(self, Y: pd.DataFrame) -> pd.DataFrame:
         if self._targetTransformer is not None:
             Y = self._targetTransformer.fitApply(Y)
-        self._modelOutputVariableNames = list(Y.columns)
+        if self.isBeingFitted():
+            self._modelOutputVariableNames = list(Y.columns)
         return Y
 
     def predict(self, x: pd.DataFrame) -> pd.DataFrame:
diff --git a/src/sensai/xgboost.py b/src/sensai/xgboost.py
index 202199ce..0485abe3 100644
--- a/src/sensai/xgboost.py
+++ b/src/sensai/xgboost.py
@@ -1,9 +1,12 @@
+from typing import Dict
+
 import xgboost
 
+from .feature_importance import FeatureImportanceProvider
 from .sklearn.sklearn_base import AbstractSkLearnMultipleOneDimVectorRegressionModel, AbstractSkLearnVectorClassificationModel
 
 
-class XGBGradientBoostedVectorRegressionModel(AbstractSkLearnMultipleOneDimVectorRegressionModel):
+class XGBGradientBoostedVectorRegressionModel(AbstractSkLearnMultipleOneDimVectorRegressionModel, FeatureImportanceProvider):
     """
     XGBoost's regression model using gradient boosted trees
     """
@@ -13,8 +16,11 @@ def __init__(self, random_state=42, **modelArgs):
         """
         super().__init__(xgboost.XGBRegressor, random_state=random_state, **modelArgs)
 
+    def getFeatureImportances(self) -> Dict[str, Dict[str, float]]:
+        return {targetFeature: dict(zip(self._modelInputVariableNames, model.feature_importances_)) for targetFeature, model in self.models.items()}
+
 
-class XGBRandomForestVectorRegressionModel(AbstractSkLearnMultipleOneDimVectorRegressionModel):
+class XGBRandomForestVectorRegressionModel(AbstractSkLearnMultipleOneDimVectorRegressionModel, FeatureImportanceProvider):
     """
     XGBoost's random forest regression model
     """
@@ -24,8 +30,11 @@ def __init__(self, random_state=42, **modelArgs):
         """
         super().__init__(xgboost.XGBRFRegressor, random_state=random_state, **modelArgs)
 
+    def getFeatureImportances(self) -> Dict[str, Dict[str, float]]:
+        return {targetFeature: dict(zip(self._modelInputVariableNames, model.feature_importances_)) for targetFeature, model in self.models.items()}
+
 
-class XGBGradientBoostedVectorClassificationModel(AbstractSkLearnVectorClassificationModel):
+class XGBGradientBoostedVectorClassificationModel(AbstractSkLearnVectorClassificationModel, FeatureImportanceProvider):
     """
     XGBoost's classification model using gradient boosted trees
     """
@@ -35,8 +44,11 @@ def __init__(self, random_state=42, **modelArgs):
         """
         super().__init__(xgboost.XGBClassifier, random_state=random_state, **modelArgs)
 
+    def getFeatureImportances(self) -> Dict[str, float]:
+        return dict(zip(self._modelInputVariableNames, self.model.feature_importances_))
 
-class XGBRandomForestVectorClassificationModel(AbstractSkLearnVectorClassificationModel):
+
+class XGBRandomForestVectorClassificationModel(AbstractSkLearnVectorClassificationModel, FeatureImportanceProvider):
     """
     XGBoost's random forest classification model
     """
@@ -45,3 +57,6 @@ def __init__(self, random_state=42, **modelArgs):
         :param modelArgs: See https://xgboost.readthedocs.io/en/latest/python/python_api.html#xgboost.XGBRFClassifier
         """
         super().__init__(xgboost.XGBRFClassifier, random_state=random_state, **modelArgs)
+
+    def getFeatureImportances(self) -> Dict[str, float]:
+        return dict(zip(self._modelInputVariableNames, self.model.feature_importances_))

From fd6b9f7a51168487ee87f40579280a1780da695e Mon Sep 17 00:00:00 2001
From: Dominik Jain <dominik.jain@jambit.com>
Date: Tue, 21 Jun 2022 11:28:14 +0200
Subject: [PATCH 122/131] Sync pjm
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

  commit 23c7400aa548bc15b45d21a13714bf83ed34d0bf
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Tue Jun 21 11:27:08 2022 +0200

      Renaming:
        * FeatureImportanceProvider.getFeatureImportances -> getFeatureImportanceDict
        * AggregatedFeatureImportances -> AggregatedFeatureImportance
        * ModelComparisonVisitorAggregatedFeatureImportances -> ModelComparisonVisitorAggregatedFeatureImportance

  sensai/evaluation/eval_util.py
  sensai/feature_importance.py
  sensai/feature_selection/rfe.py
  sensai/lightgbm.py
  sensai/sklearn/sklearn_classification.py
  sensai/sklearn/sklearn_regression.py
  sensai/xgboost.py

  commit 9b05cfe88f21f9c65a98c70affb9f3be2e05fb92
  Author: Julian Übelacker <julian.uebelacker@jambit.com>
  Date:   Tue Jun 14 11:57:26 2022 +0200

      Added util.math.sigmoid

  sensai/util/math.py
---
 src/sensai/evaluation/eval_util.py           |  8 ++---
 src/sensai/feature_importance.py             | 32 ++++++++++----------
 src/sensai/feature_selection/rfe.py          |  4 +--
 src/sensai/lightgbm.py                       |  4 +--
 src/sensai/sklearn/sklearn_classification.py |  2 +-
 src/sensai/sklearn/sklearn_regression.py     |  8 ++---
 src/sensai/util/math.py                      |  5 +++
 src/sensai/xgboost.py                        |  8 ++---
 8 files changed, 38 insertions(+), 33 deletions(-)

diff --git a/src/sensai/evaluation/eval_util.py b/src/sensai/evaluation/eval_util.py
index 0d533e93..4f18975d 100644
--- a/src/sensai/evaluation/eval_util.py
+++ b/src/sensai/evaluation/eval_util.py
@@ -30,7 +30,7 @@
     VectorRegressionModelEvaluationData, VectorClassificationModelEvaluator, VectorClassificationModelEvaluationData, \
     VectorRegressionModelEvaluatorParams, VectorClassificationModelEvaluatorParams, VectorModelEvaluatorParams
 from ..data import InputOutputData
-from ..feature_importance import AggregatedFeatureImportances, FeatureImportanceProvider, plotFeatureImportance
+from ..feature_importance import AggregatedFeatureImportance, FeatureImportanceProvider, plotFeatureImportance
 from ..tracking import TrackedExperiment
 from ..util.io import ResultWriter
 from ..util.plot import MATPLOTLIB_DEFAULT_FIGURE_SIZE
@@ -663,7 +663,7 @@ def collectPlots(self, resultCollector: EvaluationResultCollector) -> None:
         pass
 
 
-class ModelComparisonVisitorAggregatedFeatureImportances(ModelComparisonVisitor):
+class ModelComparisonVisitorAggregatedFeatureImportance(ModelComparisonVisitor):
     """
     During a model comparison, computes aggregated feature importance values for the model with the given name
     """
@@ -676,7 +676,7 @@ def __init__(self, modelName: str, featureAggRegEx: Sequence[str] = ()):
             to be summed under "foo" and similarly "bar_1" and "bar_2" to be summed under "bar".
         """
         self.modelName = modelName
-        self.aggFeatureImportance = AggregatedFeatureImportances(featureAggRegEx=featureAggRegEx)
+        self.aggFeatureImportance = AggregatedFeatureImportance(featureAggRegEx=featureAggRegEx)
 
     def visit(self, modelName: str, result: ModelComparisonData.Result):
         if modelName == self.modelName:
@@ -693,7 +693,7 @@ def visit(self, modelName: str, result: ModelComparisonData.Result):
     def _collect(self, model: Union[FeatureImportanceProvider, VectorModelBase]):
         if not isinstance(model, FeatureImportanceProvider):
             raise ValueError(f"Got model which does inherit from {FeatureImportanceProvider.__qualname__}: {model}")
-        self.aggFeatureImportance.add(model.getFeatureImportances())
+        self.aggFeatureImportance.add(model.getFeatureImportanceDict())
 
     def plotFeatureImportance(self) -> plt.Figure:
         return plotFeatureImportance(self.aggFeatureImportance.getAggregatedFeatureImportanceDict(), subtitle=self.modelName)
diff --git a/src/sensai/feature_importance.py b/src/sensai/feature_importance.py
index f8fafada..2eae8ca9 100644
--- a/src/sensai/feature_importance.py
+++ b/src/sensai/feature_importance.py
@@ -10,9 +10,9 @@
 
 
 class FeatureImportance:
-    def __init__(self, featureImportances: Union[Dict[str, float], Dict[str, Dict[str, float]]]):
-        self.featureImportances = featureImportances
-        self._isMultiVar = self._isDict(next(iter(featureImportances.values())))
+    def __init__(self, featureImportanceDict: Union[Dict[str, float], Dict[str, Dict[str, float]]]):
+        self.featureImportanceDict = featureImportanceDict
+        self._isMultiVar = self._isDict(next(iter(featureImportanceDict.values())))
 
     @staticmethod
     def _isDict(x):
@@ -20,16 +20,16 @@ def _isDict(x):
 
     def getFeatureImportanceDict(self, predictedVarName=None) -> Dict[str, float]:
         if self._isMultiVar:
-            self.featureImportances: Dict[str, Dict[str, float]]
+            self.featureImportanceDict: Dict[str, Dict[str, float]]
             if predictedVarName is not None:
-                return self.featureImportances[predictedVarName]
+                return self.featureImportanceDict[predictedVarName]
             else:
-                if len(self.featureImportances) > 1:
+                if len(self.featureImportanceDict) > 1:
                     raise ValueError("Must provide predicted variable name (multiple output variables)")
                 else:
-                    return next(iter(self.featureImportances.values()))
+                    return next(iter(self.featureImportanceDict.values()))
         else:
-            return self.featureImportances
+            return self.featureImportanceDict
 
     def getSortedTuples(self, predictedVarName=None) -> List[Tuple[str, float]]:
         # noinspection PyTypeChecker
@@ -43,7 +43,7 @@ class FeatureImportanceProvider(ABC):
     Interface for models that can provide feature importance values
     """
     @abstractmethod
-    def getFeatureImportances(self) -> Union[Dict[str, float], Dict[str, Dict[str, float]]]:
+    def getFeatureImportanceDict(self) -> Union[Dict[str, float], Dict[str, Dict[str, float]]]:
         """
         Gets the feature importance values
 
@@ -53,7 +53,7 @@ def getFeatureImportances(self) -> Union[Dict[str, float], Dict[str, Dict[str, f
         pass
 
     def getFeatureImportance(self) -> FeatureImportance:
-        return FeatureImportance(self.getFeatureImportances())
+        return FeatureImportance(self.getFeatureImportanceDict())
 
 
 def plotFeatureImportance(featureImportanceDict: Dict[str, float], subtitle: str = None) -> plt.Figure:
@@ -70,15 +70,15 @@ def plotFeatureImportance(featureImportanceDict: Dict[str, float], subtitle: str
     return fig
 
 
-class AggregatedFeatureImportances:
+class AggregatedFeatureImportance:
     """
     Aggregates feature importance values (e.g. from models implementing FeatureImportanceProvider, such as sklearn's RandomForest
     models and compatible models from lightgbm, etc.)
     """
-    def __init__(self, *featureImportances: Union[FeatureImportanceProvider, Dict[str, float], Dict[str, Dict[str, float]]],
+    def __init__(self, *items: Union[FeatureImportanceProvider, Dict[str, float], Dict[str, Dict[str, float]]],
             featureAggRegEx: Sequence[str] = ()):
         r"""
-        :param featureImportances: (optional) initial list of feature importance providers or dictionaries to aggregate; further
+        :param items: (optional) initial list of feature importance providers or dictionaries to aggregate; further
             values can be added via method add
         :param featureAggRegEx: a sequence of regular expressions describing which feature names to sum as one. Each regex must
             contain exactly one group. If a regex matches a feature name, the feature importance will be summed under the key
@@ -89,8 +89,8 @@ def __init__(self, *featureImportances: Union[FeatureImportanceProvider, Dict[st
         self._isNested = None
         self._numDictsAdded = 0
         self._featureAggRegEx = [re.compile(p) for p in featureAggRegEx]
-        for d in featureImportances:
-            self.add(d)
+        for item in items:
+            self.add(item)
 
     @staticmethod
     def _isDict(x):
@@ -103,7 +103,7 @@ def add(self, featureImportance: Union[FeatureImportanceProvider, Dict[str, floa
         :param featureImportance: the dictionary obtained via a model's getFeatureImportances method
         """
         if isinstance(featureImportance, FeatureImportanceProvider):
-            featureImportance = featureImportance.getFeatureImportances()
+            featureImportance = featureImportance.getFeatureImportanceDict()
         if self._isNested is None:
             self._isNested = self._isDict(next(iter(featureImportance.values())))
         if self._isNested:
diff --git a/src/sensai/feature_selection/rfe.py b/src/sensai/feature_selection/rfe.py
index c404c4c0..9d1fcd20 100644
--- a/src/sensai/feature_selection/rfe.py
+++ b/src/sensai/feature_selection/rfe.py
@@ -8,7 +8,7 @@
 
 from sensai import VectorModel, InputOutputData
 from sensai.evaluation import VectorModelCrossValidatorParams, createVectorModelCrossValidator
-from sensai.feature_importance import FeatureImportanceProvider, AggregatedFeatureImportances
+from sensai.feature_importance import FeatureImportanceProvider, AggregatedFeatureImportance
 from sensai.util.plot import ScatterPlot
 
 log = logging.getLogger(__name__)
@@ -112,7 +112,7 @@ def run(self, model: Union[VectorModel, FeatureImportanceProvider], ioData: Inpu
 
             # eliminate feature(s)
             log.info(f"Model performance with {len(features)} features: {metricKey}={metricValue}")
-            aggImportance = AggregatedFeatureImportances(*crossValData.trainedModels)
+            aggImportance = AggregatedFeatureImportance(*crossValData.trainedModels)
             fi = aggImportance.getAggregatedFeatureImportance()
             tuples = fi.getSortedTuples()
             minImportance = tuples[0][1]
diff --git a/src/sensai/lightgbm.py b/src/sensai/lightgbm.py
index e9c51421..258fd1cc 100644
--- a/src/sensai/lightgbm.py
+++ b/src/sensai/lightgbm.py
@@ -61,7 +61,7 @@ def __init__(self, categoricalFeatureNames: Optional[Union[Sequence[str], str]]
     def _updateFitArgs(self, inputs: pd.DataFrame, outputs: pd.DataFrame):
         _updateFitArgs(self.fitArgs, inputs, outputs, self._categoricalFeatureNameRegex)
 
-    def getFeatureImportances(self) -> Dict[str, Dict[str, int]]:
+    def getFeatureImportanceDict(self) -> Dict[str, Dict[str, int]]:
         return {targetFeature: dict(zip(model.feature_name_, model.feature_importances_)) for targetFeature, model in self.models.items()}
 
 
@@ -105,7 +105,7 @@ def __init__(self, categoricalFeatureNames: Optional[Union[Sequence[str], str]]
     def _updateFitArgs(self, inputs: pd.DataFrame, outputs: pd.DataFrame):
         _updateFitArgs(self.fitArgs, inputs, outputs, self._categoricalFeatureNameRegex)
 
-    def getFeatureImportances(self) -> Dict[str, Dict[str, int]]:
+    def getFeatureImportanceDict(self) -> Dict[str, int]:
         return dict(zip(self.model.feature_name_, self.model.feature_importances_))
 
     def _predictClassProbabilities(self, x: pd.DataFrame):
diff --git a/src/sensai/sklearn/sklearn_classification.py b/src/sensai/sklearn/sklearn_classification.py
index 9365446a..e59d10f1 100644
--- a/src/sensai/sklearn/sklearn_classification.py
+++ b/src/sensai/sklearn/sklearn_classification.py
@@ -25,7 +25,7 @@ def __init__(self, min_samples_leaf=8, random_state=42, useComputedClassWeights=
             useComputedClassWeights=useComputedClassWeights,
             **modelArgs)
 
-    def getFeatureImportances(self) -> Dict[str, float]:
+    def getFeatureImportanceDict(self) -> Dict[str, float]:
         return dict(zip(self._modelInputVariableNames, self.model.feature_importances_))
 
 
diff --git a/src/sensai/sklearn/sklearn_regression.py b/src/sensai/sklearn/sklearn_regression.py
index 49bdd1cd..d0e575d0 100644
--- a/src/sensai/sklearn/sklearn_regression.py
+++ b/src/sensai/sklearn/sklearn_regression.py
@@ -18,7 +18,7 @@ def __init__(self, n_estimators=100, min_samples_leaf=10, random_state=42, **mod
         super().__init__(sklearn.ensemble.RandomForestRegressor,
             n_estimators=n_estimators, min_samples_leaf=min_samples_leaf, random_state=random_state, **modelArgs)
 
-    def getFeatureImportances(self) -> Dict[str, Dict[str, float]]:
+    def getFeatureImportanceDict(self) -> Dict[str, Dict[str, float]]:
         return {targetFeature: dict(zip(self._modelInputVariableNames, model.feature_importances_)) for targetFeature, model in self.models.items()}
 
 
@@ -31,7 +31,7 @@ def __init__(self, fit_intercept=True, **modelArgs):
         """
         super().__init__(sklearn.linear_model.LinearRegression, fit_intercept=fit_intercept, **modelArgs)
 
-    def getFeatureImportances(self) -> Dict[str, float]:
+    def getFeatureImportanceDict(self) -> Dict[str, float]:
         return dict(zip(self._modelInputVariableNames, self.model.feature_importances_))
 
 
@@ -49,7 +49,7 @@ def __init__(self, alpha=1.0, fit_intercept=True, solver="auto", max_iter=None,
         super().__init__(sklearn.linear_model.Ridge, alpha=alpha, fit_intercept=fit_intercept, max_iter=max_iter, tol=tol,
             solver=solver, **modelArgs)
 
-    def getFeatureImportances(self) -> Dict[str, float]:
+    def getFeatureImportanceDict(self) -> Dict[str, float]:
         return dict(zip(self._modelInputVariableNames, self.model.feature_importances_))
 
 
@@ -66,7 +66,7 @@ def __init__(self, alpha=1.0, fit_intercept=True, max_iter=1000, tol=0.0001, **m
         """
         super().__init__(sklearn.linear_model.Lasso, alpha=alpha, fit_intercept=fit_intercept, max_iter=max_iter, tol=tol, **modelArgs)
 
-    def getFeatureImportances(self) -> Dict[str, float]:
+    def getFeatureImportanceDict(self) -> Dict[str, float]:
         return dict(zip(self._modelInputVariableNames, self.model.feature_importances_))
 
 
diff --git a/src/sensai/util/math.py b/src/sensai/util/math.py
index f9e2efae..bcbc8ced 100644
--- a/src/sensai/util/math.py
+++ b/src/sensai/util/math.py
@@ -1,3 +1,4 @@
+import math
 import scipy.stats
 
 from .string import objectRepr
@@ -25,5 +26,9 @@ def __str__(self):
         return objectRepr(self, ["mean", "std", "unitMax"])
 
 
+def sigmoid(x: float) -> float:  # logistic function 1 / (1 + exp(-x))
+    return 1 / (1 + math.exp(-x)) if x >= 0 else math.exp(x) / (1 + math.exp(x))  # sign-dependent form: exp never overflows
+
+
 def reduceFloatPrecisionDecimals(f: float, decimals: int) -> float:
     return float(format(f, '.%df' % decimals))
\ No newline at end of file
diff --git a/src/sensai/xgboost.py b/src/sensai/xgboost.py
index 0485abe3..85141c36 100644
--- a/src/sensai/xgboost.py
+++ b/src/sensai/xgboost.py
@@ -16,7 +16,7 @@ def __init__(self, random_state=42, **modelArgs):
         """
         super().__init__(xgboost.XGBRegressor, random_state=random_state, **modelArgs)
 
-    def getFeatureImportances(self) -> Dict[str, Dict[str, float]]:
+    def getFeatureImportanceDict(self) -> Dict[str, Dict[str, float]]:
         return {targetFeature: dict(zip(self._modelInputVariableNames, model.feature_importances_)) for targetFeature, model in self.models.items()}
 
 
@@ -30,7 +30,7 @@ def __init__(self, random_state=42, **modelArgs):
         """
         super().__init__(xgboost.XGBRFRegressor, random_state=random_state, **modelArgs)
 
-    def getFeatureImportances(self) -> Dict[str, Dict[str, float]]:
+    def getFeatureImportanceDict(self) -> Dict[str, Dict[str, float]]:
         return {targetFeature: dict(zip(self._modelInputVariableNames, model.feature_importances_)) for targetFeature, model in self.models.items()}
 
 
@@ -44,7 +44,7 @@ def __init__(self, random_state=42, **modelArgs):
         """
         super().__init__(xgboost.XGBClassifier, random_state=random_state, **modelArgs)
 
-    def getFeatureImportances(self) -> Dict[str, float]:
+    def getFeatureImportanceDict(self) -> Dict[str, float]:
         return dict(zip(self._modelInputVariableNames, self.model.feature_importances_))
 
 
@@ -58,5 +58,5 @@ def __init__(self, random_state=42, **modelArgs):
         """
         super().__init__(xgboost.XGBRFClassifier, random_state=random_state, **modelArgs)
 
-    def getFeatureImportances(self) -> Dict[str, float]:
+    def getFeatureImportanceDict(self) -> Dict[str, float]:
         return dict(zip(self._modelInputVariableNames, self.model.feature_importances_))

From 5c049494a92affe2d09058454e220cf9f627c585 Mon Sep 17 00:00:00 2001
From: Dominik Jain <dominik.jain@jambit.com>
Date: Tue, 21 Jun 2022 11:32:09 +0200
Subject: [PATCH 123/131] Added FeatureImportanceProvider.getFeatureImportances
 (deprecated) for backward compatibility

---
 src/sensai/feature_importance.py | 5 +++++
 1 file changed, 5 insertions(+)

diff --git a/src/sensai/feature_importance.py b/src/sensai/feature_importance.py
index 2eae8ca9..bc12c289 100644
--- a/src/sensai/feature_importance.py
+++ b/src/sensai/feature_importance.py
@@ -6,6 +6,7 @@
 import seaborn as sns
 from matplotlib import pyplot as plt
 
+from .util.deprecation import deprecated
 from .util.plot import MATPLOTLIB_DEFAULT_FIGURE_SIZE
 
 
@@ -55,6 +56,10 @@ def getFeatureImportanceDict(self) -> Union[Dict[str, float], Dict[str, Dict[str
     def getFeatureImportance(self) -> FeatureImportance:
         return FeatureImportance(self.getFeatureImportanceDict())
 
+    @deprecated("Use getFeatureImportanceDict or the high-level interface getFeatureImportance instead.")
+    def getFeatureImportances(self) -> Union[Dict[str, float], Dict[str, Dict[str, float]]]:
+        return self.getFeatureImportanceDict()
+
 
 def plotFeatureImportance(featureImportanceDict: Dict[str, float], subtitle: str = None) -> plt.Figure:
     numFeatures = len(featureImportanceDict)

From a2bbbabc68b53fb9f8f4de385611967e591d1ba3 Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Wed, 22 Jun 2022 00:02:56 +0200
Subject: [PATCH 124/131] Extended VectorModel.removeInputPreprocessors to also
 remove the newly introduced raw input transformers

---
 src/sensai/vector_model.py | 7 +++++--
 1 file changed, 5 insertions(+), 2 deletions(-)

diff --git a/src/sensai/vector_model.py b/src/sensai/vector_model.py
index 534ba865..29e08125 100644
--- a/src/sensai/vector_model.py
+++ b/src/sensai/vector_model.py
@@ -447,7 +447,6 @@ def getInputTransformerChain(self) -> DataFrameTransformerChain:
         """
         return self._featureTransformerChain
 
-
     def getRawInputTransformerChain(self) -> DataFrameTransformerChain:
         """
         :return: the model's raw input transformer chain (which may be empty and contain no actual transformers),
@@ -472,8 +471,12 @@ def getFeatureGenerator(self) -> Optional[FeatureGenerator]:
         return self._featureGenerator
 
     def removeInputPreprocessors(self):
+        """
+        Removes all input preprocessors (i.e. raw input transformers, feature generators and feature transformers) from the model
+        """
+        self.withRawInputTransformers()
         self.withFeatureGenerator(None)
-        self.withInputTransformers()
+        self.withFeatureTransformers()
 
 
 class VectorRegressionModel(VectorModel, ABC):

From 50212b92f1142f2ec625e4bf5169be7dd33d8c2c Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Wed, 22 Jun 2022 00:12:03 +0200
Subject: [PATCH 125/131] Fixed backward compatibility: default value for new
 attribute _rawInputTransformerChain was not set

---
 src/sensai/vector_model.py | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/src/sensai/vector_model.py b/src/sensai/vector_model.py
index 29e08125..c8bc2d67 100644
--- a/src/sensai/vector_model.py
+++ b/src/sensai/vector_model.py
@@ -128,7 +128,8 @@ def __getstate__(self):
     def __setstate__(self, state):
         for m in VectorModel._TRANSIENT_MEMBERS:
             state[m] = None
-        setstate(VectorModel, self, state, renamedProperties=self._RENAMED_MEMBERS)
+        setstate(VectorModel, self, state, renamedProperties=self._RENAMED_MEMBERS,
+            newDefaultProperties={"_rawInputTransformerChain": DataFrameTransformerChain()})
 
     def _toStringExcludePrivate(self) -> bool:
         return True

From e7f5df81314ce1310c8dc9573e499923d4743785 Mon Sep 17 00:00:00 2001
From: Dominik Jain <djain@gmx.net>
Date: Thu, 23 Jun 2022 21:41:04 +0200
Subject: [PATCH 126/131] Added feature importance mixins for sklearn-type
 models, eliminating duplicate implementations

---
 src/sensai/lightgbm.py                       | 19 ++++++--------
 src/sensai/sklearn/sklearn_base.py           | 21 +++++++++++++++-
 src/sensai/sklearn/sklearn_classification.py | 12 +++------
 src/sensai/sklearn/sklearn_regression.py     | 26 ++++++--------------
 src/sensai/xgboost.py                        | 26 +++++---------------
 5 files changed, 44 insertions(+), 60 deletions(-)

diff --git a/src/sensai/lightgbm.py b/src/sensai/lightgbm.py
index 258fd1cc..4f09a47e 100644
--- a/src/sensai/lightgbm.py
+++ b/src/sensai/lightgbm.py
@@ -1,12 +1,13 @@
-from typing import Sequence, Union, Optional, Dict
 import logging
+import re
+from typing import Sequence, Union, Optional
+
 import lightgbm
 import pandas as pd
-import re
 
-from .feature_importance import FeatureImportanceProvider
+from .sklearn.sklearn_base import AbstractSkLearnMultipleOneDimVectorRegressionModel, AbstractSkLearnVectorClassificationModel, \
+    FeatureImportanceProviderSkLearnRegressionMultipleOneDim, FeatureImportanceProviderSkLearnClassification
 from .util.string import orRegexGroup
-from .sklearn.sklearn_base import AbstractSkLearnMultipleOneDimVectorRegressionModel, AbstractSkLearnVectorClassificationModel
 
 log = logging.getLogger(__name__)
 
@@ -24,7 +25,7 @@ def _updateFitArgs(fitArgs: dict, inputs: pd.DataFrame, outputs: pd.DataFrame, c
         fitArgs.pop("categorical_feature", None)
 
 
-class LightGBMVectorRegressionModel(AbstractSkLearnMultipleOneDimVectorRegressionModel, FeatureImportanceProvider):
+class LightGBMVectorRegressionModel(AbstractSkLearnMultipleOneDimVectorRegressionModel, FeatureImportanceProviderSkLearnRegressionMultipleOneDim):
     log = log.getChild(__qualname__)
 
     def __init__(self, categoricalFeatureNames: Optional[Union[Sequence[str], str]] = None, random_state=42, num_leaves=31,
@@ -61,11 +62,8 @@ def __init__(self, categoricalFeatureNames: Optional[Union[Sequence[str], str]]
     def _updateFitArgs(self, inputs: pd.DataFrame, outputs: pd.DataFrame):
         _updateFitArgs(self.fitArgs, inputs, outputs, self._categoricalFeatureNameRegex)
 
-    def getFeatureImportanceDict(self) -> Dict[str, Dict[str, int]]:
-        return {targetFeature: dict(zip(model.feature_name_, model.feature_importances_)) for targetFeature, model in self.models.items()}
 
-
-class LightGBMVectorClassificationModel(AbstractSkLearnVectorClassificationModel, FeatureImportanceProvider):
+class LightGBMVectorClassificationModel(AbstractSkLearnVectorClassificationModel, FeatureImportanceProviderSkLearnClassification):
     log = log.getChild(__qualname__)
 
     def __init__(self, categoricalFeatureNames: Optional[Union[Sequence[str], str]] = None, random_state=42, num_leaves=31,
@@ -105,9 +103,6 @@ def __init__(self, categoricalFeatureNames: Optional[Union[Sequence[str], str]]
     def _updateFitArgs(self, inputs: pd.DataFrame, outputs: pd.DataFrame):
         _updateFitArgs(self.fitArgs, inputs, outputs, self._categoricalFeatureNameRegex)
 
-    def getFeatureImportanceDict(self) -> Dict[str, Dict[str, int]]:
-        return dict(zip(self.model.feature_name_, self.model.feature_importances_))
-
     def _predictClassProbabilities(self, x: pd.DataFrame):
         if len(self._labels) == 1:
             # special handling required because LGBMClassifier will return values for two classes even if there is only one
diff --git a/src/sensai/sklearn/sklearn_base.py b/src/sensai/sklearn/sklearn_base.py
index 38f7859a..c719fff0 100644
--- a/src/sensai/sklearn/sklearn_base.py
+++ b/src/sensai/sklearn/sklearn_base.py
@@ -8,6 +8,7 @@
 import pandas as pd
 from sklearn import compose
 
+from ..feature_importance import FeatureImportanceProvider
 from ..util.pickle import setstate
 from ..vector_model import VectorRegressionModel, VectorClassificationModel
 
@@ -303,4 +304,22 @@ def _computeClassWeights(self, outputs: pd.DataFrame):
         counts = classes.value_counts()
         rfreqs = counts / counts.sum()
         weights: pd.Series = 1.0 / rfreqs
-        return weights.to_dict()
\ No newline at end of file
+        return weights.to_dict()
+
+
+class FeatureImportanceProviderSkLearnRegressionMultipleOneDim(FeatureImportanceProvider):
+    def getFeatureImportanceDict(self) -> Dict[str, Dict[str, int]]:
+        self: AbstractSkLearnMultipleOneDimVectorRegressionModel
+        return {targetFeature: dict(zip(model.feature_name_, model.feature_importances_)) for targetFeature, model in self.models.items()}
+
+
+class FeatureImportanceProviderSkLearnRegressionMultiDim(FeatureImportanceProvider):
+    def getFeatureImportanceDict(self) -> Dict[str, float]:
+        self: AbstractSkLearnMultiDimVectorRegressionModel
+        return dict(zip(self._modelInputVariableNames, self.model.feature_importances_))
+
+
+class FeatureImportanceProviderSkLearnClassification(FeatureImportanceProvider):
+    def getFeatureImportanceDict(self) -> Dict[str, float]:
+        self: AbstractSkLearnVectorClassificationModel
+        return dict(zip(self._modelInputVariableNames, self.model.feature_importances_))
diff --git a/src/sensai/sklearn/sklearn_classification.py b/src/sensai/sklearn/sklearn_classification.py
index e59d10f1..51a060fd 100644
--- a/src/sensai/sklearn/sklearn_classification.py
+++ b/src/sensai/sklearn/sklearn_classification.py
@@ -1,13 +1,12 @@
 import logging
-from typing import Union, Optional, Dict
+from typing import Union, Optional
 
 import sklearn.ensemble
 import sklearn.naive_bayes
 import sklearn.neural_network
 import sklearn.tree
 
-from .sklearn_base import AbstractSkLearnVectorClassificationModel
-from ..feature_importance import FeatureImportanceProvider
+from .sklearn_base import AbstractSkLearnVectorClassificationModel, FeatureImportanceProviderSkLearnClassification
 
 log = logging.getLogger(__name__)
 
@@ -18,16 +17,13 @@ def __init__(self, min_samples_leaf=8, random_state=42, **modelArgs):
             min_samples_leaf=min_samples_leaf, random_state=random_state, **modelArgs)
 
 
-class SkLearnRandomForestVectorClassificationModel(AbstractSkLearnVectorClassificationModel, FeatureImportanceProvider):
+class SkLearnRandomForestVectorClassificationModel(AbstractSkLearnVectorClassificationModel, FeatureImportanceProviderSkLearnClassification):
     def __init__(self, min_samples_leaf=8, random_state=42, useComputedClassWeights=False, **modelArgs):
         super().__init__(sklearn.ensemble.RandomForestClassifier,
             random_state=random_state, min_samples_leaf=min_samples_leaf,
             useComputedClassWeights=useComputedClassWeights,
             **modelArgs)
 
-    def getFeatureImportanceDict(self) -> Dict[str, float]:
-        return dict(zip(self._modelInputVariableNames, self.model.feature_importances_))
-
 
 class SkLearnMLPVectorClassificationModel(AbstractSkLearnVectorClassificationModel):
     def __init__(self, hidden_layer_sizes=(100,), activation: str = "relu",
@@ -60,4 +56,4 @@ def __init__(self, random_state=42, **modelArgs):
 
 class SkLearnLogisticRegressionVectorClassificationModel(AbstractSkLearnVectorClassificationModel):
     def __init__(self, random_state=42, **modelArgs):
-        super().__init__(sklearn.linear_model.LogisticRegression, random_state=random_state, **modelArgs)
\ No newline at end of file
+        super().__init__(sklearn.linear_model.LogisticRegression, random_state=random_state, **modelArgs)
diff --git a/src/sensai/sklearn/sklearn_regression.py b/src/sensai/sklearn/sklearn_regression.py
index d0e575d0..23c4b5e4 100644
--- a/src/sensai/sklearn/sklearn_regression.py
+++ b/src/sensai/sklearn/sklearn_regression.py
@@ -1,5 +1,5 @@
 import logging
-from typing import Union, Optional, Dict
+from typing import Union, Optional
 
 import sklearn.ensemble
 import sklearn.linear_model
@@ -7,22 +7,19 @@
 import sklearn.neural_network
 import sklearn.svm
 
-from .sklearn_base import AbstractSkLearnMultipleOneDimVectorRegressionModel, AbstractSkLearnMultiDimVectorRegressionModel
-from ..feature_importance import FeatureImportanceProvider
+from .sklearn_base import AbstractSkLearnMultipleOneDimVectorRegressionModel, AbstractSkLearnMultiDimVectorRegressionModel, \
+    FeatureImportanceProviderSkLearnRegressionMultipleOneDim, FeatureImportanceProviderSkLearnRegressionMultiDim
 
 log = logging.getLogger(__name__)
 
 
-class SkLearnRandomForestVectorRegressionModel(AbstractSkLearnMultipleOneDimVectorRegressionModel, FeatureImportanceProvider):
+class SkLearnRandomForestVectorRegressionModel(AbstractSkLearnMultipleOneDimVectorRegressionModel, FeatureImportanceProviderSkLearnRegressionMultipleOneDim):
     def __init__(self, n_estimators=100, min_samples_leaf=10, random_state=42, **modelArgs):
         super().__init__(sklearn.ensemble.RandomForestRegressor,
             n_estimators=n_estimators, min_samples_leaf=min_samples_leaf, random_state=random_state, **modelArgs)
 
-    def getFeatureImportanceDict(self) -> Dict[str, Dict[str, float]]:
-        return {targetFeature: dict(zip(self._modelInputVariableNames, model.feature_importances_)) for targetFeature, model in self.models.items()}
 
-
-class SkLearnLinearRegressionVectorRegressionModel(AbstractSkLearnMultiDimVectorRegressionModel, FeatureImportanceProvider):
+class SkLearnLinearRegressionVectorRegressionModel(AbstractSkLearnMultiDimVectorRegressionModel, FeatureImportanceProviderSkLearnRegressionMultiDim):
     def __init__(self, fit_intercept=True, **modelArgs):
         """
         :param fit_intercept: whether to determine the intercept, i.e. the constant term which is not scaled with an input feature value;
@@ -31,11 +28,8 @@ def __init__(self, fit_intercept=True, **modelArgs):
         """
         super().__init__(sklearn.linear_model.LinearRegression, fit_intercept=fit_intercept, **modelArgs)
 
-    def getFeatureImportanceDict(self) -> Dict[str, float]:
-        return dict(zip(self._modelInputVariableNames, self.model.feature_importances_))
-
 
-class SkLearnLinearRidgeRegressionVectorRegressionModel(AbstractSkLearnMultiDimVectorRegressionModel, FeatureImportanceProvider):
+class SkLearnLinearRidgeRegressionVectorRegressionModel(AbstractSkLearnMultiDimVectorRegressionModel, FeatureImportanceProviderSkLearnRegressionMultiDim):
     """
     Linear least squares with L2 regularisation
     """
@@ -49,11 +43,8 @@ def __init__(self, alpha=1.0, fit_intercept=True, solver="auto", max_iter=None,
         super().__init__(sklearn.linear_model.Ridge, alpha=alpha, fit_intercept=fit_intercept, max_iter=max_iter, tol=tol,
             solver=solver, **modelArgs)
 
-    def getFeatureImportanceDict(self) -> Dict[str, float]:
-        return dict(zip(self._modelInputVariableNames, self.model.feature_importances_))
 
-
-class SkLearnLinearLassoRegressionVectorRegressionModel(AbstractSkLearnMultiDimVectorRegressionModel, FeatureImportanceProvider):
+class SkLearnLinearLassoRegressionVectorRegressionModel(AbstractSkLearnMultiDimVectorRegressionModel, FeatureImportanceProviderSkLearnRegressionMultiDim):
     """
     Linear least squares with L1 regularisation, a.k.a. the lasso
     """
@@ -66,9 +57,6 @@ def __init__(self, alpha=1.0, fit_intercept=True, max_iter=1000, tol=0.0001, **m
         """
         super().__init__(sklearn.linear_model.Lasso, alpha=alpha, fit_intercept=fit_intercept, max_iter=max_iter, tol=tol, **modelArgs)
 
-    def getFeatureImportanceDict(self) -> Dict[str, float]:
-        return dict(zip(self._modelInputVariableNames, self.model.feature_importances_))
-
 
 class SkLearnMultiLayerPerceptronVectorRegressionModel(AbstractSkLearnMultiDimVectorRegressionModel):
     def __init__(self,
diff --git a/src/sensai/xgboost.py b/src/sensai/xgboost.py
index 85141c36..8775f9d9 100644
--- a/src/sensai/xgboost.py
+++ b/src/sensai/xgboost.py
@@ -1,12 +1,10 @@
-from typing import Dict
-
 import xgboost
 
-from .feature_importance import FeatureImportanceProvider
-from .sklearn.sklearn_base import AbstractSkLearnMultipleOneDimVectorRegressionModel, AbstractSkLearnVectorClassificationModel
+from .sklearn.sklearn_base import AbstractSkLearnMultipleOneDimVectorRegressionModel, AbstractSkLearnVectorClassificationModel, \
+    FeatureImportanceProviderSkLearnRegressionMultipleOneDim, FeatureImportanceProviderSkLearnClassification
 
 
-class XGBGradientBoostedVectorRegressionModel(AbstractSkLearnMultipleOneDimVectorRegressionModel, FeatureImportanceProvider):
+class XGBGradientBoostedVectorRegressionModel(AbstractSkLearnMultipleOneDimVectorRegressionModel, FeatureImportanceProviderSkLearnRegressionMultipleOneDim):
     """
     XGBoost's regression model using gradient boosted trees
     """
@@ -16,11 +14,8 @@ def __init__(self, random_state=42, **modelArgs):
         """
         super().__init__(xgboost.XGBRegressor, random_state=random_state, **modelArgs)
 
-    def getFeatureImportanceDict(self) -> Dict[str, Dict[str, float]]:
-        return {targetFeature: dict(zip(self._modelInputVariableNames, model.feature_importances_)) for targetFeature, model in self.models.items()}
-
 
-class XGBRandomForestVectorRegressionModel(AbstractSkLearnMultipleOneDimVectorRegressionModel, FeatureImportanceProvider):
+class XGBRandomForestVectorRegressionModel(AbstractSkLearnMultipleOneDimVectorRegressionModel, FeatureImportanceProviderSkLearnRegressionMultipleOneDim):
     """
     XGBoost's random forest regression model
     """
@@ -30,11 +25,8 @@ def __init__(self, random_state=42, **modelArgs):
         """
         super().__init__(xgboost.XGBRFRegressor, random_state=random_state, **modelArgs)
 
-    def getFeatureImportanceDict(self) -> Dict[str, Dict[str, float]]:
-        return {targetFeature: dict(zip(self._modelInputVariableNames, model.feature_importances_)) for targetFeature, model in self.models.items()}
-
 
-class XGBGradientBoostedVectorClassificationModel(AbstractSkLearnVectorClassificationModel, FeatureImportanceProvider):
+class XGBGradientBoostedVectorClassificationModel(AbstractSkLearnVectorClassificationModel, FeatureImportanceProviderSkLearnClassification):
     """
     XGBoost's classification model using gradient boosted trees
     """
@@ -44,11 +36,8 @@ def __init__(self, random_state=42, **modelArgs):
         """
         super().__init__(xgboost.XGBClassifier, random_state=random_state, **modelArgs)
 
-    def getFeatureImportanceDict(self) -> Dict[str, float]:
-        return dict(zip(self._modelInputVariableNames, self.model.feature_importances_))
 
-
-class XGBRandomForestVectorClassificationModel(AbstractSkLearnVectorClassificationModel, FeatureImportanceProvider):
+class XGBRandomForestVectorClassificationModel(AbstractSkLearnVectorClassificationModel, FeatureImportanceProviderSkLearnClassification):
     """
     XGBoost's random forest classification model
     """
@@ -57,6 +46,3 @@ def __init__(self, random_state=42, **modelArgs):
         :param modelArgs: See https://xgboost.readthedocs.io/en/latest/python/python_api.html#xgboost.XGBRFClassifier
         """
         super().__init__(xgboost.XGBRFClassifier, random_state=random_state, **modelArgs)
-
-    def getFeatureImportanceDict(self) -> Dict[str, float]:
-        return dict(zip(self._modelInputVariableNames, self.model.feature_importances_))

From c94c96529a3678582d7daae111d8681b30194d3a Mon Sep 17 00:00:00 2001
From: Dominik Jain <dominik.jain@jambit.com>
Date: Tue, 28 Jun 2022 20:44:54 +0200
Subject: [PATCH 127/131] Sync avancis

  commit b3750b99a7f49a8e6d476d26a5b24d2f63a033d6
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Tue Jun 28 20:43:27 2022 +0200

      Support visitor result collection in EvaluationUtil.compareModels; added CSV result to feature importance visitor

  sensai/evaluation/eval_util.py

  commit fdea09fa138b6dc7f9760c5a7dbf5d7179f08207
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Tue Jun 28 20:42:31 2022 +0200

      Improved string representations for TorchVector*Models without instantiated submodel

  sensai/torch/torch_base.py

  commit 2d2228aa95ca80516586ebde0d2345b5b41b9217
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Tue Jun 28 19:20:19 2022 +0200

      Changed log level of message listing i/o columns to DEBUG (as it may be excessively long)

  sensai/vector_model.py

  commit 390a1e1457d2cb72dbe0e4d68fd9c22d6ed2c965
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Mon Jun 27 19:25:16 2022 +0200

      VectorRegressionModelEvaluatorParams: Allow controlling the full set of metrics (not only additionalMetrics)

  sensai/evaluation/evaluator.py
---
 src/sensai/evaluation/eval_util.py | 38 ++++++++++++++++++++++--------
 src/sensai/evaluation/evaluator.py |  9 ++++---
 src/sensai/torch/torch_base.py     | 12 ++++++++--
 src/sensai/vector_model.py         |  2 +-
 4 files changed, 45 insertions(+), 16 deletions(-)

diff --git a/src/sensai/evaluation/eval_util.py b/src/sensai/evaluation/eval_util.py
index 4f18975d..ddcf2edc 100644
--- a/src/sensai/evaluation/eval_util.py
+++ b/src/sensai/evaluation/eval_util.py
@@ -139,10 +139,14 @@ def __init__(self, showPlots: bool = True, resultWriter: Optional[ResultWriter]
         self.showPlots = showPlots
         self.resultWriter = resultWriter
 
-    def addFigure(self, name, fig: matplotlib.figure.Figure):
+    def addFigure(self, name: str, fig: matplotlib.figure.Figure):
         if self.resultWriter is not None:
             self.resultWriter.writeFigure(name, fig, closeFigure=not self.showPlots)
 
+    def addDataFrameCsvFile(self, name: str, df: pd.DataFrame):
+        if self.resultWriter is not None:
+            self.resultWriter.writeDataFrameCsvFile(name, df)
+
     def child(self, addedFilenamePrefix):
         resultWriter = self.resultWriter
         if resultWriter:
@@ -315,7 +319,8 @@ def performCrossValidation(self, model: TModel, showPlots=False, logResults=True
 
     def compareModels(self, models: Sequence[TModel], resultWriter: Optional[ResultWriter] = None, useCrossValidation=False,
             fitModels=True, writeIndividualResults=True, sortColumn: Optional[str] = None, sortAscending: bool = True,
-            visitors: Optional[Iterable["ModelComparisonVisitor"]] = None) -> "ModelComparisonData":
+            visitors: Optional[Iterable["ModelComparisonVisitor"]] = None,
+            writeVisitorResults=False) -> "ModelComparisonData":
         """
         Compares several models via simple evaluation or cross-validation
 
@@ -329,6 +334,7 @@ def compareModels(self, models: Sequence[TModel], resultWriter: Optional[ResultW
         :param sortColumn: column/metric name by which to sort
         :param sortAscending: whether to sort in ascending order
         :param visitors: visitors which may process individual results
+        :param writeVisitorResults: whether to collect results from visitors (if any) after the comparison
         :return: the comparison results
         """
         statsList = []
@@ -368,6 +374,10 @@ def compareModels(self, models: Sequence[TModel], resultWriter: Optional[ResultW
             suffix = "crossval" if useCrossValidation else "simple-eval"
             strResults += "\n\n" + "\n\n".join([f"{model.getName()} = {str(model)}" for model in models])
             resultWriter.writeTextFile(f"model-comparison-results-{suffix}", strResults)
+        if visitors is not None and writeVisitorResults:
+            resultCollector = EvaluationResultCollector(showPlots=False, resultWriter=resultWriter)
+            for visitor in visitors:
+                visitor.collectResults(resultCollector)
         return ModelComparisonData(resultsDF, resultByModelName)
 
     def compareModelsCrossValidation(self, models: Sequence[TModel], resultWriter: Optional[ResultWriter] = None) -> "ModelComparisonData":
@@ -540,7 +550,8 @@ def compareModels(self, modelFactories: Sequence[Callable[[], Union[VectorRegres
 
             # compute data frame with results for current data set
             childResultWriter = resultWriter.childForSubdirectory(key) if (writePerDatasetResults and resultWriter is not None) else None
-            comparisonData = ev.compareModels(models, useCrossValidation=useCrossValidation, resultWriter=childResultWriter, visitors=visitors)
+            comparisonData = ev.compareModels(models, useCrossValidation=useCrossValidation, resultWriter=childResultWriter,
+                visitors=visitors, writeVisitorResults=False)
             df = comparisonData.resultsDF
 
             # augment data frame
@@ -608,11 +619,11 @@ def compareModels(self, modelFactories: Sequence[Callable[[], Union[VectorRegres
                     evalStats = ClassificationEvalStatsCollection(evalStatsList).getGlobalStats()
                 plotCollector.createPlots(evalStats, subtitle=modelName, resultCollector=resultCollector)
 
-        # create plots from visitors (if any)
+        # collect results from visitors (if any)
         resultCollector = EvaluationResultCollector(showPlots=False, resultWriter=resultWriter)
         if visitors is not None:
             for visitor in visitors:
-                visitor.collectPlots(resultCollector)
+                visitor.collectResults(resultCollector)
 
         # create result
         if isRegression:
@@ -654,9 +665,9 @@ def visit(self, modelName: str, result: ModelComparisonData.Result):
         pass
 
     @abstractmethod
-    def collectPlots(self, resultCollector: EvaluationResultCollector) -> None:
+    def collectResults(self, resultCollector: EvaluationResultCollector) -> None:
         """
-        Collects figures at the end of the model comparison, based on the results collected
+        Collects results (such as figures) at the end of the model comparison, based on the results collected
 
         :param resultCollector: the collector to which figures are to be added
         """
@@ -667,7 +678,7 @@ class ModelComparisonVisitorAggregatedFeatureImportance(ModelComparisonVisitor):
     """
     During a model comparison, computes aggregated feature importance values for the model with the given name
     """
-    def __init__(self, modelName: str, featureAggRegEx: Sequence[str] = ()):
+    def __init__(self, modelName: str, featureAggRegEx: Sequence[str] = (), writeFigure=True, writeDataFrameCSV=False):
         """
         :param modelName: the name of the model for which to compute the aggregated feature importance values
         :param featureAggRegEx: a sequence of regular expressions describing which feature names to sum as one. Each regex must
@@ -677,6 +688,8 @@ def __init__(self, modelName: str, featureAggRegEx: Sequence[str] = ()):
         """
         self.modelName = modelName
         self.aggFeatureImportance = AggregatedFeatureImportance(featureAggRegEx=featureAggRegEx)
+        self.writeFigure = writeFigure
+        self.writeDataFrameCSV = writeDataFrameCSV
 
     def visit(self, modelName: str, result: ModelComparisonData.Result):
         if modelName == self.modelName:
@@ -698,8 +711,13 @@ def _collect(self, model: Union[FeatureImportanceProvider, VectorModelBase]):
     def plotFeatureImportance(self) -> plt.Figure:
         return plotFeatureImportance(self.aggFeatureImportance.getAggregatedFeatureImportanceDict(), subtitle=self.modelName)
 
-    def collectPlots(self, resultCollector: EvaluationResultCollector):
-        resultCollector.addFigure(f"{self.modelName}_feature-importance", self.plotFeatureImportance())
+    def collectResults(self, resultCollector: EvaluationResultCollector):
+        if self.writeFigure:
+            resultCollector.addFigure(f"{self.modelName}_feature-importance", self.plotFeatureImportance())
+        if self.writeDataFrameCSV:
+            namesAndImportance = self.aggFeatureImportance.getAggregatedFeatureImportance().getSortedTuples()
+            df = pd.DataFrame(namesAndImportance, columns=["feature", "importance"])
+            resultCollector.addDataFrameCsvFile(f"{self.modelName}_feature-importance", df)
 
 
 class MultiDataModelComparisonData(Generic[TEvalStats, TEvalStatsCollection], ABC):
diff --git a/src/sensai/evaluation/evaluator.py b/src/sensai/evaluation/evaluator.py
index 927795cf..6db0639f 100644
--- a/src/sensai/evaluation/evaluator.py
+++ b/src/sensai/evaluation/evaluator.py
@@ -1,7 +1,7 @@
 import functools
 import logging
 from abc import ABC, abstractmethod
-from typing import Tuple, Dict, Any, Generator, Generic, TypeVar, Sequence, Optional, List, Union, Callable, Iterator
+from typing import Tuple, Dict, Any, Generator, Generic, TypeVar, Sequence, Optional, List, Union, Callable
 
 import pandas as pd
 
@@ -9,8 +9,8 @@
 from .eval_stats.eval_stats_base import EvalStats, EvalStatsCollection
 from .eval_stats.eval_stats_classification import ClassificationEvalStats, ClassificationMetric
 from .eval_stats.eval_stats_regression import RegressionEvalStats, RegressionEvalStatsCollection, RegressionMetric
-from ..data_transformation import DataFrameTransformer
 from ..data import DataSplitter, DataSplitterFractional, InputOutputData
+from ..data_transformation import DataFrameTransformer
 from ..tracking import TrackingMixin, TrackedExperiment
 from ..util.string import ToStringMixin
 from ..util.typing import PandasNamedTuple
@@ -231,7 +231,7 @@ def fitModel(self, model: VectorModelFittableBase):
 
 class VectorRegressionModelEvaluatorParams(VectorModelEvaluatorParams):
     def __init__(self, dataSplitter: DataSplitter = None, fractionalSplitTestFraction: float = None, fractionalSplitRandomSeed=42,
-            fractionalSplitShuffle=True, additionalMetrics: Sequence[RegressionMetric] = None,
+            fractionalSplitShuffle=True, metrics: Sequence[RegressionMetric] = None, additionalMetrics: Sequence[RegressionMetric] = None,
             outputDataFrameTransformer: DataFrameTransformer = None):
         """
         :param dataSplitter: [if test data must be obtained via split] a splitter to use in order to obtain; if None, must specify
@@ -240,12 +240,14 @@ def __init__(self, dataSplitter: DataSplitter = None, fractionalSplitTestFractio
         :param fractionalSplitRandomSeed: [if dataSplitter is none, test data must be obtained via split] the random seed to use for the fractional split of the data
         :param fractionalSplitShuffle: [if dataSplitter is None, test data must be obtained via split] whether to randomly (based on randomSeed) shuffle the dataset before
             splitting it
+
         :param additionalMetrics: additional regression metrics to apply
         :param outputDataFrameTransformer: a data frame transformer to apply to all output data frames (both model outputs and ground truth),
             such that evaluation metrics are computed on the transformed data frame
         """
         super().__init__(dataSplitter, fractionalSplitTestFraction=fractionalSplitTestFraction, fractionalSplitRandomSeed=fractionalSplitRandomSeed,
             fractionalSplitShuffle=fractionalSplitShuffle)
+        self.metrics = metrics
         self.additionalMetrics = additionalMetrics
         self.outputDataFrameTransformer = outputDataFrameTransformer
 
@@ -298,6 +300,7 @@ def _evalModel(self, model: VectorModelBase, data: InputOutputData) -> VectorReg
         predictions, groundTruth = self._computeOutputs(model, data)
         for predictedVarName in predictions.columns:
             evalStats = RegressionEvalStats(y_predicted=predictions[predictedVarName], y_true=groundTruth[predictedVarName],
+                metrics=self.params.metrics,
                 additionalMetrics=self.params.additionalMetrics)
             evalStatsByVarName[predictedVarName] = evalStats
         return VectorRegressionModelEvaluationData(evalStatsByVarName, data.inputs, model)
diff --git a/src/sensai/torch/torch_base.py b/src/sensai/torch/torch_base.py
index 7aa37c99..b11d551f 100644
--- a/src/sensai/torch/torch_base.py
+++ b/src/sensai/torch/torch_base.py
@@ -521,7 +521,11 @@ def _predict(self, inputs: pd.DataFrame) -> pd.DataFrame:
         return pd.DataFrame(yArray, columns=self.getModelOutputVariableNames())
 
     def _toStringExcludes(self) -> List[str]:
-        return super()._toStringExcludes() + ["modelClass", "modelArgs", "modelKwArgs", "inputTensoriser"]
+        excludes = super()._toStringExcludes()
+        if self.model is not None:
+            return excludes + ["modelClass", "modelArgs", "modelKwArgs"]
+        else:
+            return excludes
 
 
 class TorchVectorClassificationModel(VectorClassificationModel):
@@ -671,7 +675,11 @@ def _predictClassProbabilities(self, inputs: pd.DataFrame) -> pd.DataFrame:
         return pd.DataFrame(y.numpy(), columns=self._labels)
 
     def _toStringExcludes(self) -> List[str]:
-        return super()._toStringExcludes() + ["modelClass", "modelArgs", "modelKwArgs", "inputTensoriser"]
+        excludes = super()._toStringExcludes()
+        if self.model is not None:
+            return excludes + ["modelClass", "modelArgs", "modelKwArgs"]
+        else:
+            return excludes
 
 
 class TorchDataSetProviderFactory(ABC):
diff --git a/src/sensai/vector_model.py b/src/sensai/vector_model.py
index d35b1aff..f26bd60e 100644
--- a/src/sensai/vector_model.py
+++ b/src/sensai/vector_model.py
@@ -343,7 +343,7 @@ def fit(self, X: pd.DataFrame, Y: Optional[pd.DataFrame], fitPreprocessors=True,
                 self._modelInputVariableNames = list(X.columns)
                 if fitModel:
                     inputsWithTypes = ', '.join([n + '/' + X[n].dtype.name for n in self._modelInputVariableNames])
-                    log.info(f"Fitting with outputs[{len(Y.columns)}]={list(Y.columns)}, "
+                    log.debug(f"Fitting with outputs[{len(Y.columns)}]={list(Y.columns)}, "
                              f"inputs[{len(self._modelInputVariableNames)}]=[{inputsWithTypes}]; N={len(X)} data points")
                     self._fit(X, Y)
                     self._isFitted = True

From 8143dbf153a2c835481894b9e718796797ab03f6 Mon Sep 17 00:00:00 2001
From: Dominik Jain <dominik.jain@jambit.com>
Date: Thu, 30 Jun 2022 19:22:52 +0200
Subject: [PATCH 128/131] ToStringMixin._ToStringMixinProxy: Fixed issue where
 the transitive conversion of a ToStringMixin would ignore method overrides in
 subclasses

---
 src/sensai/util/string.py      |  2 +-
 tests/base/test_util_string.py | 24 ++++++++++++++++++++++++
 2 files changed, 25 insertions(+), 1 deletion(-)
 create mode 100644 tests/base/test_util_string.py

diff --git a/src/sensai/util/string.py b/src/sensai/util/string.py
index 99748b43..cc433f38 100644
--- a/src/sensai/util/string.py
+++ b/src/sensai/util/string.py
@@ -361,7 +361,7 @@ def _toStringClassName(self):
 
             def __getattr__(self, attr: str):
                 if attr.startswith("_toString"):  # ToStringMixin method which we bind to use this proxy
-                    method = getattr(ToStringMixin, attr)
+                    method = getattr(self.x.__class__, attr)
                     return lambda *args, **kwargs: method(self, *args, **kwargs)
                 else:
                     return getattr(self.x, attr)
diff --git a/tests/base/test_util_string.py b/tests/base/test_util_string.py
new file mode 100644
index 00000000..56e22f50
--- /dev/null
+++ b/tests/base/test_util_string.py
@@ -0,0 +1,24 @@
+from sensai.util.string import ToStringMixin
+
+
+class A(ToStringMixin):
+    def __init__(self, p1):
+        self.p1 = p1
+        self.p2 = 2
+        self.p3 = self
+        self.p5 = ["foo", self]
+
+    def _toStringExcludes(self):
+        return ["p2"]
+
+
+class B(ToStringMixin):
+    def __init__(self, a):
+        self.a = a
+
+
+def test_ToStringMixin_recursion():
+    s = str(A("foo"))
+    assert s == "A[p1=foo, p3=A[<<], p5=[foo, A[<<]]]"
+    s = str(B(A("foo")))
+    assert s == "B[a=A[p1=foo, p3=A[<<], p5=[foo, A[<<]]]]"

From c30920c365ab8fc149969789b5a361dc15f3738e Mon Sep 17 00:00:00 2001
From: Dominik Jain <dominik.jain@jambit.com>
Date: Thu, 30 Jun 2022 19:30:15 +0200
Subject: [PATCH 129/131] Sync avancis

  commit 63ad5d3d65b613f71841dc83bdbcfbe5ea83dd71
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Thu Jun 30 17:40:21 2022 +0200

      Improved consistency of output file naming across EvalUtil and MultiDataEvalUtil

  sensai/evaluation/eval_util.py

  commit ce7e1de62b3db18f6dd05ba13477c91e43c10284
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Thu Jun 30 14:55:02 2022 +0200

      FeatureImportance: Moved functionality from the visitor to this class to improve reusability

  sensai/evaluation/eval_util.py
  sensai/feature_importance.py

  commit 5af8fd21d3999f643d797b18e3779ae0279a11ab
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Thu Jun 30 14:24:01 2022 +0200

      Added permutation feature importance computation, included aggregations thereof via AggregatedPermutationFeatureImportance

  sensai/feature_importance.py

  commit 5a5410fa49f521abd3b55ad40fdb066cbda3df7e
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Thu Jun 30 14:14:05 2022 +0200

      VectorModelEvaluationData: Store full InputOutputData instead of just input data frame

  sensai/evaluation/evaluator.py

  commit 0e0a12bc4d6520975cc1825b7fbed4eeb0ac5fda
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Thu Jun 30 12:28:51 2022 +0200

      InputOutputData: added string repr

  sensai/data.py

  commit 4adc7448f48d290ef18517796d883aa1786f1321
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Thu Jun 30 11:34:25 2022 +0200

      EvaluationUtil.compareModels: Consider agg. columns when using sortColumn, allow to also include unsorted results

  sensai/evaluation/eval_util.py

  commit b4e83fc58b9b1409d1d1e938df3fe857d24a31d9
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Tue Jun 28 22:25:49 2022 +0200

      EvaluationUtil.compareModels: Use formatted model string repr. in results text file

  sensai/evaluation/eval_util.py

  commit 6d2f63afcf6fd642da674ed8d9b057f7c9b7b6fd
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Tue Jun 28 22:24:30 2022 +0200

      Improved string repr. of objects with uninstantiated underlying model(s)

  sensai/sklearn/sklearn_base.py

  commit 6f68bedf44425bab3e3ac5562d5281b5d3078b86
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Tue Jun 28 21:42:32 2022 +0200

      ModelComparisonVisitorAggregatedFeatureImportance: Fixed plotting for nested feature importance dict

  sensai/evaluation/eval_util.py

  commit 3d47010a7d9728a7e007f8c71ab562f04444357f
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Tue Jun 28 21:41:34 2022 +0200

      FeatureImportance.getSortedTuples: Added docstring, allow to reverse order

  sensai/feature_importance.py

  commit aaa447d1c1ef7ea035c728ebdc2799e11ef22266
  Author: Dominik Jain <dominik.jain@jambit.com>
  Date:   Tue Jun 28 21:39:14 2022 +0200

      Fixed feature importance retrieval for some models:
        * Fixed feature name retrieval for multiple one-dim. regression models
        * Fixed importance retrieval for linear models (using abs. coefficients)

  sensai/sklearn/sklearn_base.py
---
 src/sensai/data.py                 |   7 +-
 src/sensai/evaluation/eval_util.py |  39 +++++++---
 src/sensai/evaluation/evaluator.py |  14 ++--
 src/sensai/feature_importance.py   | 113 ++++++++++++++++++++++++++---
 src/sensai/sklearn/sklearn_base.py |  24 ++++--
 5 files changed, 161 insertions(+), 36 deletions(-)

diff --git a/src/sensai/data.py b/src/sensai/data.py
index 263ba8bc..7f2d5091 100644
--- a/src/sensai/data.py
+++ b/src/sensai/data.py
@@ -7,6 +7,8 @@
 import scipy.stats
 from sklearn.model_selection import StratifiedShuffleSplit
 
+from sensai.util.string import ToStringMixin
+
 log = logging.getLogger(__name__)
 
 T = TypeVar("T")
@@ -50,13 +52,16 @@ def toTorchDataLoader(self, batchSize=64, shuffle=True):
         return DataLoader(dataSet, batch_size=batchSize, shuffle=shuffle)
 
 
-class InputOutputData(BaseInputOutputData[pd.DataFrame]):
+class InputOutputData(BaseInputOutputData[pd.DataFrame], ToStringMixin):
     """
     Holds input and output data for learning problems
     """
     def __init__(self, inputs: pd.DataFrame, outputs: pd.DataFrame):
         super().__init__(inputs, outputs)
 
+    def _toStringObjectInfo(self) -> str:
+        return f"N={len(self.inputs)}, numInputColumns={len(self.inputs.columns)}, numOutputColumns={len(self.outputs.columns)}"
+
     @classmethod
     def fromDataFrame(cls, df: pd.DataFrame, *outputColumns: str) -> "InputOutputData":
         """
diff --git a/src/sensai/evaluation/eval_util.py b/src/sensai/evaluation/eval_util.py
index ddcf2edc..e1c8f76e 100644
--- a/src/sensai/evaluation/eval_util.py
+++ b/src/sensai/evaluation/eval_util.py
@@ -30,10 +30,10 @@
     VectorRegressionModelEvaluationData, VectorClassificationModelEvaluator, VectorClassificationModelEvaluationData, \
     VectorRegressionModelEvaluatorParams, VectorClassificationModelEvaluatorParams, VectorModelEvaluatorParams
 from ..data import InputOutputData
-from ..feature_importance import AggregatedFeatureImportance, FeatureImportanceProvider, plotFeatureImportance
+from ..feature_importance import AggregatedFeatureImportance, FeatureImportanceProvider, plotFeatureImportance, FeatureImportance
 from ..tracking import TrackedExperiment
+from ..util.deprecation import deprecated
 from ..util.io import ResultWriter
-from ..util.plot import MATPLOTLIB_DEFAULT_FIGURE_SIZE
 from ..util.string import prettyStringRepr
 from ..vector_model import VectorClassificationModel, VectorRegressionModel, VectorModel, VectorModelBase
 
@@ -286,7 +286,7 @@ def gatherResults(evalResultData: VectorModelEvaluationData, resultWriter, subti
     def _resultWriterForModel(resultWriter: Optional[ResultWriter], model: TModel) -> Optional[ResultWriter]:
         if resultWriter is None:
             return None
-        return resultWriter.childWithAddedPrefix(model.getName() + "-")
+        return resultWriter.childWithAddedPrefix(model.getName() + "_")
 
     def performCrossValidation(self, model: TModel, showPlots=False, logResults=True, resultWriter: Optional[ResultWriter] = None,
             trackedExperiment: TrackedExperiment = None) -> TCrossValData:
@@ -319,6 +319,7 @@ def performCrossValidation(self, model: TModel, showPlots=False, logResults=True
 
     def compareModels(self, models: Sequence[TModel], resultWriter: Optional[ResultWriter] = None, useCrossValidation=False,
             fitModels=True, writeIndividualResults=True, sortColumn: Optional[str] = None, sortAscending: bool = True,
+            alsoIncludeUnsortedResults: bool = False,
             visitors: Optional[Iterable["ModelComparisonVisitor"]] = None,
             writeVisitorResults=False) -> "ModelComparisonData":
         """
@@ -333,6 +334,8 @@ def compareModels(self, models: Sequence[TModel], resultWriter: Optional[ResultW
             summary)
         :param sortColumn: column/metric name by which to sort
         :param sortAscending: whether to sort in ascending order
+        :param alsoIncludeUnsortedResults: whether to also include, for the case where the results are sorted, the unsorted table of
+            results in the results text
         :param visitors: visitors which may process individual results
         :param writeVisitorResults: whether to collect results from visitors (if any) after the comparison
         :return: the comparison results
@@ -363,16 +366,24 @@ def compareModels(self, models: Sequence[TModel], resultWriter: Optional[ResultW
                 for visitor in visitors:
                     visitor.visit(modelName, modelResult)
         resultsDF = pd.DataFrame(statsList).set_index("modelName")
+        unsortedResultsDF = resultsDF
         if sortColumn is not None:
             if sortColumn not in resultsDF.columns:
-                log.warning(f"Requested sort column '{sortColumn}' not in list of columns {list(resultsDF.columns)}")
-            else:
-                resultsDF.sort_values(sortColumn, ascending=sortAscending, inplace=True)
+                altSortColumn = f"mean[{sortColumn}]"
+                if altSortColumn in resultsDF.columns:
+                    sortColumn = altSortColumn
+                else:
+                    log.warning(f"Requested sort column '{sortColumn}' (or '{altSortColumn}') not in list of columns {list(resultsDF.columns)}")
+                    sortColumn = None  # reset only after logging, so that the warning names the column that was actually requested
+            if sortColumn is not None:
+                resultsDF = resultsDF.sort_values(sortColumn, ascending=sortAscending, inplace=False)
         strResults = f"Model comparison results:\n{resultsDF.to_string()}"
+        if alsoIncludeUnsortedResults and sortColumn is not None:
+            strResults += f"\n\nModel comparison results (unsorted):\n{unsortedResultsDF.to_string()}"
         log.info(strResults)
         if resultWriter is not None:
             suffix = "crossval" if useCrossValidation else "simple-eval"
-            strResults += "\n\n" + "\n\n".join([f"{model.getName()} = {str(model)}" for model in models])
+            strResults += "\n\n" + "\n\n".join([f"{model.getName()} = {model.pprints()}" for model in models])
             resultWriter.writeTextFile(f"model-comparison-results-{suffix}", strResults)
         if visitors is not None and writeVisitorResults:
             resultCollector = EvaluationResultCollector(showPlots=False, resultWriter=resultWriter)
@@ -708,16 +719,20 @@ def _collect(self, model: Union[FeatureImportanceProvider, VectorModelBase]):
             raise ValueError(f"Got model which does inherit from {FeatureImportanceProvider.__qualname__}: {model}")
         self.aggFeatureImportance.add(model.getFeatureImportanceDict())
 
+    @deprecated("Use getFeatureImportance and create the plot using the returned object")
     def plotFeatureImportance(self) -> plt.Figure:
-        return plotFeatureImportance(self.aggFeatureImportance.getAggregatedFeatureImportanceDict(), subtitle=self.modelName)
+        featureImportanceDict = self.aggFeatureImportance.getAggregatedFeatureImportance().getFeatureImportanceDict()
+        return plotFeatureImportance(featureImportanceDict, subtitle=self.modelName)
+
+    def getFeatureImportance(self) -> FeatureImportance:
+        return self.aggFeatureImportance.getAggregatedFeatureImportance()
 
     def collectResults(self, resultCollector: EvaluationResultCollector):
+        featureImportance = self.getFeatureImportance()
         if self.writeFigure:
-            resultCollector.addFigure(f"{self.modelName}_feature-importance", self.plotFeatureImportance())
+            resultCollector.addFigure(f"{self.modelName}_feature-importance", featureImportance.plot())
         if self.writeDataFrameCSV:
-            namesAndImportance = self.aggFeatureImportance.getAggregatedFeatureImportance().getSortedTuples()
-            df = pd.DataFrame(namesAndImportance, columns=["feature", "importance"])
-            resultCollector.addDataFrameCsvFile(f"{self.modelName}_feature-importance", df)
+            resultCollector.addDataFrameCsvFile(f"{self.modelName}_feature-importance", featureImportance.getDataFrame())
 
 
 class MultiDataModelComparisonData(Generic[TEvalStats, TEvalStatsCollection], ABC):
diff --git a/src/sensai/evaluation/evaluator.py b/src/sensai/evaluation/evaluator.py
index 6db0639f..2760c87e 100644
--- a/src/sensai/evaluation/evaluator.py
+++ b/src/sensai/evaluation/evaluator.py
@@ -60,13 +60,13 @@ def _computeMetrics(self, model, **kwargs) -> Dict[str, float]:
 
 
 class VectorModelEvaluationData(ABC, Generic[TEvalStats]):
-    def __init__(self, statsDict: Dict[str, TEvalStats], inputData: pd.DataFrame, model: VectorModelBase):
+    def __init__(self, statsDict: Dict[str, TEvalStats], ioData: InputOutputData, model: VectorModelBase):
         """
         :param statsDict: a dictionary mapping from output variable name to the evaluation statistics object
-        :param inputData: the input data that was used to produce the results
+        :param ioData: the input/output data that was used to produce the results
         :param model: the model that was used to produce predictions
         """
-        self.inputData = inputData
+        self.ioData = ioData
         self.evalStatsByVarName = statsDict
         self.predictedVarNames = list(self.evalStatsByVarName.keys())
         self.model = model
@@ -75,6 +75,10 @@ def __init__(self, statsDict: Dict[str, TEvalStats], inputData: pd.DataFrame, mo
     def modelName(self):
         return self.model.getName()
 
+    @property
+    def inputData(self):  # for backward compatibility
+        return self.ioData.inputs
+
     def getEvalStats(self, predictedVarName=None) -> TEvalStats:
         if predictedVarName is None:
             if len(self.evalStatsByVarName) != 1:
@@ -303,7 +307,7 @@ def _evalModel(self, model: VectorModelBase, data: InputOutputData) -> VectorReg
                 metrics=self.params.metrics,
                 additionalMetrics=self.params.additionalMetrics)
             evalStatsByVarName[predictedVarName] = evalStats
-        return VectorRegressionModelEvaluationData(evalStatsByVarName, data.inputs, model)
+        return VectorRegressionModelEvaluationData(evalStatsByVarName, data, model)
 
     def computeTestDataOutputs(self, model: VectorModelBase) -> Tuple[pd.DataFrame, pd.DataFrame]:
         """
@@ -414,7 +418,7 @@ def _evalModel(self, model: VectorClassificationModel, data: InputOutputData) ->
         evalStats = ClassificationEvalStats(y_predictedClassProbabilities=predictions_proba, y_predicted=predictions, y_true=groundTruth,
             labels=model.getClassLabels(), additionalMetrics=self.params.additionalMetrics, binaryPositiveLabel=self.params.binaryPositiveLabel)
         predictedVarName = model.getPredictedVariableNames()[0]
-        return VectorClassificationModelEvaluationData({predictedVarName: evalStats}, data.inputs, model)
+        return VectorClassificationModelEvaluationData({predictedVarName: evalStats}, data, model)
 
     def computeTestDataOutputs(self, model) -> Tuple[pd.DataFrame, pd.DataFrame, pd.DataFrame]:
         """
diff --git a/src/sensai/feature_importance.py b/src/sensai/feature_importance.py
index bc12c289..4f277de6 100644
--- a/src/sensai/feature_importance.py
+++ b/src/sensai/feature_importance.py
@@ -1,13 +1,24 @@
 import collections
+import copy
+import logging
 import re
 from abc import ABC, abstractmethod
 from typing import Dict, Union, Sequence, List, Tuple
 
+import numpy as np
+import pandas as pd
 import seaborn as sns
 from matplotlib import pyplot as plt
+from sklearn.inspection import permutation_importance
 
+from .data import InputOutputData
+from .evaluation.crossval import VectorModelCrossValidationData
 from .util.deprecation import deprecated
 from .util.plot import MATPLOTLIB_DEFAULT_FIGURE_SIZE
+from .util.string import ToStringMixin
+from .vector_model import VectorModel
+
+log = logging.getLogger(__name__)
 
 
 class FeatureImportance:
@@ -32,12 +43,29 @@ def getFeatureImportanceDict(self, predictedVarName=None) -> Dict[str, float]:
         else:
             return self.featureImportanceDict
 
-    def getSortedTuples(self, predictedVarName=None) -> List[Tuple[str, float]]:
+    def getSortedTuples(self, predictedVarName=None, reverse=False) -> List[Tuple[str, float]]:
+        """
+        :param predictedVarName: the predicted variable name for which to retrieve the sorted feature importance values
+        :param reverse: whether to reverse the order (i.e. descending order of importance values, where the most important feature comes first,
+            rather than ascending order)
+        :return: a sorted list of tuples (feature name, feature importance)
+        """
         # noinspection PyTypeChecker
         tuples: List[Tuple[str, float]] = list(self.getFeatureImportanceDict(predictedVarName).items())
-        tuples.sort(key=lambda t: t[1])
+        tuples.sort(key=lambda t: t[1], reverse=reverse)
         return tuples
 
+    def plot(self, predictedVarName=None) -> plt.Figure:
+        return plotFeatureImportance(self.getFeatureImportanceDict(predictedVarName=predictedVarName))
+
+    def getDataFrame(self, predictedVarName=None) -> pd.DataFrame:
+        """
+        :param predictedVarName: the predicted variable name
+        :return: a data frame with two columns, "feature" and "importance"
+        """
+        namesAndImportance = self.getSortedTuples(predictedVarName=predictedVarName, reverse=True)
+        return pd.DataFrame(namesAndImportance, columns=["feature", "importance"])
+
 
 class FeatureImportanceProvider(ABC):
     """
@@ -81,7 +109,7 @@ class AggregatedFeatureImportance:
     models and compatible models from lightgbm, etc.)
     """
     def __init__(self, *items: Union[FeatureImportanceProvider, Dict[str, float], Dict[str, Dict[str, float]]],
-            featureAggRegEx: Sequence[str] = ()):
+            featureAggRegEx: Sequence[str] = (), aggFn=np.mean):
         r"""
         :param items: (optional) initial list of feature importance providers or dictionaries to aggregate; further
             values can be added via method add
@@ -90,10 +118,11 @@ def __init__(self, *items: Union[FeatureImportanceProvider, Dict[str, float], Di
             of the matched group instead of the full feature name. For example, the regex r"(\w+)_\d+$" will cause "foo_1" and "foo_2"
             to be summed under "foo" and similarly "bar_1" and "bar_2" to be summed under "bar".
         """
-        self.aggDict = None
+        self._aggDict = None
         self._isNested = None
         self._numDictsAdded = 0
         self._featureAggRegEx = [re.compile(p) for p in featureAggRegEx]
+        self._aggFn = aggFn
         for item in items:
             self.add(item)
 
@@ -112,17 +141,17 @@ def add(self, featureImportance: Union[FeatureImportanceProvider, Dict[str, floa
         if self._isNested is None:
             self._isNested = self._isDict(next(iter(featureImportance.values())))
         if self._isNested:
-            if self.aggDict is None:
-                self.aggDict = collections.defaultdict(lambda: collections.defaultdict(lambda: 0))
+            if self._aggDict is None:
+                self._aggDict = collections.defaultdict(lambda: collections.defaultdict(list))
             for targetName, d in featureImportance.items():
                 d: dict
                 for featureName, value in d.items():
-                    self.aggDict[targetName][self._aggFeatureName(featureName)] += value
+                    self._aggDict[targetName][self._aggFeatureName(featureName)].append(value)
         else:
-            if self.aggDict is None:
-                self.aggDict = collections.defaultdict(lambda: 0)
+            if self._aggDict is None:
+                self._aggDict = collections.defaultdict(list)
             for featureName, value in featureImportance.items():
-                self.aggDict[self._aggFeatureName(featureName)] += value
+                self._aggDict[self._aggFeatureName(featureName)].append(value)
         self._numDictsAdded += 1
 
     def _aggFeatureName(self, featureName: str):
@@ -133,7 +162,67 @@ def _aggFeatureName(self, featureName: str):
         return featureName
 
     def getAggregatedFeatureImportanceDict(self) -> Union[Dict[str, float], Dict[str, Dict[str, float]]]:
-        return self.aggDict
+        def aggregate(d: dict):
+            return {k: self._aggFn(l) for k, l in d.items()}
+
+        if self._isNested:
+            return {k: aggregate(d) for k, d in self._aggDict.items()}  # iterate (target name, feature dict) pairs, not just keys
+        else:
+            return aggregate(self._aggDict)
 
     def getAggregatedFeatureImportance(self) -> FeatureImportance:
-        return FeatureImportance(self.aggDict)
+        return FeatureImportance(self.getAggregatedFeatureImportanceDict())
+
+
+def computePermutationFeatureImportanceDict(model, ioData: InputOutputData, scoring, numRepeats: int, randomState,
+        excludeInputPreprocessors=False):
+    if excludeInputPreprocessors:
+        inputs = model.computeModelInputs(ioData.inputs)
+        model = copy.copy(model)
+        model.removeInputPreprocessors()
+    else:
+        inputs = ioData.inputs
+    featureNames = inputs.columns
+    pi = permutation_importance(model, inputs, ioData.outputs, n_repeats=numRepeats, random_state=randomState, scoring=scoring)
+    importanceValues = pi.importances_mean
+    assert len(importanceValues) == len(featureNames)
+    featureImportanceDict = dict(zip(featureNames, importanceValues))
+    return featureImportanceDict
+
+
+class AggregatedPermutationFeatureImportance(ToStringMixin):
+    def __init__(self, aggregatedFeatureImportance: AggregatedFeatureImportance, scoring, numRepeats=5, randomSeed=42,
+            excludeModelInputPreprocessors=False):
+        """
+        :param aggregatedFeatureImportance: the object in which to aggregate the feature importance (to which no feature importance
+            values should have yet been added)
+        :param scoring: the scoring method; see https://scikit-learn.org/stable/modules/model_evaluation.html; e.g. "r2" for regression or
+            "accuracy" for classification
+        :param numRepeats: the number of data permutations to apply for each model
+        :param randomSeed: the random seed for shuffling the data
+        :param excludeModelInputPreprocessors: whether to exclude model input preprocessors, such that the
+            feature importance will be reported on the transformed inputs that are actually fed to the model rather than the original
+            inputs.
+            Enabling this can, for example, help save time in cases where the input preprocessors discard many of the raw input
+            columns, but it may not be a good idea if the preprocessors generate multiple columns from the original input columns.
+        """
+        self._agg = aggregatedFeatureImportance
+        self.scoring = scoring
+        self.numRepeats = numRepeats
+        self.randomSeed = randomSeed
+        self.excludeModelInputPreprocessors = excludeModelInputPreprocessors
+
+    def add(self, model: VectorModel, ioData: InputOutputData):
+        featureImportanceDict = computePermutationFeatureImportanceDict(model, ioData, self.scoring, numRepeats=self.numRepeats,
+            randomState=self.randomSeed, excludeInputPreprocessors=self.excludeModelInputPreprocessors)
+        self._agg.add(featureImportanceDict)
+
+    def addCrossValidationData(self, crossValData: VectorModelCrossValidationData):
+        if crossValData.trainedModels is None:
+            raise ValueError("No models in cross-validation data; enable model collection during cross-validation")
+        for i, (model, evalData) in enumerate(zip(crossValData.trainedModels, crossValData.evalDataList), start=1):
+            log.info(f"Computing permutation feature importance for model #{i}/{len(crossValData.trainedModels)}")
+            self.add(model, evalData.ioData)
+
+    def getFeatureImportance(self) -> FeatureImportance:
+        return self._agg.getAggregatedFeatureImportance()
diff --git a/src/sensai/sklearn/sklearn_base.py b/src/sensai/sklearn/sklearn_base.py
index c719fff0..d6c2e21c 100644
--- a/src/sensai/sklearn/sklearn_base.py
+++ b/src/sensai/sklearn/sklearn_base.py
@@ -10,6 +10,7 @@
 
 from ..feature_importance import FeatureImportanceProvider
 from ..util.pickle import setstate
+from ..util.string import dictString
 from ..vector_model import VectorRegressionModel, VectorClassificationModel
 
 log = logging.getLogger(__name__)
@@ -142,7 +143,7 @@ def _toStringAdditionalEntries(self) -> Dict[str, Any]:
         if len(self.models) > 0:
             d["model[0]"] = strSkLearnModel(next(iter(self.models.values())))
         else:
-            d["modelConstructor"] = f"{self.modelConstructor.__name__}{self.modelArgs}"
+            d["modelConstructor"] = f"{self.modelConstructor.__name__}({dictString(self.modelArgs)})"
         return d
 
     def _fitSkLearn(self, inputs: pd.DataFrame, outputs: pd.DataFrame):
@@ -177,7 +178,7 @@ def _toStringAdditionalEntries(self) -> Dict[str, Any]:
         if self.model is not None:
             d["model"] = strSkLearnModel(self.model)
         else:
-            d["modelConstructor"] = f"{self.modelConstructor.__name__}{self.modelArgs}"
+            d["modelConstructor"] = f"{self.modelConstructor.__name__}({dictString(self.modelArgs)})"
         return d
 
     def _fitSkLearn(self, inputs: pd.DataFrame, outputs: pd.DataFrame):
@@ -221,7 +222,7 @@ def _toStringExcludes(self) -> List[str]:
     def _toStringAdditionalEntries(self) -> Dict[str, Any]:
         d = super()._toStringAdditionalEntries()
         if self.model is None:
-            d["modelConstructor"] = f"{self.modelConstructor.__name__}{self.modelArgs}"
+            d["modelConstructor"] = f"{self.modelConstructor.__name__}({dictString(self.modelArgs)})"
         else:
             d["model"] = strSkLearnModel(self.model)
         return d
@@ -307,19 +308,30 @@ def _computeClassWeights(self, outputs: pd.DataFrame):
         return weights.to_dict()
 
 
+def _getModelFeatureImportanceVector(model):
+    candAttributes = ("feature_importances_", "coef_")
+    for attr in candAttributes:
+        if hasattr(model, attr):
+            importanceValues = getattr(model, attr)
+            if attr == "coef_":
+                importanceValues = np.abs(importanceValues)  # for coefficients in linear models, use the absolute values
+            return importanceValues
+    raise ValueError(f"Model {model} has none of the attributes {candAttributes}")
+
+
 class FeatureImportanceProviderSkLearnRegressionMultipleOneDim(FeatureImportanceProvider):
     def getFeatureImportanceDict(self) -> Dict[str, Dict[str, int]]:
         self: AbstractSkLearnMultipleOneDimVectorRegressionModel
-        return {targetFeature: dict(zip(model.feature_name_, model.feature_importances_)) for targetFeature, model in self.models.items()}
+        return {targetFeature: dict(zip(self._modelInputVariableNames, _getModelFeatureImportanceVector(model))) for targetFeature, model in self.models.items()}
 
 
 class FeatureImportanceProviderSkLearnRegressionMultiDim(FeatureImportanceProvider):
     def getFeatureImportanceDict(self) -> Dict[str, float]:
         self: AbstractSkLearnMultiDimVectorRegressionModel
-        return dict(zip(self._modelInputVariableNames, self.model.feature_importances_))
+        return dict(zip(self._modelInputVariableNames, _getModelFeatureImportanceVector(self.model)))
 
 
 class FeatureImportanceProviderSkLearnClassification(FeatureImportanceProvider):
     def getFeatureImportanceDict(self) -> Dict[str, float]:
         self: AbstractSkLearnVectorClassificationModel
-        return dict(zip(self._modelInputVariableNames, self.model.feature_importances_))
+        return dict(zip(self._modelInputVariableNames, _getModelFeatureImportanceVector(self.model)))

From a957286fcc06b5cf51f72feef12d2526cf9d0af6 Mon Sep 17 00:00:00 2001
From: Mischa Panchenko <michael.panchenko@unternehmertum.de>
Date: Fri, 1 Jul 2022 16:34:10 +0200
Subject: [PATCH 130/131] Fixed version strings

---
 .bumpversion.cfg       | 2 +-
 setup.py               | 2 +-
 src/sensai/__init__.py | 2 +-
 3 files changed, 3 insertions(+), 3 deletions(-)

diff --git a/.bumpversion.cfg b/.bumpversion.cfg
index 52f7e3ee..d3455a05 100644
--- a/.bumpversion.cfg
+++ b/.bumpversion.cfg
@@ -1,5 +1,5 @@
 [bumpversion]
-current_version = 0.1.6
+current_version = 0.1.8.dev1
 commit = False
 tag = False
 allow_dirty = False
diff --git a/setup.py b/setup.py
index e6caad2e..2ab95349 100644
--- a/setup.py
+++ b/setup.py
@@ -73,7 +73,7 @@ def relaxed_requirements_from_file(path):
     url="https://github.com/jambit/sensAI",
     packages=find_namespace_packages(where="src"),
     include_package_data=True,
-    version='0.1.6',
+    version='0.1.8.dev1',
     description='Library for sensible AI',
     install_requires=relaxed_requirements_from_file("requirements.txt"),
     dependency_links=["https://download.pytorch.org/whl/torch_stable.html"],
diff --git a/src/sensai/__init__.py b/src/sensai/__init__.py
index 5f13e3b5..d9ded9ac 100644
--- a/src/sensai/__init__.py
+++ b/src/sensai/__init__.py
@@ -16,7 +16,7 @@
     TensorToTensorClassificationModel, TensorToScalarClassificationModel
 from .vector_model import VectorModelBase, VectorModel, VectorRegressionModel, VectorClassificationModel
 
-__version__ = "0.1.6"
+__version__ = "0.1.8.dev1"
 
 # The following submodules are not imported by default to avoid necessarily requiring their dependencies:
 # tensorflow

From c50a86bdbfa772571055a2d29a42acecc3d5e995 Mon Sep 17 00:00:00 2001
From: Mischa Panchenko <michael.panchenko@unternehmertum.de>
Date: Fri, 1 Jul 2022 16:34:25 +0200
Subject: [PATCH 131/131] =?UTF-8?q?Bump=20version:=200.1.8.dev1=20?=
 =?UTF-8?q?=E2=86=92=200.1.8?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

---
 .bumpversion.cfg       | 2 +-
 setup.py               | 2 +-
 src/sensai/__init__.py | 2 +-
 3 files changed, 3 insertions(+), 3 deletions(-)

diff --git a/.bumpversion.cfg b/.bumpversion.cfg
index d3455a05..35b29ab6 100644
--- a/.bumpversion.cfg
+++ b/.bumpversion.cfg
@@ -1,5 +1,5 @@
 [bumpversion]
-current_version = 0.1.8.dev1
+current_version = 0.1.8
 commit = False
 tag = False
 allow_dirty = False
diff --git a/setup.py b/setup.py
index 2ab95349..095c112a 100644
--- a/setup.py
+++ b/setup.py
@@ -73,7 +73,7 @@ def relaxed_requirements_from_file(path):
     url="https://github.com/jambit/sensAI",
     packages=find_namespace_packages(where="src"),
     include_package_data=True,
-    version='0.1.8.dev1',
+    version='0.1.8',
     description='Library for sensible AI',
     install_requires=relaxed_requirements_from_file("requirements.txt"),
     dependency_links=["https://download.pytorch.org/whl/torch_stable.html"],
diff --git a/src/sensai/__init__.py b/src/sensai/__init__.py
index d9ded9ac..3820c298 100644
--- a/src/sensai/__init__.py
+++ b/src/sensai/__init__.py
@@ -16,7 +16,7 @@
     TensorToTensorClassificationModel, TensorToScalarClassificationModel
 from .vector_model import VectorModelBase, VectorModel, VectorRegressionModel, VectorClassificationModel
 
-__version__ = "0.1.8.dev1"
+__version__ = "0.1.8"
 
 # The following submodules are not imported by default to avoid necessarily requiring their dependencies:
 # tensorflow