predict-idlab · jvdd · May 24, 2023 · May 24, 2023 · May 25, 2023 · May 25, 2023
diff --git a/poetry.lock b/poetry.lock
diff --git a/pyproject.toml b/pyproject.toml
@@ -45,6 +45,10 @@ pycatch22 = "^0.4.2"
 # antropy = "^0.1.5"
 antropy = { git = "https://github.com/raphaelvallat/antropy.git", branch = "master" }  # replace with pip when > 0.1.5 release available
 nolds = "^0.5.2"
+pyentrp = [
+    { version = "^0.7.1", python = "<3.8" },
+    { version = "^0.8.2", python = ">=3.8" }
+]
 # Linting
 ruff = "^0.0.264"
 black = "^22.12.0"

diff --git a/tests/test_features_feature_collection.py b/tests/test_features_feature_collection.py
@@ -1730,7 +1730,7 @@ def sum_mean(x, axis):
     s = "EDA__"
     p = "__w=1000"
     assert np.all(res[s + "sum" + p].values == res[s + "sum_vect" + p].values)
-    assert np.all(res[s + "mean" + p].values == res[s + "mean_vect" + p].values)
+    assert np.allclose(res[s + "mean" + p].values, res[s + "mean_vect" + p].values)
 
 
 def test_multiple_inputs_vectorized_features(dummy_data):
@@ -1759,6 +1759,137 @@ def windowed_diff(x1, x2):
     assert np.all(res["EDA|TMP__windowed_diff" + p].values == manual_diff)
 
 
+### Test parallel features
+
+
+def test_basic_parallel_features_different_fc(dummy_data):
+    fs = 4  # The sample frequency in Hz
+    fc1 = FeatureCollection(
+        feature_descriptors=[
+            FeatureDescriptor(np.max, "EDA", 250 * fs, 75 * fs),
+        ]
+    )
+    fc2 = FeatureCollection(
+        feature_descriptors=[
+            FeatureDescriptor(
+                FuncWrapper(np.max, output_names="max_", parallel=True),
+                "EDA",
+                250 * fs,
+                75 * fs,
+            ),
+        ]
+    )
+    res1 = fc1.calculate(dummy_data)
+    res2 = fc2.calculate(dummy_data)
+
+    assert len(res1) == 1
+    assert len(res2) == 1
+    res1 = res1[0]
+    res2 = res2[0]
+    assert (len(res1) > 1) and (len(res2) > 1)
+    assert np.all(res1.index == res2.index)
+    assert np.all(res1.values == res2.values)
+
+
+def test_basic_parallel_features_same_fc(dummy_data):
+    fs = 4  # The sample frequency in Hz
+    fc = FeatureCollection(
+        feature_descriptors=[
+            FeatureDescriptor(np.max, "EDA", 250 * fs, 75 * fs),
+            FeatureDescriptor(
+                FuncWrapper(np.max, output_names="max_", parallel=True),
+                "EDA",
+                250 * fs,
+                75 * fs,
+            ),
+        ]
+    )
+    res = fc.calculate(dummy_data)
+
+    assert len(res) == 2
+    assert (len(res[0]) > 1) and (len(res[1]) > 1)
+    assert np.all(res[0].index == res[1].index)
+    assert np.all(res[0].values == res[1].values)
+
+
+def test_time_based_parallel_features(dummy_data):
+    fc = FeatureCollection(
+        feature_descriptors=[
+            FeatureDescriptor(np.max, "EDA", "5min", "3min"),
+            FeatureDescriptor(
+                FuncWrapper(np.max, output_names="max_", parallel=True),
+                "EDA",
+                "5min",
+                "3min",
+            ),
+        ]
+    )
+    res = fc.calculate(dummy_data)
+
+    assert len(res) == 2
+    assert (len(res[0]) > 1) and (len(res[1]) > 1)
+    assert np.all(res[0].index == res[1].index)
+    assert np.all(res[0].values == res[1].values)
+
+
+def test_multiple_outputs_parallel_features(dummy_data):
+    def sum_mean(x):
+        s = np.sum(x)
+        return s, s / x.shape[0]
+
+    fs = 4  # The sample frequency in Hz
+    fc = FeatureCollection(
+        feature_descriptors=[
+            FeatureDescriptor(np.sum, "EDA", 250 * fs, 75 * fs),
+            FeatureDescriptor(np.mean, "EDA", 250 * fs, 75 * fs),
+            FeatureDescriptor(
+                FuncWrapper(
+                    sum_mean,
+                    output_names=["sum_par", "mean_par"],
+                    parallel=True,
+                ),
+                "EDA",
+                250 * fs,
+                75 * fs,
+            ),
+        ]
+    )
+
+    res = fc.calculate(dummy_data, return_df=True)
+
+    assert res.shape[1] == 4
+    s = "EDA__"
+    p = "__w=1000"
+    assert np.all(res[s + "sum" + p].values == res[s + "sum_par" + p].values)
+    assert np.allclose(res[s + "mean" + p].values, res[s + "mean_par" + p].values)
+
+
+def test_multiple_inputs_parallel_features(dummy_data):
+    def windowed_diff(x1, x2):
+        return np.sum(x1) - np.sum(x2)
+
+    fc = FeatureCollection(
+        feature_descriptors=[
+            FeatureDescriptor(np.sum, "EDA", "5min", "2.5min"),
+            FeatureDescriptor(np.sum, "TMP", "5min", "2.5min"),
+            FeatureDescriptor(
+                FuncWrapper(windowed_diff, parallel=True),
+                ("EDA", "TMP"),
+                "5min",
+                "2.5min",
+            ),
+        ]
+    )
+
+    res = fc.calculate(dummy_data, return_df=True)
+
+    assert res.shape[1] == 3
+    assert res.shape[0] > 1
+    p = "__w=5m"
+    manual_diff = res["EDA__sum" + p].values - res["TMP__sum" + p].values
+    assert np.all(res["EDA|TMP__windowed_diff" + p].values == manual_diff)
+
+
 ### Test feature extraction length
 
 

diff --git a/tsflex/features/feature_collection.py b/tsflex/features/feature_collection.py
@@ -104,6 +104,31 @@ def get_required_series(self) -> List[str]:
             set(flatten([fr_key[0] for fr_key in self._feature_desc_dict.keys()]))
         )
 
+    def _get_feature_desc_dict(
+        self, parallel: bool
+    ) -> Dict[
+        Tuple[Tuple[str, ...], Union[float, pd.Timedelta]], List[FeatureDescriptor]
+    ]:
+        """Return the feature descriptor dictionary.
+
+        Parameters
+        ----------
+        parallel : bool
+            Whether to return the feature descriptors for the parallel functions or not.
+
+        Returns
+        -------
+        Dict[Tuple[Tuple[str, ...], Union[float, pd.Timedelta]], List[FeatureDescriptor]]
+            The feature descriptor dictionary.
+
+        """
+        res = {}
+        for k, fd_list in self._feature_desc_dict.items():
+            fd_list = [fd for fd in fd_list if fd.function.parallel == parallel]
+            if fd_list:
+                res[k] = fd_list
+        return res
+
     def get_nb_output_features(self) -> int:
         """Return the number of output features in this feature collection.
 
@@ -260,11 +285,23 @@ def add(
         self._check_feature_descriptors(skip_none=True)
 
     @staticmethod
-    def _executor(idx: int):
-        # global get_stroll_func
-        stroll, function = get_stroll_func(idx)
+    def _non_parallel_func_executor(idx: int):
+        """Execute functions that are not parallelized (over the strided window).
+
+        This executor can be called in a multiprocessing context.
+        """
+        stroll, function = get_stroll_non_parallel_func(idx)
         return stroll.apply_func(function)
 
+    @staticmethod
+    def _parallel_func_executor(idx: int, n_jobs: int):
+        """Execute functions that are parallelized (over the strided window).
+
+        This executor canNOT be called in a multiprocessing context.
+        """
+        stroll, function = get_stroll_parallel_func(idx)
+        return stroll.apply_func(function, n_jobs)
+
     # def _get_stroll(self, kwargs):
     #     return StridedRollingFactory.get_segmenter(**kwargs)
 
@@ -279,20 +316,21 @@ def _stroll_feat_generator(
         window_idx: str,
         include_final_window: bool,
         approve_sparsity: bool,
+        parallel: bool,
     ) -> Callable[[int], Tuple[StridedRolling, FuncWrapper]]:
         # --- Future work ---
         # We could also make the StridedRolling creation multithreaded
         # Very low priority because the STROLL __init__ is rather efficient!
-        keys_wins_strides = list(self._feature_desc_dict.keys())
-        lengths = np.cumsum(
-            [len(self._feature_desc_dict[k]) for k in keys_wins_strides]
-        )
+        feature_desc_dict = self._get_feature_desc_dict(parallel)
+
+        keys_wins_strides = list(feature_desc_dict)
+        lengths = np.cumsum([len(feature_desc_dict[k]) for k in keys_wins_strides])
 
         def get_stroll_function(idx) -> Tuple[StridedRolling, FuncWrapper]:
             key_idx = np.searchsorted(lengths, idx, "right")  # right bc idx starts at 0
             key, win = keys_wins_strides[key_idx]
 
-            feature = self._feature_desc_dict[keys_wins_strides[key_idx]][
+            feature = feature_desc_dict[keys_wins_strides[key_idx]][
                 idx - lengths[key_idx]
             ]
             stride = feature.stride if calc_stride is None else calc_stride
@@ -316,10 +354,9 @@ def get_stroll_function(idx) -> Tuple[StridedRolling, FuncWrapper]:
 
         return get_stroll_function
 
-    def _get_stroll_feat_length(self) -> int:
-        return sum(
-            len(self._feature_desc_dict[k]) for k in self._feature_desc_dict.keys()
-        )
+    def _get_stroll_feat_length(self, parallel: bool) -> int:
+        feat_desc_dict = self._get_feature_desc_dict(parallel)
+        return sum(len(feat_desc_dict[k]) for k in feat_desc_dict.keys())
 
     def _check_no_multiple_windows(self):
         assert (
@@ -599,11 +636,18 @@ def calculate(
             for n, s, in series_dict.items()
         }
 
+        if (
+            os.name == "nt"
+        ):  # On Windows no multiprocessing is supported, see https://github.com/predict-idlab/tsflex/issues/51
+            n_jobs = 1
+        elif n_jobs is None:
+            n_jobs = os.cpu_count()
+
         # Note: this variable has a global scope so this is shared in multiprocessing
         # TODO: try to make this more efficient (but is not really the bottleneck)
-        global get_stroll_func
-        get_stroll_func = self._stroll_feat_generator(
-            series_dict,
+        global get_stroll_non_parallel_func  # is not applied in parallel on the stroll
+        global get_stroll_parallel_func  # is applied in parallel on the stroll
+        kwargs = dict(
             calc_stride=stride,
             segment_start_idxs=segment_start_idxs,
             segment_end_idxs=segment_end_idxs,
@@ -613,30 +657,42 @@ def calculate(
             include_final_window=include_final_window,
             approve_sparsity=approve_sparsity,
         )
-        nb_stroll_funcs = self._get_stroll_feat_length()
-
-        if (
-            os.name == "nt"
-        ):  # On Windows no multiprocessing is supported, see https://github.com/predict-idlab/tsflex/issues/51
-            n_jobs = 1
-        elif n_jobs is None:
-            n_jobs = os.cpu_count()
-        n_jobs = min(n_jobs, nb_stroll_funcs)
+        get_stroll_non_parallel_func = self._stroll_feat_generator(
+            series_dict,
+            **kwargs,
+            parallel=False,
+        )
+        nb_stroll_non_parallel_func = self._get_stroll_feat_length(parallel=False)
+        n_jobs_non_parallel_func = min(n_jobs, nb_stroll_non_parallel_func)
+        get_stroll_parallel_func = self._stroll_feat_generator(
+            series_dict,
+            **kwargs,
+            parallel=True,
+        )
+        nb_stroll_parallel_func = self._get_stroll_feat_length(parallel=True)
 
         calculated_feature_list = None
-        if n_jobs in [0, 1]:
-            idxs = range(nb_stroll_funcs)
+
+        # 1. Calculate the features for the non-parallel functions
+        # -> these functions are calculated (possibly in parallel) over the functions
+        if n_jobs_non_parallel_func in [0, 1]:
+            idxs = range(nb_stroll_non_parallel_func)
             if show_progress:
                 idxs = tqdm(idxs)
             try:
-                calculated_feature_list = [self._executor(idx) for idx in idxs]
+                # 1. Calculate the features for the non-parallel functions
+                calculated_feature_list = [
+                    self._non_parallel_func_executor(i) for i in idxs
+                ]
             except Exception:
                 traceback.print_exc()
         else:
-            with Pool(processes=n_jobs) as pool:
-                results = pool.imap_unordered(self._executor, range(nb_stroll_funcs))
+            with Pool(processes=n_jobs_non_parallel_func) as pool:
+                results = pool.imap_unordered(
+                    self._non_parallel_func_executor, range(nb_stroll_non_parallel_func)
+                )
                 if show_progress:
-                    results = tqdm(results, total=nb_stroll_funcs)
+                    results = tqdm(results, total=nb_stroll_non_parallel_func)
                 try:
                     calculated_feature_list = [f for f in results]
                 except Exception:
@@ -647,6 +703,21 @@ def calculate(
                     pool.close()
                     pool.join()
 
+        # 2. Calculate the features for the parallel functions
+        # -> these functions are calculated (possibly in parallel) within the functions
+        idxs = range(nb_stroll_parallel_func)
+        if show_progress:
+            idxs = tqdm(idxs)
+        try:
+            # We collect one by one the results of the parallel functions
+            # (because the parallelization is done within the function , i.e. over the
+            # strided windows)
+            calculated_feature_list += [
+                self._parallel_func_executor(i, n_jobs) for i in idxs
+            ]
+        except Exception:
+            traceback.print_exc()
+
         # Close the file handler (this avoids PermissionError: [WinError 32])
         if logging_file_path:
             f_handler.close()

diff --git a/tsflex/features/function_wrapper.py b/tsflex/features/function_wrapper.py
@@ -66,6 +66,7 @@ def __init__(
         output_names: Optional[Union[List[str], str]] = None,
         input_type: Optional[Union[np.array, pd.Series]] = np.array,
         vectorized: bool = False,
+        parallel: bool = False,
         **kwargs,
     ):
         """Create FuncWrapper instance."""
@@ -83,10 +84,14 @@ def __init__(
 
         assert input_type in SUPPORTED_STROLL_TYPES, "Invalid input_type!"
         assert not (
-            vectorized & (input_type is not np.array)
+            vectorized and (input_type is not np.array)
         ), "The input_type must be np.array if vectorized is True!"
+        assert not (
+            vectorized and parallel
+        ), "vectorized and parallel cannot be both True!"
         self.input_type = input_type
         self.vectorized = vectorized
+        self.parallel = parallel
 
         self._freeze()