From 2207e6c4b89a1ff68b7e24f0ed7b297680c042ca Mon Sep 17 00:00:00 2001
From: Pierre Marchand <pierre.jimthefrench@gmail.com>
Date: Wed, 7 Aug 2024 19:52:36 +0200
Subject: [PATCH] Update htool to 0.9.0

---
 CMakeLists.txt                                |   2 +-
 example/ddm_solver.py                         |  97 --------
 example/define_custom_generators.py           |  61 +----
 example/define_custom_local_operator.py       |  12 +-
 example/define_custom_low_rank_generator.py   |  13 +-
 ...lt_build.py => use_block_jacobi_solver.py} |  15 +-
 ...ock_jacobi_solver_with_no_default_build.py | 134 ----------
 example/use_cluster.py                        |   2 -
 example/use_cluster_with_given_partition.py   |   2 -
 example/use_custom_dense_block_generator.py   |   4 +-
 example/use_custom_local_operator.py          |  20 +-
 example/use_custom_low_rank_approximation.py  |  35 +--
 ...lt_build.py => use_hmatrix_compression.py} |   9 +-
 ...ld.py => use_local_hmatrix_compression.py} |  28 +--
 example/use_no_default_build.py               | 128 ----------
 lib/hpddm                                     |   2 +-
 lib/htool                                     |   2 +-
 pyproject.toml                                |   2 +-
 src/htool/clustering/cluster_node.hpp         |  15 --
 .../distributed_operator.hpp                  |  39 ++-
 .../implementation/partition_from_cluster.hpp |  16 --
 .../interface/partition.hpp                   |  32 ---
 src/htool/distributed_operator/utility.hpp    |  32 ++-
 src/htool/hmatrix/hmatrix.hpp                 | 122 ++-------
 src/htool/hmatrix/hmatrix_builder.hpp         |   6 +-
 .../hmatrix/interfaces/virtual_generator.hpp  |  61 +----
 .../interfaces/virtual_low_rank_generator.hpp |  45 ++--
 src/htool/local_operator/local_operator.hpp   |   8 +-
 src/htool/main.cpp                            |  21 +-
 src/htool/misc/utility.hpp                    |   2 +-
 .../solver/geneo/coarse_space_builder.hpp     |  35 ++-
 .../geneo/coarse_space_dense_builder.hpp      | 133 ++++++++++
 src/htool/solver/solver.hpp                   |  19 +-
 src/htool/solver/utility.hpp                  |  51 +---
 tests/conftest.py                             |  59 ++---
 tests/test_cluster.py                         |   9 +-
 tests/test_ddm_solver.py                      | 232 ++++++++----------
 37 files changed, 455 insertions(+), 1050 deletions(-)
 delete mode 100644 example/ddm_solver.py
 rename example/{use_block_jacobi_solver_with_default_build.py => use_block_jacobi_solver.py} (89%)
 delete mode 100644 example/use_block_jacobi_solver_with_no_default_build.py
 rename example/{use_default_build.py => use_hmatrix_compression.py} (94%)
 rename example/{use_local_build.py => use_local_hmatrix_compression.py} (91%)
 delete mode 100644 example/use_no_default_build.py
 delete mode 100644 src/htool/distributed_operator/implementation/partition_from_cluster.hpp
 delete mode 100644 src/htool/distributed_operator/interface/partition.hpp
 create mode 100644 src/htool/solver/geneo/coarse_space_dense_builder.hpp

diff --git a/CMakeLists.txt b/CMakeLists.txt
index e41773d..e8419d0 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -87,7 +87,7 @@ if("${BLA_VENDOR}" STREQUAL "Intel10_32"
     target_compile_definitions(htool PRIVATE "-DHPDDM_MKL -DHTOOL_MKL")
 endif()
 
-target_compile_definitions(Htool PRIVATE "-DPYTHON_INTERFACE" "-DWITH_HPDDM")
+target_compile_definitions(Htool PRIVATE "-DHTOOL_WITH_PYTHON_INTERFACE" "-DHTOOL_WITH_HPDDM")
 
 if(CODE_COVERAGE AND (CMAKE_C_COMPILER_ID MATCHES "GNU" OR CMAKE_CXX_COMPILER_ID MATCHES "GNU"))
     target_compile_options(Htool PRIVATE -fprofile-arcs -ftest-coverage)
diff --git a/example/ddm_solver.py b/example/ddm_solver.py
deleted file mode 100644
index 8dd208d..0000000
--- a/example/ddm_solver.py
+++ /dev/null
@@ -1,97 +0,0 @@
-import Htool
-import matplotlib.pyplot as plt
-import mpi4py
-import numpy as np
-from create_geometry import create_random_geometries
-from define_custom_generators import CustomGeneratorWithPermutation
-
-# Random geometry
-size = 500
-dimension = 3
-
-[points, _] = create_random_geometries(dimension, size, size)
-
-
-# Htool parameters
-eta = 10
-epsilon = 1e-3
-minclustersize = 10
-number_of_children = 2
-
-# Build clusters
-cluster_builder = Htool.ClusterBuilder()
-cluster_builder.set_minclustersize(minclustersize)
-cluster: Htool.Cluster = cluster_builder.create_cluster_tree(
-    points, number_of_children, mpi4py.MPI.COMM_WORLD.size
-)
-
-# Build generator
-generator = CustomGeneratorWithPermutation(
-    cluster.get_permutation(), points, cluster.get_permutation(), points
-)
-
-# Build distributed operator
-default_approximation = Htool.DefaultApproximationBuilder(
-    generator,
-    cluster,
-    cluster,
-    epsilon,
-    eta,
-    "S",
-    "L",
-    mpi4py.MPI.COMM_WORLD,
-)
-
-# Solver with block Jacobi preconditionner
-default_solver_builder = Htool.DefaultSolverBuilder(
-    default_approximation.distributed_operator,
-    default_approximation.block_diagonal_hmatrix,
-)
-solver = default_solver_builder.solver
-
-
-# Solver with block Jacobi
-x_ref = np.random.random(size)
-b = default_approximation.distributed_operator * x_ref
-x = np.zeros(size)
-
-hpddm_args = "-hpddm_compute_residual l2 "
-if mpi4py.MPI.COMM_WORLD.Get_rank() == 0:
-    hpddm_args += "-hpddm_verbosity 10"
-solver.set_hpddm_args(hpddm_args)
-solver.facto_one_level()
-solver.solve(x, b)
-
-
-# Several ways to display information
-if mpi4py.MPI.COMM_WORLD.Get_rank() == 0:
-    print(np.linalg.norm(x - x_ref) / np.linalg.norm(x_ref))
-    hmatrix = default_approximation.hmatrix
-    local_block_hmatrix = default_approximation.block_diagonal_hmatrix
-    print(hmatrix.get_tree_parameters())
-    print(hmatrix.get_information())
-
-    fig = plt.figure()
-    ax1 = None
-    ax2 = None
-    ax3 = None
-    ax4 = None
-    if dimension == 2:
-        ax1 = fig.add_subplot(2, 2, 1)
-        ax2 = fig.add_subplot(2, 2, 2)
-        ax3 = fig.add_subplot(2, 2, 3)
-        ax4 = fig.add_subplot(2, 2, 4)
-    elif dimension == 3:
-        ax1 = fig.add_subplot(2, 2, 1, projection="3d")
-        ax2 = fig.add_subplot(2, 2, 2, projection="3d")
-        ax3 = fig.add_subplot(2, 2, 3)
-        ax4 = fig.add_subplot(2, 2, 4)
-
-    ax1.set_title("cluster at depth 1")
-    ax2.set_title("cluster at depth 2")
-    ax4.set_title("Hmatrix on rank 0")
-    Htool.plot(ax1, cluster, points, 1)
-    Htool.plot(ax2, cluster, points, 2)
-    Htool.plot(ax3, hmatrix)
-    Htool.plot(ax4, local_block_hmatrix)
-    plt.show()
diff --git a/example/define_custom_generators.py b/example/define_custom_generators.py
index 334e7a6..2519eab 100644
--- a/example/define_custom_generators.py
+++ b/example/define_custom_generators.py
@@ -2,66 +2,13 @@
 import numpy as np
 
 
-class CustomGenerator(Htool.VirtualGenerator):
-    def __init__(self, target_cluster, target_points, source_cluster, source_points):
+class CustomGenerator(Htool.VirtualGeneratorInUserNumbering):
+    def __init__(self, target_points, source_points):
         super().__init__()
         self.target_points = target_points
-        self.target_permutation = target_cluster.get_permutation()
         self.source_points = source_points
-        self.source_permutation = source_cluster.get_permutation()
-        self.nb_rows = len(self.target_permutation)
-        self.nb_cols = len(self.source_permutation)
-
-    def get_coef(self, i, j):
-        return 1.0 / (
-            1e-1
-            + np.linalg.norm(
-                self.target_points[:, self.target_permutation[i]]
-                - self.source_points[:, self.source_permutation[j]]
-            )
-        )
-
-    def build_submatrix(self, row_offset, col_offset, mat):
-        for j in range(0, mat.shape[0]):
-            for k in range(0, mat.shape[1]):
-                mat[j, k] = 1.0 / (
-                    1.0e-1
-                    + np.linalg.norm(
-                        self.target_points[:, self.target_permutation[j + row_offset]]
-                        - self.source_points[:, self.source_permutation[k + col_offset]]
-                    )
-                )
-
-    def mat_vec(self, x):
-        y = np.zeros(self.nb_rows)
-        for i in range(0, self.nb_rows):
-            for j in range(0, self.nb_cols):
-                y[self.target_permutation[i]] += (
-                    self.get_coef(i, j) * x[self.source_permutation[j]]
-                )
-        return y
-
-    def mat_mat(self, X):
-        Y = np.zeros((self.nb_rows, X.shape[1]))
-
-        for i in range(0, self.nb_rows):
-            for j in range(0, X.shape[1]):
-                for k in range(0, self.nb_cols):
-                    Y[self.target_permutation[i], j] += (
-                        self.get_coef(i, k) * X[self.source_permutation[k], j]
-                    )
-        return Y
-
-
-class CustomGeneratorWithPermutation(Htool.VirtualGeneratorWithPermutation):
-    def __init__(
-        self, target_permutation, target_points, source_permutation, source_points
-    ):
-        super().__init__(target_permutation, source_permutation)
-        self.target_points = target_points
-        self.source_points = source_points
-        self.nb_rows = len(target_permutation)
-        self.nb_cols = len(source_permutation)
+        self.nb_rows = target_points.shape[1]
+        self.nb_cols = source_points.shape[1]
 
     def get_coef(self, i, j):
         return 1.0 / (
diff --git a/example/define_custom_local_operator.py b/example/define_custom_local_operator.py
index c28c4ce..526a38b 100644
--- a/example/define_custom_local_operator.py
+++ b/example/define_custom_local_operator.py
@@ -5,7 +5,7 @@
 class CustomLocalOperator(Htool.LocalOperator):
     def __init__(
         self,
-        generator: Htool.VirtualGenerator,
+        generator: Htool.VirtualGeneratorInUserNumbering,
         target_cluster: Htool.Cluster,
         source_cluster: Htool.Cluster,
         symmetry: str = "N",
@@ -23,7 +23,15 @@ def __init__(
         )
         self.data = np.zeros((target_cluster.get_size(), source_cluster.get_size()))
         generator.build_submatrix(
-            target_cluster.get_offset(), source_cluster.get_offset(), self.data
+            target_cluster.get_permutation()[
+                target_cluster.get_offset() : target_cluster.get_offset()
+                + target_cluster.get_size()
+            ],
+            source_cluster.get_permutation()[
+                source_cluster.get_offset() : source_cluster.get_offset()
+                + source_cluster.get_size()
+            ],
+            self.data,
         )
 
     def add_vector_product(
diff --git a/example/define_custom_low_rank_generator.py b/example/define_custom_low_rank_generator.py
index 6b02f5b..dab4378 100644
--- a/example/define_custom_low_rank_generator.py
+++ b/example/define_custom_low_rank_generator.py
@@ -5,11 +5,12 @@
 
 
 class CustomSVD(Htool.VirtualLowRankGenerator):
-    def build_low_rank_approximation(
-        self, generator, target_size, source_size, target_offset, source_offset, epsilon
-    ):
-        submat = np.zeros((target_size, source_size), order="F")
-        generator.build_submatrix(target_offset, source_offset, submat)
+    def __init__(self, generator: Htool.VirtualGeneratorInUserNumbering):
+        super().__init__(generator)
+
+    def build_low_rank_approximation(self, rows, cols, epsilon):
+        submat = np.zeros((len(rows), len(cols)), order="F")
+        self.build_submatrix(rows, cols, submat)
         u, s, vh = np.linalg.svd(submat, full_matrices=False)
 
         norm = np.linalg.norm(submat)
@@ -18,7 +19,7 @@ def build_low_rank_approximation(
         while count > 0 and math.sqrt(svd_norm) / norm < epsilon:
             svd_norm += s[count] ** 2
             count -= 1
-        count = min(count + 1, min(target_size, source_size))
+        count = min(count + 1, min(len(rows), len(cols)))
         self.set_U(u[:, 0:count] * s[0:count])
         self.set_V(vh[0:count, :])
         self.set_rank(count)
diff --git a/example/use_block_jacobi_solver_with_default_build.py b/example/use_block_jacobi_solver.py
similarity index 89%
rename from example/use_block_jacobi_solver_with_default_build.py
rename to example/use_block_jacobi_solver.py
index d7352ed..d3301a9 100644
--- a/example/use_block_jacobi_solver_with_default_build.py
+++ b/example/use_block_jacobi_solver.py
@@ -1,3 +1,5 @@
+import copy
+
 import Htool
 import matplotlib.pyplot as plt
 import mpi4py
@@ -26,7 +28,7 @@
 )
 
 # Build generator
-generator = CustomGenerator(cluster, points, cluster, points)
+generator = CustomGenerator(points, points)
 
 # Build distributed operator
 default_approximation = Htool.DefaultApproximationBuilder(
@@ -41,9 +43,10 @@
 )
 
 # Solver with block Jacobi preconditionner
-default_solver_builder = Htool.DefaultSolverBuilder(
-    default_approximation.distributed_operator,
-    default_approximation.block_diagonal_hmatrix,
+block_diagonal_hmatrix = copy.deepcopy(default_approximation.block_diagonal_hmatrix)
+test = default_approximation.block_diagonal_hmatrix
+default_solver_builder = Htool.DDMSolverBuilder(
+    default_approximation.distributed_operator, block_diagonal_hmatrix
 )
 solver = default_solver_builder.solver
 
@@ -79,10 +82,6 @@
     print(solver_information)
 
     fig = plt.figure()
-    ax1 = None
-    ax2 = None
-    ax3 = None
-    ax4 = None
     if dimension == 2:
         ax1 = fig.add_subplot(2, 2, 1)
         ax2 = fig.add_subplot(2, 2, 2)
diff --git a/example/use_block_jacobi_solver_with_no_default_build.py b/example/use_block_jacobi_solver_with_no_default_build.py
deleted file mode 100644
index e5ccc11..0000000
--- a/example/use_block_jacobi_solver_with_no_default_build.py
+++ /dev/null
@@ -1,134 +0,0 @@
-import Htool
-import matplotlib.pyplot as plt
-import mpi4py
-import numpy as np
-from create_geometry import create_partitionned_geometries
-from define_custom_generators import CustomGenerator
-
-# Random geometry
-size = 500
-dimension = 3
-[points, _, partition] = create_partitionned_geometries(
-    dimension, size, size, mpi4py.MPI.COMM_WORLD.size
-)
-
-
-# Htool parameters
-eta = 10
-epsilon = 1e-3
-minclustersize = 10
-number_of_children = 2
-
-# Build clusters
-cluster_builder = Htool.ClusterBuilder()
-cluster_builder.set_minclustersize(minclustersize)
-cluster: Htool.Cluster = cluster_builder.create_cluster_tree(
-    points, number_of_children, mpi4py.MPI.COMM_WORLD.size, partition
-)
-
-
-# Build generator
-generator = CustomGenerator(cluster, points, cluster, points)
-
-# Build HMatrix
-hmatrix_builder = Htool.HMatrixBuilder(
-    cluster,
-    cluster,
-    epsilon,
-    eta,
-    "S",
-    "L",
-    -1,
-    mpi4py.MPI.COMM_WORLD.rank,
-)
-
-hmatrix: Htool.HMatrix = hmatrix_builder.build(generator)
-
-
-# Build local operator
-local_operator = Htool.LocalHMatrix(
-    hmatrix,
-    cluster.get_cluster_on_partition(mpi4py.MPI.COMM_WORLD.rank),
-    cluster,
-    "N",
-    "N",
-    False,
-    False,
-)
-
-# Build distributed operator
-partition_from_cluster = Htool.PartitionFromCluster(cluster)
-distributed_operator = Htool.DistributedOperator(
-    partition_from_cluster,
-    partition_from_cluster,
-    "S",
-    "L",
-    mpi4py.MPI.COMM_WORLD,
-)
-
-distributed_operator.add_local_operator(local_operator)
-
-
-# Solver with block Jacobi preconditionner
-block_diagonal_hmatrix = hmatrix.get_sub_hmatrix(
-    cluster.get_cluster_on_partition(mpi4py.MPI.COMM_WORLD.rank),
-    cluster.get_cluster_on_partition(mpi4py.MPI.COMM_WORLD.rank),
-)
-default_solver_builder = Htool.DefaultSolverBuilder(
-    distributed_operator,
-    block_diagonal_hmatrix,
-)
-solver = default_solver_builder.solver
-
-# Solver with block Jacobi
-x_ref = np.random.random(size)
-b = distributed_operator * x_ref
-x = np.zeros(size)
-
-hpddm_args = "-hpddm_compute_residual l2 "
-if mpi4py.MPI.COMM_WORLD.Get_rank() == 0:
-    hpddm_args += "-hpddm_verbosity 10"
-solver.set_hpddm_args(hpddm_args)
-solver.facto_one_level()
-solver.solve(x, b)
-
-
-# Outputs
-hmatrix_distributed_information = hmatrix.get_distributed_information(
-    mpi4py.MPI.COMM_WORLD
-)
-hmatrix_tree_parameter = hmatrix.get_tree_parameters()
-hmatrix_local_information = hmatrix.get_local_information()
-solver_information = solver.get_information()
-if mpi4py.MPI.COMM_WORLD.Get_rank() == 0:
-    print(np.linalg.norm(x - x_ref) / np.linalg.norm(x_ref))
-    print(hmatrix_distributed_information)
-    print(hmatrix_local_information)
-    print(hmatrix_tree_parameter)
-    print(solver_information)
-
-    fig = plt.figure()
-    ax1 = None
-    ax2 = None
-    ax3 = None
-    ax4 = None
-    if dimension == 2:
-        ax1 = fig.add_subplot(2, 2, 1)
-        ax2 = fig.add_subplot(2, 2, 2)
-        ax3 = fig.add_subplot(2, 2, 3)
-        ax4 = fig.add_subplot(2, 2, 4)
-    elif dimension == 3:
-        ax1 = fig.add_subplot(2, 2, 1, projection="3d")
-        ax2 = fig.add_subplot(2, 2, 2, projection="3d")
-        ax3 = fig.add_subplot(2, 2, 3)
-        ax4 = fig.add_subplot(2, 2, 4)
-
-    ax1.set_title("cluster at depth 1")
-    ax2.set_title("cluster at depth 2")
-    ax3.set_title("Hmatrix on rank 0")
-    ax4.set_title("Block diagonal Hmatrix on rank 0")
-    Htool.plot(ax1, cluster, points, 1)
-    Htool.plot(ax2, cluster, points, 2)
-    Htool.plot(ax3, hmatrix)
-    Htool.plot(ax4, block_diagonal_hmatrix)
-    plt.show()
diff --git a/example/use_cluster.py b/example/use_cluster.py
index e975e89..1f3589a 100644
--- a/example/use_cluster.py
+++ b/example/use_cluster.py
@@ -41,8 +41,6 @@
 
 if mpi4py.MPI.COMM_WORLD.Get_rank() == 0:
     fig = plt.figure()
-    ax1 = None
-    ax2 = None
 
     if dimension == 2:
         ax1 = fig.add_subplot(1, 2, 1)
diff --git a/example/use_cluster_with_given_partition.py b/example/use_cluster_with_given_partition.py
index 2306eae..8499605 100644
--- a/example/use_cluster_with_given_partition.py
+++ b/example/use_cluster_with_given_partition.py
@@ -31,8 +31,6 @@
 
 if mpi4py.MPI.COMM_WORLD.Get_rank() == 0:
     fig = plt.figure()
-    ax1 = None
-    ax2 = None
 
     if dimension == 2:
         ax1 = fig.add_subplot(1, 2, 1)
diff --git a/example/use_custom_dense_block_generator.py b/example/use_custom_dense_block_generator.py
index 5514172..05639ba 100644
--- a/example/use_custom_dense_block_generator.py
+++ b/example/use_custom_dense_block_generator.py
@@ -32,9 +32,7 @@
 
 
 # Build generator
-generator = CustomGenerator(
-    target_cluster, target_points, source_cluster, source_points
-)
+generator = CustomGenerator(target_points, source_points)
 
 #
 custom_dense_blocks_generator = CustomDenseBlocksGenerator(generator)
diff --git a/example/use_custom_local_operator.py b/example/use_custom_local_operator.py
index 9d952d3..d9814fe 100644
--- a/example/use_custom_local_operator.py
+++ b/example/use_custom_local_operator.py
@@ -32,9 +32,7 @@
 
 
 # Build generator
-generator = CustomGenerator(
-    target_cluster, target_points, source_cluster, source_points
-)
+generator = CustomGenerator(target_points, source_points)
 
 # Build local operator
 local_operator = CustomLocalOperator(
@@ -44,22 +42,14 @@
     "N",
     "N",
     False,
-    False,
+    True,
 )
 
 # Build distributed operator
-target_partition_from_cluster = Htool.PartitionFromCluster(target_cluster)
-source_partition_from_cluster = Htool.PartitionFromCluster(source_cluster)
-distributed_operator = Htool.DistributedOperator(
-    target_partition_from_cluster,
-    source_partition_from_cluster,
-    "N",
-    "N",
-    mpi4py.MPI.COMM_WORLD,
+custom_local_approximation = Htool.CustomApproximationBuilder(
+    target_cluster, source_cluster, "N", "N", mpi4py.MPI.COMM_WORLD, local_operator
 )
-
-distributed_operator.add_local_operator(local_operator)
-
+distributed_operator = custom_local_approximation.distributed_operator
 
 # Test matrix vector product
 np.random.seed(0)
diff --git a/example/use_custom_low_rank_approximation.py b/example/use_custom_low_rank_approximation.py
index 1ed76b5..ac05a9c 100644
--- a/example/use_custom_low_rank_approximation.py
+++ b/example/use_custom_low_rank_approximation.py
@@ -32,13 +32,11 @@
 
 
 # Build generator
-generator = CustomGenerator(
-    target_cluster, target_points, source_cluster, source_points
-)
+generator = CustomGenerator(target_points, source_points)
 
 # Low rank generator
 
-low_rank_generator = CustomSVD()
+low_rank_generator = CustomSVD(generator)
 
 # Build HMatrix
 hmatrix_builder = Htool.HMatrixBuilder(
@@ -50,37 +48,16 @@
     "N",
     -1,
     mpi4py.MPI.COMM_WORLD.rank,
+    mpi4py.MPI.COMM_WORLD.rank,
 )
 hmatrix_builder.set_low_rank_generator(low_rank_generator)
-hmatrix: Htool.HMatrix = hmatrix_builder.build(generator)
-del hmatrix_builder
-low_rank_generator.test()
-del low_rank_generator
-
-
-# Build local operator
-local_operator = Htool.LocalHMatrix(
-    hmatrix,
-    target_cluster.get_cluster_on_partition(mpi4py.MPI.COMM_WORLD.rank),
-    source_cluster,
-    "N",
-    "N",
-    False,
-    False,
-)
 
 # Build distributed operator
-target_partition_from_cluster = Htool.PartitionFromCluster(target_cluster)
-source_partition_from_cluster = Htool.PartitionFromCluster(source_cluster)
-distributed_operator = Htool.DistributedOperator(
-    target_partition_from_cluster,
-    source_partition_from_cluster,
-    "N",
-    "N",
-    mpi4py.MPI.COMM_WORLD,
+distributed_operator_from_hmatrix = Htool.DistributedOperatorFromHMatrix(
+    generator, target_cluster, source_cluster, hmatrix_builder, mpi4py.MPI.COMM_WORLD
 )
 
-distributed_operator.add_local_operator(local_operator)
+distributed_operator = distributed_operator_from_hmatrix.distributed_operator
 
 
 # Test matrix vector product
diff --git a/example/use_default_build.py b/example/use_hmatrix_compression.py
similarity index 94%
rename from example/use_default_build.py
rename to example/use_hmatrix_compression.py
index e8278af..932a118 100644
--- a/example/use_default_build.py
+++ b/example/use_hmatrix_compression.py
@@ -32,9 +32,7 @@
 
 
 # Build generator
-generator = CustomGenerator(
-    target_cluster, target_points, source_cluster, source_points
-)
+generator = CustomGenerator(target_points, source_points)
 
 # Build distributed operator
 default_approximation = Htool.DefaultApproximationBuilder(
@@ -77,10 +75,7 @@
     print(hmatrix_tree_parameter)
 
     fig = plt.figure()
-    ax1 = None
-    ax2 = None
-    ax3 = None
-    ax4 = None
+
     if dimension == 2:
         ax1 = fig.add_subplot(2, 2, 1)
         ax2 = fig.add_subplot(2, 2, 2)
diff --git a/example/use_local_build.py b/example/use_local_hmatrix_compression.py
similarity index 91%
rename from example/use_local_build.py
rename to example/use_local_hmatrix_compression.py
index 2607705..60d9e23 100644
--- a/example/use_local_build.py
+++ b/example/use_local_hmatrix_compression.py
@@ -53,9 +53,7 @@
     permuted_source_points[:, i] = source_points[:, source_permutation[i]]
 
 # Build generator
-generator = CustomGenerator(
-    target_cluster, target_points, source_cluster, source_points
-)
+generator = CustomGenerator(target_points, source_points)
 
 
 # Build distributed operator
@@ -90,12 +88,7 @@
     permuted_source_points, number_of_children, 2, off_diagonal_partition
 )
 
-off_diagonal_generator = CustomGenerator(
-    target_cluster,
-    target_points,
-    off_diagonal_cluster,
-    permuted_source_points,
-)
+off_diagonal_generator = CustomGenerator(target_points, permuted_source_points)
 
 local_operator_1 = None
 if off_diagonal_nc_1 > 0:
@@ -154,10 +147,6 @@
     print(hmatrix_tree_parameter)
 
     fig = plt.figure()
-    ax1 = None
-    ax2 = None
-    ax3 = None
-    ax4 = None
     if dimension == 2:
         ax1 = fig.add_subplot(2, 2, 1)
         ax2 = fig.add_subplot(2, 2, 2)
@@ -175,11 +164,12 @@
     ax4.set_title("Hmatrix on rank 0")
     Htool.plot(ax1, source_cluster, source_points, 1)
     Htool.plot(ax2, source_cluster, source_points, 2)
-    Htool.plot(
-        ax3,
-        off_diagonal_cluster.get_cluster_on_partition(1),
-        permuted_source_points,
-        2,
-    )
+    if mpi4py.MPI.COMM_WORLD.Get_size() > 1:
+        Htool.plot(
+            ax3,
+            off_diagonal_cluster.get_cluster_on_partition(1),
+            permuted_source_points,
+            2,
+        )
     Htool.plot(ax4, hmatrix)
     plt.show()
diff --git a/example/use_no_default_build.py b/example/use_no_default_build.py
deleted file mode 100644
index 6d1b1c8..0000000
--- a/example/use_no_default_build.py
+++ /dev/null
@@ -1,128 +0,0 @@
-import Htool
-import matplotlib.pyplot as plt
-import mpi4py
-import numpy as np
-from create_geometry import create_partitionned_geometries
-from define_custom_generators import CustomGenerator
-
-# Random geometry
-nb_rows = 500
-nb_cols = 500
-dimension = 3
-[target_points, source_points, target_partition] = create_partitionned_geometries(
-    dimension, nb_rows, nb_cols, mpi4py.MPI.COMM_WORLD.size
-)
-
-
-# Htool parameters
-eta = 10
-epsilon = 1e-3
-minclustersize = 10
-number_of_children = 2
-
-# Build clusters
-cluster_builder = Htool.ClusterBuilder()
-cluster_builder.set_minclustersize(minclustersize)
-target_cluster: Htool.Cluster = cluster_builder.create_cluster_tree(
-    target_points, number_of_children, mpi4py.MPI.COMM_WORLD.size, target_partition
-)
-source_cluster: Htool.Cluster = cluster_builder.create_cluster_tree(
-    source_points, number_of_children, mpi4py.MPI.COMM_WORLD.size
-)
-
-
-# Build generator
-generator = CustomGenerator(
-    target_cluster, target_points, source_cluster, source_points
-)
-
-# Build HMatrix
-hmatrix_builder = Htool.HMatrixBuilder(
-    target_cluster,
-    source_cluster,
-    epsilon,
-    eta,
-    "N",
-    "N",
-    -1,
-    mpi4py.MPI.COMM_WORLD.rank,
-)
-
-hmatrix: Htool.HMatrix = hmatrix_builder.build(generator)
-
-
-# Build local operator
-local_operator = Htool.LocalHMatrix(
-    hmatrix,
-    target_cluster.get_cluster_on_partition(mpi4py.MPI.COMM_WORLD.rank),
-    source_cluster,
-    "N",
-    "N",
-    False,
-    False,
-)
-
-# Build distributed operator
-target_partition_from_cluster = Htool.PartitionFromCluster(target_cluster)
-source_partition_from_cluster = Htool.PartitionFromCluster(source_cluster)
-distributed_operator = Htool.DistributedOperator(
-    target_partition_from_cluster,
-    source_partition_from_cluster,
-    "N",
-    "N",
-    mpi4py.MPI.COMM_WORLD,
-)
-
-distributed_operator.add_local_operator(local_operator)
-
-
-# Test matrix vector product
-np.random.seed(0)
-x = np.random.rand(nb_cols)
-y_1 = distributed_operator * x
-y_2 = generator.mat_vec(x)
-print(mpi4py.MPI.COMM_WORLD.rank, np.linalg.norm(y_1 - y_2) / np.linalg.norm(y_2))
-
-
-# Test matrix matrix product
-X = np.asfortranarray(np.random.rand(nb_cols, 2))
-Y_1 = distributed_operator @ X
-Y_2 = generator.mat_mat(X)
-print(mpi4py.MPI.COMM_WORLD.rank, np.linalg.norm(Y_1 - Y_2) / np.linalg.norm(Y_2))
-
-
-# Outputs
-hmatrix_distributed_information = hmatrix.get_distributed_information(
-    mpi4py.MPI.COMM_WORLD
-)
-hmatrix_tree_parameter = hmatrix.get_tree_parameters()
-hmatrix_local_information = hmatrix.get_local_information()
-if mpi4py.MPI.COMM_WORLD.Get_rank() == 0:
-    print(hmatrix_distributed_information)
-    print(hmatrix_local_information)
-    print(hmatrix_tree_parameter)
-    fig = plt.figure()
-    ax1 = None
-    ax2 = None
-    ax3 = None
-    ax4 = None
-    if dimension == 2:
-        ax1 = fig.add_subplot(2, 2, 1)
-        ax2 = fig.add_subplot(2, 2, 2)
-        ax3 = fig.add_subplot(2, 2, 3)
-        ax4 = fig.add_subplot(2, 2, 4)
-    elif dimension == 3:
-        ax1 = fig.add_subplot(2, 2, 1, projection="3d")
-        ax2 = fig.add_subplot(2, 2, 2, projection="3d")
-        ax3 = fig.add_subplot(2, 2, 3, projection="3d")
-        ax4 = fig.add_subplot(2, 2, 4)
-
-    ax1.set_title("target cluster at depth 1")
-    ax2.set_title("target cluster at depth 2")
-    ax3.set_title("source cluster at depth 1")
-    ax4.set_title("Hmatrix on rank 0")
-    Htool.plot(ax1, target_cluster, target_points, 1)
-    Htool.plot(ax2, target_cluster, target_points, 2)
-    Htool.plot(ax3, source_cluster, source_points, 1)
-    Htool.plot(ax4, hmatrix)
-    plt.show()
diff --git a/lib/hpddm b/lib/hpddm
index 55c0af0..5890d5a 160000
--- a/lib/hpddm
+++ b/lib/hpddm
@@ -1 +1 @@
-Subproject commit 55c0af02e5b78d2cb1e466b684e06ce2f111d2ac
+Subproject commit 5890d5addf3962d539dc25c441ec3ff4af93b3ab
diff --git a/lib/htool b/lib/htool
index dd96716..29ce0df 160000
--- a/lib/htool
+++ b/lib/htool
@@ -1 +1 @@
-Subproject commit dd96716e2d522b2ca50949ddc1c15581c0d0a8f8
+Subproject commit 29ce0dfe8125b6ebbd6efc1dfff6229dbaf92f38
diff --git a/pyproject.toml b/pyproject.toml
index 3ae84e8..5537558 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -21,7 +21,7 @@ dependencies = ["mpi4py", "numpy"]
 
 
 [project.optional-dependencies]
-dev = ["ruff", "matplotlib>=3.0.0", "pytest"]
+dev = ["ruff", "matplotlib>=3.0.0", "pytest", "scipy"]
 
 
 [project.urls]
diff --git a/src/htool/clustering/cluster_node.hpp b/src/htool/clustering/cluster_node.hpp
index abfdf92..fdd5861 100644
--- a/src/htool/clustering/cluster_node.hpp
+++ b/src/htool/clustering/cluster_node.hpp
@@ -20,21 +20,6 @@ void declare_cluster_node(py::module &m, const std::string &className) {
     py_class.def("get_offset", &Class::get_offset);
     py_class.def("get_permutation", [](const Class &self) {
         auto &permutation = self.get_permutation();
-        // int rankWorld;
-        // MPI_Comm_rank(MPI_COMM_WORLD, &rankWorld);
-        // if (rankWorld == 0) {
-        //     for (auto &elt : permutation) {
-        //         std::cout << elt << " ";
-        //     }
-        //     std::cout << "\n";
-        // }
-        // MPI_Barrier(MPI_COMM_WORLD);
-        // if (rankWorld == 1) {
-        //     for (auto &elt : permutation) {
-        //         std::cout << elt << " ";
-        //     }
-        //     std::cout << "\n";
-        // }
         return py::array_t<int>(std::array<std::size_t, 1>{permutation.size()}, permutation.data(), py::capsule(permutation.data()));
         ;
     });
diff --git a/src/htool/distributed_operator/distributed_operator.hpp b/src/htool/distributed_operator/distributed_operator.hpp
index ceccf29..08b6215 100644
--- a/src/htool/distributed_operator/distributed_operator.hpp
+++ b/src/htool/distributed_operator/distributed_operator.hpp
@@ -2,7 +2,6 @@
 #define HTOOL_PYBIND11_DISTRIBUTED_OPERATOR_HPP
 #include "../misc/utility.hpp"
 #include "../misc/wrapper_mpi.hpp"
-#include "./interface/partition.hpp"
 #include <htool/distributed_operator/distributed_operator.hpp>
 #include <htool/distributed_operator/utility.hpp>
 #include <pybind11/pybind11.h>
@@ -17,21 +16,24 @@ void declare_distributed_operator(py::module &m, const std::string &class_name)
 
     // Linear algebra
     py_class.def(
-        "__mul__", [](const Class &self, std::vector<CoefficientPrecision> in) {
-            std::vector<CoefficientPrecision> out(self.get_target_partition().get_global_size());
-            self.vector_product_global_to_global(in.data(), out.data());
-            return as_pyarray(std::move(out));
-            ;
+        "__mul__", [](const Class &self, const py::array_t<CoefficientPrecision, py::array::f_style> input) {
+            if (input.ndim() != 1) {
+                throw std::runtime_error("Wrong dimension for HMatrix-vector product"); // LCOV_EXCL_LINE
+            }
+            if (input.shape()[0] != self.get_source_partition().get_global_size()) {
+                throw std::runtime_error("Wrong size for HMatrix-vector product"); // LCOV_EXCL_LINE
+            }
+            py::array_t<CoefficientPrecision, py::array::f_style> result(std::array<long int, 1>{self.get_target_partition().get_global_size()});
+            self.vector_product_global_to_global(input.data(), result.mutable_data());
+
+            return result;
         },
         "in"_a);
 
     py_class.def(
         "__matmul__", [](const Class &self, py::array_t<CoefficientPrecision, py::array::f_style> input) {
             int mu;
-
-            if (input.ndim() == 1) {
-                mu = 1;
-            } else if (input.ndim() == 2) {
+            if (input.ndim() == 2) {
                 mu = input.shape()[1];
             } else {
                 throw std::runtime_error("Wrong dimension for HMatrix-matrix product"); // LCOV_EXCL_LINE
@@ -40,21 +42,12 @@ void declare_distributed_operator(py::module &m, const std::string &class_name)
                 throw std::runtime_error("Wrong size for HMatrix-matrix product"); // LCOV_EXCL_LINE
             }
 
-            std::vector<CoefficientPrecision> result(self.get_target_partition().get_global_size() * mu, 0);
-
-            const CoefficientPrecision *in   = input.data();
-            int nc                           = input.shape()[0];
-            const CoefficientPrecision *test = input.data();
+            std::array<long int, 2> shape{self.get_target_partition().get_global_size(), mu};
+            py::array_t<CoefficientPrecision, py::array::f_style> result(shape);
 
-            self.matrix_product_global_to_global(input.data(), result.data(), mu);
+            self.matrix_product_global_to_global(input.data(), result.mutable_data(), mu);
 
-            if (input.ndim() == 1) {
-                std::array<long int, 1> shape{self.get_target_partition().get_global_size()};
-                return py::array_t<CoefficientPrecision, py::array::f_style>(shape, result.data());
-            } else {
-                std::array<long int, 2> shape{self.get_target_partition().get_global_size(), mu};
-                return py::array_t<CoefficientPrecision, py::array::f_style>(shape, result.data());
-            }
+            return result;
         },
         py::arg("input").noconvert(true));
 }
diff --git a/src/htool/distributed_operator/implementation/partition_from_cluster.hpp b/src/htool/distributed_operator/implementation/partition_from_cluster.hpp
deleted file mode 100644
index 497790f..0000000
--- a/src/htool/distributed_operator/implementation/partition_from_cluster.hpp
+++ /dev/null
@@ -1,16 +0,0 @@
-#ifndef HTOOL_DISTRIBUTED_OPERATOR_PARTITION_FROM_CLUSTER_CPP
-#define HTOOL_DISTRIBUTED_OPERATOR_PARTITION_FROM_CLUSTER_CPP
-
-#include <htool/distributed_operator/implementations/partition_from_cluster.hpp>
-#include <htool/distributed_operator/interfaces/partition.hpp>
-#include <pybind11/pybind11.h>
-
-template <typename CoefficientPrecision, typename CoordinatePrecision>
-void declare_partition_from_cluster(py::module &m, const std::string &class_name) {
-    using Class = htool::PartitionFromCluster<CoefficientPrecision, CoordinatePrecision>;
-
-    py::class_<Class, htool::IPartition<CoefficientPrecision>> py_class(m, class_name.c_str());
-    py_class.def(py::init<const Cluster<CoordinatePrecision> &>(), py::keep_alive<1, 2>());
-}
-
-#endif
diff --git a/src/htool/distributed_operator/interface/partition.hpp b/src/htool/distributed_operator/interface/partition.hpp
deleted file mode 100644
index ed42d39..0000000
--- a/src/htool/distributed_operator/interface/partition.hpp
+++ /dev/null
@@ -1,32 +0,0 @@
-#ifndef HTOOL_PYBIND11_DISTRIBUTED_OPERATOR_PARTITION_HPP
-#define HTOOL_PYBIND11_DISTRIBUTED_OPERATOR_PARTITION_HPP
-
-#include <htool/distributed_operator/interfaces/partition.hpp>
-#include <pybind11/pybind11.h>
-
-// class PyIPartition : public htool::IPartition {
-//   public:
-//     /* Inherit the constructors */
-//     using htool::IPartition::IPartition;
-
-//     /* Trampoline (need one for each virtual function) */
-//     std::string go(int n_times) override {
-//         PYBIND11_OVERRIDE_PURE(
-//             std::string, /* Return type */
-//             IPartition,  /* Parent class */
-//             go,          /* Name of function in C++ (must match Python name) */
-//             n_times      /* Argument(s) */
-//         );
-//     }
-// };
-
-template <typename CoefficientPrecision>
-void declare_interface_partition(py::module &m, const std::string &class_name) {
-    using Class = htool::IPartition<CoefficientPrecision>;
-    py::class_<Class> py_class(m, class_name.c_str());
-    py_class.def("get_size_of_partition", &Class::get_size_of_partition);
-    py_class.def("get_offset_of_partition", &Class::get_offset_of_partition);
-    py_class.def("get_global_size", &Class::get_global_size);
-}
-
-#endif
diff --git a/src/htool/distributed_operator/utility.hpp b/src/htool/distributed_operator/utility.hpp
index 660c009..8b5f292 100644
--- a/src/htool/distributed_operator/utility.hpp
+++ b/src/htool/distributed_operator/utility.hpp
@@ -8,12 +8,23 @@
 template <typename CoefficientPrecision, typename CoordinatePrecision>
 void declare_distributed_operator_utility(py::module &m, std::string prefix = "") {
 
-    using DefaultApproximation                   = DefaultApproximationBuilder<CoefficientPrecision, CoordinatePrecision>;
-    using LocalDefaultApproximation              = DefaultLocalApproximationBuilder<CoefficientPrecision, CoordinatePrecision>;
-    std::string default_approximation_name       = prefix + "DefaultApproximationBuilder";
-    std::string default_local_approximation_name = prefix + "DefaultLocalApproximationBuilder";
+    using CustomApproximation            = CustomApproximationBuilder<CoefficientPrecision, CoordinatePrecision>;
+    using DefaultApproximation           = DefaultApproximationBuilder<CoefficientPrecision, CoordinatePrecision>;
+    using LocalDefaultApproximation      = DefaultLocalApproximationBuilder<CoefficientPrecision, CoordinatePrecision>;
+    using DistributedOperatorFromHMatrix = DistributedOperatorFromHMatrix<CoefficientPrecision, CoordinatePrecision>;
+
+    std::string custom_approximation_name              = prefix + "CustomApproximationBuilder";
+    std::string default_approximation_name             = prefix + "DefaultApproximationBuilder";
+    std::string default_local_approximation_name       = prefix + "DefaultLocalApproximationBuilder";
+    std::string distributed_operator_from_hmatrix_name = prefix + "DistributedOperatorFromHMatrix";
+
+    py::class_<CustomApproximation> custom_approximation_class(m, custom_approximation_name.c_str());
+    custom_approximation_class.def(py::init<const Cluster<CoordinatePrecision> &, const Cluster<CoordinatePrecision> &, char, char, MPI_Comm_wrapper, const VirtualLocalOperator<CoefficientPrecision> &>());
+    custom_approximation_class.def_property_readonly(
+        "distributed_operator", [](const CustomApproximation &self) { return &self.distributed_operator; }, py::return_value_policy::reference_internal);
+
     py::class_<DefaultApproximation> default_approximation_class(m, default_approximation_name.c_str());
-    default_approximation_class.def(py::init<const VirtualGenerator<CoefficientPrecision> &, const Cluster<CoordinatePrecision> &, const Cluster<CoordinatePrecision> &, htool::underlying_type<CoefficientPrecision>, htool::underlying_type<CoefficientPrecision>, char, char, MPI_Comm_wrapper>());
+    default_approximation_class.def(py::init<const VirtualGeneratorInUserNumbering<CoefficientPrecision> &, const Cluster<CoordinatePrecision> &, const Cluster<CoordinatePrecision> &, htool::underlying_type<CoefficientPrecision>, htool::underlying_type<CoefficientPrecision>, char, char, MPI_Comm_wrapper>());
     default_approximation_class.def_property_readonly(
         "distributed_operator", [](const DefaultApproximation &self) { return &self.distributed_operator; }, py::return_value_policy::reference_internal);
     default_approximation_class.def_property_readonly(
@@ -22,12 +33,21 @@ void declare_distributed_operator_utility(py::module &m, std::string prefix = ""
         "block_diagonal_hmatrix", [](const DefaultApproximation &self) { return &*self.block_diagonal_hmatrix; }, py::return_value_policy::reference_internal);
 
     py::class_<LocalDefaultApproximation> default_local_approximation_class(m, default_local_approximation_name.c_str());
-    default_local_approximation_class.def(py::init<const VirtualGenerator<CoefficientPrecision> &, const Cluster<CoordinatePrecision> &, const Cluster<CoordinatePrecision> &, htool::underlying_type<CoefficientPrecision>, htool::underlying_type<CoefficientPrecision>, char, char, MPI_Comm_wrapper>());
+    default_local_approximation_class.def(py::init<const VirtualGeneratorInUserNumbering<CoefficientPrecision> &, const Cluster<CoordinatePrecision> &, const Cluster<CoordinatePrecision> &, htool::underlying_type<CoefficientPrecision>, htool::underlying_type<CoefficientPrecision>, char, char, MPI_Comm_wrapper>());
     default_local_approximation_class.def_property_readonly(
         "distributed_operator", [](const LocalDefaultApproximation &self) { return &self.distributed_operator; }, py::return_value_policy::reference_internal);
     default_local_approximation_class.def_property_readonly(
         "hmatrix", [](const LocalDefaultApproximation &self) { return &self.hmatrix; }, py::return_value_policy::reference_internal);
     default_local_approximation_class.def_property_readonly(
         "block_diagonal_hmatrix", [](const LocalDefaultApproximation &self) { return &*self.block_diagonal_hmatrix; }, py::return_value_policy::reference_internal);
+
+    py::class_<DistributedOperatorFromHMatrix> distributed_operator_from_hmatrix_class(m, distributed_operator_from_hmatrix_name.c_str());
+    distributed_operator_from_hmatrix_class.def(py::init<const VirtualGeneratorInUserNumbering<CoefficientPrecision> &, const Cluster<CoordinatePrecision> &, const Cluster<CoordinatePrecision> &, const HMatrixTreeBuilder<CoefficientPrecision, CoordinatePrecision> &, MPI_Comm_wrapper>());
+    distributed_operator_from_hmatrix_class.def_property_readonly(
+        "distributed_operator", [](const DistributedOperatorFromHMatrix &self) { return &self.distributed_operator; }, py::return_value_policy::reference_internal);
+    distributed_operator_from_hmatrix_class.def_property_readonly(
+        "hmatrix", [](const DistributedOperatorFromHMatrix &self) { return &self.hmatrix; }, py::return_value_policy::reference_internal);
+    distributed_operator_from_hmatrix_class.def_property_readonly(
+        "block_diagonal_hmatrix", [](const DistributedOperatorFromHMatrix &self) { return &*self.block_diagonal_hmatrix; }, py::return_value_policy::reference_internal);
 }
 #endif
diff --git a/src/htool/hmatrix/hmatrix.hpp b/src/htool/hmatrix/hmatrix.hpp
index 4dc9c3b..15c124f 100644
--- a/src/htool/hmatrix/hmatrix.hpp
+++ b/src/htool/hmatrix/hmatrix.hpp
@@ -22,22 +22,23 @@ void declare_HMatrix(py::module &m, const std::string &className) {
     using Class = HMatrix<CoefficientPrecision, CoordinatePrecision>;
     py::class_<Class> py_class(m, className.c_str());
 
-    // py_class.def("build", [](Class &self, VirtualGeneratorCpp<T> &mat, const py::array_t<double, py::array::f_style> &x) {
-    //     self.build(mat, x.data());
-    // });
+    py_class.def("to_dense", [](const Class &self) {
+        std::array<long int, 2> shape{self.get_target_cluster().get_size(), self.get_source_cluster().get_size()};
+        py::array_t<CoefficientPrecision, py::array::f_style> dense(shape);
+        std::fill_n(dense.mutable_data(), dense.size(), CoefficientPrecision(0));
+        copy_to_dense(self, dense.mutable_data());
+        return dense;
+    });
 
-    // py_class.def("build_dense_blocks", [](Class &self, VirtualDenseBlocksGeneratorCpp<T> &dense_block_generator) {
-    //     self.build_dense_blocks(dense_block_generator);
-    // });
+    py_class.def("to_dense_in_user_numbering", [](const Class &self) {
+        std::array<long int, 2> shape{self.get_target_cluster().get_size(), self.get_source_cluster().get_size()};
+        py::array_t<CoefficientPrecision, py::array::f_style> dense(shape);
+        std::fill_n(dense.mutable_data(), dense.size(), CoefficientPrecision(0));
+        copy_to_dense_in_user_numbering(self, dense.mutable_data());
+        return dense;
+    });
 
-    // // Setters
-    // py_class.def("set_maxblocksize", &Class::set_maxblocksize);
-    // py_class.def("set_minsourcedepth", &Class::set_minsourcedepth);
-    // py_class.def("set_mintargetdepth", &Class::set_mintargetdepth);
-    // py_class.def("set_delay_dense_computation", &Class::set_delay_dense_computation);
-    // py_class.def("set_compression", [](Class &self, std::shared_ptr<VirtualLowRankGeneratorCpp<T>> mat) {
-    //     self.set_compression(mat);
-    // });
+    py_class.def("__deepcopy__", [](const Class &self, py::dict) { return Class(self); }, "memo"_a);
 
     // // Getters
     // py_class.def_property_readonly("shape", [](const Class &self) {
@@ -82,13 +83,6 @@ void declare_HMatrix(py::module &m, const std::string &className) {
     //     }
     // });
 
-    // // Print information
-    // py_class.def("print_infos", &Class::print_infos);
-    // py_class.def("get_infos", overload_cast_<const std::string &>()(&Class::get_infos, py::const_));
-    // py_class.def("__str__", [](const Class &self) {
-    //     return "HMatrix: (shape: " + htool::NbrToStr(self.nb_cols()) + "x" + htool::NbrToStr(self.nb_rows()) + ", nb_low_rank_blocks: " + htool::NbrToStr(self.get_nlrmat()) + ", nb_dense_blocks: " + htool::NbrToStr(self.get_ndmat()) + ")";
-    // });
-
     py_class.def(
         "get_sub_hmatrix", [](const HMatrix<CoefficientPrecision, CoordinatePrecision> &hmatrix, const Cluster<CoordinatePrecision> &target_cluster, const Cluster<CoordinatePrecision> &source_cluster) {
             return &*hmatrix.get_sub_hmatrix(target_cluster, source_cluster);
@@ -106,92 +100,6 @@ void declare_HMatrix(py::module &m, const std::string &className) {
         auto information = htool::get_distributed_hmatrix_information(hmatrix, comm);
         return information;
     });
-
-    // Plot pattern
-    py_class.def(
-        "display", [](const HMatrix<CoefficientPrecision, CoordinatePrecision> &hmatrix, bool show = true) {
-            std::vector<int> buf;
-            int nb_leaves = 0;
-            htool::preorder_tree_traversal(
-                hmatrix,
-                [&buf, &nb_leaves, &hmatrix](const HMatrix<CoefficientPrecision, CoordinatePrecision> &current_hmatrix) {
-                    if (current_hmatrix.is_leaf()) {
-                        nb_leaves += 1;
-                        buf.push_back(current_hmatrix.get_target_cluster().get_offset() - hmatrix.get_target_cluster().get_offset());
-                        buf.push_back(current_hmatrix.get_target_cluster().get_size());
-                        buf.push_back(current_hmatrix.get_source_cluster().get_offset() - hmatrix.get_source_cluster().get_offset());
-                        buf.push_back(current_hmatrix.get_source_cluster().get_size());
-                        buf.push_back(current_hmatrix.get_rank());
-                    }
-                });
-
-            // Import
-            py::object plt     = py::module::import("matplotlib.pyplot");
-            py::object patches = py::module::import("matplotlib.patches");
-            py::object colors  = py::module::import("matplotlib.colors");
-            py::object numpy   = py::module::import("numpy");
-
-            // First Data
-            int nr = hmatrix.get_target_cluster().get_size();
-            int nc = hmatrix.get_source_cluster().get_size();
-            py::array_t<int> matrix({nr, nc});
-            py::array_t<bool> mask_matrix({nr, nc});
-            mask_matrix.attr("fill")(false);
-
-            // Figure
-            py::tuple sublots_output = plt.attr("subplots")(1, 1);
-            py::object fig           = sublots_output[0];
-            py::object axes          = sublots_output[1];
-            // axes.attr()
-
-            // Issue: there a shift of one pixel along the y-axis...
-            // int shift = axes.transData.transform([(0,0), (1,1)])
-            // shift = shift[1,1] - shift[0,1]  # 1 unit in display coords
-            int shift = 0;
-
-            int max_rank = 0;
-            for (int p = 0; p < nb_leaves; p++) {
-                int i_row  = buf[5 * p];
-                int nb_row = buf[5 * p + 1];
-                int i_col  = buf[5 * p + 2];
-                int nb_col = buf[5 * p + 3];
-                int rank   = buf[5 * p + 4];
-
-                if (rank > max_rank) {
-                    max_rank = rank;
-                }
-                for (int i = 0; i < nb_row; i++) {
-                    for (int j = 0; j < nb_col; j++) {
-                        matrix.mutable_at(i_row + i, i_col + j) = rank;
-                        if (rank == -1) {
-                            mask_matrix.mutable_at(i_row + i, i_col + j) = true;
-                        }
-                    }
-                }
-
-                py::object rect = patches.attr("Rectangle")(py::make_tuple(i_col - 0.5, i_row - 0.5 + shift), nb_col, nb_row, "linewidth"_a = 0.75, "edgecolor"_a = 'k', "facecolor"_a = "none");
-                axes.attr("add_patch")(rect);
-
-                if (rank >= 0 && nb_col / double(nc) > 0.05 && nb_row / double(nc) > 0.05) {
-                    axes.attr("annotate")(rank, py::make_tuple(i_col + nb_col / 2., i_row + nb_row / 2.), "color"_a = "white", "size"_a = 10, "va"_a = "center", "ha"_a = "center");
-                }
-            }
-
-            // Colormap
-            py::object cmap     = plt.attr("get_cmap")("YlGn");
-            py::object new_cmap = colors.attr("LinearSegmentedColormap").attr("from_list")("trunc(YlGn,0.4,1)", cmap(numpy.attr("linspace")(0.4, 1, 100)));
-
-            // Plot
-            py::object masked_matrix = numpy.attr("ma").attr("array")(matrix, "mask"_a = mask_matrix);
-            new_cmap.attr("set_bad")("color"_a = "red");
-
-            plt.attr("imshow")(masked_matrix, "cmap"_a = new_cmap, "vmin"_a = 0, "vmax"_a = 10);
-            plt.attr("draw")();
-            if (show) {
-                plt.attr("show")(); // LCOV_EXCL_LINE
-            }
-        },
-        py::arg("show") = true);
 }
 
 #endif
diff --git a/src/htool/hmatrix/hmatrix_builder.hpp b/src/htool/hmatrix/hmatrix_builder.hpp
index 75a1f6f..2a4578d 100644
--- a/src/htool/hmatrix/hmatrix_builder.hpp
+++ b/src/htool/hmatrix/hmatrix_builder.hpp
@@ -12,13 +12,13 @@ void declare_hmatrix_builder(py::module &m, const std::string &className) {
     py::class_<Class> py_class(m, className.c_str());
 
     // Constructor
-    py_class.def(py::init<const htool::Cluster<CoordinatePrecision> &, const htool::Cluster<CoordinatePrecision> &, htool::underlying_type<CoefficientPrecision>, CoordinatePrecision, char, char, int, int>());
+    py_class.def(py::init<const htool::Cluster<CoordinatePrecision> &, const htool::Cluster<CoordinatePrecision> &, htool::underlying_type<CoefficientPrecision>, CoordinatePrecision, char, char, int, int, int>());
 
     // Build
-    py_class.def("build", [](const Class &self, const VirtualGenerator<CoefficientPrecision> &generator) { return self.build(generator); });
+    // py_class.def("build", [](const Class &self, const VirtualGenerator<CoefficientPrecision> &generator) { return self.build(generator); });
+    py_class.def("build", [](const Class &self, const VirtualGeneratorInUserNumbering<CoefficientPrecision> &generator) { return self.build(GeneratorWithPermutation<CoefficientPrecision>(generator, self.get_target_cluster().get_permutation().data(), self.get_source_cluster().get_permutation().data())); });
 
     // Setters
-    py_class.def("set_maximal_block_size", &Class::set_maximal_block_size);
     py_class.def("set_minimal_source_depth", &Class::set_minimal_source_depth);
     py_class.def("set_minimal_target_depth", &Class::set_minimal_target_depth);
     py_class.def("set_low_rank_generator", [](Class &self, const std::shared_ptr<VirtualLowRankGeneratorPython<CoefficientPrecision, CoordinatePrecision>> &low_rank_generator) { self.set_low_rank_generator(low_rank_generator); });
diff --git a/src/htool/hmatrix/interfaces/virtual_generator.hpp b/src/htool/hmatrix/interfaces/virtual_generator.hpp
index f96c5ee..8e4f816 100644
--- a/src/htool/hmatrix/interfaces/virtual_generator.hpp
+++ b/src/htool/hmatrix/interfaces/virtual_generator.hpp
@@ -7,46 +7,13 @@
 using namespace htool;
 
 template <typename CoefficientPrecision>
-class VirtualGeneratorPython : public htool::VirtualGenerator<CoefficientPrecision> {
+class VirtualGeneratorInUserNumberingPython : public htool::VirtualGeneratorInUserNumbering<CoefficientPrecision> {
   public:
-    using VirtualGenerator<CoefficientPrecision>::VirtualGenerator;
+    using VirtualGeneratorInUserNumbering<CoefficientPrecision>::VirtualGeneratorInUserNumbering;
 
-    void copy_submatrix(int M, int N, int row_offset, int col_offset, CoefficientPrecision *ptr) const override {
+    VirtualGeneratorInUserNumberingPython(const py::array_t<int> &target_permutation, const py::array_t<int> &source_permutation) : VirtualGeneratorInUserNumbering<CoefficientPrecision>() {}
 
-        py::array_t<CoefficientPrecision, py::array::f_style> mat(std::array<long int, 2>{M, N}, ptr, py::capsule(ptr));
-        build_submatrix(row_offset, col_offset, mat);
-    }
-
-    // lcov does not see it because of trampoline I assume
-    virtual void build_submatrix(int row_offset, int col_offset, py::array_t<CoefficientPrecision, py::array::f_style> &mat) const = 0; // LCOV_EXCL_LINE
-};
-
-template <typename CoefficientPrecision>
-class PyVirtualGenerator : public VirtualGeneratorPython<CoefficientPrecision> {
-  public:
-    using VirtualGeneratorPython<CoefficientPrecision>::VirtualGeneratorPython;
-
-    /* Trampoline (need one for each virtual function) */
-    virtual void build_submatrix(int row_offset, int col_offset, py::array_t<CoefficientPrecision, py::array::f_style> &mat) const override {
-        PYBIND11_OVERRIDE_PURE(
-            void,                                         /* Return type */
-            VirtualGeneratorPython<CoefficientPrecision>, /* Parent class */
-            build_submatrix,                              /* Name of function in C++ (must match Python name) */
-            row_offset,
-            col_offset,
-            mat /* Argument(s) */
-        );
-    }
-};
-
-template <typename CoefficientPrecision>
-class VirtualGeneratorWithPermutationPython : public htool::VirtualGeneratorWithPermutation<CoefficientPrecision> {
-  public:
-    using VirtualGeneratorWithPermutation<CoefficientPrecision>::VirtualGeneratorWithPermutation;
-
-    VirtualGeneratorWithPermutationPython(const py::array_t<int> &target_permutation, const py::array_t<int> &source_permutation) : VirtualGeneratorWithPermutation<CoefficientPrecision>(target_permutation.data(), source_permutation.data()) {}
-
-    void copy_submatrix_from_user_numbering(int M, int N, const int *const rows, const int *const cols, CoefficientPrecision *ptr) const override {
+    void copy_submatrix(int M, int N, const int *const rows, const int *const cols, CoefficientPrecision *ptr) const override {
         if (M * N > 0) {
             py::array_t<CoefficientPrecision, py::array::f_style> mat(std::array<long int, 2>{M, N}, ptr, py::capsule(ptr));
 
@@ -62,15 +29,15 @@ class VirtualGeneratorWithPermutationPython : public htool::VirtualGeneratorWith
 };
 
 template <typename CoefficientPrecision>
-class PyVirtualGeneratorWithPermutation : public VirtualGeneratorWithPermutationPython<CoefficientPrecision> {
+class PyVirtualGeneratorInUserNumbering : public VirtualGeneratorInUserNumberingPython<CoefficientPrecision> {
   public:
-    using VirtualGeneratorWithPermutationPython<CoefficientPrecision>::VirtualGeneratorWithPermutationPython;
+    using VirtualGeneratorInUserNumberingPython<CoefficientPrecision>::VirtualGeneratorInUserNumberingPython;
 
     /* Trampoline (need one for each virtual function) */
     virtual void build_submatrix(const py::array_t<int> &J, const py::array_t<int> &K, py::array_t<CoefficientPrecision, py::array::f_style> &mat) const override {
         PYBIND11_OVERRIDE_PURE(
             void,                                                        /* Return type */
-            VirtualGeneratorWithPermutationPython<CoefficientPrecision>, /* Parent class */
+            VirtualGeneratorInUserNumberingPython<CoefficientPrecision>, /* Parent class */
             build_submatrix,                                             /* Name of function in C++ (must match Python name) */
             J,
             K,
@@ -81,21 +48,13 @@ class PyVirtualGeneratorWithPermutation : public VirtualGeneratorWithPermutation
 
 template <typename CoefficientPrecision>
 void declare_virtual_generator(py::module &m, const std::string &className, const std::string &base_class_name) {
-    using BaseClass = VirtualGenerator<CoefficientPrecision>;
+    using BaseClass = VirtualGeneratorInUserNumbering<CoefficientPrecision>;
     py::class_<BaseClass>(m, base_class_name.c_str());
 
-    using Class = VirtualGeneratorPython<CoefficientPrecision>;
-    py::class_<Class, BaseClass, PyVirtualGenerator<CoefficientPrecision>> py_class(m, className.c_str());
+    using Class = VirtualGeneratorInUserNumberingPython<CoefficientPrecision>;
+    py::class_<Class, BaseClass, PyVirtualGeneratorInUserNumbering<CoefficientPrecision>> py_class(m, className.c_str());
     py_class.def(py::init<>());
     py_class.def("build_submatrix", &Class::build_submatrix);
-
-    using BaseClassWithPermutation = VirtualGeneratorWithPermutation<CoefficientPrecision>;
-    py::class_<BaseClassWithPermutation, BaseClass>(m, (base_class_name + "WithPermutation").c_str());
-
-    using ClassWithPermutation = VirtualGeneratorWithPermutationPython<CoefficientPrecision>;
-    py::class_<ClassWithPermutation, BaseClassWithPermutation, PyVirtualGeneratorWithPermutation<CoefficientPrecision>> py_class_with_permutation(m, (className + "WithPermutation").c_str());
-    py_class_with_permutation.def(py::init<const py::array_t<int> &, const py::array_t<int> &>());
-    py_class_with_permutation.def("build_submatrix", &ClassWithPermutation::build_submatrix);
 }
 
 #endif
diff --git a/src/htool/hmatrix/interfaces/virtual_low_rank_generator.hpp b/src/htool/hmatrix/interfaces/virtual_low_rank_generator.hpp
index 18fa23b..dcfdc8c 100644
--- a/src/htool/hmatrix/interfaces/virtual_low_rank_generator.hpp
+++ b/src/htool/hmatrix/interfaces/virtual_low_rank_generator.hpp
@@ -16,14 +16,18 @@ class VirtualLowRankGeneratorPython : public VirtualLowRankGenerator<Coefficient
     int m_rank;
     mutable std::vector<py::array_t<CoefficientPrecision, py::array::f_style>> m_mats_U; // owned by Python
     mutable std::vector<py::array_t<CoefficientPrecision, py::array::f_style>> m_mats_V; // owned by Python
-
-    // py::array_t<CoefficientPrecision, py::array::f_style> m_mat_U, m_mat_V;
+    const VirtualGeneratorInUserNumbering<CoefficientPrecision> &m_generator_in_user_numbering;
 
   public:
     using VirtualLowRankGenerator<CoefficientPrecision, CoordinatePrecision>::VirtualLowRankGenerator;
 
+    VirtualLowRankGeneratorPython(const VirtualGeneratorInUserNumbering<CoefficientPrecision> &generator_in_user_numbering) : m_generator_in_user_numbering(generator_in_user_numbering) {}
+
     void copy_low_rank_approximation(const VirtualGenerator<CoefficientPrecision> &A, const Cluster<CoordinatePrecision> &target_cluster, const Cluster<CoordinatePrecision> &source_cluster, underlying_type<CoefficientPrecision> epsilon, int &rank, Matrix<CoefficientPrecision> &U, Matrix<CoefficientPrecision> &V) const override {
-        build_low_rank_approximation(A, target_cluster.get_size(), source_cluster.get_size(), target_cluster.get_offset(), source_cluster.get_offset(), epsilon);
+        py::array_t<int, py::array::f_style> rows(target_cluster.get_size(), target_cluster.get_permutation().data() + target_cluster.get_offset(), py::capsule(target_cluster.get_permutation().data()));
+        py::array_t<int, py::array::f_style> cols(source_cluster.get_size(), source_cluster.get_permutation().data() + source_cluster.get_offset(), py::capsule(source_cluster.get_permutation().data()));
+
+        build_low_rank_approximation(rows, cols, epsilon);
         rank = m_rank;
         U.assign(m_mats_U.back().shape()[0], m_mats_U.back().shape()[1], m_mats_U.back().mutable_data(), false);
         V.assign(m_mats_V.back().shape()[0], m_mats_V.back().shape()[1], m_mats_V.back().mutable_data(), false);
@@ -32,13 +36,17 @@ class VirtualLowRankGeneratorPython : public VirtualLowRankGenerator<Coefficient
     bool is_htool_owning_data() const override { return false; }
 
     // lcov does not see it because of trampoline I assume
-    virtual void build_low_rank_approximation(const VirtualGenerator<CoefficientPrecision> &A, int target_size, int source_size, int target_offset, int source_offset, underlying_type<CoefficientPrecision> epsilon) const = 0; // LCOV_EXCL_LINE
+    virtual void build_low_rank_approximation(const py::array_t<int, py::array::f_style> &rows, const py::array_t<int, py::array::f_style> &cols, underlying_type<CoefficientPrecision> epsilon) const = 0; // LCOV_EXCL_LINE
 
     void set_U(py::array_t<CoefficientPrecision, py::array::f_style> U0) {
         m_mats_U.push_back(U0); // no copy here
     }
     void set_V(py::array_t<CoefficientPrecision, py::array::f_style> V0) { m_mats_V.push_back(V0); }
     void set_rank(int rank) { m_rank = rank; }
+
+    void build_submatrix(const py::array_t<int> rows, const py::array_t<int> cols, py::array_t<CoefficientPrecision, py::array::f_style> &mat) const {
+        m_generator_in_user_numbering.copy_submatrix(rows.size(), cols.size(), rows.data(), cols.data(), mat.mutable_data());
+    }
 };
 
 template <typename CoefficientPrecision, typename CoordinatePrecision>
@@ -47,46 +55,27 @@ class PyVirtualLowRankGenerator : public VirtualLowRankGeneratorPython<Coefficie
     using VirtualLowRankGeneratorPython<CoefficientPrecision, CoordinatePrecision>::VirtualLowRankGeneratorPython;
 
     /* Trampoline (need one for each virtual function) */
-    virtual void build_low_rank_approximation(const VirtualGenerator<CoefficientPrecision> &A, int target_size, int source_size, int target_offset, int source_offset, underlying_type<CoefficientPrecision> epsilon) const override {
+    virtual void build_low_rank_approximation(const py::array_t<int, py::array::f_style> &rows, const py::array_t<int, py::array::f_style> &cols, underlying_type<CoefficientPrecision> epsilon) const override {
         PYBIND11_OVERRIDE_PURE(
             void,                                                /* Return type */
             VirtualLowRankGeneratorPython<CoefficientPrecision>, /* Parent class */
             build_low_rank_approximation,                        /* Name of function in C++ (must match Python name) */
-            A,
-            target_size,
-            source_size,
-            target_offset,
-            source_offset,
+            rows,
+            cols,
             epsilon);
     }
 };
 
 template <typename CoefficientPrecision, typename CoordinatePrecision>
 void declare_custom_VirtualLowRankGenerator(py::module &m, const std::string &className) {
-    // using BaseClass = VirtualLowRankGenerator<CoefficientPrecision, CoordinatePrecision>;
-    // py::class_<BaseClass, std::shared_ptr<BaseClass>>(m, base_class_name.c_str());
-
     using Class = VirtualLowRankGeneratorPython<CoefficientPrecision, CoordinatePrecision>;
     py::class_<Class, std::shared_ptr<Class>, PyVirtualLowRankGenerator<CoefficientPrecision, CoordinatePrecision>> py_class(m, className.c_str());
-    py_class.def(py::init<>());
+    py_class.def(py::init<const VirtualGeneratorInUserNumbering<CoefficientPrecision> &>(), py::keep_alive<1, 2>()); // the generator is stored by reference: tie its lifetime to this object so build_submatrix never dereferences a collected Python generator
     py_class.def("build_low_rank_approximation", &Class::build_low_rank_approximation);
     py_class.def("set_U", &Class::set_U);
     py_class.def("set_V", &Class::set_V);
     py_class.def("set_rank", &Class::set_rank);
+    py_class.def("build_submatrix", &Class::build_submatrix);
 }
 
-// template <typename T>
-// void declare_VirtualLowRankGenerator(py::module &m, const std::string &className) {
-//     using Class = VirtualLowRankGenerator<T>;
-//     py::class_<Class> py_class(m, className.c_str());
-// }
-
-// template <template <class> class LowRankGeneratorType, typename T>
-// void declare_predefined_LowRankGenerator(py::module &m, const std::string &className) {
-
-//     py::class_<LowRankGeneratorType<T>, std::shared_ptr<LowRankGeneratorType<T>>, VirtualLowRankGenerator<T>> py_class(m, className.c_str());
-//     py_class.def(py::init<>());
-//     py_class.def("copy_low_rank_approximation", &LowRankGeneratorType<T>::copy_low_rank_approximation);
-// }
-
 #endif
diff --git a/src/htool/local_operator/local_operator.hpp b/src/htool/local_operator/local_operator.hpp
index 2ad7ffe..3304054 100644
--- a/src/htool/local_operator/local_operator.hpp
+++ b/src/htool/local_operator/local_operator.hpp
@@ -14,16 +14,16 @@ class LocalOperatorPython : public htool::LocalOperator<CoefficientPrecision, Co
 
     void local_add_vector_product(char trans, CoefficientPrecision alpha, const CoefficientPrecision *in, CoefficientPrecision beta, CoefficientPrecision *out) const override {
 
-        py::array_t<CoefficientPrecision> input(this->m_source_cluster.get_size(), in, py::capsule(in));
-        py::array_t<CoefficientPrecision> output(this->m_target_cluster.get_size(), out, py::capsule(out));
+        py::array_t<CoefficientPrecision> input(std::array<long int, 1>{this->m_source_cluster.get_size()}, in, py::capsule(in)); // 1D array over `in`, sized by the source cluster; the shape is passed as an explicit one-element container
+        py::array_t<CoefficientPrecision> output(std::array<long int, 1>{this->m_target_cluster.get_size()}, out, py::capsule(out)); // 1D array over `out`, sized by the target cluster; NOTE(review): both sizes ignore `trans`, confirm this is intended for transposed products
 
         add_vector_product(trans, alpha, input, beta, output);
     }
 
     void local_add_vector_product_symmetric(char trans, CoefficientPrecision alpha, const CoefficientPrecision *in, CoefficientPrecision beta, CoefficientPrecision *out, char UPLO, char symmetry) const override {
 
-        py::array_t<CoefficientPrecision> input(this->m_source_cluster.get_size(), in, py::capsule(in));
-        py::array_t<CoefficientPrecision> output(this->m_target_cluster.get_size(), out, py::capsule(out));
+        py::array_t<CoefficientPrecision> input(std::array<long int, 1>{this->m_source_cluster.get_size()}, in, py::capsule(in)); // 1D array over `in`, sized by the source cluster
+        py::array_t<CoefficientPrecision> output(std::array<long int, 1>{this->m_target_cluster.get_size()}, out, py::capsule(out)); // 1D array over `out`, sized by the target cluster; note that UPLO and symmetry are not forwarded to add_vector_product
 
         add_vector_product(trans, alpha, input, beta, output);
     }
diff --git a/src/htool/main.cpp b/src/htool/main.cpp
index 84df0f9..a847324 100644
--- a/src/htool/main.cpp
+++ b/src/htool/main.cpp
@@ -16,17 +16,15 @@
 #include "hmatrix/interfaces/virtual_generator.hpp"
 #include "hmatrix/interfaces/virtual_low_rank_generator.hpp"
 
-#include "local_operator/local_dense_operator.hpp"
-#include "local_operator/local_hmatrix.hpp"
 #include "local_operator/local_operator.hpp"
 #include "local_operator/virtual_local_operator.hpp"
 
 #include "distributed_operator/distributed_operator.hpp"
-#include "distributed_operator/implementation/partition_from_cluster.hpp"
 #include "distributed_operator/utility.hpp"
 
 #include "solver/geneo/coarse_operator_builder.hpp"
-#include "solver/geneo/coarse_space_builder.hpp"
+// #include "solver/geneo/coarse_space_builder.hpp"
+#include "solver/geneo/coarse_space_dense_builder.hpp"
 #include "solver/interfaces/virtual_coarse_operator_builder.hpp"
 #include "solver/interfaces/virtual_coarse_space_builder.hpp"
 #include "solver/solver.hpp"
@@ -36,11 +34,6 @@
 #include "matplotlib/hmatrix.hpp"
 #include "misc/logger.hpp"
 #include "misc/wrapper_mpi.hpp"
-// #include "ddm_solver.hpp"
-// #include "dense_blocks_generator.hpp"
-// #include "hmatrix.hpp"
-// #include "lrmat_generator.hpp"
-// #include "matrix.hpp"
 
 PYBIND11_MODULE(Htool, m) {
     // Delegate logging to python logging module
@@ -63,16 +56,11 @@ PYBIND11_MODULE(Htool, m) {
 
     declare_hmatrix_builder<double, double>(m, "HMatrixBuilder");
     declare_HMatrix<double, double>(m, "HMatrix");
-    declare_virtual_generator<double>(m, "VirtualGenerator", "IGenerator");
+    declare_virtual_generator<double>(m, "VirtualGeneratorInUserNumbering", "IGeneratorInUserNumbering");
     declare_custom_VirtualLowRankGenerator<double, double>(m, "VirtualLowRankGenerator");
     declare_custom_VirtualDenseBlocksGenerator<double>(m, "VirtualDenseBlocksGenerator");
 
     declare_local_operator<double, double>(m, "LocalOperator");
-    declare_local_hmatrix<double, double>(m, "LocalHMatrix");
-
-    declare_interface_partition<double>(m, "IPartition");
-    declare_partition_from_cluster<double, double>(m, "PartitionFromCluster");
-
     declare_distributed_operator<double>(m, "DistributedOperator");
     declare_distributed_operator_utility<double, double>(m);
 
@@ -82,7 +70,6 @@ PYBIND11_MODULE(Htool, m) {
     declare_geneo_coarse_operator_builder<double>(m, "GeneoCoarseOperatorBuilder");
     declare_geneo_coarse_space_dense_builder<double>(m, "GeneoCoarseSpaceDenseBuilder");
     declare_virtual_geneo_coarse_space_dense_builder<double>(m, "VirtualGeneoCoarseSpaceDenseBuilder");
-    declare_solver_utility(m);
     declare_solver_utility<double, double>(m);
 
     declare_matplotlib_cluster<double>(m);
@@ -90,7 +77,7 @@ PYBIND11_MODULE(Htool, m) {
 
     declare_hmatrix_builder<std::complex<double>, double>(m, "ComplexHMatrixBuilder");
     declare_HMatrix<std::complex<double>, double>(m, "ComplexHMatrix");
-    declare_virtual_generator<std::complex<double>>(m, "ComplexVirtualGenerator", "IComplexGenerator");
+    declare_virtual_generator<std::complex<double>>(m, "ComplexVirtualGeneratorInUserNumbering", "IComplexGeneratorInUserNumbering");
 
     declare_distributed_operator<std::complex<double>>(m, "ComplexDistributedOperator");
     declare_distributed_operator_utility<std::complex<double>, double>(m, "Complex");
diff --git a/src/htool/misc/utility.hpp b/src/htool/misc/utility.hpp
index f94887d..96d2781 100644
--- a/src/htool/misc/utility.hpp
+++ b/src/htool/misc/utility.hpp
@@ -16,7 +16,7 @@ inline pybind11::array_t<typename Sequence::value_type> as_pyarray(Sequence &&se
     std::unique_ptr<Sequence> seq_ptr = std::make_unique<Sequence>(std::move(seq));
     auto capsule                      = pybind11::capsule(seq_ptr.get(), [](void *p) { std::unique_ptr<Sequence>(reinterpret_cast<Sequence *>(p)); });
     seq_ptr.release();
-    return pybind11::array(size, data, capsule);
+    return pybind11::array({size}, {sizeof(typename Sequence::value_type)}, data, capsule);
 }
 
 #endif
diff --git a/src/htool/solver/geneo/coarse_space_builder.hpp b/src/htool/solver/geneo/coarse_space_builder.hpp
index e4d4364..b829276 100644
--- a/src/htool/solver/geneo/coarse_space_builder.hpp
+++ b/src/htool/solver/geneo/coarse_space_builder.hpp
@@ -2,20 +2,30 @@
 #define HTOOL_PYTHON_GENEO_COARSE_SPACE_BUILDER_HPP
 
 #include <htool/solvers/geneo/coarse_space_builder.hpp>
+#include <htool/solvers/interfaces/virtual_coarse_space_builder.hpp>
 #include <pybind11/pybind11.h>
 namespace py = pybind11;
 
 template <typename CoefficientPrecision, typename CoordinatePrecision = CoefficientPrecision>
-class GeneoCoarseSpaceDenseBuilderPython : public GeneoCoarseSpaceDenseBuilder<CoefficientPrecision> {
+class GeneoCoarseSpaceBuilderPython : public VirtualCoarseSpaceBuilder<CoefficientPrecision> {
     py::array_t<CoefficientPrecision, py::array::f_style> m_coarse_space;
 
+    int m_size_wo_overlap;
+    int m_size_with_overlap;
+    Matrix<CoefficientPrecision> m_DAiD;
+    Matrix<CoefficientPrecision> m_Bi;
+    char m_symmetry                                                = 'N';
+    char m_uplo                                                    = 'N';
+    int m_geneo_nu                                                 = 2;
+    htool::underlying_type<CoefficientPrecision> m_geneo_threshold = -1.;
+
     // using GeneoCoarseSpaceDenseBuilder<CoefficientPrecision>::GeneoCoarseSpaceDenseBuilder;
   public:
     char get_symmetry() { return this->m_symmetry; }
     int get_geneo_nu() { return this->m_geneo_nu; }
     htool::underlying_type<CoefficientPrecision> get_geneo_threshold() { return this->m_geneo_threshold; }
 
-    explicit GeneoCoarseSpaceDenseBuilderPython(int size_wo_overlap, Matrix<CoefficientPrecision> Ai, Matrix<CoefficientPrecision> Bi, char symmetry, char uplo, int geneo_nu, htool::underlying_type<CoefficientPrecision> geneo_threshold) : GeneoCoarseSpaceDenseBuilder<CoefficientPrecision>(size_wo_overlap, Ai, Bi, symmetry, uplo, geneo_nu, geneo_threshold) {}
+    explicit GeneoCoarseSpaceBuilderPython(int size_wo_overlap, HMatrix<CoefficientPrecision, CoordinatePrecision> Ai, Matrix<CoefficientPrecision> Bi, char symmetry, char uplo, int geneo_nu, htool::underlying_type<CoefficientPrecision> geneo_threshold) : m_size_wo_overlap(size_wo_overlap), m_size_with_overlap(Ai.nb_cols()), m_DAiD(m_size_with_overlap, m_size_with_overlap), m_Bi(Bi), m_symmetry(symmetry), m_uplo(uplo), m_geneo_nu(geneo_nu), m_geneo_threshold(geneo_threshold) {}
 
     Matrix<CoefficientPrecision> build_coarse_space() override {
         py::array_t<CoefficientPrecision, py::array::f_style> Ai(std::array<long int, 2>{this->m_DAiD.nb_rows(), this->m_DAiD.nb_cols()}, this->m_DAiD.data(), py::capsule(this->m_DAiD.data()));
@@ -23,8 +33,7 @@ class GeneoCoarseSpaceDenseBuilderPython : public GeneoCoarseSpaceDenseBuilder<C
         compute_coarse_space(Ai, Bi);
         Matrix<CoefficientPrecision> coarse_space_mat(m_coarse_space.shape()[0], m_coarse_space.shape()[1]);
         std::copy_n(m_coarse_space.data(), m_coarse_space.shape()[0] * m_coarse_space.shape()[1], coarse_space_mat.data()); // HPDDM deletes the coarse space, so we have to copy.
-        // coarse_space_mat.assign(m_coarse_space.shape()[0], m_coarse_space.shape()[1], m_coarse_space.mutable_data(), false);
-        // coarse_space_mat.print(std::cout, ",");
+
         return coarse_space_mat;
     }
 
@@ -36,20 +45,20 @@ class GeneoCoarseSpaceDenseBuilderPython : public GeneoCoarseSpaceDenseBuilder<C
 };
 
 template <typename CoefficientPrecision, typename CoordinatePrecision = CoefficientPrecision>
-class PyGeneoCoarseSpaceDenseBuilder : public GeneoCoarseSpaceDenseBuilderPython<CoefficientPrecision> {
+class PyGeneoCoarseSpaceDenseBuilder : public GeneoCoarseSpaceBuilderPython<CoefficientPrecision> {
 
   public:
     /* Inherit the constructors */
-    using GeneoCoarseSpaceDenseBuilderPython<CoefficientPrecision>::GeneoCoarseSpaceDenseBuilderPython;
+    using GeneoCoarseSpaceBuilderPython<CoefficientPrecision>::GeneoCoarseSpaceBuilderPython;
 
-    // explicit PyGeneoCoarseSpaceDenseBuilder(int size_wo_overlap, Matrix<CoefficientPrecision> Ai, Matrix<CoefficientPrecision> Bi, char symmetry, char uplo, int geneo_nu, htool::underlying_type<CoefficientPrecision> geneo_threshold) : GeneoCoarseSpaceDenseBuilderPython<CoefficientPrecision>(size_wo_overlap, Ai, Bi, symmetry, uplo, geneo_nu, geneo_threshold) {}
+    // explicit PyGeneoCoarseSpaceDenseBuilder(int size_wo_overlap, Matrix<CoefficientPrecision> Ai, Matrix<CoefficientPrecision> Bi, char symmetry, char uplo, int geneo_nu, htool::underlying_type<CoefficientPrecision> geneo_threshold) : GeneoCoarseSpaceBuilderPython<CoefficientPrecision>(size_wo_overlap, Ai, Bi, symmetry, uplo, geneo_nu, geneo_threshold) {}
 
     /* Trampoline (need one for each virtual function) */
     void compute_coarse_space(py::array_t<CoefficientPrecision, py::array::f_style> Ai, py::array_t<CoefficientPrecision, py::array::f_style> Bi) override {
         PYBIND11_OVERRIDE_PURE(
-            void,                                                     /* Return type */
-            GeneoCoarseSpaceDenseBuilderPython<CoefficientPrecision>, /* Parent class */
-            compute_coarse_space,                                     /* Name of function in C++ (must match Python name) */
+            void,                                                /* Return type */
+            GeneoCoarseSpaceBuilderPython<CoefficientPrecision>, /* Parent class */
+            compute_coarse_space,                                /* Name of function in C++ (must match Python name) */
             Ai,
             Bi /* Argument(s) */
         );
@@ -57,9 +66,9 @@ class PyGeneoCoarseSpaceDenseBuilder : public GeneoCoarseSpaceDenseBuilderPython
 };
 
 template <typename CoefficientPrecision>
-void declare_geneo_coarse_space_dense_builder(py::module &m, const std::string &className) {
+void declare_geneo_coarse_space_builder(py::module &m, const std::string &className) {
 
-    using Class = GeneoCoarseSpaceDenseBuilder<CoefficientPrecision>;
+    using Class = GeneoCoarseSpaceBuilder<CoefficientPrecision>;
     py::class_<Class, VirtualCoarseSpaceBuilder<CoefficientPrecision>> py_class(m, className.c_str());
     py_class.def(py::init([](int size_wo_overlap, py::array_t<CoefficientPrecision, py::array::f_style> Ai, py::array_t<CoefficientPrecision, py::array::f_style> Bi, char symmetry, char uplo, int geneo_nu) {
                      Matrix<CoefficientPrecision> Ai_mat;
@@ -94,7 +103,7 @@ void declare_geneo_coarse_space_dense_builder(py::module &m, const std::string &
 template <typename CoefficientPrecision>
 void declare_virtual_geneo_coarse_space_dense_builder(py::module &m, const std::string &className) {
 
-    using Class = GeneoCoarseSpaceDenseBuilderPython<CoefficientPrecision>;
+    using Class = GeneoCoarseSpaceBuilderPython<CoefficientPrecision>;
     py::class_<Class, PyGeneoCoarseSpaceDenseBuilder<CoefficientPrecision>, VirtualCoarseSpaceBuilder<CoefficientPrecision>> py_class(m, className.c_str());
     py_class.def(py::init([](int size_wo_overlap, py::array_t<CoefficientPrecision, py::array::f_style> Ai, py::array_t<CoefficientPrecision, py::array::f_style> Bi, char symmetry, char uplo, int geneo_nu) {
                      Matrix<CoefficientPrecision> Ai_mat;
diff --git a/src/htool/solver/geneo/coarse_space_dense_builder.hpp b/src/htool/solver/geneo/coarse_space_dense_builder.hpp
new file mode 100644
index 0000000..ad2f00f
--- /dev/null
+++ b/src/htool/solver/geneo/coarse_space_dense_builder.hpp
@@ -0,0 +1,133 @@
+#ifndef HTOOL_PYTHON_GENEO_COARSE_SPACE_DENSE_BUILDER_HPP
+#define HTOOL_PYTHON_GENEO_COARSE_SPACE_DENSE_BUILDER_HPP
+
+#include <htool/solvers/geneo/coarse_space_builder.hpp>
+#include <pybind11/pybind11.h>
+namespace py = pybind11;
+
+// Python-extensible GenEO dense coarse space builder: build_coarse_space() delegates the computation to compute_coarse_space(), which is overridden from Python.
+template <typename CoefficientPrecision, typename CoordinatePrecision = CoefficientPrecision>
+class GeneoCoarseSpaceDenseBuilderPython : public GeneoCoarseSpaceDenseBuilder<CoefficientPrecision> {
+    py::array_t<CoefficientPrecision, py::array::f_style> m_coarse_space; // array last passed to set_coarse_space()
+  public:
+    char get_symmetry() const { return this->m_symmetry; }
+    int get_geneo_nu() const { return this->m_geneo_nu; }
+    htool::underlying_type<CoefficientPrecision> get_geneo_threshold() const { return this->m_geneo_threshold; }
+
+    explicit GeneoCoarseSpaceDenseBuilderPython(int size_wo_overlap, int size_with_overlap, const Matrix<CoefficientPrecision> &Ai, const Matrix<CoefficientPrecision> &Bi, char symmetry, char uplo, int geneo_nu, htool::underlying_type<CoefficientPrecision> geneo_threshold) : GeneoCoarseSpaceDenseBuilder<CoefficientPrecision>(size_wo_overlap, size_with_overlap, Ai, Bi, symmetry, uplo, geneo_nu, geneo_threshold) {}
+
+    // Hands m_DAiD and m_Bi to compute_coarse_space() as numpy arrays, then returns a copy of the array stored by set_coarse_space().
+    Matrix<CoefficientPrecision> build_coarse_space() override {
+        py::array_t<CoefficientPrecision, py::array::f_style> Ai(std::array<long int, 2>{this->m_DAiD.nb_rows(), this->m_DAiD.nb_cols()}, this->m_DAiD.data(), py::capsule(this->m_DAiD.data()));
+        py::array_t<CoefficientPrecision, py::array::f_style> Bi(std::array<long int, 2>{this->m_Bi.nb_rows(), this->m_Bi.nb_cols()}, this->m_Bi.data(), py::capsule(this->m_Bi.data()));
+        compute_coarse_space(Ai, Bi);
+        if (m_coarse_space.ndim() != 2) { // shape()[1] below is only valid for a 2D array (a default-constructed array_t is not 2D)
+            throw py::value_error("compute_coarse_space must call set_coarse_space with a 2D array");
+        }
+        Matrix<CoefficientPrecision> coarse_space_mat(m_coarse_space.shape()[0], m_coarse_space.shape()[1]);
+        std::copy_n(m_coarse_space.data(), m_coarse_space.shape()[0] * m_coarse_space.shape()[1], coarse_space_mat.data()); // HPDDM deletes the coarse space, so we have to copy.
+        return coarse_space_mat;
+    }
+
+    virtual void compute_coarse_space(py::array_t<CoefficientPrecision, py::array::f_style> Ai, py::array_t<CoefficientPrecision, py::array::f_style> Bi) = 0; // implemented by the Python subclass, which is expected to call set_coarse_space()
+
+    void set_coarse_space(py::array_t<CoefficientPrecision, py::array::f_style> coarse_space) {
+        m_coarse_space = coarse_space;
+    }
+};
+
+template <typename CoefficientPrecision, typename CoordinatePrecision = CoefficientPrecision>
+class PyGeneoCoarseSpaceDenseBuilder : public GeneoCoarseSpaceDenseBuilderPython<CoefficientPrecision> {
+
+  public:
+    /* Inherit the constructors */
+    using GeneoCoarseSpaceDenseBuilderPython<CoefficientPrecision>::GeneoCoarseSpaceDenseBuilderPython;
+
+    // pybind11 trampoline class: forwards the pure virtual compute_coarse_space() to the override defined by a Python subclass.
+
+    /* Trampoline (need one for each virtual function) */
+    void compute_coarse_space(py::array_t<CoefficientPrecision, py::array::f_style> Ai, py::array_t<CoefficientPrecision, py::array::f_style> Bi) override {
+        PYBIND11_OVERRIDE_PURE(
+            void,                                                     /* Return type */
+            GeneoCoarseSpaceDenseBuilderPython<CoefficientPrecision>, /* Parent class */
+            compute_coarse_space,                                     /* Name of function in C++ (must match Python name) */
+            Ai,
+            Bi /* Argument(s) */
+        );
+    }
+};
+
+template <typename CoefficientPrecision>
+void declare_geneo_coarse_space_dense_builder(py::module &m, const std::string &className) {
+    // Binds GeneoCoarseSpaceDenseBuilder under `className` with two constructors: one selecting by geneo_nu, one by geneo_threshold.
+    using Class = GeneoCoarseSpaceDenseBuilder<CoefficientPrecision>;
+    py::class_<Class, VirtualCoarseSpaceBuilder<CoefficientPrecision>> py_class(m, className.c_str());
+    py_class.def(py::init([](int size_wo_overlap, int size_with_overlap, const HMatrix<CoefficientPrecision, underlying_type<CoefficientPrecision>> &Ai, py::array_t<CoefficientPrecision, py::array::f_style> Bi, char symmetry, char uplo, int geneo_nu) {
+                     Matrix<CoefficientPrecision> Bi_mat;
+                     Bi_mat.assign(Bi.shape()[0], Bi.shape()[1], Bi.mutable_data(), false); // presumably wraps the numpy buffer without taking ownership (last argument false), TODO confirm; assumes Bi is 2D
+                     return Class::GeneoWithNu(size_wo_overlap, size_with_overlap, Ai, Bi_mat, symmetry, uplo, geneo_nu);
+                 }),
+                 py::arg("size_wo_overlap"),
+                 py::arg("size_with_overlap"),
+                 py::arg("Ai"),
+                 py::arg("Bi"),
+                 py::arg("symmetry"),
+                 py::arg("uplo"),
+                 py::kw_only(), // geneo_nu must be passed by keyword
+                 py::arg("geneo_nu"));
+    py_class.def(py::init([](int size_wo_overlap, int size_with_overlap, const HMatrix<CoefficientPrecision, underlying_type<CoefficientPrecision>> &Ai, py::array_t<CoefficientPrecision, py::array::f_style> Bi, char symmetry, char uplo, double geneo_threshold) {
+                     Matrix<CoefficientPrecision> Bi_mat;
+                     Bi_mat.assign(Bi.shape()[0], Bi.shape()[1], Bi.mutable_data(), false); // same wrapping of Bi as in the geneo_nu constructor
+                     return Class::GeneoWithThreshold(size_wo_overlap, size_with_overlap, Ai, Bi_mat, symmetry, uplo, geneo_threshold);
+                 }),
+                 py::arg("size_wo_overlap"),
+                 py::arg("size_with_overlap"),
+                 py::arg("Ai"),
+                 py::arg("Bi"),
+                 py::arg("symmetry"),
+                 py::arg("uplo"),
+                 py::kw_only(), // geneo_threshold must be passed by keyword
+                 py::arg("geneo_threshold"));
+}
+
+template <typename CoefficientPrecision>
+void declare_virtual_geneo_coarse_space_dense_builder(py::module &m, const std::string &className) {
+    // Binds GeneoCoarseSpaceDenseBuilderPython (with its trampoline) under `className` so compute_coarse_space can be overridden in Python.
+    using Class = GeneoCoarseSpaceDenseBuilderPython<CoefficientPrecision>;
+    py::class_<Class, PyGeneoCoarseSpaceDenseBuilder<CoefficientPrecision>, VirtualCoarseSpaceBuilder<CoefficientPrecision>> py_class(m, className.c_str());
+    py_class.def(py::init([](int size_wo_overlap, int size_with_overlap, py::array_t<CoefficientPrecision, py::array::f_style> Ai, py::array_t<CoefficientPrecision, py::array::f_style> Bi, char symmetry, char uplo, int geneo_nu) {
+                     Matrix<CoefficientPrecision> Ai_mat;
+                     Ai_mat.assign(Ai.shape()[0], Ai.shape()[1], Ai.mutable_data(), false); // presumably wraps the numpy buffer without taking ownership (last argument false), TODO confirm; assumes Ai is 2D
+                     Matrix<CoefficientPrecision> Bi_mat;
+                     Bi_mat.assign(Bi.shape()[0], Bi.shape()[1], Bi.mutable_data(), false);
+                     return PyGeneoCoarseSpaceDenseBuilder<CoefficientPrecision>(size_wo_overlap, size_with_overlap, Ai_mat, Bi_mat, symmetry, uplo, geneo_nu, -1); // geneo_threshold is passed as -1 in this constructor
+                 }),
+                 py::arg("size_wo_overlap"),
+                 py::arg("size_with_overlap"),
+                 py::arg("Ai"),
+                 py::arg("Bi"),
+                 py::arg("symmetry"),
+                 py::arg("uplo"),
+                 py::kw_only(), // geneo_nu must be passed by keyword
+                 py::arg("geneo_nu"));
+    py_class.def(py::init([](int size_wo_overlap, int size_with_overlap, py::array_t<CoefficientPrecision, py::array::f_style> Ai, py::array_t<CoefficientPrecision, py::array::f_style> Bi, char symmetry, char uplo, double geneo_threshold) {
+                     Matrix<CoefficientPrecision> Ai_mat;
+                     Ai_mat.assign(Ai.shape()[0], Ai.shape()[1], Ai.mutable_data(), false);
+                     Matrix<CoefficientPrecision> Bi_mat;
+                     Bi_mat.assign(Bi.shape()[0], Bi.shape()[1], Bi.mutable_data(), false);
+                     return PyGeneoCoarseSpaceDenseBuilder<CoefficientPrecision>(size_wo_overlap, size_with_overlap, Ai_mat, Bi_mat, symmetry, uplo, 0, geneo_threshold); // geneo_nu is passed as 0 in this constructor
+                 }),
+                 py::arg("size_wo_overlap"),
+                 py::arg("size_with_overlap"),
+                 py::arg("Ai"),
+                 py::arg("Bi"),
+                 py::arg("symmetry"),
+                 py::arg("uplo"),
+                 py::kw_only(), // geneo_threshold must be passed by keyword
+                 py::arg("geneo_threshold"));
+    py_class.def("set_coarse_space", &Class::set_coarse_space); // called from the Python compute_coarse_space override to hand the result back
+    py_class.def_property_readonly("symmetry", &Class::get_symmetry);
+    py_class.def_property_readonly("geneo_nu", &Class::get_geneo_nu);
+    py_class.def_property_readonly("geneo_threshold", &Class::get_geneo_threshold);
+}
+#endif
diff --git a/src/htool/solver/solver.hpp b/src/htool/solver/solver.hpp
index 826cb0c..2b888fa 100644
--- a/src/htool/solver/solver.hpp
+++ b/src/htool/solver/solver.hpp
@@ -12,26 +12,9 @@ using namespace htool;
 template <typename CoefficientPrecision>
 void declare_DDM(py::module &m, const std::string &className) {
 
-    using Class = DDM<CoefficientPrecision>;
+    using Class = DDM<CoefficientPrecision, HPDDMCustomLocalSolver>;
     py::class_<Class> py_class(m, className.c_str());
-    py_class.def(py::init<
-                 const DistributedOperator<CoefficientPrecision> &,
-                 Matrix<CoefficientPrecision> &,
-                 const std::vector<int> &,
-                 const std::vector<std::vector<int>> &>());
     py_class.def("facto_one_level", &Class::facto_one_level);
-    // py_class.def("build_coarse_space", [](Class &self, py::array_t<CoefficientPrecision, py::array::f_style> Ki) {
-    //     if (Ki.ndim() != 2) {
-    //         throw std::invalid_argument("Wrong dimension for local matrix when building coarse space\n"); // LCOV_EXCL_LINE
-    //     }
-    //     if (Ki.shape()[0] != self.get_local_size() && Ki.shape()[1] != self.get_local_size()) {
-    //         throw std::invalid_argument("Wrong size for local matrix when building coarse space: (" + std::to_string(Ki.shape()[0]) + "," + std::to_string(Ki.shape()[1]) + ") vs (" + std::to_string(self.get_local_size()) + "," + std::to_string(self.get_local_size()) + ")\n"); // LCOV_EXCL_LINE
-    //     }
-
-    //     Matrix<CoefficientPrecision> Ki_mat(Ki.shape()[0], Ki.shape()[1]);
-    //     std::copy_n(Ki.data(), Ki.shape()[0] * Ki.shape()[1], Ki_mat.data());
-    //     self.build_coarse_space(Ki_mat);
-    // });
     py_class.def("build_coarse_space", py::overload_cast<VirtualCoarseSpaceBuilder<CoefficientPrecision> &, VirtualCoarseOperatorBuilder<CoefficientPrecision> &>(&Class::build_coarse_space));
     py_class.def(
         "solve", [](Class &self, py::array_t<CoefficientPrecision, py::array::f_style> x, const py::array_t<CoefficientPrecision, py::array::f_style | py::array::forcecast> b, std::string hpddm_args) {
diff --git a/src/htool/solver/utility.hpp b/src/htool/solver/utility.hpp
index f32ad8d..47636fa 100644
--- a/src/htool/solver/utility.hpp
+++ b/src/htool/solver/utility.hpp
@@ -3,53 +3,22 @@
 
 #include <htool/solvers/utility.hpp>
 
-void declare_solver_utility(py::module &m) {
-    py::class_<LocalNumberingBuilder> py_class(m, "LocalNumberingBuilder");
-    py_class.def(py::init<const std::vector<int> &, const std::vector<int> &, const std::vector<std::vector<int>> &>());
-    py_class.def_property_readonly(
-        "local_to_global_numbering", [](const LocalNumberingBuilder &self) { return &self.local_to_global_numbering; }, py::return_value_policy::reference_internal);
-    py_class.def_property_readonly(
-        "intersections", [](const LocalNumberingBuilder &self) { return &self.intersections; }, py::return_value_policy::reference_internal);
-}
-
 template <typename CoefficientPrecision, typename CoordinatePrecision>
 void declare_solver_utility(py::module &m, std::string prefix = "") {
 
-    using DefaultSolverBuilder                 = DefaultSolverBuilder<CoefficientPrecision, CoordinatePrecision>;
-    using DefaultDDMSolverBuilderAddingOverlap = DefaultDDMSolverBuilderAddingOverlap<CoefficientPrecision, CoordinatePrecision>;
-    using DefaultDDMSolverBuilder              = DefaultDDMSolverBuilder<CoefficientPrecision, CoordinatePrecision>;
+    using DDMSolverBuilder = DDMSolverBuilder<CoefficientPrecision, CoordinatePrecision>; // single builder class replacing the three Default*SolverBuilder bindings
 
-    std::string default_solver_name                    = prefix + "DefaultSolverBuilder";
-    std::string default_ddm_solver_adding_overlap_name = prefix + "DefaultDDMSolverBuilderAddingOverlap";
-    std::string default_ddm_solver_name                = prefix + "DefaultDDMSolverBuilder";
+    std::string ddm_solver_name = prefix + "DDMSolverBuilder"; // Python class name, with the optional prefix
 
-    py::class_<DefaultSolverBuilder> default_solver_class(m, default_solver_name.c_str());
-    default_solver_class.def(py::init<DistributedOperator<CoefficientPrecision> &, const HMatrix<CoefficientPrecision, CoordinatePrecision> *>());
-    default_solver_class.def_property_readonly(
-        "solver", [](const DefaultSolverBuilder &self) { return &self.solver; }, py::return_value_policy::reference_internal);
+    py::class_<DDMSolverBuilder> ddm_solver_class(m, ddm_solver_name.c_str());
+    ddm_solver_class.def(py::init<DistributedOperator<CoefficientPrecision> &, HMatrix<CoefficientPrecision, CoordinatePrecision> &>()); // NOTE(review): the removed DefaultDDMSolverBuilder binding used py::keep_alive on its arguments; confirm whether DDMSolverBuilder needs the same
 
-    py::class_<DefaultDDMSolverBuilderAddingOverlap> default_ddm_solver_adding_overlap_class(m, default_ddm_solver_adding_overlap_name.c_str());
-    default_ddm_solver_adding_overlap_class.def(py::init<DistributedOperator<CoefficientPrecision> &, const HMatrix<CoefficientPrecision, CoordinatePrecision> *, const VirtualGeneratorWithPermutation<CoefficientPrecision> &, const std::vector<int> &, const std::vector<int> &, const std::vector<int> &, const std::vector<std::vector<int>> &>());
-    default_ddm_solver_adding_overlap_class.def_property_readonly(
-        "solver", [](const DefaultDDMSolverBuilderAddingOverlap &self) { return &self.solver; }, py::return_value_policy::reference_internal);
-    default_ddm_solver_adding_overlap_class.def_property_readonly(
-        "local_to_global_numbering", [](const DefaultDDMSolverBuilderAddingOverlap &self) { return &self.local_to_global_numbering; }, py::return_value_policy::reference_internal);
-    default_ddm_solver_adding_overlap_class.def_property_readonly(
-        "block_diagonal_dense_matrix", [](const DefaultDDMSolverBuilderAddingOverlap &self) {
-            py::array_t<CoefficientPrecision, py::array::f_style> mat({self.block_diagonal_dense_matrix.nb_cols(), self.block_diagonal_dense_matrix.nb_rows()}, self.block_diagonal_dense_matrix.data(), py::capsule(self.block_diagonal_dense_matrix.data()));
-            return mat;
-        },
-        py::return_value_policy::reference_internal);
+    ddm_solver_class.def(py::init<DistributedOperator<CoefficientPrecision> &, HMatrix<CoefficientPrecision, CoordinatePrecision> &, const VirtualGeneratorInUserNumbering<CoefficientPrecision> &, const std::vector<int> &, const std::vector<int> &, const std::vector<int> &, const std::vector<std::vector<int>> &>());
+    ddm_solver_class.def(py::init([](DistributedOperator<CoefficientPrecision> &distributed_operator, const std::vector<int> &ovr_subdomain_to_global, const std::vector<int> &cluster_to_ovr_subdomain, const std::vector<int> &neighbors, const std::vector<std::vector<int>> &intersections, const VirtualGeneratorInUserNumbering<CoefficientPrecision> &generator, const py::array_t<CoordinatePrecision, py::array::f_style | py::array::forcecast> coordinates, underlying_type<CoefficientPrecision> epsilon, CoordinatePrecision eta) {
+        return new DDMSolverBuilder(distributed_operator, ovr_subdomain_to_global, cluster_to_ovr_subdomain, neighbors, intersections, generator, coordinates.shape()[0], coordinates.data(), epsilon, eta); // passes the first extent of `coordinates` and its raw buffer; presumably that extent is the spatial dimension, TODO confirm
+    }));
 
-    py::class_<DefaultDDMSolverBuilder> default_ddm_solver_class(m, default_ddm_solver_name.c_str());
-    default_ddm_solver_class.def(py::init<DistributedOperator<CoefficientPrecision> &, const HMatrix<CoefficientPrecision, CoordinatePrecision> &, const std::vector<int> &, const std::vector<std::vector<int>> &>(), py::keep_alive<1, 2>(), py::keep_alive<1, 4>(), py::keep_alive<1, 5>());
-    default_ddm_solver_class.def_property_readonly(
-        "solver", [](const DefaultDDMSolverBuilder &self) { return &self.solver; }, py::return_value_policy::reference_internal);
-    default_ddm_solver_class.def_property_readonly(
-        "block_diagonal_dense_matrix", [](const DefaultDDMSolverBuilder &self) {
-            py::array_t<CoefficientPrecision, py::array::f_style> mat({self.block_diagonal_dense_matrix.nb_cols(), self.block_diagonal_dense_matrix.nb_rows()}, self.block_diagonal_dense_matrix.data(), py::capsule(self.block_diagonal_dense_matrix.data()));
-            return mat;
-        },
-        py::return_value_policy::reference_internal);
+    ddm_solver_class.def_property_readonly(
+        "solver", [](const DDMSolverBuilder &self) { return &self.solver; }, py::return_value_policy::reference_internal); // returns a pointer to the builder's own `solver` member, tied to the builder's lifetime
 }
 #endif
diff --git a/tests/conftest.py b/tests/conftest.py
index f7db6e7..1ca161d 100644
--- a/tests/conftest.py
+++ b/tests/conftest.py
@@ -13,13 +13,9 @@
 from example.define_custom_low_rank_generator import CustomSVD
 
 
-class GeneratorFromMatrix(Htool.ComplexVirtualGeneratorWithPermutation):
-    def __init__(
-        self,
-        permutation,
-        matrix,
-    ):
-        super().__init__(permutation, permutation)
+class GeneratorFromMatrix(Htool.ComplexVirtualGeneratorInUserNumbering):
+    def __init__(self, matrix):
+        super().__init__()
         self.matrix = matrix
 
     def get_coef(self, i, j):
@@ -31,7 +27,7 @@ def build_submatrix(self, J, K, mat):
                 mat[j, k] = self.get_coef(J[j], K[k])
 
 
-class LocalGeneratorFromMatrix(Htool.ComplexVirtualGeneratorWithPermutation):
+class LocalGeneratorFromMatrix(Htool.ComplexVirtualGeneratorInUserNumbering):
     def __init__(
         self,
         permutation,
@@ -138,7 +134,7 @@ def cluster(geometry, symmetry):
 def generator(geometry, cluster):
     [target_points, source_points, _] = geometry
     [target_cluster, source_cluster] = cluster
-    return CustomGenerator(target_cluster, target_points, source_cluster, source_points)
+    return CustomGenerator(target_points, source_points)
 
 
 @pytest.fixture(
@@ -172,7 +168,7 @@ def local_operator(request, generator, cluster, geometry):
 )
 def low_rank_approximation(request, generator, cluster, epsilon):
     if request.param:
-        return CustomSVD()
+        return CustomSVD(generator)
     else:
         return None
 
@@ -209,26 +205,17 @@ def custom_distributed_operator(
 ):
     [target_cluster, source_cluster] = cluster
 
-    # Build distributed operator
-    target_partition_from_cluster = Htool.PartitionFromCluster(target_cluster)
-    source_partition_from_cluster = Htool.PartitionFromCluster(source_cluster)
-    distributed_operator = Htool.DistributedOperator(
-        target_partition_from_cluster,
-        source_partition_from_cluster,
-        symmetry,
-        UPLO,
-        mpi4py.MPI.COMM_WORLD,
-    )
-
-    local_hmatrix = None
-    hmatrix = None
     if local_operator is not None:
-        distributed_operator.add_local_operator(local_operator)
-    else:
-        local_target_cluster = target_cluster.get_cluster_on_partition(
-            mpi4py.MPI.COMM_WORLD.rank
+        custom_local_approximation = Htool.CustomApproximationBuilder(
+            target_cluster,
+            source_cluster,
+            symmetry,
+            UPLO,
+            mpi4py.MPI.COMM_WORLD,
+            local_operator,
         )
-
+        distributed_operator = custom_local_approximation.distributed_operator
+    else:
         hmatrix_builder = Htool.HMatrixBuilder(
             target_cluster,
             source_cluster,
@@ -238,24 +225,20 @@ def custom_distributed_operator(
             UPLO,
             -1,
             mpi4py.MPI.COMM_WORLD.rank,
+            mpi4py.MPI.COMM_WORLD.rank,
         )
         if dense_blocks_generator is not None:
             hmatrix_builder.set_dense_blocks_generator(dense_blocks_generator)
         if low_rank_approximation is not None:
             hmatrix_builder.set_low_rank_generator(low_rank_approximation)
 
-        hmatrix: Htool.HMatrix = hmatrix_builder.build(generator)
-
-        local_hmatrix = Htool.LocalHMatrix(
-            hmatrix,
-            local_target_cluster,
+        distributed_operator = Htool.DistributedOperatorFromHMatrix(
+            generator,
+            target_cluster,
             source_cluster,
-            symmetry,
-            UPLO,
-            False,
-            False,
+            hmatrix_builder,
+            mpi4py.MPI.COMM_WORLD,
         )
-        distributed_operator.add_local_operator(local_hmatrix)
 
     return distributed_operator
 
diff --git a/tests/test_cluster.py b/tests/test_cluster.py
index f2266a0..a612a67 100644
--- a/tests/test_cluster.py
+++ b/tests/test_cluster.py
@@ -20,9 +20,16 @@ def test_cluster(geometry, cluster):
         mpi4py.MPI.COMM_WORLD.Get_rank()
     )
 
+    total_size = 0
+    for p in range(0, mpi4py.MPI.COMM_WORLD.Get_size()):
+        total_size += target_cluster.get_cluster_on_partition(p).get_size()
+
+    assert total_size == len(local_target_cluster.get_permutation())
+    assert total_size == len(target_cluster.get_permutation())
+
     # Several ways to display information
     if mpi4py.MPI.COMM_WORLD.Get_rank() == 0:
-        fig, ax = plt.subplots(2, 2)
+        _, ax = plt.subplots(2, 2)
         Htool.plot(ax[0, 0], target_cluster, target_points, 1)
         Htool.plot(ax[0, 1], target_cluster, target_points, 2)
         Htool.plot(ax[1, 0], local_target_cluster, target_points, 1)
diff --git a/tests/test_ddm_solver.py b/tests/test_ddm_solver.py
index 1c128d0..cb730c4 100644
--- a/tests/test_ddm_solver.py
+++ b/tests/test_ddm_solver.py
@@ -1,3 +1,5 @@
+import copy
+
 import Htool
 import mpi4py
 import numpy as np
@@ -11,25 +13,21 @@ class CustomGeneoCoarseSpaceDenseBuilder(
 ):
     def compute_coarse_space(self, Ai, Bi):
         coarse_space = None
-
         if self.symmetry == "S" or self.symmetry == "H":
             if self.geneo_threshold > 0:
-                [_, coarse_space] = eigh(
-                    Ai, Bi, subset_by_value=[self.geneo_threshold, np.inf]
-                )
+                [w, v] = eigh(Ai, Bi, driver="gv")
             else:
-                n = Ai.shape[0]
-                [_, coarse_space] = eigh(
-                    Ai, Bi, subset_by_index=[n - self.geneo_nu, n - 1]
-                )
+                [w, v] = eigh(Ai, Bi, driver="gv")
         else:
             [w, v] = eig(Ai, Bi)
-            if self.geneo_threshold > 0:
-                nb_eig = (w > self.geneo_threshold).sum()
-                coarse_space = v[:, 0:nb_eig]
-            else:
-                coarse_space = v[:, 0 : self.geneo_nu]
 
+        idx = w.argsort()[::-1]
+
+        if self.geneo_threshold > 0:
+            nb_eig = (w > self.geneo_threshold).sum()
+            coarse_space = v[:, idx[0:nb_eig]]
+        else:
+            coarse_space = v[:, idx[0 : self.geneo_nu]]
         self.set_coarse_space(coarse_space)
 
 
@@ -39,42 +37,42 @@ def compute_coarse_space(self, Ai, Bi):
 @pytest.mark.parametrize(
     "mu,symmetry,ddm_builder,hpddm_schwarz_method,hpddm_schwarz_coarse_correction,geneo_type",
     [
-        (1, "N", "SolverBuilder", "none", "none", "none"),
-        (1, "N", "SolverBuilder", "asm", "none", "none"),
-        (1, "N", "SolverBuilder", "ras", "none", "none"),
-        (1, "N", "DDMSolverBuilderAddingOverlap", "asm", "none", "none"),
-        (1, "N", "DDMSolverBuilderAddingOverlap", "ras", "none", "none"),
-        (1, "N", "DDMSolverBuilder", "asm", "none", "none"),
-        (1, "N", "DDMSolverBuilder", "ras", "none", "none"),
-        (10, "N", "SolverBuilder", "none", "none", "none"),
-        (10, "N", "SolverBuilder", "asm", "none", "none"),
-        (10, "N", "SolverBuilder", "ras", "none", "none"),
-        (10, "N", "DDMSolverBuilderAddingOverlap", "asm", "none", "none"),
-        (10, "N", "DDMSolverBuilderAddingOverlap", "ras", "none", "none"),
-        (10, "N", "DDMSolverBuilder", "asm", "none", "none"),
-        (10, "N", "DDMSolverBuilder", "ras", "none", "none"),
-        (1, "S", "SolverBuilder", "none", "none", "none"),
-        (1, "S", "SolverBuilder", "asm", "none", "none"),
-        (1, "S", "SolverBuilder", "ras", "none", "none"),
-        (1, "S", "DDMSolverBuilderAddingOverlap", "asm", "none", "none"),
-        (1, "S", "DDMSolverBuilderAddingOverlap", "ras", "none", "none"),
-        (1, "S", "DDMSolverBuilder", "asm", "none", "none"),
-        (1, "S", "DDMSolverBuilder", "ras", "none", "none"),
-        (10, "S", "SolverBuilder", "none", "none", "none"),
-        (10, "S", "SolverBuilder", "asm", "none", "none"),
-        (10, "S", "SolverBuilder", "ras", "none", "none"),
-        (10, "S", "DDMSolverBuilderAddingOverlap", "asm", "none", "none"),
-        (10, "S", "DDMSolverBuilderAddingOverlap", "ras", "none", "none"),
-        (1, "S", "DDMSolverBuilderAddingOverlap", "asm", "additive", "geneo_nu"),
-        (1, "S", "DDMSolverBuilderAddingOverlap", "ras", "additive", "geneo_nu"),
-        (10, "S", "DDMSolverBuilderAddingOverlap", "asm", "additive", "geneo_nu"),
-        (10, "S", "DDMSolverBuilderAddingOverlap", "ras", "additive", "geneo_nu"),
-        (1, "S", "DDMSolverBuilderAddingOverlap", "asm", "additive", "geneo_threshold"),
-        (1, "S", "DDMSolverBuilderAddingOverlap", "ras", "additive", "geneo_threshold"),
+        (1, "N", "BlockJacobi", "none", "none", "none"),
+        (1, "N", "BlockJacobi", "asm", "none", "none"),
+        (1, "N", "BlockJacobi", "ras", "none", "none"),
+        (1, "N", "DDMWithHMatrixPlusOverlap", "asm", "none", "none"),
+        (1, "N", "DDMWithHMatrixPlusOverlap", "ras", "none", "none"),
+        (1, "N", "DDMWithHMatrix", "asm", "none", "none"),
+        (1, "N", "DDMWithHMatrix", "ras", "none", "none"),
+        (10, "N", "BlockJacobi", "none", "none", "none"),
+        (10, "N", "BlockJacobi", "asm", "none", "none"),
+        (10, "N", "BlockJacobi", "ras", "none", "none"),
+        (10, "N", "DDMWithHMatrixPlusOverlap", "asm", "none", "none"),
+        (10, "N", "DDMWithHMatrixPlusOverlap", "ras", "none", "none"),
+        (10, "N", "DDMWithHMatrix", "asm", "none", "none"),
+        (10, "N", "DDMWithHMatrix", "ras", "none", "none"),
+        (1, "S", "BlockJacobi", "none", "none", "none"),
+        (1, "S", "BlockJacobi", "asm", "none", "none"),
+        (1, "S", "BlockJacobi", "ras", "none", "none"),
+        (1, "S", "DDMWithHMatrixPlusOverlap", "asm", "none", "none"),
+        (1, "S", "DDMWithHMatrixPlusOverlap", "ras", "none", "none"),
+        (1, "S", "DDMWithHMatrix", "asm", "none", "none"),
+        (1, "S", "DDMWithHMatrix", "ras", "none", "none"),
+        (10, "S", "BlockJacobi", "none", "none", "none"),
+        (10, "S", "BlockJacobi", "asm", "none", "none"),
+        (10, "S", "BlockJacobi", "ras", "none", "none"),
+        (10, "S", "DDMWithHMatrixPlusOverlap", "asm", "none", "none"),
+        (10, "S", "DDMWithHMatrixPlusOverlap", "ras", "none", "none"),
+        (1, "S", "DDMWithHMatrixPlusOverlap", "asm", "additive", "geneo_nu"),
+        (1, "S", "DDMWithHMatrixPlusOverlap", "ras", "additive", "geneo_nu"),
+        (10, "S", "DDMWithHMatrixPlusOverlap", "asm", "additive", "geneo_nu"),
+        (10, "S", "DDMWithHMatrixPlusOverlap", "ras", "additive", "geneo_nu"),
+        (1, "S", "DDMWithHMatrixPlusOverlap", "asm", "additive", "geneo_threshold"),
+        (1, "S", "DDMWithHMatrixPlusOverlap", "ras", "additive", "geneo_threshold"),
         (
             10,
             "S",
-            "DDMSolverBuilderAddingOverlap",
+            "DDMWithHMatrixPlusOverlap",
             "asm",
             "additive",
             "geneo_threshold",
@@ -82,17 +80,17 @@ def compute_coarse_space(self, Ai, Bi):
         (
             10,
             "S",
-            "DDMSolverBuilderAddingOverlap",
+            "DDMWithHMatrixPlusOverlap",
             "ras",
             "additive",
             "geneo_threshold",
         ),
-        (1, "S", "DDMSolverBuilderAddingOverlap", "asm", "additive", "custom_geneo_nu"),
-        (1, "S", "DDMSolverBuilderAddingOverlap", "ras", "additive", "custom_geneo_nu"),
+        (1, "S", "DDMWithHMatrixPlusOverlap", "asm", "additive", "custom_geneo_nu"),
+        (1, "S", "DDMWithHMatrixPlusOverlap", "ras", "additive", "custom_geneo_nu"),
         (
             10,
             "S",
-            "DDMSolverBuilderAddingOverlap",
+            "DDMWithHMatrixPlusOverlap",
             "asm",
             "additive",
             "custom_geneo_nu",
@@ -100,7 +98,7 @@ def compute_coarse_space(self, Ai, Bi):
         (
             10,
             "S",
-            "DDMSolverBuilderAddingOverlap",
+            "DDMWithHMatrixPlusOverlap",
             "ras",
             "additive",
             "custom_geneo_nu",
@@ -108,7 +106,7 @@ def compute_coarse_space(self, Ai, Bi):
         (
             1,
             "S",
-            "DDMSolverBuilderAddingOverlap",
+            "DDMWithHMatrixPlusOverlap",
             "asm",
             "additive",
             "custom_geneo_threshold",
@@ -116,7 +114,7 @@ def compute_coarse_space(self, Ai, Bi):
         (
             1,
             "S",
-            "DDMSolverBuilderAddingOverlap",
+            "DDMWithHMatrixPlusOverlap",
             "ras",
             "additive",
             "custom_geneo_threshold",
@@ -124,7 +122,7 @@ def compute_coarse_space(self, Ai, Bi):
         (
             10,
             "S",
-            "DDMSolverBuilderAddingOverlap",
+            "DDMWithHMatrixPlusOverlap",
             "asm",
             "additive",
             "custom_geneo_threshold",
@@ -132,29 +130,29 @@ def compute_coarse_space(self, Ai, Bi):
         (
             10,
             "S",
-            "DDMSolverBuilderAddingOverlap",
+            "DDMWithHMatrixPlusOverlap",
             "ras",
             "additive",
             "custom_geneo_threshold",
         ),
-        (10, "S", "DDMSolverBuilder", "asm", "none", "none"),
-        (10, "S", "DDMSolverBuilder", "ras", "none", "none"),
-        (1, "S", "DDMSolverBuilder", "asm", "additive", "geneo_nu"),
-        (1, "S", "DDMSolverBuilder", "ras", "additive", "geneo_nu"),
-        (10, "S", "DDMSolverBuilder", "asm", "additive", "geneo_nu"),
-        (10, "S", "DDMSolverBuilder", "ras", "additive", "geneo_nu"),
-        (1, "S", "DDMSolverBuilder", "asm", "additive", "geneo_threshold"),
-        (1, "S", "DDMSolverBuilder", "ras", "additive", "geneo_threshold"),
-        (10, "S", "DDMSolverBuilder", "asm", "additive", "geneo_threshold"),
-        (10, "S", "DDMSolverBuilder", "ras", "additive", "geneo_threshold"),
-        (1, "S", "DDMSolverBuilder", "asm", "additive", "custom_geneo_nu"),
-        (1, "S", "DDMSolverBuilder", "ras", "additive", "custom_geneo_nu"),
-        (10, "S", "DDMSolverBuilder", "asm", "additive", "custom_geneo_nu"),
-        (10, "S", "DDMSolverBuilder", "ras", "additive", "custom_geneo_nu"),
-        (1, "S", "DDMSolverBuilder", "asm", "additive", "custom_geneo_threshold"),
-        (1, "S", "DDMSolverBuilder", "ras", "additive", "custom_geneo_threshold"),
-        (10, "S", "DDMSolverBuilder", "asm", "additive", "custom_geneo_threshold"),
-        (10, "S", "DDMSolverBuilder", "ras", "additive", "custom_geneo_threshold"),
+        (10, "S", "DDMWithHMatrix", "asm", "none", "none"),
+        (10, "S", "DDMWithHMatrix", "ras", "none", "none"),
+        (1, "S", "DDMWithHMatrix", "asm", "additive", "geneo_nu"),
+        (1, "S", "DDMWithHMatrix", "ras", "additive", "geneo_nu"),
+        (10, "S", "DDMWithHMatrix", "asm", "additive", "geneo_nu"),
+        (10, "S", "DDMWithHMatrix", "ras", "additive", "geneo_nu"),
+        (1, "S", "DDMWithHMatrix", "asm", "additive", "geneo_threshold"),
+        (1, "S", "DDMWithHMatrix", "ras", "additive", "geneo_threshold"),
+        (10, "S", "DDMWithHMatrix", "asm", "additive", "geneo_threshold"),
+        (10, "S", "DDMWithHMatrix", "ras", "additive", "geneo_threshold"),
+        (1, "S", "DDMWithHMatrix", "asm", "additive", "custom_geneo_nu"),
+        (1, "S", "DDMWithHMatrix", "ras", "additive", "custom_geneo_nu"),
+        (10, "S", "DDMWithHMatrix", "asm", "additive", "custom_geneo_nu"),
+        (10, "S", "DDMWithHMatrix", "ras", "additive", "custom_geneo_nu"),
+        (1, "S", "DDMWithHMatrix", "asm", "additive", "custom_geneo_threshold"),
+        (1, "S", "DDMWithHMatrix", "ras", "additive", "custom_geneo_threshold"),
+        (10, "S", "DDMWithHMatrix", "asm", "additive", "custom_geneo_threshold"),
+        (10, "S", "DDMWithHMatrix", "ras", "additive", "custom_geneo_threshold"),
     ],
     # indirect=["setup_solver_dependencies"],
 )
@@ -194,7 +192,7 @@ def test_ddm_solver(
         local_neumann_matrix,
     ] = load_data_solver
 
-    generator = GeneratorFromMatrix(cluster.get_permutation(), A)
+    generator = GeneratorFromMatrix(A)
     default_approximation = Htool.ComplexDefaultApproximationBuilder(
         generator,
         cluster,
@@ -208,16 +206,22 @@ def test_ddm_solver(
 
     solver = None
     default_solver_builder = None
-    if ddm_builder == "SolverBuilder":
-        default_solver_builder = Htool.ComplexDefaultSolverBuilder(
+    if ddm_builder == "BlockJacobi":
+        block_diagonal_hmatrix = copy.deepcopy(
+            default_approximation.block_diagonal_hmatrix
+        )
+        default_solver_builder = Htool.ComplexDDMSolverBuilder(
             default_approximation.distributed_operator,
-            default_approximation.block_diagonal_hmatrix,
+            block_diagonal_hmatrix,
         )
 
-    elif ddm_builder == "DDMSolverBuilderAddingOverlap":
-        default_solver_builder = Htool.ComplexDefaultDDMSolverBuilderAddingOverlap(
+    elif ddm_builder == "DDMWithHMatrixPlusOverlap":
+        block_diagonal_hmatrix = copy.deepcopy(
+            default_approximation.block_diagonal_hmatrix
+        )
+        default_solver_builder = Htool.ComplexDDMSolverBuilder(
             default_approximation.distributed_operator,
-            default_approximation.block_diagonal_hmatrix,
+            block_diagonal_hmatrix,
             generator,
             ovr_subdomain_to_global,
             cluster_to_ovr_subdomain,
@@ -225,45 +229,23 @@ def test_ddm_solver(
             intersections,
         )
 
-    elif ddm_builder == "DDMSolverBuilder":
-        local_numbering_builder = Htool.LocalNumberingBuilder(
+    elif ddm_builder == "DDMWithHMatrix":
+        default_solver_builder = Htool.ComplexDDMSolverBuilder(
+            default_approximation.distributed_operator,
             ovr_subdomain_to_global,
             cluster_to_ovr_subdomain,
+            neighbors,
             intersections,
-        )
-        intersections = local_numbering_builder.intersections
-        local_to_global_numbering = local_numbering_builder.local_to_global_numbering
-        local_geometry = geometry[:, local_to_global_numbering]
-
-        local_cluster_builder = Htool.ClusterBuilder()
-
-        local_cluster: Htool.Cluster = local_cluster_builder.create_cluster_tree(
-            local_geometry, 2, 2
-        )
-
-        local_hmatrix_builder = Htool.ComplexHMatrixBuilder(
-            local_cluster,
-            local_cluster,
+            generator,
+            geometry,
             epsilon,
             eta,
-            symmetry,
-            UPLO,
-            -1,
-            -1,
-        )
-        local_generator = LocalGeneratorFromMatrix(
-            local_cluster.get_permutation(), local_to_global_numbering, A
-        )
-        local_hmatrix = local_hmatrix_builder.build(local_generator)
-        default_solver_builder = Htool.ComplexDefaultDDMSolverBuilder(
-            default_approximation.distributed_operator,
-            local_hmatrix,
-            neighbors,
-            intersections,
         )
 
     solver = default_solver_builder.solver
     distributed_operator = default_approximation.distributed_operator
+    local_size_wo_overlap = len(cluster_to_ovr_subdomain)
+    local_size_with_overlap = len(ovr_subdomain_to_global)
 
     # Solver
     x = np.zeros(len(f), dtype="complex128", order="F")
@@ -287,15 +269,12 @@ def test_ddm_solver(
     solver.set_hpddm_args(hpddm_args)
 
     if hpddm_schwarz_coarse_correction != "none" and mpi4py.MPI.COMM_WORLD.size > 1:
-        solver.set_hpddm_args(
-            "-hpddm_schwarz_coarse_correction " + hpddm_schwarz_coarse_correction
-        )
-
         geneo_space_operator_builder = None
         if geneo_type == "geneo_nu":
             geneo_space_operator_builder = Htool.ComplexGeneoCoarseSpaceDenseBuilder(
-                cluster.get_cluster_on_partition(mpi4py.MPI.COMM_WORLD.rank).get_size(),
-                default_solver_builder.block_diagonal_dense_matrix,
+                local_size_wo_overlap,
+                local_size_with_overlap,
+                default_approximation.block_diagonal_hmatrix,
                 local_neumann_matrix,
                 symmetry,
                 UPLO,
@@ -303,8 +282,9 @@ def test_ddm_solver(
             )
         elif geneo_type == "geneo_threshold":
             geneo_space_operator_builder = Htool.ComplexGeneoCoarseSpaceDenseBuilder(
-                cluster.get_cluster_on_partition(mpi4py.MPI.COMM_WORLD.rank).get_size(),
-                default_solver_builder.block_diagonal_dense_matrix,
+                local_size_wo_overlap,
+                local_size_with_overlap,
+                default_approximation.block_diagonal_hmatrix,
                 local_neumann_matrix,
                 symmetry,
                 UPLO,
@@ -312,17 +292,19 @@ def test_ddm_solver(
             )
         elif geneo_type == "custom_geneo_nu":
             geneo_space_operator_builder = CustomGeneoCoarseSpaceDenseBuilder(
-                cluster.get_cluster_on_partition(mpi4py.MPI.COMM_WORLD.rank).get_size(),
-                default_solver_builder.block_diagonal_dense_matrix,
+                local_size_wo_overlap,
+                local_size_with_overlap,
+                default_approximation.block_diagonal_hmatrix.to_dense(),
                 local_neumann_matrix,
                 symmetry,
                 UPLO,
                 geneo_nu=2,
             )
         elif geneo_type == "custom_geneo_threshold":
-            geneo_space_operator_builder = Htool.ComplexGeneoCoarseSpaceDenseBuilder(
-                cluster.get_cluster_on_partition(mpi4py.MPI.COMM_WORLD.rank).get_size(),
-                default_solver_builder.block_diagonal_dense_matrix,
+            geneo_space_operator_builder = CustomGeneoCoarseSpaceDenseBuilder(
+                local_size_wo_overlap,
+                local_size_with_overlap,
+                default_approximation.block_diagonal_hmatrix.to_dense(),
                 local_neumann_matrix,
                 symmetry,
                 UPLO,
@@ -335,6 +317,10 @@ def test_ddm_solver(
             geneo_space_operator_builder, geneo_coarse_operator_builder
         )
 
+        solver.set_hpddm_args(
+            "-hpddm_schwarz_coarse_correction " + hpddm_schwarz_coarse_correction
+        )
+
     if hpddm_schwarz_method == "asm" or hpddm_schwarz_method == "ras":
         solver.facto_one_level()