diff --git a/src/solvers/amgcl/LICENSE.md b/src/solvers/amgcl/LICENSE.md
deleted file mode 100644
index 7b70f24..0000000
--- a/src/solvers/amgcl/LICENSE.md
+++ /dev/null
@@ -1,22 +0,0 @@
-The MIT License
-===============
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
diff --git a/src/solvers/amgcl/README.md b/src/solvers/amgcl/README.md
deleted file mode 100644
index 7a9f272..0000000
--- a/src/solvers/amgcl/README.md
+++ /dev/null
@@ -1,49 +0,0 @@
-# AMGCL
-
-[![Documentation Status](https://readthedocs.org/projects/amgcl/badge/?version=latest)](http://amgcl.readthedocs.io/en/latest/?badge=latest)
-[![DOI](https://zenodo.org/badge/6987353.svg)](https://zenodo.org/badge/latestdoi/6987353)
-[![Build Status](https://travis-ci.org/ddemidov/amgcl.svg?branch=master)](https://travis-ci.org/ddemidov/amgcl)
-[![Build status](https://ci.appveyor.com/api/projects/status/r0s4lbln4qf9r8aq/branch/master?svg=true)](https://ci.appveyor.com/project/ddemidov/amgcl/branch/master)
-[![codecov](https://codecov.io/gh/ddemidov/amgcl/branch/master/graph/badge.svg)](https://codecov.io/gh/ddemidov/amgcl)
-[![Coverity Scan Build Status](https://scan.coverity.com/projects/5301/badge.svg)](https://scan.coverity.com/projects/5301)
-
-AMGCL is a header-only C++ library for solving large sparse linear systems with
-algebraic multigrid (AMG) method. AMG is one of the most effective iterative
-methods for solution of equation systems arising, for example, from
-discretizing PDEs on unstructured grids. The method can be used as a black-box
-solver for various computational problems, since it does not require any
-information about the underlying geometry. AMG is often used not as a
-standalone solver but as a preconditioner within an iterative solver (e.g.
-Conjugate Gradients, BiCGStab, or GMRES).
-
-AMGCL builds the AMG hierarchy on a CPU and then transfers it to one of the
-provided backends. This allows for transparent acceleration of the solution
-phase with help of OpenCL, CUDA, or OpenMP technologies. Users may provide
-their own backends which enables tight integration between AMGCL and the user
-code.
-
-See AMGCL documentation at http://amgcl.readthedocs.io/
-
-## Referencing
-
-Demidov, Denis. AMGCL: An efficient, flexible, and extensible algebraic multigrid
-implementation. Lobachevskii Journal of Mathematics, 40(5):535–546, May 2019.
-[doi](https://doi.org/10.1134/S1995080219050056) [pdf](https://rdcu.be/bHFsY)
-[bib](https://raw.githubusercontent.com/ddemidov/amgcl/master/docs/demidov19.bib)
-
-Demidov, Denis. AMGCL -- A C++ library for efficient solution of large sparse linear
-systems.  Software Impacts, 6:100037, November 2020.
-[doi](https://doi.org/10.1016/j.simpa.2020.100037)
-[bib](https://raw.githubusercontent.com/ddemidov/amgcl/master/docs/demidov20.bib)
-
-Demidov, Denis, Lin Mu, and Bin Wang. Accelerating linear solvers for Stokes
-problems with C++ metaprogramming. Journal of Computational Science (2020):
-101285.
-[doi](https://doi.org/10.1016/j.jocs.2020.101285)
-[arxiv](https://arxiv.org/pdf/2006.06052.pdf)
-[bib](https://raw.githubusercontent.com/ddemidov/amgcl/master/docs/demidov-mu-wang-20.bib)
-
-## Support
-
-* GitHub issues page: https://github.com/ddemidov/amgcl/issues
-* Mailing list: https://groups.google.com/forum/#!forum/amgcl
diff --git a/src/solvers/amgcl/adapter/block_matrix.hpp b/src/solvers/amgcl/adapter/block_matrix.hpp
deleted file mode 100644
index ea7eedd..0000000
--- a/src/solvers/amgcl/adapter/block_matrix.hpp
+++ /dev/null
@@ -1,249 +0,0 @@
-#ifndef AMGCL_ADAPTER_BLOCK_MATRIX_HPP
-#define AMGCL_ADAPTER_BLOCK_MATRIX_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
-\file    amgcl/adapter/block_matrix.hpp
-\author  Denis Demidov <dennis.demidov@gmail.com>
-\brief   On-the-fly conversion to block valued matrix.
-\ingroup adapters
-*/
-
-#include <amgcl/util.hpp>
-#include <amgcl/backend/detail/matrix_ops.hpp>
-#include <amgcl/backend/builtin.hpp>
-#include <amgcl/value_type/interface.hpp>
-
-namespace amgcl {
-namespace adapter {
-
-template <class Matrix, class BlockType>
-struct block_matrix_adapter {
-    typedef BlockType value_type;
-    static const int BlockSize = math::static_rows<BlockType>::value;
-
-    const Matrix &A;
-
-    block_matrix_adapter(const Matrix &A) : A(A) {
-        precondition(
-                backend::rows(A) % BlockSize == 0 &&
-                backend::cols(A) % BlockSize == 0,
-                "Matrix size is not divisible by block size!"
-                );
-    }
-
-    size_t rows() const {
-        return backend::rows(A) / BlockSize;
-    }
-
-    size_t cols() const {
-        return backend::cols(A) / BlockSize;
-    }
-
-    size_t nonzeros() const {
-        // Just an estimate:
-        return backend::nonzeros(A) / (BlockSize * BlockSize);
-    }
-
-    struct row_iterator {
-        typedef typename backend::row_iterator<Matrix>::type Base;
-        typedef ptrdiff_t col_type;
-        typedef BlockType val_type;
-
-        std::array<char, sizeof(Base) * BlockSize> buf;
-        Base * base;
-
-        bool done;
-        col_type cur_col;
-        val_type cur_val;
-
-        row_iterator(const Matrix &A, col_type row)
-            : base(reinterpret_cast<Base*>(buf.data())), done(true)
-        {
-            for(int i = 0; i < BlockSize; ++i) {
-                new (base + i) Base(backend::row_begin(A, row * BlockSize + i));
-
-                if (base[i]) {
-                    col_type col = base[i].col() / BlockSize;
-                    if (done) {
-                        cur_col = col;
-                        done = false;
-                    } else {
-                        cur_col = std::min<col_type>(cur_col, col);
-                    }
-                }
-            }
-
-            if (done) return;
-
-            // While we are gathering the current value,
-            // base iteratirs are advanced to the next block-column.
-            cur_val = math::zero<val_type>();
-            col_type end = (cur_col + 1) * BlockSize;
-            for(int i = 0; i < BlockSize; ++i) {
-                for(; base[i] && static_cast<ptrdiff_t>(base[i].col()) < end; ++base[i]) {
-                    cur_val(i, base[i].col() % BlockSize) = base[i].value();
-                }
-            }
-        }
-
-        ~row_iterator() {
-            for(int i = 0; i < BlockSize; ++i) base[i].~Base();
-        }
-
-        operator bool() const {
-            return !done;
-        }
-
-        row_iterator& operator++() {
-            // Base iterators are already at the next block-column.
-            // We just need to gather the current column and value.
-            done = true;
-
-            col_type end = (cur_col + 1) * BlockSize;
-            for(int i = 0; i < BlockSize; ++i) {
-                if (base[i]) {
-                    col_type col = base[i].col() / BlockSize;
-                    if (done) {
-                        cur_col = col;
-                        done = false;
-                    } else {
-                        cur_col = std::min<col_type>(cur_col, col);
-                    }
-                }
-            }
-
-            if (done) return *this;
-
-            cur_val = math::zero<val_type>();
-            end = (cur_col + 1) * BlockSize;
-            for(int i = 0; i < BlockSize; ++i) {
-                for(; base[i] && static_cast<ptrdiff_t>(base[i].col()) < end; ++base[i]) {
-                    cur_val(i, base[i].col() % BlockSize) = base[i].value();
-                }
-            }
-
-            return *this;
-        }
-
-        col_type col() const {
-            return cur_col;
-        }
-
-        val_type value() const {
-            return cur_val;
-        }
-    };
-
-    row_iterator row_begin(size_t i) const {
-        return row_iterator(A, i);
-    }
-};
-
-/// Convert scalar-valued matrix to a block-valued one.
-template <class BlockType, class Matrix>
-block_matrix_adapter<Matrix, BlockType> block_matrix(const Matrix &A) {
-    return block_matrix_adapter<Matrix, BlockType>(A);
-}
-
-template <class Matrix>
-std::shared_ptr<
-    backend::crs<
-        typename math::element_of<
-            typename backend::value_type<Matrix>::type
-            >::type,
-        typename backend::col_type<Matrix>::type,
-        typename backend::ptr_type<Matrix>::type
-        >
-    >
-unblock_matrix(const Matrix &B) {
-    typedef typename backend::value_type<Matrix>::type Block;
-    typedef typename math::element_of<Block>::type Scalar;
-    typedef typename backend::col_type<Matrix>::type Col;
-    typedef typename backend::ptr_type<Matrix>::type Ptr;
-
-    const int brows = math::static_rows<Block>::value;
-    const int bcols = math::static_cols<Block>::value;
-
-    static_assert(brows > 1 || bcols > 1, "Can not unblock scalar matrix!");
-
-    auto A = std::make_shared<backend::crs<Scalar, Col, Ptr>>();
-
-    A->set_size(backend::rows(B) * brows, backend::cols(B) * bcols);
-    A->ptr[0] = 0;
-
-    const ptrdiff_t nb = backend::rows(B);
-
-#pragma omp for
-    for (ptrdiff_t ib = 0; ib < nb; ++ib) {
-        auto w = backend::row_nonzeros(B, ib);
-        for (ptrdiff_t i = 0, ia = ib * brows; i < brows; ++i, ++ia) {
-            A->ptr[ia + 1] = w * bcols;
-        }
-    }
-
-    A->scan_row_sizes();
-    A->set_nonzeros();
-
-#pragma omp for
-    for (ptrdiff_t ib = 0; ib < nb; ++ib) {
-        for(auto b = backend::row_begin(B, ib); b; ++b) {
-            auto c = b.col();
-            auto v = b.value();
-
-            for (ptrdiff_t i = 0, ia = ib * brows; i < brows; ++i, ++ia) {
-                auto row_head = A->ptr[ia];
-                for(int j = 0; j < bcols; ++j) {
-                    A->col[row_head] = c * bcols + j;
-                    A->val[row_head] = v(i,j);
-                    ++row_head;
-                }
-                A->ptr[ia] = row_head;
-            }
-        }
-    }
-
-    std::rotate(A->ptr, A->ptr + A->nrows, A->ptr + A->nrows + 1);
-    A->ptr[0] = 0;
-
-    return A;
-}
-
-} // namespace adapter
-
-namespace backend {
-namespace detail {
-
-template <class Matrix, class BlockType>
-struct use_builtin_matrix_ops< adapter::block_matrix_adapter<Matrix, BlockType> >
-    : std::true_type
-{};
-
-} // namespace detail
-} // namespace backend
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/adapter/complex.hpp b/src/solvers/amgcl/adapter/complex.hpp
deleted file mode 100644
index dbbacfa..0000000
--- a/src/solvers/amgcl/adapter/complex.hpp
+++ /dev/null
@@ -1,176 +0,0 @@
-#ifndef AMGCL_ADAPTER_COMPLEX_HPP
-#define AMGCL_ADAPTER_COMPLEX_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
-\file    amgcl/adapter/complex.hpp
-\author  Denis Demidov <dennis.demidov@gmail.com>
-\brief   Complex-valued matrix adapter.
-\ingroup adapters
-*/
-
-#include <type_traits>
-#include <boost/range/iterator_range.hpp>
-
-#include <amgcl/backend/interface.hpp>
-#include <amgcl/backend/detail/matrix_ops.hpp>
-
-namespace amgcl {
-namespace adapter {
-
-template <class Matrix>
-struct complex_adapter {
-    static_assert(is_complex<typename backend::value_type<Matrix>::type>::value,
-            "value type should be complex");
-
-    typedef typename backend::value_type<Matrix>::type::value_type value_type;
-
-    const Matrix &A;
-
-    complex_adapter(const Matrix &A) : A(A) {}
-
-    size_t rows() const {
-        return 2 * backend::rows(A);
-    }
-
-    size_t cols() const {
-        return 2 * backend::cols(A);
-    }
-
-    size_t nonzeros() const {
-        return 4 * backend::nonzeros(A);
-    }
-
-    struct row_iterator {
-        typedef typename backend::row_iterator<Matrix>::type Base;
-        typedef typename Base::col_type col_type;
-
-        row_iterator(const Base &base, bool row_real)
-            : base(base), row_real(row_real), col_real(true) {}
-
-        operator bool() const {
-            return static_cast<bool>(base);
-        }
-
-        row_iterator& operator++() {
-            col_real = !col_real;
-            if (col_real) ++base;
-
-            return *this;
-        }
-
-        col_type col() const {
-            if (col_real)
-                return base.col() * 2;
-            else
-                return base.col() * 2 + 1;
-        }
-
-        value_type value() const {
-            if (row_real) {
-                if (col_real)
-                    return std::real(base.value());
-                else
-                    return -std::imag(base.value());
-            } else {
-                if (col_real)
-                    return std::imag(base.value());
-                else
-                    return std::real(base.value());
-            }
-        }
-
-        private:
-            Base base;
-            bool row_real;
-            bool col_real;
-
-    };
-
-    row_iterator row_begin(size_t i) const {
-        return row_iterator(backend::row_begin(A, i / 2), i % 2 == 0);
-    }
-};
-
-template <class Matrix>
-complex_adapter<Matrix> complex_matrix(const Matrix &A) {
-    return complex_adapter<Matrix>(A);
-}
-
-template <class Range>
-boost::iterator_range<
-    typename std::add_pointer<
-        typename std::conditional<
-            std::is_const<Range>::value,
-            typename std::add_const<
-                typename boost::range_value<
-                    typename std::decay<Range>::type
-                    >::type::value_type
-                >::type,
-            typename boost::range_value<
-                typename std::decay<Range>::type
-                >::type::value_type
-            >::type
-        >::type
-    >
-complex_range(Range &rng) {
-    typedef
-        typename std::add_pointer<
-            typename std::conditional<
-                std::is_const<Range>::value,
-                typename std::add_const<
-                    typename boost::range_value<
-                        typename std::decay<Range>::type
-                        >::type::value_type
-                    >::type,
-                typename boost::range_value<
-                    typename std::decay<Range>::type
-                    >::type::value_type
-                >::type
-            >::type
-        pointer_type;
-
-    pointer_type b = reinterpret_cast<pointer_type>(&rng[0]);
-    pointer_type e = b + 2 * boost::size(rng);
-
-    return boost::iterator_range<pointer_type>(b, e);
-}
-
-} // namespace adapter
-
-namespace backend {
-namespace detail {
-
-template <class Matrix>
-struct use_builtin_matrix_ops< amgcl::adapter::complex_adapter<Matrix> >
-    : std::true_type
-{};
-
-} // namespace detail
-} // namespace backend
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/adapter/crs_builder.hpp b/src/solvers/amgcl/adapter/crs_builder.hpp
deleted file mode 100644
index 0065aad..0000000
--- a/src/solvers/amgcl/adapter/crs_builder.hpp
+++ /dev/null
@@ -1,178 +0,0 @@
-#ifndef AMGCL_ADAPTER_CRS_BUILDER_HPP
-#define AMGCL_ADAPTER_CRS_BUILDER_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
-\file    amgcl/adapter/crs_builder.hpp
-\author  Denis Demidov <dennis.demidov@gmail.com>
-\brief   Matrix builder that creates matrix rows as needed.
-\ingroup adapters
-
-Example:
-\code
-struct poisson_2d {
-    typedef double val_type;
-    typedef long   col_type;
-
-    poisson_2d(size_t n) : n(n), h2i((n - 1) * (n - 1)) {}
-
-    // Number of rows in the constructed matrix:
-    size_t rows() const { return n * n; }
-
-    // Estimated number of nonzeros in the problem:
-    size_t nonzeros() const { return 5 * rows(); }
-
-    // Fills column numbers and values of nonzero elements in the given matrix row.
-    void operator()(size_t row,
-            std::vector<col_type> &col,
-            std::vector<val_type> &val
-            ) const
-    {
-        size_t i = row % n;
-        size_t j = row / n;
-
-        if (j > 0) {
-            col.push_back(row - n);
-            val.push_back(-h2i);
-        }
-
-        if (i > 0) {
-            col.push_back(row - 1);
-            val.push_back(-h2i);
-        }
-
-        col.push_back(row);
-        val.push_back(4 * h2i);
-
-        if (i + 1 < n) {
-            col.push_back(row + 1);
-            val.push_back(-h2i);
-        }
-
-        if (j + 1 < n) {
-            col.push_back(row + n);
-            val.push_back(-h2i);
-        }
-    }
-
-    private:
-        size_t n;
-        double h2i;
-};
-
-amgcl::make_solver<
-    Backend, Coarsening, Relaxation, IterativeSolver
-    > solve( amgcl::backend::make_matrix( poisson_2d(m) ) );
-\endcode
-*/
-
-#include <amgcl/backend/interface.hpp>
-#include <amgcl/backend/detail/matrix_ops.hpp>
-
-namespace amgcl {
-
-/// Matrix adapters.
-namespace adapter {
-
-/// Generates matrix rows as needed with help of user-provided functor.
-/**
- * The generated rows are not stored anywhere.
- */
-template <class RowBuilder>
-struct matrix_builder {
-    typedef typename RowBuilder::val_type value_type;
-    typedef typename RowBuilder::col_type col_type;
-
-    RowBuilder build_row;
-
-    matrix_builder(const RowBuilder &row_builder) : build_row(row_builder) {}
-
-    size_t rows()     const { return build_row.rows(); }
-    size_t cols()     const { return build_row.rows(); }
-    size_t nonzeros() const { return build_row.nonzeros(); }
-
-    struct row_iterator {
-        typedef typename RowBuilder::col_type col_type;
-        typedef typename RowBuilder::val_type val_type;
-
-        typedef typename std::vector<col_type>::const_iterator col_iterator;
-        typedef typename std::vector<val_type>::const_iterator val_iterator;
-
-        row_iterator(const RowBuilder &build_row, size_t i) : ptr(0)
-        {
-            build_row(i, m_col, m_val);
-        }
-
-        operator bool() const {
-            return m_col.size() - ptr;
-        }
-
-        row_iterator& operator++() {
-            ++ptr;
-            return *this;
-        }
-
-        col_type col() const {
-            return m_col[ptr];
-        }
-
-        val_type value() const {
-            return m_val[ptr];
-        }
-
-        private:
-            int ptr;
-            std::vector<col_type>   m_col;
-            std::vector<value_type> m_val;
-    };
-
-    row_iterator row_begin(size_t i) const {
-        return row_iterator(build_row, i);
-    }
-
-};
-
-/// Convenience function returning an instance of matrix_builder<RowBuilder>
-template <class RowBuilder>
-matrix_builder<RowBuilder> make_matrix(const RowBuilder &row_builder) {
-    return matrix_builder<RowBuilder>(row_builder);
-}
-
-} // namespace adapter
-
-namespace backend {
-namespace detail {
-
-template <class RowBuilder>
-struct use_builtin_matrix_ops< amgcl::adapter::matrix_builder<RowBuilder> >
-    : std::true_type
-{};
-
-} // namespace detail
-} // namespace backend
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/adapter/crs_tuple.hpp b/src/solvers/amgcl/adapter/crs_tuple.hpp
deleted file mode 100644
index db623ca..0000000
--- a/src/solvers/amgcl/adapter/crs_tuple.hpp
+++ /dev/null
@@ -1,218 +0,0 @@
-#ifndef AMGCL_ADAPTER_CRS_TUPLE_HPP
-#define AMGCL_ADAPTER_CRS_TUPLE_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
-\file    amgcl/adapter/crs_tuple.hpp
-\author  Denis Demidov <dennis.demidov@gmail.com>
-\brief   Specify sparse matrix as a tuple of CRS arrays.
-\ingroup adapters
-
-Example:
-\code
-// Adapt STL containers:
-std::vector<int>    ptr;
-std::vector<int>    col;
-std::vector<double> val;
-
-AMG amg( std::tie(n, ptr, col, val) );
-
-// Adapt raw arrays:
-int    *ptr;
-int    *col;
-double *val;
-
-AMG amg(std::make_tuple(n,
-                          amgcl::make_iterator_range(ptr, ptr + n + 1),
-                          amgcl::make_iterator_range(col, col + ptr[n]),
-                          amgcl::make_iterator_range(val, val + ptr[n])
-                          ) );
-\endcode
-*/
-
-/**
- * \defgroup adapters Matrix adapters
- * \brief Adapters for variuos sparse matrix formats.
- */
-
-#include <vector>
-#include <numeric>
-#include <tuple>
-#include <type_traits>
-
-#include <amgcl/util.hpp>
-#include <amgcl/backend/interface.hpp>
-#include <amgcl/backend/detail/matrix_ops.hpp>
-
-namespace amgcl {
-namespace backend {
-
-//---------------------------------------------------------------------------
-// Specialization of matrix interface
-//---------------------------------------------------------------------------
-template < typename N, typename PRng, typename CRng, typename VRng >
-struct value_type< std::tuple<N, PRng, CRng, VRng> >
-{
-    typedef typename std::decay<decltype(std::declval<VRng>()[0])>::type type;
-};
-
-template < typename N, typename PRng, typename CRng, typename VRng >
-struct rows_impl< std::tuple<N, PRng, CRng, VRng> >
-{
-    static size_t get(const std::tuple<N, PRng, CRng, VRng> &A) {
-        return std::get<0>(A);
-    }
-};
-
-template < typename N, typename PRng, typename CRng, typename VRng >
-struct cols_impl< std::tuple<N, PRng, CRng, VRng> >
-{
-    static size_t get(const std::tuple<N, PRng, CRng, VRng> &A) {
-        return std::get<0>(A);
-    }
-};
-
-template < typename N, typename PRng, typename CRng, typename VRng >
-struct nonzeros_impl< std::tuple<N, PRng, CRng, VRng> >
-{
-    static size_t get(const std::tuple<N, PRng, CRng, VRng> &A) {
-        return std::get<1>(A)[std::get<0>(A)];
-    }
-};
-
-template < typename N, typename PRng, typename CRng, typename VRng >
-struct row_iterator< std::tuple<N, PRng, CRng, VRng> >
-{
-    class type {
-        public:
-            typedef typename std::decay<decltype(std::declval<CRng>()[0])>::type col_type;
-            typedef typename std::decay<decltype(std::declval<VRng>()[0])>::type val_type;
-
-            type(const std::tuple<N, PRng, CRng, VRng> &A, size_t row)
-                : m_col(std::begin(std::get<2>(A)))
-                , m_end(std::begin(std::get<2>(A)))
-                , m_val(std::begin(std::get<3>(A)))
-            {
-                typedef typename std::decay<decltype(std::declval<PRng>()[0])>::type ptr_type;
-
-                ptr_type row_begin = std::get<1>(A)[row];
-                ptr_type row_end   = std::get<1>(A)[row + 1];
-
-                m_col += row_begin;
-                m_end += row_end;
-                m_val += row_begin;
-            }
-
-            operator bool() const {
-                return m_col != m_end;
-            }
-
-            type& operator++() {
-                ++m_col;
-                ++m_val;
-                return *this;
-            }
-
-            col_type col() const {
-                return *m_col;
-            }
-
-            val_type value() const {
-                return *m_val;
-            }
-
-        private:
-            typedef decltype(std::begin(std::declval<VRng>())) val_iterator;
-            typedef decltype(std::begin(std::declval<CRng>())) col_iterator;
-
-            col_iterator m_col;
-            col_iterator m_end;
-            val_iterator m_val;
-    };
-};
-
-template < typename N, typename PRng, typename CRng, typename VRng >
-struct row_begin_impl< std::tuple<N, PRng, CRng, VRng> >
-{
-    typedef std::tuple<N, PRng, CRng, VRng> Matrix;
-    static typename row_iterator<Matrix>::type
-    get(const Matrix &matrix, size_t row) {
-        return typename row_iterator<Matrix>::type(matrix, row);
-    }
-};
-
-template < typename N, typename PRng, typename CRng, typename VRng >
-struct row_nonzeros_impl< std::tuple<N, PRng, CRng, VRng> > {
-    typedef std::tuple<N, PRng, CRng, VRng> Matrix;
-
-    static size_t get(const Matrix &A, size_t row) {
-        return std::get<1>(A)[row + 1] - std::get<1>(A)[row];
-    }
-};
-
-template < typename N, typename PRng, typename CRng, typename VRng >
-struct ptr_data_impl< std::tuple<N, PRng, CRng, VRng> > {
-    typedef std::tuple<N, PRng, CRng, VRng> Matrix;
-    typedef typename std::decay<decltype(std::declval<PRng>()[0])>::type ptr_type;
-    typedef const ptr_type* type;
-    static type get(const Matrix &A) {
-        return &std::get<1>(A)[0];
-    }
-};
-
-template < typename N, typename PRng, typename CRng, typename VRng >
-struct col_data_impl< std::tuple<N, PRng, CRng, VRng> > {
-    typedef std::tuple<N, PRng, CRng, VRng> Matrix;
-    typedef typename std::decay<decltype(std::declval<CRng>()[0])>::type col_type;
-    typedef const col_type* type;
-    static type get(const Matrix &A) {
-        return &std::get<2>(A)[0];
-    }
-};
-
-template < typename N, typename PRng, typename CRng, typename VRng >
-struct val_data_impl< std::tuple<N, PRng, CRng, VRng> > {
-    typedef std::tuple<N, PRng, CRng, VRng> Matrix;
-    typedef typename std::decay<decltype(std::declval<VRng>()[0])>::type val_type;
-    typedef const val_type* type;
-    static type get(const Matrix &A) {
-        return &std::get<3>(A)[0];
-    }
-};
-
-namespace detail {
-
-template < typename N, typename PRng, typename CRng, typename VRng >
-struct use_builtin_matrix_ops< std::tuple<N, PRng, CRng, VRng> >
-    : std::true_type
-{};
-
-} // namespace detail
-
-} // namespace backend
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/adapter/eigen.hpp b/src/solvers/amgcl/adapter/eigen.hpp
deleted file mode 100644
index 37a2947..0000000
--- a/src/solvers/amgcl/adapter/eigen.hpp
+++ /dev/null
@@ -1,125 +0,0 @@
-#ifndef AMGCL_ADAPTER_EIGEN_HPP
-#define AMGCL_ADAPTER_EIGEN_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
-\file    amgcl/adapter/eigen.hpp
-\author  Denis Demidov <dennis.demidov@gmail.com>
-\brief   Adapters for Eigen types to be used with builtin backend.
-\ingroup adapters
-*/
-
-#include <type_traits>
-#include <Eigen/SparseCore>
-#include <amgcl/util.hpp>
-#include <amgcl/backend/builtin.hpp>
-
-namespace amgcl {
-namespace backend {
-
-//---------------------------------------------------------------------------
-// Backend interface specialization for Eigen types
-//---------------------------------------------------------------------------
-template <class T, class Enable = void>
-struct is_eigen_sparse_matrix : std::false_type {};
-
-template <class T, class Enable = void>
-struct is_eigen_type : std::false_type {};
-
-template <typename Scalar, int Flags, typename Storage>
-struct is_eigen_sparse_matrix<
-    Eigen::Map<Eigen::SparseMatrix<Scalar, Flags, Storage>>
-    > : std::true_type
-{};
-
-template <typename Scalar, int Flags, typename Storage>
-struct is_eigen_sparse_matrix<
-    Eigen::SparseMatrix<Scalar, Flags, Storage>
-    > : std::true_type
-{};
-
-template <class T>
-struct is_eigen_type<
-    T,
-    typename std::enable_if<
-        std::is_arithmetic<typename T::Scalar>::value &&
-        std::is_base_of<Eigen::EigenBase<T>, T>::value
-        >::type
-    > : std::true_type
-{};
-
-template <class T>
-struct value_type<
-    T,
-    typename std::enable_if<is_eigen_type<T>::value>::type
-    >
-{
-    typedef typename T::Scalar type;
-};
-
-template <class T>
-struct nonzeros_impl<
-    T,
-    typename std::enable_if<is_eigen_sparse_matrix<T>::value>::type
-    >
-{
-    static size_t get(const T &matrix) {
-        return matrix.nonZeros();
-    }
-};
-
-template <class T>
-struct row_iterator <
-    T,
-    typename std::enable_if<is_eigen_sparse_matrix<T>::value>::type
-    >
-{
-    typedef typename T::InnerIterator type;
-};
-
-template <class T>
-struct row_begin_impl <
-    T,
-    typename std::enable_if<is_eigen_sparse_matrix<T>::value>::type
-    >
-{
-    typedef typename row_iterator<T>::type iterator;
-    static iterator get(const T &matrix, size_t row) {
-        return iterator(matrix, row);
-    }
-};
-
-} // namespace backend
-} // namespace amgcl
-
-#define AMGCL_USE_EIGEN_VECTORS_WITH_BUILTIN_BACKEND()                         \
-    namespace amgcl { namespace backend {                                      \
-        template <class T >                                                    \
-        struct is_builtin_vector< Eigen::Matrix<T, Eigen::Dynamic, 1> >        \
-          : std::true_type {};                                                 \
-    } }
-
-#endif
diff --git a/src/solvers/amgcl/adapter/epetra.hpp b/src/solvers/amgcl/adapter/epetra.hpp
deleted file mode 100644
index 50260de..0000000
--- a/src/solvers/amgcl/adapter/epetra.hpp
+++ /dev/null
@@ -1,157 +0,0 @@
-#ifndef AMGCL_ADAPTER_EPETRA_HPP
-#define AMGCL_ADAPTER_EPETRA_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-Copyright (c) 2014, Riccardo Rossi, CIMNE (International Center for Numerical Methods in Engineering)
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
-\file    amgcl/adapter/epetra.hpp
-\author  Denis Demidov <dennis.demidov@gmail.com>
-\brief   Adapt Epetra_CrsMatrix from Trilinos.
-\ingroup adapters
-*/
-
-#include <vector>
-
-#include <Epetra_CrsMatrix.h>
-#include <Epetra_IntVector.h>
-#include <Epetra_Import.h>
-#include <Epetra_Comm.h>
-
-#include <amgcl/backend/interface.hpp>
-#include <amgcl/detail/sort_row.hpp>
-
-namespace amgcl {
-namespace adapter {
-
-/// Adapts Epetra_CrsMatrix
-class epetra_map {
-    public:
-        typedef double value_type;
-
-        epetra_map(const Epetra_CrsMatrix &A)
-            : A(A), order(A.ColMap())
-        {
-            const Epetra_Map& row_map = A.RowMap();
-            const Epetra_Map& col_map = A.ColMap();
-
-            int entries_before;
-            int local_entries = row_map.NumMyElements();
-            A.Comm().ScanSum(&local_entries, &entries_before, 1);
-            entries_before -= local_entries;
-
-            Epetra_IntVector perm(row_map);
-            for(int i = 0, j = entries_before; i < local_entries; ++i, ++j)
-                perm[i] = j;
-
-            Epetra_Import importer = Epetra_Import(col_map, row_map);
-
-            order.Import(perm, importer, Insert);
-        }
-
-        size_t rows() const {
-            return A.NumMyRows();
-        }
-
-        size_t cols() const {
-            return A.NumGlobalCols();
-        }
-
-        size_t nonzeros() const {
-            return A.NumMyNonzeros();
-        }
-
-        class row_iterator {
-            public:
-                typedef int    col_type;
-                typedef double val_type;
-
-                row_iterator(
-                        const Epetra_CrsMatrix &A,
-                        const Epetra_IntVector &order,
-                        int row
-                        )
-                {
-                    int nnz;
-                    A.ExtractMyRowView(row, nnz, m_val, m_col);
-                    m_end = m_col + nnz;
-
-                    col_copy.assign(m_col, m_col + nnz);
-                    val_copy.assign(m_val, m_val + nnz);
-
-                    for(auto &c : col_copy) c = order[c];
-
-                    m_col = &col_copy[0];
-                    m_end = m_col + nnz;
-                    m_val = &val_copy[0];
-
-                    amgcl::detail::sort_row(m_col, m_val, nnz);
-                }
-
-                operator bool() const {
-                    return m_col != m_end;
-                }
-
-                row_iterator& operator++() {
-                    ++m_col;
-                    ++m_val;
-                    return *this;
-                }
-
-                col_type col() const {
-                    return *m_col;
-                }
-
-                val_type value() const {
-                    return *m_val;
-                }
-
-            private:
-                col_type * m_col;
-                col_type * m_end;
-                val_type * m_val;
-
-                std::vector<col_type> col_copy;
-                std::vector<val_type> val_copy;
-        };
-
-        row_iterator row_begin(int row) const {
-            return row_iterator(A, order, row);
-        }
-    private:
-        const Epetra_CrsMatrix &A;
-        Epetra_IntVector order;
-};
-
-/// Adapts Epetra_CrsMatrix
-inline epetra_map map(const Epetra_CrsMatrix &A) {
-    return epetra_map(A);
-}
-
-} // namespace adapter
-} // namespace amgcl
-
-
-#endif
diff --git a/src/solvers/amgcl/adapter/reorder.hpp b/src/solvers/amgcl/adapter/reorder.hpp
deleted file mode 100644
index 8649d3a..0000000
--- a/src/solvers/amgcl/adapter/reorder.hpp
+++ /dev/null
@@ -1,238 +0,0 @@
-#ifndef AMGCL_ADAPTER_REORDER_HPP
-#define AMGCL_ADAPTER_REORDER_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
-\file    amgcl/adapter/reorder.hpp
-\author  Denis Demidov <dennis.demidov@gmail.com>
-\brief   On-the-fly reodering of matrix and vectors.
-\ingroup adapters
-*/
-
-#include <type_traits>
-#include <boost/range/size.hpp>
-#include <boost/iterator/permutation_iterator.hpp>
-
-
-#include <amgcl/reorder/cuthill_mckee.hpp>
-#include <amgcl/backend/builtin.hpp>
-#include <amgcl/backend/detail/matrix_ops.hpp>
-
-namespace amgcl {
-namespace adapter {
-
-template <class Matrix>
-struct reordered_matrix {
-    typedef typename backend::value_type<Matrix>::type value_type;
-    typedef typename backend::row_iterator<Matrix>::type base_iterator;
-
-    const Matrix &A;
-    const ptrdiff_t * perm;
-    const ptrdiff_t * iperm;
-
-    reordered_matrix(const Matrix &A, const ptrdiff_t *perm, const ptrdiff_t * iperm)
-        : A(A), perm(perm), iperm(iperm)
-    {}
-
-    size_t rows() const {
-        return backend::rows(A);
-    }
-
-    size_t cols() const {
-        return backend::cols(A);
-    }
-
-    size_t nonzeros() const {
-        return backend::nonzeros(A);
-    }
-
-    struct row_iterator {
-        base_iterator base;
-        const ptrdiff_t * iperm;
-
-        row_iterator(const base_iterator &base, const ptrdiff_t *iperm)
-            : base(base), iperm(iperm)
-        {}
-
-        operator bool() const {
-            return base;
-        }
-
-        row_iterator& operator++() {
-            ++base;
-            return *this;
-        }
-
-        ptrdiff_t col() const {
-            return iperm[base.col()];
-        }
-
-        value_type value() const {
-            return base.value();
-        }
-    };
-
-    row_iterator row_begin(size_t i) const {
-        return row_iterator(backend::row_begin(A, perm[i]), iperm);
-    }
-};
-
-template <class Vector>
-struct reordered_vector {
-    typedef typename backend::value_type<typename std::decay<Vector>::type>::type raw_value_type;
-    typedef typename std::conditional<
-        std::is_const<Vector>::value,
-        const raw_value_type,
-        raw_value_type
-        >::type value_type;
-
-    Vector &x;
-    const ptrdiff_t *perm;
-
-    reordered_vector(Vector &x, const ptrdiff_t *perm) : x(x), perm(perm) {}
-
-    size_t size() const {
-        return boost::size(x);
-    }
-
-    value_type& operator[](size_t i) const {
-        return x[perm[i]];
-    }
-
-    boost::permutation_iterator<
-        typename std::decay<Vector>::type::iterator,
-        const ptrdiff_t*
-        >
-    begin() {
-        return boost::make_permutation_iterator(boost::begin(x), perm);
-    }
-
-    boost::permutation_iterator<
-        typename std::decay<Vector>::type::const_iterator,
-        const ptrdiff_t*
-        >
-    begin() const {
-        return boost::make_permutation_iterator(boost::begin(x), perm);
-    }
-
-    boost::permutation_iterator<
-        typename std::decay<Vector>::type::iterator,
-        const ptrdiff_t*
-        >
-    end() {
-        return boost::make_permutation_iterator(boost::end(x), perm + size());
-    }
-
-    boost::permutation_iterator<
-        typename std::decay<Vector>::type::const_iterator,
-        const ptrdiff_t*
-        >
-    end() const {
-        return boost::make_permutation_iterator(boost::end(x), perm + size());
-    }
-};
-
-} // namespace adapter
-
-namespace backend {
-namespace detail {
-
-template <class Matrix>
-struct use_builtin_matrix_ops< adapter::reordered_matrix<Matrix> >
-    : std::true_type
-{};
-
-} // namespace detail
-
-
-template <class Vector>
-struct is_builtin_vector< adapter::reordered_vector<Vector> >
-    : is_builtin_vector<typename std::decay<Vector>::type>
-{};
-
-} // namespace backend
-
-namespace adapter {
-
-template <class ordering = amgcl::reorder::cuthill_mckee<false> >
-class reorder {
-    public:
-        template <class Matrix>
-        reorder(const Matrix &A) : n(backend::rows(A)), perm(n), iperm(n)
-        {
-            ordering::get(A, perm);
-#pragma omp parallel for
-            for(ptrdiff_t i = 0; i < n; ++i) iperm[perm[i]] = i;
-        }
-
-        template <class Matrix>
-        typename std::enable_if<
-            !backend::is_builtin_vector<Matrix>::value,
-            reordered_matrix<Matrix>
-        >::type
-        operator()(const Matrix &A) const {
-            return reordered_matrix<Matrix>(A, perm.data(), iperm.data());
-        }
-
-        template <class Vector>
-        typename std::enable_if<
-            backend::is_builtin_vector<Vector>::value,
-            reordered_vector<Vector>
-        >::type
-        operator()(Vector &x) const {
-            return reordered_vector<Vector>(x, perm.data());
-        }
-
-        template <class Vector>
-        typename std::enable_if<
-            backend::is_builtin_vector<Vector>::value,
-            reordered_vector<const Vector>
-        >::type
-        operator()(const Vector &x) const {
-            return reordered_vector<const Vector>(x, perm.data());
-        }
-
-        template <class Vector1, class Vector2>
-        void forward(const Vector1 &x, Vector2 &y) const {
-#pragma omp parallel for
-            for(ptrdiff_t i = 0; i < n; ++i) y[i] = x[perm[i]];
-        }
-
-        template <class Vector1, class Vector2>
-        void inverse(const Vector1 &x, Vector2 &y) const {
-#pragma omp parallel for
-            for(ptrdiff_t i = 0; i < n; ++i) y[perm[i]] = x[i];
-        }
-
-    private:
-        ptrdiff_t n;
-        backend::numa_vector<ptrdiff_t> perm, iperm;
-};
-
-} // namespace adapter
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/adapter/scaled_problem.hpp b/src/solvers/amgcl/adapter/scaled_problem.hpp
deleted file mode 100644
index 2566d1c..0000000
--- a/src/solvers/amgcl/adapter/scaled_problem.hpp
+++ /dev/null
@@ -1,166 +0,0 @@
-#ifndef AMGCL_ADAPTER_SCALED_PROBLEM_HPP
-#define AMGCL_ADAPTER_SCALED_PROBLEM_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
-\file    amgcl/adapter/scaled_problem.hpp
-\author  Denis Demidov <dennis.demidov@gmail.com>
-\brief   Scale matrix, rhs, and solution.
-
-Example:
-\code
-auto A = std::tie(rows, ptr, col, val);
-auto scale = amgcl::adapter::scale_diagonal<Backend>(A, bprm);
-
-// Setup solver
-Solver solve(scale.matrix(A), prm, bprm);
-
-// option 1: rhs is untouched
-solve(*scale.rhs(b), x);
-
-// option 2: rhs is prescaled in-place
-scale(b);
-solve(b, x);
-
-// postprocess the solution:
-scale(x);
-\endcode
-*/
-
-#include <vector>
-#include <amgcl/backend/builtin.hpp>
-#include <amgcl/value_type/interface.hpp>
-
-namespace amgcl {
-namespace adapter {
-
-template <class Matrix, class Scale>
-struct scaled_matrix {
-    typedef typename backend::value_type<Matrix>::type value_type;
-    typedef typename backend::value_type<Scale>::type  scale_type;
-
-    const Matrix &A;
-    const Scale  &s;
-
-    scaled_matrix(const Matrix &A, const Scale &s) : A(A), s(s) {}
-
-    size_t rows()     const { return backend::rows(A);     }
-    size_t cols()     const { return backend::cols(A);     }
-    size_t nonzeros() const { return backend::nonzeros(A); }
-
-    struct row_iterator : public backend::row_iterator<Matrix>::type {
-        typedef typename backend::row_iterator<Matrix>::type Base;
-
-        scale_type  si;
-        const Scale &s;
-
-        row_iterator(const Matrix &A, const Scale &s, size_t i)
-            : Base(A, i), si(s[i]), s(s) {}
-
-        value_type value() const {
-            return si * static_cast<const Base*>(this)->value() * s[this->col()];
-        }
-    };
-
-    row_iterator row_begin(size_t i) const {
-        return row_iterator(A, s, i);
-    }
-};
-
-template <class Backend, class Scale>
-struct scaled_problem {
-    typedef typename Backend::params backend_params;
-
-    const std::shared_ptr<Scale> s;
-    const backend_params &bprm;
-
-    scaled_problem(std::shared_ptr<Scale> s, const backend_params &bprm = backend_params())
-        : s(s), bprm(bprm) {}
-
-    template <class Matrix>
-    scaled_matrix<Matrix, Scale> matrix(const Matrix &A) const {
-        return scaled_matrix<Matrix, Scale>(A, *s);
-    }
-
-    template <class Vector>
-    std::shared_ptr<typename Backend::vector> rhs(const Vector &v) const {
-        auto t = Backend::copy_vector(v, bprm);
-        (*this)(*t);
-        return t;
-    }
-
-    template <class Vector>
-    void operator()(Vector &x) const {
-        typedef typename backend::value_type<Vector>::type value_type;
-        typedef typename math::scalar_of<value_type>::type scalar_type;
-
-        const auto one  = math::identity<scalar_type>();
-        const auto zero = math::zero<scalar_type>();
-
-        if (backend::is_builtin_vector<Vector>::value) {
-            backend::vmul(one, *s, x, zero, x);
-        } else {
-            backend::vmul(one, *Backend::copy_vector(*s, bprm), x, zero, x);
-        }
-    }
-};
-
-template <class Backend, class Matrix>
-scaled_problem<
-    Backend,
-    std::vector<
-        typename math::scalar_of<
-            typename backend::value_type<Matrix>::type
-            >::type>
-        >
-scale_diagonal(
-        const Matrix &A,
-        const typename Backend::params &bprm = typename Backend::params()
-        )
-{
-    typedef typename backend::value_type<Matrix>::type value_type;
-    typedef typename math::scalar_of<value_type>::type scalar_type;
-    ptrdiff_t n = backend::rows(A);
-    auto      s = std::make_shared<std::vector<scalar_type>>(n);
-
-#pragma omp parallel for
-    for(ptrdiff_t i = 0; i < n; ++i) {
-        for(auto a = backend::row_begin(A, i); a; ++a) {
-            if (a.col() == i) {
-                (*s)[i] = math::inverse(sqrt(math::norm(a.value())));
-                break;
-            }
-        }
-    }
-
-    return scaled_problem<Backend, std::vector<scalar_type>>(s, bprm);
-}
-
-} // namespace adapter
-
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/adapter/ublas.hpp b/src/solvers/amgcl/adapter/ublas.hpp
deleted file mode 100644
index d2fcd25..0000000
--- a/src/solvers/amgcl/adapter/ublas.hpp
+++ /dev/null
@@ -1,75 +0,0 @@
-#ifndef AMGCL_ADAPTER_UBLAS_HPP
-#define AMGCL_ADAPTER_UBLAS_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-Copyright (c) 2014, Riccardo Rossi, CIMNE (International Center for Numerical Methods in Engineering)
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
-\file    amgcl/adapter/ublas.hpp
-\author  Denis Demidov <dennis.demidov@gmail.com>
-\brief   Adapters for Boost.uBlas matrices and vectors.
-\ingroup adapters
-*/
-
-#include <boost/numeric/ublas/vector.hpp>
-#include <boost/numeric/ublas/matrix_sparse.hpp>
-#include <amgcl/backend/builtin.hpp>
-#include <amgcl/adapter/crs_tuple.hpp>
-
-namespace amgcl {
-namespace backend {
-
-// Make builtin backend recognize ublas vectors as its own:
-template <typename T>
-struct is_builtin_vector< boost::numeric::ublas::vector<T> >
-    : std::true_type {};
-
-/// Adapts Boost.uBlas matrix.
-template <typename T>
-std::tuple<
-    size_t,
-    iterator_range<const size_t*>,
-    iterator_range<const size_t*>,
-    iterator_range<const T*>
-    >
-map(const boost::numeric::ublas::compressed_matrix<T, boost::numeric::ublas::row_major> &A) {
-    return std::make_tuple(
-            A.size1(),
-            make_iterator_range(
-                A.index1_data().begin(), A.index1_data().end()
-                ),
-            make_iterator_range(
-                A.index2_data().begin(), A.index2_data().end()
-                ),
-            make_iterator_range(
-                A.value_data().begin(), A.value_data().end()
-                )
-            );
-}
-
-} // namespace backend
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/adapter/zero_copy.hpp b/src/solvers/amgcl/adapter/zero_copy.hpp
deleted file mode 100644
index b28736d..0000000
--- a/src/solvers/amgcl/adapter/zero_copy.hpp
+++ /dev/null
@@ -1,98 +0,0 @@
-#ifndef AMGCL_ADAPTER_ZERO_COPY_HPP
-#define AMGCL_ADAPTER_ZERO_COPY_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
-\file    amgcl/adapter/zero_copy.hpp
-\author  Denis Demidov <dennis.demidov@gmail.com>
-\brief   Zero-copy adapter for input matrix in CRS format.
-\ingroup adapters
-*/
-
-#include <type_traits>
-
-#include <amgcl/util.hpp>
-#include <amgcl/backend/builtin.hpp>
-
-namespace amgcl {
-namespace adapter {
-
-template <typename Ptr, typename Col, typename Val>
-std::shared_ptr< backend::crs<Val> >
-zero_copy(size_t nrows, size_t ncols, const Ptr *ptr, const Col *col, const Val *val) {
-    // Check that Ptr and Col types are binary-compatible with ptrdiff_t:
-    static_assert(std::is_integral<Ptr>::value, "Unsupported Ptr type");
-    static_assert(std::is_integral<Col>::value, "Unsupported Col type");
-    static_assert(sizeof(Ptr) == sizeof(ptrdiff_t), "Unsupported Ptr type");
-    static_assert(sizeof(Col) == sizeof(ptrdiff_t), "Unsupported Col type");
-
-    auto A = std::make_shared< backend::crs<Val> >();
-    A->nrows = nrows;
-    A->ncols = ncols;
-    A->nnz   = nrows ? ptr[nrows] : 0;
-
-    A->ptr = (ptrdiff_t*)ptr;
-    A->col = (ptrdiff_t*)col;
-    A->val = (Val*)val;
-
-    A->own_data = false;
-
-    return A;
-}
-
-template <typename Ptr, typename Col, typename Val>
-std::shared_ptr< backend::crs<Val> >
-zero_copy(size_t n, const Ptr *ptr, const Col *col, const Val *val) {
-    return zero_copy(n, n, ptr, col, val);
-}
-
-template <typename Ptr, typename Col, typename Val>
-std::shared_ptr< backend::crs<Val, Col, Ptr> >
-zero_copy_direct(size_t nrows, size_t ncols, const Ptr *ptr, const Col *col, const Val *val) {
-    auto A = std::make_shared< backend::crs<Val, Col, Ptr> >();
-    A->nrows = nrows;
-    A->ncols = ncols;
-    A->nnz   = nrows ? ptr[nrows] : 0;
-
-    A->ptr = const_cast<Ptr*>(ptr);
-    A->col = const_cast<Col*>(col);
-    A->val = const_cast<Val*>(val);
-
-    A->own_data = false;
-
-    return A;
-}
-
-template <typename Ptr, typename Col, typename Val>
-std::shared_ptr< backend::crs<Val, Col, Ptr> >
-zero_copy_direct(size_t n, const Ptr *ptr, const Col *col, const Val *val) {
-    return zero_copy_direct(n, n, ptr, col, val);
-}
-
-} // namespace adapter
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/amg.hpp b/src/solvers/amgcl/amg.hpp
deleted file mode 100644
index e58a5f5..0000000
--- a/src/solvers/amgcl/amg.hpp
+++ /dev/null
@@ -1,602 +0,0 @@
-#ifndef AMGCL_AMG_HPP
-#define AMGCL_AMG_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/amg.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  An AMG preconditioner.
- */
-
-#include <iostream>
-#include <iomanip>
-#include <list>
-#include <memory>
-
-#include <amgcl/backend/builtin.hpp>
-#include <amgcl/solver/detail/default_inner_product.hpp>
-#include <amgcl/util.hpp>
-
-/// Primary namespace.
-namespace amgcl {
-
-/// Algebraic multigrid method.
-/**
- * AMG is one the most effective methods for solution of large sparse
- * unstructured systems of equations, arising, for example, from discretization
- * of PDEs on unstructured grids \cite Trottenberg2001. The method can be used
- * as a black-box solver for various computational problems, since it does not
- * require any information about the underlying geometry.
- *
- * The three template parameters allow the user to select the exact components
- * of the method:
- *  1. *Backend* to transfer the constructed hierarchy to,
- *  2. *Coarsening* strategy for hierarchy construction, and
- *  3. *Relaxation* scheme (smoother to use during the solution phase).
- *
- * Instance of the class builds the AMG hierarchy for the given system matrix
- * and is intended to be used as a preconditioner.
- */
-template <
-    class Backend,
-    template <class> class Coarsening,
-    template <class> class Relax
-    >
-class amg {
-    public:
-        typedef Backend backend_type;
-
-        typedef typename Backend::value_type value_type;
-        typedef typename Backend::col_type   col_type;
-        typedef typename Backend::ptr_type   ptr_type;
-        typedef typename Backend::matrix     matrix;
-        typedef typename Backend::vector     vector;
-
-        typedef Coarsening<Backend>            coarsening_type;
-        typedef Relax<Backend>                 relax_type;
-
-        typedef typename backend::builtin<value_type, col_type, ptr_type>::matrix build_matrix;
-
-        typedef typename math::scalar_of<value_type>::type scalar_type;
-
-        /// Backend parameters.
-        typedef typename Backend::params     backend_params;
-
-        /// Parameters of the method.
-        /**
-         * The amgcl::amg::params struct includes parameters for each
-         * component of the method as well as some universal parameters.
-         */
-        struct params {
-            typedef typename coarsening_type::params coarsening_params;
-            typedef typename relax_type::params relax_params;
-
-            coarsening_params coarsening;   ///< Coarsening parameters.
-            relax_params      relax;        ///< Relaxation parameters.
-
-            /// Specifies when level is coarse enough to be solved directly.
-            /**
-             * If number of variables at a next level in the hierarchy becomes
-             * lower than this threshold, then the hierarchy construction is
-             * stopped and the linear system is solved directly at this level.
-             */
-            unsigned coarse_enough;
-
-            /// Use direct solver at the coarsest level.
-            /**
-             * When set, the coarsest level is solved with a direct solver.
-             * Otherwise a smoother is used as a solver.
-             */
-            bool direct_coarse;
-
-            /// Maximum number of levels.
-            /** If this number is reached while the size of the last level is
-             * greater that `coarse_enough`, then the coarsest level will not
-             * be solved exactly, but will use a smoother.
-             */
-            unsigned max_levels;
-
-            /// Number of pre-relaxations.
-            unsigned npre;
-
-            /// Number of post-relaxations.
-            unsigned npost;
-
-            /// Number of cycles (1 for V-cycle, 2 for W-cycle, etc.).
-            unsigned ncycle;
-
-            /// Number of cycles to make as part of preconditioning.
-            unsigned pre_cycles;
-
-            /// Keep matrices in internal format to allow for quick rebuild of the hierarchy
-            bool allow_rebuild;
-
-            params() :
-                coarse_enough( Backend::direct_solver::coarse_enough() ),
-                direct_coarse(true),
-                max_levels( std::numeric_limits<unsigned>::max() ),
-                npre(1), npost(1), ncycle(1), pre_cycles(1),
-                allow_rebuild(std::is_same<matrix, build_matrix>::value)
-            {}
-
-#ifndef AMGCL_NO_BOOST
-            params(const boost::property_tree::ptree &p)
-                : AMGCL_PARAMS_IMPORT_CHILD(p, coarsening),
-                  AMGCL_PARAMS_IMPORT_CHILD(p, relax),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, coarse_enough),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, direct_coarse),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, max_levels),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, npre),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, npost),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, ncycle),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, pre_cycles),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, allow_rebuild)
-            {
-                check_params(p, {"coarsening", "relax", "coarse_enough",
-                        "direct_coarse", "max_levels", "npre", "npost",
-                        "ncycle",  "pre_cycles", "allow_rebuild"});
-
-                precondition(max_levels > 0, "max_levels should be positive");
-            }
-
-            void get(
-                    boost::property_tree::ptree &p,
-                    const std::string &path = ""
-                    ) const
-            {
-                AMGCL_PARAMS_EXPORT_CHILD(p, path, coarsening);
-                AMGCL_PARAMS_EXPORT_CHILD(p, path, relax);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, coarse_enough);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, direct_coarse);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, max_levels);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, npre);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, npost);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, ncycle);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, pre_cycles);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, allow_rebuild);
-            }
-#endif
-        } prm;
-
-        /// Builds the AMG hierarchy for the system matrix.
-        /**
-         * The input matrix is copied here and is safe to delete afterwards.
-         *
-         * \param A The system matrix. Should be convertible to
-         *          amgcl::backend::crs<>.
-         * \param p AMG parameters.
-         *
-         * \sa amgcl/adapter/crs_tuple.hpp
-         */
-        template <class Matrix>
-        amg(
-                const Matrix &M,
-                const params &p = params(),
-                const backend_params &bprm = backend_params()
-           ) : prm(p)
-        {
-            auto A = std::make_shared<build_matrix>(M);
-            sort_rows(*A);
-
-            do_init(A, bprm);
-        }
-
-        /// Builds the AMG hierarchy for the system matrix.
-        /**
-         * The shared pointer to the input matrix is passed here. The matrix
-         * will not be copied and should out-live the amg instance.
-         * The matrix should be either in amgcl::backend::crs<T> format, or
-         * inherit from the class and override its ptr(), col(), and val()
-         * virtual functions.
-         *
-         * \param A The system matrix.
-         * \param p AMG parameters.
-         *
-         * \sa amgcl/adapter/crs_tuple.hpp
-         */
-        amg(
-                std::shared_ptr<build_matrix> A,
-                const params &p = params(),
-                const backend_params &bprm = backend_params()
-           ) : prm(p)
-        {
-            do_init(A, bprm);
-        }
-
-        /// Rebuild the hierarchy using the new system matrix.
-        /**
-         * This requires for prm.allow_rebuild to be set. The transfer
-         * operators created during the initial setup are reused.
-         */
-        template <class Matrix>
-        void rebuild(
-                const Matrix &M,
-                const backend_params &bprm = backend_params()
-                )
-        {
-            auto A = std::make_shared<build_matrix>(M);
-            sort_rows(*A);
-            rebuild(A, bprm);
-        }
-
-        /// Rebuild the hierarchy using the new system matrix.
-        /**
-         * This requires for prm.allow_rebuild to be set. The transfer
-         * operators created during the initial setup are reused.
-         */
-        void rebuild(
-                std::shared_ptr<build_matrix> A,
-                const backend_params &bprm = backend_params()
-                )
-        {
-            precondition(prm.allow_rebuild,
-                    "allow_rebuild is not set!");
-            precondition(
-                    backend::rows(*A) == backend::rows(system_matrix()) &&
-                    backend::cols(*A) == backend::rows(*A),
-                    "Matrix dimensions differ from the original ones!"
-                    );
-
-            AMGCL_TIC("rebuild");
-            coarsening_type C(prm.coarsening);
-            for(auto &level : levels) {
-                A = level.rebuild(A, C, prm, bprm);
-            }
-            AMGCL_TOC("rebuild");
-        }
-
-        /// Performs single V-cycle for the given right-hand side and solution.
-        /**
-         * \param rhs Right-hand side vector.
-         * \param x   Solution vector.
-         */
-        template <class Vec1, class Vec2>
-        void cycle(const Vec1 &rhs, Vec2 &&x) const {
-            cycle(levels.begin(), rhs, x);
-        }
-
-        /// Performs single V-cycle after clearing x.
-        /**
-         * This is intended for use as a preconditioning procedure.
-         *
-         * \param rhs Right-hand side vector.
-         * \param x   Solution vector.
-         */
-        template <class Vec1, class Vec2>
-        void apply(const Vec1 &rhs, Vec2 &&x) const {
-            if (prm.pre_cycles) {
-                backend::clear(x);
-                for(unsigned i = 0; i < prm.pre_cycles; ++i)
-                    cycle(rhs, x);
-            } else {
-                backend::copy(rhs, x);
-            }
-        }
-
-        /// Returns the system matrix from the finest level.
-        std::shared_ptr<matrix> system_matrix_ptr() const {
-            return levels.front().A;
-        }
-
-        const matrix& system_matrix() const {
-            return *system_matrix_ptr();
-        }
-
-        size_t bytes() const {
-            size_t b = 0;
-            for(const auto &lvl : levels) b += lvl.bytes();
-            return b;
-        }
-    private:
-        struct level {
-            size_t m_rows, m_nonzeros;
-
-            std::shared_ptr<vector> f;
-            std::shared_ptr<vector> u;
-            std::shared_ptr<vector> t;
-
-            std::shared_ptr<matrix> A;
-            std::shared_ptr<matrix> P;
-            std::shared_ptr<matrix> R;
-
-            std::shared_ptr<build_matrix> bP;
-            std::shared_ptr<build_matrix> bR;
-
-            std::shared_ptr< typename Backend::direct_solver > solve;
-
-            std::shared_ptr<relax_type> relax;
-
-            size_t bytes() const {
-                size_t b = 0;
-
-                if (f) b += backend::bytes(*f);
-                if (u) b += backend::bytes(*u);
-                if (t) b += backend::bytes(*t);
-
-                if (A) b += backend::bytes(*A);
-                if (P) b += backend::bytes(*P);
-                if (R) b += backend::bytes(*R);
-
-                if (solve) b += backend::bytes(*solve);
-                if (relax) b += backend::bytes(*relax);
-
-                return b;
-            }
-
-            level() : m_rows(0), m_nonzeros(0) {}
-
-            level(std::shared_ptr<build_matrix> A,
-                    params &prm, const backend_params &bprm)
-                : m_rows(backend::rows(*A)), m_nonzeros(backend::nonzeros(*A))
-            {
-                AMGCL_TIC("move to backend");
-                f = Backend::create_vector(m_rows, bprm);
-                u = Backend::create_vector(m_rows, bprm);
-                t = Backend::create_vector(m_rows, bprm);
-                this->A = Backend::copy_matrix(A, bprm);
-                AMGCL_TOC("move to backend");
-
-                AMGCL_TIC("relaxation");
-                relax = std::make_shared<relax_type>(*A, prm.relax, bprm);
-                AMGCL_TOC("relaxation");
-            }
-
-            std::shared_ptr<build_matrix> step_down(
-                    std::shared_ptr<build_matrix> A,
-                    coarsening_type &C, const backend_params &bprm,
-                    bool allow_rebuild)
-            {
-                AMGCL_TIC("transfer operators");
-                std::shared_ptr<build_matrix> P, R;
-
-                try {
-                    std::tie(P, R) = C.transfer_operators(*A);
-                } catch(error::empty_level) {
-                    AMGCL_TOC("transfer operators");
-                    return std::shared_ptr<build_matrix>();
-                }
-
-                sort_rows(*P);
-                sort_rows(*R);
-
-                if (allow_rebuild) {
-                    bP = P;
-                    bR = R;
-                }
-                AMGCL_TOC("transfer operators");
-
-                AMGCL_TIC("move to backend");
-                this->P = Backend::copy_matrix(P, bprm);
-                this->R = Backend::copy_matrix(R, bprm);
-                AMGCL_TOC("move to backend");
-
-                AMGCL_TIC("coarse operator");
-                A = C.coarse_operator(*A, *P, *R);
-                sort_rows(*A);
-                AMGCL_TOC("coarse operator");
-
-                return A;
-            }
-
-            void create_coarse(
-                    std::shared_ptr<build_matrix> A,
-                    const backend_params &bprm, bool single_level)
-            {
-                m_rows     = backend::rows(*A);
-                m_nonzeros = backend::nonzeros(*A);
-
-                u = Backend::create_vector(m_rows, bprm);
-                f = Backend::create_vector(m_rows, bprm);
-
-                solve = Backend::create_solver(A, bprm);
-                if (single_level)
-                    this->A = Backend::copy_matrix(A, bprm);
-            }
-
-            std::shared_ptr<build_matrix> rebuild(
-                    std::shared_ptr<build_matrix> A,
-                    const coarsening_type &C,
-                    const params &prm,
-                    const backend_params &bprm
-                    )
-            {
-                if (this->A) {
-                    AMGCL_TIC("move to backend");
-                    this->A = Backend::copy_matrix(A, bprm);
-                    AMGCL_TOC("move to backend");
-                }
-
-                if(relax) {
-                    AMGCL_TIC("relaxation");
-                    relax = std::make_shared<relax_type>(*A, prm.relax, bprm);
-                    AMGCL_TOC("relaxation");
-                }
-
-                if (solve) {
-                    AMGCL_TIC("coarsest level");
-                    solve = Backend::create_solver(A, bprm);
-                    AMGCL_TOC("coarsest level");
-                }
-
-                if (bP && bR) {
-                    AMGCL_TIC("coarse operator");
-                    A = C.coarse_operator(*A, *bP, *bR);
-                    sort_rows(*A);
-                    AMGCL_TOC("coarse operator");
-                }
-
-                return A;
-            }
-
-            size_t rows() const {
-                return m_rows;
-            }
-
-            size_t nonzeros() const {
-                return m_nonzeros;
-            }
-        };
-
-        typedef typename std::list<level>::const_iterator level_iterator;
-
-        std::list<level> levels;
-
-        void do_init(
-                std::shared_ptr<build_matrix> A,
-                const backend_params &bprm = backend_params()
-           )
-        {
-            precondition(
-                    backend::rows(*A) == backend::cols(*A),
-                    "Matrix should be square!"
-                    );
-
-            bool direct_coarse_solve = true;
-
-            coarsening_type C(prm.coarsening);
-
-            while( backend::rows(*A) > prm.coarse_enough) {
-                levels.push_back( level(A, prm, bprm) );
-
-                if (levels.size() >= prm.max_levels) break;
-
-                A = levels.back().step_down(A, C, bprm, prm.allow_rebuild);
-                if (!A) {
-                    // Zero-sized coarse level. Probably the system matrix on
-                    // this level is diagonal, should be easily solvable with a
-                    // couple of smoother iterations.
-                    direct_coarse_solve = false;
-                    break;
-                }
-            }
-
-            if (!A || backend::rows(*A) > prm.coarse_enough) {
-                // The coarse matrix is still too big to be solved directly.
-                direct_coarse_solve = false;
-            }
-
-            if (direct_coarse_solve) {
-                AMGCL_TIC("coarsest level");
-                if (prm.direct_coarse) {
-                    level l;
-                    l.create_coarse(A, bprm, levels.empty());
-                    levels.push_back(l);
-                } else {
-                    levels.push_back( level(A, prm, bprm) );
-                }
-                AMGCL_TOC("coarsest level");
-            }
-        }
-
-        template <class Vec1, class Vec2>
-        void cycle(level_iterator lvl, const Vec1 &rhs, Vec2 &x) const
-        {
-            level_iterator nxt = lvl, end = levels.end();
-            ++nxt;
-
-            if (nxt == end) {
-                if (lvl->solve) {
-                    AMGCL_TIC("coarse");
-                    (*lvl->solve)(rhs, x);
-                    AMGCL_TOC("coarse");
-                } else {
-                    AMGCL_TIC("relax");
-                    for(size_t i = 0; i < prm.npre;  ++i) lvl->relax->apply_pre(*lvl->A, rhs, x, *lvl->t);
-                    for(size_t i = 0; i < prm.npost; ++i) lvl->relax->apply_post(*lvl->A, rhs, x, *lvl->t);
-                    AMGCL_TOC("relax");
-                }
-            } else {
-                for (size_t j = 0; j < prm.ncycle; ++j) {
-                    AMGCL_TIC("relax");
-                    for(size_t i = 0; i < prm.npre; ++i)
-                        lvl->relax->apply_pre(*lvl->A, rhs, x, *lvl->t);
-                    AMGCL_TOC("relax");
-
-                    backend::residual(rhs, *lvl->A, x, *lvl->t);
-
-                    backend::spmv(math::identity<scalar_type>(), *lvl->R, *lvl->t, math::zero<scalar_type>(), *nxt->f);
-
-                    backend::clear(*nxt->u);
-                    cycle(nxt, *nxt->f, *nxt->u);
-
-                    backend::spmv(math::identity<scalar_type>(), *lvl->P, *nxt->u, math::identity<scalar_type>(), x);
-
-                    AMGCL_TIC("relax");
-                    for(size_t i = 0; i < prm.npost; ++i)
-                        lvl->relax->apply_post(*lvl->A, rhs, x, *lvl->t);
-                    AMGCL_TOC("relax");
-                }
-            }
-        }
-
-    template <class B, template <class> class C, template <class> class R>
-    friend std::ostream& operator<<(std::ostream &os, const amg<B, C, R> &a);
-};
-
-/// Sends information about the AMG hierarchy to output stream.
-template <class B, template <class> class C, template <class> class R>
-std::ostream& operator<<(std::ostream &os, const amg<B, C, R> &a)
-{
-    typedef typename amg<B, C, R>::level level;
-    ios_saver ss(os);
-
-    size_t sum_dof = 0;
-    size_t sum_nnz = 0;
-    size_t sum_mem = 0;
-
-    for(const level &lvl : a.levels) {
-        sum_dof += lvl.rows();
-        sum_nnz += lvl.nonzeros();
-        sum_mem += lvl.bytes();
-    }
-
-    os << "Number of levels:    "   << a.levels.size()
-        << "\nOperator complexity: " << std::fixed << std::setprecision(2)
-        << 1.0 * sum_nnz / a.levels.front().nonzeros()
-        << "\nGrid complexity:     " << std::fixed << std::setprecision(2)
-        << 1.0 * sum_dof / a.levels.front().rows()
-        << "\nMemory footprint:    " << human_readable_memory(sum_mem)
-        << "\n\n"
-           "level     unknowns       nonzeros      memory\n"
-           "---------------------------------------------\n";
-
-    size_t depth = 0;
-    for(const level &lvl : a.levels) {
-        os << std::setw(5)  << depth++
-            << std::setw(13) << lvl.rows()
-            << std::setw(15) << lvl.nonzeros()
-            << std::setw(12) << human_readable_memory(lvl.bytes())
-            << " (" << std::setw(5) << std::fixed << std::setprecision(2)
-            << 100.0 * lvl.nonzeros() / sum_nnz
-            << "%)" << std::endl;
-    }
-
-    return os;
-}
-
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/backend/blaze.hpp b/src/solvers/amgcl/backend/blaze.hpp
deleted file mode 100644
index 6766d6a..0000000
--- a/src/solvers/amgcl/backend/blaze.hpp
+++ /dev/null
@@ -1,332 +0,0 @@
-#ifndef AMGCL_BACKEND_BLAZE_HPP
-#define AMGCL_BACKEND_BLAZE_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/backend/viennacl.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Blaze backend.
- *
- * Uses Blaze (https://code.google.com/p/blaze-lib) types and operations.
- */
-
-#include <blaze/Math.h>
-
-#include <amgcl/backend/builtin.hpp>
-#include <amgcl/solver/skyline_lu.hpp>
-
-namespace amgcl {
-namespace backend {
-
-/// Blaze backend
-/**
- * This is a backend that uses types defined in the Blaze library
- * (https://bitbucket.org/blaze-lib/blaze/src).
- *
- * \param real Value type.
- * \ingroup backends
- */
-template <class real>
-struct blaze {
-    typedef real      value_type;
-    typedef ptrdiff_t index_type;
-    typedef ptrdiff_t col_type;
-    typedef ptrdiff_t ptr_type;
-
-    struct provides_row_iterator : std::true_type {};
-
-    typedef ::blaze::CompressedMatrix<real> matrix;
-    typedef ::blaze::DynamicVector<real>    vector;
-    typedef ::blaze::DynamicVector<real>    matrix_diagonal;
-    typedef solver::skyline_lu<real>        direct_solver;
-
-    /// Backend parameters.
-    typedef amgcl::detail::empty_params params;
-
-    static std::string name() { return "blaze"; }
-
-    /// Copy matrix from builtin backend.
-    static std::shared_ptr<matrix>
-    copy_matrix(
-            std::shared_ptr< typename builtin<real>::matrix > A,
-            const params&
-            )
-    {
-        typedef
-            typename row_iterator<typename builtin<real>::matrix>::type
-            row_iterator;
-
-        const size_t n = rows(*A);
-        const size_t m = cols(*A);
-
-        auto B = std::make_shared<matrix>(n, m);
-
-        B->reserve(nonzeros(*A));
-        for(size_t i = 0; i < n; ++i) {
-            for(row_iterator a = A->row_begin(i); a; ++a) {
-                B->append(i, a.col(), a.value());
-            }
-            B->finalize(i);
-        }
-
-        return B;
-    }
-
-    /// Copy vector from builtin backend.
-    static std::shared_ptr<vector>
-    copy_vector(typename builtin<real>::vector const &x, const params&)
-    {
-        auto v = std::make_shared<vector>(x.size(), &x[0]);
-        return v;
-    }
-
-    /// Copy vector from builtin backend.
-    static std::shared_ptr<vector>
-    copy_vector(
-            std::shared_ptr< typename builtin<real>::vector > x,
-            const params &prm
-            )
-    {
-        return copy_vector(*x, prm);
-    }
-
-    /// Create vector of the specified size.
-    static std::shared_ptr<vector>
-    create_vector(size_t size, const params&)
-    {
-        return std::make_shared<vector>(size);
-    }
-
-    /// Create direct solver for coarse level
-    static std::shared_ptr<direct_solver>
-    create_solver(std::shared_ptr< typename builtin<real>::matrix > A, const params&)
-    {
-        return std::make_shared<direct_solver>(*A);
-    }
-
-};
-
-//---------------------------------------------------------------------------
-// Backend interface implementation
-//---------------------------------------------------------------------------
-template < typename V, bool O >
-struct value_type < ::blaze::CompressedMatrix<V, O> > {
-    typedef V type;
-};
-
-template < typename V >
-struct value_type < ::blaze::DynamicVector<V> > {
-    typedef V type;
-};
-
-template < typename V, bool O >
-struct cols_impl< ::blaze::CompressedMatrix<V, O> > {
-    typedef ::blaze::CompressedMatrix<V, O> matrix;
-
-    static size_t get(const matrix &A) {
-        return A.columns();
-    }
-};
-
-template < typename V, bool O >
-struct nonzeros_impl< ::blaze::CompressedMatrix<V, O> > {
-    typedef ::blaze::CompressedMatrix<V, O> matrix;
-
-    static size_t get(const matrix &A) {
-        return A.nonZeros();
-    }
-};
-
-template < typename V, bool O >
-struct row_iterator< ::blaze::CompressedMatrix<V, O> >
-{
-    struct type {
-        typedef typename ::blaze::CompressedMatrix<V, O>::ConstIterator Base;
-        Base base;
-        Base end;
-
-        operator bool() const {
-            return base != end;
-        }
-
-        type operator++() {
-            ++base;
-            return *this;
-        }
-
-        size_t col() const {
-            return base->index();
-        }
-
-        V value() const {
-            return base->value();
-        }
-    };
-};
-
-template < typename V, bool O >
-struct row_begin_impl< ::blaze::CompressedMatrix<V, O> > {
-    typedef typename row_iterator< ::blaze::CompressedMatrix<V, O> >::type iterator;
-    static iterator get(const ::blaze::CompressedMatrix<V, O> &A, size_t row) {
-        return iterator{A.cbegin(row), A.cend(row)};
-    }
-};
-
-template < class A, class B, typename V, bool O >
-struct spmv_impl<
-    A, ::blaze::CompressedMatrix<V, O>, ::blaze::DynamicVector<V>,
-    B, ::blaze::DynamicVector<V>
-    >
-{
-    typedef ::blaze::CompressedMatrix<V, O> matrix;
-    typedef ::blaze::DynamicVector<V>    vector;
-
-    static void apply(A alpha, const matrix &K, const vector &x, B beta, vector &y)
-    {
-        if (!math::is_zero(beta))
-            y = alpha * (K * x) + beta * y;
-        else
-            y = alpha * (K * x);
-    }
-};
-
-template < typename V, bool O >
-struct residual_impl<
-    ::blaze::CompressedMatrix<V, O>,
-    ::blaze::DynamicVector<V>,
-    ::blaze::DynamicVector<V>,
-    ::blaze::DynamicVector<V>
-    >
-{
-    typedef ::blaze::CompressedMatrix<V, O> matrix;
-    typedef ::blaze::DynamicVector<V>    vector;
-
-    static void apply(const vector &rhs, const matrix &A, const vector &x,
-            vector &r)
-    {
-        r = rhs - A * x;
-    }
-};
-
-template < typename V >
-struct clear_impl< ::blaze::DynamicVector<V> >
-{
-    typedef ::blaze::DynamicVector<V> vector;
-
-    static void apply(vector &x)
-    {
-        x = 0;
-    }
-};
-
-template < typename V >
-struct copy_impl<
-    ::blaze::DynamicVector<V>,
-    ::blaze::DynamicVector<V>
-    >
-{
-    typedef ::blaze::DynamicVector<V> vector;
-
-    static void apply(const vector &x, vector &y)
-    {
-        y = x;
-    }
-};
-
-template < typename V >
-struct inner_product_impl<
-    ::blaze::DynamicVector<V>,
-    ::blaze::DynamicVector<V>
-    >
-{
-    typedef ::blaze::DynamicVector<V> vector;
-
-    static V get(const vector &x, const vector &y)
-    {
-        return (x, y);
-    }
-};
-
-template < typename A, typename B, typename V >
-struct axpby_impl<
-    A, ::blaze::DynamicVector<V>,
-    B, ::blaze::DynamicVector<V>
-    >
-{
-    typedef ::blaze::DynamicVector<V> vector;
-
-    static void apply(A a, const vector &x, B b, vector &y)
-    {
-        if (!math::is_zero(b))
-            y = a * x + b * y;
-        else
-            y = a * x;
-    }
-};
-
-template < typename A, typename B, typename C, typename V >
-struct axpbypcz_impl<
-    A, ::blaze::DynamicVector<V>,
-    B, ::blaze::DynamicVector<V>,
-    C, ::blaze::DynamicVector<V>
-    >
-{
-    typedef ::blaze::DynamicVector<V> vector;
-
-    static void apply(
-            V a, const vector &x,
-            V b, const vector &y,
-            V c,       vector &z
-            )
-    {
-        if (!math::is_zero(c))
-            z = a * x + b * y + c * z;
-        else
-            z = a * x + b * y;
-    }
-};
-
-template < typename A, typename B, typename V >
-struct vmul_impl<
-    A, ::blaze::DynamicVector<V>, ::blaze::DynamicVector<V>,
-    B, ::blaze::DynamicVector<V>
-    >
-{
-    typedef ::blaze::DynamicVector<V> vector;
-
-    static void apply(A a, const vector &x, const vector &y, B b, vector &z)
-    {
-        if (!math::is_zero(b))
-            z = a * x * y + b * z;
-        else
-            z = a * x * y;
-    }
-};
-
-} // namespace backend
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/backend/block_crs.hpp b/src/solvers/amgcl/backend/block_crs.hpp
deleted file mode 100644
index 657f559..0000000
--- a/src/solvers/amgcl/backend/block_crs.hpp
+++ /dev/null
@@ -1,313 +0,0 @@
-#ifndef AMGCL_BACKEND_BLOCK_CRS_HPP
-#define AMGCL_BACKEND_BLOCK_CRS_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/backend/block_crs.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Sparse matrix in block-CRS format.
- */
-
-#include <algorithm>
-#include <numeric>
-
-#include <amgcl/util.hpp>
-#include <amgcl/backend/interface.hpp>
-#include <amgcl/backend/builtin.hpp>
-#include <amgcl/solver/skyline_lu.hpp>
-
-namespace amgcl {
-namespace backend {
-
-/// Sparse matrix in Block CRS format.
-/**
- * \param V Value type.
- * \param C Column number type.
- * \param P Index type.
- */
-template < typename V, typename C, typename P >
-struct bcrs {
-    typedef V value_type;
-    typedef V val_type;
-    typedef C col_type;
-    typedef P ptr_type;
-
-    size_t block_size;
-    size_t nrows, ncols;
-    size_t brows, bcols;
-
-    std::vector<ptr_type> ptr;
-    std::vector<col_type> col;
-    std::vector<val_type> val;
-
-    /// Converts matrix in CRS format to Block CRS format.
-    /**
-     * \param A          Input matrix.
-     * \param block_size Block size.
-     *
-     * \note Input matrix dimensions are *not* required to be divisible by
-     * block_size.
-     */
-    template < class Matrix >
-    bcrs(const Matrix &A, size_t block_size)
-        : block_size(block_size), nrows( rows(A) ), ncols( cols(A) ),
-          brows((nrows + block_size - 1) / block_size),
-          bcols((ncols + block_size - 1) / block_size),
-          ptr(brows + 1, 0)
-    {
-#pragma omp parallel
-        {
-            std::vector<ptrdiff_t> marker(bcols, -1);
-
-            // Count number of nonzeros in block matrix.
-#pragma omp for
-            for(ptr_type ib = 0; ib < static_cast<ptr_type>(brows); ++ib) {
-                ptr_type ia = ib * block_size;
-
-                for(size_t k = 0; k < block_size && ia < static_cast<ptr_type>(nrows); ++k, ++ia) {
-                    for(auto a = backend::row_begin(A, ia); a; ++a) {
-                        col_type cb = a.col() / block_size;
-
-                        if (marker[cb] != static_cast<col_type>(ib)) {
-                            marker[cb]  = static_cast<col_type>(ib);
-                            ++ptr[ib + 1];
-                        }
-                    }
-                }
-            }
-
-#pragma omp single
-            {
-                std::partial_sum(ptr.begin(), ptr.end(), ptr.begin());
-                col.resize(ptr.back());
-                val.resize(ptr.back() * block_size * block_size, 0);
-            }
-
-            std::fill(marker.begin(), marker.end(), -1);
-
-            // Fill the block matrix.
-#pragma omp for
-            for(ptr_type ib = 0; ib < static_cast<ptr_type>(brows); ++ib) {
-                ptr_type ia = ib * block_size;
-                ptr_type row_beg = ptr[ib];
-                ptr_type row_end = row_beg;
-
-                for(size_t k = 0; k < block_size && ia < static_cast<ptr_type>(nrows); ++k, ++ia) {
-                    for(auto a = backend::row_begin(A, ia); a; ++a) {
-                        col_type cb = a.col() / block_size;
-                        col_type cc = a.col() % block_size;
-                        val_type va = a.value();
-
-                        if (marker[cb] < row_beg) {
-                            marker[cb] = row_end;
-                            col[row_end] = cb;
-                            val[block_size * (block_size * row_end + k) + cc] = va;
-                            ++row_end;
-                        } else {
-                            val[block_size * (block_size * marker[cb] + k) + cc] = va;
-                        }
-                    }
-                }
-            }
-        }
-    }
-};
-
-/// block_crs backend definition.
-/**
- * \param real Value type.
- * \ingroup backends
- */
-template <typename real>
-struct block_crs {
-    typedef real      value_type;
-    typedef ptrdiff_t index_type;
-    typedef ptrdiff_t col_type;
-    typedef ptrdiff_t ptr_type;
-
-    typedef bcrs<real, index_type, index_type> matrix;
-    typedef typename builtin<real>::vector     vector;
-    typedef typename builtin<real>::vector     matrix_diagonal;
-    typedef solver::skyline_lu<value_type>     direct_solver;
-
-    struct provides_row_iterator : std::false_type {};
-
-    /// Backend parameters.
-    struct params {
-        /// Block size to use with the created matrices.
-        size_t block_size;
-
-        params(size_t block_size = 4) : block_size(block_size) {}
-
-#ifndef AMGCL_NO_BOOST
-        params(const boost::property_tree::ptree &p)
-            : AMGCL_PARAMS_IMPORT_VALUE(p, block_size)
-        {
-            check_params(p, {"block_size"});
-        }
-        void get(boost::property_tree::ptree &p, const std::string &path) const {
-            AMGCL_PARAMS_EXPORT_VALUE(p, path, block_size);
-        }
-#endif
-    };
-
-    static std::string name() { return "block_crs"; }
-
-    /// Copy matrix from builtin backend.
-    static std::shared_ptr<matrix>
-    copy_matrix(std::shared_ptr< typename backend::builtin<real>::matrix > A,
-            const params &prm)
-    {
-        return std::make_shared<matrix>(*A, prm.block_size);
-    }
-
-    /// Copy vector from builtin backend.
-    static std::shared_ptr<vector>
-    copy_vector(const vector &x, const params&)
-    {
-        return std::make_shared<vector>(x);
-    }
-
-    static std::shared_ptr< vector >
-    copy_vector(const std::vector<value_type> &x, const params&)
-    {
-        return std::make_shared<vector>(x);
-    }
-
-    /// Copy vector from builtin backend.
-    static std::shared_ptr<vector>
-    copy_vector(std::shared_ptr< vector > x, const params&)
-    {
-        return x;
-    }
-
-    /// Create vector of the specified size.
-    static std::shared_ptr<vector>
-    create_vector(size_t size, const params&)
-    {
-        return std::make_shared<vector>(size);
-    }
-
-    static std::shared_ptr<direct_solver>
-    create_solver(
-            std::shared_ptr< typename backend::builtin<real>::matrix > A,
-            const params&)
-    {
-        return std::make_shared<direct_solver>(*A);
-    }
-};
-
-//---------------------------------------------------------------------------
-// Specialization of backend interface
-//---------------------------------------------------------------------------
-template < typename V, typename C, typename P >
-struct rows_impl< bcrs<V, C, P> > {
-    static size_t get(const bcrs<V, C, P> &A) {
-        return A.nrows;
-    }
-};
-
-template < typename V, typename C, typename P >
-struct cols_impl< bcrs<V, C, P> > {
-    static size_t get(const bcrs<V, C, P> &A) {
-        return A.ncols;
-    }
-};
-
-template < typename V, typename C, typename P >
-struct nonzeros_impl< bcrs<V, C, P> > {
-    static size_t get(const bcrs<V, C, P> &A) {
-        return A.ptr.back() * A.block_size * A.block_size;
-    }
-};
-
-template < typename Alpha, typename Beta, typename V, typename C, typename P, class Vec1, class Vec2 >
-struct spmv_impl< Alpha, bcrs<V, C, P>, Vec1, Beta, Vec2 >
-{
-    typedef bcrs<V, C, P>  matrix;
-
-    static void apply(Alpha alpha, const matrix &A, const Vec1 &x, Beta beta, Vec2 &y)
-    {
-        const size_t nb  = A.brows;
-        const size_t na  = A.nrows;
-        const size_t ma  = A.ncols;
-        const size_t b1 = A.block_size;
-        const size_t b2 = b1 * b1;
-
-        if (!math::is_zero(beta)) {
-            if (beta != 1) {
-#pragma omp parallel for
-                for(ptrdiff_t i = 0; i < static_cast<ptrdiff_t>(na); ++i) {
-                    y[i] *= beta;
-                }
-            }
-        } else {
-            backend::clear(y);
-        }
-
-#pragma omp parallel for
-        for(ptrdiff_t ib = 0; ib < static_cast<ptrdiff_t>(nb); ++ib) {
-            for(P jb = A.ptr[ib], eb = A.ptr[ib + 1]; jb < eb; ++jb) {
-                size_t x0 = A.col[jb] * b1;
-                size_t y0 = ib * b1;
-                block_prod(b1, std::min(b1, ma - x0), std::min(b1, na - y0),
-                        alpha, &A.val[jb * b2], &x[x0], &y[y0]
-                        );
-            }
-        }
-    }
-
-    static void block_prod(size_t dim, size_t nx, size_t ny,
-            Alpha alpha, const V *A, const V *x, V *y)
-    {
-        for(size_t i = 0; i < ny; ++i, ++y) {
-            const V * xx = x;
-            V sum = 0;
-            for(size_t j = 0; j < dim; ++j, ++A, ++xx)
-                if (j < nx) sum += (*A) * (*xx);
-            *y += alpha * sum;
-        }
-    }
-};
-
-template < typename V, typename C, typename P, class Vec1, class Vec2, class Vec3 >
-struct residual_impl< bcrs<V, C, P>, Vec1, Vec2, Vec3 >
-{
-    typedef bcrs<V, C, P>  matrix;
-
-    static void apply(const Vec1 &rhs, const matrix &A, const Vec2 &x, Vec3 &r)
-    {
-        typedef typename math::scalar_of<V>::type S;
-        const auto one = math::identity<S>();
-        backend::copy(rhs, r);
-        backend::spmv(-one, A, x, one, r);
-    }
-};
-
-} // namespace backend
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/backend/builtin.hpp b/src/solvers/amgcl/backend/builtin.hpp
deleted file mode 100644
index 90a254e..0000000
--- a/src/solvers/amgcl/backend/builtin.hpp
+++ /dev/null
@@ -1,1372 +0,0 @@
-#ifndef AMGCL_BACKEND_BUILTIN_HPP
-#define AMGCL_BACKEND_BUILTIN_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/backend/builtin.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Builtin backend.
- */
-
-#include <vector>
-#include <numeric>
-#include <memory>
-#include <random>
-#include <type_traits>
-
-#ifdef _OPENMP
-#  include <omp.h>
-#endif
-
-#include <amgcl/util.hpp>
-#include <amgcl/backend/interface.hpp>
-#include <amgcl/solver/skyline_lu.hpp>
-#include <amgcl/detail/inverse.hpp>
-#include <amgcl/detail/sort_row.hpp>
-#include <amgcl/detail/spgemm.hpp>
-#include <amgcl/backend/detail/matrix_ops.hpp>
-
-namespace amgcl {
-namespace backend {
-
-/// Sparse matrix stored in CRS format.
-template <
-    typename val_t = double,
-    typename col_t = ptrdiff_t,
-    typename ptr_t = col_t
-    >
-struct crs {
-    typedef val_t value_type;
-    typedef val_t val_type;
-    typedef col_t col_type;
-    typedef ptr_t ptr_type;
-
-    size_t nrows, ncols, nnz;
-    ptr_type * ptr;
-    col_type * col;
-    val_type * val;
-    bool own_data;
-
-    crs() : nrows(0), ncols(0), nnz(0), ptr(0), col(0), val(0), own_data(true)
-    {}
-
-    template <
-        class PtrRange,
-        class ColRange,
-        class ValRange
-        >
-    crs(size_t nrows, size_t ncols,
-        const PtrRange &ptr_range,
-        const ColRange &col_range,
-        const ValRange &val_range
-        ) :
-        nrows(nrows), ncols(ncols), nnz(0),
-        ptr(0), col(0), val(0), own_data(true)
-    {
-        AMGCL_TIC("CSR copy");
-        precondition(static_cast<ptrdiff_t>(nrows + 1) == std::distance(
-                    std::begin(ptr_range), std::end(ptr_range)),
-                "ptr_range has wrong size in crs constructor");
-
-        nnz = ptr_range[nrows];
-
-        precondition(static_cast<ptrdiff_t>(nnz) == std::distance(
-                    std::begin(col_range), std::end(col_range)),
-                "col_range has wrong size in crs constructor");
-
-        precondition(static_cast<ptrdiff_t>(nnz) == std::distance(
-                    std::begin(val_range), std::end(val_range)),
-                "val_range has wrong size in crs constructor");
-
-        ptr = new ptr_type[nrows + 1];
-        col = new col_type[nnz];
-        val = new val_type[nnz];
-
-        ptr[0] = ptr_range[0];
-#pragma omp parallel for
-        for(ptrdiff_t i = 0; i < static_cast<ptrdiff_t>(nrows); ++i) {
-            ptr[i+1] = ptr_range[i+1];
-            for(auto j = ptr_range[i]; j < ptr_range[i+1]; ++j) {
-                col[j] = col_range[j];
-                val[j] = val_range[j];
-            }
-        }
-        AMGCL_TOC("CSR copy");
-    }
-
-    template <class Matrix>
-    crs(const Matrix &A) :
-        nrows(backend::rows(A)), ncols(backend::cols(A)),
-        nnz(0), ptr(0), col(0), val(0), own_data(true)
-    {
-        AMGCL_TIC("CSR copy");
-        ptr = new ptr_type[nrows + 1];
-        ptr[0] = 0;
-
-#pragma omp parallel for
-        for(ptrdiff_t i = 0; i < static_cast<ptrdiff_t>(nrows); ++i) {
-            int row_width = 0;
-            for(auto a = backend::row_begin(A, i); a; ++a) ++row_width;
-            ptr[i+1] = row_width;
-        }
-
-        nnz = scan_row_sizes();
-        col = new col_type[nnz];
-        val = new val_type[nnz];
-
-#pragma omp parallel for
-        for(ptrdiff_t i = 0; i < static_cast<ptrdiff_t>(nrows); ++i) {
-            ptr_type row_head = ptr[i];
-            for(auto a = backend::row_begin(A, i); a; ++a) {
-                col[row_head] = a.col();
-                val[row_head] = a.value();
-
-                ++row_head;
-            }
-        }
-        AMGCL_TOC("CSR copy");
-    }
-
-    crs(const crs &other) :
-        nrows(other.nrows), ncols(other.ncols), nnz(other.nnz),
-        ptr(0), col(0), val(0), own_data(true)
-    {
-        if (other.ptr && other.col && other.val) {
-            ptr = new ptr_type[nrows + 1];
-            col = new col_type[nnz];
-            val = new val_type[nnz];
-
-            ptr[0] = other.ptr[0];
-#pragma omp parallel for
-            for(ptrdiff_t i = 0; i < static_cast<ptrdiff_t>(nrows); ++i) {
-                ptr[i+1] = other.ptr[i+1];
-                for(ptr_type j = other.ptr[i]; j < other.ptr[i+1]; ++j) {
-                    col[j] = other.col[j];
-                    val[j] = other.val[j];
-                }
-            }
-        }
-    }
-
-    crs(crs &&other) :
-        nrows(other.nrows), ncols(other.ncols), nnz(other.nnz),
-        ptr(other.ptr), col(other.col), val(other.val),
-        own_data(other.own_data)
-    {
-        other.nrows = 0;
-        other.ncols = 0;
-        other.nnz   = 0;
-        other.ptr   = 0;
-        other.col   = 0;
-        other.val   = 0;
-    }
-
-    const crs& operator=(const crs &other) {
-        free_data();
-
-        nrows = other.nrows;
-        ncols = other.ncols;
-        nnz   = other.nnz;
-
-        if (other.ptr && other.col && other.val) {
-            ptr = new ptr_type[nrows + 1];
-            col = new col_type[nnz];
-            val = new val_type[nnz];
-
-            ptr[0] = other.ptr[0];
-#pragma omp parallel for
-            for(ptrdiff_t i = 0; i < static_cast<ptrdiff_t>(nrows); ++i) {
-                ptr[i+1] = other.ptr[i+1];
-                for(ptr_type j = other.ptr[i]; j < other.ptr[i+1]; ++j) {
-                    col[j] = other.col[j];
-                    val[j] = other.val[j];
-                }
-            }
-        }
-
-        return *this;
-    }
-
-    const crs& operator=(crs &&other) {
-        std::swap(nrows,    other.nrows);
-        std::swap(ncols,    other.ncols);
-        std::swap(nnz,      other.nnz);
-        std::swap(ptr,      other.ptr);
-        std::swap(col,      other.col);
-        std::swap(val,      other.val);
-        std::swap(own_data, other.own_data);
-
-        return *this;
-    }
-
-    void free_data() {
-        if (own_data) {
-            delete[] ptr; ptr = 0;
-            delete[] col; col = 0;
-            delete[] val; val = 0;
-        }
-    }
-
-    void set_size(size_t n, size_t m, bool clean_ptr = false) {
-        precondition(!ptr, "matrix data has already been allocated!");
-
-        nrows = n;
-        ncols = m;
-
-        ptr = new ptr_type[nrows + 1];
-
-        if (clean_ptr) {
-            ptr[0] = 0;
-#pragma omp parallel for
-            for(ptrdiff_t i = 0; i < static_cast<ptrdiff_t>(nrows); ++i)
-                ptr[i+1] = 0;
-        }
-    }
-
-    ptr_type scan_row_sizes() {
-        std::partial_sum(ptr, ptr + nrows + 1, ptr);
-        return ptr[nrows];
-    }
-
-    void set_nonzeros() {
-        set_nonzeros(ptr[nrows]);
-
-#pragma omp parallel for
-        for(ptrdiff_t i = 0; i < static_cast<ptrdiff_t>(nrows); ++i) {
-            ptrdiff_t row_beg = ptr[i];
-            ptrdiff_t row_end = ptr[i+1];
-            for(ptrdiff_t j = row_beg; j < row_end; ++j) {
-                col[j] = 0;
-                val[j] = math::zero<val_type>();
-            }
-        }
-    }
-
-    void set_nonzeros(size_t n, bool need_values = true) {
-        precondition(!col && !val, "matrix data has already been allocated!");
-
-        nnz = n;
-
-        col = new col_type[nnz];
-
-        if (need_values)
-            val = new val_type[nnz];
-    }
-
-    ~crs() {
-        free_data();
-    }
-
-    class row_iterator {
-        public:
-            row_iterator(
-                    const col_type * col,
-                    const col_type * end,
-                    const val_type * val
-                    ) : m_col(col), m_end(end), m_val(val)
-            {}
-
-            operator bool() const {
-                return m_col < m_end;
-            }
-
-            row_iterator& operator++() {
-                ++m_col;
-                ++m_val;
-                return *this;
-            }
-
-            col_type col() const {
-                return *m_col;
-            }
-
-            val_type value() const {
-                return *m_val;
-            }
-
-        private:
-            const col_type * m_col;
-            const col_type * m_end;
-            const val_type * m_val;
-    };
-
-    row_iterator row_begin(size_t row) const {
-        ptr_type p = ptr[row];
-        ptr_type e = ptr[row + 1];
-        return row_iterator(col + p, col + e, val + p);
-    }
-
-    size_t bytes() const {
-        if (own_data) {
-            return sizeof(ptr_type) * (nrows + 1)
-                 + sizeof(col_type) * nnz
-                 + sizeof(val_type) * nnz;
-        } else {
-            return 0;
-        }
-    }
-};
-
-/// Sort rows of the matrix column-wise.
-template < typename V, typename C, typename P >
-void sort_rows(crs<V, C, P> &A) {
-    const size_t n = rows(A);
-
-#pragma omp parallel for
-    for(ptrdiff_t i = 0; i < static_cast<ptrdiff_t>(n); ++i) {
-        P beg = A.ptr[i];
-        P end = A.ptr[i + 1];
-        amgcl::detail::sort_row(A.col + beg, A.val + beg, end - beg);
-    }
-}
-
-/// Transpose of a sparse matrix.
-template < typename V, typename C, typename P >
-std::shared_ptr< crs<V,C,P> > transpose(const crs<V, C, P> &A)
-{
-    const size_t n   = rows(A);
-    const size_t m   = cols(A);
-    const size_t nnz = nonzeros(A);
-
-    auto T = std::make_shared< crs<V,C,P> >();
-    T->set_size(m, n, true);
-
-    for(size_t j = 0; j < nnz; ++j)
-        ++( T->ptr[A.col[j] + 1] );
-
-    T->scan_row_sizes();
-    T->set_nonzeros();
-
-    for(size_t i = 0; i < n; i++) {
-        for(P j = A.ptr[i], e = A.ptr[i + 1]; j < e; ++j) {
-            P head = T->ptr[A.col[j]]++;
-
-            T->col[head] = static_cast<C>(i);
-            T->val[head] = math::adjoint(A.val[j]);
-        }
-    }
-
-    std::rotate(T->ptr, T->ptr + m, T->ptr + m + 1);
-    T->ptr[0] = 0;
-
-    return T;
-}
-
-/// Matrix-matrix product.
-template <class Val, class Col, class Ptr>
-std::shared_ptr< crs<Val, Col, Ptr> >
-product(const crs<Val,Col,Ptr> &A, const crs<Val,Col,Ptr> &B, bool sort = false) {
-    auto C = std::make_shared< crs<Val,Col,Ptr> >();
-
-#ifdef _OPENMP
-    int nt = omp_get_max_threads();
-#else
-    int nt = 1;
-#endif
-
-    if (nt > 16) {
-        spgemm_rmerge(A, B, *C);
-    } else {
-        spgemm_saad(A, B, *C, sort);
-    }
-
-    return C;
-}
-
-/// Sum of two matrices
-template <class Val, class Col, class Ptr>
-std::shared_ptr< crs<Val, Col, Ptr> >
-sum(Val alpha, const crs<Val,Col,Ptr> &A, Val beta, const crs<Val,Col,Ptr> &B, bool sort = false) {
-    typedef ptrdiff_t Idx;
-
-    auto C = std::make_shared< crs<Val,Col,Ptr> >();
-    precondition(A.nrows == B.nrows && A.ncols == B.ncols , "matrices should have same shape!");
-    C->set_size(A.nrows, A.ncols);
-
-    C->ptr[0] = 0;
-
-#pragma omp parallel
-    {
-        std::vector<ptrdiff_t> marker(C->ncols, -1);
-
-#pragma omp for
-        for(Idx i = 0; i < static_cast<Idx>(C->nrows); ++i) {
-            Idx C_cols = 0;
-
-            for(Idx j = A.ptr[i], e = A.ptr[i+1]; j < e; ++j) {
-                Idx c = A.col[j];
-
-                if (marker[c] != i) {
-                    marker[c]  = i;
-                    ++C_cols;
-                }
-            }
-
-            for(Idx j = B.ptr[i], e = B.ptr[i+1]; j < e; ++j) {
-                Idx c = B.col[j];
-
-                if (marker[c] != i) {
-                    marker[c]  = i;
-                    ++C_cols;
-                }
-            }
-
-            C->ptr[i + 1] = C_cols;
-        }
-    }
-
-    C->set_nonzeros(C->scan_row_sizes());
-
-#pragma omp parallel
-    {
-        std::vector<ptrdiff_t> marker(C->ncols, -1);
-
-#pragma omp for
-        for(Idx i = 0; i < static_cast<Idx>(C->nrows); ++i) {
-            Idx row_beg = C->ptr[i];
-            Idx row_end = row_beg;
-
-            for(Idx j = A.ptr[i], e = A.ptr[i+1]; j < e; ++j) {
-                Idx c = A.col[j];
-                Val v = alpha * A.val[j];
-
-                if (marker[c] < row_beg) {
-                    marker[c] = row_end;
-                    C->col[row_end] = c;
-                    C->val[row_end] = v;
-                    ++row_end;
-                } else {
-                    C->val[marker[c]] += v;
-                }
-            }
-
-            for(Idx j = B.ptr[i], e = B.ptr[i+1]; j < e; ++j) {
-                Idx c = B.col[j];
-                Val v = beta * B.val[j];
-
-                if (marker[c] < row_beg) {
-                    marker[c] = row_end;
-                    C->col[row_end] = c;
-                    C->val[row_end] = v;
-                    ++row_end;
-                } else {
-                    C->val[marker[c]] += v;
-                }
-            }
-
-            if (sort) amgcl::detail::sort_row(
-                    C->col + row_beg, C->val + row_beg, row_end - row_beg);
-        }
-    }
-
-    return C;
-}
-
-/// Scale matrix values.
-template<class Val, class Col, class Ptr, class T>
-void scale(crs<Val, Col, Ptr> &A, T s) {
-    ptrdiff_t n = backend::rows(A);
-
-#pragma omp parallel for
-    for(ptrdiff_t i = 0; i < n; ++i) {
-        for(ptrdiff_t j = A.ptr[i], e = A.ptr[i+1]; j < e; ++j)
-            A.val[j] *= s;
-    }
-}
-
-// Reduce matrix to a pointwise one
-template <class value_type, class col_type, class ptr_type>
-std::shared_ptr<
-    crs< typename math::scalar_of<value_type>::type, col_type, ptr_type >
-    >
-pointwise_matrix(const crs<value_type, col_type, ptr_type> &A, unsigned block_size) {
-    typedef value_type V;
-    typedef typename math::scalar_of<V>::type S;
-
-    AMGCL_TIC("pointwise_matrix");
-    const ptrdiff_t n  = A.nrows;
-    const ptrdiff_t m  = A.ncols;
-    const ptrdiff_t np = n / block_size;
-    const ptrdiff_t mp = m / block_size;
-
-    precondition(np * block_size == n,
-            "Matrix size should be divisible by block_size");
-
-    auto ap = std::make_shared< crs<S, col_type, ptr_type> >();
-    auto &Ap = *ap;
-
-    Ap.set_size(np, mp, true);
-
-#pragma omp parallel
-    {
-        std::vector<ptr_type> j(block_size);
-        std::vector<ptr_type> e(block_size);
-
-        // Count number of nonzeros in block matrix.
-#pragma omp for
-        for(ptrdiff_t ip = 0; ip < np; ++ip) {
-            ptrdiff_t ia = ip * block_size;
-            col_type cur_col = 0;
-            bool done = true;
-
-            for(unsigned k = 0; k < block_size; ++k) {
-                ptr_type beg = j[k] = A.ptr[ia + k];
-                ptr_type end = e[k] = A.ptr[ia + k + 1];
-
-                if (beg == end) continue;
-
-                col_type c = A.col[beg];
-
-                if (done) {
-                    done = false;
-                    cur_col = c;
-                } else {
-                    cur_col = std::min(cur_col, c);
-                }
-            }
-
-            while(!done) {
-                cur_col /= block_size;
-                ++Ap.ptr[ip + 1];
-
-                done = true;
-                col_type col_end = (cur_col + 1) * block_size;
-                for(unsigned k = 0; k < block_size; ++k) {
-                    ptr_type beg = j[k];
-                    ptr_type end = e[k];
-
-                    while(beg < end) {
-                        col_type c = A.col[beg++];
-
-                        if (c >= col_end) {
-                            if (done) {
-                                done = false;
-                                cur_col = c;
-                            } else {
-                                cur_col = std::min(cur_col, c);
-                            }
-
-                            break;
-                        }
-                    }
-
-                    j[k] = beg;
-                }
-            }
-        }
-    }
-
-    Ap.set_nonzeros(Ap.scan_row_sizes());
-
-#pragma omp parallel
-    {
-        std::vector<ptr_type> j(block_size);
-        std::vector<ptr_type> e(block_size);
-
-#pragma omp for
-        for(ptrdiff_t ip = 0; ip < np; ++ip) {
-            ptrdiff_t ia = ip * block_size;
-            col_type cur_col = 0;
-            ptr_type head = Ap.ptr[ip];
-            bool done = true;
-
-            for(unsigned k = 0; k < block_size; ++k) {
-                ptr_type beg = j[k] = A.ptr[ia + k];
-                ptr_type end = e[k] = A.ptr[ia + k + 1];
-
-                if (beg == end) continue;
-
-                col_type c = A.col[beg];
-
-                if (done) {
-                    done = false;
-                    cur_col = c;
-                } else {
-                    cur_col = std::min(cur_col, c);
-                }
-            }
-
-            while(!done) {
-                cur_col /= block_size;
-
-                Ap.col[head] = cur_col;
-
-                done = true;
-                bool first = true;
-                S cur_val = math::zero<S>();
-
-                col_type col_end = (cur_col + 1) * block_size;
-                for(unsigned k = 0; k < block_size; ++k) {
-                    ptr_type beg = j[k];
-                    ptr_type end = e[k];
-
-                    while(beg < end) {
-                        col_type c = A.col[beg];
-                        S v = math::norm(A.val[beg]);
-                        ++beg;
-
-                        if (c >= col_end) {
-                            if (done) {
-                                done = false;
-                                cur_col = c;
-                            } else {
-                                cur_col = std::min(cur_col, c);
-                            }
-
-                            break;
-                        }
-
-
-                        if (first) {
-                            first = false;
-                            cur_val = v;
-                        } else {
-                            cur_val = std::max(cur_val, v);
-                        }
-                    }
-
-                    j[k] = beg;
-                }
-
-                Ap.val[head++] = cur_val;
-            }
-        }
-    }
-
-    AMGCL_TOC("pointwise_matrix");
-    return ap;
-}
-
-/** NUMA-aware vector container. */
-template <class T>
-class numa_vector {
-    public:
-        typedef T value_type;
-
-        numa_vector() : n(0), p(0) {}
-
-        numa_vector(size_t n, bool init = true) : n(n), p(new T[n]) {
-            if (init) {
-#pragma omp parallel for
-                for(ptrdiff_t i = 0; i < static_cast<ptrdiff_t>(n); ++i)
-                    p[i] = math::zero<T>();
-            }
-        }
-
-        void resize(size_t size, bool init = true) {
-            delete[] p; p = 0;
-
-            n = size;
-            p = new T[n];
-
-            if (init) {
-#pragma omp parallel for
-                for(ptrdiff_t i = 0; i < static_cast<ptrdiff_t>(n); ++i)
-                    p[i] = math::zero<T>();
-            }
-        }
-
-        template <class Vector>
-        numa_vector(const Vector &other,
-                typename std::enable_if<!std::is_integral<Vector>::value, int>::type = 0
-                ) : n(other.size()), p(new T[n])
-        {
-#pragma omp parallel for
-            for(ptrdiff_t i = 0; i < static_cast<ptrdiff_t>(n); ++i)
-                p[i] = other[i];
-        }
-
-        template <class Iterator>
-        numa_vector(Iterator beg, Iterator end)
-            : n(std::distance(beg, end)), p(new T[n])
-        {
-            static_assert(std::is_same<
-                    std::random_access_iterator_tag,
-                    typename std::iterator_traits<Iterator>::iterator_category
-                    >::value,
-                    "Iterator has to be random access");
-
-#pragma omp parallel for
-            for(ptrdiff_t i = 0; i < static_cast<ptrdiff_t>(n); ++i)
-                p[i] = beg[i];
-        }
-
-        ~numa_vector() {
-            delete[] p; p = 0;
-        }
-
-        inline size_t size() const {
-            return n;
-        }
-
-        inline const T& operator[](size_t i) const {
-            return p[i];
-        }
-
-        inline T& operator[](size_t i) {
-            return p[i];
-        }
-
-        inline const T* data() const {
-            return p;
-        }
-
-        inline T* data() {
-            return p;
-        }
-
-        void swap(numa_vector &other) {
-            std::swap(n, other.n);
-            std::swap(p, other.p);
-        }
-
-    private:
-        size_t n;
-        T *p;
-};
-
-/// Diagonal of a matrix
-template < typename V, typename C, typename P >
-std::shared_ptr< numa_vector<V> > diagonal(const crs<V, C, P> &A, bool invert = false)
-{
-    const size_t n = rows(A);
-    auto dia = std::make_shared< numa_vector<V> >(n, false);
-
-#pragma omp parallel for
-    for(ptrdiff_t i = 0; i < static_cast<ptrdiff_t>(n); ++i) {
-        for(auto a = A.row_begin(i); a; ++a) {
-            if (a.col() == i) {
-                V d = a.value();
-                if (invert) {
-                    d = math::is_zero(d) ? math::identity<V>() : math::inverse(d);
-                }
-                (*dia)[i] = d;
-                break;
-            }
-        }
-    }
-
-    return dia;
-}
-
-// Estimate spectral radius of the matrix.
-// Use Gershgorin disk theorem when power_iters == 0,
-// Use Power method when power_iters > 0.
-// When scale = true, scale the matrix by its inverse diagonal.
-template <bool scale, class Matrix>
-static typename math::scalar_of<typename backend::value_type<Matrix>::type>::type
-spectral_radius(const Matrix &A, int power_iters = 0) {
-    AMGCL_TIC("spectral radius");
-    typedef typename backend::value_type<Matrix>::type   value_type;
-    typedef typename math::rhs_of<value_type>::type      rhs_type;
-    typedef typename math::scalar_of<value_type>::type   scalar_type;
-
-    const ptrdiff_t n = backend::rows(A);
-    scalar_type radius;
-
-    if (power_iters <= 0) {
-        // Use Gershgorin disk theorem.
-        radius = 0;
-
-#pragma omp parallel
-        {
-            scalar_type emax = 0;
-            value_type  dia = math::identity<value_type>();
-
-#pragma omp for nowait
-            for(ptrdiff_t i = 0; i < n; ++i) {
-                scalar_type s = 0;
-
-                for(ptrdiff_t j = A.ptr[i], e = A.ptr[i+1]; j < e; ++j) {
-                    ptrdiff_t  c = A.col[j];
-                    value_type v = A.val[j];
-
-                    s += math::norm(v);
-
-                    if (scale && c == i) dia = v;
-                }
-
-                if (scale) s *= math::norm(math::inverse(dia));
-
-                emax = std::max(emax, s);
-            }
-
-#pragma omp critical
-            radius = std::max(radius, emax);
-        }
-    } else {
-        // Power method.
-        backend::numa_vector<rhs_type> b0(n, false), b1(n, false);
-
-        // Fill the initial vector with random values.
-        // Also extract the inverted matrix diagonal values.
-        scalar_type b0_norm = 0;
-#pragma omp parallel
-        {
-#ifdef _OPENMP
-            int tid = omp_get_thread_num();
-#else
-            int tid = 0;
-#endif
-            std::mt19937 rng(tid);
-            std::uniform_real_distribution<scalar_type> rnd(-1, 1);
-
-            scalar_type loc_norm = 0;
-
-#pragma omp for nowait
-            for(ptrdiff_t i = 0; i < n; ++i) {
-                rhs_type v = math::constant<rhs_type>(rnd(rng));
-
-                b0[i] = v;
-                loc_norm += math::norm(math::inner_product(v,v));
-            }
-
-#pragma omp critical
-            b0_norm += loc_norm;
-        }
-
-        // Normalize b0
-        b0_norm = 1 / sqrt(b0_norm);
-#pragma omp parallel for
-        for(ptrdiff_t i = 0; i < n; ++i) {
-            b0[i] = b0_norm * b0[i];
-        }
-
-        for(int iter = 0; iter < power_iters;) {
-            // b1 = scale ? (D^1 * A) * b0 : A * b0
-            // b1_norm = ||b1||
-            // radius = <b1,b0>
-            scalar_type b1_norm = 0;
-            radius = 0;
-#pragma omp parallel
-            {
-                scalar_type loc_norm = 0;
-                scalar_type loc_radi = 0;
-                value_type  dia = math::identity<value_type>();
-
-#pragma omp for nowait
-                for(ptrdiff_t i = 0; i < n; ++i) {
-                    rhs_type s = math::zero<rhs_type>();
-
-                    for(ptrdiff_t j = A.ptr[i], e = A.ptr[i+1]; j < e; ++j) {
-                        ptrdiff_t  c = A.col[j];
-                        value_type v = A.val[j];
-                        if (scale && c == i) dia = v;
-                        s += v * b0[c];
-                    }
-
-                    if (scale) s = math::inverse(dia) * s;
-
-                    loc_norm += math::norm(math::inner_product(s, s));
-                    loc_radi += math::norm(math::inner_product(s, b0[i]));
-
-                    b1[i] = s;
-                }
-
-#pragma omp critical
-                {
-                    b1_norm += loc_norm;
-                    radius  += loc_radi;
-                }
-            }
-
-            if (++iter < power_iters) {
-                // b0 = b1 / b1_norm
-                b1_norm = 1 / sqrt(b1_norm);
-#pragma omp parallel for
-                for(ptrdiff_t i = 0; i < n; ++i) {
-                    b0[i] = b1_norm * b1[i];
-                }
-            }
-        }
-    }
-    AMGCL_TOC("spectral radius");
-
-    return radius < 0 ? static_cast<scalar_type>(2) : radius;
-}
-
-/**
- * The builtin backend does not have any dependencies, and uses OpenMP for
- * parallelization. Matrices are stored in the CRS format, and vectors are
- * instances of ``std::vector<value_type>``. There is no usual overhead of
- * moving the constructed hierarchy to the builtin backend, since the backend
- * is used internally during setup.
- */
-template <typename ValueType, typename ColumnType = ptrdiff_t, typename PointerType = ColumnType>
-struct builtin {
-    typedef ValueType      value_type;
-    typedef ColumnType     index_type;
-    typedef ColumnType     col_type;
-    typedef PointerType    ptr_type;
-
-    typedef typename math::rhs_of<value_type>::type rhs_type;
-
-    struct provides_row_iterator : std::true_type {};
-
-    typedef crs<value_type, col_type, ptr_type>  matrix;
-    typedef numa_vector<rhs_type>                vector;
-    typedef numa_vector<value_type>              matrix_diagonal;
-    typedef solver::skyline_lu<value_type>       direct_solver;
-
-    /// The backend has no parameters.
-    typedef amgcl::detail::empty_params params;
-
-    static std::string name() { return "builtin"; }
-
-    // Copy matrix. This is a noop for builtin backend.
-    static std::shared_ptr<matrix>
-    copy_matrix(std::shared_ptr<matrix> A, const params&)
-    {
-        return A;
-    }
-
-    // Copy vector to builtin backend.
-    template <class T>
-    static std::shared_ptr< numa_vector<T> >
-    copy_vector(const std::vector<T> &x, const params&)
-    {
-        return std::make_shared< numa_vector<T> >(x);
-    }
-
-    // Copy vector to builtin backend. This is a noop for builtin backend.
-    template <class T>
-    static std::shared_ptr< numa_vector<T> >
-    copy_vector(std::shared_ptr< numa_vector<T> > x, const params&)
-    {
-        return x;
-    }
-
-    // Create vector of the specified size.
-    static std::shared_ptr<vector>
-    create_vector(size_t size, const params&)
-    {
-        return std::make_shared<vector>(size);
-    }
-
-    struct gather {
-        std::vector<ptrdiff_t> I;
-
-        gather(size_t /*size*/, const std::vector<ptrdiff_t> &I, const params&)
-            : I(I) { }
-
-        template <class InVec, class OutVec>
-        void operator()(const InVec &vec, OutVec &vals) const {
-            for(size_t i = 0; i < I.size(); ++i)
-                vals[i] = vec[I[i]];
-        }
-    };
-
-    struct scatter {
-        std::vector<ptrdiff_t> I;
-
-        scatter(size_t /*size*/, const std::vector<ptrdiff_t> &I, const params&)
-            : I(I) { }
-
-        template <class InVec, class OutVec>
-        void operator()(const InVec &vals, OutVec &vec) const {
-            for(size_t i = 0; i < I.size(); ++i)
-                vec[I[i]] = vals[i];
-        }
-    };
-
-    // Create direct solver for coarse level
-    static std::shared_ptr<direct_solver>
-    create_solver(std::shared_ptr<matrix> A, const params&) {
-        return std::make_shared<direct_solver>(*A);
-    }
-};
-
-template <class T>
-struct is_builtin_vector : std::false_type {};
-
-template <class V>
-struct is_builtin_vector< std::vector<V> > : std::is_arithmetic<V> {};
-
-template <class V>
-struct is_builtin_vector< numa_vector<V> > : std::true_type {};
-
-//---------------------------------------------------------------------------
-// Specialization of backend interface
-//---------------------------------------------------------------------------
-template <typename T1, typename T2>
-struct backends_compatible< builtin<T1>, builtin<T2> > : std::true_type {};
-
-template < typename V, typename C, typename P >
-struct rows_impl< crs<V, C, P> > {
-    static size_t get(const crs<V, C, P> &A) {
-        return A.nrows;
-    }
-};
-
-template < typename V, typename C, typename P >
-struct cols_impl< crs<V, C, P> > {
-    static size_t get(const crs<V, C, P> &A) {
-        return A.ncols;
-    }
-};
-
-template < class Vec >
-struct bytes_impl<
-    Vec,
-    typename std::enable_if< is_builtin_vector<Vec>::value >::type
-    >
-{
-    static size_t get(const Vec &x) {
-        typedef typename backend::value_type<Vec>::type V;
-        return x.size() * sizeof(V);
-    }
-};
-
-template < typename V, typename C, typename P >
-struct ptr_data_impl< crs<V, C, P> > {
-    typedef const P* type;
-    static type get(const crs<V, C, P> &A) {
-        return &A.ptr[0];
-    }
-};
-
-template < typename V, typename C, typename P >
-struct col_data_impl< crs<V, C, P> > {
-    typedef const C* type;
-    static type get(const crs<V, C, P> &A) {
-        return &A.col[0];
-    }
-};
-
-template < typename V, typename C, typename P >
-struct val_data_impl< crs<V, C, P> > {
-    typedef const V* type;
-    static type get(const crs<V, C, P> &A) {
-        return &A.val[0];
-    }
-};
-
-template < typename V, typename C, typename P >
-struct nonzeros_impl< crs<V, C, P> > {
-    static size_t get(const crs<V, C, P> &A) {
-        return A.nrows == 0 ? 0 : A.ptr[A.nrows];
-    }
-};
-
-template < typename V, typename C, typename P >
-struct row_nonzeros_impl< crs<V, C, P> > {
-    static size_t get(const crs<V, C, P> &A, size_t row) {
-        return A.ptr[row + 1] - A.ptr[row];
-    }
-};
-
-template < class Vec >
-struct clear_impl<
-    Vec,
-    typename std::enable_if< is_builtin_vector<Vec>::value >::type
-    >
-{
-    static void apply(Vec &x)
-    {
-        typedef typename backend::value_type<Vec>::type V;
-
-        const size_t n = x.size();
-#pragma omp parallel for
-        for(ptrdiff_t i = 0; i < static_cast<ptrdiff_t>(n); ++i) {
-            x[i] = math::zero<V>();
-        }
-    }
-};
-
-template < class Vec1, class Vec2 >
-struct inner_product_impl<
-    Vec1, Vec2,
-    typename std::enable_if<
-        is_builtin_vector<Vec1>::value &&
-        is_builtin_vector<Vec2>::value
-        >::type
-    >
-{
-    typedef typename value_type<Vec1>::type V;
-
-    typedef typename math::inner_product_impl<V>::return_type return_type;
-
-    static return_type get(const Vec1 &x, const Vec2 &y) {
-#ifdef _OPENMP
-        if (omp_get_max_threads() > 1) {
-            return parallel(x, y);
-        } else
-#endif
-        {
-            return serial(x, y);
-        }
-    }
-
-    static return_type serial(const Vec1 &x, const Vec2 &y) {
-        const size_t n = x.size();
-
-        return_type s = math::zero<return_type>();
-        return_type c = math::zero<return_type>();
-
-        for(ptrdiff_t i = 0; i < static_cast<ptrdiff_t>(n); ++i) {
-            return_type d = math::inner_product(x[i], y[i]) - c;
-            return_type t = s + d;
-            c = (t - s) - d;
-            s = t;
-        }
-
-        return s;
-    }
-
-#ifdef _OPENMP
-#  ifndef AMGCL_MAX_OPENMP_THREADS
-#    define AMGCL_MAX_OPENMP_THREADS 64
-#  endif
-    static return_type parallel(const Vec1 &x, const Vec2 &y)
-    {
-        const size_t n = x.size();
-        return_type              _sum_stat[AMGCL_MAX_OPENMP_THREADS];
-        std::vector<return_type> _sum_dyna;
-        return_type              *sum;
-
-        const int nt = omp_get_max_threads();
-
-        if (nt < 64) {
-            sum = _sum_stat;
-            for(int i = 0; i < nt; ++i) {
-                sum[i] = math::zero<return_type>();
-            }
-        } else {
-            _sum_dyna.resize(nt, math::zero<return_type>());
-            sum = _sum_dyna.data();
-        }
-
-#pragma omp parallel
-        {
-            const int tid = omp_get_thread_num();
-
-            return_type s = math::zero<return_type>();
-            return_type c = math::zero<return_type>();
-
-#pragma omp for nowait
-            for(ptrdiff_t i = 0; i < static_cast<ptrdiff_t>(n); ++i) {
-                return_type d = math::inner_product(x[i], y[i]) - c;
-                return_type t = s + d;
-                c = (t - s) - d;
-                s = t;
-            }
-
-            sum[tid] = s;
-        }
-
-        return std::accumulate(sum, sum + nt, math::zero<return_type>());
-    }
-#endif
-};
-
-template <class A, class Vec1, class B, class Vec2 >
-struct axpby_impl<
-    A, Vec1, B, Vec2,
-    typename std::enable_if<
-        is_builtin_vector<Vec1>::value &&
-        is_builtin_vector<Vec2>::value
-        >::type
-    >
-{
-    static void apply(A a, const Vec1 &x, B b, Vec2 &y)
-    {
-        const size_t n = x.size();
-        if (!math::is_zero(b)) {
-#pragma omp parallel for
-            for(ptrdiff_t i = 0; i < static_cast<ptrdiff_t>(n); ++i) {
-                y[i] = a * x[i] + b * y[i];
-            }
-        } else {
-#pragma omp parallel for
-            for(ptrdiff_t i = 0; i < static_cast<ptrdiff_t>(n); ++i) {
-                y[i] = a * x[i];
-            }
-        }
-    }
-};
-
-template < class A, class Vec1, class B, class Vec2, class C, class Vec3 >
-struct axpbypcz_impl<
-    A, Vec1, B, Vec2, C, Vec3,
-    typename std::enable_if<
-        is_builtin_vector<Vec1>::value &&
-        is_builtin_vector<Vec2>::value &&
-        is_builtin_vector<Vec3>::value
-        >::type
-    >
-{
-    static void apply(A a, const Vec1 &x, B b, const Vec2 &y, C c, Vec3 &z)
-    {
-        const size_t n = x.size();
-        if (!math::is_zero(c)) {
-#pragma omp parallel for
-            for(ptrdiff_t i = 0; i < static_cast<ptrdiff_t>(n); ++i) {
-                z[i] = a * x[i] + b * y[i] + c * z[i];
-            }
-        } else {
-#pragma omp parallel for
-            for(ptrdiff_t i = 0; i < static_cast<ptrdiff_t>(n); ++i) {
-                z[i] = a * x[i] + b * y[i];
-            }
-        }
-    }
-};
-
-template < class Alpha, class Vec1, class Vec2, class Beta, class Vec3 >
-struct vmul_impl<
-    Alpha, Vec1, Vec2, Beta, Vec3,
-    typename std::enable_if<
-        is_builtin_vector<Vec1>::value &&
-        is_builtin_vector<Vec2>::value &&
-        is_builtin_vector<Vec3>::value &&
-        math::static_rows<typename value_type<Vec1>::type>::value == math::static_rows<typename value_type<Vec2>::type>::value &&
-        math::static_rows<typename value_type<Vec1>::type>::value == math::static_rows<typename value_type<Vec3>::type>::value
-        >::type
-    >
-{
-    static void apply(Alpha a, const Vec1 &x, const Vec2 &y, Beta b, Vec3 &z)
-    {
-        const size_t n = x.size();
-        if (!math::is_zero(b)) {
-#pragma omp parallel for
-            for(ptrdiff_t i = 0; i < static_cast<ptrdiff_t>(n); ++i) {
-                z[i] = a * x[i] * y[i] + b * z[i];
-            }
-        } else {
-#pragma omp parallel for
-            for(ptrdiff_t i = 0; i < static_cast<ptrdiff_t>(n); ++i) {
-                z[i] = a * x[i] * y[i];
-            }
-        }
-    }
-};
-
-// Support for mixed scalar/nonscalar types
-template < class Alpha, class Vec1, class Vec2, class Beta, class Vec3 >
-struct vmul_impl<
-    Alpha, Vec1, Vec2, Beta, Vec3,
-    typename std::enable_if<
-        is_builtin_vector<Vec1>::value &&
-        is_builtin_vector<Vec2>::value &&
-        is_builtin_vector<Vec3>::value &&
-        (
-         math::static_rows<typename value_type<Vec1>::type>::value != math::static_rows<typename value_type<Vec2>::type>::value ||
-         math::static_rows<typename value_type<Vec1>::type>::value != math::static_rows<typename value_type<Vec3>::type>::value
-        )
-        >::type
-    >
-{
-    static void apply(Alpha a, const Vec1 &x, const Vec2 &y, Beta b, Vec3 &z)
-    {
-        typedef typename value_type<Vec1>::type     M_type;
-        auto Y = backend::reinterpret_as_rhs<M_type>(y);
-        auto Z = backend::reinterpret_as_rhs<M_type>(z);
-
-        const size_t n = x.size();
-
-        if (!math::is_zero(b)) {
-#pragma omp parallel for
-            for(ptrdiff_t i = 0; i < static_cast<ptrdiff_t>(n); ++i) {
-                Z[i] = a * x[i] * Y[i] + b * Z[i];
-            }
-        } else {
-#pragma omp parallel for
-            for(ptrdiff_t i = 0; i < static_cast<ptrdiff_t>(n); ++i) {
-                Z[i] = a * x[i] * Y[i];
-            }
-        }
-    }
-};
-
-template < class Vec1, class Vec2 >
-struct copy_impl<
-    Vec1, Vec2,
-    typename std::enable_if<
-        is_builtin_vector<Vec1>::value &&
-        is_builtin_vector<Vec2>::value
-        >::type
-    >
-{
-    static void apply(const Vec1 &x, Vec2 &y)
-    {
-        const size_t n = x.size();
-#pragma omp parallel for
-        for(ptrdiff_t i = 0; i < static_cast<ptrdiff_t>(n); ++i) {
-            y[i] = x[i];
-        }
-    }
-};
-
-template <class MatrixValue, class Vector, bool IsConst>
-struct reinterpret_as_rhs_impl<
-    MatrixValue, Vector, IsConst,
-    typename std::enable_if<is_builtin_vector<Vector>::value>::type
-    >
-{
-    typedef typename backend::value_type<Vector>::type src_type;
-    typedef typename math::scalar_of<src_type>::type scalar_type;
-    typedef typename math::rhs_of<MatrixValue>::type rhs_type;
-    typedef typename math::replace_scalar<rhs_type, scalar_type>::type dst_type;
-    typedef typename std::conditional<IsConst, const dst_type*, dst_type*>::type ptr_type;
-    typedef iterator_range<ptr_type> return_type;
-
-    template <class V>
-    static return_type get(V &&x) {
-        auto ptr = reinterpret_cast<ptr_type>(&x[0]);
-        const size_t n = x.size() * sizeof(src_type) / sizeof(dst_type);
-        return make_iterator_range(ptr, ptr + n);
-    }
-};
-
-namespace detail {
-
-template <typename V, typename C, typename P>
-struct use_builtin_matrix_ops< amgcl::backend::crs<V, C, P> >
-    : std::true_type
-{};
-
-} // namespace detail
-
-} // namespace backend
-} // namespace amgcl
-
-
-// Allow to use boost::iterator_range as vector in builtin backend:
-namespace boost { template <class Iterator> class iterator_range; }
-
-namespace amgcl {
-namespace backend {
-
-template <class Iterator>
-struct is_builtin_vector< amgcl::iterator_range<Iterator> > : std::true_type {};
-
-template <class Iterator>
-struct is_builtin_vector< boost::iterator_range<Iterator> > : std::true_type {};
-
-} // namespace backend
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/backend/builtin_hybrid.hpp b/src/solvers/amgcl/backend/builtin_hybrid.hpp
deleted file mode 100644
index b512b20..0000000
--- a/src/solvers/amgcl/backend/builtin_hybrid.hpp
+++ /dev/null
@@ -1,69 +0,0 @@
-#ifndef AMGCL_BACKEND_BUILTIN_HYBRID_HPP
-#define AMGCL_BACKEND_BUILTIN_HYBRID_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/backend/builtin_hybrid.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Builtin backend that uses scalar matrices to build the hierarchy, but stores the computed matrix in block format.
- */
-
-#include <amgcl/backend/builtin.hpp>
-#include <amgcl/value_type/interface.hpp>
-#include <amgcl/adapter/block_matrix.hpp>
-
-namespace amgcl {
-namespace backend {
-
-// Hybrid backend uses scalar matrices to build the hierarchy,
-// but stores the computed matrices in the block format.
-template <typename BlockType, typename ColumnType = ptrdiff_t, typename PointerType = ColumnType>
-struct builtin_hybrid : public builtin<typename math::scalar_of<BlockType>::type, ColumnType, PointerType>
-{
-    typedef typename math::scalar_of<BlockType>::type ScalarType;
-    typedef builtin<ScalarType, ColumnType, PointerType> Base;
-    typedef crs<BlockType, ColumnType, PointerType> matrix;
-    struct provides_row_iterator : std::false_type {};
-
-    static std::shared_ptr<matrix>
-    copy_matrix(std::shared_ptr<typename Base::matrix> As, const typename Base::params&)
-    {
-        return std::make_shared<matrix>(amgcl::adapter::block_matrix<BlockType>(*As));
-    }
-};
-
-template <typename B1, typename B2, typename C, typename P>
-struct backends_compatible< builtin_hybrid<B1, C, P>, builtin_hybrid<B2, C, P> > : std::true_type {};
-
-template <typename T1, typename B2, typename C, typename P>
-struct backends_compatible< builtin<T1, C, P>, builtin_hybrid<B2, C, P> > : std::true_type {};
-
-template <typename B1, typename T2, typename C, typename P>
-struct backends_compatible< builtin_hybrid<B1, C, P>, builtin<T2, C, P> > : std::true_type {};
-
-} // namespace backend
-} // namespace amgcl
-#endif
diff --git a/src/solvers/amgcl/backend/cuda.hpp b/src/solvers/amgcl/backend/cuda.hpp
deleted file mode 100644
index a0b45dc..0000000
--- a/src/solvers/amgcl/backend/cuda.hpp
+++ /dev/null
@@ -1,753 +0,0 @@
-#ifndef AMGCL_BACKEND_CUDA_HPP
-#define AMGCL_BACKEND_CUDA_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/backend/cuda.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  CUDA backend.
- */
-
-#include <type_traits>
-#include <memory>
-
-#include <amgcl/backend/builtin.hpp>
-#include <amgcl/solver/skyline_lu.hpp>
-#include <amgcl/util.hpp>
-
-#include <thrust/device_vector.h>
-#include <thrust/fill.h>
-#include <thrust/copy.h>
-#include <thrust/gather.h>
-#include <thrust/scatter.h>
-#include <thrust/for_each.h>
-#include <thrust/inner_product.h>
-#include <cusparse_v2.h>
-
-namespace amgcl {
-
-namespace solver {
-
-/** Wrapper around solver::skyline_lu for use with the CUDA backend.
- * Copies the rhs to the host memory, solves the problem using the host CPU,
- * then copies the solution back to the compute device(s).
- */
-template <class T>
-struct cuda_skyline_lu : solver::skyline_lu<T> {
-    typedef solver::skyline_lu<T> Base;
-
-    mutable std::vector<T> _rhs, _x;
-
-    template <class Matrix, class Params>
-    cuda_skyline_lu(const Matrix &A, const Params&)
-        : Base(*A), _rhs(backend::rows(*A)), _x(backend::rows(*A))
-    { }
-
-    template <class Vec1, class Vec2>
-    void operator()(const Vec1 &rhs, Vec2 &x) const {
-        thrust::copy(rhs.begin(), rhs.end(), _rhs.begin());
-        static_cast<const Base*>(this)->operator()(_rhs, _x);
-        thrust::copy(_x.begin(), _x.end(), x.begin());
-    }
-
-    size_t bytes() const {
-        return
-            backend::bytes(*static_cast<const Base*>(this)) +
-            backend::bytes(_rhs) +
-            backend::bytes(_x);
-    }
-};
-
-}
-
-namespace backend {
-namespace detail {
-
-inline void cuda_check(cusparseStatus_t rc, const char *file, int line) {
-    if (rc != CUSPARSE_STATUS_SUCCESS) {
-        std::ostringstream msg;
-        msg << "CUDA error " << rc << " at \"" << file << ":" << line;
-        precondition(false, msg.str());
-    }
-}
-
-inline void cuda_check(cudaError_t rc, const char *file, int line) {
-    if (rc != cudaSuccess) {
-        std::ostringstream msg;
-        msg << "CUDA error " << rc << " at \"" << file << ":" << line;
-        precondition(false, msg.str());
-    }
-}
-
-#define AMGCL_CALL_CUDA(rc)                                                    \
-    amgcl::backend::detail::cuda_check(rc, __FILE__, __LINE__)
-
-struct cuda_deleter {
-    void operator()(cusparseMatDescr_t handle) {
-        AMGCL_CALL_CUDA( cusparseDestroyMatDescr(handle) );
-    }
-
-#if CUDART_VERSION < 11000
-    void operator()(cusparseHybMat_t handle) {
-        AMGCL_CALL_CUDA( cusparseDestroyHybMat(handle) );
-    }
-#endif
-
-    void operator()(csrilu02Info_t handle) {
-        AMGCL_CALL_CUDA( cusparseDestroyCsrilu02Info(handle) );
-    }
-
-    void operator()(csrsv2Info_t handle) {
-        AMGCL_CALL_CUDA( cusparseDestroyCsrsv2Info(handle) );
-    }
-
-    void operator()(cudaEvent_t handle) {
-        AMGCL_CALL_CUDA( cudaEventDestroy(handle) );
-    }
-};
-
-
-} // namespace detail
-
-#if CUDART_VERSION >= 11000
-/// CUSPARSE matrix in CSR format.
-template <typename real>
-class cuda_matrix {
-    public:
-        typedef real value_type;
-
-        cuda_matrix(
-                size_t n, size_t m,
-                const ptrdiff_t *ptr,
-                const ptrdiff_t *col,
-                const real      *val,
-                cusparseHandle_t handle
-                )
-            : nrows(n), ncols(m), nnz(ptr[n]), handle(handle),
-              ptr(ptr, ptr + n + 1), col(col, col + nnz), val(val, val + nnz),
-              desc(create_description(), backend::detail::cuda_deleter())
-        {
-        }
-
-        void spmv(
-                real alpha, thrust::device_vector<real> const &x,
-                real beta,  thrust::device_vector<real>       &y
-            ) const
-        {
-            size_t buf_size;
-            AMGCL_CALL_CUDA(
-                    cusparseCsrmvEx_bufferSize(
-                        handle,
-                        CUSPARSE_ALG_MERGE_PATH,
-                        CUSPARSE_OPERATION_NON_TRANSPOSE,
-                        nrows,
-                        ncols,
-                        nnz,
-                        &alpha, datatype(),
-                        desc.get(),
-                        thrust::raw_pointer_cast(&val[0]), datatype(),
-                        thrust::raw_pointer_cast(&ptr[0]),
-                        thrust::raw_pointer_cast(&col[0]),
-                        thrust::raw_pointer_cast(&x[0]), datatype(),
-                        &beta, datatype(),
-                        thrust::raw_pointer_cast(&y[0]), datatype(),
-                        datatype(),
-                        &buf_size)
-                    );
-
-            if (buf.size() < buf_size)
-                buf.resize(buf_size);
-
-            AMGCL_CALL_CUDA(
-                    cusparseCsrmvEx(
-                        handle,
-                        CUSPARSE_ALG_MERGE_PATH,
-                        CUSPARSE_OPERATION_NON_TRANSPOSE,
-                        nrows,
-                        ncols,
-                        nnz,
-                        &alpha, datatype(),
-                        desc.get(),
-                        thrust::raw_pointer_cast(&val[0]), datatype(),
-                        thrust::raw_pointer_cast(&ptr[0]),
-                        thrust::raw_pointer_cast(&col[0]),
-                        thrust::raw_pointer_cast(&x[0]), datatype(),
-                        &beta, datatype(),
-                        thrust::raw_pointer_cast(&y[0]), datatype(),
-                        datatype(),
-                        thrust::raw_pointer_cast(&buf[0])
-                        )
-                    );
-        }
-
-        size_t rows()     const { return nrows; }
-        size_t cols()     const { return ncols; }
-        size_t nonzeros() const { return nnz;   }
-        size_t bytes()    const {
-            return
-                sizeof(int)  * (nrows + 1) +
-                sizeof(int)  * nnz +
-                sizeof(real) * nnz;
-        }
-    private:
-        size_t nrows, ncols, nnz;
-
-        cusparseHandle_t handle;
-
-        std::shared_ptr<std::remove_pointer<cusparseMatDescr_t>::type> desc;
-
-        thrust::device_vector<int>  ptr;
-        thrust::device_vector<int>  col;
-        thrust::device_vector<real> val;
-
-        mutable thrust::device_vector<char> buf;
-
-        static cusparseMatDescr_t create_description() {
-            cusparseMatDescr_t desc;
-            AMGCL_CALL_CUDA( cusparseCreateMatDescr(&desc) );
-            AMGCL_CALL_CUDA( cusparseSetMatType(desc, CUSPARSE_MATRIX_TYPE_GENERAL) );
-            AMGCL_CALL_CUDA( cusparseSetMatIndexBase(desc, CUSPARSE_INDEX_BASE_ZERO) );
-            return desc;
-        }
-
-        static cudaDataType datatype() {
-            if (sizeof(real) == sizeof(float))
-                return CUDA_R_32F;
-            else
-                return CUDA_R_64F;
-        }
-};
-
-#else  // CUDART_VERSION >= 11000
-
-/// CUSPARSE matrix in Hyb format.
-template <typename real>
-class cuda_matrix {
-    public:
-        typedef real value_type;
-
-        cuda_matrix(
-                size_t n, size_t m,
-                const ptrdiff_t *ptr,
-                const ptrdiff_t *col,
-                const real      *val,
-                cusparseHandle_t handle
-                )
-            : nrows(n), ncols(m), nnz(ptr[n]), handle( handle ),
-              desc  ( create_description(), backend::detail::cuda_deleter() ),
-              mat   ( create_matrix(),      backend::detail::cuda_deleter() )
-        {
-            fill_matrix(n, m, ptr, col, val);
-        }
-
-        void spmv(
-                real alpha, thrust::device_vector<real> const &x,
-                real beta,  thrust::device_vector<real>       &y
-            ) const
-        {
-            spmv(alpha, x, beta, y, std::integral_constant<bool, sizeof(real) == sizeof(double)>());
-        }
-
-        void spmv(
-                real alpha, thrust::device_vector<real> const &x,
-                real beta,  thrust::device_vector<real>       &y,
-                std::false_type
-            ) const
-        {
-            AMGCL_CALL_CUDA(
-                    cusparseShybmv(handle, CUSPARSE_OPERATION_NON_TRANSPOSE,
-                        &alpha, desc.get(), mat.get(),
-                        thrust::raw_pointer_cast(&x[0]), &beta,
-                        thrust::raw_pointer_cast(&y[0])
-                        )
-                    );
-        }
-
-        void spmv(
-                real alpha, thrust::device_vector<real> const &x,
-                real beta,  thrust::device_vector<real>       &y,
-                std::true_type
-            ) const
-        {
-            AMGCL_CALL_CUDA(
-                    cusparseDhybmv(handle, CUSPARSE_OPERATION_NON_TRANSPOSE,
-                        &alpha, desc.get(), mat.get(),
-                        thrust::raw_pointer_cast(&x[0]), &beta,
-                        thrust::raw_pointer_cast(&y[0])
-                        )
-                    );
-        }
-
-        size_t rows()     const { return nrows; }
-        size_t cols()     const { return ncols; }
-        size_t nonzeros() const { return nnz;   }
-        size_t bytes()    const {
-            return
-                sizeof(int)  * (nrows + 1) +
-                sizeof(int)  * nnz +
-                sizeof(real) * nnz;
-        }
-    private:
-        size_t nrows, ncols, nnz;
-
-        cusparseHandle_t handle;
-
-        std::shared_ptr<std::remove_pointer<cusparseMatDescr_t>::type> desc;
-        std::shared_ptr<std::remove_pointer<cusparseHybMat_t>::type>   mat;
-
-        static cusparseMatDescr_t create_description() {
-            cusparseMatDescr_t desc;
-            AMGCL_CALL_CUDA( cusparseCreateMatDescr(&desc) );
-            AMGCL_CALL_CUDA( cusparseSetMatType(desc, CUSPARSE_MATRIX_TYPE_GENERAL) );
-            AMGCL_CALL_CUDA( cusparseSetMatIndexBase(desc, CUSPARSE_INDEX_BASE_ZERO) );
-            return desc;
-        }
-
-        static cusparseHybMat_t create_matrix() {
-            cusparseHybMat_t mat;
-            AMGCL_CALL_CUDA( cusparseCreateHybMat(&mat) );
-            return mat;
-        }
-
-        void fill_matrix(size_t n, size_t m,
-                const ptrdiff_t *ptr, const ptrdiff_t *col, const float *val
-                )
-        {
-            thrust::device_vector<int>   p(ptr, ptr + n + 1);
-            thrust::device_vector<int>   c(col, col + ptr[n]);
-            thrust::device_vector<float> v(val, val + ptr[n]);
-
-            AMGCL_CALL_CUDA(
-                    cusparseScsr2hyb(handle, n, m, desc.get(),
-                        thrust::raw_pointer_cast(&v[0]),
-                        thrust::raw_pointer_cast(&p[0]),
-                        thrust::raw_pointer_cast(&c[0]),
-                        mat.get(), 0, CUSPARSE_HYB_PARTITION_AUTO
-                        )
-                    );
-        }
-
-        void fill_matrix(size_t n, size_t m,
-                const ptrdiff_t *ptr, const ptrdiff_t *col, const double *val
-                )
-        {
-            thrust::device_vector<int>    p(ptr, ptr + n + 1);
-            thrust::device_vector<int>    c(col, col + ptr[n]);
-            thrust::device_vector<double> v(val, val + ptr[n]);
-
-            AMGCL_CALL_CUDA(
-                    cusparseDcsr2hyb(handle, n, m, desc.get(),
-                        thrust::raw_pointer_cast(&v[0]),
-                        thrust::raw_pointer_cast(&p[0]),
-                        thrust::raw_pointer_cast(&c[0]),
-                        mat.get(), 0, CUSPARSE_HYB_PARTITION_AUTO
-                        )
-                    );
-        }
-};
-
-#endif // CUDART_VERSION >= 11000
-
-/// CUDA backend.
-/**
- * Uses CUSPARSE for matrix operations and Thrust for vector operations.
- *
- * \param real Value type.
- * \ingroup backends
- */
-template <typename real, class DirectSolver = solver::cuda_skyline_lu<real> >
-struct cuda {
-        static_assert(
-                std::is_same<real, float>::value ||
-                std::is_same<real, double>::value,
-                "Unsupported value type for cuda backend"
-                );
-
-    typedef real value_type;
-    typedef ptrdiff_t col_type;
-    typedef ptrdiff_t ptr_type;
-    typedef cuda_matrix<real>       matrix;
-    typedef thrust::device_vector<real> vector;
-    typedef thrust::device_vector<real> matrix_diagonal;
-    typedef DirectSolver                direct_solver;
-
-    struct provides_row_iterator : std::false_type {};
-
-    /// Backend parameters.
-    struct params {
-        /// CUSPARSE handle.
-        cusparseHandle_t cusparse_handle;
-
-        params(cusparseHandle_t handle = 0) : cusparse_handle(handle) {}
-
-#ifndef AMGCL_NO_BOOST
-        params(const boost::property_tree::ptree &p)
-            : AMGCL_PARAMS_IMPORT_VALUE(p, cusparse_handle)
-        {
-            check_params(p, {"cusparse_handle"});
-        }
-
-        void get(boost::property_tree::ptree &p, const std::string &path) const {
-            AMGCL_PARAMS_EXPORT_VALUE(p, path, cusparse_handle);
-        }
-#endif
-    };
-
-    static std::string name() { return "cuda"; }
-
-    /// Copy matrix from builtin backend.
-    static std::shared_ptr<matrix>
-    copy_matrix(std::shared_ptr< typename builtin<real>::matrix > A, const params &prm)
-    {
-        return std::make_shared<matrix>(rows(*A), cols(*A),
-                A->ptr, A->col, A->val, prm.cusparse_handle
-                );
-    }
-
-    /// Copy vector from builtin backend.
-    static std::shared_ptr<vector>
-    copy_vector(typename builtin<real>::vector const &x, const params&)
-    {
-        return std::make_shared<vector>(x.data(), x.data() + x.size());
-    }
-
-    /// Copy vector from builtin backend.
-    static std::shared_ptr<vector>
-    copy_vector(std::shared_ptr< typename builtin<real>::vector > x, const params &prm)
-    {
-        return copy_vector(*x, prm);
-    }
-
-    /// Create vector of the specified size.
-    static std::shared_ptr<vector>
-    create_vector(size_t size, const params&)
-    {
-        return std::make_shared<vector>(size);
-    }
-
-    /// Create direct solver for coarse level
-    static std::shared_ptr<direct_solver>
-    create_solver(std::shared_ptr< typename builtin<real>::matrix > A, const params &prm)
-    {
-        return std::make_shared<direct_solver>(A, prm);
-    }
-
-    struct gather {
-        thrust::device_vector<ptrdiff_t>  I;
-        mutable thrust::device_vector<value_type> T;
-
-        gather(size_t src_size, const std::vector<ptrdiff_t> &I, const params&)
-            : I(I), T(I.size())
-        { }
-
-        void operator()(const vector &src, vector &dst) const {
-            thrust::gather(I.begin(), I.end(), src.begin(), dst.begin());
-        }
-
-        void operator()(const vector &vec, std::vector<value_type> &vals) const {
-            thrust::gather(I.begin(), I.end(), vec.begin(), T.begin());
-            thrust::copy(T.begin(), T.end(), vals.begin());
-        }
-    };
-
-    struct scatter {
-        thrust::device_vector<ptrdiff_t>  I;
-
-        scatter(size_t size, const std::vector<ptrdiff_t> &I, const params &)
-            : I(I)
-        { }
-
-        void operator()(const vector &src, vector &dst) const {
-            thrust::scatter(src.begin(), src.end(), I.begin(), dst.begin());
-        }
-    };
-};
-
-//---------------------------------------------------------------------------
-// Backend interface implementation
-//---------------------------------------------------------------------------
-template < typename V >
-struct bytes_impl< thrust::device_vector<V> > {
-    static size_t get(const thrust::device_vector<V> &v) {
-        return v.size() * sizeof(V);
-    }
-};
-
-template < typename Alpha, typename Beta, typename V >
-struct spmv_impl<
-    Alpha, cuda_matrix<V>, thrust::device_vector<V>,
-    Beta,  thrust::device_vector<V>
-    >
-{
-    typedef cuda_matrix<V> matrix;
-    typedef thrust::device_vector<V> vector;
-
-    static void apply(Alpha alpha, const matrix &A, const vector &x,
-            Beta beta, vector &y)
-    {
-        A.spmv(alpha, x, beta, y);
-    }
-};
-
-template < typename V >
-struct residual_impl<
-    cuda_matrix<V>,
-    thrust::device_vector<V>,
-    thrust::device_vector<V>,
-    thrust::device_vector<V>
-    >
-{
-    typedef cuda_matrix<V> matrix;
-    typedef thrust::device_vector<V> vector;
-
-    static void apply(const vector &rhs, const matrix &A, const vector &x,
-            vector &r)
-    {
-        thrust::copy(rhs.begin(), rhs.end(), r.begin());
-        A.spmv(-1, x, 1, r);
-    }
-};
-
-template < typename V >
-struct clear_impl< thrust::device_vector<V> >
-{
-    typedef thrust::device_vector<V> vector;
-
-    static void apply(vector &x)
-    {
-        thrust::fill(x.begin(), x.end(), V());
-    }
-};
-
-template <class V, class T>
-struct copy_impl<V, thrust::device_vector<T> >
-{
-    static void apply(const V &x, thrust::device_vector<T> &y)
-    {
-        thrust::copy(x.begin(), x.end(), y.begin());
-    }
-};
-
-template <class T, class V>
-struct copy_impl<thrust::device_vector<T>, V >
-{
-    static void apply(const thrust::device_vector<T> &x, V &y)
-    {
-        thrust::copy(x.begin(), x.end(), y.begin());
-    }
-};
-
-template <class T1, class T2>
-struct copy_impl<thrust::device_vector<T1>, thrust::device_vector<T2> >
-{
-    static void apply(const thrust::device_vector<T1> &x, thrust::device_vector<T2> &y)
-    {
-        thrust::copy(x.begin(), x.end(), y.begin());
-    }
-};
-
-template < typename V >
-struct inner_product_impl<
-    thrust::device_vector<V>,
-    thrust::device_vector<V>
-    >
-{
-    typedef thrust::device_vector<V> vector;
-
-    static V get(const vector &x, const vector &y)
-    {
-        return thrust::inner_product(x.begin(), x.end(), y.begin(), V());
-    }
-};
-
-template < typename A, typename B, typename V >
-struct axpby_impl<
-    A, thrust::device_vector<V>,
-    B, thrust::device_vector<V>
-    >
-{
-    typedef thrust::device_vector<V> vector;
-
-    struct functor {
-        A a;
-        B b;
-        functor(A a, B b) : a(a), b(b) {}
-
-        template <class Tuple>
-        __host__ __device__ void operator()( Tuple t ) const {
-            using thrust::get;
-
-            if (b)
-                get<1>(t) = a * get<0>(t) + b * get<1>(t);
-            else
-                get<1>(t) = a * get<0>(t);
-        }
-    };
-
-    static void apply(A a, const vector &x, B b, vector &y)
-    {
-        thrust::for_each(
-                thrust::make_zip_iterator(
-                    thrust::make_tuple(
-                        x.begin(), y.begin()
-                        )
-                    ),
-                thrust::make_zip_iterator(
-                    thrust::make_tuple(
-                        x.end(), y.end()
-                        )
-                    ),
-                functor(a, b)
-                );
-    }
-};
-
-template < typename A, typename B, typename C, typename V >
-struct axpbypcz_impl<
-    A, thrust::device_vector<V>,
-    B, thrust::device_vector<V>,
-    C, thrust::device_vector<V>
-    >
-{
-    typedef thrust::device_vector<V> vector;
-
-    struct functor {
-        A a;
-        B b;
-        C c;
-
-        functor(A a, B b, C c) : a(a), b(b), c(c) {}
-
-        template <class Tuple>
-        __host__ __device__ void operator()( Tuple t ) const {
-            using thrust::get;
-
-            if (c)
-                get<2>(t) = a * get<0>(t) + b * get<1>(t) + c * get<2>(t);
-            else
-                get<2>(t) = a * get<0>(t) + b * get<1>(t);
-        }
-    };
-
-    static void apply(
-            A a, const vector &x,
-            B b, const vector &y,
-            C c,       vector &z
-            )
-    {
-        thrust::for_each(
-                thrust::make_zip_iterator(
-                    thrust::make_tuple(
-                        x.begin(), y.begin(), z.begin()
-                        )
-                    ),
-                thrust::make_zip_iterator(
-                    thrust::make_tuple(
-                        x.end(), y.end(), z.end()
-                        )
-                    ),
-                functor(a, b, c)
-                );
-    }
-};
-
-template < typename A, typename B, typename V >
-struct vmul_impl<
-    A, thrust::device_vector<V>, thrust::device_vector<V>,
-    B, thrust::device_vector<V>
-    >
-{
-    typedef thrust::device_vector<V> vector;
-
-    struct functor {
-        A a;
-        B b;
-        functor(A a, B b) : a(a), b(b) {}
-
-        template <class Tuple>
-        __host__ __device__ void operator()( Tuple t ) const {
-            using thrust::get;
-
-            if (b)
-                get<2>(t) = a * get<0>(t) * get<1>(t) + b * get<2>(t);
-            else
-                get<2>(t) = a * get<0>(t) * get<1>(t);
-        }
-    };
-
-    static void apply(A a, const vector &x, const vector &y, B b, vector &z)
-    {
-        thrust::for_each(
-                thrust::make_zip_iterator(
-                    thrust::make_tuple(
-                        x.begin(), y.begin(), z.begin()
-                        )
-                    ),
-                thrust::make_zip_iterator(
-                    thrust::make_tuple(
-                        x.end(), y.end(), z.end()
-                        )
-                    ),
-                functor(a, b)
-                );
-    }
-};
-
-class cuda_event {
-    public:
-        cuda_event() : e(create_event(), backend::detail::cuda_deleter()) { }
-
-        float operator-(cuda_event tic) const {
-            float delta;
-            cudaEventSynchronize(e.get());
-            cudaEventElapsedTime(&delta, tic.e.get(), e.get());
-            return delta / 1000.0f;
-        }
-    private:
-        std::shared_ptr<std::remove_pointer<cudaEvent_t>::type> e;
-
-        static cudaEvent_t create_event() {
-            cudaEvent_t e;
-            cudaEventCreate(&e);
-            cudaEventRecord(e, 0);
-            return e;
-        }
-};
-
-struct cuda_clock {
-    typedef cuda_event value_type;
-
-    static const char* units() { return "s"; }
-
-    cuda_event current() const {
-        return cuda_event();
-    }
-};
-
-} // namespace backend
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/backend/detail/default_direct_solver.hpp b/src/solvers/amgcl/backend/detail/default_direct_solver.hpp
deleted file mode 100644
index 24cd00b..0000000
--- a/src/solvers/amgcl/backend/detail/default_direct_solver.hpp
+++ /dev/null
@@ -1,74 +0,0 @@
-#ifndef AMGCL_BACKEND_DETAIL_DEFAULT_DIRECT_SOLVER_HPP
-#define AMGCL_BACKEND_DETAIL_DEFAULT_DIRECT_SOLVER_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/backend/detail/default_direct_solver.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Default direct solver for coarse level.
- */
-
-#include <memory>
-#include <amgcl/backend/builtin.hpp>
-
-namespace amgcl {
-namespace backend {
-namespace detail {
-
-template <class Backend>
-struct default_direct_solver {
-    typedef typename Backend::value_type   real;
-    typedef typename math::scalar_of<real>::type scalar;
-    typedef typename Backend::matrix       matrix;
-    typedef typename builtin<real>::matrix host_matrix;
-
-    std::shared_ptr<matrix> Ainv;
-
-    default_direct_solver(
-            std::shared_ptr<host_matrix> A,
-            typename Backend::params const &prm
-            )
-    {
-        auto ainv = std::make_shared<host_matrix>();
-        *ainv = inverse(*A);
-        Ainv = Backend::copy_matrix(ainv, prm);
-    }
-
-    template <class Vec1, class Vec2>
-    void operator()(const Vec1 &rhs, Vec2 &x) const {
-        backend::spmv(math::identity<scalar>(), *Ainv, rhs, math::zero<scalar>(), x);
-    }
-
-    static size_t coarse_enough() { return 500; }
-};
-
-} // namespace detail
-} // namespace backend
-} // namespace amgcl
-
-
-
-#endif
diff --git a/src/solvers/amgcl/backend/detail/matrix_ops.hpp b/src/solvers/amgcl/backend/detail/matrix_ops.hpp
deleted file mode 100644
index 5bbe3d9..0000000
--- a/src/solvers/amgcl/backend/detail/matrix_ops.hpp
+++ /dev/null
@@ -1,174 +0,0 @@
-#ifndef AMGCL_BACKEND_DETAIL_MATRIX_OPS_HPP
-#define AMGCL_BACKEND_DETAIL_MATRIX_OPS_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file    amgcl/adapter/detail/matrix_ops.hpp
- * \author  Denis Demidov <dennis.demidov@gmail.com>
- * \brief   Sparse matrix operations for matrices that provide row_iterator.
- */
-
-#include <type_traits>
-#include <amgcl/backend/interface.hpp>
-#include <amgcl/value_type/interface.hpp>
-
-namespace amgcl {
-namespace backend {
-namespace detail {
-
-template <class Matrix, class Enable = void>
-struct use_builtin_matrix_ops : std::false_type {};
-
-} // namespace detail
-
-template <class Alpha, class Matrix, class Vector1, class Beta, class Vector2>
-struct spmv_impl<
-    Alpha, Matrix, Vector1, Beta, Vector2,
-    typename std::enable_if<
-        detail::use_builtin_matrix_ops<Matrix>::value &&
-        math::static_rows<typename value_type<Matrix>::type>::value == math::static_rows<typename value_type<Vector1>::type>::value &&
-        math::static_rows<typename value_type<Matrix>::type>::value == math::static_rows<typename value_type<Vector2>::type>::value
-        >::type
-    >
-{
-    static void apply(
-            Alpha alpha, const Matrix &A, const Vector1 &x, Beta beta, Vector2 &y
-            )
-    {
-        typedef typename value_type<Vector2>::type V;
-
-        const ptrdiff_t n = static_cast<ptrdiff_t>( rows(A) );
-
-        if (!math::is_zero(beta)) {
-#pragma omp parallel for
-            for(ptrdiff_t i = 0; i < n; ++i) {
-                V sum = math::zero<V>();
-                for(typename row_iterator<Matrix>::type a = row_begin(A, i); a; ++a)
-                    sum += a.value() * x[ a.col() ];
-                y[i] = alpha * sum + beta * y[i];
-            }
-        } else {
-#pragma omp parallel for
-            for(ptrdiff_t i = 0; i < n; ++i) {
-                V sum = math::zero<V>();
-                for(typename row_iterator<Matrix>::type a = row_begin(A, i); a; ++a)
-                    sum += a.value() * x[ a.col() ];
-                y[i] = alpha * sum;
-            }
-        }
-    }
-};
-
-template <class Matrix, class Vector1, class Vector2, class Vector3>
-struct residual_impl<
-    Matrix, Vector1, Vector2, Vector3,
-    typename std::enable_if<
-        detail::use_builtin_matrix_ops<Matrix>::value &&
-        math::static_rows<typename value_type<Matrix>::type>::value == math::static_rows<typename value_type<Vector1>::type>::value &&
-        math::static_rows<typename value_type<Matrix>::type>::value == math::static_rows<typename value_type<Vector2>::type>::value &&
-        math::static_rows<typename value_type<Matrix>::type>::value == math::static_rows<typename value_type<Vector3>::type>::value
-        >::type
-    >
-{
-    static void apply(
-            Vector1 const &rhs,
-            Matrix  const &A,
-            Vector2 const &x,
-            Vector3       &res
-            )
-    {
-        typedef typename value_type<Vector3>::type V;
-
-        const ptrdiff_t n = static_cast<ptrdiff_t>( rows(A) );
-
-#pragma omp parallel for
-        for(ptrdiff_t i = 0; i < n; ++i) {
-            V sum = math::zero<V>();
-            for(typename row_iterator<Matrix>::type a = row_begin(A, i); a; ++a)
-                sum += a.value() * x[ a.col() ];
-            res[i] = rhs[i] - sum;
-        }
-    }
-};
-
-/* Allows to do matrix-vector products with mixed scalar/nonscalar types.
- * Reinterprets pointers to the vectors data into appropriate types.
- */
-template <class Alpha, class Matrix, class Vector1, class Beta, class Vector2>
-struct spmv_impl<
-    Alpha, Matrix, Vector1, Beta, Vector2,
-    typename std::enable_if<
-            detail::use_builtin_matrix_ops<Matrix>::value && (
-            math::static_rows<typename value_type<Matrix>::type>::value != math::static_rows<typename value_type<Vector1>::type>::value ||
-            math::static_rows<typename value_type<Matrix>::type>::value != math::static_rows<typename value_type<Vector2>::type>::value)
-        >::type
-    >
-{
-    static void apply(
-            Alpha alpha, const Matrix &A, const Vector1 &x, Beta beta, Vector2 &y
-            )
-    {
-        typedef typename value_type<Matrix>::type V;
-
-        auto X = backend::reinterpret_as_rhs<V>(x);
-        auto Y = backend::reinterpret_as_rhs<V>(y);
-
-        spmv(alpha, A, X, beta, Y);
-    }
-};
-
-template <class Matrix, class Vector1, class Vector2, class Vector3>
-struct residual_impl<
-    Matrix, Vector1, Vector2, Vector3,
-    typename std::enable_if<
-            detail::use_builtin_matrix_ops<Matrix>::value && (
-            math::static_rows<typename value_type<Matrix>::type>::value != math::static_rows<typename value_type<Vector1>::type>::value ||
-            math::static_rows<typename value_type<Matrix>::type>::value != math::static_rows<typename value_type<Vector2>::type>::value ||
-            math::static_rows<typename value_type<Matrix>::type>::value != math::static_rows<typename value_type<Vector3>::type>::value)
-        >::type
-    >
-{
-    static void apply(
-            Vector1 const &f,
-            Matrix  const &A,
-            Vector2 const &x,
-            Vector3       &r
-            )
-    {
-        typedef typename value_type<Matrix>::type V;
-
-        auto X = backend::reinterpret_as_rhs<V>(x);
-        auto F = backend::reinterpret_as_rhs<V>(f);
-        auto R = backend::reinterpret_as_rhs<V>(r);
-
-        residual(F, A, X, R);
-    }
-};
-
-} // namespace backend
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/backend/detail/mixing.hpp b/src/solvers/amgcl/backend/detail/mixing.hpp
deleted file mode 100644
index 8b9a473..0000000
--- a/src/solvers/amgcl/backend/detail/mixing.hpp
+++ /dev/null
@@ -1,80 +0,0 @@
-#ifndef AMGCL_BACKEND_DETAIL_MIXING_HPP
-#define AMGCL_BACKEND_DETAIL_MIXING_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-Copyright (c) 2016, Riccardo Rossi, CIMNE (International Center for Numerical Methods in Engineering)
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/backend/detail/mixing.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Utilities for mixed-precision of mixed-block backends.
- */
-
-#include <type_traits>
-#include <amgcl/backend/builtin.hpp>
-#include <amgcl/value_type/interface.hpp>
-
-namespace amgcl {
-namespace backend {
-namespace detail {
-
-// Backend with scalar value_type of highest precision.
-
-template <class B1, class B2, class Enable = void>
-struct common_scalar_backend;
-
-template <class B>
-struct common_scalar_backend<B, B,
-    typename std::enable_if<
-        math::static_rows<typename B::value_type>::value == 1
-        >::type >
-{
-    typedef B type;
-};
-
-template <class V1, class V2>
-struct common_scalar_backend< backend::builtin<V1>, backend::builtin<V2>,
-    typename std::enable_if<
-        math::static_rows<V1>::value != 1 ||
-        math::static_rows<V2>::value != 1
-        >::type>
-{
-    typedef typename math::scalar_of<V1>::type S1;
-    typedef typename math::scalar_of<V2>::type S2;
-
-    typedef
-        typename std::conditional<
-            (sizeof(S1) > sizeof(S2)), backend::builtin<S1>, backend::builtin<S2>
-            >::type
-        type;
-};
-
-} // namespace detail
-} // namespace backend
-} // namespace amgcl
-
-
-
-#endif
diff --git a/src/solvers/amgcl/backend/eigen.hpp b/src/solvers/amgcl/backend/eigen.hpp
deleted file mode 100644
index a4c26ff..0000000
--- a/src/solvers/amgcl/backend/eigen.hpp
+++ /dev/null
@@ -1,277 +0,0 @@
-#ifndef AMGCL_BACKEND_EIGEN_HPP
-#define AMGCL_BACKEND_EIGEN_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/backend/eigen.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Sparse matrix in CRS format.
- */
-
-#include <memory>
-#include <amgcl/adapter/eigen.hpp>
-#include <amgcl/solver/skyline_lu.hpp>
-
-namespace amgcl {
-namespace backend {
-
-/// Eigen backend.
-/**
- * This is a backend that uses types defined in the Eigen library
- * (http://eigen.tuxfamily.org).
- *
- * \param real Value type.
- * \ingroup backends
- */
-template <typename real>
-struct eigen {
-    typedef real      value_type;
-    typedef ptrdiff_t index_type;
-    typedef ptrdiff_t col_type;
-    typedef ptrdiff_t ptr_type;
-
-    typedef
-        Eigen::Map<Eigen::SparseMatrix<value_type, Eigen::RowMajor, index_type>>
-        matrix;
-
-    typedef Eigen::Matrix<value_type, Eigen::Dynamic, 1> vector;
-    typedef Eigen::Matrix<value_type, Eigen::Dynamic, 1> matrix_diagonal;
-
-    typedef solver::skyline_lu<real> direct_solver;
-
-    struct provides_row_iterator : std::true_type {};
-
-    /// Backend parameters.
-    typedef amgcl::detail::empty_params params;
-
-    static std::string name() { return "eigen"; }
-
-    /// Copy matrix from builtin backend.
-    static std::shared_ptr<matrix>
-    copy_matrix(std::shared_ptr< typename builtin<real>::matrix > A, const params&)
-    {
-        const typename builtin<real>::matrix &a = *A;
-
-        return std::shared_ptr<matrix>(
-                new matrix(
-                    rows(*A), cols(*A), nonzeros(*A),
-                    const_cast<index_type*>(a.ptr),
-                    const_cast<index_type*>(a.col),
-                    const_cast<value_type*>(a.val)
-                    ),
-                hold_host(A)
-                );
-    }
-
-    /// Copy vector from builtin backend.
-    static std::shared_ptr<vector>
-    copy_vector(typename builtin<real>::vector const &x, const params&)
-    {
-        return std::make_shared<vector>(
-                Eigen::Map<const vector>(x.data(), x.size())
-                );
-    }
-
-    /// Copy vector from builtin backend.
-    static std::shared_ptr<vector>
-    copy_vector(std::shared_ptr< typename builtin<real>::vector > x, const params &prm)
-    {
-        return copy_vector(*x, prm);
-    }
-
-    /// Create vector of the specified size.
-    static std::shared_ptr<vector>
-    create_vector(size_t size, const params&)
-    {
-        return std::make_shared<vector>(size);
-    }
-
-    /// Create direct solver for coarse level
-    static std::shared_ptr<direct_solver>
-    create_solver(std::shared_ptr< typename builtin<real>::matrix > A, const params&)
-    {
-        return std::make_shared<direct_solver>(*A);
-    }
-
-    private:
-        struct hold_host {
-            typedef std::shared_ptr< crs<real, ptrdiff_t, ptrdiff_t> > host_matrix;
-            host_matrix host;
-
-            hold_host( host_matrix host ) : host(host) {}
-
-            void operator()(matrix *ptr) const {
-                delete ptr;
-            }
-        };
-
-};
-
-template < class Alpha, class M, class V1, class Beta, class V2 >
-struct spmv_impl<
-    Alpha, M, V1, Beta, V2,
-    typename std::enable_if<
-        is_eigen_sparse_matrix<M>::value &&
-        is_eigen_type<V1>::value &&
-        is_eigen_type<V2>::value
-        >::type
-    >
-{
-    static void apply(Alpha alpha, const M &A, const V1 &x, Beta beta, V2 &y)
-    {
-        if (!math::is_zero(beta))
-            y = alpha * A * x + beta * y;
-        else
-            y = alpha * A * x;
-    }
-};
-
-template < class M, class V1, class V2, class V3 >
-struct residual_impl<
-    M, V1, V2, V3,
-    typename std::enable_if<
-        is_eigen_sparse_matrix<M>::value &&
-        is_eigen_type<V1>::value &&
-        is_eigen_type<V2>::value &&
-        is_eigen_type<V3>::value
-        >::type
-    >
-{
-    static void apply(const V1 &rhs, const M &A, const V2 &x, V3 &r)
-    {
-        r = rhs - A * x;
-    }
-};
-
-template < typename V >
-struct clear_impl<
-    V,
-    typename std::enable_if<is_eigen_type<V>::value>::type
-    >
-{
-    static void apply(V &x)
-    {
-        x.setZero();
-    }
-};
-
-template < class V1, class V2 >
-struct inner_product_impl<
-    V1, V2,
-    typename std::enable_if<
-        is_eigen_type<V1>::value &&
-        is_eigen_type<V2>::value
-        >::type
-    >
-{
-    typedef typename value_type<V1>::type real;
-    static real get(const V1 &x, const V2 &y)
-    {
-        return x.dot(y);
-    }
-};
-
-template < class A, class V1, class B, class V2 >
-struct axpby_impl<
-    A, V1, B, V2,
-    typename std::enable_if<
-        is_eigen_type<V1>::value &&
-        is_eigen_type<V2>::value
-        >::type
-    >
-{
-    static void apply(A a, const V1 &x, B b, V2 &y)
-    {
-        if (!math::is_zero(b))
-            y = a * x + b * y;
-        else
-            y = a * x;
-    }
-};
-
-template < class A, class V1, class B, class V2, class C, class V3 >
-struct axpbypcz_impl<
-    A, V1, B, V2, C, V3,
-    typename std::enable_if<
-        is_eigen_type<V1>::value &&
-        is_eigen_type<V2>::value &&
-        is_eigen_type<V3>::value
-        >::type
-    >
-{
-    typedef typename value_type<V1>::type real;
-
-    static void apply(
-            real a, const V1 &x,
-            real b, const V2 &y,
-            real c,       V3 &z
-            )
-    {
-        if (!math::is_zero(c))
-            z = a * x + b * y + c * z;
-        else
-            z = a * x + b * y;
-    }
-};
-
-template < class Alpha, class V1, class V2, class Beta, class V3 >
-struct vmul_impl<
-    Alpha, V1, V2, Beta, V3,
-    typename std::enable_if<
-        is_eigen_type<V1>::value &&
-        is_eigen_type<V2>::value &&
-        is_eigen_type<V3>::value
-        >::type
-    >
-{
-    static void apply(Alpha a, const V1 &x, const V2 &y, Beta b, V3 &z)
-    {
-        if (!math::is_zero(b))
-            z.array() = a * x.array() * y.array() + b * z.array();
-        else
-            z.array() = a * x.array() * y.array();
-    }
-};
-
-template < class V1, class V2 >
-struct copy_impl<
-    V1, V2,
-    typename std::enable_if<
-        is_eigen_type<V1>::value &&
-        is_eigen_type<V2>::value
-        >::type
-    >
-{
-    static void apply(const V1 &x, V2 &y)
-    {
-        y = x;
-    }
-};
-
-} // namespace backend
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/backend/hpx.hpp b/src/solvers/amgcl/backend/hpx.hpp
deleted file mode 100644
index 8812757..0000000
--- a/src/solvers/amgcl/backend/hpx.hpp
+++ /dev/null
@@ -1,966 +0,0 @@
-#ifndef AMGCL_BACKEND_HPX_HPP
-#define AMGCL_BACKEND_HPX_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/backend/hpx.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  HPX backend.
- */
-
-#include <vector>
-
-#include <hpx/hpx.hpp>
-#include <hpx/include/lcos.hpp>
-#include <hpx/include/parallel_for_each.hpp>
-#include <hpx/include/parallel_transform_reduce.hpp>
-
-#include <boost/range/irange.hpp>
-#include <boost/range/algorithm.hpp>
-#include <boost/range/iterator_range.hpp>
-
-#include <amgcl/util.hpp>
-#include <amgcl/backend/builtin.hpp>
-
-namespace amgcl {
-namespace backend {
-
-/// The matrix is a thin wrapper on top of amgcl::builtin::crs<>.
-template <typename real>
-class hpx_matrix {
-    public:
-        typedef real      value_type;
-        typedef ptrdiff_t index_type;
-
-        typedef crs<value_type, index_type> Base;
-        typedef typename Base::row_iterator row_iterator;
-
-        // For each of the output segments y[i] in y = A * x it stores a range of
-        // segments in x that y[i] depends on.
-        std::vector<std::tuple<index_type, index_type>> xrange;
-
-        // And yrange stores the inverted dependencies: for each segment in x
-        // yrange stores range of segments in y that depend on x. This is required
-        // to determine when a segment of x in [y = A * x] is safe to update.
-        std::vector<std::tuple<index_type, index_type>> yrange;
-
-        // Creates the matrix from builtin datatype, sets up xrange.
-        hpx_matrix(std::shared_ptr<Base> A, int grain_size) : base(A)
-        {
-            index_type n = backend::rows(*A);
-            index_type m = backend::cols(*A);
-
-            index_type nseg = (n + grain_size - 1) / grain_size;
-            index_type mseg = (m + grain_size - 1) / grain_size;
-
-            xrange.resize(nseg);
-            yrange.resize(mseg, std::make_tuple(m, 0));
-
-            auto range = boost::irange<index_type>(0, nseg);
-
-            hpx::parallel::for_each(
-                    hpx::parallel::par,
-                    boost::begin(range), boost::end(range),
-                    [this, grain_size, n, A](index_type seg) {
-                        index_type i = seg * grain_size;
-                        index_type beg = A->ptr[i];
-                        index_type end = A->ptr[std::min<index_type>(i + grain_size, n)];
-
-                        auto mm = std::minmax_element(A->col + beg, A->col + end);
-
-                        index_type xbeg = *std::get<0>(mm) / grain_size;
-                        index_type xend = *std::get<1>(mm) / grain_size + 1;
-
-                        xrange[seg] = std::make_tuple(xbeg, xend);
-
-                        for(index_type i = xbeg; i < xend; ++i) {
-                            std::get<0>(yrange[i]) = std::min(seg,   std::get<0>(yrange[i]));
-                            std::get<1>(yrange[i]) = std::max(seg+1, std::get<1>(yrange[i]));
-                        }
-                    });
-        }
-
-        size_t rows()     const { return backend::rows(*base);     }
-        size_t cols()     const { return backend::cols(*base);     }
-        size_t nonzeros() const { return backend::nonzeros(*base); }
-
-        row_iterator row_begin(size_t row) const {
-            return base->row_begin(row);
-        }
-    private:
-        // Base matrix is stored in shared_ptr<> to reduce the overhead
-        // of data transfer from builtin datatypes (used for AMG setup) to the
-        // backend datatypes.
-        std::shared_ptr<Base> base;
-
-};
-
-/// The vector type to be used with HPX backend.
-/**
- * hpx_vector is a thin wrapper on top of std::vector.
- * The vector consists of continuous segments of fixed size (grain_size) except
- * may be the last one that is allowed to be shorter.
- * A vector of shared_futures corresponding to each of the segments is stored
- * along the data vector to facilitate construction of HPX dependency graph.
- */
-template < typename real >
-class hpx_vector {
-    public:
-        typedef real                          value_type;
-        typedef std::vector<real>             Base;
-        typedef typename Base::iterator       iterator;
-        typedef typename Base::const_iterator const_iterator;
-
-        int nseg;        // Number of segments in the vector
-        int grain_size;  // Segment size.
-
-        // Futures associated with each segment:
-        mutable std::vector<hpx::shared_future<void>> safe_to_read;
-        mutable std::vector<hpx::shared_future<void>> safe_to_write;
-
-        hpx_vector(size_t n, int grain_size)
-            : nseg( (n + grain_size - 1) / grain_size ),
-              grain_size( grain_size ),
-              buf( std::make_shared<Base>(n) )
-        {
-            precondition(grain_size > 0, "grain size should be positive");
-            init_futures();
-        }
-
-        template <class Other>
-        hpx_vector(std::shared_ptr<Other> o, int grain_size)
-            : nseg( (o->size() + grain_size - 1) / grain_size ),
-              grain_size( grain_size ),
-              buf(std::make_shared<Base>(o->data(), o->data() + o->size()))
-        {
-            precondition(grain_size > 0, "grain size should be positive");
-            init_futures();
-        }
-
-        size_t size() const { return buf->size(); }
-
-        const real & operator[](size_t i) const { return (*buf)[i]; }
-        real & operator[](size_t i) { return (*buf)[i]; }
-
-        const real* data() const { return buf->data(); }
-        real*       data()       { return buf->data(); }
-
-        iterator begin() { return buf->begin(); }
-        iterator end()   { return buf->end();   }
-
-        const_iterator begin() const { return buf->cbegin(); }
-        const_iterator end()   const { return buf->cend();   }
-
-        const_iterator cbegin() const { return buf->cbegin(); }
-        const_iterator cend()   const { return buf->cend();   }
-
-        template <class IdxTuple>
-        boost::iterator_range<
-            typename std::vector< hpx::shared_future<void> >::iterator
-            >
-        safe_range(IdxTuple idx) const {
-            return boost::make_iterator_range(
-                    safe_to_read.begin() + std::get<0>(idx),
-                    safe_to_read.begin() + std::get<1>(idx)
-                    );
-        }
-    private:
-        // Segments stored in a continuous array.
-        // The base vector is stored with shared_ptr for the same reason as with
-        // hpx_matrix above: to reduce the overhead of data transfer.
-        std::shared_ptr<Base> buf;
-
-        void init_futures() {
-            safe_to_read.reserve(nseg);
-            safe_to_write.reserve(nseg);
-            for(ptrdiff_t i = 0; i < nseg; ++i) {
-                safe_to_read.push_back(hpx::make_ready_future());
-                safe_to_write.push_back(hpx::make_ready_future());
-            }
-        }
-};
-
-/// HPX backend
-/**
- * This is a backend that is based on HPX -- a general purpose C++ runtime
- * system for parallel and distributed applications of any scale
- * http://stellar-group.org/libraries/hpx.
- */
-template <typename real>
-struct HPX {
-    typedef real      value_type;
-    typedef ptrdiff_t index_type;
-    typedef ptrdiff_t col_type;
-    typedef ptrdiff_t ptr_type;
-
-    struct provides_row_iterator : std::false_type {};
-
-    struct params {
-        /// Number of vector elements in a single segment.
-        int grain_size;
-
-        params() : grain_size(4096) {}
-
-#ifndef AMGCL_NO_BOOST
-        params(const boost::property_tree::ptree &p)
-            : AMGCL_PARAMS_IMPORT_VALUE(p, grain_size)
-        {
-            check_params(p, {"grain_size"});
-        }
-
-        void get(boost::property_tree::ptree &p, const std::string &path) const {
-            AMGCL_PARAMS_EXPORT_VALUE(p, path, grain_size);
-        }
-#endif
-    };
-
-    typedef hpx_matrix<value_type>         matrix;
-    typedef hpx_vector<value_type>         vector;
-    typedef hpx_vector<value_type>         matrix_diagonal;
-
-    struct direct_solver : public solver::skyline_lu<value_type> {
-        typedef solver::skyline_lu<value_type> Base;
-        typedef typename Base::params params;
-
-        template <class Matrix>
-        direct_solver(const Matrix &A, const params &prm = params())
-            : Base(A, prm)
-        {}
-
-        struct call_base {
-            const Base *base;
-            const real *fptr;
-            real       *xptr;
-
-            template <class... T>
-            void operator()(T&&...) const {
-                (*base)(fptr, xptr);
-            }
-        };
-
-        void operator()(const vector &rhs, vector &x) const {
-            const real *fptr = &rhs[0];
-            real       *xptr = &x[0];
-
-            using hpx::dataflow;
-
-            hpx::shared_future<void> solve = dataflow(
-                    hpx::launch::async,
-                    call_base{this, fptr, xptr},
-                    rhs.safe_to_read,
-                    x.safe_to_write
-                    );
-
-            boost::fill(x.safe_to_read, solve);
-        }
-    };
-
-    static std::string name() { return "HPX"; }
-
-    /// Copy matrix.
-    static std::shared_ptr<matrix>
-    copy_matrix(std::shared_ptr<typename matrix::Base> A, const params &p)
-    {
-        return std::make_shared<matrix>(A, p.grain_size);
-    }
-
-    /// Copy vector to builtin backend.
-    static std::shared_ptr<vector>
-    copy_vector(const typename vector::Base &x, const params &p)
-    {
-        return std::make_shared<vector>(
-                std::make_shared<typename vector::Base>(x), p.grain_size
-                );
-    }
-
-    /// Copy vector to builtin backend.
-    template <typename Other>
-    static std::shared_ptr<hpx_vector<typename Other::value_type>>
-    copy_vector(std::shared_ptr<Other> x, const params &p)
-    {
-        return std::make_shared<hpx_vector<typename Other::value_type>>(x, p.grain_size);
-    }
-
-    /// Create vector of the specified size.
-    static std::shared_ptr<vector>
-    create_vector(size_t size, const params &p)
-    {
-        return std::make_shared<vector>(size, p.grain_size);
-    }
-
-    /// Create direct solver for coarse level
-    static std::shared_ptr<direct_solver>
-    create_solver(std::shared_ptr<typename matrix::Base> A, const params&) {
-        return std::make_shared<direct_solver>(*A);
-    }
-};
-
-//---------------------------------------------------------------------------
-// Backend interface implementation
-//---------------------------------------------------------------------------
-template < typename Alpha, typename Beta, typename real >
-struct spmv_impl<
-    Alpha, hpx_matrix<real>, hpx_vector<real>,
-    Beta,  hpx_vector<real>
-    >
-{
-    typedef hpx_matrix<real> matrix;
-    typedef hpx_vector<real> vector;
-
-    struct process_ab {
-        Alpha                   alpha;
-        const hpx_matrix<real> &A;
-        const real             *xptr;
-        Beta                    beta;
-        real                   *yptr;
-
-        ptrdiff_t beg;
-        ptrdiff_t end;
-
-        template <class... T>
-        void operator()(T&&...) const {
-            for(ptrdiff_t i = beg; i < end; ++i) {
-                real sum = 0;
-                for(auto a = A.row_begin(i); a; ++a)
-                    sum += a.value() * xptr[a.col()];
-                yptr[i] = alpha * sum + beta * yptr[i];
-            }
-        }
-    };
-
-    struct process_a {
-        Alpha                   alpha;
-        const hpx_matrix<real> &A;
-        const real             *xptr;
-        real                   *yptr;
-
-        ptrdiff_t beg;
-        ptrdiff_t end;
-
-        template <class... T>
-        void operator()(T&&...) const {
-            for(ptrdiff_t i = beg; i < end; ++i) {
-                real sum = 0;
-                for(auto a = A.row_begin(i); a; ++a)
-                    sum += a.value() * xptr[a.col()];
-                yptr[i] = alpha * sum;
-            }
-        }
-    };
-
-    struct wait_for_it {
-        template <class T>
-        void operator()(T&&) const {}
-    };
-
-    static void apply(Alpha alpha, const matrix &A, const vector &x,
-            Beta beta, vector &y)
-    {
-        const real *xptr = &x[0];
-        real       *yptr = &y[0];
-
-        using hpx::dataflow;
-
-        auto range = boost::irange(0, y.nseg);
-
-        if (beta) {
-            // y = alpha * A * x + beta * y
-            hpx::parallel::for_each(
-                    hpx::parallel::par,
-                    boost::begin(range), boost::end(range),
-                    [alpha, &A, &x, beta, &y, xptr, yptr](ptrdiff_t seg) {
-                        ptrdiff_t beg = seg * y.grain_size;
-                        ptrdiff_t end = std::min<ptrdiff_t>(beg + y.grain_size, y.size());
-
-                        y.safe_to_read[seg] = dataflow(
-                                hpx::launch::async,
-                                process_ab{alpha, A, xptr, beta, yptr, beg, end},
-                                y.safe_to_read[seg],
-                                y.safe_to_write[seg],
-                                x.safe_range(A.xrange[seg])
-                                );
-                    });
-        } else {
-            // y = alpha * A * x
-            hpx::parallel::for_each(
-                    hpx::parallel::par,
-                    boost::begin(range), boost::end(range),
-                    [alpha, &A, &x, &y, xptr, yptr](ptrdiff_t seg) {
-                        ptrdiff_t beg = seg * y.grain_size;
-                        ptrdiff_t end = std::min<ptrdiff_t>(beg + y.grain_size, y.size());
-
-                        y.safe_to_read[seg] = dataflow(hpx::launch::async,
-                                process_a{alpha, A, xptr, yptr, beg, end},
-                                y.safe_to_write[seg],
-                                x.safe_range(A.xrange[seg])
-                                );
-                    });
-        }
-
-        // Do not update x until y is ready.
-        range = boost::irange(0, x.nseg);
-        hpx::parallel::for_each(
-                hpx::parallel::par,
-                boost::begin(range), boost::end(range),
-                [&A, &x, &y](ptrdiff_t seg) {
-                    x.safe_to_write[seg] = dataflow(hpx::launch::async,
-                            wait_for_it(),
-                            y.safe_range(A.yrange[seg])
-                            );
-                });
-    }
-};
-
-template < typename real >
-struct residual_impl<
-    hpx_matrix<real>,
-    hpx_vector<real>,
-    hpx_vector<real>,
-    hpx_vector<real>
-    >
-{
-    typedef hpx_matrix<real> matrix;
-    typedef hpx_vector<real> vector;
-
-    struct process {
-        const real             *fptr;
-        const hpx_matrix<real> &A;
-        const real             *xptr;
-        real                   *rptr;
-
-        ptrdiff_t beg;
-        ptrdiff_t end;
-
-        template <class... T>
-        void operator()(T&&...) const {
-            for(ptrdiff_t i = beg; i < end; ++i) {
-                real sum = fptr[i];
-                for(auto a = A.row_begin(i); a; ++a)
-                    sum -= a.value() * xptr[a.col()];
-                rptr[i] = sum;
-            }
-        }
-    };
-
-    struct wait_for_it {
-        template <class T>
-        void operator()(T&&) const {}
-    };
-
-    static void apply(const vector &f, const matrix &A, const vector &x,
-            vector &r)
-    {
-        const real *xptr = &x[0];
-        const real *fptr = &f[0];
-        real       *rptr = &r[0];
-
-        using hpx::dataflow;
-
-        auto range = boost::irange(0, f.nseg);
-        hpx::parallel::for_each(
-                hpx::parallel::par,
-                boost::begin(range), boost::end(range),
-                [&f, &A, &x, &r, xptr, fptr, rptr](ptrdiff_t seg) {
-                    ptrdiff_t beg = seg * f.grain_size;
-                    ptrdiff_t end = std::min<ptrdiff_t>(beg + f.grain_size, f.size());
-
-                    r.safe_to_read[seg] = dataflow(hpx::launch::async,
-                            process{fptr, A, xptr, rptr, beg, end},
-                            f.safe_to_read[seg],
-                            r.safe_to_write[seg],
-                            x.safe_range(A.xrange[seg])
-                            );
-                });
-
-        // Do not update x until r is ready.
-        range = boost::irange(0, x.nseg);
-        hpx::parallel::for_each(
-                hpx::parallel::par,
-                boost::begin(range), boost::end(range),
-                [&A, &x, &r](ptrdiff_t seg) {
-                    x.safe_to_write[seg] = dataflow(hpx::launch::async,
-                            wait_for_it(),
-                            r.safe_range(A.yrange[seg])
-                            );
-                });
-    }
-};
-
-template < typename real >
-struct clear_impl<
-    hpx_vector<real>
-    >
-{
-    typedef hpx_vector<real> vector;
-
-    struct process {
-        real *xptr;
-
-        ptrdiff_t beg;
-        ptrdiff_t end;
-
-        template <class... T>
-        void operator()(T&&...) const {
-            for(ptrdiff_t i = beg; i < end; ++i)
-                xptr[i] = 0;
-        }
-    };
-
-    static void apply(vector &x) {
-        real *xptr = &x[0];
-
-        using hpx::dataflow;
-
-        auto range = boost::irange(0, x.nseg);
-        hpx::parallel::for_each(
-                hpx::parallel::par,
-                boost::begin(range), boost::end(range),
-                [&x, xptr](ptrdiff_t seg) {
-                    ptrdiff_t beg = seg * x.grain_size;
-                    ptrdiff_t end = std::min<ptrdiff_t>(beg + x.grain_size, x.size());
-
-                    x.safe_to_read[seg] = dataflow(hpx::launch::async,
-                            process{xptr, beg, end},
-                            x.safe_to_write[seg]
-                            );
-                });
-    }
-};
-
-template < typename real >
-struct copy_impl<
-    hpx_vector<real>,
-    hpx_vector<real>
-    >
-{
-    typedef hpx_vector<real> vector;
-
-    struct process {
-        const real *xptr;
-        real       *yptr;
-
-        ptrdiff_t beg;
-        ptrdiff_t end;
-
-        template <class... T>
-        void operator()(T&&...) const {
-            for(ptrdiff_t i = beg; i < end; ++i)
-                yptr[i] = xptr[i];
-        }
-    };
-
-    static void apply(const vector &x, vector &y)
-    {
-        const real *xptr = &x[0];
-        real       *yptr = &y[0];
-
-        using hpx::dataflow;
-
-        auto range = boost::irange(0, x.nseg);
-        hpx::parallel::for_each(
-                hpx::parallel::par,
-                boost::begin(range), boost::end(range),
-                [&x, &y, xptr, yptr](ptrdiff_t seg) {
-                    ptrdiff_t beg = seg * x.grain_size;
-                    ptrdiff_t end = std::min<ptrdiff_t>(beg + x.grain_size, x.size());
-
-                    y.safe_to_read[seg] = dataflow(hpx::launch::async,
-                            process{xptr, yptr, beg, end},
-                            x.safe_to_read[seg],
-                            y.safe_to_write[seg]
-                            );
-                });
-    }
-};
-
-template < typename real >
-struct copy<
-    std::vector<real>,
-    hpx_vector<real>
-    >
-{
-    typedef hpx_vector<real> vector;
-
-    struct process {
-        const real *xptr;
-        real       *yptr;
-
-        ptrdiff_t beg;
-        ptrdiff_t end;
-
-        template <class... T>
-        void operator()(T&&...) const {
-            for(ptrdiff_t i = beg; i < end; ++i)
-                yptr[i] = xptr[i];
-        }
-    };
-
-    static void apply(const std::vector<real> &x, vector &y)
-    {
-        const real *xptr = &x[0];
-        real       *yptr = &y[0];
-
-        using hpx::dataflow;
-
-        auto range = boost::irange(0, y.nseg);
-        hpx::parallel::for_each(
-                hpx::parallel::par,
-                boost::begin(range), boost::end(range),
-                [&y, xptr, yptr](ptrdiff_t seg) {
-                    ptrdiff_t beg = seg * y.grain_size;
-                    ptrdiff_t end = std::min<ptrdiff_t>(beg + y.grain_size, y.size());
-
-                    y.safe_to_read[seg] = dataflow(hpx::launch::async,
-                            process{xptr, yptr, beg, end},
-                            y.safe_to_write[seg]
-                            );
-                });
-    }
-};
-
-template < typename real >
-struct inner_product_impl<
-    hpx_vector<real>,
-    hpx_vector<real>
-    >
-{
-    typedef hpx_vector<real> vector;
-
-    struct process {
-        const real *xptr;
-        const real *yptr;
-
-        ptrdiff_t beg;
-        ptrdiff_t end;
-
-        template <class... T>
-        double operator()(T&&...) const {
-            real sum = 0;
-
-            for(ptrdiff_t i = beg; i < end; ++i)
-                sum += xptr[i] * yptr[i];
-
-            return sum;
-        }
-    };
-
-    static real get(const vector &x, const vector &y)
-    {
-        const real *xptr = &x[0];
-        const real *yptr = &y[0];
-
-        using hpx::dataflow;
-
-        auto range = boost::irange(0, x.nseg);
-        return hpx::parallel::transform_reduce(
-                hpx::parallel::par,
-                boost::begin(range), boost::end(range),
-                math::zero<real>(), std::plus<real>(),
-                [&x, &y, xptr, yptr](ptrdiff_t seg) {
-                    ptrdiff_t beg = seg * x.grain_size;
-                    ptrdiff_t end = std::min<ptrdiff_t>(beg + x.grain_size, x.size());
-
-                    return dataflow(hpx::launch::async,
-                            process{xptr, yptr, beg, end},
-                            x.safe_to_read[seg],
-                            y.safe_to_read[seg]
-                            ).get();
-                }
-                );
-    }
-};
-
-template < typename A, typename B, typename real >
-struct axpby_impl<
-    A, hpx_vector<real>,
-    B, hpx_vector<real>
-    >
-{
-    typedef hpx_vector<real> vector;
-
-    struct process_ab {
-        typedef void result_type;
-
-        A           a;
-        const real *xptr;
-        B           b;
-        real       *yptr;
-
-        ptrdiff_t beg;
-        ptrdiff_t end;
-
-        template <class... T>
-        void operator()(T&&...) const {
-            for(ptrdiff_t i = beg; i < end; ++i)
-                yptr[i] = a * xptr[i] + b * yptr[i];
-        }
-    };
-
-    struct process_a {
-        typedef void result_type;
-
-        A           a;
-        const real *xptr;
-        real       *yptr;
-
-        ptrdiff_t beg;
-        ptrdiff_t end;
-
-        template <class... T>
-        void operator()(T&&...) const {
-            for(ptrdiff_t i = beg; i < end; ++i)
-                yptr[i] = a * xptr[i];
-        }
-    };
-
-    static void apply(A a, const vector &x, B b, vector &y)
-    {
-        const real *xptr = &x[0];
-        real       *yptr = &y[0];
-
-        using hpx::dataflow;
-
-        auto range = boost::irange(0, x.nseg);
-        if (b) {
-            // y = a * x + b * y;
-            hpx::parallel::for_each(
-                    hpx::parallel::par,
-                    boost::begin(range), boost::end(range),
-                    [a, &x, b, &y, xptr, yptr](ptrdiff_t seg) {
-                        ptrdiff_t beg = seg * x.grain_size;
-                        ptrdiff_t end = std::min<ptrdiff_t>(beg + x.grain_size, x.size());
-
-                        y.safe_to_read[seg] = dataflow(hpx::launch::async,
-                                process_ab{a, xptr, b, yptr, beg, end},
-                                x.safe_to_read[seg],
-                                y.safe_to_read[seg],
-                                y.safe_to_write[seg]
-                                );
-                    });
-        } else {
-            // y = a * x;
-            hpx::parallel::for_each(
-                    hpx::parallel::par,
-                    boost::begin(range), boost::end(range),
-                    [a, &x, &y, xptr, yptr](ptrdiff_t seg) {
-                        ptrdiff_t beg = seg * x.grain_size;
-                        ptrdiff_t end = std::min<ptrdiff_t>(beg + x.grain_size, x.size());
-
-                        y.safe_to_read[seg] = dataflow(hpx::launch::async,
-                                process_a{a, xptr, yptr, beg, end},
-                                x.safe_to_read[seg],
-                                y.safe_to_write[seg]
-                                );
-                    });
-        }
-    }
-};
-
-template < typename A, typename B, typename C, typename real >
-struct axpbypcz_impl<
-    A, hpx_vector<real>,
-    B, hpx_vector<real>,
-    C, hpx_vector<real>
-    >
-{
-    typedef hpx_vector<real> vector;
-
-    struct process_abc {
-        A           a;
-        const real *xptr;
-        B           b;
-        const real *yptr;
-        C           c;
-        real       *zptr;
-
-        ptrdiff_t beg;
-        ptrdiff_t end;
-
-        template <class... T>
-        void operator()(T&&...) const {
-            for(ptrdiff_t i = beg; i < end; ++i)
-                zptr[i] = a * xptr[i] + b * yptr[i] + c * zptr[i];
-        }
-    };
-
-    struct process_ab {
-        A           a;
-        const real *xptr;
-        B           b;
-        const real *yptr;
-        real       *zptr;
-
-        ptrdiff_t beg;
-        ptrdiff_t end;
-
-        template <class... T>
-        void operator()(T&&...) const {
-            for(ptrdiff_t i = beg; i < end; ++i)
-                zptr[i] = a * xptr[i] + b * yptr[i];
-        }
-    };
-
-    static void apply(
-            A a, const vector &x,
-            B b, const vector &y,
-            C c,       vector &z
-            )
-    {
-        const real *xptr = &x[0];
-        const real *yptr = &y[0];
-        real       *zptr = &z[0];
-
-        using hpx::dataflow;
-
-        auto range = boost::irange(0, x.nseg);
-        if (c) {
-            //z = a * x + b * y + c * z;
-            hpx::parallel::for_each(
-                    hpx::parallel::par,
-                    boost::begin(range), boost::end(range),
-                    [a, &x, b, &y, c, &z, xptr, yptr, zptr](ptrdiff_t seg) {
-                        ptrdiff_t beg = seg * x.grain_size;
-                        ptrdiff_t end = std::min<ptrdiff_t>(beg + x.grain_size, x.size());
-
-                        z.safe_to_read[seg] = dataflow(hpx::launch::async,
-                                process_abc{a, xptr, b, yptr, c, zptr, beg, end},
-                                x.safe_to_read[seg],
-                                y.safe_to_read[seg],
-                                z.safe_to_read[seg],
-                                z.safe_to_write[seg]
-                                );
-                    });
-        } else {
-            //z = a * x + b * y;
-            hpx::parallel::for_each(
-                    hpx::parallel::par,
-                    boost::begin(range), boost::end(range),
-                    [a, &x, b, &y, &z, xptr, yptr, zptr](ptrdiff_t seg) {
-                        ptrdiff_t beg = seg * x.grain_size;
-                        ptrdiff_t end = std::min<ptrdiff_t>(beg + x.grain_size, x.size());
-
-                        z.safe_to_read[seg] = dataflow(hpx::launch::async,
-                                process_ab{a, xptr, b, yptr, zptr, beg, end},
-                                x.safe_to_read[seg],
-                                y.safe_to_read[seg],
-                                z.safe_to_write[seg]
-                                );
-                    });
-        }
-    }
-};
-
-template < typename A, typename B, typename real >
-struct vmul_impl<
-    A, hpx_vector<real>, hpx_vector<real>,
-    B, hpx_vector<real>
-    >
-{
-    typedef hpx_vector<real> vector;
-
-    struct process_ab {
-        A           a;
-        const real *xptr;
-        const real *yptr;
-        B           b;
-        real       *zptr;
-
-        ptrdiff_t beg;
-        ptrdiff_t end;
-
-        template <class... T>
-        void operator()(T&&...) const {
-            for(ptrdiff_t i = beg; i < end; ++i)
-                zptr[i] = a * xptr[i] * yptr[i] + b * zptr[i];
-        }
-    };
-
-    struct process_a {
-        A           a;
-        const real *xptr;
-        const real *yptr;
-        real       *zptr;
-
-        ptrdiff_t beg;
-        ptrdiff_t end;
-
-        template <class... T>
-        void operator()(T&&...) const {
-            for(ptrdiff_t i = beg; i < end; ++i)
-                zptr[i] = a * xptr[i] * yptr[i];
-        }
-    };
-
-    static void apply(A a, const vector &x, const vector &y, B b, vector &z)
-    {
-        const real *xptr = &x[0];
-        const real *yptr = &y[0];
-        real       *zptr = &z[0];
-
-        using hpx::dataflow;
-
-        auto range = boost::irange(0, x.nseg);
-        if (b) {
-            //z = a * x * y + b * z;
-            hpx::parallel::for_each(
-                    hpx::parallel::par,
-                    boost::begin(range), boost::end(range),
-                    [a, &x, &y, b, &z, xptr, yptr, zptr](ptrdiff_t seg) {
-                        ptrdiff_t beg = seg * x.grain_size;
-                        ptrdiff_t end = std::min<ptrdiff_t>(beg + x.grain_size, x.size());
-
-                        z.safe_to_read[seg] = dataflow(hpx::launch::async,
-                                process_ab{a, xptr, yptr, b, zptr, beg, end},
-                                x.safe_to_read[seg],
-                                y.safe_to_read[seg],
-                                z.safe_to_read[seg],
-                                z.safe_to_write[seg]
-                                );
-                    });
-        } else {
-            //z = a * x * y;
-            hpx::parallel::for_each(
-                    hpx::parallel::par,
-                    boost::begin(range), boost::end(range),
-                    [a, &x, &y, &z, xptr, yptr, zptr](ptrdiff_t seg) {
-                        ptrdiff_t beg = seg * x.grain_size;
-                        ptrdiff_t end = std::min<ptrdiff_t>(beg + x.grain_size, x.size());
-
-                        z.safe_to_read[seg] = dataflow(hpx::launch::async,
-                                process_a{a, xptr, yptr, zptr, beg, end},
-                                x.safe_to_read[seg],
-                                y.safe_to_read[seg],
-                                z.safe_to_write[seg]
-                                );
-                    });
-        }
-    }
-};
-
-} // namespace backend
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/backend/interface.hpp b/src/solvers/amgcl/backend/interface.hpp
deleted file mode 100644
index c3074c4..0000000
--- a/src/solvers/amgcl/backend/interface.hpp
+++ /dev/null
@@ -1,449 +0,0 @@
-#ifndef AMGCL_BACKEND_INTERFACE_HPP
-#define AMGCL_BACKEND_INTERFACE_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/backend/interface.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Backend interface required for AMG.
- */
-
-#include <cmath>
-
-#include <type_traits>
-
-#include <amgcl/value_type/interface.hpp>
-#include <amgcl/util.hpp>
-
-namespace amgcl {
-
-/// Provided backends.
-namespace backend {
-
-/**
- * \defgroup backends Provided backends
- * \brief Backends implemented in AMGCL.
- *
- * A backend in AMGCL is a class that defines matrix and vector types together
- * with several operations on them, such as creation, matrix-vector products,
- * vector sums, inner products etc.  The AMG hierarchy is moved to the
- * specified backend upon construction. The solution phase then uses types and
- * operations defined in the backend. This enables transparent acceleration of
- * the solution phase with OpenMP, OpenCL, CUDA, or any other technologies.
- */
-
-/**
- * \defgroup backend_interface Backend interface
- * \brief Backend interface specification.
- *
- * One has to specify these templates in order to define a new backend.
- */
-
-/** \addtogroup backend_interface
- * @{
- */
-
-/// Metafunction that checks if two backends are compatible.
-/**
- * That is, a solver in SBackend may be used together with a preconditioner in PBackend.
- */
-template <class SBackend, class PBackend>
-struct backends_compatible : std::is_same<SBackend, PBackend> {};
-
-/// Metafunction that returns value type of a matrix or a vector type.
-template <class T, class Enable = void>
-struct value_type {
-    typedef typename T::value_type type;
-};
-
-/// Metafunction that returns column type of a matrix.
-template <class T, class Enable = void>
-struct col_type {
-    typedef typename T::col_type type;
-};
-
-/// Metafunction that returns pointer type of a matrix.
-template <class T, class Enable = void>
-struct ptr_type {
-    typedef typename T::ptr_type type;
-};
-
-/// Implementation for function returning the number of rows in a matrix.
-/** \note Used in rows() */
-template <class Matrix, class Enable = void>
-struct rows_impl {
-    static size_t get(const Matrix &A) {
-        return A.rows();
-    }
-};
-
-/// Implementation for function returning the number of columns in a matrix.
-/** \note Used in cols() */
-template <class Matrix, class Enable = void>
-struct cols_impl {
-    static size_t get(const Matrix &A) {
-        return A.cols();
-    }
-};
-
-/// Implementation for function returning number of bytes allocated for a matrix/vector.
-/** \note Used in bytes() */
-template <class T, class Enable = void>
-struct bytes_impl {
-
-    // Use bytes() method when available.
-    template <class U>
-    static auto get_impl(const U &t, int) -> decltype(t.bytes()) {
-        return t.bytes();
-    }
-
-    // Fallback to zero.
-    template <class U>
-    static size_t get_impl(const U&, ...) {
-        return 0;
-    }
-
-    static size_t get(const T &t) {
-        return get_impl(t, 0);
-    }
-};
-
-template <class Matrix, class Enable = void>
-struct ptr_data_impl {
-    typedef typename Matrix::PTR_DATA_NOT_IMPLEMENTED type;
-};
-
-template <class Matrix, class Enable = void>
-struct col_data_impl {
-    typedef typename Matrix::COL_DATA_NOT_IMPLEMENTED type;
-};
-
-template <class Matrix, class Enable = void>
-struct val_data_impl {
-    typedef typename Matrix::VAL_DATA_NOT_IMPLEMENTED type;
-};
-
-/// Implementation for function returning the number of nonzeros in a matrix.
-/** \note Used in nonzeros() */
-template <class Matrix, class Enable = void>
-struct nonzeros_impl {
-    static size_t get(const Matrix &A) {
-        return A.nonzeros();
-    }
-};
-
-/// Implementation for function returning the number of nonzeros in a matrix row.
-/** \note Used in row_nonzeros() */
-template <class Matrix, class Enable = void>
-struct row_nonzeros_impl {
-    typedef typename Matrix::ROW_NONZEROS_NOT_IMPLEMENTED type;
-};
-
-/// Metafunction returning the row iterator type for a matrix type.
-/**
- * \note This only has to be implemented in the backend if support for serial
- * smoothers (Gauss-Seidel or ILU0) is required.
- */
-template <class Matrix, class Enable = void>
-struct row_iterator {
-    typedef typename Matrix::row_iterator type;
-};
-
-/// Implementation for function returning row iterator for a matrix.
-/**
- * \note This only has to be implemented in the backend if support for serial
- * smoothers (Gauss-Seidel or ILU0) is required.
- * \note Used in row_begin()
- */
-template <class Matrix, class Enable = void>
-struct row_begin_impl {
-    static typename row_iterator<Matrix>::type
-    get(const Matrix &A, size_t row) {
-        return A.row_begin(row);
-    }
-};
-
-/// Implementation for matrix-vector product.
-/** \note Used in spmv() */
-template <class Alpha, class Matrix, class Vector1, class Beta, class Vector2, class Enable = void>
-struct spmv_impl {
-    typedef typename Matrix::SPMV_NOT_IMPLEMENTED type;
-};
-
-/// Implementation for residual error compuatation.
-/** \note Used in residual() */
-template <class Matrix, class Vector1, class Vector2, class Vector3, class Enable = void>
-struct residual_impl {
-    typedef typename Matrix::RESIDUAL_NOT_IMPLEMENTED type;
-};
-
-/// Implementation for zeroing out a vector.
-/** \note Used in clear() */
-template <class Vector, class Enable = void>
-struct clear_impl {
-    typedef typename Vector::CLEAR_NOT_IMPLEMENTED type;
-};
-
-/// Implementation for vector copy.
-/** \note Used in copy() */
-template <class Vector1, class Vector2, class Enable = void>
-struct copy_impl {
-    typedef typename Vector1::COPY_NOT_IMPLEMENTED type;
-};
-
-/// Implementation for inner product.
-/** \note Used in inner_product() */
-template <class Vector1, class Vector2, class Enable = void>
-struct inner_product_impl {
-    typedef typename Vector1::INNER_PRODUCT_NOT_IMPLEMENTED type;
-};
-
-/// Implementation for linear combination of two vectors.
-/** \note Used in axpby() */
-template <class A, class Vector1, class B, class Vector2, class Enable = void>
-struct axpby_impl {
-    typedef typename Vector1::AXPBY_NOT_IMPLEMENTED type;
-};
-
-/// Implementation for linear combination of three vectors.
-/** \note Used in axpbypcz() */
-template <class A, class Vector1, class B, class Vector2, class C, class Vector3, class Enable = void>
-struct axpbypcz_impl {
-    typedef typename Vector1::AXPBYPCZ_NOT_IMPLEMENTED type;
-};
-
-/// Implementation for element-wize vector product.
-/** \note Used in vmul() */
-template <class Alpha, class Vector1, class Vector2, class Beta, class Vector3, class Enable = void>
-struct vmul_impl {
-    typedef typename Vector1::VMUL_NOT_IMPLEMENTED type;
-};
-
-/// Reinterpret the vector to be compatible with the matrix value type
-template <class MatrixValue, class Vector, bool IsConst, class Enable = void>
-struct reinterpret_as_rhs_impl {
-    typedef typename MatrixValue::REINTERPRET_AS_RHS_NOT_IMPLEMENTED type;
-};
-
-/** @} */
-
-/// Returns the number of rows in a matrix.
-template <class Matrix>
-size_t rows(const Matrix &matrix) {
-    return rows_impl<Matrix>::get(matrix);
-}
-
-/// Returns the number of columns in a matrix.
-template <class Matrix>
-size_t cols(const Matrix &matrix) {
-    return cols_impl<Matrix>::get(matrix);
-}
-
-/// Returns number of bytes allocated for the container (matrix / vector)
-template <class T>
-size_t bytes(const T &t) {
-    return bytes_impl<T>::get(t);
-}
-
-template <class Matrix>
-typename ptr_data_impl<Matrix>::type
-ptr_data(const Matrix &matrix) {
-    return ptr_data_impl<Matrix>::get(matrix);
-}
-
-template <class Matrix>
-typename col_data_impl<Matrix>::type
-col_data(const Matrix &matrix) {
-    return col_data_impl<Matrix>::get(matrix);
-}
-
-template <class Matrix>
-typename val_data_impl<Matrix>::type
-val_data(const Matrix &matrix) {
-    return val_data_impl<Matrix>::get(matrix);
-}
-
-/// Returns the number of nonzeros in a matrix.
-template <class Matrix>
-size_t nonzeros(const Matrix &matrix) {
-    return nonzeros_impl<Matrix>::get(matrix);
-}
-
-/// Returns row iterator for a matrix.
-template <class Matrix>
-typename row_iterator<Matrix>::type
-row_begin(const Matrix &matrix, size_t row) {
-    return row_begin_impl<Matrix>::get(matrix, row);
-}
-
-/// Returns number of nonzeros in a matrix row.
-template <class Matrix>
-size_t row_nonzeros(const Matrix &A, size_t row) {
-    return row_nonzeros_impl<Matrix>::get(A, row);
-}
-
-/// Performs matrix-vector product.
-/**
- * \f[y = \alpha A x + \beta y.\f]
- */
-template <class Alpha, class Matrix, class Vector1, class Beta, class Vector2>
-void spmv(
-        Alpha alpha,
-        const Matrix &A,
-        const Vector1 &x,
-        Beta beta,
-        Vector2 &y)
-{
-    AMGCL_TIC("spmv");
-    spmv_impl<Alpha, Matrix, Vector1, Beta, Vector2>::apply(alpha, A, x, beta, y);
-    AMGCL_TOC("spmv");
-}
-
-/// Computes residual error.
-/**
- * \f[r = rhs - Ax.\f]
- */
-template <class Matrix, class Vector1, class Vector2, class Vector3>
-void residual(const Vector1 &rhs, const Matrix &A, const Vector2 &x, Vector3 &r)
-{
-    AMGCL_TIC("residual");
-    residual_impl<Matrix, Vector1, Vector2, Vector3>::apply(rhs, A, x, r);
-    AMGCL_TOC("residual");
-}
-
-/// Zeros out a vector.
-template <class Vector>
-void clear(Vector &x)
-{
-    AMGCL_TIC("clear");
-    clear_impl<Vector>::apply(x);
-    AMGCL_TOC("clear");
-}
-
-/// Vector copy.
-template <class Vector1, class Vector2>
-void copy(const Vector1 &x, Vector2 &y)
-{
-    AMGCL_TIC("copy");
-    copy_impl<Vector1, Vector2>::apply(x, y);
-    AMGCL_TOC("copy");
-}
-
-/// Computes inner product of two vectors.
-template <class Vector1, class Vector2>
-typename math::inner_product_impl<
-    typename value_type<Vector1>::type
-    >::return_type
-inner_product(const Vector1 &x, const Vector2 &y)
-{
-    typedef typename math::inner_product_impl<
-        typename value_type<Vector1>::type
-        >::return_type result_type;
-
-    AMGCL_TIC("inner_product");
-    result_type p = inner_product_impl<Vector1, Vector2>::get(x, y);
-    AMGCL_TOC("inner_product");
-
-    return p;
-}
-
-/// Computes linear combination of two vectors.
-/**
- * \f[y = ax + by.\f]
- */
-template <class A, class Vector1, class B, class Vector2>
-void axpby(A a, Vector1 const &x, B b, Vector2 &y) {
-    AMGCL_TIC("axpby");
-    axpby_impl<A, Vector1, B, Vector2>::apply(a, x, b, y);
-    AMGCL_TOC("axpby");
-}
-
-/// Computes linear combination of three vectors.
-/**
- * \f[z = ax + by + cz.\f]
- */
-template <class A, class Vector1, class B, class Vector2, class C, class Vector3>
-void axpbypcz(A a, Vector1 const &x, B b, Vector2 const &y, C c, Vector3 &z) {
-    AMGCL_TIC("axpbypcz");
-    axpbypcz_impl<A, Vector1, B, Vector2, C, Vector3>::apply(a, x, b, y, c, z);
-    AMGCL_TOC("axpbypcz");
-}
-
-/// Computes element-wize vector product.
-/**
- * \f[z = \alpha xy + \beta z.\f]
- */
-template <class Alpha, class Vector1, class Vector2, class Beta, class Vector3>
-void vmul(Alpha alpha, const Vector1 &x, const Vector2 &y, Beta beta, Vector3 &z)
-{
-    AMGCL_TIC("vmul");
-    vmul_impl<Alpha, Vector1, Vector2, Beta, Vector3>::apply(alpha, x, y, beta, z);
-    AMGCL_TOC("vmul");
-}
-
-/// Reinterpret the vector to be compatible with the matrix value type
-template <class MatrixValue, class Vector>
-typename reinterpret_as_rhs_impl<
-    MatrixValue,
-    typename std::decay<Vector>::type,
-    std::is_const<typename std::remove_reference<Vector>::type>::value
-    >::return_type
-reinterpret_as_rhs(Vector &&x) {
-    return reinterpret_as_rhs_impl<
-        MatrixValue,
-        typename std::decay<Vector>::type,
-        std::is_const<typename std::remove_reference<Vector>::type>::value
-        >::get(std::forward<Vector>(x));
-}
-
-/// Is the relaxation supported by the backend?
-template <class Backend, template <class> class Relaxation, class Enable = void>
-struct relaxation_is_supported : std::true_type {};
-
-/// Is the coarsening supported by the backend?
-template <class Backend, template <class> class Coarsening, class Enable = void>
-struct coarsening_is_supported : std::true_type {};
-
-/// Linear combination of vectors
-/**
- * \f[ y = \sum_j c_j v_j + alpha * y \f]
- */
-template <class Coefs, class Vecs, class Coef, class Vec>
-void lin_comb(size_t n, const Coefs &c, const Vecs &v, const Coef &alpha, Vec &y) {
-    axpby(c[0], *v[0], alpha, y);
-    size_t i = 1;
-    for(; i + 1 < n; i += 2)
-        axpbypcz(c[i], *v[i], c[i+1], *v[i+1], math::identity<Coef>(), y);
-
-    for(; i < n; ++i)
-        axpby(c[i], *v[i], math::identity<Coef>(), y);
-}
-
-} // namespace backend
-} // namespace amgcl
-
-
-#endif
diff --git a/src/solvers/amgcl/backend/mkl.hpp b/src/solvers/amgcl/backend/mkl.hpp
deleted file mode 100644
index c26d4fb..0000000
--- a/src/solvers/amgcl/backend/mkl.hpp
+++ /dev/null
@@ -1,294 +0,0 @@
-#ifndef AMGCL_BACKEND_MKL_HPP
-#define AMGCL_BACKEND_MKL_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2014 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/backend/mkl.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Intel Math Kernel library backend.
- */
-
-#include <vector>
-#include <amgcl/backend/builtin.hpp>
-
-#include <mkl.h>
-
-namespace amgcl {
-namespace backend {
-
-/// Sparse matrix stored in CRS format.
-struct mkl_crs : public crs<double, int> {
-    typedef crs<double, int> Base;
-
-    template <
-        class PtrRange,
-        class ColRange,
-        class ValRange
-        >
-    mkl_crs(size_t nrows, size_t ncols,
-        const PtrRange &ptr_range,
-        const ColRange &col_range,
-        const ValRange &val_range
-        )
-    : Base(nrows, ncols, ptr_range, col_range, val_range)
-    {}
-
-    template <class Matrix>
-    mkl_crs(const Matrix &A) : Base(A) {}
-};
-
-/// BLAS vector.
-class mkl_vec {
-    public:
-        mkl_vec() {}
-        mkl_vec(size_t n) : buf(n) {}
-
-        template <class Iterator>
-        mkl_vec(Iterator beg, Iterator end) : buf(beg, end) {}
-
-        size_t size() const {
-            return buf.size();
-        }
-
-        double operator[](size_t i) const {
-            return buf[i];
-        }
-
-        double& operator[](size_t i) {
-            return buf[i];
-        }
-
-        const double* data() const {
-            return buf.data();
-        }
-
-        double* data() {
-            return buf.data();
-        }
-    private:
-        std::vector<double> buf;
-};
-
-/// Intel Math Kernel library backend.
-struct mkl {
-    typedef double value_type;
-    typedef int    index_type;
-    typedef int    col_type;
-    typedef int    ptr_type;
-
-    typedef mkl_crs matrix;
-    typedef mkl_vec vector;
-    typedef vector  matrix_diagonal;
-    typedef solver::skyline_lu<value_type> direct_solver;
-
-    /// Backend parameters.
-    struct params {
-        params() {}
-        params(const boost::property_tree::ptree&) {}
-    };
-
-    /// Copy matrix from builtin backend.
-    static std::shared_ptr<matrix>
-    copy_matrix(
-            std::shared_ptr< typename builtin<value_type>::matrix > A,
-            const params&
-            )
-    {
-        return std::make_shared<matrix>(*A);
-    }
-
-    /// Copy vector from builtin backend.
-    static std::shared_ptr<vector>
-    copy_vector(typename builtin<value_type>::vector const &x, const params&)
-    {
-        return std::make_shared<vector>(x.data(), x.data() + x.size());
-    }
-
-    /// Copy vector from builtin backend.
-    static std::shared_ptr<vector>
-    copy_vector(
-            std::shared_ptr< typename builtin<value_type>::vector > x,
-            const params &prm
-            )
-    {
-        return copy_vector(*x, prm);
-    }
-
-    /// Create vector of the specified size.
-    static std::shared_ptr<vector>
-    create_vector(size_t size, const params&)
-    {
-        return std::make_shared<vector>(size);
-    }
-
-    /// Create direct solver for coarse level
-    static std::shared_ptr<direct_solver>
-    create_solver(std::shared_ptr< typename builtin<value_type>::matrix > A, const params&)
-    {
-        return std::make_shared<direct_solver>(*A);
-    }
-};
-
-//---------------------------------------------------------------------------
-// Backend interface implementation
-//---------------------------------------------------------------------------
-template <>
-struct value_type < mkl_crs > {
-    typedef double type;
-};
-
-template <>
-struct value_type < mkl_vec > {
-    typedef double type;
-};
-
-template <>
-struct rows_impl< mkl_crs > {
-    static size_t get(const mkl_crs &A) {
-        return A.nrows;
-    }
-};
-
-template <>
-struct cols_impl< mkl_crs > {
-    static size_t get(const mkl_crs &A) {
-        return A.ncols;
-    }
-};
-
-template <>
-struct nonzeros_impl< mkl_crs > {
-    static size_t get(const mkl_crs &A) {
-        return A.ptr[A.nrows];
-    }
-};
-
-template <typename Alpha, typename Beta>
-struct spmv_impl<
-  Alpha, mkl_crs, mkl_vec,
-  Beta, mkl_vec
-  >
-{
-    static void apply(Alpha alpha, const mkl_crs &A, const mkl_vec &x,
-            Beta beta, mkl_vec &y)
-    {
-        MKL_INT m = A.nrows;
-        MKL_INT k = A.ncols;
-        mkl_dcsrmv("N", &m, &k, &alpha, "G__C",
-                const_cast<double*>(&A.val[0]),
-                const_cast<int*   >(&A.col[0]),
-                const_cast<int*   >(&A.ptr[0]),
-                const_cast<int*   >(&A.ptr[1]),
-                const_cast<double*>(x.data()),
-                &beta,
-                y.data());
-    }
-};
-
-template <>
-struct residual_impl< mkl_crs, mkl_vec, mkl_vec, mkl_vec >
-{
-    static void apply(const mkl_vec &rhs, const mkl_crs &A, const mkl_vec &x,
-            mkl_vec &r)
-    {
-        cblas_dcopy(rhs.size(), rhs.data(), 1, r.data(), 1);
-        spmv_impl<double, mkl_crs, mkl_vec, double, mkl_vec>::apply(-1, A, x, 1, r);
-    }
-};
-
-template <>
-struct clear_impl< mkl_vec >
-{
-    static void apply(mkl_vec &x)
-    {
-        std::fill_n(x.data(), x.size(), 0.0);
-    }
-};
-
-template <>
-struct copy_impl< mkl_vec, mkl_vec >
-{
-    static void apply(const mkl_vec &x, mkl_vec &y)
-    {
-        cblas_dcopy(x.size(), x.data(), 1, y.data(), 1);
-    }
-};
-
-template <>
-struct inner_product_impl< mkl_vec, mkl_vec >
-{
-    static double get(const mkl_vec &x, const mkl_vec &y)
-    {
-        return cblas_ddot(x.size(), x.data(), 1, y.data(), 1);
-    }
-};
-
-template <typename A, typename B>
-struct axpby_impl<
-  A, mkl_vec,
-  B, mkl_vec
-  >
-{
-    static void apply(A a, const mkl_vec &x, B b, mkl_vec &y)
-    {
-        cblas_dscal(y.size(), b, y.data(), 1);
-        cblas_daxpy(y.size(), a, x.data(), 1, y.data(), 1);
-    }
-};
-
-template <typename A, typename B, typename C>
-struct axpbypcz_impl<
-  A, mkl_vec,
-  B, mkl_vec,
-  C, mkl_vec
-  >
-{
-    static void apply(
-            A a, const mkl_vec &x,
-            B b, const mkl_vec &y,
-            C c,       mkl_vec &z
-            )
-    {
-        cblas_dscal(z.size(), c, z.data(), 1);
-        cblas_daxpy(z.size(), a, x.data(), 1, z.data(), 1);
-        cblas_daxpy(z.size(), b, y.data(), 1, z.data(), 1);
-    }
-};
-
-template <typename A, typename B>
-struct vmul_impl<
-  A, mkl_vec, mkl_vec,
-  B, mkl_vec >
-{
-    static void apply(A a, const mkl_vec &x, const mkl_vec &y, B b, mkl_vec &z)
-    {
-        cblas_dsbmv(CblasRowMajor, CblasLower, z.size(), 0, a, x.data(), 1, y.data(), 1, b, z.data(), 1);
-    }
-};
-} // namespace backend
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/backend/vexcl.hpp b/src/solvers/amgcl/backend/vexcl.hpp
deleted file mode 100644
index 4a1dcc2..0000000
--- a/src/solvers/amgcl/backend/vexcl.hpp
+++ /dev/null
@@ -1,493 +0,0 @@
-#ifndef AMGCL_BACKEND_VEXCL_HPP
-#define AMGCL_BACKEND_VEXCL_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/backend/vexcl.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  VexCL backend.
- */
-
-#include <iostream>
-#include <memory>
-
-#include <boost/range/iterator_range.hpp>
-
-#include <amgcl/solver/skyline_lu.hpp>
-#include <amgcl/adapter/block_matrix.hpp>
-#include <amgcl/util.hpp>
-#include <amgcl/backend/builtin.hpp>
-#include <amgcl/value_type/static_matrix.hpp>
-
-#include <vexcl/vector.hpp>
-#include <vexcl/gather.hpp>
-#include <vexcl/sparse/matrix.hpp>
-#include <vexcl/sparse/distributed.hpp>
-
-
-namespace amgcl {
-
-namespace solver {
-
-/** Wrapper around solver::skyline_lu for use with the VexCL backend.
- * Copies the rhs to the host memory, solves the problem using the host CPU,
- * then copies the solution back to the compute device(s).
- */
-template <class value_type>
-struct vexcl_skyline_lu : solver::skyline_lu<value_type> {
-    typedef solver::skyline_lu<value_type> Base;
-    typedef typename math::rhs_of<value_type>::type rhs_type;
-
-    mutable std::vector<rhs_type> _rhs, _x;
-
-    template <class Matrix, class Params>
-    vexcl_skyline_lu(const Matrix &A, const Params&)
-        : Base(*A), _rhs(backend::rows(*A)), _x(backend::rows(*A))
-    { }
-
-    template <class Vec1, class Vec2>
-    void operator()(const Vec1 &rhs, Vec2 &x) const {
-        vex::copy(rhs, _rhs);
-        static_cast<const Base*>(this)->operator()(_rhs, _x);
-        vex::copy(_x, x);
-    }
-
-    size_t bytes() const {
-        return
-            backend::bytes(*static_cast<const Base*>(this)) +
-            backend::bytes(_rhs) +
-            backend::bytes(_x);
-    }
-};
-
-}
-
-namespace backend {
-
-/// The VexCL backend parameters.
-struct vexcl_params {
-
-    std::vector< vex::backend::command_queue > q; ///< Command queues that identify compute devices to use with VexCL.
-
-    /// Do CSR to ELL conversion on the GPU side.
-    /** This will result in faster setup, but will require more GPU memory. */
-    bool fast_matrix_setup;
-
-    vexcl_params() : fast_matrix_setup(true) {}
-
-#ifndef AMGCL_NO_BOOST
-    vexcl_params(const boost::property_tree::ptree &p)
-        : fast_matrix_setup(p.get("fast_matrix_setup", vexcl_params().fast_matrix_setup))
-    {
-        std::vector<vex::backend::command_queue> *ptr = 0;
-        ptr = p.get("q", ptr);
-        if (ptr) q = *ptr;
-        check_params(p, {"q", "fast_matrix_setup"});
-    }
-
-    void get(boost::property_tree::ptree &p, const std::string &path) const {
-        p.put(path + "q", &q);
-        p.put(path + "fast_matrix_setup", fast_matrix_setup);
-    }
-#endif
-
-    const std::vector<vex::backend::command_queue>& context() const {
-        if (q.empty())
-            return vex::current_context().queue();
-        else
-            return q;
-    }
-};
-
-
-/**
- * The backend uses the <a href="https://github.com/ddemidov/vexcl">VexCL</a>
- * library for accelerating solution on the modern GPUs and multicore
- * processors with the help of OpenCL or CUDA technologies.
- * The VexCL backend stores the system matrix as ``vex::SpMat<real>`` and
- * expects the right hand side and the solution vectors to be instances of the
- * ``vex::vector<real>`` type.
- */
-template <typename real, typename ColumnType = ptrdiff_t, typename PointerType = ColumnType, class DirectSolver = solver::vexcl_skyline_lu<real> >
-struct vexcl {
-    typedef real        value_type;
-    typedef ptrdiff_t   index_type;
-    typedef ColumnType  col_type;
-    typedef PointerType ptr_type;
-
-    typedef vex::sparse::distributed<
-                vex::sparse::matrix<value_type, col_type, ptr_type>
-                > matrix;
-    typedef typename math::rhs_of<value_type>::type rhs_type;
-    typedef vex::vector<rhs_type>                          vector;
-    typedef vex::vector<value_type>                        matrix_diagonal;
-    typedef DirectSolver                                   direct_solver;
-
-    struct provides_row_iterator : std::false_type {};
-
-    typedef vexcl_params params;
-
-    static std::string name() { return "vexcl"; }
-
-    // Copy matrix from builtin backend.
-    static std::shared_ptr<matrix>
-    copy_matrix(std::shared_ptr< typename builtin<real, col_type, ptr_type>::matrix > A, const params &prm)
-    {
-        precondition(!prm.context().empty(), "Empty VexCL context!");
-
-        const typename builtin<real, col_type, ptr_type>::matrix &a = *A;
-
-        const size_t n   = rows(*A);
-        const size_t m   = cols(*A);
-        const size_t nnz = a.ptr[n];
-
-        return std::make_shared<matrix>(prm.context(), n, m,
-                boost::make_iterator_range(a.ptr, a.ptr + n+1),
-                boost::make_iterator_range(a.col, a.col + nnz),
-                boost::make_iterator_range(a.val, a.val + nnz),
-                prm.fast_matrix_setup
-                );
-    }
-
-    // Copy vector from builtin backend.
-    template <class T>
-    static std::shared_ptr< vex::vector<T> >
-    copy_vector(const std::vector<T> &x, const params &prm)
-    {
-        precondition(!prm.context().empty(), "Empty VexCL context!");
-        return std::make_shared< vex::vector<T> >(prm.context(), x);
-    }
-
-    template <class T>
-    static std::shared_ptr< vex::vector<T> >
-    copy_vector(const numa_vector<T> &x, const params &prm)
-    {
-        precondition(!prm.context().empty(), "Empty VexCL context!");
-        return std::make_shared< vex::vector<T> >(prm.context(), x.size(), x.data());
-    }
-
-    // Copy vector from builtin backend.
-    template <class T>
-    static std::shared_ptr< vex::vector<T> >
-    copy_vector(std::shared_ptr< numa_vector<T> > x, const params &prm)
-    {
-        return copy_vector(*x, prm);
-    }
-
-    // Create vector of the specified size.
-    static std::shared_ptr<vector>
-    create_vector(size_t size, const params &prm)
-    {
-        precondition(!prm.context().empty(), "Empty VexCL context!");
-
-        return std::make_shared<vector>(prm.context(), size);
-    }
-
-    struct gather {
-        size_t n;
-        mutable vex::gather G;
-        mutable std::vector<char> buf;
-
-        gather(size_t src_size, const std::vector<ptrdiff_t> &I, const params &prm)
-            : n(I.size()), G(prm.context(), src_size, std::vector<size_t>(I.begin(), I.end()))
-        { }
-
-        template <class S, class D>
-        void operator()(const vex::vector<S> &src, vex::vector<D> &dst) const {
-            if (buf.size() < sizeof(D) * n) buf.resize(sizeof(D) * n);
-            auto t = reinterpret_cast<D*>(buf.data());
-            G(src, t);
-            vex::copy(t, t + n, dst.begin());
-        }
-
-        template <class S, class D>
-        void operator()(const vex::vector<S> &vec, std::vector<D> &vals) const {
-            G(vec, vals);
-        }
-    };
-
-    struct scatter {
-        size_t n;
-        mutable vex::scatter S;
-        mutable std::vector<char> buf;
-
-        scatter(size_t size, const std::vector<ptrdiff_t> &I, const params &prm)
-            : n(I.size()), S(prm.context(), size, std::vector<size_t>(I.begin(), I.end()))
-        { }
-
-        template <class S, class D>
-        void operator()(const vex::vector<S> &src, vex::vector<D> &dst) const {
-            if (buf.size() < sizeof(D) * n) buf.resize(sizeof(D) * n);
-            auto t = reinterpret_cast<D*>(buf.data());
-            vex::copy(src.begin(), src.end(), t);
-            S(t, dst);
-        }
-    };
-
-
-    // Create direct solver for coarse level
-    static std::shared_ptr<direct_solver>
-    create_solver(std::shared_ptr< typename builtin<real, ColumnType, PointerType>::matrix > A, const params &prm)
-    {
-        return std::make_shared<direct_solver>(A, prm);
-    }
-};
-
-// Hybrid backend uses scalar matrices to build the hierarchy,
-// but stores the computed matrices in the block format.
-template <
-    typename BlockType,
-    typename ColumnType = ptrdiff_t,
-    typename PointerType = ColumnType,
-    class DirectSolver = solver::vexcl_skyline_lu<typename math::scalar_of<BlockType>::type>
-    >
-struct vexcl_hybrid : public vexcl<typename math::scalar_of<BlockType>::type, ColumnType, PointerType, DirectSolver>
-{
-    typedef typename math::scalar_of<BlockType>::type ScalarType;
-    typedef vexcl<ScalarType, ColumnType, PointerType, DirectSolver> Base;
-    typedef vex::sparse::distributed<
-                vex::sparse::matrix<
-                    BlockType,
-                    typename Base::col_type,
-                    typename Base::ptr_type
-                    >
-                > matrix;
-
-    static std::shared_ptr<matrix>
-    copy_matrix(std::shared_ptr< typename builtin<ScalarType, ColumnType, PointerType>::matrix > As, const typename Base::params &prm)
-    {
-        precondition(!prm.context().empty(), "Empty VexCL context!");
-
-        typename builtin<BlockType, ColumnType, PointerType>::matrix A(amgcl::adapter::block_matrix<BlockType>(*As));
-
-        const size_t n   = rows(A);
-        const size_t m   = cols(A);
-        const size_t nnz = A.ptr[n];
-
-        return std::make_shared<matrix>(prm.context(), n, m,
-                boost::make_iterator_range(A.ptr, A.ptr + n+1),
-                boost::make_iterator_range(A.col, A.col + nnz),
-                boost::make_iterator_range(A.val, A.val + nnz),
-                prm.fast_matrix_setup
-                );
-    }
-};
-
-//---------------------------------------------------------------------------
-// Backend interface implementation
-//---------------------------------------------------------------------------
-template <typename T1, typename T2, typename C, typename P>
-struct backends_compatible< vexcl<T1, C, P>, vexcl<T2, C, P> > : std::true_type {};
-
-template <typename B1, typename B2, typename C, typename P>
-struct backends_compatible< vexcl_hybrid<B1, C, P>, vexcl_hybrid<B2, C, P> > : std::true_type {};
-
-template <typename T1, typename B2, typename C, typename P>
-struct backends_compatible< vexcl<T1, C, P>, vexcl_hybrid<B2, C, P> > : std::true_type {};
-
-template <typename B1, typename T2, typename C, typename P>
-struct backends_compatible< vexcl_hybrid<B1, C, P>, vexcl<T2, C, P> > : std::true_type {};
-
-template < typename V, typename C, typename P >
-struct bytes_impl< vex::sparse::distributed<vex::sparse::matrix<V,C,P> > > {
-    static size_t get(const vex::sparse::distributed<vex::sparse::matrix<V,C,P> > &A) {
-        return
-            sizeof(P) * (A.rows() + 1) +
-            sizeof(C) * A.nonzeros() +
-            sizeof(V) * A.nonzeros();
-    }
-};
-
-template < typename V >
-struct bytes_impl< vex::vector<V> > {
-    static size_t get(const vex::vector<V> &v) {
-        return v.size() * sizeof(V);
-    }
-};
-
-template < typename Alpha, typename Beta, typename Va, typename Vx, typename Vy, typename C, typename P >
-struct spmv_impl<
-    Alpha, vex::sparse::distributed<vex::sparse::matrix<Va,C,P>>, vex::vector<Vx>,
-    Beta,  vex::vector<Vy>,
-    typename std::enable_if<
-        math::static_rows<Va>::value == 1 &&
-        math::static_rows<Vx>::value == 1 &&
-        math::static_rows<Vy>::value == 1
-        >::type
-    >
-{
-    typedef vex::sparse::distributed<vex::sparse::matrix<Va,C,P>> matrix;
-
-    static void apply(Alpha alpha, const matrix &A, const vex::vector<Vx> &x,
-            Beta beta, vex::vector<Vy> &y)
-    {
-        if (beta)
-            y = alpha * (A * x) + beta * y;
-        else
-            y = alpha * (A * x);
-    }
-};
-
-template < typename Va, typename Vf, typename Vx, typename Vr, typename C, typename P >
-struct residual_impl<
-    vex::sparse::distributed<vex::sparse::matrix<Va,C,P>>,
-    vex::vector<Vf>,
-    vex::vector<Vx>,
-    vex::vector<Vr>,
-    typename std::enable_if<
-        !is_static_matrix<Va>::value &&
-        !is_static_matrix<Vf>::value &&
-        !is_static_matrix<Vx>::value &&
-        !is_static_matrix<Vr>::value
-        >::type
-    >
-{
-    typedef vex::sparse::distributed<vex::sparse::matrix<Va,C,P>> matrix;
-
-    static void apply(const vex::vector<Vf> &rhs, const matrix &A, const vex::vector<Vx> &x,
-            vex::vector<Vr> &r)
-    {
-        r = rhs - A * x;
-    }
-};
-
-template < typename V >
-struct clear_impl< vex::vector<V> >
-{
-    static void apply(vex::vector<V> &x)
-    {
-        x = 0;
-    }
-};
-
-template < class V, class T >
-struct copy_impl<V, vex::vector<T> >
-{
-    static void apply(const V &x, vex::vector<T> &y)
-    {
-        vex::copy(x, y);
-    }
-};
-
-template < class T, class V >
-struct copy_impl<vex::vector<T>, V>
-{
-    static void apply(const vex::vector<T> &x, V &y)
-    {
-        vex::copy(x, y);
-    }
-};
-
-template < class T1, class T2 >
-struct copy_impl<vex::vector<T1>, vex::vector<T2>>
-{
-    static void apply(const vex::vector<T1> &x, vex::vector<T2> &y)
-    {
-        vex::copy(x, y);
-    }
-};
-
-template < typename V >
-struct inner_product_impl<
-    vex::vector<V>,
-    vex::vector<V>
-    >
-{
-    static V get(const vex::vector<V> &x, const vex::vector<V> &y)
-    {
-        vex::Reductor<V, vex::SUM_Kahan> sum( x.queue_list() );
-        return sum(x * y);
-    }
-};
-
-template < typename A, typename B, typename V1, typename V2 >
-struct axpby_impl<
-    A, vex::vector<V1>,
-    B, vex::vector<V2>
-    > {
-    static void apply(A a, const vex::vector<V1> &x, B b, vex::vector<V2> &y)
-    {
-        if (b)
-            y = a * x + b * y;
-        else
-            y = a * x;
-    }
-};
-
-template < typename A, typename B, typename C, typename V1, typename V2, typename V3 >
-struct axpbypcz_impl<
-    A, vex::vector<V1>,
-    B, vex::vector<V2>,
-    C, vex::vector<V3>
-    >
-{
-    static void apply(
-            A a, const vex::vector<V1> &x,
-            B b, const vex::vector<V2> &y,
-            C c,       vex::vector<V3> &z
-            )
-    {
-        if (c)
-            z = a * x + b * y + c * z;
-        else
-            z = a * x + b * y;
-    }
-};
-
-template < typename A, typename B, typename Vx, typename Vy, typename Vz >
-struct vmul_impl<
-    A, vex::vector<Vx>, vex::vector<Vy>,
-    B, vex::vector<Vz>
-    >
-{
-    static void apply(A a, const vex::vector<Vx> &x, const vex::vector<Vy> &y,
-            B b, vex::vector<Vz> &z)
-    {
-        if (b)
-            z = a * x * y + b * z;
-        else
-            z = a * x * y;
-    }
-};
-
-template <class MatrixValue, class V, bool IsConst>
-struct reinterpret_as_rhs_impl<MatrixValue, vex::vector<V>, IsConst>
-{
-    typedef typename math::scalar_of<V>::type scalar_type;
-    typedef typename math::rhs_of<MatrixValue>::type rhs_type;
-    typedef typename math::replace_scalar<rhs_type, scalar_type>::type dst_type;
-    typedef vex::vector<dst_type> return_type;
-
-    static return_type get(const vex::vector<V> &x) {
-        return x.template reinterpret<dst_type>();
-    }
-};
-
-
-} // namespace backend
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/backend/vexcl_static_matrix.hpp b/src/solvers/amgcl/backend/vexcl_static_matrix.hpp
deleted file mode 100644
index ad2fde6..0000000
--- a/src/solvers/amgcl/backend/vexcl_static_matrix.hpp
+++ /dev/null
@@ -1,1031 +0,0 @@
-#ifndef AMGCL_BACKEND_VEXCL_STATIC_MATRIX_HPP
-#define AMGCL_BACKEND_VEXCL_STATIC_MATRIX_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/backend/vexcl_static_matrix.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Static matrix support for the VexCL backend.
- */
-
-#include <cassert>
-#include <amgcl/backend/detail/mixing.hpp>
-#include <amgcl/backend/vexcl.hpp>
-#include <amgcl/value_type/static_matrix.hpp>
-
-namespace vex {
-
-template <typename T, int N, int M>
-struct is_cl_native< amgcl::static_matrix<T, N, M> > : std::true_type {};
-
-template <typename T, int N, int M>
-struct type_name_impl< amgcl::static_matrix<T, N, M> >
-{
-    static std::string get() {
-        std::ostringstream s;
-        s << "amgcl_matrix_" << type_name<T>() << "_" << N << "x" << M;
-        return s.str();
-    }
-};
-
-template <typename T, int N, int M>
-struct cl_scalar_of< amgcl::static_matrix<T, N, M> > {
-    typedef T type;
-};
-
-namespace sparse {
-
-template <typename T, int N>
-struct rhs_of< amgcl::static_matrix<T, N, N> > {
-    typedef amgcl::static_matrix<T, N, 1> type;
-};
-
-template <typename TA, typename TX, int N>
-struct spmv_ops_impl<amgcl::static_matrix<TA,N,N>, amgcl::static_matrix<TX,N,1>> {
-    typedef amgcl::static_matrix<TA,N,N> matrix_value;
-    typedef amgcl::static_matrix<TX,N,1> vector_value;
-
-    static void decl_accum_var(backend::source_generator &src, const std::string &name)
-    {
-        src.new_line() << type_name<amgcl::static_matrix<TA,N,1>>() << " " << name << ";";
-        for(int i = 0; i < N; ++i) {
-            src.new_line() << name << ".data[" << i << "][0] = 0;";
-        }
-    }
-
-    static void append(backend::source_generator &src,
-            const std::string &sum, const std::string &val)
-    {
-        for(int i = 0; i < N; ++i)
-            src.new_line() << sum << ".data[" << i << "][0] += " << val << ".data[" << i << "][0];";
-    }
-
-    static void append_product(backend::source_generator &src,
-            const std::string &sum, const std::string &mat_val, const std::string &vec_val)
-    {
-        src.open("{");
-        src.new_line() << type_name<vector_value>() << " v = " << vec_val << ";";
-        for(int i = 0; i < N; ++i) {
-            src.new_line() << sum << ".data[" << i << "][0] += ";
-            for(int j = 0; j < N; ++j) {
-                if (j) src << " + ";
-                src << mat_val << ".data[" << i << "][" << j << "] * v.data[" << j << "][0]";
-            }
-            src << ";";
-        }
-        src.close("}");
-    }
-};
-
-template <typename T, int N, typename Col, typename Ptr>
-class ell<amgcl::static_matrix<T, N, N>, Col, Ptr> {
-    public:
-        typedef amgcl::static_matrix<T, N, N> Val;
-        typedef Val value_type;
-
-        typedef Val val_type;
-        typedef Col col_type;
-        typedef Ptr ptr_type;
-
-        template <class PtrRange, class ColRange, class ValRange>
-        ell(
-                const std::vector<backend::command_queue> &q,
-                size_t nrows, size_t ncols,
-                const PtrRange &ptr,
-                const ColRange &col,
-                const ValRange &val,
-                bool fast = true
-           ) : q(q[0]), n(nrows), m(ncols),
-               nnz(std::distance(std::begin(val), std::end(val))),
-               ell_pitch(alignup(nrows, 16U)), csr_nnz(0)
-        {
-            precondition(q.size() == 1,
-                    "sparse::ell is only supported for single-device contexts");
-
-            if (fast) {
-                convert(ptr, col, val);
-                return;
-            }
-
-            /* 1. Get optimal ELL widths for local and remote parts. */
-            // Speed of ELL relative to CSR:
-            const double ell_vs_csr = 3.0;
-
-            // Find maximum widths for local and remote parts:
-            size_t max_width = 0;
-            for(size_t i = 0; i < n; ++i)
-                max_width = std::max<size_t>(max_width, ptr[i+1] - ptr[i]);
-
-            // Build width distribution histogram.
-            std::vector<Ptr> hist(max_width + 1, 0);
-            for(size_t i = 0; i < n; ++i)
-                ++hist[ptr[i+1] - ptr[i]];
-
-            // Estimate optimal width for ELL part of the matrix.
-            ell_width = max_width;
-            for(size_t i = 0, rows = n; i < max_width; ++i) {
-                rows -= hist[i]; // Number of rows wider than i.
-                if (ell_vs_csr * rows < n) {
-                    ell_width = i;
-                    break;
-                }
-            }
-
-            if (ell_width == 0) {
-                assert(csr_nnz == nnz);
-
-                csr_ptr = backend::device_vector<Ptr>(q[0], n + 1,   &ptr[0]);
-                csr_col = backend::device_vector<Col>(q[0], csr_nnz, &col[0]);
-                csr_val = create_device_vector       (q[0], csr_nnz, &val[0], false);
-
-                return;
-            }
-
-            size_t ell_nnz = ell_pitch * ell_width;
-
-            // Count nonzeros in CSR part of the matrix.
-            for(size_t i = ell_width + 1; i <= max_width; ++i)
-                csr_nnz += hist[i] * (i - ell_width);
-
-            /* 3. Split the input matrix into ELL and CSR submatrices. */
-            std::vector<Col> _ell_col(ell_nnz, static_cast<Col>(-1));
-            std::vector<T>   _ell_val(ell_nnz * N * N);
-            std::vector<Ptr> _csr_ptr;
-            std::vector<Col> _csr_col;
-            std::vector<T>   _csr_val;
-
-            if (csr_nnz) {
-                _csr_ptr.resize(n + 1);
-                _csr_col.resize(csr_nnz);
-                _csr_val.resize(csr_nnz * N * N);
-
-                _csr_ptr[0] = 0;
-                for(size_t i = 0; i < n; ++i) {
-                    size_t w = ptr[i+1] - ptr[i];
-                    _csr_ptr[i+1] = _csr_ptr[i] + (w > ell_width ? w - ell_width : 0);
-                }
-            }
-
-
-            for(size_t i = 0; i < n; ++i) {
-                size_t w = 0;
-                Ptr csr_head = csr_nnz ? _csr_ptr[i] : 0;
-                for(Ptr j = ptr[i], e = ptr[i+1]; j < e; ++j, ++w) {
-                    Col c = col[j];
-                    Val v = val[j];
-
-                    if (w < ell_width) {
-                        _ell_col[i + w * ell_pitch] = c;
-                        for(int k = 0, ii = 0; ii < N; ++ii)
-                            for(int jj = 0; jj < N; ++jj, ++k)
-                                _ell_val[k * ell_nnz + w * ell_pitch + i] = v(ii,jj);
-                    } else {
-                        _csr_col[csr_head] = c;
-                        for(int k = 0, ii = 0; ii < N; ++ii)
-                            for(int jj = 0; jj < N; ++jj, ++k)
-                                _csr_val[k * csr_nnz + csr_head] = v(ii,jj);
-                        ++csr_head;
-                    }
-                }
-            }
-
-            {
-                size_t ell_size = ell_pitch * ell_width;
-                ell_col = backend::device_vector<Col>(q[0], ell_size, _ell_col.data());
-                ell_val = backend::device_vector<T>  (q[0], ell_nnz * N * N, _ell_val.data());
-            }
-
-            if (csr_nnz) {
-                csr_ptr = backend::device_vector<Ptr>(q[0], n + 1,   _csr_ptr.data());
-                csr_col = backend::device_vector<Col>(q[0], csr_nnz, _csr_col.data());
-                csr_val = backend::device_vector<T>  (q[0], csr_nnz * N * N, _csr_val.data());
-            }
-        }
-
-        // Dummy matrix; used internally to pass empty parameters to kernels.
-        ell(const backend::command_queue &q)
-            : q(q), n(0), m(0), nnz(0), ell_width(0), ell_pitch(0), csr_nnz(0)
-        {}
-
-        template <class Expr>
-        friend
-        typename std::enable_if<
-            boost::proto::matches<
-                typename boost::proto::result_of::as_expr<Expr>::type,
-                vector_expr_grammar
-            >::value,
-            matrix_vector_product<ell, Expr>
-        >::type
-        operator*(const ell &A, const Expr &x) {
-            return matrix_vector_product<ell, Expr>(A, x);
-        }
-
-        template <class Vector>
-        static void terminal_preamble(const Vector &x, backend::source_generator &src,
-            const backend::command_queue &q, const std::string &prm_name,
-            detail::kernel_generator_state_ptr state)
-        {
-            detail::output_terminal_preamble tp(src, q, prm_name + "_x", state);
-            boost::proto::eval(boost::proto::as_child(x), tp);
-        }
-
-        template <class Vector>
-        static void local_terminal_init(const Vector &x, backend::source_generator &src,
-            const backend::command_queue &q, const std::string &prm_name,
-            detail::kernel_generator_state_ptr state)
-        {
-            typedef typename detail::return_type<Vector>::type x_type;
-            typedef amgcl::static_matrix<T,N,1> vector_value;
-
-            src.new_line() << type_name<vector_value>() << " " << prm_name << "_sum;";
-            for(int i = 0; i < N; ++i) {
-                src.new_line() << prm_name << "_sum.data[" << i << "][0] = 0;";
-            }
-            src.open("{");
-
-            // ELL part
-            src.new_line() << type_name<size_t>() << " " << prm_name << "_ell_size = " << prm_name << "_ell_width * " << prm_name << "_ell_pitch;";
-            src.new_line() << "for(size_t j = 0; j < " << prm_name << "_ell_width; ++j)";
-            src.open("{");
-            src.new_line() << type_name<Col>() << " nnz_idx = idx + j * " << prm_name << "_ell_pitch;";
-            src.new_line() << type_name<Col>() << " c = " << prm_name << "_ell_col[nnz_idx];";
-            src.new_line() << "if (c != (" << type_name<Col>() << ")(-1))";
-            src.open("{");
-
-            src.new_line() << type_name<Col>() << " idx = c;";
-
-            {
-                detail::output_local_preamble init_x(src, q, prm_name + "_x", state);
-                boost::proto::eval(boost::proto::as_child(x), init_x);
-
-                backend::source_generator vec_value;
-                detail::vector_expr_context expr_x(vec_value, q, prm_name + "_x", state);
-                boost::proto::eval(boost::proto::as_child(x), expr_x);
-
-                src.open("{");
-                src.new_line() << type_name<x_type>() << " v = " << vec_value.str() << ";";
-                for(int k = 0, j = 0; j < N; ++j) {
-                    src.new_line() << prm_name << "_sum.data[" << j << "][0] += ";
-                    for(int i = 0; i < N; ++i, ++k) {
-                        if (i) src << " + ";
-                        src << prm_name << "_ell_val[" << k << " * " << prm_name << "_ell_size + nnz_idx] * v.data[" << i << "][0]";
-                    }
-                    src << ";";
-                }
-                src.close("}");
-            }
-
-            src.close("} else break;");
-            src.close("}");
-
-            // CSR part
-            src.new_line() << "if (" << prm_name << "_csr_ptr)";
-            src.open("{");
-            src.new_line() << type_name<size_t>() << " " << prm_name << "_csr_size = " << prm_name << "_csr_ptr[n];";
-            src.new_line() << type_name<Ptr>() << " csr_beg = " << prm_name << "_csr_ptr[idx];";
-            src.new_line() << type_name<Ptr>() << " csr_end = " << prm_name << "_csr_ptr[idx+1];";
-            src.new_line() << "for(" << type_name<Ptr>() << " j = csr_beg; j < csr_end; ++j)";
-            src.open("{");
-
-            src.new_line() << type_name<Col>() << " idx = " << prm_name << "_csr_col[j];";
-
-            {
-                detail::output_local_preamble init_x(src, q, prm_name + "_x", state);
-                boost::proto::eval(boost::proto::as_child(x), init_x);
-
-                backend::source_generator vec_value;
-                detail::vector_expr_context expr_x(vec_value, q, prm_name + "_x", state);
-                boost::proto::eval(boost::proto::as_child(x), expr_x);
-
-                src.open("{");
-                src.new_line() << type_name<x_type>() << " v = " << vec_value.str() << ";";
-                for(int k = 0, j = 0; j < N; ++j) {
-                    src.new_line() << prm_name << "_sum.data[" << j << "][0] += ";
-                    for(int i = 0; i < N; ++i, ++k) {
-                        if (i) src << " + ";
-                        src << prm_name << "_csr_val[" << k << " * " << prm_name << "_csr_size + j] * v.data[" << i << "][0]";
-                    }
-                    src << ";";
-                }
-                src.close("}");
-            }
-
-            src.close("}");
-            src.close("}");
-            src.close("}");
-        }
-
-        template <class Vector>
-        static void kernel_param_declaration(const Vector &x, backend::source_generator &src,
-            const backend::command_queue &q, const std::string &prm_name,
-            detail::kernel_generator_state_ptr state)
-        {
-            src.parameter< size_t >(prm_name + "_ell_width");
-            src.parameter< size_t >(prm_name + "_ell_pitch");
-
-            src.parameter< global_ptr<Col> >(prm_name + "_ell_col");
-            src.parameter< global_ptr<T  > >(prm_name + "_ell_val");
-            src.parameter< global_ptr<Ptr> >(prm_name + "_csr_ptr");
-            src.parameter< global_ptr<Col> >(prm_name + "_csr_col");
-            src.parameter< global_ptr<T  > >(prm_name + "_csr_val");
-
-            detail::declare_expression_parameter decl_x(src, q, prm_name + "_x", state);
-            detail::extract_terminals()(boost::proto::as_child(x), decl_x);
-        }
-
-        template <class Vector>
-        static void partial_vector_expr(const Vector&, backend::source_generator &src,
-            const backend::command_queue&, const std::string &prm_name,
-            detail::kernel_generator_state_ptr)
-        {
-            src << prm_name << "_sum";
-        }
-
-        template <class Vector>
-        void kernel_arg_setter(const Vector &x,
-            backend::kernel &kernel, unsigned part, size_t index_offset,
-            detail::kernel_generator_state_ptr state) const
-        {
-            kernel.push_arg(ell_width);
-            kernel.push_arg(ell_pitch);
-            if (ell_width) {
-                kernel.push_arg(ell_col);
-                kernel.push_arg(ell_val);
-            } else {
-                kernel.push_arg(static_cast<size_t>(0));
-                kernel.push_arg(static_cast<size_t>(0));
-            }
-            if (csr_nnz) {
-                kernel.push_arg(csr_ptr);
-                kernel.push_arg(csr_col);
-                kernel.push_arg(csr_val);
-            } else {
-                kernel.push_arg(static_cast<size_t>(0));
-                kernel.push_arg(static_cast<size_t>(0));
-                kernel.push_arg(static_cast<size_t>(0));
-            }
-
-            detail::set_expression_argument x_args(kernel, part, index_offset, state);
-            detail::extract_terminals()( boost::proto::as_child(x), x_args);
-        }
-
-        template <class Vector>
-        void expression_properties(const Vector&,
-            std::vector<backend::command_queue> &queue_list,
-            std::vector<size_t> &partition,
-            size_t &size) const
-        {
-            queue_list = std::vector<backend::command_queue>(1, q);
-            partition  = std::vector<size_t>(2, 0);
-            partition.back() = size = n;
-        }
-
-        size_t rows()     const { return n; }
-        size_t cols()     const { return m; }
-        size_t nonzeros() const { return nnz; }
-    private:
-        backend::command_queue q;
-
-        size_t n, m, nnz, ell_width, ell_pitch, csr_nnz;
-
-        backend::device_vector<Col> ell_col;
-        backend::device_vector<T>   ell_val;
-
-        backend::device_vector<Ptr> csr_ptr;
-        backend::device_vector<Col> csr_col;
-        backend::device_vector<T>   csr_val;
-
-        backend::device_vector<T> create_device_vector(const backend::command_queue &q,
-                size_t nnz, const Val *host_data, bool fast = true)
-        {
-            backend::device_vector<T> val(q, nnz * N * N);
-
-            if (nnz) {
-                if (fast) {
-                    backend::device_vector<T> tmp(q, nnz * N * N, reinterpret_cast<const T*>(host_data));
-
-                    VEX_FUNCTION(T, transpose, (int,k)(int,m)(int,nnz)(T*, v),
-                            int i = k / nnz;
-                            int j = k % nnz;
-                            return v[j * m + i];
-                            );
-
-                    vex::vector<T>(q,val) = transpose(vex::element_index(), N*N, nnz, raw_pointer(vex::vector<T>(q, tmp)));
-                } else {
-                    auto v = val.map(q);
-
-                    for(int k = 0, i = 0; i < N; ++i)
-                        for(int j = 0; j < N; ++j, ++k)
-                            for(size_t m = 0; m < nnz; ++m)
-                                v[k * nnz + m] = host_data[m](i,j);
-                }
-            }
-
-            return val;
-        }
-
-        backend::kernel& csr2ell_kernel() const {
-            using namespace vex::detail;
-            static kernel_cache cache;
-
-            auto kernel = cache.find(q);
-            if (kernel == cache.end()) {
-                backend::source_generator src(q);
-
-                src.begin_kernel("convert_csr2ell");
-                src.begin_kernel_parameters();
-                src.template parameter<size_t>("n");
-                src.template parameter<size_t>("ell_width");
-                src.template parameter<size_t>("ell_pitch");
-                src.template parameter< global_ptr<const ptr_type> >("ptr");
-                src.template parameter< global_ptr<const col_type> >("col");
-                src.template parameter< global_ptr<const T> >("val");
-                src.template parameter< global_ptr<col_type> >("ell_col");
-                src.template parameter< global_ptr<T> >("ell_val");
-                src.template parameter< global_ptr<const ptr_type> >("csr_ptr");
-                src.template parameter< global_ptr<col_type> >("csr_col");
-                src.template parameter< global_ptr<T> >("csr_val");
-                src.end_kernel_parameters();
-                src.new_line() << type_name<size_t>() << " nnz = ptr[n];";
-                src.new_line() << type_name<size_t>() << " ell_nnz = ell_width * ell_pitch;";
-                src.new_line() << type_name<size_t>() << " csr_nnz = csr_ptr ? csr_ptr[n] : 0;";
-                src.grid_stride_loop().open("{");
-
-                src.new_line() << type_name<int>() << " w = 0;";
-                src.new_line() << type_name<ptr_type>() << " csr_head = 0;";
-                src.new_line() << "if (csr_ptr) csr_head = csr_ptr[idx];";
-                src.new_line() << "for(" << type_name<ptr_type>() << " j = ptr[idx], e = ptr[idx+1]; j < e; ++j, ++w)";
-                src.open("{");
-                src.new_line() << type_name<col_type>() << " c = col[j];";
-                src.new_line() << "if (w < ell_width) {";
-                src.new_line() << "  ell_col[idx + w * ell_pitch] = c;";
-                for(int i = 0; i < N * N; ++i)
-                src.new_line() << "  ell_val[" << i << " * ell_nnz + w * ell_pitch + idx] = val[" << i << " * nnz + j];";
-                src.new_line() << "} else {";
-                src.new_line() << "  csr_col[csr_head] = c;";
-                for(int i = 0; i < N * N; ++i)
-                src.new_line() << "  csr_val[" << i << " * csr_nnz + csr_head] = val[" << i << " * nnz + j];";
-                src.new_line() << "  ++csr_head;";
-                src.new_line() << "}";
-                src.close("}");
-                src.close("}");
-                src.end_kernel();
-
-                kernel = cache.insert(q, backend::kernel(q, src.str(), "convert_csr2ell"));
-            }
-
-            return kernel->second;
-        }
-
-        template <class PtrRange, class ColRange, class ValRange>
-        void convert(
-                const PtrRange &host_ptr,
-                const ColRange &host_col,
-                const ValRange &host_val
-                )
-        {
-            size_t nnz = host_ptr[n];
-
-            backend::device_vector<Ptr> Aptr(q, n + 1, &host_ptr[0]);
-            backend::device_vector<Col> Acol(q, nnz, nnz ? &host_col[0] : nullptr);
-            backend::device_vector<T>   Aval = create_device_vector(q, nnz, nnz ? &host_val[0] : nullptr);
-
-            /* 1. Get optimal ELL widths for local and remote parts. */
-            // Speed of ELL relative to CSR:
-            const double ell_vs_csr = 3.0;
-
-            // Find maximum widths for local and remote parts:
-            std::vector<backend::command_queue> ctx(1, q);
-            Reductor<int, MAX> max(ctx);
-
-            vex::vector<Ptr> ptr(q, Aptr);
-
-            VEX_FUNCTION(Ptr, row_width, (size_t, i)(const Ptr*, ptr),
-                    return ptr[i+1] - ptr[i];
-                    );
-
-            int max_width = max(row_width(element_index(0, n), raw_pointer(ptr)));
-
-            // Build width distribution histogram.
-            vex::vector<int> hist(ctx, max_width + 1);
-            hist = 0;
-            eval(atomic_add(&permutation(row_width(element_index(0, n), raw_pointer(ptr)))(hist), 1));
-
-            // Estimate optimal width for ELL part of the matrix,
-            // count nonzeros in CSR part of the matrix
-            ell_width = max_width;
-            {
-                auto h = hist.map(0);
-
-                for(int i = 0, rows = n; i < max_width; ++i) {
-                    rows -= h[i]; // Number of rows wider than i.
-                    if (ell_vs_csr * rows < n) {
-                        ell_width = i;
-                        break;
-                    }
-                }
-
-                for(int i = ell_width + 1; i <= max_width; ++i)
-                    csr_nnz += h[i] * (i - ell_width);
-            }
-
-            if (ell_width == 0) {
-                assert(csr_nnz == nnz);
-
-                csr_ptr = Aptr;
-                csr_col = Acol;
-                csr_val = Aval;
-
-                return;
-            }
-
-            if (csr_nnz) {
-                VEX_FUNCTION(int, csr_width, (size_t, ell_width)(size_t, i)(const Ptr*, ptr),
-                        if (i == 0) return 0;
-                        int w = ptr[i] - ptr[i-1];
-                        return (w > ell_width) ? (w - ell_width) : 0;
-                        );
-
-                vex::vector<ptr_type> csr_w(ctx, n+1);
-
-                csr_ptr = backend::device_vector<Ptr>(q, n + 1);
-                csr_col = backend::device_vector<Col>(q, csr_nnz);
-                csr_val = backend::device_vector<T>  (q, csr_nnz * N * N);
-
-                csr_w = csr_width(ell_width, element_index(), raw_pointer(ptr));
-                vector<ptr_type> csr_p(q, csr_ptr);
-                inclusive_scan(csr_w, csr_p);
-            }
-
-
-            /* 3. Split the input matrix into ELL and CSR submatrices. */
-            ell_col = backend::device_vector<Col>(q, ell_pitch * ell_width);
-            ell_val = backend::device_vector<T>  (q, ell_pitch * ell_width * N * N);
-
-            vex::vector<Col>(q, ell_col) = -1;
-
-            auto &convert = csr2ell_kernel();
-
-            convert.push_arg(n);
-            convert.push_arg(ell_width);
-            convert.push_arg(ell_pitch);
-            convert.push_arg(Aptr);
-            convert.push_arg(Acol);
-            convert.push_arg(Aval);
-            convert.push_arg(ell_col);
-            convert.push_arg(ell_val);
-            if (csr_nnz) {
-                convert.push_arg(csr_ptr);
-                convert.push_arg(csr_col);
-                convert.push_arg(csr_val);
-            } else {
-                convert.push_arg(static_cast<size_t>(0));
-                convert.push_arg(static_cast<size_t>(0));
-                convert.push_arg(static_cast<size_t>(0));
-            }
-            convert(q);
-        }
-};
-
-} // namespace sparse
-} // namespace vex
-
-namespace amgcl {
-namespace backend {
-
-template <typename T, int N>
-std::string vexcl_static_matrix_declaration() {
-    std::ostringstream s;
-    s << "typedef struct { " << vex::type_name<T>() << " data[" << N << "][" << N << "]; } "
-         "amgcl_matrix_" << vex::type_name<T>() << "_" << N << "x" << N << ";\n";
-    if (N != 1)
-    s << "typedef struct { " << vex::type_name<T>() << " data[" << N << "][" << 1 << "]; } "
-         "amgcl_matrix_" << vex::type_name<T>() << "_" << N << "x" << 1 << ";\n";
-    return s.str();
-}
-
-template <typename T, int N>
-struct vex_scale {
-    typedef static_matrix<T,N,1> vector;
-
-    struct apply_type : vex::UserFunction<apply_type, vector(T, vector)> {
-        apply_type() {}
-
-        static std::string name() {
-            return "scale_" + vex::type_name<vector>();
-        }
-
-        static void define(vex::backend::source_generator &src, const std::string &fname = name()) {
-            src.begin_function<vector>(fname);
-            src.begin_function_parameters();
-            src.parameter<T>("a");
-            src.parameter<vector>("m");
-            src.end_function_parameters();
-            for(int i = 0; i < N; ++i)
-                src.new_line() << "m.data[" << i << "][0] *= a;";
-            src.new_line() << "return m;";
-            src.end_function();
-        }
-    } const apply;
-};
-
-template <typename TS, typename TD, int N, class Enable = void> struct vex_convert;
-
-template <typename TS, typename TD, int N>
-struct vex_convert<TS, TD, N,
-    typename std::enable_if<!std::is_same<TS, TD>::value>::type>
-{
-    typedef static_matrix<TS,N,1> src_vector;
-    typedef static_matrix<TD,N,1> dst_vector;
-
-    struct apply_type : vex::UserFunction<apply_type, dst_vector(src_vector)> {
-        apply_type() {}
-
-        static std::string name() {
-            return "convert_" + vex::type_name<src_vector>() + "_" + vex::type_name<dst_vector>();
-        }
-
-        static void define(vex::backend::source_generator &src, const std::string &fname = name()) {
-            src.begin_function<dst_vector>(fname);
-            src.begin_function_parameters();
-            src.parameter<src_vector>("s");
-            src.end_function_parameters();
-            src.new_line() << vex::type_name<dst_vector>() << " d;";
-            for(int i = 0; i < N; ++i)
-                src.new_line() << "d.data[" << i << "][0] = s.data[" << i << "][0];";
-            src.new_line() << "return d;";
-            src.end_function();
-        }
-    } const apply;
-};
-
-template <typename TS, typename TD, int N>
-struct vex_convert<TS, TD, N,
-    typename std::enable_if<std::is_same<TS, TD>::value>::type>
-{
-    template <class X>
-    static const X& apply(const X &x) { return x; }
-};
-
-template <typename TA, typename TB, int N>
-struct vex_add {
-    typedef static_matrix<TA,N,1> vectorA;
-    typedef static_matrix<TB,N,1> vectorB;
-
-    struct apply_type : vex::UserFunction<apply_type, vectorA(vectorA, vectorB)> {
-        apply_type() {}
-
-        static std::string name() {
-            return "add_" + vex::type_name<vectorA>() + "_" + vex::type_name<vectorB>();
-        }
-
-        static void define(vex::backend::source_generator &src, const std::string &fname = name()) {
-            src.begin_function<vectorA>(fname);
-            src.begin_function_parameters();
-            src.parameter<vectorA>("a");
-            src.parameter<vectorB>("b");
-            src.end_function_parameters();
-            for(int i = 0; i < N; ++i)
-                src.new_line() << "a.data[" << i << "][0] += "
-                               << "b.data[" << i << "][0];";
-            src.new_line() << "return a;";
-            src.end_function();
-        }
-    } const apply;
-};
-
-template <typename TA, typename TB, int N>
-struct vex_sub {
-    typedef static_matrix<TA,N,1> vectorA;
-    typedef static_matrix<TB,N,1> vectorB;
-
-    struct apply_type : vex::UserFunction<apply_type, vectorA(vectorA, vectorB)> {
-        apply_type() {}
-
-        static std::string name() {
-            return "sub_" + vex::type_name<vectorA>() + "_" + vex::type_name<vectorB>();
-        }
-
-        static void define(vex::backend::source_generator &src, const std::string &fname = name()) {
-            src.begin_function<vectorA>(fname);
-            src.begin_function_parameters();
-            src.parameter<vectorA>("a");
-            src.parameter<vectorB>("b");
-            src.end_function_parameters();
-            for(int i = 0; i < N; ++i)
-                src.new_line() << "a.data[" << i << "][0] -= "
-                               << "b.data[" << i << "][0];";
-            src.new_line() << "return a;";
-            src.end_function();
-        }
-    } const apply;
-};
-
-template <typename TA, typename TX, int N>
-struct vex_mul {
-    typedef static_matrix<TA,N,N> matrix;
-    typedef static_matrix<TX,N,1> vectorX;
-    typedef static_matrix<TA,N,1> vectorY;
-
-    struct apply_type : vex::UserFunction<apply_type, vectorY(matrix, vectorX)> {
-        apply_type() {}
-
-        static std::string name() {
-            return "mul_" + vex::type_name<matrix>() + "_" + vex::type_name<vectorX>();
-        }
-
-        static void define(vex::backend::source_generator &src, const std::string &fname = name()) {
-            src.begin_function<vectorY>(fname);
-            src.begin_function_parameters();
-            src.parameter<matrix>("a");
-            src.parameter<vectorX>("b");
-            src.end_function_parameters();
-            src.new_line() << vex::type_name<vectorY>() << " c;";
-            for(int i = 0; i < N; ++i) {
-                src.new_line() << "c.data[" << i << "][0] = ";
-                for(int j = 0; j < N; ++j) {
-                    if (j) src << " + ";
-                    src << "a.data[" << i << "][" << j << "] * b.data[" << j << "][0]";
-                }
-                src << ";";
-            }
-            src.new_line() << "return c;";
-            src.end_function();
-        }
-    } const apply;
-};
-
-template <typename Alpha, typename Beta, typename TA, typename TX, typename TY, int B, typename C, typename P>
-struct spmv_impl<Alpha,
-    vex::sparse::distributed<vex::sparse::matrix<static_matrix<TA,B,B>, C, P>>,
-    vex::vector<static_matrix<TX,B,1>>, Beta, vex::vector<static_matrix<TY,B,1>>,
-    typename std::enable_if<(B > 1)>::type
-    >
-{
-    typedef vex::sparse::distributed<vex::sparse::matrix<static_matrix<TA,B,B>, C, P>> matrix;
-    typedef vex::vector<static_matrix<TX,B,1>> vectorX;
-    typedef vex::vector<static_matrix<TY,B,1>> vectorY;
-
-    static void apply(Alpha alpha, const matrix &A, const vectorX &x, Beta beta, vectorY &y)
-    {
-        if (beta)
-            y = vex_add<TY,TA,B>().apply(vex_scale<TY,B>().apply(beta, y), vex_scale<TA,B>().apply(alpha, A * x));
-        else
-            y = vex_convert<TA,TY,B>().apply(vex_scale<TA,B>().apply(alpha, A * x));
-    }
-};
-
-
-template <typename Alpha, typename Beta, typename TA, typename TX, typename TY, typename C, typename P>
-struct spmv_impl<Alpha,
-    vex::sparse::distributed<vex::sparse::matrix<TA, C, P>>,
-    vex::vector<TX>, Beta, vex::vector<TY>,
-    typename std::enable_if<
-        (math::static_rows<TA>::value == 1) && (
-                math::static_rows<TA>::value != math::static_rows<TX>::value ||
-                math::static_rows<TA>::value != math::static_rows<TY>::value
-                )
-        >::type>
-{
-    typedef vex::sparse::distributed<vex::sparse::matrix<TA, C, P>> matrix;
-    typedef vex::vector<TX> vectorx;
-    typedef vex::vector<TY> vectory;
-
-    static void apply(Alpha alpha, const matrix &A, const vectorx &x, Beta beta, vectory &y)
-    {
-        auto _x = x.template reinterpret<typename math::scalar_of<TX>::type>();
-        auto _y = y.template reinterpret<typename math::scalar_of<TY>::type>();
-        spmv(alpha, A, _x, beta, _y);
-    }
-};
-
-template <typename Alpha, typename Beta, typename TA, typename TX, typename TY, typename C, typename P>
-struct spmv_impl<Alpha,
-    vex::sparse::distributed<vex::sparse::matrix<TA, C, P>>,
-    vex::vector<TX>, Beta, vex::vector<TY>,
-    typename std::enable_if<
-        (math::static_rows<TA>::value > 1) && (
-                math::static_rows<TA>::value != math::static_rows<TX>::value ||
-                math::static_rows<TA>::value != math::static_rows<TY>::value
-                )
-        >::type>
-{
-    typedef vex::sparse::distributed<vex::sparse::matrix<TA, C, P>> matrix;
-    typedef vex::vector<TX> vectorx;
-    typedef vex::vector<TY> vectory;
-
-    static void apply(Alpha alpha, const matrix &A, const vectorx &x, Beta beta, vectory &y)
-    {
-        const int B = math::static_rows<TA>::value;
-        auto _x = x.template reinterpret<static_matrix<typename math::scalar_of<TX>::type, B, 1>>();
-        auto _y = y.template reinterpret<static_matrix<typename math::scalar_of<TY>::type, B, 1>>();
-        spmv(alpha, A, _x, beta, _y);
-    }
-};
-
-template <typename TB, typename TA, typename TX, typename TR, int B, typename C, typename P>
-struct residual_impl<
-    vex::sparse::distributed<vex::sparse::matrix<static_matrix<TA,B,B>, C, P>>,
-    vex::vector<static_matrix<TB,B,1>>,
-    vex::vector<static_matrix<TX,B,1>>,
-    vex::vector<static_matrix<TR,B,1>>,
-    typename std::enable_if<(B > 1)>::type
-    >
-{
-    typedef vex::sparse::distributed<vex::sparse::matrix<static_matrix<TA,B,B>, C, P>> matrix;
-    typedef vex::vector<static_matrix<TB,B,1>> vectorB;
-    typedef vex::vector<static_matrix<TX,B,1>> vectorX;
-    typedef vex::vector<static_matrix<TR,B,1>> vectorR;
-
-    static void apply(const vectorB &rhs, const matrix &A, const vectorX &x, vectorR &r)
-    {
-        r = vex_convert<TB,TR,B>().apply(vex_sub<TB, TA, B>().apply(rhs, A * x));
-    }
-};
-
-template <typename TB, typename TA, typename TX, typename TR, int B, typename C, typename P>
-struct residual_impl<
-    vex::sparse::distributed<vex::sparse::matrix<static_matrix<TA,B,B>, C, P>>,
-    vex::vector<TB>,
-    vex::vector<TX>,
-    vex::vector<TR>,
-    typename std::enable_if<
-        math::static_rows<TB>::value == 1 &&
-        math::static_rows<TX>::value == 1 &&
-        math::static_rows<TR>::value == 1 &&
-        (B > 1)
-        >::type
-    >
-{
-    typedef vex::sparse::distributed<vex::sparse::matrix<static_matrix<TA,B,B>, C, P>> matrix;
-    typedef vex::vector<TB> vectorB;
-    typedef vex::vector<TX> vectorX;
-    typedef vex::vector<TR> vectorR;
-
-    static void apply(const vectorB &b, const matrix &A, const vectorX &x, vectorR &r)
-    {
-        typedef static_matrix<TB,B,1> VB;
-        typedef static_matrix<TX,B,1> VX;
-        typedef static_matrix<TR,B,1> VR;
-
-        auto _b = b.template reinterpret<VB>();
-        auto _x = x.template reinterpret<VX>();
-        auto _r = r.template reinterpret<VR>();
-
-        _r = vex_convert<TB,TR,B>().apply(vex_sub<TB, TA, B>().apply(_b, A * _x));
-    }
-};
-
-template < typename Alpha, typename Beta, typename TX, typename TY, typename TZ, int B >
-struct vmul_impl<
-    Alpha, vex::vector< static_matrix<TX,B,B> >,
-    vex::vector< static_matrix<TY,B,1> >,
-    Beta, vex::vector< static_matrix<TZ,B,1> >
-    >
-{
-    typedef vex::vector< static_matrix<TX,B,B> > matrix;
-    typedef vex::vector< static_matrix<TY,B,1> > vectorY;
-    typedef vex::vector< static_matrix<TZ,B,1> > vectorZ;
-
-    static void apply(Alpha a, const matrix &x, const vectorY &y, Beta b, vectorZ &z)
-    {
-        if (b)
-            z = vex_add<TZ,TX,B>().apply(vex_scale<TZ,B>().apply(b, z), vex_scale<TX,B>().apply(a, vex_mul<TX,TY,B>().apply(x, y)));
-        else
-            z = vex_convert<TX,TZ,B>().apply(vex_scale<TX,B>().apply(a, vex_mul<TX,TY,B>().apply(x, y)));
-    }
-};
-
-template < typename T, int B >
-struct clear_impl< vex::vector< static_matrix<T,B,1> > >
-{
-    typedef static_matrix<T,B,1> vector_value;
-    typedef vex::vector<vector_value> vector;
-
-    static void apply(vector &x) {
-        x.template reinterpret<T>() = 0;
-    }
-};
-
-template < typename T, int B >
-struct copy_impl<
-    vex::vector< static_matrix<T,B,1> >,
-    vex::vector< static_matrix<T,B,1> >
-    >
-{
-    typedef vex::vector< static_matrix<T,B,1> > vector;
-
-    static void apply(const vector &x, vector &y) {
-        auto X = x.template reinterpret<T>();
-        auto Y = y.template reinterpret<T>();
-        Y = X;
-    }
-};
-
-template < typename A, typename B, typename TX, typename TY, int N >
-struct axpby_impl<
-    A, vex::vector< static_matrix<TX, N, 1> >,
-    B, vex::vector< static_matrix<TY, N, 1> >
-    >
-{
-    typedef vex::vector< static_matrix<TX,N,1> > vectorX;
-    typedef vex::vector< static_matrix<TY,N,1> > vectorY;
-
-    static void apply(A a, const vectorX &x, B b, vectorY &y) {
-        if (b)
-            y.template reinterpret<TY>() =
-                a * x.template reinterpret<TX>() +
-                b * y.template reinterpret<TY>();
-        else
-            y.template reinterpret<TY>() =
-                a * x.template reinterpret<TX>();
-    }
-};
-
-template < typename A, typename B, typename C, typename TX, typename TY, typename TZ, int N >
-struct axpbypcz_impl<
-    A, vex::vector< static_matrix<TX, N, 1> >,
-    B, vex::vector< static_matrix<TY, N, 1> >,
-    C, vex::vector< static_matrix<TZ, N, 1> >
-    >
-{
-    typedef vex::vector< static_matrix<TX,N,1> > vectorX;
-    typedef vex::vector< static_matrix<TY,N,1> > vectorY;
-    typedef vex::vector< static_matrix<TZ,N,1> > vectorZ;
-
-    static void apply(A a, const vectorX &x, B b, const vectorY &y, C c, vectorZ &z) {
-        if (c)
-            z.template reinterpret<TZ>() =
-                a * x.template reinterpret<TX>() +
-                b * y.template reinterpret<TY>() +
-                c * z.template reinterpret<TZ>();
-        else
-            z.template reinterpret<TZ>() =
-                a * x.template reinterpret<TX>() +
-                b * y.template reinterpret<TY>();
-    }
-};
-
-template < typename T, int B >
-struct inner_product_impl<
-    vex::vector< static_matrix<T,B,1> >,
-    vex::vector< static_matrix<T,B,1> >
-    >
-{
-    typedef T return_type;
-    typedef static_matrix<T,B,1> vector_value;
-    typedef vex::vector<vector_value> vector;
-
-    static return_type get(const vector &x, const vector &y) {
-        vex::Reductor<T, vex::SUM_Kahan> sum( x.queue_list() );
-        return sum( x.template reinterpret<T>() * y.template reinterpret<T>() );
-    }
-};
-
-namespace detail {
-
-template <class V1, class V2>
-struct common_scalar_backend< backend::vexcl<V1>, backend::vexcl<V2>,
-    typename std::enable_if<
-        math::static_rows<V1>::value != 1 ||
-        math::static_rows<V2>::value != 1
-        >::type>
-{
-    typedef typename math::scalar_of<V1>::type S1;
-    typedef typename math::scalar_of<V2>::type S2;
-
-    typedef
-        typename std::conditional<
-            (sizeof(S1) > sizeof(S2)), backend::vexcl<S1>, backend::vexcl<S2>
-            >::type
-        type;
-};
-
-} // namespace detail
-} // namespace backend
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/backend/viennacl.hpp b/src/solvers/amgcl/backend/viennacl.hpp
deleted file mode 100644
index 73b993a..0000000
--- a/src/solvers/amgcl/backend/viennacl.hpp
+++ /dev/null
@@ -1,462 +0,0 @@
-#ifndef AMGCL_BACKEND_VIENNACL_HPP
-#define AMGCL_BACKEND_VIENNACL_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/backend/viennacl.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  ViennaCL backend.
- */
-
-#include <type_traits>
-
-#include <viennacl/vector.hpp>
-#include <viennacl/compressed_matrix.hpp>
-#include <viennacl/ell_matrix.hpp>
-#include <viennacl/hyb_matrix.hpp>
-#include <viennacl/linalg/inner_prod.hpp>
-#include <viennacl/linalg/prod.hpp>
-
-#include <amgcl/util.hpp>
-#include <amgcl/backend/interface.hpp>
-#include <amgcl/backend/builtin.hpp>
-#include <amgcl/solver/skyline_lu.hpp>
-
-namespace amgcl {
-
-namespace solver {
-
-/** Wrapper around solver::skyline_lu for use with the ViennaCL backend.
- * Copies the rhs to the host memory, solves the problem using the host CPU,
- * then copies the solution back to the compute device(s).
- */
-template <class T>
-struct viennacl_skyline_lu : solver::skyline_lu<T> {
-    typedef solver::skyline_lu<T> Base;
-
-    mutable std::vector<T> _rhs, _x;
-
-    template <class Matrix, class Params>
-    viennacl_skyline_lu(const Matrix &A, const Params&)
-        : Base(*A), _rhs(backend::rows(*A)), _x(backend::rows(*A))
-    { }
-
-    template <class Vec1, class Vec2>
-    void operator()(const Vec1 &rhs, Vec2 &x) const {
-        viennacl::fast_copy(rhs, _rhs);
-        static_cast<const Base*>(this)->operator()(_rhs, _x);
-        viennacl::fast_copy(_x, x);
-    }
-};
-
-}
-
-namespace backend {
-
-/// ViennaCL backend
-/**
- * This is a backend that uses types defined in the ViennaCL library
- * (http://viennacl.sourceforge.net).
- *
- * \param Matrix ViennaCL matrix to use with the backend. Possible choices are
- * viannacl::compressed_matrix<T>, viennacl::ell_matrix<T>, and
- * viennacl::hyb_matrix<T>.
- * \ingroup backends
- */
-template <
-    class Matrix,
-    class DirectSolver = solver::viennacl_skyline_lu<typename backend::value_type<Matrix>::type>
-    >
-struct viennacl {
-    typedef typename backend::value_type<Matrix>::type value_type;
-    typedef ptrdiff_t                                  index_type;
-    typedef ptrdiff_t                                  col_type;
-    typedef ptrdiff_t                                  ptr_type;
-    typedef Matrix                                     matrix;
-    typedef ::viennacl::vector<value_type>             vector;
-    typedef ::viennacl::vector<value_type>             matrix_diagonal;
-    typedef DirectSolver                               direct_solver;
-
-    struct provides_row_iterator : std::false_type {};
-
-    /// Backend parameters.
-    typedef amgcl::detail::empty_params params;
-
-    static std::string name() { return "viennacl"; }
-
-    /// Copy matrix from builtin backend.
-    static std::shared_ptr<matrix>
-    copy_matrix(
-            std::shared_ptr< typename builtin<value_type>::matrix > A,
-            const params&
-            )
-    {
-        auto m = std::make_shared<matrix>();
-        ::viennacl::copy(viennacl_matrix_adapter(*A), *m);
-        return m;
-    }
-
-    /// Copy vector from builtin backend.
-    static std::shared_ptr<vector>
-    copy_vector(typename builtin<value_type>::vector const &x, const params&)
-    {
-        auto v = std::make_shared<vector>(x.size());
-        ::viennacl::fast_copy(x.data(), x.data() + x.size(), v->begin());
-        return v;
-    }
-
-    /// Copy vector from builtin backend.
-    static std::shared_ptr<vector>
-    copy_vector(
-            std::shared_ptr< typename builtin<value_type>::vector > x,
-            const params &prm
-            )
-    {
-        return copy_vector(*x, prm);
-    }
-
-    /// Create vector of the specified size.
-    static std::shared_ptr<vector>
-    create_vector(size_t size, const params&)
-    {
-        return std::make_shared<vector>(size);
-    }
-
-    /// Create direct solver for coarse level
-    static std::shared_ptr<direct_solver>
-    create_solver(std::shared_ptr< typename builtin<value_type>::matrix > A, const params &prm)
-    {
-        return std::make_shared<direct_solver>(A, prm);
-    }
-
-    private:
-        struct viennacl_matrix_adapter {
-            typedef ptrdiff_t index_type;
-            typedef size_t    size_type;
-
-            class const_iterator1;
-
-            class const_iterator2 {
-                public:
-                    bool operator!=(const const_iterator2 &it) const {
-                        return pos != it.pos;
-                    }
-
-                    const const_iterator2& operator++() {
-                        ++pos;
-                        return *this;
-                    }
-
-                    index_type index1() const {
-                        return row;
-                    }
-
-                    index_type index2() const {
-                        return col[pos];
-                    }
-
-                    value_type operator*() const {
-                        return val[pos];
-                    }
-                private:
-                    const_iterator2(index_type row, index_type pos,
-                            const index_type *col, const value_type *val)
-                        : row(row), pos(pos), col(col), val(val)
-                    { }
-
-                    index_type        row;
-                    index_type        pos;
-                    const index_type *col;
-                    const value_type *val;
-
-                    friend class const_iterator1;
-            };
-
-            class const_iterator1 {
-                public:
-                    bool operator!=(const const_iterator1 &it) const {
-                        return pos != it.pos;
-                    }
-
-                    const const_iterator1& operator++() {
-                        ++pos;
-                        return *this;
-                    }
-
-                    index_type index1() const {
-                        return pos;
-                    }
-
-                    const const_iterator2 begin() const {
-                        return const_iterator2(pos, row[pos], col, val);
-                    }
-
-                    const const_iterator2 end() const {
-                        return const_iterator2(pos, row[pos + 1], col, val);
-                    }
-                private:
-                    const_iterator1(index_type pos,
-                            const index_type *row,
-                            const index_type *col,
-                            const value_type *val
-                            )
-                        : pos(pos), row(row), col(col), val(val)
-                    { }
-
-                    index_type pos;
-                    const index_type *row;
-                    const index_type *col;
-                    const value_type *val;
-
-                    friend struct viennacl_matrix_adapter;
-            };
-
-            viennacl_matrix_adapter(
-                    const typename backend::builtin<value_type>::matrix &A)
-                : rows(A.nrows), cols(A.ncols),
-                  row(A.ptr), col(A.col), val(A.val)
-            { }
-
-            const_iterator1 begin1() const {
-                return const_iterator1(0, row, col, val);
-            }
-
-            const_iterator1 end1() const {
-                return const_iterator1(rows, row, col, val);
-            }
-
-            size_t size1() const {
-                return rows;
-            }
-
-            size_t size2() const {
-                return cols;
-            }
-            private:
-                size_t rows;
-                size_t cols;
-
-                const index_type *row;
-                const index_type *col;
-                const value_type *val;
-        };
-};
-
-template <class T>
-struct is_viennacl_matrix : std::false_type {};
-
-template <class V>
-struct is_viennacl_matrix< ::viennacl::compressed_matrix<V> > : std::true_type
-{};
-
-template <class V>
-struct is_viennacl_matrix< ::viennacl::hyb_matrix<V> > : std::true_type
-{};
-
-template <class V>
-struct is_viennacl_matrix< ::viennacl::ell_matrix<V> > : std::true_type
-{};
-
-template <class M>
-struct value_type<
-    M,
-    typename std::enable_if< is_viennacl_matrix<M>::value >::type
-    >
-{
-    typedef typename M::value_type::value_type type;
-};
-
-template <class V>
-struct value_type< ::viennacl::vector<V> >
-{
-    typedef V type;
-};
-
-template <class M>
-struct rows_impl<
-    M,
-    typename std::enable_if< is_viennacl_matrix<M>::value >::type
-    >
-{
-    static size_t get(const M &A) {
-        return A.size1();
-    }
-};
-
-template <class M>
-struct cols_impl<
-    M,
-    typename std::enable_if< is_viennacl_matrix<M>::value >::type
-    >
-{
-    static size_t get(const M &A) {
-        return A.size2();
-    }
-};
-
-template <class V>
-struct nonzeros_impl< ::viennacl::compressed_matrix<V> > {
-    static size_t get(const ::viennacl::compressed_matrix<V> &A) {
-        return A.nnz();
-    }
-};
-
-template <class V>
-struct nonzeros_impl< ::viennacl::ell_matrix<V> > {
-    static size_t get(const ::viennacl::ell_matrix<V> &A) {
-        return A.nnz();
-    }
-};
-
-template <class V>
-struct nonzeros_impl< ::viennacl::hyb_matrix<V> > {
-    static size_t get(const ::viennacl::hyb_matrix<V> &A) {
-        return A.ell_nnz() + A.csr_nnz();
-    }
-};
-
-template <class Alpha, class Mtx, class Beta, class Vec>
-struct spmv_impl<
-    Alpha, Mtx, Vec, Beta, Vec,
-    typename std::enable_if< is_viennacl_matrix<Mtx>::value >::type
-    >
-{
-    static void apply(Alpha alpha, const Mtx &A, const Vec &x, Beta beta, Vec &y)
-    {
-        if (beta)
-            y = alpha * ::viennacl::linalg::prod(A, x) + beta * y;
-        else
-            y = alpha * ::viennacl::linalg::prod(A, x);
-    }
-};
-
-template <class Mtx, class Vec>
-struct residual_impl<
-    Mtx, Vec, Vec, Vec,
-    typename std::enable_if< is_viennacl_matrix<Mtx>::value >::type
-    >
-{
-    typedef typename value_type<Mtx>::type V;
-
-    static void apply(const Vec &rhs, const Mtx &A, const Vec &x, Vec &r)
-    {
-        r = ::viennacl::linalg::prod(A, x);
-        r = rhs - r;
-    }
-};
-
-template < typename V >
-struct clear_impl< ::viennacl::vector<V> >
-{
-    static void apply(::viennacl::vector<V> &x)
-    {
-        x.clear();
-    }
-};
-
-template < typename V >
-struct inner_product_impl<
-    ::viennacl::vector<V>,
-    ::viennacl::vector<V>
-    >
-{
-    static V get(const ::viennacl::vector<V> &x, const ::viennacl::vector<V> &y)
-    {
-        return ::viennacl::linalg::inner_prod(x, y);
-    }
-};
-
-template < typename A, typename B, typename V >
-struct axpby_impl<
-    A, ::viennacl::vector<V>,
-    B, ::viennacl::vector<V>
-    >
-{
-    static void apply(
-            A a, const ::viennacl::vector<V> &x,
-            B b, ::viennacl::vector<V> &y
-            )
-    {
-        if (b)
-            y = a * x + b * y;
-        else
-            y = a * x;
-    }
-};
-
-template < typename A, typename B, typename C, typename V >
-struct axpbypcz_impl<
-    A, ::viennacl::vector<V>,
-    B, ::viennacl::vector<V>,
-    C, ::viennacl::vector<V>
-    >
-{
-    static void apply(
-            A a, const ::viennacl::vector<V> &x,
-            B b, const ::viennacl::vector<V> &y,
-            C c,       ::viennacl::vector<V> &z
-            )
-    {
-        if (c)
-            z = a * x + b * y + c * z;
-        else
-            z = a * x + b * y;
-    }
-};
-
-template < typename A, typename B, typename V >
-struct vmul_impl<
-    A, ::viennacl::vector<V>, ::viennacl::vector<V>,
-    B, ::viennacl::vector<V>
-    >
-{
-    static void apply(
-            A a, const ::viennacl::vector<V> &x, const ::viennacl::vector<V> &y,
-            B b, ::viennacl::vector<V> &z)
-    {
-        if (b)
-            z = a * ::viennacl::linalg::element_prod(x, y) + b * z;
-        else
-            z = a * ::viennacl::linalg::element_prod(x, y);
-    }
-};
-
-template < typename V >
-struct copy_impl<
-    ::viennacl::vector<V>,
-    ::viennacl::vector<V>
-    >
-{
-    static void apply(const ::viennacl::vector<V> &x, ::viennacl::vector<V> &y)
-    {
-        y = x;
-    }
-};
-
-} // namespace backend
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/coarsening/aggregation.hpp b/src/solvers/amgcl/coarsening/aggregation.hpp
deleted file mode 100644
index e7d490c..0000000
--- a/src/solvers/amgcl/coarsening/aggregation.hpp
+++ /dev/null
@@ -1,164 +0,0 @@
-#ifndef AMGCL_COARSENING_AGGREGATION_HPP
-#define AMGCL_COARSENING_AGGREGATION_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/coarsening/aggregation.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Non-smoothed aggregation coarsening.
- */
-
-#include <tuple>
-#include <memory>
-
-#include <amgcl/backend/builtin.hpp>
-#include <amgcl/coarsening/detail/scaled_galerkin.hpp>
-#include <amgcl/coarsening/pointwise_aggregates.hpp>
-#include <amgcl/coarsening/tentative_prolongation.hpp>
-#include <amgcl/util.hpp>
-
-namespace amgcl {
-
-/// Coarsening strategies
-namespace coarsening {
-
-/**
- * \defgroup coarsening Coarsening strategies
- * \brief Coarsening strategies for AMG hirarchy construction.
- *
- * A coarsener in AMGCL is a class that takes a system matrix and returns three
- * operators:
- *
- * 1. Restriction operator R that downsamples the residual error to a
- *    coarser level in AMG hierarchy,
- * 2. Prolongation operator P that interpolates a correction computed on a
- *    coarser grid into a finer grid,
- * 3. System matrix \f$A^H\f$ at a coarser level that is usually computed as a
- *    Galerkin operator \f$A^H = R A^h P\f$.
- *
- * The AMG hierarchy is constructed by recursive invocation of the selected
- * coarsener.
- */
-
-/// Non-smoothed aggregation.
-/**
- * \ingroup coarsening
- */
-template <class Backend>
-struct aggregation {
-    typedef pointwise_aggregates Aggregates;
-
-    /// Coarsening parameters.
-    struct params {
-        /// Aggregation parameters.
-        Aggregates::params aggr;
-
-        /// Near nullspace parameters.
-        nullspace_params nullspace;
-
-        /// Over-interpolation factor \f$\alpha\f$.
-        /**
-         * In case of aggregation coarsening, coarse-grid
-         * correction of smooth error, and by this the overall convergence, can
-         * often be substantially improved by using "over-interpolation", that is,
-         * by multiplying the actual correction (corresponding to piecewise
-         * constant interpolation) by some factor \f$\alpha > 1\f$. Equivalently,
-         * this means that the coarse-level Galerkin operator is re-scaled by
-         * \f$1 / \alpha\f$:
-         * \f[I_h^HA_hI_H^h \to \frac{1}{\alpha}I_h^HA_hI_H^h.\f]
-         *
-         * \sa  \cite Stuben1999, Section 9.1 "Re-scaling of the Galerkin operator".
-         */
-        float over_interp;
-
-        params()
-            : over_interp(math::static_rows<typename Backend::value_type>::value == 1 ? 1.5f : 2.0f)
-        {}
-
-#ifndef AMGCL_NO_BOOST
-        params(const boost::property_tree::ptree &p)
-            : AMGCL_PARAMS_IMPORT_CHILD(p, aggr),
-              AMGCL_PARAMS_IMPORT_CHILD(p, nullspace),
-              AMGCL_PARAMS_IMPORT_VALUE(p, over_interp)
-        {
-            check_params(p, {"aggr", "nullspace", "over_interp"});
-        }
-
-        void get(boost::property_tree::ptree &p, const std::string &path) const {
-            AMGCL_PARAMS_EXPORT_CHILD(p, path, aggr);
-            AMGCL_PARAMS_EXPORT_CHILD(p, path, nullspace);
-            AMGCL_PARAMS_EXPORT_VALUE(p, path, over_interp);
-        }
-#endif
-    } prm;
-
-    aggregation(const params &prm = params()) : prm(prm) {}
-
-    /// Creates transfer operators for the given system matrix.
-    /**
-     * \param A   The system matrix.
-     * \param prm Coarsening parameters.
-     * \returns   A tuple of prolongation and restriction operators.
-     */
-    template <class Matrix>
-    std::tuple<
-        std::shared_ptr<Matrix>,
-        std::shared_ptr<Matrix>
-        >
-    transfer_operators(const Matrix &A) {
-        const size_t n = rows(A);
-
-        AMGCL_TIC("aggregates");
-        Aggregates aggr(A, prm.aggr, prm.nullspace.cols);
-        AMGCL_TOC("aggregates");
-
-        AMGCL_TIC("interpolation");
-        auto P = tentative_prolongation<Matrix>(
-                n, aggr.count, aggr.id, prm.nullspace, prm.aggr.block_size
-                );
-        AMGCL_TOC("interpolation");
-
-        return std::make_tuple(P, transpose(*P));
-    }
-
-    /// Creates system matrix for the coarser level.
-    /**
-     * \param A The system matrix at the finer level.
-     * \param P Prolongation operator returned by transfer_operators().
-     * \param R Restriction operator returned by transfer_operators().
-     * \returns System matrix for the coarser level.
-     */
-    template <class Matrix>
-    std::shared_ptr<Matrix>
-    coarse_operator(const Matrix &A, const Matrix &P, const Matrix &R) const {
-        return detail::scaled_galerkin(A, P, R, 1 / prm.over_interp);
-    }
-};
-
-} // namespace coarsening
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/coarsening/as_scalar.hpp b/src/solvers/amgcl/coarsening/as_scalar.hpp
deleted file mode 100644
index 218a2dc..0000000
--- a/src/solvers/amgcl/coarsening/as_scalar.hpp
+++ /dev/null
@@ -1,119 +0,0 @@
-#ifndef AMGCL_COARSENING_AS_SCALAR_HPP
-#define AMGCL_COARSENING_AS_SCALAR_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/coarsening/as_scalar.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Scalar coarsening for block matrices.
- */
-
-#include <amgcl/adapter/block_matrix.hpp>
-#include <amgcl/backend/builtin.hpp>
-#include <amgcl/value_type/interface.hpp>
-
-namespace amgcl {
-namespace coarsening {
-
-// Takes a block matrix as input,
-// converts it to the scalar format,
-// applies the base coarsening,
-// converts the results back to block format.
-template <template <class> class Coarsening>
-struct as_scalar {
-    template <class Backend>
-    struct type {
-        typedef typename math::element_of<typename Backend::value_type>::type Scalar;
-        typedef backend::builtin<Scalar, typename Backend::col_type, typename Backend::ptr_type> BaseBackend;
-        typedef Coarsening<BaseBackend> Base;
-
-        typedef typename Base::params params;
-        Base base;
-
-        type(const params &prm = params()) : base(prm) {};
-
-        template <class Matrix>
-        typename std::enable_if<
-            backend::coarsening_is_supported<BaseBackend, Coarsening>::value &&
-            (math::static_rows<typename backend::value_type<Matrix>::type>::value > 1),
-            std::tuple<
-                std::shared_ptr<Matrix>,
-                std::shared_ptr<Matrix>
-                >
-            >::type
-        transfer_operators(const Matrix &B) {
-            typedef typename backend::value_type<Matrix>::type Block;
-            auto T = base.transfer_operators(*adapter::unblock_matrix(B));
-
-            auto &P = *std::get<0>(T);
-            auto &R = *std::get<1>(T);
-
-            backend::sort_rows(P);
-            backend::sort_rows(R);
-
-            return std::make_tuple(
-                    std::make_shared<Matrix>(adapter::block_matrix<Block>(P)),
-                    std::make_shared<Matrix>(adapter::block_matrix<Block>(R))
-                    );
-        }
-
-        template <class Matrix>
-        typename std::enable_if<
-            backend::coarsening_is_supported<BaseBackend, Coarsening>::value &&
-            (math::static_rows<typename backend::value_type<Matrix>::type>::value == 1),
-            std::tuple<
-                std::shared_ptr<Matrix>,
-                std::shared_ptr<Matrix>
-                >
-            >::type
-        transfer_operators(const Matrix &A) {
-            return base.transfer_operators(A);
-        }
-
-        template <class Matrix>
-        typename std::enable_if<
-            !backend::coarsening_is_supported<BaseBackend, Coarsening>::value,
-            std::tuple<
-                std::shared_ptr<Matrix>,
-                std::shared_ptr<Matrix>
-                >
-            >::type
-        transfer_operators(const Matrix&) {
-            throw std::logic_error("The coarsening is not supported by the backend");
-        }
-
-        template <class Matrix>
-        std::shared_ptr<Matrix>
-        coarse_operator(const Matrix &A, const Matrix &P, const Matrix &R) const {
-            return base.coarse_operator(A, P, R);
-        }
-    };
-};
-
-} // namespace coarsening
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/coarsening/detail/galerkin.hpp b/src/solvers/amgcl/coarsening/detail/galerkin.hpp
deleted file mode 100644
index 7f5a658..0000000
--- a/src/solvers/amgcl/coarsening/detail/galerkin.hpp
+++ /dev/null
@@ -1,53 +0,0 @@
-#ifndef AMGCL_COARSENING_DETAIL_GALERKIN_HPP
-#define AMGCL_COARSENING_DETAIL_GALERKIN_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/coarsening/detail/galerkin.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Galerkin operator.
- */
-
-#include <memory>
-#include <amgcl/backend/builtin.hpp>
-
-namespace amgcl {
-namespace coarsening {
-namespace detail {
-
-template <class Matrix>
-std::shared_ptr<Matrix> galerkin(
-        const Matrix &A, const Matrix &P, const Matrix &R
-        )
-{
-    return product(R, *product(A, P));
-}
-
-} // namespace detail
-} // namespace coarsening
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/coarsening/detail/scaled_galerkin.hpp b/src/solvers/amgcl/coarsening/detail/scaled_galerkin.hpp
deleted file mode 100644
index 2e5fbcf..0000000
--- a/src/solvers/amgcl/coarsening/detail/scaled_galerkin.hpp
+++ /dev/null
@@ -1,59 +0,0 @@
-#ifndef AMGCL_COARSENING_DETAIL_SCALED_GALERKIN_HPP
-#define AMGCL_COARSENING_DETAIL_SCALED_GALERKIN_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/coarsening/detail/scaled_galerkin.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Scaled Galerkin operator.
- */
-
-#include <amgcl/coarsening/detail/galerkin.hpp>
-
-namespace amgcl {
-namespace coarsening {
-namespace detail {
-
-template <class Matrix>
-std::shared_ptr<Matrix> scaled_galerkin(
-        const Matrix &A,
-        const Matrix &P,
-        const Matrix &R,
-        float s
-        )
-{
-        auto a = galerkin(A, P, R);
-        scale(*a, s);
-        return a;
-}
-
-} // namespace detail
-} // namespace coarsening
-} // namespace amgcl
-
-
-
-#endif
diff --git a/src/solvers/amgcl/coarsening/plain_aggregates.hpp b/src/solvers/amgcl/coarsening/plain_aggregates.hpp
deleted file mode 100644
index 0e34e94..0000000
--- a/src/solvers/amgcl/coarsening/plain_aggregates.hpp
+++ /dev/null
@@ -1,213 +0,0 @@
-#ifndef AMGCL_COARSENING_PLAIN_AGGREGATES_HPP
-#define AMGCL_COARSENING_PLAIN_AGGREGATES_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/coarsening/plain_aggregates.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Plain aggregation.
- */
-
-#include <vector>
-#include <numeric>
-
-#include <amgcl/util.hpp>
-#include <amgcl/backend/builtin.hpp>
-
-namespace amgcl {
-namespace coarsening {
-
-/**
- * \defgroup aggregates Aggregates
- * \brief These classes control how fine-level variables are subdivided into
- * aggregates.
- */
-
-/// Plain aggregation.
-/**
- * Modification of a greedy aggregation scheme from \cite Vanek1996.
- * Connectivity is defined in a symmetric way, that is, two variables \f$i\f$
- * and \f$j\f$ are considered to be connected to each other if
- * \f$a_{ij}^2/a_{ii}a_{jj} > \varepsilon_{strong}\f$. Variables without
- * neighbours (resulting, e.g., from Dirichlet conditions) are excluded from
- * aggregation process. The aggregation is completed in a single pass over
- * variables: variables adjacent to a new aggregate are temporarily marked as
- * beloning to this aggregate. Later they may be claimed by other aggregates;
- * if nobody claims them, then they just stay in their initial aggregate.
- *
- * \ingroup aggregates
- */
-struct plain_aggregates {
-    /// Aggregation parameters.
-    struct params {
-        /// Parameter \f$\varepsilon_{strong}\f$ defining strong couplings.
-        /**
-         * Connectivity is defined in a symmetric way, that is, two variables
-         * \f$i\f$ and \f$j\f$ are considered to be connected to each other if
-         * \f$a_{ij}^2/a_{ii}a_{jj} > \varepsilon_{strong}\f$ with fixed \f$0 <
-         * \varepsilon_{strong} < 1.\f$
-         */
-        float eps_strong;
-
-        params() : eps_strong(0.08f) {}
-
-#ifndef AMGCL_NO_BOOST
-        params(const boost::property_tree::ptree &p)
-            : AMGCL_PARAMS_IMPORT_VALUE(p, eps_strong)
-        {
-            check_params(p, {"eps_strong", "block_size"});
-        }
-
-        void get(boost::property_tree::ptree &p, const std::string &path) const {
-            AMGCL_PARAMS_EXPORT_VALUE(p, path, eps_strong);
-        }
-#endif
-    };
-
-    static const ptrdiff_t undefined = -1;
-    static const ptrdiff_t removed   = -2;
-
-    /// Number of aggregates.
-    size_t count;
-
-    /// Strong connectivity matrix.
-    /**
-     * This is just 'values' part of CRS matrix. 'col' and 'ptr' arrays are
-     * borrowed from the system matrix.
-     */
-    std::vector<char> strong_connection;
-
-    /// Aggerate id that each fine-level variable belongs to.
-    /** When id[i] < 0, then variable i stays at the fine level (this could be
-     * the case for a Dirichelt condition variable).*/
-    std::vector<ptrdiff_t> id;
-
-    /// Constructs aggregates for a given matrix.
-    /**
-     * \param A   The system matrix.
-     * \param prm Aggregation parameters.
-     */
-    template <class Matrix>
-    plain_aggregates(const Matrix &A, const params &prm)
-        : count(0),
-          strong_connection( backend::nonzeros(A) ),
-          id( backend::rows(A) )
-    {
-        typedef typename backend::value_type<Matrix>::type value_type;
-        typedef typename math::scalar_of<value_type>::type scalar_type;
-
-        scalar_type eps_squared = prm.eps_strong * prm.eps_strong;
-
-        const size_t n = rows(A);
-
-        /* 1. Get strong connections */
-        auto dia = diagonal(A);
-#pragma omp parallel for
-        for(ptrdiff_t i = 0; i < static_cast<ptrdiff_t>(n); ++i) {
-            value_type eps_dia_i = eps_squared * (*dia)[i];
-
-            for(ptrdiff_t j = A.ptr[i], e = A.ptr[i+1]; j < e; ++j) {
-                ptrdiff_t c = A.col[j];
-                value_type v = A.val[j];
-
-                strong_connection[j] = (c != i) && (eps_dia_i * (*dia)[c] < v * v);
-            }
-        }
-
-        /* 2. Get aggregate ids */
-
-        // Remove lonely nodes.
-        size_t max_neib = 0;
-        for(size_t i = 0; i < n; ++i) {
-            ptrdiff_t j = A.ptr[i], e = A.ptr[i+1];
-            max_neib    = std::max<size_t>(max_neib, e - j);
-
-            ptrdiff_t state = removed;
-            for(; j < e; ++j)
-                if (strong_connection[j]) {
-                    state = undefined;
-                    break;
-                }
-
-            id[i] = state;
-        }
-
-        std::vector<ptrdiff_t> neib;
-        neib.reserve(max_neib);
-
-        // Perform plain aggregation
-        for(size_t i = 0; i < n; ++i) {
-            if (id[i] != undefined) continue;
-
-            // The point is not adjacent to a core of any previous aggregate:
-            // so its a seed of a new aggregate.
-            ptrdiff_t cur_id = static_cast<ptrdiff_t>(count++);
-            id[i] = cur_id;
-
-            // (*) Include its neighbors as well.
-            neib.clear();
-            for(ptrdiff_t j = A.ptr[i], e = A.ptr[i+1]; j < e; ++j) {
-                ptrdiff_t c = A.col[j];
-                if (strong_connection[j] && id[c] != removed) {
-                    id[c] = cur_id;
-                    neib.push_back(c);
-                }
-            }
-
-            // Temporarily mark undefined points adjacent to the new aggregate
-            // as members of the aggregate.
-            // If nobody claims them later, they will stay here.
-            for(ptrdiff_t c : neib) {
-                for(ptrdiff_t j = A.ptr[c], e = A.ptr[c+1]; j < e; ++j) {
-                    ptrdiff_t cc = A.col[j];
-                    if (strong_connection[j] && id[cc] == undefined)
-                        id[cc] = cur_id;
-                }
-            }
-        }
-
-        if (!count) throw error::empty_level();
-
-        // Some of the aggregates could potentially vanish during expansion
-        // step (*) above. We need to exclude those and renumber the rest.
-        std::vector<ptrdiff_t> cnt(count, 0);
-        for(ptrdiff_t i : id)
-            if (i >= 0) cnt[i] = 1;
-        std::partial_sum(cnt.begin(), cnt.end(), cnt.begin());
-
-        if (static_cast<ptrdiff_t>(count) > cnt.back()) {
-            count = cnt.back();
-
-            for(size_t i = 0; i < n; ++i)
-                if (id[i] >= 0) id[i] = cnt[id[i]] - 1;
-        }
-    }
-};
-
-} // namespace coarsening
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/coarsening/pointwise_aggregates.hpp b/src/solvers/amgcl/coarsening/pointwise_aggregates.hpp
deleted file mode 100644
index 79ed482..0000000
--- a/src/solvers/amgcl/coarsening/pointwise_aggregates.hpp
+++ /dev/null
@@ -1,197 +0,0 @@
-#ifndef AMGCL_COARSENING_POINTWISE_AGGREGATES_HPP
-#define AMGCL_COARSENING_POINTWISE_AGGREGATES_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/coarsening/pointwise_aggregates.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Pointwise aggregation.
- */
-
-#include <vector>
-#include <cmath>
-
-#include <amgcl/util.hpp>
-#include <amgcl/backend/builtin.hpp>
-#include <amgcl/coarsening/plain_aggregates.hpp>
-
-namespace amgcl {
-namespace coarsening {
-
-/// Pointwise aggregation.
-/**
- * The system matrix should have block structure. It is reduced to a single
- * value per block and is subjected to coarsening::plain_aggregation.
- *
- * \ingroup aggregates
- */
-class pointwise_aggregates {
-    public:
-        /// Aggregation parameters.
-        struct params : plain_aggregates::params {
-            /// Block size for the system matrix.
-            /**
-             * When block_size=1, the scheme is equivalent to (and performs on
-             * par with) plain_aggregates.
-             */
-            unsigned block_size;
-
-            params() : block_size(1) {}
-
-#ifndef AMGCL_NO_BOOST
-            params(const boost::property_tree::ptree &p)
-                : plain_aggregates::params(p),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, block_size)
-            {
-                check_params(p, {"eps_strong", "block_size"});
-            }
-
-            void get(boost::property_tree::ptree &p, const std::string &path) const {
-                plain_aggregates::params::get(p, path);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, block_size);
-            }
-#endif
-        };
-
-        static const ptrdiff_t undefined = -1;
-        static const ptrdiff_t removed   = -2;
-
-        /// \copydoc amgcl::coarsening::plain_aggregates::count
-        size_t count;
-
-        /// \copydoc amgcl::coarsening::plain_aggregates::strong_connection
-        std::vector<char> strong_connection;
-
-        /// \copydoc amgcl::coarsening::plain_aggregates::id
-        std::vector<ptrdiff_t> id;
-
-        /// \copydoc amgcl::coarsening::plain_aggregates::plain_aggregates
-        template <class Matrix>
-        pointwise_aggregates(const Matrix &A, const params &prm, unsigned min_aggregate)
-            : count(0)
-        {
-            if (prm.block_size == 1) {
-                plain_aggregates aggr(A, prm);
-
-                remove_small_aggregates(A.nrows, 1, min_aggregate, aggr);
-
-                count = aggr.count;
-                strong_connection.swap(aggr.strong_connection);
-                id.swap(aggr.id);
-            } else {
-                strong_connection.resize( nonzeros(A) );
-                id.resize( rows(A) );
-
-                auto ap = backend::pointwise_matrix(A, prm.block_size);
-                auto &Ap = *ap;
-
-                plain_aggregates pw_aggr(Ap, prm);
-
-                remove_small_aggregates(
-                        Ap.nrows, prm.block_size, min_aggregate, pw_aggr);
-
-                count = pw_aggr.count * prm.block_size;
-
-#pragma omp parallel
-                {
-                    std::vector<ptrdiff_t> j(prm.block_size);
-                    std::vector<ptrdiff_t> e(prm.block_size);
-
-#pragma omp for
-                    for(ptrdiff_t ip = 0; ip < static_cast<ptrdiff_t>(Ap.nrows); ++ip) {
-                        ptrdiff_t ia = ip * prm.block_size;
-
-                        for(unsigned k = 0; k < prm.block_size; ++k, ++ia) {
-                            id[ia] = prm.block_size * pw_aggr.id[ip] + k;
-
-                            j[k] = A.ptr[ia];
-                            e[k] = A.ptr[ia+1];
-                        }
-
-                        for(ptrdiff_t jp = Ap.ptr[ip], ep = Ap.ptr[ip+1]; jp < ep; ++jp) {
-                            ptrdiff_t cp = Ap.col[jp];
-                            bool      sp = (cp == ip) || pw_aggr.strong_connection[jp];
-
-                            ptrdiff_t col_end = (cp + 1) * prm.block_size;
-
-                            for(unsigned k = 0; k < prm.block_size; ++k) {
-                                ptrdiff_t beg = j[k];
-                                ptrdiff_t end = e[k];
-
-                                while(beg < end && A.col[beg] < col_end) {
-                                    strong_connection[beg] = sp && A.col[beg] != (ia + k);
-                                    ++beg;
-                                }
-
-                                j[k] = beg;
-                            }
-                        }
-                    }
-                }
-            }
-        }
-
-        static void remove_small_aggregates(
-                size_t n, unsigned block_size, unsigned min_aggregate,
-                plain_aggregates &aggr
-                )
-        {
-            if (min_aggregate <= 1) return; // nothing to do
-
-            // Count entries in each of the aggregates
-            std::vector<ptrdiff_t> count(aggr.count, 0);
-
-            for(size_t i = 0; i < n; ++i) {
-                ptrdiff_t id = aggr.id[i];
-                if (id != removed) ++count[id];
-            }
-
-            // If any aggregate has less entries than required, remove it.
-            // Renumber the rest of the aggregates to leave no gaps.
-            size_t m = 0;
-            for(size_t i = 0; i < aggr.count; ++i) {
-                if (block_size * count[i] < min_aggregate) {
-                    count[i] = removed;
-                } else {
-                    count[i] = m++;
-                }
-            }
-
-            // Update aggregate count and aggregate ids.
-            aggr.count = m;
-
-            for(size_t i = 0; i < n; ++i) {
-                ptrdiff_t id = aggr.id[i];
-                if (id != removed) aggr.id[i] = count[id];
-            }
-        }
-};
-
-} // namespace coarsening
-} // namespace amgcl
-
-
-#endif
diff --git a/src/solvers/amgcl/coarsening/rigid_body_modes.hpp b/src/solvers/amgcl/coarsening/rigid_body_modes.hpp
deleted file mode 100644
index 41375d5..0000000
--- a/src/solvers/amgcl/coarsening/rigid_body_modes.hpp
+++ /dev/null
@@ -1,134 +0,0 @@
-#ifndef AMGCL_COARSENING_RIGID_BODY_MODES_HPP
-#define AMGCL_COARSENING_RIGID_BODY_MODES_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/coarsening/rigid_body_modes.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Create rigid body modes from coordinates.
- */
-
-#include <amgcl/util.hpp>
-
-namespace amgcl {
-namespace coarsening {
-
-// Create rigid body modes from coordinate vector.
-// To be used as near-nullspace vectors with aggregation coarsening
-// for 2D or 3D elasticity problems.
-// The output matrix B may be transposed on demand
-// (to be used as a set of deflation vectors).
-template <class Vector>
-int rigid_body_modes(int ndim, const Vector &coo, std::vector<double> &B, bool transpose = false) {
-    precondition(ndim == 2 || ndim == 3, "Only 2D or 3D problems are supported");
-    precondition(coo.size() % ndim == 0, "Coordinate vector size should be divisible by ndim");
-
-    size_t n = coo.size();
-    int nmodes = (ndim == 2 ? 3 : 6);
-    B.resize(n * nmodes, 0.0);
-
-    const int stride1 = transpose ? 1 : nmodes;
-    const int stride2 = transpose ? n : 1;
-
-    double sn = 1 / sqrt(n);
-
-    if (ndim == 2) {
-        for(size_t i = 0; i < n; ++i) {
-            size_t nod = i / ndim;
-            size_t dim = i % ndim;
-
-            double x = coo[nod * 2 + 0];
-            double y = coo[nod * 2 + 1];
-
-            // Translation
-            B[i * stride1 + dim * stride2] = sn;
-
-            // Rotation
-            switch(dim) {
-                case 0:
-                    B[i * stride1 + 2 * stride2] = -y;
-                    break;
-                case 1:
-                    B[i * stride1 + 2 * stride2] = x;
-                    break;
-            }
-        }
-    } else if (ndim == 3) {
-        for(size_t i = 0; i < n; ++i) {
-            size_t nod = i / ndim;
-            size_t dim = i % ndim;
-
-            double x = coo[nod * 3 + 0];
-            double y = coo[nod * 3 + 1];
-            double z = coo[nod * 3 + 2];
-
-            // Translation
-            B[i * stride1 + dim * stride2] = sn;
-
-            // Rotation
-            switch(dim) {
-                case 0:
-                    B[i * stride1 + 3 * stride2] = y;
-                    B[i * stride1 + 5 * stride2] = z;
-                    break;
-                case 1:
-                    B[i * stride1 + 3 * stride2] = -x;
-                    B[i * stride1 + 4 * stride2] = -z;
-                    break;
-                case 2:
-                    B[i * stride1 + 4 * stride2] =  y;
-                    B[i * stride1 + 5 * stride2] = -x;
-                    break;
-            }
-        }
-    }
-
-    // Orthonormalization
-    std::array<double, 6> dot;
-    for(int i = ndim; i < nmodes; ++i) {
-        std::fill(dot.begin(), dot.end(), 0.0);
-        for(size_t j = 0; j < n; ++j) {
-            for(int k = 0; k < i; ++k)
-                dot[k] += B[j * stride1 + k * stride2] * B[j * stride1 + i * stride2];
-        }
-        double s = 0.0;
-        for(size_t j = 0; j < n; ++j) {
-            for(int k = 0; k < i; ++k)
-                B[j * stride1 + i * stride2] -= dot[k] * B[j * stride1 + k * stride2];
-            s += B[j * stride1 + i * stride2] * B[j * stride1 + i * stride2];
-        }
-        s = sqrt(s);
-        for(size_t j = 0; j < n; ++j)
-            B[j * stride1 + i * stride2] /= s;
-    }
-
-    return nmodes;
-}
-
-} // namespace coarsening
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/coarsening/ruge_stuben.hpp b/src/solvers/amgcl/coarsening/ruge_stuben.hpp
deleted file mode 100644
index eca2395..0000000
--- a/src/solvers/amgcl/coarsening/ruge_stuben.hpp
+++ /dev/null
@@ -1,458 +0,0 @@
-#ifndef AMGCL_COARSENING_RUGE_STUBEN_HPP
-#define AMGCL_COARSENING_RUGE_STUBEN_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/coarsening/ruge_stuben.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Ruge-Stuben coarsening with direct interpolation.
- */
-
-#include <algorithm>
-#include <numeric>
-
-#include <tuple>
-#include <memory>
-
-#include <amgcl/backend/builtin.hpp>
-#include <amgcl/coarsening/detail/scaled_galerkin.hpp>
-#include <amgcl/util.hpp>
-
-namespace amgcl {
-namespace coarsening {
-
-/// Classic Ruge-Stuben coarsening with direct interpolation.
-/**
- * \ingroup coarsening
- * \sa \cite Stuben1999
- */
-
-template <class Backend>
-struct ruge_stuben {
-    /// Coarsening parameters.
-    struct params {
-        /// Parameter \f$\varepsilon_{str}\f$ defining strong couplings.
-        /**
-         * Variable \f$i\f$ is defined to be strongly negatively coupled to
-         * another variable, \f$j\f$, if \f[-a_{ij} \geq
-         * \varepsilon_{str}\max\limits_{a_{ik}<0}|a_{ik}|\quad \text{with
-         * fixed} \quad 0 < \varepsilon_{str} < 1.\f] In practice, a value of
-         * \f$\varepsilon_{str}=0.25\f$ is usually taken.
-         */
-        float eps_strong;
-
-        /// Truncate prolongation operator?
-        /**
-         * Interpolation operators, and, hence coarse operators may increase
-         * substabtially towards coarser levels. Without truncation, this may
-         * become too costly. Truncation ignores all interpolatory connections
-         * which are smaller (in absolute value) than the largest one by a
-         * factor of \f$\varepsilon_{tr}\f$. The remaining weights are rescaled
-         * so that the total sum remains unchanged. In practice, a value of
-         * \f$\varepsilon_{tr}=0.2\f$ is usually taken.
-         */
-        bool  do_trunc;
-
-        /// Truncation parameter \f$\varepsilon_{tr}\f$.
-        float eps_trunc;
-
-        params() : eps_strong(0.25f), do_trunc(true), eps_trunc(0.2f) {}
-
-#ifndef AMGCL_NO_BOOST
-        params(const boost::property_tree::ptree &p)
-            : AMGCL_PARAMS_IMPORT_VALUE(p, eps_strong),
-              AMGCL_PARAMS_IMPORT_VALUE(p, do_trunc),
-              AMGCL_PARAMS_IMPORT_VALUE(p, eps_trunc)
-        {
-            check_params(p, {"eps_strong", "do_trunc", "eps_trunc"});
-        }
-
-        void get(boost::property_tree::ptree &p, const std::string &path) const {
-            AMGCL_PARAMS_EXPORT_VALUE(p, path, eps_strong);
-            AMGCL_PARAMS_EXPORT_VALUE(p, path, do_trunc);
-            AMGCL_PARAMS_EXPORT_VALUE(p, path, eps_trunc);
-        }
-#endif
-    } prm;
-
-    ruge_stuben(const params &prm = params()) : prm(prm) {}
-
-    /// \copydoc amgcl::coarsening::aggregation::transfer_operators
-    template <class Matrix>
-    std::tuple< std::shared_ptr<Matrix>, std::shared_ptr<Matrix> >
-    transfer_operators(const Matrix &A) const {
-        typedef typename backend::value_type<Matrix>::type Val;
-        typedef typename backend::col_type<Matrix>::type   Col;
-        typedef typename backend::ptr_type<Matrix>::type   Ptr;
-        typedef typename math::scalar_of<Val>::type        Scalar;
-
-        const size_t n = rows(A);
-
-        static const Scalar eps = amgcl::detail::eps<Scalar>(1);
-
-        static const Val zero = math::zero<Val>();
-
-        std::vector<char> cf(n, 'U');
-        backend::crs<char, Col, Ptr> S;
-
-        AMGCL_TIC("C/F split");
-        connect(A, prm.eps_strong, S, cf);
-        cfsplit(A, S, cf);
-        AMGCL_TOC("C/F split");
-
-        AMGCL_TIC("interpolation");
-        size_t nc = 0;
-        std::vector<ptrdiff_t> cidx(n);
-        for(size_t i = 0; i < n; ++i)
-            if (cf[i] == 'C') cidx[i] = static_cast<ptrdiff_t>(nc++);
-
-        if (!nc) throw error::empty_level();
-
-        auto P = std::make_shared<Matrix>();
-        P->set_size(n, nc, true);
-
-        std::vector<Val> Amin, Amax;
-
-        if (prm.do_trunc) {
-            Amin.resize(n);
-            Amax.resize(n);
-        }
-
-#pragma omp parallel for
-        for(ptrdiff_t i = 0; i < static_cast<ptrdiff_t>(n); ++i) {
-            if (cf[i] == 'C') {
-                ++P->ptr[i + 1];
-                continue;
-            }
-
-            if (prm.do_trunc) {
-                Val amin = zero, amax = zero;
-
-                for(ptrdiff_t j = A.ptr[i], e = A.ptr[i + 1]; j < e; ++j) {
-                    if (!S.val[j] || cf[ A.col[j] ] != 'C') continue;
-
-                    amin = std::min(amin, A.val[j]);
-                    amax = std::max(amax, A.val[j]);
-                }
-
-                Amin[i] = (amin *= prm.eps_trunc);
-                Amax[i] = (amax *= prm.eps_trunc);
-
-                for(ptrdiff_t j = A.ptr[i], e = A.ptr[i + 1]; j < e; ++j) {
-                    if (!S.val[j] || cf[A.col[j]] != 'C') continue;
-
-                    if (A.val[j] < amin || amax < A.val[j])
-                        ++P->ptr[i + 1];
-                }
-            } else {
-                for(ptrdiff_t j = A.ptr[i], e = A.ptr[i + 1]; j < e; ++j)
-                    if (S.val[j] && cf[A.col[j]] == 'C')
-                        ++P->ptr[i + 1];
-            }
-        }
-
-        P->set_nonzeros(P->scan_row_sizes());
-
-#pragma omp parallel for
-        for(ptrdiff_t i = 0; i < static_cast<ptrdiff_t>(n); ++i) {
-            ptrdiff_t row_head = P->ptr[i];
-
-            if (cf[i] == 'C') {
-                P->col[row_head] = cidx[i];
-                P->val[row_head] = math::identity<Val>();
-                continue;
-            }
-
-            Val dia   = zero;
-            Val a_num = zero, a_den = zero;
-            Val b_num = zero, b_den = zero;
-            Val d_neg = zero, d_pos = zero;
-
-            for(ptrdiff_t j = A.ptr[i], e = A.ptr[i + 1]; j < e; ++j) {
-                ptrdiff_t c = A.col[j];
-                Val  v = A.val[j];
-
-                if (c == i) {
-                    dia = v;
-                    continue;
-                }
-
-                if (v < zero) {
-                    a_num += v;
-                    if (S.val[j] && cf[c] == 'C') {
-                        a_den += v;
-                        if (prm.do_trunc && Amin[i] < v) d_neg += v;
-                    }
-                } else {
-                    b_num += v;
-                    if (S.val[j] && cf[c] == 'C') {
-                        b_den += v;
-                        if (prm.do_trunc && v < Amax[i]) d_pos += v;
-                    }
-                }
-            }
-
-            Scalar cf_neg = 1;
-            Scalar cf_pos = 1;
-
-            if (prm.do_trunc) {
-                if (math::norm(static_cast<Val>(a_den - d_neg)) > eps)
-                    cf_neg = math::norm(a_den) / math::norm(static_cast<Val>(a_den - d_neg));
-
-                if (math::norm(static_cast<Val>(b_den - d_pos)) > eps)
-                    cf_pos = math::norm(b_den) / math::norm(static_cast<Val>(b_den - d_pos));
-            }
-
-            if (zero < b_num && math::norm(b_den) < eps) dia += b_num;
-
-            Scalar alpha = math::norm(a_den) > eps ? -cf_neg * math::norm(a_num) / (math::norm(dia) * math::norm(a_den)) : 0;
-            Scalar beta  = math::norm(b_den) > eps ? -cf_pos * math::norm(b_num) / (math::norm(dia) * math::norm(b_den)) : 0;
-
-            for(ptrdiff_t j = A.ptr[i], e = A.ptr[i + 1]; j < e; ++j) {
-                ptrdiff_t c = A.col[j];
-                Val  v = A.val[j];
-
-                if (!S.val[j] || cf[c] != 'C') continue;
-                if (prm.do_trunc && Amin[i] <= v && v <= Amax[i]) continue;
-
-                P->col[row_head] = cidx[c];
-                P->val[row_head] = (v < zero ? alpha : beta) * v;
-                ++row_head;
-            }
-        }
-        AMGCL_TOC("interpolation");
-
-        return std::make_tuple(P, transpose(*P));
-    }
-
-    /// \copydoc amgcl::coarsening::aggregation::coarse_operator
-    template <class Matrix>
-    std::shared_ptr<Matrix>
-    coarse_operator(const Matrix &A, const Matrix &P, const Matrix &R) const {
-        return detail::galerkin(A, P, R);
-    }
-
-    private:
-        //-------------------------------------------------------------------
-        // On return S will hold both strong connection matrix (in S.val, which
-        // is piggybacking A.ptr and A.col), and its transposition (in S.ptr
-        // and S.val).
-        //
-        // Variables that have no positive connections are marked as F(ine).
-        //-------------------------------------------------------------------
-        template <typename Val, typename Col, typename Ptr>
-        static void connect(
-                backend::crs<Val,  Col, Ptr> const &A, float eps_strong,
-                backend::crs<char, Col, Ptr>       &S,
-                std::vector<char>                  &cf
-                )
-        {
-            typedef typename math::scalar_of<Val>::type Scalar;
-
-            const size_t n   = rows(A);
-            const size_t nnz = nonzeros(A);
-            const Scalar eps = amgcl::detail::eps<Scalar>(1);
-
-            S.nrows = S.ncols = n;
-            S.ptr = new Ptr[n+1];
-            S.val = new char[nnz];
-            S.ptr[0] = 0;
-
-#pragma omp parallel for
-            for(ptrdiff_t i = 0; i < static_cast<ptrdiff_t>(n); ++i) {
-                S.ptr[i+1] = 0;
-
-                Val a_min = math::zero<Val>();
-
-                for(auto a = row_begin(A, i); a; ++a)
-                    if (a.col() != i) a_min = std::min(a_min, a.value());
-
-                if (math::norm(a_min) < eps) {
-                    cf[i] = 'F';
-                    continue;
-                }
-
-                a_min *= eps_strong;
-
-                for(Ptr j = A.ptr[i], e = A.ptr[i + 1]; j < e; ++j)
-                    S.val[j] = (A.col[j] != i && A.val[j] < a_min);
-            }
-
-            // Transposition of S:
-            for(size_t i = 0; i < nnz; ++i)
-                if (S.val[i]) ++( S.ptr[ A.col[i] + 1] );
-
-            S.scan_row_sizes();
-            S.col = new Col[S.ptr[n]];
-
-            for(size_t i = 0; i < n; ++i)
-                for(Ptr j = A.ptr[i], e = A.ptr[i + 1]; j < e; ++j)
-                    if (S.val[j]) S.col[ S.ptr[ A.col[j] ]++ ] = i;
-
-            std::rotate(S.ptr, S.ptr + n, S.ptr + n + 1);
-            S.ptr[0] = 0;
-        }
-
-        // Split variables into C(oarse) and F(ine) sets.
-        template <typename Val, typename Col, typename Ptr>
-        static void cfsplit(
-                backend::crs<Val,  Col, Ptr> const &A,
-                backend::crs<char, Col, Ptr> const &S,
-                std::vector<char>                  &cf
-                )
-        {
-            const size_t n = rows(A);
-
-            std::vector<Col> lambda(n);
-
-            // Initialize lambdas:
-            for(size_t i = 0; i < n; ++i) {
-                Col temp = 0;
-                for(Ptr j = S.ptr[i], e = S.ptr[i+1]; j < e; ++j)
-                    temp += ( cf[ S.col[j] ] == 'U' ? 1 : 2 );
-                lambda[i] = temp;
-            }
-
-            // Keep track of variable groups with equal lambda values.
-            // ptr - start of a group;
-            // cnt - size of a group;
-            // i2n - variable number;
-            // n2i - vaiable position in a group.
-            std::vector<Ptr> ptr(n+1, 0);
-            std::vector<Ptr> cnt(n, 0);
-            std::vector<Ptr> i2n(n);
-            std::vector<Ptr> n2i(n);
-
-            for(size_t i = 0; i < n; ++i) ++ptr[lambda[i] + 1];
-
-            std::partial_sum(ptr.begin(), ptr.end(), ptr.begin());
-
-            for(size_t i = 0; i < n; ++i) {
-                Col lam = lambda[i];
-                Ptr idx = ptr[lam] + cnt[lam]++;
-                i2n[idx] = i;
-                n2i[i] = idx;
-            }
-
-            // Process variables by decreasing lambda value.
-            // 1. The vaiable with maximum value of lambda becomes next C-variable.
-            // 2. Its neighbours from S' become F-variables.
-            // 3. Keep lambda values in sync.
-            for(size_t top = n; top-- > 0; ) {
-                Ptr i   = i2n[top];
-                Col lam = lambda[i];
-
-                if (lam == 0) {
-                    std::replace(cf.begin(), cf.end(), 'U', 'C');
-                    break;
-                }
-
-                // Remove tne variable from its group.
-                --cnt[lam];
-
-                if (cf[i] == 'F') continue;
-
-                // Mark the variable as 'C'.
-                cf[i] = 'C';
-
-                // Its neighbours from S' become F-variables.
-                for(Ptr j = S.ptr[i], e = S.ptr[i + 1]; j < e; ++j) {
-                    Col c = S.col[j];
-
-                    if (cf[c] != 'U') continue;
-
-                    cf[c] = 'F';
-
-                    // Increase lambdas of the newly created F's neighbours.
-                    for(Ptr aj = A.ptr[c], ae = A.ptr[c + 1]; aj < ae; ++aj) {
-                        if (!S.val[aj]) continue;
-
-                        Col ac    = A.col[aj];
-                        Col lam_a = lambda[ac];
-
-                        if (cf[ac] != 'U' || static_cast<size_t>(lam_a) + 1 >= n)
-                            continue;
-
-                        Ptr old_pos = n2i[ac];
-                        Ptr new_pos = ptr[lam_a] + cnt[lam_a] - 1;
-
-                        n2i[i2n[old_pos]] = new_pos;
-                        n2i[i2n[new_pos]] = old_pos;
-
-                        std::swap(i2n[old_pos], i2n[new_pos]);
-
-                        --cnt[lam_a];
-                        ++cnt[lam_a + 1];
-                        ptr[lam_a + 1] = ptr[lam_a] + cnt[lam_a];
-
-                        lambda[ac] = lam_a + 1;
-                    }
-                }
-
-                // Decrease lambdas of the newly create C's neighbours.
-                for(Ptr j = A.ptr[i], e = A.ptr[i + 1]; j < e; j++) {
-                    if (!S.val[j]) continue;
-
-                    Col c   = A.col[j];
-                    Col lam = lambda[c];
-
-                    if (cf[c] != 'U' || lam == 0) continue;
-
-                    Ptr old_pos = n2i[c];
-                    Ptr new_pos = ptr[lam];
-
-                    n2i[i2n[old_pos]] = new_pos;
-                    n2i[i2n[new_pos]] = old_pos;
-
-                    std::swap(i2n[old_pos], i2n[new_pos]);
-
-                    --cnt[lam];
-                    ++cnt[lam - 1];
-                    ++ptr[lam];
-                    lambda[c] = lam - 1;
-                }
-            }
-        }
-};
-
-} // namespace coarsening
-
-namespace backend {
-
-template <class Backend>
-struct coarsening_is_supported<
-    Backend,
-    coarsening::ruge_stuben,
-    typename std::enable_if<
-        !std::is_arithmetic<typename backend::value_type<Backend>::type>::value
-        >::type
-    > : std::false_type
-{};
-
-} // namespace backend
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/coarsening/runtime.hpp b/src/solvers/amgcl/coarsening/runtime.hpp
deleted file mode 100644
index c801dde..0000000
--- a/src/solvers/amgcl/coarsening/runtime.hpp
+++ /dev/null
@@ -1,299 +0,0 @@
-#ifndef AMGCL_COARSENING_RUNTIME_HPP
-#define AMGCL_COARSENING_RUNTIME_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/coarsening/runtime.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Runtime-configurable coarsening.
- */
-
-#include <iostream>
-#include <stdexcept>
-#include <type_traits>
-
-#ifdef AMGCL_NO_BOOST
-#  error Runtime interface relies on Boost.PropertyTree!
-#endif
-
-#include <boost/property_tree/ptree.hpp>
-
-#include <amgcl/util.hpp>
-#include <amgcl/backend/interface.hpp>
-#include <amgcl/coarsening/ruge_stuben.hpp>
-#include <amgcl/coarsening/aggregation.hpp>
-#include <amgcl/coarsening/smoothed_aggregation.hpp>
-#include <amgcl/coarsening/smoothed_aggr_emin.hpp>
-#include <amgcl/coarsening/as_scalar.hpp>
-
-namespace amgcl {
-namespace runtime {
-
-/// Coarsening kinds.
-namespace coarsening {
-
-enum type {
-    ruge_stuben,            ///< Ruge-Stueben coarsening
-    aggregation,            ///< Aggregation
-    smoothed_aggregation,   ///< Smoothed aggregation
-    smoothed_aggr_emin      ///< Smoothed aggregation with energy minimization
-};
-
-inline std::ostream& operator<<(std::ostream &os, type c) {
-    switch (c) {
-        case ruge_stuben:
-            return os << "ruge_stuben";
-        case aggregation:
-            return os << "aggregation";
-        case smoothed_aggregation:
-            return os << "smoothed_aggregation";
-        case smoothed_aggr_emin:
-            return os << "smoothed_aggr_emin";
-        default:
-            return os << "???";
-    }
-}
-
-inline std::istream& operator>>(std::istream &in, type &c)
-{
-    std::string val;
-    in >> val;
-
-    if (val == "ruge_stuben")
-        c = ruge_stuben;
-    else if (val == "aggregation")
-        c = aggregation;
-    else if (val == "smoothed_aggregation")
-        c = smoothed_aggregation;
-    else if (val == "smoothed_aggr_emin")
-        c = smoothed_aggr_emin;
-    else
-        throw std::invalid_argument("Invalid coarsening value. Valid choices are: "
-                "ruge_stuben, aggregation, smoothed_aggregation, smoothed_aggr_emin.");
-
-    return in;
-}
-
-template <class Backend>
-struct wrapper {
-    typedef boost::property_tree::ptree params;
-    type c;
-    bool as_scalar;
-    void *handle;
-
-    wrapper(params prm = params())
-        : c(prm.get("type", runtime::coarsening::smoothed_aggregation)),
-          handle(0)
-    {
-        if (!prm.erase("type")) AMGCL_PARAM_MISSING("type");
-
-        typedef typename backend::value_type<Backend>::type value_type;
-        const bool block_value_type = math::static_rows<value_type>::value > 1;
-
-        as_scalar = (
-                block_value_type &&
-                c != ruge_stuben &&
-                prm.get("nullspace.cols", 0) > 0
-                );
-
-        switch(c) {
-
-#define AMGCL_RUNTIME_COARSENING(t) \
-            case t: \
-                if (as_scalar) { \
-                    handle = call_constructor<amgcl::coarsening::as_scalar<amgcl::coarsening::t>::type>(prm); \
-                } else { \
-                    handle = call_constructor<amgcl::coarsening::t>(prm); \
-                } \
-                break
-
-            AMGCL_RUNTIME_COARSENING(ruge_stuben);
-            AMGCL_RUNTIME_COARSENING(aggregation);
-            AMGCL_RUNTIME_COARSENING(smoothed_aggregation);
-            AMGCL_RUNTIME_COARSENING(smoothed_aggr_emin);
-
-#undef AMGCL_RUNTIME_COARSENING
-
-            default:
-                throw std::invalid_argument("Unsupported coarsening type");
-        }
-    }
-
-    ~wrapper() {
-        switch(c) {
-
-#define AMGCL_RUNTIME_COARSENING(t) \
-            case t: \
-                if (as_scalar) { \
-                    call_destructor<amgcl::coarsening::as_scalar<amgcl::coarsening::t>::type>(); \
-                } else { \
-                    call_destructor<amgcl::coarsening::t>(); \
-                } \
-                break
-
-            AMGCL_RUNTIME_COARSENING(ruge_stuben);
-            AMGCL_RUNTIME_COARSENING(aggregation);
-            AMGCL_RUNTIME_COARSENING(smoothed_aggregation);
-            AMGCL_RUNTIME_COARSENING(smoothed_aggr_emin);
-
-#undef AMGCL_RUNTIME_COARSENING
-        }
-    }
-
-    template <class Matrix>
-    std::tuple<
-        std::shared_ptr<Matrix>,
-        std::shared_ptr<Matrix>
-        >
-    transfer_operators(const Matrix &A) {
-        switch(c) {
-
-#define AMGCL_RUNTIME_COARSENING(t) \
-            case t: \
-                if (as_scalar) { \
-                    return make_operators<amgcl::coarsening::as_scalar<amgcl::coarsening::t>::type>(A); \
-                } \
-                return make_operators<amgcl::coarsening::t>(A)
-
-            AMGCL_RUNTIME_COARSENING(ruge_stuben);
-            AMGCL_RUNTIME_COARSENING(aggregation);
-            AMGCL_RUNTIME_COARSENING(smoothed_aggregation);
-            AMGCL_RUNTIME_COARSENING(smoothed_aggr_emin);
-
-#undef AMGCL_RUNTIME_COARSENING
-
-            default:
-                throw std::invalid_argument("Unsupported coarsening type");
-        }
-    }
-
-    template <class Matrix>
-    std::shared_ptr<Matrix>
-    coarse_operator(const Matrix &A, const Matrix &P, const Matrix &R) const {
-        switch(c) {
-
-#define AMGCL_RUNTIME_COARSENING(t) \
-            case t: \
-                if (as_scalar) { \
-                    return make_coarse<amgcl::coarsening::as_scalar<amgcl::coarsening::t>::type>(A, P, R); \
-                } \
-                return make_coarse<amgcl::coarsening::t>(A, P, R)
-
-            AMGCL_RUNTIME_COARSENING(ruge_stuben);
-            AMGCL_RUNTIME_COARSENING(aggregation);
-            AMGCL_RUNTIME_COARSENING(smoothed_aggregation);
-            AMGCL_RUNTIME_COARSENING(smoothed_aggr_emin);
-
-#undef AMGCL_RUNTIME_COARSENING
-
-            default:
-                throw std::invalid_argument("Unsupported coarsening type");
-        }
-    }
-
-    template <template <class> class Coarsening>
-    typename std::enable_if<
-        backend::coarsening_is_supported<Backend, Coarsening>::value,
-        void*
-    >::type
-    call_constructor(const params &prm) {
-        return static_cast<void*>(new Coarsening<Backend>(prm));
-    }
-
-    template <template <class> class Coarsening>
-    typename std::enable_if<
-        !backend::coarsening_is_supported<Backend, Coarsening>::value,
-        void*
-    >::type
-    call_constructor(const params&) {
-        throw std::logic_error("The coarsening is not supported by the backend");
-    }
-
-    template <template <class> class Coarsening>
-    typename std::enable_if<
-        backend::coarsening_is_supported<Backend, Coarsening>::value,
-        void
-    >::type
-    call_destructor() {
-        delete static_cast<Coarsening<Backend>*>(handle);
-    }
-
-    template <template <class> class Coarsening>
-    typename std::enable_if<
-        !backend::coarsening_is_supported<Backend, Coarsening>::value,
-        void
-    >::type
-    call_destructor() {
-    }
-
-    template <template <class> class Coarsening, class Matrix>
-    typename std::enable_if<
-        backend::coarsening_is_supported<Backend, Coarsening>::value,
-        std::tuple<
-            std::shared_ptr<Matrix>,
-            std::shared_ptr<Matrix>
-            >
-    >::type
-    make_operators(const Matrix &A) const {
-        return static_cast<Coarsening<Backend>*>(handle)->transfer_operators(A);
-    }
-
-    template <template <class> class Coarsening, class Matrix>
-    typename std::enable_if<
-        !backend::coarsening_is_supported<Backend, Coarsening>::value,
-        std::tuple<
-            std::shared_ptr<Matrix>,
-            std::shared_ptr<Matrix>
-            >
-    >::type
-    make_operators(const Matrix&) {
-        throw std::logic_error("The coarsening is not supported by the backend");
-    }
-
-    template <template <class> class Coarsening, class Matrix>
-    typename std::enable_if<
-        backend::coarsening_is_supported<Backend, Coarsening>::value,
-        std::shared_ptr<Matrix>
-    >::type
-    make_coarse(const Matrix &A, const Matrix &P, const Matrix &R) const {
-        return static_cast<Coarsening<Backend>*>(handle)->coarse_operator(A, P, R);
-    }
-
-    template <template <class> class Coarsening, class Matrix>
-    typename std::enable_if<
-        !backend::coarsening_is_supported<Backend, Coarsening>::value,
-        std::shared_ptr<Matrix>
-    >::type
-    make_coarse(const Matrix&, const Matrix&, const Matrix&) const {
-        throw std::logic_error("The coarsening is not supported by the backend");
-    }
-};
-
-} // namespace coarsening
-} // namespace runtime
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/coarsening/smoothed_aggr_emin.hpp b/src/solvers/amgcl/coarsening/smoothed_aggr_emin.hpp
deleted file mode 100644
index 9ea533a..0000000
--- a/src/solvers/amgcl/coarsening/smoothed_aggr_emin.hpp
+++ /dev/null
@@ -1,363 +0,0 @@
-#ifndef AMGCL_COARSENING_SMOOTHED_AGGR_EMIN_HPP
-#define AMGCL_COARSENING_SMOOTHED_AGGR_EMIN_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/coarsening/smoothed_aggr_emin.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Smoothed aggregation with energy minimization coarsening.
- */
-
-#include <limits>
-
-#include <tuple>
-#include <memory>
-
-#include <amgcl/backend/builtin.hpp>
-#include <amgcl/coarsening/detail/galerkin.hpp>
-#include <amgcl/coarsening/pointwise_aggregates.hpp>
-#include <amgcl/coarsening/tentative_prolongation.hpp>
-#include <amgcl/util.hpp>
-#include <amgcl/detail/sort_row.hpp>
-
-namespace amgcl {
-namespace coarsening {
-
-/// Smoothed aggregation with energy minimization.
-/**
- * \ingroup coarsening
- * \sa \cite Sala2008
- */
-template <class Backend>
-struct smoothed_aggr_emin {
-    typedef pointwise_aggregates Aggregates;
-
-    /// Coarsening parameters.
-    struct params {
-        /// Aggregation parameters.
-        Aggregates::params aggr;
-
-        /// Near nullspace parameters.
-        nullspace_params nullspace;
-
-        params() {}
-
-#ifndef AMGCL_NO_BOOST
-        params(const boost::property_tree::ptree &p)
-            : AMGCL_PARAMS_IMPORT_CHILD(p, aggr),
-              AMGCL_PARAMS_IMPORT_CHILD(p, nullspace)
-        {
-            check_params(p, {"aggr", "nullspace"});
-        }
-
-        void get(boost::property_tree::ptree &p, const std::string &path) const {
-            AMGCL_PARAMS_EXPORT_CHILD(p, path, aggr);
-            AMGCL_PARAMS_EXPORT_CHILD(p, path, nullspace);
-        }
-#endif
-    } prm;
-
-    smoothed_aggr_emin(const params &prm = params()) : prm(prm) {}
-
-    /// \copydoc amgcl::coarsening::aggregation::transfer_operators
-    template <class Matrix>
-    std::tuple<
-        std::shared_ptr<Matrix>,
-        std::shared_ptr<Matrix>
-        >
-    transfer_operators(const Matrix &A) {
-        typedef typename backend::value_type<Matrix>::type Val;
-        typedef typename backend::col_type<Matrix>::type   Col;
-        typedef typename backend::ptr_type<Matrix>::type   Ptr;
-        typedef ptrdiff_t Idx;
-
-        AMGCL_TIC("aggregates");
-        Aggregates aggr(A, prm.aggr, prm.nullspace.cols);
-        prm.aggr.eps_strong *= 0.5;
-        AMGCL_TOC("aggregates");
-
-        AMGCL_TIC("interpolation");
-        auto P_tent = tentative_prolongation<Matrix>(
-                rows(A), aggr.count, aggr.id, prm.nullspace, prm.aggr.block_size
-                );
-
-        // Filter the system matrix
-        backend::crs<Val, Col, Ptr> Af;
-        Af.set_size(rows(A), cols(A));
-        Af.ptr[0] = 0;
-
-        std::vector<Val> dia(Af.nrows);
-
-#pragma omp parallel for
-        for(Idx i = 0; i < static_cast<Idx>(Af.nrows); ++i) {
-            Idx row_begin = A.ptr[i];
-            Idx row_end   = A.ptr[i+1];
-            Idx row_width = row_end - row_begin;
-
-            Val D = math::zero<Val>();
-            for(Idx j = row_begin; j < row_end; ++j) {
-                Idx c = A.col[j];
-                Val v = A.val[j];
-
-                if (c == i)
-                    D += v;
-                else if (!aggr.strong_connection[j]) {
-                    D += v;
-                    --row_width;
-                }
-            }
-
-            dia[i] = D;
-            Af.ptr[i+1] = row_width;
-        }
-
-        Af.set_nonzeros(Af.scan_row_sizes());
-
-#pragma omp parallel for
-        for(Idx i = 0; i < static_cast<Idx>(Af.nrows); ++i) {
-            Idx row_begin = A.ptr[i];
-            Idx row_end   = A.ptr[i+1];
-            Idx row_head  = Af.ptr[i];
-
-            for(Idx j = row_begin; j < row_end; ++j) {
-                Idx c = A.col[j];
-
-                if (c == i) {
-                    Af.col[row_head] = i;
-                    Af.val[row_head] = dia[i];
-                    ++row_head;
-                } else if (aggr.strong_connection[j]) {
-                    Af.col[row_head] = c;
-                    Af.val[row_head] = A.val[j];
-                    ++row_head;
-                }
-            }
-        }
-
-        std::vector<Val> omega;
-
-        auto P = interpolation(Af, dia, *P_tent, omega);
-        auto R = restriction  (Af, dia, *P_tent, omega);
-        AMGCL_TOC("interpolation");
-
-        return std::make_tuple(P, R);
-    }
-
-    template <class Matrix>
-    std::shared_ptr<Matrix>
-    coarse_operator(const Matrix &A, const Matrix &P, const Matrix &R) const {
-        return detail::galerkin(A, P, R);
-    }
-
-    private:
-        template <class AMatrix, typename Val, typename Col, typename Ptr>
-        static std::shared_ptr< backend::crs<Val, Col, Ptr> >
-        interpolation(
-                const AMatrix &A, const std::vector<Val> &Adia,
-                const backend::crs<Val, Col, Ptr> &P_tent,
-                std::vector<Val> &omega
-                )
-        {
-            const size_t n  = rows(P_tent);
-            const size_t nc = cols(P_tent);
-
-            auto AP = product(A, P_tent, /*sort rows: */true);
-
-            omega.resize(nc, math::zero<Val>());
-            std::vector<Val> denum(nc, math::zero<Val>());
-
-#pragma omp parallel
-            {
-                std::vector<ptrdiff_t> marker(nc, -1);
-
-                // Compute A * Dinv * AP row by row and compute columnwise
-                // scalar products necessary for computation of omega. The
-                // actual results of matrix-matrix product are not stored.
-                std::vector<Col> adap_col(128);
-                std::vector<Val> adap_val(128);
-
-#pragma omp for
-                for(ptrdiff_t ia = 0; ia < static_cast<ptrdiff_t>(n); ++ia) {
-                    adap_col.clear();
-                    adap_val.clear();
-
-                    // Form current row of ADAP matrix.
-                    for(auto a = A.row_begin(ia); a; ++a) {
-                        Col ca  = a.col();
-                        Val va  = math::inverse(Adia[ca]) * a.value();
-
-                        for(auto p = AP->row_begin(ca); p; ++p) {
-                            Col c = p.col();
-                            Val v = va * p.value();
-
-                            if (marker[c] < 0) {
-                                marker[c] = adap_col.size();
-                                adap_col.push_back(c);
-                                adap_val.push_back(v);
-                            } else {
-                                adap_val[marker[c]] += v;
-                            }
-                        }
-                    }
-
-                    amgcl::detail::sort_row(
-                            &adap_col[0], &adap_val[0], adap_col.size()
-                            );
-
-                    // Update columnwise scalar products (AP,ADAP) and (ADAP,ADAP).
-                    // 1. (AP, ADAP)
-                    for(
-                            Ptr ja = AP->ptr[ia], ea = AP->ptr[ia + 1],
-                            jb = 0, eb = adap_col.size();
-                            ja < ea && jb < eb;
-                       )
-                    {
-                        Col ca = AP->col[ja];
-                        Col cb = adap_col[jb];
-
-                        if (ca < cb)
-                            ++ja;
-                        else if (cb < ca)
-                            ++jb;
-                        else /*ca == cb*/ {
-                            Val v = AP->val[ja] * adap_val[jb];
-#pragma omp critical
-                            omega[ca] += v;
-                            ++ja;
-                            ++jb;
-                        }
-                    }
-
-                    // 2. (ADAP, ADAP) (and clear marker)
-                    for(size_t j = 0, e = adap_col.size(); j < e; ++j) {
-                        Col c = adap_col[j];
-                        Val v = adap_val[j];
-#pragma omp critical
-                        denum[c] += v * v;
-                        marker[c] = -1;
-                    }
-                }
-            }
-
-            for(size_t i = 0, m = omega.size(); i < m; ++i)
-                omega[i] = math::inverse(denum[i]) * omega[i];
-
-            // Update AP to obtain P: P = (P_tent - D^-1 A P Omega)
-            /*
-             * Here we use the fact that if P(i,j) != 0,
-             * then with necessity AP(i,j) != 0:
-             *
-             * AP(i,j) = sum_k(A_ik P_kj), and A_ii != 0.
-             */
-#pragma omp parallel for
-            for(ptrdiff_t i = 0; i < static_cast<ptrdiff_t>(n); ++i) {
-                Val dia = math::inverse(Adia[i]);
-
-                for(Ptr ja = AP->ptr[i],    ea = AP->ptr[i+1],
-                        jp = P_tent.ptr[i], ep = P_tent.ptr[i+1];
-                        ja < ea; ++ja
-                   )
-                {
-                    Col ca = AP->col[ja];
-                    Val va = -dia * AP->val[ja] * omega[ca];
-
-                    for(; jp < ep; ++jp) {
-                        Col cp = P_tent.col[jp];
-                        if (cp > ca)
-                            break;
-
-                        if (cp == ca) {
-                            va += P_tent.val[jp];
-                            break;
-                        }
-                    }
-
-                    AP->val[ja] = va;
-                }
-            }
-
-            return AP;
-        }
-
-        template <typename AMatrix, typename Val, typename Col, typename Ptr>
-        static std::shared_ptr< backend::crs<Val, Col, Ptr> >
-        restriction(
-                const AMatrix &A, const std::vector<Val> &Adia,
-                const backend::crs<Val, Col, Ptr> &P_tent,
-                const std::vector<Val> &omega
-                )
-        {
-            const size_t nc = cols(P_tent);
-
-            auto R_tent = transpose(P_tent);
-            sort_rows(*R_tent);
-
-            auto RA = product(*R_tent, A, /*sort rows: */true);
-
-            // Compute R = R_tent - Omega R_tent A D^-1.
-            /*
-             * Here we use the fact that if R(i,j) != 0,
-             * then with necessity RA(i,j) != 0:
-             *
-             * RA(i,j) = sum_k(R_ik A_kj), and A_jj != 0.
-             */
-#pragma omp parallel for
-            for(ptrdiff_t i = 0; i < static_cast<ptrdiff_t>(nc); ++i) {
-                Val w = omega[i];
-
-                for(Ptr ja = RA->ptr[i],     ea = RA->ptr[i+1],
-                        jr = R_tent->ptr[i], er = R_tent->ptr[i+1];
-                        ja < ea; ++ja
-                   )
-                {
-                    Col ca = RA->col[ja];
-                    Val va = -w * math::inverse(Adia[ca]) * RA->val[ja];
-
-                    for(; jr < er; ++jr) {
-                        Col cr = R_tent->col[jr];
-                        if (cr > ca)
-                            break;
-
-                        if (cr == ca) {
-                            va += R_tent->val[jr];
-                            break;
-                        }
-                    }
-
-                    RA->val[ja] = va;
-                }
-            }
-
-            return RA;
-        }
-};
-
-} // namespace coarsening
-} // namespace amgcl
-
-
-
-#endif
diff --git a/src/solvers/amgcl/coarsening/smoothed_aggregation.hpp b/src/solvers/amgcl/coarsening/smoothed_aggregation.hpp
deleted file mode 100644
index 7953733..0000000
--- a/src/solvers/amgcl/coarsening/smoothed_aggregation.hpp
+++ /dev/null
@@ -1,248 +0,0 @@
-#ifndef AMGCL_COARSENING_SMOOTHED_AGGREGATION_HPP
-#define AMGCL_COARSENING_SMOOTHED_AGGREGATION_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/coarsening/smoothed_aggregation.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Smoothed aggregation coarsening scheme.
- */
-
-#ifdef _OPENMP
-#  include <omp.h>
-#endif
-
-#include <tuple>
-#include <memory>
-
-#include <amgcl/backend/builtin.hpp>
-#include <amgcl/coarsening/detail/galerkin.hpp>
-#include <amgcl/coarsening/pointwise_aggregates.hpp>
-#include <amgcl/coarsening/tentative_prolongation.hpp>
-#include <amgcl/util.hpp>
-
-namespace amgcl {
-namespace coarsening {
-
-/// Smoothed aggregation coarsening.
-/**
- * \ingroup coarsening
- * \sa \cite Vanek1996
- */
-template <class Backend>
-struct smoothed_aggregation {
-    typedef pointwise_aggregates Aggregates;
-
-    /// Coarsening parameters
-    struct params {
-        /// Aggregation parameters.
-        Aggregates::params aggr;
-
-        /// Near nullspace parameters.
-        nullspace_params nullspace;
-
-        /// Relaxation factor.
-        /**
-         * Used as a scaling for the damping factor omega.
-         * When estimate_spectral_radius is set, then
-         *   omega = relax * (4/3) / rho.
-         * Otherwise
-         *   omega = relax * (2/3).
-         *
-         * Piecewise constant prolongation \f$\tilde P\f$ from non-smoothed
-         * aggregation is improved by a smoothing to get the final prolongation
-         * matrix \f$P\f$. Simple Jacobi smoother is used here, giving the
-         * prolongation matrix
-         * \f[P = \left( I - \omega D^{-1} A^F \right) \tilde P.\f]
-         * Here \f$A^F = (a_{ij}^F)\f$ is the filtered matrix given by
-         * \f[
-         * a_{ij}^F =
-         * \begin{cases}
-         * a_{ij} \quad \text{if} \; j \in N_i\\
-         * 0 \quad \text{otherwise}
-         * \end{cases}, \quad \text{if}\; i \neq j,
-         * \quad a_{ii}^F = a_{ii} - \sum\limits_{j=1,j\neq i}^n
-         * \left(a_{ij} - a_{ij}^F \right),
-         * \f]
-         * where \f$N_i\f$ is the set of variables, strongly coupled to
-         * variable \f$i\f$, and \f$D\f$ denotes the diagonal of \f$A^F\f$.
-         */
-        float relax;
-
-        // Estimate the matrix spectral radius.
-        // This usually improves convergence rate and results in faster solves,
-        // but costs some time during setup.
-        bool estimate_spectral_radius;
-
-        // Number of power iterations to apply for the spectral radius
-        // estimation. Use Gershgorin disk theorem when power_iters = 0.
-        int power_iters;
-
-        params() : relax(1.0f), estimate_spectral_radius(false), power_iters(0) { }
-
-#ifndef AMGCL_NO_BOOST
-        params(const boost::property_tree::ptree &p)
-            : AMGCL_PARAMS_IMPORT_CHILD(p, aggr),
-              AMGCL_PARAMS_IMPORT_CHILD(p, nullspace),
-              AMGCL_PARAMS_IMPORT_VALUE(p, relax),
-              AMGCL_PARAMS_IMPORT_VALUE(p, estimate_spectral_radius),
-              AMGCL_PARAMS_IMPORT_VALUE(p, power_iters)
-        {
-            check_params(p, {"aggr", "nullspace", "relax", "estimate_spectral_radius", "power_iters"});
-        }
-
-        void get(boost::property_tree::ptree &p, const std::string &path) const {
-            AMGCL_PARAMS_EXPORT_CHILD(p, path, aggr);
-            AMGCL_PARAMS_EXPORT_CHILD(p, path, nullspace);
-            AMGCL_PARAMS_EXPORT_VALUE(p, path, relax);
-            AMGCL_PARAMS_EXPORT_VALUE(p, path, estimate_spectral_radius);
-            AMGCL_PARAMS_EXPORT_VALUE(p, path, power_iters);
-        }
-#endif
-    } prm;
-
-    smoothed_aggregation(const params &prm = params()) : prm(prm) {}
-
-    /// \copydoc amgcl::coarsening::aggregation::transfer_operators
-    template <class Matrix>
-    std::tuple< std::shared_ptr<Matrix>, std::shared_ptr<Matrix> >
-    transfer_operators(const Matrix &A) {
-        typedef typename backend::value_type<Matrix>::type value_type;
-        typedef typename math::scalar_of<value_type>::type scalar_type;
-
-        const size_t n = rows(A);
-
-        AMGCL_TIC("aggregates");
-        Aggregates aggr(A, prm.aggr, prm.nullspace.cols);
-        prm.aggr.eps_strong *= 0.5;
-        AMGCL_TOC("aggregates");
-
-        auto P_tent = tentative_prolongation<Matrix>(
-                n, aggr.count, aggr.id, prm.nullspace, prm.aggr.block_size
-                );
-
-        auto P = std::make_shared<Matrix>();
-        P->set_size(rows(*P_tent), cols(*P_tent), true);
-
-        scalar_type omega = prm.relax;
-        if (prm.estimate_spectral_radius) {
-            omega *= static_cast<scalar_type>(4.0/3) / backend::spectral_radius<true>(A, prm.power_iters);
-        } else {
-            omega *= static_cast<scalar_type>(2.0/3);
-        }
-
-        AMGCL_TIC("smoothing");
-#pragma omp parallel
-        {
-            std::vector<ptrdiff_t> marker(P->ncols, -1);
-
-            // Count number of entries in P.
-#pragma omp for
-            for(ptrdiff_t i = 0; i < static_cast<ptrdiff_t>(n); ++i) {
-                for(ptrdiff_t ja = A.ptr[i], ea = A.ptr[i+1]; ja < ea; ++ja) {
-                    ptrdiff_t ca = A.col[ja];
-
-                    // Skip weak off-diagonal connections.
-                    if (ca != i && !aggr.strong_connection[ja])
-                        continue;
-
-                    for(ptrdiff_t jp = P_tent->ptr[ca], ep = P_tent->ptr[ca+1]; jp < ep; ++jp) {
-                        ptrdiff_t cp = P_tent->col[jp];
-
-                        if (marker[cp] != i) {
-                            marker[cp] = i;
-                            ++( P->ptr[i + 1] );
-                        }
-                    }
-                }
-            }
-        }
-
-        P->scan_row_sizes();
-        P->set_nonzeros();
-
-#pragma omp parallel
-        {
-            std::vector<ptrdiff_t> marker(P->ncols, -1);
-
-            // Fill the interpolation matrix.
-#pragma omp for
-            for(ptrdiff_t i = 0; i < static_cast<ptrdiff_t>(n); ++i) {
-
-                // Diagonal of the filtered matrix is the original matrix
-                // diagonal minus its weak connections.
-                value_type dia = math::zero<value_type>();
-                for(ptrdiff_t j = A.ptr[i], e = A.ptr[i+1]; j < e; ++j) {
-                    if (A.col[j] == i || !aggr.strong_connection[j])
-                        dia += A.val[j];
-                }
-                if (!math::is_zero(dia)) dia = -omega * math::inverse(dia);
-
-                ptrdiff_t row_beg = P->ptr[i];
-                ptrdiff_t row_end = row_beg;
-                for(ptrdiff_t ja = A.ptr[i], ea = A.ptr[i + 1]; ja < ea; ++ja) {
-                    ptrdiff_t ca = A.col[ja];
-
-                    // Skip weak off-diagonal connections.
-                    if (ca != i && !aggr.strong_connection[ja]) continue;
-
-                    value_type va = (ca == i)
-                        ? static_cast<value_type>(static_cast<scalar_type>(1 - omega) * math::identity<value_type>())
-                        : dia * A.val[ja];
-
-                    for(ptrdiff_t jp = P_tent->ptr[ca], ep = P_tent->ptr[ca+1]; jp < ep; ++jp) {
-                        ptrdiff_t cp = P_tent->col[jp];
-                        value_type vp = P_tent->val[jp];
-
-                        if (marker[cp] < row_beg) {
-                            marker[cp] = row_end;
-                            P->col[row_end] = cp;
-                            P->val[row_end] = va * vp;
-                            ++row_end;
-                        } else {
-                            P->val[ marker[cp] ] += va * vp;
-                        }
-                    }
-                }
-            }
-        }
-        AMGCL_TOC("smoothing");
-
-        return std::make_tuple(P, transpose(*P));
-    }
-
-    /// \copydoc amgcl::coarsening::aggregation::coarse_operator
-    template <class Matrix>
-    std::shared_ptr<Matrix>
-    coarse_operator(const Matrix &A, const Matrix &P, const Matrix &R) const {
-        return detail::galerkin(A, P, R);
-    }
-};
-
-} // namespace coarsening
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/coarsening/tentative_prolongation.hpp b/src/solvers/amgcl/coarsening/tentative_prolongation.hpp
deleted file mode 100644
index 6b235d6..0000000
--- a/src/solvers/amgcl/coarsening/tentative_prolongation.hpp
+++ /dev/null
@@ -1,233 +0,0 @@
-#ifndef AMGCL_COARSENING_TENTATIVE_PROLONGATION_HPP
-#define AMGCL_COARSENING_TENTATIVE_PROLONGATION_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/coarsening/tentative_prolongation.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Tentative prolongation operator for aggregated AMG.
- */
-
-#include <vector>
-#include <algorithm>
-
-#include <memory>
-
-#include <amgcl/backend/builtin.hpp>
-#include <amgcl/detail/qr.hpp>
-
-namespace amgcl {
-namespace coarsening {
-namespace detail {
-    struct skip_negative {
-        const std::vector<ptrdiff_t> &key;
-        int block_size;
-
-        skip_negative(const std::vector<ptrdiff_t> &key, int block_size)
-            : key(key), block_size(block_size) { }
-
-        bool operator()(ptrdiff_t i, ptrdiff_t j) const {
-            // Cast to unsigned type to keep negative values at the end
-            return
-                static_cast<size_t>(key[i]) / block_size <
-                static_cast<size_t>(key[j]) / block_size;
-        }
-    };
-} // namespace detail
-
-
-//---------------------------------------------------------------------------
-struct nullspace_params {
-    /// Number of vectors in near nullspace.
-    int cols;
-
-    /// Near nullspace vectors.
-    /**
-     * The vectors are represented as columns of a 2D matrix stored in
-     * row-major order.
-     */
-    std::vector<double> B;
-
-    nullspace_params() : cols(0) {}
-
-#ifndef AMGCL_NO_BOOST
-    nullspace_params(const boost::property_tree::ptree &p)
-        : cols(p.get("cols", nullspace_params().cols))
-    {
-        double *b = 0;
-        b = p.get("B", b);
-
-        if (b) {
-            size_t rows = 0;
-            rows = p.get("rows", rows);
-
-            precondition(cols > 0,
-                    "Error in nullspace parameters: "
-                    "B is set, but cols is not"
-                    );
-
-            precondition(rows > 0,
-                    "Error in nullspace parameters: "
-                    "B is set, but rows is not"
-                    );
-
-            B.assign(b, b + rows * cols);
-        } else {
-            precondition(cols == 0,
-                    "Error in nullspace parameters: "
-                    "cols > 0, but B is empty"
-                    );
-        }
-
-        check_params(p, {"cols", "rows", "B"});
-    }
-
-    void get(boost::property_tree::ptree&, const std::string&) const {}
-#endif
-};
-
-/// Tentative prolongation operator
-/**
- * If near nullspace vectors are not provided, returns piecewise-constant
- * prolongation operator. If user provides near nullspace vectors, those are
- * used to improve the prolongation operator.
- * \see \cite Vanek2001
- */
-template <class Matrix>
-std::shared_ptr<Matrix> tentative_prolongation(
-        size_t n,
-        size_t naggr,
-        const std::vector<ptrdiff_t> aggr,
-        nullspace_params &nullspace,
-        int block_size
-        )
-{
-    typedef typename backend::value_type<Matrix>::type value_type;
-    typedef typename backend::col_type<Matrix>::type col_type;
-
-    auto P = std::make_shared<Matrix>();
-
-    AMGCL_TIC("tentative");
-    if (nullspace.cols > 0) {
-        ptrdiff_t nba = naggr / block_size;
-
-        // Sort fine points by aggregate number.
-        // Put points not belonging to any aggregate to the end of the list.
-        std::vector<ptrdiff_t> order(n);
-        for(size_t i = 0; i < n; ++i) order[i] = i;
-        std::stable_sort(order.begin(), order.end(), detail::skip_negative(aggr, block_size));
-        std::vector<ptrdiff_t> aggr_ptr(nba + 1, 0);
-        for(ptrdiff_t i = 0; i < static_cast<ptrdiff_t>(n); ++i) {
-            ptrdiff_t a = aggr[order[i]];
-            if (a < 0) break;
-            ++aggr_ptr[a / block_size + 1];
-        }
-        std::partial_sum(aggr_ptr.begin(), aggr_ptr.end(), aggr_ptr.begin());
-
-        // Precompute the shape of the prolongation operator.
-        // Each row contains exactly nullspace.cols non-zero entries.
-        // Rows that do not belong to any aggregate are empty.
-        P->set_size(n, nullspace.cols * nba);
-        P->ptr[0] = 0;
-
-#pragma omp parallel for
-        for(ptrdiff_t i = 0; i < static_cast<ptrdiff_t>(n); ++i)
-            P->ptr[i+1] = aggr[i] < 0 ? 0 : nullspace.cols;
-
-        P->scan_row_sizes();
-        P->set_nonzeros();
-
-        // Compute the tentative prolongation operator and null-space vectors
-        // for the coarser level.
-        std::vector<double> Bnew;
-        Bnew.resize(nba * nullspace.cols * nullspace.cols);
-
-#pragma omp parallel
-        {
-            amgcl::detail::QR<double> qr;
-            std::vector<double> Bpart;
-
-#pragma omp for
-            for(ptrdiff_t i = 0; i < nba; ++i) {
-                auto aggr_beg = aggr_ptr[i];
-                auto aggr_end = aggr_ptr[i+1];
-                auto d = aggr_end - aggr_beg;
-
-                Bpart.resize(d * nullspace.cols);
-
-                for(ptrdiff_t j = aggr_beg, jj = 0; j < aggr_end; ++j, ++jj) {
-                    ptrdiff_t ib = nullspace.cols * order[j];
-                    for(int k = 0; k < nullspace.cols; ++k)
-                        Bpart[jj + d * k] = nullspace.B[ib + k];
-                }
-
-                qr.factorize(d, nullspace.cols, &Bpart[0], amgcl::detail::col_major);
-
-                for(int ii = 0, kk = 0; ii < nullspace.cols; ++ii)
-                    for(int jj = 0; jj < nullspace.cols; ++jj, ++kk)
-                        Bnew[i * nullspace.cols * nullspace.cols + kk] = qr.R(ii,jj);
-
-                for(ptrdiff_t j = aggr_beg, ii = 0; j < aggr_end; ++j, ++ii) {
-                    col_type   *c = &P->col[P->ptr[order[j]]];
-                    value_type *v = &P->val[P->ptr[order[j]]];
-
-                    for(int jj = 0; jj < nullspace.cols; ++jj) {
-                        c[jj] = i * nullspace.cols + jj;
-                        // TODO: this is just a workaround to make non-scalar value
-                        // types compile. Most probably this won't actually work.
-                        v[jj] = qr.Q(ii,jj) * math::identity<value_type>();
-                    }
-                }
-            }
-        }
-
-        std::swap(nullspace.B, Bnew);
-    } else {
-        P->set_size(n, naggr);
-        P->ptr[0] = 0;
-#pragma omp parallel for
-        for(ptrdiff_t i = 0; i < static_cast<ptrdiff_t>(n); ++i)
-            P->ptr[i+1] = (aggr[i] >= 0);
-
-        P->set_nonzeros(P->scan_row_sizes());
-
-#pragma omp parallel for
-        for(ptrdiff_t i = 0; i < static_cast<ptrdiff_t>(n); ++i) {
-            if (aggr[i] >= 0) {
-                P->col[P->ptr[i]] = aggr[i];
-                P->val[P->ptr[i]] = math::identity<value_type>();
-            }
-        }
-    }
-    AMGCL_TOC("tentative");
-
-    return P;
-}
-
-} // namespace coarsening
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/deflated_solver.hpp b/src/solvers/amgcl/deflated_solver.hpp
deleted file mode 100644
index 9bfa46a..0000000
--- a/src/solvers/amgcl/deflated_solver.hpp
+++ /dev/null
@@ -1,276 +0,0 @@
-#ifndef AMGCL_DEFLATED_SOLVER_HPP
-#define AMGCL_DEFLATED_SOLVER_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/deflated_solver.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Iterative preconditioned solver with deflation.
- */
-
-#include <amgcl/backend/builtin.hpp>
-#include <amgcl/util.hpp>
-#include <amgcl/detail/inverse.hpp>
-
-namespace amgcl {
-
-/// Convenience class that bundles together a preconditioner and an iterative solver.
-template <
-    class Precond,
-    class IterativeSolver
-    >
-class deflated_solver : public amgcl::detail::non_copyable {
-    static_assert(
-            backend::backends_compatible<
-                typename IterativeSolver::backend_type,
-                typename Precond::backend_type
-            >::value,
-            "Backends for preconditioner and iterative solver should be compatible"
-            );
-    public:
-        typedef typename IterativeSolver::backend_type backend_type;
-        typedef typename backend_type::matrix matrix;
-        typedef typename backend_type::vector vector;
-
-        typedef typename backend_type::value_type value_type;
-        typedef typename backend_type::params backend_params;
-        typedef typename backend::builtin<value_type>::matrix build_matrix;
-
-        typedef typename math::scalar_of<value_type>::type scalar_type;
-
-        /** Combined parameters of the bundled preconditioner and the iterative
-         * solver.
-         */
-        struct params {
-            int         nvec; ///< The number of deflation vectors
-            scalar_type *vec; ///< Deflation vectors as a [nvec x n] matrix
-
-            typename Precond::params         precond; ///< Preconditioner parameters.
-            typename IterativeSolver::params solver;  ///< Iterative solver parameters.
-
-            params() : nvec(0), vec(nullptr) {}
-
-#ifndef AMGCL_NO_BOOST
-            params(const boost::property_tree::ptree &p)
-                : AMGCL_PARAMS_IMPORT_VALUE(p, nvec),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, vec),
-                  AMGCL_PARAMS_IMPORT_CHILD(p, precond),
-                  AMGCL_PARAMS_IMPORT_CHILD(p, solver)
-            {
-                check_params(p, {"nvec", "vec", "precond", "solver"});
-            }
-
-            void get( boost::property_tree::ptree &p,
-                    const std::string &path = ""
-                    ) const
-            {
-                AMGCL_PARAMS_EXPORT_CHILD(p, path, nvec);
-                AMGCL_PARAMS_EXPORT_CHILD(p, path, vec);
-                AMGCL_PARAMS_EXPORT_CHILD(p, path, precond);
-                AMGCL_PARAMS_EXPORT_CHILD(p, path, solver);
-            }
-#endif
-        } prm;
-
-        /** Sets up the preconditioner and creates the iterative solver. */
-        template <class Matrix>
-        deflated_solver(
-                const Matrix &A,
-                const params &prm = params(),
-                const backend_params &bprm = backend_params()
-                ) :
-            prm(prm), n(backend::rows(A)),
-            P(A, prm.precond, bprm),
-            S(backend::rows(A), prm.solver, bprm),
-            r(backend_type::create_vector(n, bprm)),
-            Z(prm.nvec),
-            E(prm.nvec * prm.nvec, 0),
-            d(prm.nvec)
-        {
-            init(A, bprm);
-        }
-
-        // Constructs the preconditioner and creates iterative solver.
-        // Takes shared pointer to the matrix in internal format.
-        deflated_solver(
-                std::shared_ptr<build_matrix> A,
-                const params &prm = params(),
-                const backend_params &bprm = backend_params()
-                ) :
-            prm(prm), n(backend::rows(*A)),
-            P(A, prm.precond, bprm),
-            S(backend::rows(*A), prm.solver, bprm),
-            r(backend_type::create_vector(n, bprm)),
-            Z(prm.nvec),
-            E(prm.nvec * prm.nvec, 0),
-            d(prm.nvec)
-        {
-            init(*A, bprm);
-        }
-
-        template <class Matrix>
-        void init(const Matrix &A, const backend_params &bprm) {
-            precondition(prm.nvec > 0 && prm.vec != nullptr, "Deflation vectors are not set!");
-
-            for(int i = 0; i < prm.nvec; ++i) {
-                Z[i] = backend_type::copy_vector(
-                        std::make_shared<backend::numa_vector<scalar_type>>(make_iterator_range(prm.vec + n * i, prm.vec + n * (i + 1))),
-                        bprm);
-            }
-
-            std::vector<scalar_type> AZ(prm.nvec);
-            std::fill(E.begin(), E.end(), math::zero<scalar_type>());
-            for(ptrdiff_t i = 0; i < static_cast<ptrdiff_t>(n); ++i) {
-                std::fill(AZ.begin(), AZ.end(), math::zero<scalar_type>());
-                for(auto a = backend::row_begin(A, i); a; ++a) {
-                    for(int j = 0; j < prm.nvec; ++j) {
-                        AZ[j] += a.value() * prm.vec[j * n + a.col()];
-                    }
-                }
-
-                for(int ii = 0, k = 0; ii < prm.nvec; ++ii) {
-                    for(int jj = 0; jj < prm.nvec; ++jj, ++k) {
-                        E[k] += prm.vec[i + ii * n] * AZ[jj];
-                    }
-                }
-            }
-
-            std::vector<scalar_type> t(E.size());
-            std::vector<int> p(prm.nvec);
-            detail::inverse(prm.nvec, E.data(), t.data(), p.data());
-        }
-
-        /** Computes the solution for the given system matrix \p A and the
-         * right-hand side \p rhs.  Returns the number of iterations made and
-         * the achieved residual as a ``std::tuple``. The solution vector
-         * \p x provides initial approximation in input and holds the computed
-         * solution on output.
-         *
-         * \rst
-         * The system matrix may differ from the matrix used during
-         * initialization. This may be used for the solution of non-stationary
-         * problems with slowly changing coefficients. There is a strong chance
-         * that a preconditioner built for a time step will act as a reasonably
-         * good preconditioner for several subsequent time steps [DeSh12]_.
-         * \endrst
-         */
-        template <class Matrix, class Vec1, class Vec2>
-        std::tuple<size_t, scalar_type> operator()(
-                const Matrix &A, const Vec1 &rhs, Vec2 &&x) const
-        {
-            project(rhs, x);
-            return S(A, *this, rhs, x);
-        }
-
-        /** Computes the solution for the given right-hand side \p rhs.
-         * Returns the number of iterations made and the achieved residual as a
-         * ``std::tuple``. The solution vector \p x provides initial
-         * approximation in input and holds the computed solution on output.
-         */
-        template <class Vec1, class Vec2>
-        std::tuple<size_t, scalar_type> operator()(const Vec1 &rhs, Vec2 &&x) const {
-            project(rhs, x);
-            return S(*this, rhs, x);
-        }
-
-        template <class Vec1, class Vec2>
-        void apply(const Vec1 &rhs, Vec2 &&x) const {
-            P.apply(rhs, x);
-            project(rhs, x);
-        }
-
-        template <class Vec1, class Vec2>
-        void project(const Vec1 &b, Vec2 &x) const {
-            // x += Z^T E^{-1} Z (b - Ax)
-            backend::residual(b, P.system_matrix(), x, *r);
-            std::fill(d.begin(), d.end(), math::zero<scalar_type>());
-            for(int j = 0; j < prm.nvec; ++j) {
-                auto fj = backend::inner_product(*Z[j], *r);
-                for(int i = 0; i < prm.nvec; ++i)
-                    d[i] += E[i*prm.nvec+j] * fj;
-            }
-            backend::lin_comb(prm.nvec, d, Z, 1, x);
-        }
-
-        /// Returns reference to the constructed preconditioner.
-        const Precond& precond() const {
-            return P;
-        }
-
-        /// Returns reference to the constructed preconditioner.
-        Precond& precond() {
-            return P;
-        }
-
-        /// Returns reference to the constructed iterative solver.
-        const IterativeSolver& solver() const {
-            return S;
-        }
-
-        /// Returns the system matrix in the backend format.
-        std::shared_ptr<typename Precond::matrix> system_matrix_ptr() const {
-            return P.system_matrix_ptr();
-        }
-
-        typename Precond::matrix const& system_matrix() const {
-            return P.system_matrix();
-        }
-
-#ifndef AMGCL_NO_BOOST
-        /// Stores the parameters used during construction into the property tree \p p.
-        void get_params(boost::property_tree::ptree &p) const {
-            prm.get(p);
-        }
-#endif
-
-        /// Returns the size of the system matrix.
-        size_t size() const {
-            return n;
-        }
-
-        size_t bytes() const {
-            return backend::bytes(S) + backend::bytes(P);
-        }
-
-        friend std::ostream& operator<<(std::ostream &os, const deflated_solver &p) {
-            return os
-                << "Solver\n======\n" << p.S << std::endl
-                << "Preconditioner\n==============\n" << p.P;
-        }
-    private:
-        size_t           n;
-        Precond          P;
-        IterativeSolver  S;
-        std::shared_ptr<vector> r;
-        std::vector<std::shared_ptr<vector>> Z;
-        std::vector<scalar_type> E;
-        mutable std::vector<scalar_type> d;
-};
-
-} // namespace amgcl
-
-
-#endif
diff --git a/src/solvers/amgcl/detail/inverse.hpp b/src/solvers/amgcl/detail/inverse.hpp
deleted file mode 100644
index 644ce7d..0000000
--- a/src/solvers/amgcl/detail/inverse.hpp
+++ /dev/null
@@ -1,102 +0,0 @@
-#ifndef AMGCL_DETAIL_INVERSE_HPP
-#define AMGCL_DETAIL_INVERSE_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/detail/inverse.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Inverse of a dense matrix.
- */
-
-#include <algorithm>
-#include <cassert>
-#include <numeric>
-#include <utility>
-#include <amgcl/util.hpp>
-#include <amgcl/value_type/interface.hpp>
-
-namespace amgcl {
-namespace detail {
-
-    template <typename value_type>
-    static void inverse(int n, value_type *A, value_type *t, int *p) {
-        std::iota(p, p + n, 0);
-
-        // Perform LU-factorization of A in-place
-        for(int col = 0; col < n; ++col) {
-            // Find pivot element
-            int pivot_i = col;
-            using mag_type = typename math::scalar_of<value_type>::type;
-            mag_type pivot_mag = math::zero<mag_type>();
-            for (int i = col; i < n; ++i) {
-                int row = p[i];
-                mag_type mag = math::norm(A[row*n+col]);
-                if (mag > pivot_mag) {
-                    pivot_mag = mag;
-                    pivot_i = i;
-                }
-            }
-            std::swap(p[col], p[pivot_i]);
-            int pivot_row = p[col];
-            // We have found pivot element, perform Gauss elimination
-            value_type d = math::inverse(A[pivot_row*n+col]);
-            assert(!math::is_zero(d));
-            for (int i = col+1; i < n; ++i) {
-                int row = p[i];
-                A[row*n+col] *= d;
-                for(int j = col+1; j < n; ++j)
-                    A[row*n+j] -= A[row*n+col] * A[pivot_row*n+j];
-            }
-            A[pivot_row*n+col] = d;
-        }
-
-        // Invert identity matrix in-place to get the solution.
-        for(int k = 0; k < n; ++k) {
-            // Lower triangular solve:
-            for(int i = 0; i < n; ++i) {
-                int row = p[i];
-                value_type b = (row == k) ? math::identity<value_type>() : math::zero<value_type>();
-                for(int j = 0; j < i; ++j)
-                    b -= A[row*n+j] * t[j*n+k];
-                t[i*n+k] = b;
-            }
-
-            // Upper triangular solve:
-            for(int i = n; i --> 0; ) {
-                int row = p[i];
-                for(int j = i+1; j < n; ++j)
-                    t[i*n+k] -= A[row*n+j] * t[j*n+k];
-                t[i*n+k] *= A[row*n+i];
-            }
-        }
-
-        std::copy(t, t + n * n, A);
-    }
-
-} // namespace detail
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/detail/qr.hpp b/src/solvers/amgcl/detail/qr.hpp
deleted file mode 100644
index 5155c9c..0000000
--- a/src/solvers/amgcl/detail/qr.hpp
+++ /dev/null
@@ -1,601 +0,0 @@
-#ifndef AMGCL_DETAIL_QR_HPP
-#define AMGCL_DETAIL_QR_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/detail/qr.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  QR decomposition.
- *
- * This is a port of ZGEQR2 procedure from LAPACK and its dependencies.
- * The original code included the following copyright notice:
- * \verbatim
-   Copyright (c) 1992-2013 The University of Tennessee and The University
-                           of Tennessee Research Foundation.  All rights
-                           reserved.
-   Copyright (c) 2000-2013 The University of California Berkeley. All
-                           rights reserved.
-   Copyright (c) 2006-2013 The University of Colorado Denver.  All rights
-                           reserved.
-
-   $COPYRIGHT$
-
-   Additional copyrights may follow
-
-   $HEADER$
-
-   Redistribution and use in source and binary forms, with or without
-   modification, are permitted provided that the following conditions are
-   met:
-
-   - Redistributions of source code must retain the above copyright
-     notice, this list of conditions and the following disclaimer.
-
-   - Redistributions in binary form must reproduce the above copyright
-     notice, this list of conditions and the following disclaimer listed
-     in this license in the documentation and/or other materials
-     provided with the distribution.
-
-   - Neither the name of the copyright holders nor the names of its
-     contributors may be used to endorse or promote products derived from
-     this software without specific prior written permission.
-
-   The copyright holders provide no reassurances that the source code
-   provided does not infringe any patent, copyright, or any other
-   intellectual property rights of third parties.  The copyright holders
-   disclaim any liability to any recipient for claims brought against
-   recipient by any third party for infringement of that parties
-   intellectual property rights.
-
-   THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
-   "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
-   LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
-   A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
-   OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
-   SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
-   LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
-   DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
-   THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
-   (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
-   OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
- * \endverbatim
- */
-
-#include <vector>
-#include <complex>
-#include <cmath>
-
-#include <amgcl/util.hpp>
-#include <amgcl/value_type/interface.hpp>
-
-namespace amgcl {
-namespace detail {
-
-enum storage_order {
-    row_major,
-    col_major
-};
-
-template <class T>
-inline T real(T a) {
-    return a;
-}
-
-template <class T>
-inline T real(std::complex<T> a) {
-    return std::real(a);
-}
-
-/// In-place QR factorization.
-template <typename value_type, class Enable = void>
-class QR {
-    public:
-        QR() : m(0), n(0), row_stride(0), col_stride(0), r(NULL) {}
-
-        void compute(int rows, int cols, int row_stride, int col_stride, value_type *A) {
-            /*
-             *  Ported from ZGEQR2
-             *  ==================
-             *
-             *  Computes a QR factorization of an matrix A:
-             *  A = Q * R.
-             *
-             *  Arguments
-             *  =========
-             *
-             *  rows    The number of rows of the matrix A.
-             *  cols    The number of columns of the matrix A.
-             *
-             *  A       On entry, the rows by cols matrix A.
-             *          On exit, the elements on and above the diagonal of the
-             *          array contain the min(m,n) by n upper trapezoidal
-             *          matrix R (R is upper triangular if m >= n); the
-             *          elements below the diagonal, with the array TAU,
-             *          represent the unitary matrix Q as a product of
-             *          elementary reflectors (see Further Details).
-             *
-             *  Further Details
-             *  ===============
-             *
-             *  The matrix Q is represented as a product of elementary reflectors
-             *
-             *     Q = H(1) H(2) . . . H(k), where k = min(m,n).
-             *
-             *  Each H(i) has the form
-             *
-             *     H(i) = I - tau * v * v'
-             *
-             *  where tau is a value_type scalar, and v is a value_type vector
-             *  with v[0:i) = 0 and v[i] = 1; v[i:m) is stored on exit in
-             *  A[i+1:m)[i], and tau in tau[i].
-             *  ==============================================================
-             */
-            const int m = rows;
-            const int n = cols;
-            const int k = std::min(m, n);
-
-            if (k <= 0) return;
-
-            r = A;
-
-            tau.resize(k);
-
-            for(int i = 0, ii = 0; i < k; ++i, ii += row_stride + col_stride) {
-                // Generate elementary reflector H(i) to annihilate A[i+1:m)[i]
-                tau[i] = gen_reflector(m-i, A[ii], A + ii + row_stride, row_stride);
-
-                if (i+1 < n) {
-                    // Apply H(i)' to A[i:m)[i+1:n) from the left
-                    apply_reflector(m-i, n-i-1, A + ii, row_stride, math::adjoint(tau[i]),
-                            A + ii + col_stride, row_stride, col_stride);
-                }
-            }
-        }
-
-        void compute(int rows, int cols, value_type *A, storage_order order = row_major) {
-            int row_stride = (order == row_major ? cols : 1);
-            int col_stride = (order == row_major ? 1 : rows);
-            compute(rows, cols, row_stride, col_stride, A);
-        }
-
-        // Computes Q explicitly.
-        void factorize(int rows, int cols, int row_stride, int col_stride, value_type *A) {
-            /*
-             *  Ported from ZUNG2R
-             *  ==================
-             *
-             *  Generates an m by n matrix Q with orthonormal columns, which is
-             *  defined as the first n columns of a product of k elementary
-             *  reflectors of order m
-             *
-             *        Q  =  H(1) H(2) . . . H(k)
-             *
-             *  as returned by compute() [ZGEQR2].
-             *
-             *  ==============================================================
-             */
-            compute(rows, cols, row_stride, col_stride, A);
-
-            m = rows;
-            n = cols;
-
-            int k = std::min(m, n);
-
-            this->row_stride = row_stride;
-            this->col_stride = col_stride;
-
-            q.resize(m * n);
-
-            // Initialise columns k+1:n to zero.
-            // [In the original code these were initialized to the columns of
-            // the unit matrix, but since k = min(n,m), the main diagonal is
-            // never seen here].
-            for(int i = 0, ia = 0; i < m; ++i, ia += row_stride)
-                for(int j = k, ja = k * col_stride; j < n; ++j, ja += col_stride)
-                    q[ia + ja] = (i == j ? math::identity<value_type>() : math::zero<value_type>());
-
-            for(int i = k-1, ic = i * col_stride, ii = i*(row_stride + col_stride);
-                    i >= 0; --i, ic -= col_stride, ii -= row_stride + col_stride)
-            {
-                // Apply H(i) to A[i:m)[i+1:n) from the left
-                if (i < n-1)
-                    apply_reflector(m-i, n-i-1, r+ii, row_stride, tau[i], &q[ii+col_stride], row_stride, col_stride);
-
-                // Copy i-th reflector (including zeros and unit diagonal)
-                // to the column of Q to be processed next
-                for(int j = 0, jr = 0; j < i; ++j, jr += row_stride)
-                    q[jr+ic] = math::zero<value_type>();
-
-                q[ii] = math::identity<value_type>() - tau[i];
-
-                for(int j = i + 1, jr=j*row_stride; j < m; ++j, jr += row_stride)
-                    q[jr + ic] = -tau[i] * r[jr + ic];
-            }
-        }
-
-        void factorize(int rows, int cols, value_type *A, storage_order order = row_major) {
-            int row_stride = (order == row_major ? cols : 1);
-            int col_stride = (order == row_major ? 1 : rows);
-            factorize(rows, cols, row_stride, col_stride, A);
-        }
-
-        // Returns element of the matrix R.
-        value_type R(int i, int j) const {
-            if (j < i) return math::zero<value_type>();
-            return r[i*row_stride + j*col_stride];
-        }
-
-        // Returns element of the matrix Q.
-        value_type Q(int i, int j) const {
-            return q[i*row_stride + j*col_stride];
-        }
-
-        // Solves the system Q R x = f
-        void solve(
-                int rows, int cols, int row_stride, int col_stride, value_type *A,
-                const value_type *b, value_type *x, bool computed = false)
-        {
-            f.resize(rows);
-            std::copy(b, b + rows, f.begin());
-
-            if (rows >= cols) {
-                // We are solving overdetermined (tall) system Ax = f by
-                // writing the matrix A as A = QR and solving for x as
-                // x = R^-1 Q^-1 f = R^-1 Q^T f.
-                if (!computed) compute(rows, cols, row_stride, col_stride, A);
-
-                for(int i = 0, ii = 0; i < cols; ++i, ii += row_stride + col_stride)
-                    apply_reflector(rows-i, 1, r+ii, row_stride, math::adjoint(tau[i]), &f[i], 1, 1);
-
-                std::copy(f.begin(), f.begin()+cols, x);
-
-                for(int i = cols, ia = (cols-1) * col_stride; i --> 0; ia -= col_stride) {
-                    value_type rii = r[i*(row_stride+col_stride)];
-                    if (math::is_zero(rii)) continue;
-                    x[i] = math::inverse(rii) * x[i];
-
-                    for(int j = 0, ja = 0; j < i; ++j, ja += row_stride)
-                        x[j] -= r[ia + ja] * x[i];
-                }
-            } else {
-                // We are solving underdetermined (wide) system Ax = f by
-                // writing the matrix A^T as A^T = QR and solving for x as
-                // x = Q^-T R^-T f = Q R^-T f.
-                if (!computed) {
-                    for(int i = 0, n = cols * rows; i < n; ++i)
-                        A[i] = math::adjoint(A[i]);
-                    compute(cols, rows, col_stride, row_stride, A);
-                }
-
-                for(int i = 0, ia = 0; i < rows; ++i, ia += col_stride) {
-                    value_type rii = math::adjoint(r[i*(row_stride+col_stride)]);
-                    if (math::is_zero(rii)) continue;
-                    f[i] = math::inverse(rii) * f[i];
-
-                    for(int j = i+1, ja = j * row_stride; j < rows; ++j, ja += row_stride)
-                        f[j] -= math::adjoint(r[ia + ja]) * f[i];
-                }
-
-                std::copy(f.begin(), f.end(), x);
-                std::fill(x+rows, x+cols, math::zero<value_type>());
-
-                for(int i = rows; i --> 0; ) {
-                    int ii = i * (col_stride + row_stride);
-                    apply_reflector(cols-i, 1, r+ii, col_stride, tau[i], x+i, 1, 1);
-                }
-            }
-        }
-
-        void solve(
-                int rows, int cols, value_type *A, const value_type *b, value_type *x,
-                storage_order order = row_major, bool computed = false
-                )
-        {
-            int row_stride = (order == row_major ? cols : 1);
-            int col_stride = (order == row_major ? 1 : rows);
-            solve(rows, cols, row_stride, col_stride, A, b, x, computed);
-        }
-
-        size_t bytes() {
-            return sizeof(value_type) * (tau.size() + f.size() + q.size());
-        }
-
-    private:
-        typedef typename math::scalar_of<value_type>::type scalar_type;
-
-        static scalar_type sqr(scalar_type x) { return x * x; }
-
-        int m, n, row_stride, col_stride;
-
-        value_type *r;
-        std::vector<value_type> tau, f;
-        std::vector<value_type> q;
-
-        static value_type gen_reflector(int order, value_type &alpha, value_type *x, int stride) {
-            /*
-             *  Ported from ZLARFG
-             *  ==================
-             *
-             *  Generates a value_type elementary reflector H of order n, such
-             *  that
-             *
-             *        H' * ( alpha ) = ( beta ),   H' * H = I.
-             *             (   x   )   (   0  )
-             *
-             *  where alpha and beta are scalars, with beta real, and x is an
-             *  (n-1)-element value_type vector. H is represented in the form
-             *
-             *        H = I - tau * ( 1 ) * ( 1 v' ) ,
-             *                      ( v )
-             *
-             *  where tau is a value_type scalar and v is a value_type
-             *  (n-1)-element vector. Note that H is not hermitian.
-             *
-             *  If the elements of x are all zero and alpha is real,
-             *  then tau = 0 and H is taken to be the unit matrix.
-             *
-             *  Otherwise  1 <= real(tau) <= 2  and  abs(tau-1) <= 1 .
-             *
-             *  Arguments
-             *  =========
-             *
-             *  order   The order of the elementary reflector.
-             *
-             *  alpha   On entry, the value alpha.
-             *          On exit, it is overwritten with the value beta.
-             *
-             *  x       dimension (1+(order-2)*abs(stride))
-             *          On entry, the vector x.
-             *          On exit, it is overwritten with the vector v.
-             *
-             *  stride  The increment between elements of x.
-             *
-             *  Returns the value tau.
-             *
-             *  ==============================================================
-             */
-            value_type tau = math::zero<value_type>();
-            if (order <= 1) return tau;
-            int n = order - 1;
-
-            scalar_type xnorm2 = 0;
-            for(int i = 0, ii = 0; i < n; ++i, ii += stride)
-                xnorm2 += sqr(math::norm(x[ii]));
-
-            if (math::is_zero(xnorm2)) return tau;
-
-            scalar_type beta = -std::abs(sqrt(sqr(math::norm(alpha)) + xnorm2));
-            if (amgcl::detail::real(alpha) < 0) beta = -beta;
-
-            tau = math::identity<value_type>() - math::inverse(beta) * alpha;
-            alpha = math::inverse(alpha - beta * math::identity<value_type>());
-
-            for(int i = 0, ii = 0; i < n; ++i, ii += stride)
-                x[ii] = alpha * x[ii];
-
-            alpha = beta * math::identity<value_type>();
-            return tau;
-        }
-
-        static void apply_reflector(
-                int m, int n, const value_type *v, int v_stride, value_type tau,
-                value_type *C, int row_stride, int col_stride
-                )
-        {
-            /*
-             *  Ported from ZLARF
-             *  =================
-             *
-             *  Applies an elementary reflector H to an m-by-n matrix C from
-             *  the left. H is represented in the form
-             *
-             *        H = I - v * tau * v'
-             *
-             *  where tau is a value_type scalar and v is a value_type vector.
-             *
-             *  If tau = 0, then H is taken to be the unit matrix.
-             *
-             *  To apply H' (the conjugate transpose of H), supply adjoint(tau)
-             *  instead of tau.
-             *
-             *  Arguments
-             *  =========
-             *
-             *  m          The number of rows of the matrix C.
-             *
-             *  n          The number of columns of the matrix C.
-             *
-             *  v          The vector v in the representation of H.
-             *             v is not used if tau = 0.
-             *             The value of v[0] is ignored and assumed to be 1.
-             *
-             *  v_stride   The increment between elements of v.
-             *
-             *  tau        The value tau in the representation of H.
-             *
-             *  C          On entry, the m-by-n matrix C.
-             *             On exit, C is overwritten by the matrix H * C.
-             *
-             *  row_stride The increment between the rows of C.
-             *  col_stride The increment between the columns of C.
-             *
-             *  ==============================================================
-             */
-
-            if (math::is_zero(tau)) return;
-
-            // w = C` * v; C -= tau * v * w`
-            for(int i = 0, ia=0; i < n; ++i, ia += col_stride) {
-                value_type s = math::adjoint(C[ia]);
-                for(int j = 1, jv = v_stride, ja=row_stride; j < m; ++j, jv += v_stride, ja += row_stride) {
-                    s += math::adjoint(C[ja+ia]) * v[jv];
-                }
-
-                s = tau * math::adjoint(s);
-                C[ia] -= s;
-                for(int j = 1, jv = v_stride, ja=row_stride; j < m; ++j, jv += v_stride, ja += row_stride) {
-                    C[ja+ia] -= v[jv] * s;
-                }
-            }
-        }
-
-};
-
-template <class value_type>
-class QR<value_type, typename std::enable_if<math::is_static_matrix<value_type>::value>::type>
-{
-    public:
-        typedef typename amgcl::math::rhs_of<value_type>::type rhs_type;
-
-        QR() {}
-
-        void compute(int rows, int cols, int row_stride, int col_stride, value_type *A) {
-            const int M = math::static_rows<value_type>::value;
-            const int N = math::static_cols<value_type>::value;
-
-            m = rows;
-            n = cols;
-
-            r = A;
-
-            copy_to_scalar_buf(rows, cols, row_stride, col_stride, A);
-            base.compute(rows * M, cols * N, 1, rows * M, buf.data());
-        }
-
-        void factorize(int rows, int cols, int row_stride, int col_stride, value_type *A) {
-            const int M = math::static_rows<value_type>::value;
-            const int N = math::static_cols<value_type>::value;
-
-            m = rows * M;
-            n = cols * N;
-
-            r = A;
-
-            copy_to_scalar_buf(rows, cols, row_stride, col_stride, A);
-            base.factorize(m, n, 1, m, buf.data());
-        }
-
-        void factorize(int rows, int cols, value_type *A, storage_order order = row_major) {
-            int row_stride = (order == row_major ? cols : 1);
-            int col_stride = (order == row_major ? 1 : rows);
-            factorize(rows, cols, row_stride, col_stride, A);
-        }
-
-        value_type R(int i, int j) const {
-            const int N = math::static_rows<value_type>::value;
-            const int M = math::static_cols<value_type>::value;
-
-            value_type v;
-
-            if (j < i) {
-                v = math::zero<value_type>();
-            } else {
-                for(int ii = 0; ii < N; ++ii)
-                    for(int jj = 0; jj < M; ++jj)
-                        v(ii,jj) = base.R(i * N + ii, j * M + jj);
-            }
-
-            return v;
-        }
-
-        // Returns element of the matrix Q.
-        value_type Q(int i, int j) const {
-            const int N = math::static_rows<value_type>::value;
-            const int M = math::static_cols<value_type>::value;
-
-            value_type v;
-
-            for(int ii = 0; ii < N; ++ii)
-                for(int jj = 0; jj < M; ++jj)
-                    v(ii,jj) = base.Q(i * N + ii, j * M + jj);
-
-            return v;
-        }
-
-        // Solves the system Q R x = f
-        void solve(
-                int rows, int cols, int row_stride, int col_stride, value_type *A,
-                const rhs_type *f, rhs_type *x, bool computed = false)
-        {
-            const int M = math::static_rows<value_type>::value;
-            const int N = math::static_cols<value_type>::value;
-
-            m = rows * M;
-            n = cols * N;
-
-            r = A;
-
-            copy_to_scalar_buf(rows, cols, row_stride, col_stride, A);
-            base.solve(m, n, 1, m, buf.data(),
-                    reinterpret_cast<const scalar_type*>(f),
-                    reinterpret_cast<scalar_type*>(x),
-                    computed
-                    );
-        }
-
-        void solve(
-                int rows, int cols, value_type *A, const rhs_type *f, rhs_type *x,
-                storage_order order = row_major, bool computed = false
-                )
-        {
-            int row_stride = (order == row_major ? cols : 1);
-            int col_stride = (order == row_major ? 1 : rows);
-            solve(rows, cols, row_stride, col_stride, A, f, x, computed);
-        }
-
-        size_t bytes() const {
-            return base.bytes() + sizeof(scalar_type) * buf.size();
-        }
-
-    private:
-        typedef typename amgcl::math::scalar_of<value_type>::type scalar_type;
-
-        int m, n;
-        value_type *r;
-
-        QR<scalar_type> base;
-        std::vector<scalar_type> buf;
-
-        void copy_to_scalar_buf(int rows, int cols, int row_stride, int col_stride, value_type *A) {
-            const int M = math::static_rows<value_type>::value;
-            const int N = math::static_cols<value_type>::value;
-
-            buf.resize(M * rows * N * cols);
-
-            const int scalar_rows = M * rows;
-
-            for(int i = 0, ib = 0; i < rows; ++i)
-                for(int ii = 0; ii < M; ++ii, ++ib)
-                    for(int j = 0, jb = 0; j < cols; ++j)
-                        for(int jj = 0; jj < N; ++jj, jb += scalar_rows)
-                            buf[ib + jb] = A[i * row_stride + j * col_stride](ii, jj);
-        }
-};
-
-} // namespace detail
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/detail/sort_row.hpp b/src/solvers/amgcl/detail/sort_row.hpp
deleted file mode 100644
index a82ce0a..0000000
--- a/src/solvers/amgcl/detail/sort_row.hpp
+++ /dev/null
@@ -1,59 +0,0 @@
-#ifndef AMGCL_DETAIL_SORT_ROW_HPP
-#define AMGCL_DETAIL_SORT_ROW_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/detail/sort_row.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Sort row of CRS matrix by columns.
- */
-
-namespace amgcl {
-namespace detail {
-
-template <typename Col, typename Val>
-void sort_row(Col *col, Val *val, int n) {
-    for(int j = 1; j < n; ++j) {
-        Col c = col[j];
-        Val v = val[j];
-
-        int i = j - 1;
-
-        while(i >= 0 && col[i] > c) {
-            col[i + 1] = col[i];
-            val[i + 1] = val[i];
-            i--;
-        }
-
-        col[i + 1] = c;
-        val[i + 1] = v;
-    }
-}
-
-} // namespace detail
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/detail/spgemm.hpp b/src/solvers/amgcl/detail/spgemm.hpp
deleted file mode 100644
index df48067..0000000
--- a/src/solvers/amgcl/detail/spgemm.hpp
+++ /dev/null
@@ -1,509 +0,0 @@
-#ifndef AMGCL_DETAIL_SPGEMM_HPP
-#define AMGCL_DETAIL_SPGEMM_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/detail/spgemm.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Sparse matrix-matrix product algorithms.
- *
- * This implements two algorithms.
- *
- * The first is an OpenMP-enabled modification of classic algorithm from Saad
- * [1]. It is used whenever number of OpenMP cores is 4 or less.
- *
- * The second is Row-merge algorithm from Rupp et al. [2]. The algorithm
- * requires less memory and shows much better scalability than classic one.
- * It is used when number of OpenMP cores is more than 4.
- *
- * [1] Saad, Yousef. Iterative methods for sparse linear systems. Siam, 2003.
- * [2] Rupp K, Rudolf F, Weinbub J, Morhammer A, Grasser T, Jungel A. Optimized
- *     Sparse Matrix-Matrix Multiplication for Multi-Core CPUs, GPUs, and Xeon
- *     Phi. Submitted
- */
-#include <vector>
-#include <algorithm>
-#ifdef _OPENMP
-#include <omp.h>
-#endif
-
-#include <amgcl/backend/interface.hpp>
-#include <amgcl/value_type/interface.hpp>
-#include <amgcl/detail/sort_row.hpp>
-
-namespace amgcl {
-namespace backend {
-
-//---------------------------------------------------------------------------
-template <class AMatrix, class BMatrix, class CMatrix>
-void spgemm_saad(const AMatrix &A, const BMatrix &B, CMatrix &C, bool sort = true)
-{
-    typedef typename backend::value_type<CMatrix>::type Val;
-    typedef typename backend::col_type<CMatrix>::type Col;
-    typedef ptrdiff_t Idx;
-
-    C.set_size(A.nrows, B.ncols);
-    C.ptr[0] = 0;
-
-#pragma omp parallel
-    {
-        std::vector<ptrdiff_t> marker(B.ncols, -1);
-
-#pragma omp for
-        for(Idx ia = 0; ia < static_cast<Idx>(A.nrows); ++ia) {
-            Col C_cols = 0;
-            for(Idx ja = A.ptr[ia], ea = A.ptr[ia+1]; ja < ea; ++ja) {
-                Col ca = A.col[ja];
-
-                for(Idx jb = B.ptr[ca], eb = B.ptr[ca+1]; jb < eb; ++jb) {
-                    Col cb = B.col[jb];
-                    if (marker[cb] != ia) {
-                        marker[cb]  = ia;
-                        ++C_cols;
-                    }
-                }
-            }
-            C.ptr[ia + 1] = C_cols;
-        }
-    }
-
-    C.set_nonzeros(C.scan_row_sizes());
-
-#pragma omp parallel
-    {
-        std::vector<ptrdiff_t> marker(B.ncols, -1);
-
-#pragma omp for
-        for(Idx ia = 0; ia < static_cast<Idx>(A.nrows); ++ia) {
-            Idx row_beg = C.ptr[ia];
-            Idx row_end = row_beg;
-
-            for(Idx ja = A.ptr[ia], ea = A.ptr[ia+1]; ja < ea; ++ja) {
-                Col ca = A.col[ja];
-                Val va = A.val[ja];
-
-                for(Idx jb = B.ptr[ca], eb = B.ptr[ca+1]; jb < eb; ++jb) {
-                    Col cb = B.col[jb];
-                    Val vb = B.val[jb];
-
-                    if (marker[cb] < row_beg) {
-                        marker[cb] = row_end;
-                        C.col[row_end] = cb;
-                        C.val[row_end] = va * vb;
-                        ++row_end;
-                    } else {
-                        C.val[marker[cb]] += va * vb;
-                    }
-                }
-            }
-
-            if (sort) amgcl::detail::sort_row(
-                    C.col + row_beg, C.val + row_beg, row_end - row_beg);
-        }
-    }
-}
-
-//---------------------------------------------------------------------------
-template <bool need_out, class Idx>
-Idx* merge_rows(
-        const Idx *col1, const Idx *col1_end,
-        const Idx *col2, const Idx *col2_end,
-        Idx *col3
-        )
-{
-    while(col1 != col1_end && col2 != col2_end) {
-        Idx c1 = *col1;
-        Idx c2 = *col2;
-
-        if (c1 < c2) {
-            if (need_out) *col3 = c1;
-            ++col1;
-        } else if (c1 == c2) {
-            if (need_out) *col3 = c1;
-            ++col1;
-            ++col2;
-        } else {
-            if (need_out) *col3 = c2;
-            ++col2;
-        }
-        ++col3;
-    }
-
-    if (need_out) {
-        if (col1 < col1_end) {
-            return std::copy(col1, col1_end, col3);
-        } else if (col2 < col2_end) {
-            return std::copy(col2, col2_end, col3);
-        } else {
-            return col3;
-        }
-    } else {
-        return col3 + (col1_end - col1) + (col2_end - col2);
-    }
-}
-
-template <class Idx, class Val>
-Idx* merge_rows(
-        const Val &alpha1, const Idx *col1, const Idx *col1_end, const Val *val1,
-        const Val &alpha2, const Idx *col2, const Idx *col2_end, const Val *val2,
-        Idx *col3, Val *val3
-        )
-{
-    while(col1 != col1_end && col2 != col2_end) {
-        Idx c1 = *col1;
-        Idx c2 = *col2;
-
-        if (c1 < c2) {
-            ++col1;
-
-            *col3 = c1;
-            *val3 = alpha1 * (*val1++);
-        } else if (c1 == c2) {
-            ++col1;
-            ++col2;
-
-            *col3 = c1;
-            *val3 = alpha1 * (*val1++) + alpha2 * (*val2++);
-        } else {
-            ++col2;
-
-            *col3 = c2;
-            *val3 = alpha2 * (*val2++);
-        }
-
-        ++col3;
-        ++val3;
-    }
-
-    while(col1 < col1_end) {
-        *col3++ = *col1++;
-        *val3++ = alpha1 * (*val1++);
-    }
-
-    while(col2 < col2_end) {
-        *col3++ = *col2++;
-        *val3++ = alpha2 * (*val2++);
-    }
-
-    return col3;
-}
-
-template <class Col, class Ptr>
-Ptr prod_row_width(
-        const Col *acol, const Col *acol_end,
-        const Ptr *bptr, const Col *bcol,
-        Col *tmp_col1, Col *tmp_col2, Col *tmp_col3
-        )
-{
-    const Col nrows = acol_end - acol;
-
-    /* No rows to merge, nothing to do */
-    if (nrows == 0) return 0;
-
-    /* Single row, just copy it to output */
-    if (nrows == 1) return bptr[*acol + 1] - bptr[*acol];
-
-    /* Two rows, merge them */
-    if (nrows == 2) {
-        int a1 = acol[0];
-        int a2 = acol[1];
-
-        return merge_rows<false>(
-                bcol + bptr[a1], bcol + bptr[a1+1],
-                bcol + bptr[a2], bcol + bptr[a2+1],
-                tmp_col1
-                ) - tmp_col1;
-    }
-
-    /* Generic case (more than two rows).
-     *
-     * Merge rows by pairs, then merge the results together.
-     * When merging two rows, the result is always wider (or equal).
-     * Merging by pairs allows to work with short rows as often as possible.
-     */
-    // Merge first two.
-    Col a1 = *acol++;
-    Col a2 = *acol++;
-    Col c_col1 = merge_rows<true>(
-            bcol + bptr[a1], bcol + bptr[a1+1],
-            bcol + bptr[a2], bcol + bptr[a2+1],
-            tmp_col1
-            ) - tmp_col1;
-
-    // Go by pairs.
-    while(acol + 1 < acol_end) {
-        a1 = *acol++;
-        a2 = *acol++;
-
-        Col c_col2 = merge_rows<true>(
-                bcol + bptr[a1], bcol + bptr[a1+1],
-                bcol + bptr[a2], bcol + bptr[a2+1],
-                tmp_col2
-                ) - tmp_col2;
-
-        if (acol == acol_end) {
-            return merge_rows<false>(
-                    tmp_col1, tmp_col1 + c_col1,
-                    tmp_col2, tmp_col2 + c_col2,
-                    tmp_col3
-                    ) - tmp_col3;
-        } else {
-            c_col1 = merge_rows<true>(
-                    tmp_col1, tmp_col1 + c_col1,
-                    tmp_col2, tmp_col2 + c_col2,
-                    tmp_col3
-                    ) - tmp_col3;
-
-            std::swap(tmp_col1, tmp_col3);
-        }
-    }
-
-    // Merge the tail.
-    a2 = *acol;
-    return merge_rows<false>(
-            tmp_col1, tmp_col1 + c_col1,
-            bcol + bptr[a2], bcol + bptr[a2+1],
-            tmp_col2
-            ) - tmp_col2;
-}
-
-template <class Col, class Ptr, class Val>
-void prod_row(
-        const Col *acol, const Col *acol_end, const Val *aval,
-        const Ptr *bptr, const Col *bcol, const Val *bval,
-        Col *out_col, Val *out_val,
-        Col *tm2_col, Val *tm2_val,
-        Col *tm3_col, Val *tm3_val
-        )
-{
-    const Col nrows = acol_end - acol;
-
-    /* No rows to merge, nothing to do */
-    if (nrows == 0) return;
-
-    /* Single row, just copy it to output */
-    if (nrows == 1) {
-        Col ac = *acol;
-        Val av = *aval;
-
-        const Val *bv = bval + bptr[ac];
-        const Col *bc = bcol + bptr[ac];
-        const Col *be = bcol + bptr[ac+1];
-
-        while(bc != be) {
-            *out_col++ = *bc++;
-            *out_val++ = av * (*bv++);
-        }
-
-        return;
-    }
-
-    /* Two rows, merge them */
-    if (nrows == 2) {
-        Col ac1 = acol[0];
-        Col ac2 = acol[1];
-
-        Val av1 = aval[0];
-        Val av2 = aval[1];
-
-        merge_rows(
-                av1, bcol + bptr[ac1], bcol + bptr[ac1+1], bval + bptr[ac1],
-                av2, bcol + bptr[ac2], bcol + bptr[ac2+1], bval + bptr[ac2],
-                out_col, out_val
-                );
-
-        return;
-    }
-
-    /* Generic case (more than two rows).
-     *
-     * Merge rows by pairs, then merge the results together.
-     * When merging two rows, the result is always wider (or equal).
-     * Merging by pairs allows to work with short rows as often as possible.
-     */
-    // Merge first two.
-    Col ac1 = *acol++;
-    Col ac2 = *acol++;
-
-    Val av1 = *aval++;
-    Val av2 = *aval++;
-
-    Col *tm1_col = out_col;
-    Val *tm1_val = out_val;
-
-    Col c_col1 = merge_rows(
-            av1, bcol + bptr[ac1], bcol + bptr[ac1+1], bval + bptr[ac1],
-            av2, bcol + bptr[ac2], bcol + bptr[ac2+1], bval + bptr[ac2],
-            tm1_col, tm1_val
-            ) - tm1_col;
-
-    // Go by pairs.
-    while(acol + 1 < acol_end) {
-        ac1 = *acol++;
-        ac2 = *acol++;
-
-        av1 = *aval++;
-        av2 = *aval++;
-
-        Col c_col2 = merge_rows(
-                av1, bcol + bptr[ac1], bcol + bptr[ac1+1], bval + bptr[ac1],
-                av2, bcol + bptr[ac2], bcol + bptr[ac2+1], bval + bptr[ac2],
-                tm2_col, tm2_val
-                ) - tm2_col;
-
-        c_col1 = merge_rows(
-                math::identity<Val>(), tm1_col, tm1_col + c_col1, tm1_val,
-                math::identity<Val>(), tm2_col, tm2_col + c_col2, tm2_val,
-                tm3_col, tm3_val
-                ) - tm3_col;
-
-        std::swap(tm3_col, tm1_col);
-        std::swap(tm3_val, tm1_val);
-    }
-
-    // Merge the tail if there is one.
-    if (acol < acol_end) {
-        ac2 = *acol++;
-        av2 = *aval++;
-
-        c_col1 = merge_rows(
-                math::identity<Val>(), tm1_col, tm1_col + c_col1, tm1_val,
-                av2, bcol + bptr[ac2], bcol + bptr[ac2+1], bval + bptr[ac2],
-                tm3_col, tm3_val
-                ) - tm3_col;
-
-        std::swap(tm3_col, tm1_col);
-        std::swap(tm3_val, tm1_val);
-    }
-
-    // If we are lucky, tm1 now points to out.
-    // Otherwise, copy the results.
-    if (tm1_col != out_col) {
-        std::copy(tm1_col, tm1_col + c_col1, out_col);
-        std::copy(tm1_val, tm1_val + c_col1, out_val);
-    }
-}
-
-template <class AMatrix, class BMatrix, class CMatrix>
-void spgemm_rmerge(const AMatrix &A, const BMatrix &B, CMatrix &C) {
-    typedef typename backend::value_type<CMatrix>::type Val;
-    typedef typename backend::col_type<CMatrix>::type Col;
-    typedef ptrdiff_t Idx;
-
-    Idx max_row_width = 0;
-
-#pragma omp parallel
-    {
-        Idx my_max = 0;
-
-#pragma omp for
-        for(int i = 0; i < static_cast<Idx>(A.nrows); ++i) {
-            Idx row_beg = A.ptr[i];
-            Idx row_end = A.ptr[i+1];
-            Idx row_width = 0;
-            for(Idx j = row_beg; j < row_end; ++j) {
-                Idx a_col = A.col[j];
-                row_width += B.ptr[a_col + 1] - B.ptr[a_col];
-            }
-            my_max = std::max(my_max, row_width);
-        }
-
-#pragma omp critical
-        max_row_width = std::max(max_row_width, my_max);
-    }
-
-#ifdef _OPENMP
-    const int nthreads = omp_get_max_threads();
-#else
-    const int nthreads = 1;
-#endif
-
-    std::vector< std::vector<Col> > tmp_col(nthreads);
-    std::vector< std::vector<Val> > tmp_val(nthreads);
-
-    for(int i = 0; i < nthreads; ++i) {
-        tmp_col[i].resize(3 * max_row_width);
-        tmp_val[i].resize(2 * max_row_width);
-    }
-
-    C.set_size(A.nrows, B.ncols);
-    C.ptr[0] = 0;
-
-
-#pragma omp parallel
-    {
-#ifdef _OPENMP
-        const int tid = omp_get_thread_num();
-#else
-        const int tid = 0;
-#endif
-
-        Col *t_col = &tmp_col[tid][0];
-
-#pragma omp for
-        for(Idx i = 0; i < static_cast<Idx>(A.nrows); ++i) {
-            Idx row_beg = A.ptr[i];
-            Idx row_end = A.ptr[i+1];
-
-            C.ptr[i+1] = prod_row_width(
-                    A.col + row_beg, A.col + row_end, B.ptr, B.col,
-                    t_col, t_col + max_row_width, t_col + 2 * max_row_width
-                    );
-        }
-    }
-
-    C.set_nonzeros(C.scan_row_sizes());
-
-#pragma omp parallel
-    {
-#ifdef _OPENMP
-        const int tid = omp_get_thread_num();
-#else
-        const int tid = 0;
-#endif
-
-        Col *t_col = tmp_col[tid].data();
-        Val *t_val = tmp_val[tid].data();
-
-#pragma omp for
-        for(Idx i = 0; i < static_cast<Idx>(A.nrows); ++i) {
-            Idx row_beg = A.ptr[i];
-            Idx row_end = A.ptr[i+1];
-
-            prod_row(
-                    A.col + row_beg, A.col + row_end, A.val + row_beg,
-                    B.ptr, B.col, B.val,
-                    C.col + C.ptr[i], C.val + C.ptr[i],
-                    t_col, t_val, t_col + max_row_width, t_val + max_row_width
-                    );
-        }
-    }
-}
-
-} // namespace backend
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/io/binary.hpp b/src/solvers/amgcl/io/binary.hpp
deleted file mode 100644
index 70a2583..0000000
--- a/src/solvers/amgcl/io/binary.hpp
+++ /dev/null
@@ -1,173 +0,0 @@
-#ifndef AMGCL_IO_BINARY_HPP
-#define AMGCL_IO_BINARY_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/io/binary.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Convenience functions for binary file I/O.
- */
-
-#include <vector>
-#include <string>
-#include <fstream>
-
-#include <amgcl/util.hpp>
-#include <amgcl/detail/sort_row.hpp>
-
-namespace amgcl {
-namespace io {
-
-/// Read single value from a binary file.
-template <class T>
-bool read(std::ifstream &f, T &val) {
-    return static_cast<bool>(f.read((char*)&val, sizeof(T)));
-}
-
-/// Read vector from a binary file.
-template <class T>
-bool read(std::ifstream &f, std::vector<T> &vec) {
-    return static_cast<bool>(f.read((char*)&vec[0], sizeof(T) * vec.size()));
-}
-
-/// Get size of the CRS matrix stored in a binary file
-template <typename IndexType>
-IndexType crs_size(const std::string &fname) {
-    std::ifstream f(fname.c_str(), std::ios::binary);
-    IndexType n;
-
-    precondition(f, "Failed to open matrix file");
-    precondition(read(f, n), "File I/O error");
-
-    return n;
-}
-
-/// Read CRS matrix from a binary file.
-template <typename SizeT, typename Ptr, typename Col, typename Val>
-void read_crs(
-        const std::string &fname,
-        SizeT &n,
-        std::vector<Ptr> &ptr,
-        std::vector<Col> &col,
-        std::vector<Val> &val,
-        ptrdiff_t row_beg = -1,
-        ptrdiff_t row_end = -1
-        )
-{
-    std::ifstream f(fname.c_str(), std::ios::binary);
-    precondition(f, "Failed to open matrix file");
-
-    precondition(read(f, n), "File I/O error");
-
-    if (row_beg < 0) row_beg = 0;
-    if (row_end < 0) row_end = n;
-
-    precondition(row_beg >= 0 && row_end <= static_cast<ptrdiff_t>(n),
-            "Wrong subset of rows is requested");
-
-    ptrdiff_t chunk = row_end - row_beg;
-
-    ptr.resize(chunk + 1);
-
-    size_t ptr_beg = sizeof(SizeT);
-    f.seekg(ptr_beg + row_beg * sizeof(Ptr));
-    precondition(read(f, ptr), "File I/O error");
-
-    Ptr nnz;
-    f.seekg(ptr_beg + n * sizeof(Ptr));
-    precondition(read(f, nnz), "File I/O error");
-
-    SizeT nnz_beg = ptr.front();
-    if (nnz_beg) for(auto &p : ptr) p -= nnz_beg;
-
-    col.resize(ptr.back());
-    val.resize(ptr.back());
-
-    size_t col_beg = ptr_beg + (n + 1) * sizeof(Ptr);
-    f.seekg(col_beg + nnz_beg * sizeof(Col));
-    precondition(read(f, col), "File I/O error");
-
-    f.seekg(col_beg + nnz * sizeof(Col) + nnz_beg * sizeof(Val));
-    precondition(read(f, val), "File I/O error");
-
-#pragma omp parallel for
-    for(ptrdiff_t i = 0; i < chunk; ++i) {
-        Ptr beg = ptr[i];
-        Ptr end = ptr[i + 1];
-        amgcl::detail::sort_row(&col[beg], &val[beg], end - beg);
-    }
-}
-
-template <typename SizeT>
-void dense_size(const std::string &fname, SizeT &n, SizeT &m) {
-    std::ifstream f(fname.c_str(), std::ios::binary);
-    precondition(f, "Failed to open matrix file");
-
-    precondition(read(f, n), "File I/O error");
-    precondition(read(f, m), "File I/O error");
-}
-
-template <typename SizeT, typename Val>
-void read_dense(const std::string &fname,
-        SizeT &n, SizeT &m, std::vector<Val> &v,
-        ptrdiff_t row_beg = -1, ptrdiff_t row_end = -1)
-{
-    std::ifstream f(fname.c_str(), std::ios::binary);
-    precondition(f, "Failed to open matrix file");
-
-    precondition(read(f, n), "File I/O error");
-    precondition(read(f, m), "File I/O error");
-
-    if (row_beg < 0) row_beg = 0;
-    if (row_end < 0) row_end = n;
-
-    precondition(row_beg >= 0 && row_end <= static_cast<ptrdiff_t>(n),
-            "Wrong subset of rows is requested");
-
-    ptrdiff_t chunk = row_end - row_beg;
-
-    v.resize(chunk * m);
-
-    f.seekg(2 * sizeof(SizeT) + row_beg * m * sizeof(Val));
-    precondition(read(f, v), "File I/O error");
-}
-
-/// Write single value to a binary file.
-template <class T>
-bool write(std::ofstream &f, const T &val) {
-    return static_cast<bool>(f.write((char*)&val, sizeof(T)));
-}
-
-/// Write vector to a binary file.
-template <class T>
-bool write(std::ofstream &f, const std::vector<T> &vec) {
-    return static_cast<bool>(f.write((char*)&vec[0], sizeof(T) * vec.size()));
-}
-
-} // namespace io
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/io/ios_saver.hpp b/src/solvers/amgcl/io/ios_saver.hpp
deleted file mode 100644
index 973bbc2..0000000
--- a/src/solvers/amgcl/io/ios_saver.hpp
+++ /dev/null
@@ -1,56 +0,0 @@
-#ifndef AMGCL_IO_IOS_SAVER_HPP
-#define AMGCL_IO_IOS_SAVER_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/io/ios_saver.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Save/Restore std::stream flags.
- */
-
-#include <ios>
-
-namespace amgcl {
-
-// Save ostream flags in constructor, restore in destructor
-struct ios_saver {
-    std::ios_base &s;
-    std::ios_base::fmtflags f;
-    std::streamsize p;
-
-    ios_saver(std::ios_base &s)
-        : s(s), f(s.flags()), p(s.precision())
-    {}
-
-    ~ios_saver() {
-        s.flags(f);
-        s.precision(p);
-    }
-};
-
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/io/mm.hpp b/src/solvers/amgcl/io/mm.hpp
deleted file mode 100644
index a533560..0000000
--- a/src/solvers/amgcl/io/mm.hpp
+++ /dev/null
@@ -1,420 +0,0 @@
-#ifndef AMGCL_IO_MM_HPP
-#define AMGCL_IO_MM_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/io/mm.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Readers for Matrix Market sparse matrices and dense vectors.
- */
-
-#include <vector>
-#include <string>
-#include <fstream>
-#include <sstream>
-#include <numeric>
-
-#include <type_traits>
-#include <tuple>
-
-#include <amgcl/util.hpp>
-#include <amgcl/backend/interface.hpp>
-#include <amgcl/value_type/interface.hpp>
-#include <amgcl/detail/sort_row.hpp>
-
-namespace amgcl {
-namespace io {
-
-/// Matrix market reader.
-class mm_reader {
-    public:
-        /// Open the file by name
-        mm_reader(const std::string &fname) : f(fname) {
-            precondition(f, "Failed to open file \"" + fname + "\"");
-
-            // Read banner.
-            precondition(std::getline(f, line), format_error());
-
-            std::istringstream is(line);
-            std::string banner, mtx, coord, dtype, storage;
-
-            precondition(
-                    is >> banner >> mtx >> coord >> dtype >> storage,
-                    format_error());
-
-            precondition(banner  == "%%MatrixMarket", format_error("no banner"));
-            precondition(mtx     == "matrix",         format_error("not a matrix"));
-
-            if (storage == "general") {
-                _symmetric = false;
-            } else if (storage == "symmetric") {
-                _symmetric = true;
-            } else {
-                precondition(false, "unsupported storage type");
-            }
-
-            if (coord == "coordinate") {
-                _sparse = true;
-            } else if (coord == "array") {
-                _sparse = false;
-            } else {
-                precondition(false, format_error("unsupported coordinate type"));
-            }
-
-            if (dtype == "real") {
-                _complex = false;
-                _integer = false;
-            } else if (dtype == "complex") {
-                _complex = true;
-                _integer = false;
-            } else if (dtype == "integer") {
-                _complex = false;
-                _integer = true;
-            } else {
-                precondition(false, format_error("unsupported data type"));
-            }
-
-            // Skip comments.
-            do {
-                precondition(std::getline(f, line), format_error("unexpected eof"));
-            } while (line[0] == '%');
-
-            // The last line is comment-free and holds the matrix sizes
-            is.clear(); is.str(line);
-            precondition(is >> nrows >> ncols, format_error());
-        }
-
-        /// Matrix in the file is symmetric.
-        bool is_symmetric()  const { return _symmetric; }
-
-        /// Matrix in the file is sparse.
-        bool is_sparse()  const { return _sparse; }
-
-        /// Matrix in the file is complex-valued.
-        bool is_complex() const { return _complex; }
-
-        /// Matrix in the file is integer-valued.
-        bool is_integer() const { return _integer; }
-
-        /// Number of rows.
-        size_t rows() const { return nrows; }
-
-        /// Number of rows.
-        size_t cols() const { return ncols; }
-
-        /// Read sparse matrix from the file.
-        template <typename Idx, typename Val>
-        std::tuple<size_t, size_t> operator()(
-                std::vector<Idx> &ptr,
-                std::vector<Idx> &col,
-                std::vector<Val> &val,
-                ptrdiff_t row_beg = -1,
-                ptrdiff_t row_end = -1
-                )
-        {
-            precondition(_sparse, format_error("not a sparse matrix"));
-            precondition(amgcl::is_complex<Val>::value == _complex,
-                    _complex ?
-                        "attempt to read complex values into real vector" :
-                        "attempt to read real values into complex vector"
-                        );
-            precondition(std::is_integral<Val>::value == _integer,
-                    _integer ?
-                        "attempt to read integer values into real vector" :
-                        "attempt to read real values into integer vector"
-                        );
-
-            // Read sizes
-            ptrdiff_t n, m;
-            size_t nnz;
-            std::istringstream is;
-            {
-                // line already holds the matrix sizes
-                is.clear(); is.str(line);
-                precondition(is >> n >> m >> nnz, format_error());
-            }
-
-            if (row_beg < 0) row_beg = 0;
-            if (row_end < 0) row_end = n;
-
-            precondition(row_beg >= 0 && row_end <= n,
-                    "Wrong subset of rows is requested");
-
-            ptrdiff_t _nnz = _symmetric ? 2 * nnz : nnz;
-
-            if (row_beg != 0 || row_end != n)
-                _nnz *= 1.2 * (row_end - row_beg) / n;
-
-            std::vector<Idx> _row; _row.reserve(_nnz);
-            std::vector<Idx> _col; _col.reserve(_nnz);
-            std::vector<Val> _val; _val.reserve(_nnz);
-
-            ptrdiff_t chunk = row_end - row_beg;
-
-            ptr.resize(chunk + 1); std::fill(ptr.begin(), ptr.end(), 0);
-
-            for(size_t k = 0; k < nnz; ++k) {
-                precondition(std::getline(f, line), format_error("unexpected eof"));
-                is.clear(); is.str(line);
-
-                Idx i, j;
-                Val v;
-
-                precondition(is >> i >> j, format_error());
-
-                i -= 1;
-                j -= 1;
-
-                v = read_value<Val>(is);
-
-                if (row_beg <= i && i < row_end) {
-                    ++ptr[i - row_beg + 1];
-
-                    _row.push_back(i - row_beg);
-                    _col.push_back(j);
-                    _val.push_back(v);
-                }
-
-                if (_symmetric && i != j && row_beg <= j && j < row_end) {
-                    ++ptr[j - row_beg + 1];
-
-                    _row.push_back(j - row_beg);
-                    _col.push_back(i);
-                    _val.push_back(v);
-                }
-            }
-
-            std::partial_sum(ptr.begin(), ptr.end(), ptr.begin());
-
-            col.resize(ptr.back());
-            val.resize(ptr.back());
-
-            for(size_t k = 0, e = val.size(); k < e; ++k) {
-                Idx i = _row[k];
-                Idx j = _col[k];
-                Val v = _val[k];
-
-                Idx head = ptr[i]++;
-                col[head] = j;
-                val[head] = v;
-            }
-
-            std::rotate(ptr.begin(), ptr.end() - 1, ptr.end());
-            ptr.front() = 0;
-
-#pragma omp parallel for
-            for(ptrdiff_t i = 0; i < chunk; ++i) {
-                Idx beg = ptr[i];
-                Idx end = ptr[i+1];
-
-                amgcl::detail::sort_row(&col[0] + beg, &val[0] + beg, end - beg);
-            }
-
-            return std::make_tuple(chunk, m);
-        }
-
-        /// Read dense array from the file.
-        template <typename Val>
-        std::tuple<size_t, size_t> operator()(
-                std::vector<Val> &val,
-                ptrdiff_t row_beg = -1,
-                ptrdiff_t row_end = -1
-                )
-        {
-            precondition(!_sparse, format_error("not a dense array"));
-            precondition(amgcl::is_complex<Val>::value == _complex,
-                    _complex ?
-                        "attempt to read complex values into real vector" :
-                        "attempt to read real values into complex vector"
-                        );
-            precondition(std::is_integral<Val>::value == _integer,
-                    _integer ?
-                        "attempt to read integer values into real vector" :
-                        "attempt to read real values into integer vector"
-                        );
-
-            // Read sizes
-            ptrdiff_t n, m;
-            std::istringstream is;
-            {
-                // line already holds the matrix sizes
-                is.clear(); is.str(line);
-                precondition(is >> n >> m, format_error());
-            }
-
-            if (row_beg < 0) row_beg = 0;
-            if (row_end < 0) row_end = n;
-
-            precondition(row_beg >= 0 && row_end <= n,
-                    "Wrong subset of rows is requested");
-
-            val.resize((row_end - row_beg) * m);
-
-            for(ptrdiff_t j = 0; j < m; ++j) {
-                for(ptrdiff_t i = 0; i < n; ++i) {
-                    precondition(std::getline(f, line), format_error("unexpected eof"));
-                    if (row_beg <= i && i < row_end) {
-                        is.clear(); is.str(line);
-                        val[(i - row_beg) * m + j] = read_value<Val>(is);
-                    }
-                }
-            }
-
-            return std::make_tuple(row_end - row_beg, m);
-        }
-    private:
-        std::ifstream f;
-        std::string line;
-
-        bool _sparse;
-        bool _symmetric;
-        bool _complex;
-        bool _integer;
-
-        size_t nrows, ncols;
-
-        std::string format_error(const std::string &msg = "") const {
-            std::string err_string = "MatrixMarket format error";
-            if (!msg.empty())
-                err_string += " (" + msg + ")";
-            return err_string;
-        }
-
-        template <typename T>
-        typename std::enable_if<amgcl::is_complex<T>::value, T>::type
-        read_value(std::istream &s) {
-            typename math::scalar_of<T>::type x,y;
-            precondition(s >> x >> y, format_error());
-            return T(x,y);
-        }
-
-        template <typename T>
-        typename std::enable_if<!amgcl::is_complex<T>::value, T>::type
-        read_value(std::istream &s) {
-            T x;
-            if (std::is_same<T, char>::value) {
-                // Special case:
-                // We want to read 8bit integers from MatrixMarket, not chars.
-                int i;
-                precondition(s >> i, format_error());
-                x = static_cast<char>(i);
-            } else {
-                precondition(s >> x, format_error());
-            }
-            return x;
-        }
-
-};
-
-namespace detail {
-template <typename Val>
-typename std::enable_if<is_complex<Val>::value, std::ostream&>::type
-write_value(std::ostream &s, Val v) {
-    return s << std::scientific << std::setprecision(20) << std::real(v) << " " << std::imag(v);
-}
-
-template <typename Val>
-typename std::enable_if<!is_complex<Val>::value, std::ostream&>::type
-write_value(std::ostream &s, Val v) {
-    return s << std::scientific << std::setprecision(20) << v;
-}
-
-} // namespace detail
-
-/// Write dense array in Matrix Market format.
-template <typename Val>
-void mm_write(
-        const std::string &fname,
-        const Val *data,
-        size_t rows,
-        size_t cols = 1
-        )
-{
-    std::ofstream f(fname.c_str());
-    precondition(f, "Failed to open file \"" + fname + "\" for writing");
-
-    // Banner
-    f << "%%MatrixMarket matrix array ";
-    if (is_complex<Val>::value) {
-        f << "complex ";
-    } else if(std::is_integral<Val>::value) {
-        f << "integer ";
-    } else {
-        f << "real ";
-    }
-    f << "general\n";
-
-    // Sizes
-    f << rows << " " << cols << "\n";
-
-    // Data
-    for(size_t j = 0; j < cols; ++j) {
-        for(size_t i = 0; i < rows; ++i) {
-            detail::write_value(f, data[i * cols + j]) << "\n";
-        }
-    }
-}
-
-/// Write sparse matrix in Matrix Market format.
-template <class Matrix>
-void mm_write(const std::string &fname, const Matrix &A) {
-    typedef typename backend::value_type<Matrix>::type Val;
-
-    const size_t rows = backend::rows(A);
-    const size_t cols = backend::cols(A);
-    const size_t nnz  = backend::nonzeros(A);
-
-    std::ofstream f(fname.c_str());
-    precondition(f, "Failed to open file \"" + fname + "\" for writing");
-
-    // Banner
-    f << "%%MatrixMarket matrix coordinate ";
-    if (is_complex<Val>::value) {
-        f << "complex ";
-    } else if(std::is_integral<Val>::value) {
-        f << "integer ";
-    } else {
-        f << "real ";
-    }
-    f << "general\n";
-
-    // Sizes
-    f << rows << " " << cols << " " << nnz << "\n";
-
-    // Data
-    for(size_t i = 0; i < rows; ++i) {
-        for(auto a = backend::row_begin(A, i); a; ++a) {
-            f << i + 1 << " " << a.col() + 1 << " ";
-            detail::write_value(f, a.value()) << "\n";
-        }
-    }
-}
-
-} // namespace io
-} // namespace amgcl
-
-
-#endif
diff --git a/src/solvers/amgcl/make_block_solver.hpp b/src/solvers/amgcl/make_block_solver.hpp
deleted file mode 100644
index 97d106d..0000000
--- a/src/solvers/amgcl/make_block_solver.hpp
+++ /dev/null
@@ -1,81 +0,0 @@
-#ifndef AMGCL_MAKE_BLOCK_SOLVER_HPP
-#define AMGCL_MAKE_BLOCK_SOLVER_HPP
-
-#include <amgcl/backend/interface.hpp>
-#include <amgcl/adapter/block_matrix.hpp>
-#include <amgcl/value_type/static_matrix.hpp>
-#include <amgcl/make_solver.hpp>
-#include <amgcl/util.hpp>
-
-namespace amgcl {
-
-namespace backend {
-
-} // namespace backend
-
-/* Creates solver that operates in non-scalar domain but may take scalar inputs
- * for the system matrix and the rhs/solution vectors.
- */
-template <class Precond, class IterativeSolver>
-class make_block_solver {
-    public:
-        typedef typename Precond::backend_type             backend_type;
-        typedef typename backend_type::value_type          value_type;
-        typedef typename backend_type::params              backend_params;
-        typedef typename backend_type::vector              vector;
-        typedef typename math::scalar_of<value_type>::type scalar_type;
-
-        typedef typename make_solver<Precond, IterativeSolver>::params params;
-
-        template <class Matrix>
-        make_block_solver(
-                const Matrix &A,
-                const params &prm = params(),
-                const backend_params &bprm = backend_params()
-                )
-        {
-            S = std::make_shared<Solver>(adapter::block_matrix<value_type>(A), prm, bprm);
-        }
-
-        template <class Matrix, class Vec1, class Vec2>
-        std::tuple<size_t, scalar_type> operator()(
-                const Matrix &A, const Vec1 &rhs, Vec2 &&x) const
-        {
-            auto F = backend::reinterpret_as_rhs<value_type>(rhs);
-            auto X = backend::reinterpret_as_rhs<value_type>(x);
-
-            return (*S)(A, F, X);
-        }
-
-        template <class Vec1, class Vec2>
-        std::tuple<size_t, scalar_type>
-        operator()(const Vec1 &rhs, Vec2 &&x) const {
-            auto F = backend::reinterpret_as_rhs<value_type>(rhs);
-            auto X = backend::reinterpret_as_rhs<value_type>(x);
-
-            return (*S)(F, X);
-        }
-
-        std::shared_ptr<typename Precond::matrix> system_matrix_ptr() const {
-            return S->system_matrix_ptr();
-        }
-
-        typename Precond::matrix const& system_matrix() const {
-            return S->system_matrix();
-        }
-
-        friend std::ostream& operator<<(std::ostream &os, const make_block_solver &p) {
-            return os << *p.S << std::endl;
-        }
-
-        size_t bytes() const {
-            return backend::bytes(*S);
-        }
-    private:
-        typedef make_solver<Precond, IterativeSolver> Solver;
-        std::shared_ptr<Solver> S;
-};
-
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/make_solver.hpp b/src/solvers/amgcl/make_solver.hpp
deleted file mode 100644
index 444e4ec..0000000
--- a/src/solvers/amgcl/make_solver.hpp
+++ /dev/null
@@ -1,230 +0,0 @@
-#ifndef AMGCL_MAKE_SOLVER_HPP
-#define AMGCL_MAKE_SOLVER_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/make_solver.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Tie an iterative solver and a preconditioner in a single class.
- */
-
-#include <type_traits>
-#include <amgcl/backend/builtin.hpp>
-#include <amgcl/util.hpp>
-
-namespace amgcl {
-
-/// Convenience class that bundles together a preconditioner and an iterative solver.
-template <
-    class Precond,
-    class IterativeSolver
-    >
-class make_solver : public amgcl::detail::non_copyable {
-    static_assert(
-            backend::backends_compatible<
-                typename IterativeSolver::backend_type,
-                typename Precond::backend_type
-            >::value,
-            "Backends for preconditioner and iterative solver should be compatible"
-            );
-    public:
-        typedef typename IterativeSolver::backend_type backend_type;
-        typedef typename backend_type::matrix matrix;
-
-        typedef typename backend_type::value_type value_type;
-        typedef typename backend_type::col_type col_type;
-        typedef typename backend_type::ptr_type ptr_type;
-        typedef typename backend_type::params backend_params;
-        typedef typename backend::builtin<value_type, col_type, ptr_type>::matrix build_matrix;
-
-        typedef typename math::scalar_of<value_type>::type scalar_type;
-
-        /** Combined parameters of the bundled preconditioner and the iterative
-         * solver.
-         */
-        struct params {
-            typename Precond::params         precond; ///< Preconditioner parameters.
-            typename IterativeSolver::params solver;  ///< Iterative solver parameters.
-
-            params() {}
-
-#ifndef AMGCL_NO_BOOST
-            params(const boost::property_tree::ptree &p)
-                : AMGCL_PARAMS_IMPORT_CHILD(p, precond),
-                  AMGCL_PARAMS_IMPORT_CHILD(p, solver)
-            {
-                check_params(p, {"precond", "solver"});
-            }
-
-            void get( boost::property_tree::ptree &p,
-                    const std::string &path = ""
-                    ) const
-            {
-                AMGCL_PARAMS_EXPORT_CHILD(p, path, precond);
-                AMGCL_PARAMS_EXPORT_CHILD(p, path, solver);
-            }
-#endif
-        } prm;
-
-        /** Sets up the preconditioner and creates the iterative solver. */
-        template <class Matrix>
-        make_solver(
-                const Matrix &A,
-                const params &prm = params(),
-                const backend_params &bprm = backend_params()
-                ) :
-            prm(prm), n(backend::rows(A)),
-            P(A, prm.precond, bprm),
-            S(backend::rows(A), prm.solver, bprm)
-        {}
-
-        // Constructs the preconditioner and creates iterative solver.
-        // Takes shared pointer to the matrix in internal format.
-        make_solver(
-                std::shared_ptr<build_matrix> A,
-                const params &prm = params(),
-                const backend_params &bprm = backend_params()
-                ) :
-            prm(prm), n(backend::rows(*A)),
-            P(A, prm.precond, bprm),
-            S(backend::rows(*A), prm.solver, bprm)
-        {}
-
-        /** Computes the solution for the given system matrix \p A and the
-         * right-hand side \p rhs.  Returns the number of iterations made and
-         * the achieved residual as a ``std::tuple``. The solution vector
-         * \p x provides initial approximation in input and holds the computed
-         * solution on output.
-         *
-         * \rst
-         * The system matrix may differ from the matrix used during
-         * initialization. This may be used for the solution of non-stationary
-         * problems with slowly changing coefficients. There is a strong chance
-         * that a preconditioner built for a time step will act as a reasonably
-         * good preconditioner for several subsequent time steps [DeSh12]_.
-         * \endrst
-         */
-        template <class Matrix, class Vec1, class Vec2>
-        std::tuple<size_t, scalar_type> operator()(
-                const Matrix &A, const Vec1 &rhs, Vec2 &&x) const
-        {
-            return S(A, P, rhs, x);
-        }
-
-        /** Computes the solution for the given right-hand side \p rhs.
-         * Returns the number of iterations made and the achieved residual as a
-         * ``std::tuple``. The solution vector \p x provides initial
-         * approximation in input and holds the computed solution on output.
-         */
-        template <class Vec1, class Vec2>
-        std::tuple<size_t, scalar_type> operator()(const Vec1 &rhs, Vec2 &&x) const {
-            return S(P, rhs, x);
-        }
-
-        /** Acts as a preconditioner. That is, applies the solver to the
-         * right-hand side \p rhs to get the solution \p x with zero initial
-         * approximation.  Iterative methods usually use estimated residual for
-         * exit condition.  For some problems the value of the estimated
-         * residual can get too far from the true residual due to round-off
-         * errors.  Nesting iterative solvers in this way may allow to shave
-         * the last bits off the error. The method should not be used directly
-         * but rather allows nesting ``make_solver`` classes as in the
-         * following example:
-         *
-         * \rst
-         * .. code-block:: cpp
-         *
-         *   typedef amgcl::make_solver<
-         *     amgcl::make_solver<
-         *       amgcl::amg<
-         *         Backend, amgcl::coarsening::smoothed_aggregation, amgcl::relaxation::spai0
-         *         >,
-         *       amgcl::solver::cg<Backend>
-         *       >,
-         *     amgcl::solver::cg<Backend>
-         *     > NestedSolver;
-         * \endrst
-         */
-        template <class Vec1, class Vec2>
-        void apply(const Vec1 &rhs, Vec2 &&x) const {
-            backend::clear(x);
-            (*this)(rhs, x);
-        }
-
-        /// Returns reference to the constructed preconditioner.
-        const Precond& precond() const {
-            return P;
-        }
-
-        /// Returns reference to the constructed preconditioner.
-        Precond& precond() {
-            return P;
-        }
-
-        /// Returns reference to the constructed iterative solver.
-        const IterativeSolver& solver() const {
-            return S;
-        }
-
-        /// Returns the system matrix in the backend format.
-        std::shared_ptr<typename Precond::matrix> system_matrix_ptr() const {
-            return P.system_matrix_ptr();
-        }
-
-        typename Precond::matrix const& system_matrix() const {
-            return P.system_matrix();
-        }
-
-#ifndef AMGCL_NO_BOOST
-        /// Stores the parameters used during construction into the property tree \p p.
-        void get_params(boost::property_tree::ptree &p) const {
-            prm.get(p);
-        }
-#endif
-
-        /// Returns the size of the system matrix.
-        size_t size() const {
-            return n;
-        }
-
-        size_t bytes() const {
-            return backend::bytes(S) + backend::bytes(P);
-        }
-
-        friend std::ostream& operator<<(std::ostream &os, const make_solver &p) {
-            return os
-                << "Solver\n======\n" << p.S << std::endl
-                << "Preconditioner\n==============\n" << p.P;
-        }
-    private:
-        size_t           n;
-        Precond          P;
-        IterativeSolver  S;
-};
-
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/mpi/amg.hpp b/src/solvers/amgcl/mpi/amg.hpp
deleted file mode 100644
index 3f2ffa8..0000000
--- a/src/solvers/amgcl/mpi/amg.hpp
+++ /dev/null
@@ -1,499 +0,0 @@
-#ifndef AMGCL_MPI_AMG_HPP
-#define AMGCL_MPI_AMG_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/mpi/amg.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Distributed memory AMG preconditioner.
- */
-
-#include <iostream>
-#include <iomanip>
-#include <list>
-#include <memory>
-
-#include <amgcl/backend/interface.hpp>
-#include <amgcl/value_type/interface.hpp>
-#include <amgcl/mpi/util.hpp>
-#include <amgcl/mpi/distributed_matrix.hpp>
-#include <amgcl/mpi/direct_solver/skyline_lu.hpp>
-#include <amgcl/mpi/partition/merge.hpp>
-
-namespace amgcl {
-namespace mpi {
-
-template <
-    class Backend,
-    class Coarsening,
-    class Relaxation,
-    class DirectSolver = direct::skyline_lu<typename Backend::value_type>,
-    class Repartition = partition::merge<Backend>
-    >
-class amg {
-    public:
-        typedef Backend                                    backend_type;
-        typedef typename Backend::params                   backend_params;
-        typedef typename Backend::value_type               value_type;
-        typedef typename math::scalar_of<value_type>::type scalar_type;
-        typedef distributed_matrix<Backend>                matrix;
-        typedef typename Backend::vector                   vector;
-
-        struct params {
-            typedef typename Coarsening::params   coarsening_params;
-            typedef typename Relaxation::params   relax_params;
-            typedef typename DirectSolver::params direct_params;
-            typedef typename Repartition::params  repart_params;
-
-            coarsening_params coarsening;   ///< Coarsening parameters.
-            relax_params      relax;        ///< Relaxation parameters.
-            direct_params     direct;       ///< Direct solver parameters.
-            repart_params     repart;       ///< Repartition parameters.
-
-            /// Specifies when level is coarse enough to be solved directly.
-            /**
-             * If number of variables at a next level in the hierarchy becomes
-             * lower than this threshold, then the hierarchy construction is
-             * stopped and the linear system is solved directly at this level.
-             */
-            unsigned coarse_enough;
-
-            /// Use direct solver at the coarsest level.
-            /**
-             * When set, the coarsest level is solved with a direct solver.
-             * Otherwise a smoother is used as a solver.
-             */
-            bool direct_coarse;
-
-            /// Maximum number of levels.
-            /** If this number is reached while the size of the last level is
-             * greater that `coarse_enough`, then the coarsest level will not
-             * be solved exactly, but will use a smoother.
-             */
-            unsigned max_levels;
-
-            /// Number of pre-relaxations.
-            unsigned npre;
-
-            /// Number of post-relaxations.
-            unsigned npost;
-
-            /// Number of cycles (1 for V-cycle, 2 for W-cycle, etc.).
-            unsigned ncycle;
-
-            /// Number of cycles to make as part of preconditioning.
-            unsigned pre_cycles;
-
-            /// Keep matrices in internal format to allow for quick rebuild of the hierarchy
-            bool allow_rebuild;
-
-            params() :
-                coarse_enough(DirectSolver::coarse_enough()), direct_coarse(true),
-                max_levels( std::numeric_limits<unsigned>::max() ),
-                npre(1), npost(1), ncycle(1), pre_cycles(1),
-                allow_rebuild(false)
-            {}
-
-#ifndef AMGCL_NO_BOOST
-            params(const boost::property_tree::ptree &p)
-                : AMGCL_PARAMS_IMPORT_CHILD(p, coarsening),
-                  AMGCL_PARAMS_IMPORT_CHILD(p, relax),
-                  AMGCL_PARAMS_IMPORT_CHILD(p, direct),
-                  AMGCL_PARAMS_IMPORT_CHILD(p, repart),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, coarse_enough),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, direct_coarse),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, max_levels),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, npre),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, npost),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, ncycle),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, pre_cycles),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, allow_rebuild)
-            {
-                check_params(p, {"coarsening", "relax", "direct", "repart",
-                        "coarse_enough",  "direct_coarse", "max_levels",
-                        "npre", "npost", "ncycle", "pre_cycles",
-                        "allow_rebuild"});
-
-                amgcl::precondition(max_levels > 0, "max_levels should be positive");
-            }
-
-            void get(
-                    boost::property_tree::ptree &p,
-                    const std::string &path = ""
-                    ) const
-            {
-                AMGCL_PARAMS_EXPORT_CHILD(p, path, coarsening);
-                AMGCL_PARAMS_EXPORT_CHILD(p, path, relax);
-                AMGCL_PARAMS_EXPORT_CHILD(p, path, direct);
-                AMGCL_PARAMS_EXPORT_CHILD(p, path, repart);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, coarse_enough);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, direct_coarse);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, max_levels);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, npre);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, npost);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, ncycle);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, pre_cycles);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, allow_rebuild);
-            }
-#endif
-        } prm;
-
-        template <class Matrix>
-        amg(
-                communicator comm,
-                const Matrix &A,
-                const params &prm = params(),
-                const backend_params &bprm = backend_params()
-           ) : prm(prm), comm(comm), repart(prm.repart)
-        {
-            init(std::make_shared<matrix>(comm, A, backend::rows(A)), bprm);
-        }
-
-        amg(
-                communicator comm,
-                std::shared_ptr<matrix> A,
-                const params &prm = params(),
-                const backend_params &bprm = backend_params()
-           ) : prm(prm), comm(comm), repart(prm.repart)
-        {
-            init(A, bprm);
-        }
-
-        /// Rebuild the hierarchy using the new system matrix.
-        /**
-         * This requires for prm.allow_rebuild to be set. The transfer
-         * operators created during the initial setup are reused.
-         */
-        template <class Matrix>
-        void rebuild(
-                const Matrix &M,
-                const backend_params &bprm = backend_params()
-                )
-        {
-            rebuild(std::make_shared<matrix>(comm, M, backend::rows(M)), bprm);
-        }
-
-        void rebuild(
-                std::shared_ptr<matrix> A,
-                const backend_params &bprm = backend_params()
-                )
-        {
-            precondition(prm.allow_rebuild,
-                    "allow_rebuild is not set!");
-            precondition(
-                    A->glob_rows() == system_matrix().glob_rows() &&
-                    A->glob_cols() == system_matrix().glob_cols(),
-                    "Matrix dimensions differ from the original ones!"
-                    );
-
-            AMGCL_TIC("rebuild");
-            Coarsening C(prm.coarsening);
-            for(auto &level : levels) {
-                A = level.rebuild(A, C, prm, bprm);
-            }
-            AMGCL_TOC("rebuild");
-        }
-
-        template <class Vec1, class Vec2>
-        void cycle(const Vec1 &rhs, Vec2 &&x) const {
-            cycle(levels.begin(), rhs, x);
-        }
-
-        template <class Vec1, class Vec2>
-        void apply(const Vec1 &rhs, Vec2 &&x) const {
-            if (prm.pre_cycles) {
-                backend::clear(x);
-                for(unsigned i = 0; i < prm.pre_cycles; ++i)
-                    cycle(levels.begin(), rhs, x);
-            } else {
-                backend::copy(rhs, x);
-            }
-        }
-
-        /// Returns the system matrix from the finest level.
-        std::shared_ptr<matrix> system_matrix_ptr() const {
-            return A;
-        }
-
-        const matrix& system_matrix() const {
-            return *system_matrix_ptr();
-        }
-    private:
-        struct level {
-            ptrdiff_t nrows, nnz;
-            int active_procs;
-
-            std::shared_ptr<matrix>       A, P, R;
-            std::shared_ptr<vector>       f, u, t;
-            std::shared_ptr<Relaxation>   relax;
-            std::shared_ptr<DirectSolver> solve;
-
-            level() {}
-
-            level(
-                    std::shared_ptr<matrix> a,
-                    params &prm,
-                    const backend_params &bprm,
-                    bool direct = false
-                 )
-                : nrows(a->glob_rows()), nnz(a->glob_nonzeros()),
-                  f(Backend::create_vector(a->loc_rows(), bprm)),
-                  u(Backend::create_vector(a->loc_rows(), bprm))
-            {
-                int active = (a->loc_rows() > 0);
-                active_procs = a->comm().reduce(MPI_SUM, active);
-
-                sort_rows(*a);
-
-                if (direct) {
-                    AMGCL_TIC("direct solver");
-                    solve = std::make_shared<DirectSolver>(a->comm(), *a, prm.direct);
-                    AMGCL_TOC("direct solver");
-                } else {
-                    A = a;
-                    t = Backend::create_vector(a->loc_rows(), bprm);
-
-                    AMGCL_TIC("relaxation");
-                    relax = std::make_shared<Relaxation>(*a, prm.relax, bprm);
-                    AMGCL_TOC("relaxation");
-                }
-            }
-
-            std::shared_ptr<matrix> step_down(Coarsening &C, const Repartition &repart)
-            {
-                AMGCL_TIC("transfer operators");
-                std::tie(P, R) = C.transfer_operators(*A);
-
-                AMGCL_TIC("sort");
-                sort_rows(*P);
-                sort_rows(*R);
-                AMGCL_TOC("sort");
-
-                AMGCL_TOC("transfer operators");
-
-                if (P->glob_cols() == 0) {
-                    // Zero-sized coarse level in amgcl (diagonal matrix?)
-                    return std::shared_ptr<matrix>();
-                }
-
-                AMGCL_TIC("coarse operator");
-                auto Ac = C.coarse_operator(*A, *P, *R);
-                AMGCL_TOC("coarse operator");
-
-                if (repart.is_needed(*Ac)) {
-                    AMGCL_TIC("partition");
-                    auto I = repart(*Ac, block_size(C));
-                    auto J = transpose(*I);
-
-                    P  = product(*P, *I);
-                    R  = product(*J, *R);
-                    Ac = product(*J, *product(*Ac, *I));
-                    AMGCL_TOC("partition");
-                }
-
-                return Ac;
-            }
-
-            std::shared_ptr<matrix> rebuild(
-                    std::shared_ptr<matrix> A,
-                    const Coarsening &C,
-                    const params &prm,
-                    const backend_params &bprm
-                    )
-            {
-                if (relax) {
-                    relax = std::make_shared<Relaxation>(*A, prm.relax, bprm);
-                }
-
-                if (solve) {
-                    solve = std::make_shared<DirectSolver>(A->comm(), *A, prm.direct);
-                }
-
-                if (this->A) {
-                    this->A = A;
-                }
-
-                if (P && R) {
-                    A = C.coarse_operator(*A, *P, *R);
-                }
-
-                if (this->A) {
-                    this->A->move_to_backend(bprm);
-                }
-
-                return A;
-            }
-
-            void move_to_backend(const backend_params &bprm, bool keep_src = false) {
-                AMGCL_TIC("move to backend");
-                if (A) A->move_to_backend(bprm);
-                if (P) P->move_to_backend(bprm, keep_src);
-                if (R) R->move_to_backend(bprm, keep_src);
-                AMGCL_TOC("move to backend");
-            }
-
-            ptrdiff_t rows() const {
-                return nrows;
-            }
-
-            ptrdiff_t nonzeros() const {
-                return nnz;
-            }
-        };
-
-        typedef typename std::list<level>::const_iterator level_iterator;
-
-        communicator comm;
-        std::shared_ptr<matrix> A;
-        Repartition repart;
-        std::list<level> levels;
-
-        void init(std::shared_ptr<matrix> A, const backend_params &bprm)
-        {
-            A->comm().check(A->glob_rows() == A->glob_cols(), "Matrix should be square!");
-
-            this->A = A;
-            Coarsening C(prm.coarsening);
-            bool need_coarse = true;
-
-            while(A->glob_rows() > prm.coarse_enough) {
-                levels.push_back( level(A, prm, bprm) );
-
-                if (levels.size() >= prm.max_levels) {
-                    levels.back().move_to_backend(bprm, prm.allow_rebuild);
-                    break;
-                }
-
-                A = levels.back().step_down(C, repart);
-                levels.back().move_to_backend(bprm, prm.allow_rebuild);
-
-                if (!A) {
-                    // Zero-sized coarse level. Probably the system matrix on
-                    // this level is diagonal, should be easily solvable with a
-                    // couple of smoother iterations.
-                    need_coarse = false;
-                    break;
-                }
-            }
-
-            if (!A || A->glob_rows() > prm.coarse_enough) {
-                // The coarse matrix is still too big to be solved directly.
-                need_coarse = false;
-            }
-
-            if (A && need_coarse) {
-                levels.push_back(level(A, prm, bprm, prm.direct_coarse));
-                levels.back().move_to_backend(bprm, prm.allow_rebuild);
-            }
-
-            AMGCL_TIC("move to backend");
-            this->A->move_to_backend(bprm);
-            AMGCL_TOC("move to backend");
-        }
-
-        template <class Vec1, class Vec2>
-        void cycle(level_iterator lvl, const Vec1 &rhs, Vec2 &x) const {
-            level_iterator nxt = lvl, end = levels.end();
-            ++nxt;
-
-            if (nxt == end) {
-                if (lvl->solve) {
-                    AMGCL_TIC("direct solver");
-                    (*lvl->solve)(rhs, x);
-                    AMGCL_TOC("direct solver");
-                } else {
-                    AMGCL_TIC("relax");
-                    for (size_t i = 0; i < prm.npre;  ++i) lvl->relax->apply_pre(*lvl->A, rhs, x, *lvl->t);
-                    for (size_t i = 0; i < prm.npost; ++i) lvl->relax->apply_post(*lvl->A, rhs, x, *lvl->t);
-                    AMGCL_TOC("relax");
-                }
-            } else {
-                for (size_t j = 0; j < prm.ncycle; ++j) {
-                    AMGCL_TIC("relax");
-                    for(size_t i = 0; i < prm.npre; ++i)
-                        lvl->relax->apply_pre(*lvl->A, rhs, x, *lvl->t);
-                    AMGCL_TOC("relax");
-
-                    backend::residual(rhs, *lvl->A, x, *lvl->t);
-
-                    backend::spmv(math::identity<scalar_type>(), *lvl->R, *lvl->t, math::zero<scalar_type>(), *nxt->f);
-
-                    backend::clear(*nxt->u);
-                    cycle(nxt, *nxt->f, *nxt->u);
-
-                    backend::spmv(math::identity<scalar_type>(), *lvl->P, *nxt->u, math::identity<scalar_type>(), x);
-
-                    AMGCL_TIC("relax");
-                    for(size_t i = 0; i < prm.npost; ++i)
-                        lvl->relax->apply_post(*lvl->A, rhs, x, *lvl->t);
-                    AMGCL_TOC("relax");
-                }
-            }
-        }
-
-    template <class B, class C, class R, class D, class I>
-    friend std::ostream& operator<<(std::ostream &os, const amg<B, C, R, D, I> &a);
-};
-
-template <class B, class C, class R, class D, class I>
-std::ostream& operator<<(std::ostream &os, const amg<B, C, R, D, I> &a)
-{
-    typedef typename amg<B, C, R, D, I>::level level;
-    ios_saver ss(os);
-
-    size_t sum_dof = 0;
-    size_t sum_nnz = 0;
-
-    for(const level &lvl : a.levels) {
-        sum_dof += lvl.rows();
-        sum_nnz += lvl.nonzeros();
-    }
-
-    os << "Number of levels:    "   << a.levels.size()
-        << "\nOperator complexity: " << std::fixed << std::setprecision(2)
-        << 1.0 * sum_nnz / a.levels.front().nonzeros()
-        << "\nGrid complexity:     " << std::fixed << std::setprecision(2)
-        << 1.0 * sum_dof / a.levels.front().rows()
-        << "\n\nlevel     unknowns       nonzeros\n"
-        << "---------------------------------\n";
-
-    size_t depth = 0;
-    for(const level &lvl : a.levels) {
-        os << std::setw(5)  << depth++
-           << std::setw(13) << lvl.rows()
-           << std::setw(15) << lvl.nonzeros() << " ("
-           << std::setw(5) << std::fixed << std::setprecision(2)
-           << 100.0 * lvl.nonzeros() / sum_nnz
-           << "%) [" << lvl.active_procs << "]" << std::endl;
-    }
-
-    return os;
-}
-
-} // namespace mpi
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/mpi/block_preconditioner.hpp b/src/solvers/amgcl/mpi/block_preconditioner.hpp
deleted file mode 100644
index c5efe4f..0000000
--- a/src/solvers/amgcl/mpi/block_preconditioner.hpp
+++ /dev/null
@@ -1,105 +0,0 @@
-#ifndef AMGCL_MPI_BLOCK_PRECONDITIONER_HPP
-#define AMGCL_MPI_BLOCK_PRECONDITIONER_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/mpi/block_preconditioner.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Distributed block preconditioner.
- */
-
-#include <vector>
-
-#include <memory>
-
-#include <mpi.h>
-
-#include <amgcl/backend/builtin.hpp>
-#include <amgcl/mpi/util.hpp>
-#include <amgcl/mpi/inner_product.hpp>
-#include <amgcl/mpi/distributed_matrix.hpp>
-
-namespace amgcl {
-namespace mpi {
-
-template <class Precond>
-class block_preconditioner {
-    public:
-        typedef typename Precond::params       params;
-        typedef typename Precond::backend_type backend_type;
-        typedef typename backend_type::params  backend_params;
-
-        typedef typename backend_type::value_type value_type;
-        typedef typename backend_type::matrix     bmatrix;
-        typedef distributed_matrix<backend_type>  matrix;
-
-        template <class Matrix>
-        block_preconditioner(
-                communicator comm,
-                const Matrix &Astrip,
-                const params &prm = params(),
-                const backend_params &bprm = backend_params()
-                )
-        {
-            A = std::make_shared<matrix>(comm, Astrip, backend::rows(Astrip));
-            P = std::make_shared<Precond>(A->local(), prm, bprm);
-            A->set_local(P->system_matrix_ptr());
-            A->move_to_backend(bprm);
-        }
-
-        block_preconditioner(
-                communicator,
-                std::shared_ptr<matrix> A,
-                const params &prm = params(),
-                const backend_params &bprm = backend_params()
-                ) : A(A)
-        {
-            P = std::make_shared<Precond>(A->local(), prm, bprm);
-            A->set_local(P->system_matrix_ptr());
-            A->move_to_backend(bprm);
-        }
-
-        std::shared_ptr<matrix> system_matrix_ptr() const {
-            return A;
-        }
-
-        const matrix& system_matrix() const {
-            return *A;
-        }
-
-        template <class Vec1, class Vec2>
-        void apply(const Vec1 &rhs, Vec2 &&x) const {
-            P->apply(rhs, x);
-        }
-    private:
-        std::shared_ptr<matrix>  A;
-        std::shared_ptr<Precond> P;
-};
-
-} // namespace mpi
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/mpi/coarsening/aggregation.hpp b/src/solvers/amgcl/mpi/coarsening/aggregation.hpp
deleted file mode 100644
index 106bd9e..0000000
--- a/src/solvers/amgcl/mpi/coarsening/aggregation.hpp
+++ /dev/null
@@ -1,124 +0,0 @@
-#ifndef AMGCL_MPI_COARSENING_AGGREGATION_HPP
-#define AMGCL_MPI_COARSENING_AGGREGATION_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/mpi/coarsening/aggregation.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Distributed non-smoothed aggregation coarsening scheme.
- */
-
-#include <tuple>
-#include <memory>
-
-#include <amgcl/backend/builtin.hpp>
-#include <amgcl/util.hpp>
-#include <amgcl/coarsening/detail/scaled_galerkin.hpp>
-#include <amgcl/mpi/util.hpp>
-#include <amgcl/mpi/distributed_matrix.hpp>
-#include <amgcl/mpi/coarsening/pmis.hpp>
-
-namespace amgcl {
-namespace mpi {
-namespace coarsening {
-
-template <class Backend>
-struct aggregation {
-    typedef typename Backend::value_type value_type;
-    typedef typename math::scalar_of<value_type>::type scalar_type;
-    typedef backend::crs<value_type> build_matrix;
-
-    struct params {
-        // aggregation params
-        typedef typename pmis<Backend>::params aggr_params;
-        aggr_params aggr;
-
-        /// Over-interpolation factor \f$\alpha\f$.
-        /**
-         * In case of aggregation coarsening, coarse-grid
-         * correction of smooth error, and by this the overall convergence, can
-         * often be substantially improved by using "over-interpolation", that is,
-         * by multiplying the actual correction (corresponding to piecewise
-         * constant interpolation) by some factor \f$\alpha > 1\f$. Equivalently,
-         * this means that the coarse-level Galerkin operator is re-scaled by
-         * \f$1 / \alpha\f$:
-         * \f[I_h^HA_hI_H^h \to \frac{1}{\alpha}I_h^HA_hI_H^h.\f]
-         *
-         * \sa  \cite Stuben1999, Section 9.1 "Re-scaling of the Galerkin operator".
-         */
-        float over_interp;
-
-        params() : over_interp(1.5f) { }
-
-#ifndef AMGCL_NO_BOOST
-        params(const boost::property_tree::ptree &p)
-            : AMGCL_PARAMS_IMPORT_CHILD(p, aggr),
-              AMGCL_PARAMS_IMPORT_VALUE(p, over_interp)
-        {
-            check_params(p, {"aggr", "over_interp"});
-        }
-
-        void get(boost::property_tree::ptree &p, const std::string &path) const {
-            AMGCL_PARAMS_EXPORT_CHILD(p, path, aggr);
-            AMGCL_PARAMS_EXPORT_VALUE(p, path, over_interp);
-        }
-#endif
-    } prm;
-
-    aggregation(const params &prm = params()) : prm(prm) {}
-
-    std::tuple<
-        std::shared_ptr< distributed_matrix<Backend> >,
-        std::shared_ptr< distributed_matrix<Backend> >
-        >
-    transfer_operators(const distributed_matrix<Backend> &A) {
-        pmis<Backend> aggr(A, prm.aggr);
-        return std::make_tuple(aggr.p_tent, transpose(*aggr.p_tent));
-    }
-
-    std::shared_ptr< distributed_matrix<Backend> >
-    coarse_operator(
-            const distributed_matrix<Backend> &A,
-            const distributed_matrix<Backend> &P,
-            const distributed_matrix<Backend> &R
-            ) const
-    {
-        return amgcl::coarsening::detail::scaled_galerkin(A, P, R, 1 / prm.over_interp);
-    }
-
-};
-
-template <class Backend>
-unsigned block_size(const aggregation<Backend> &c) {
-    return c.prm.aggr.block_size;
-}
-
-} // namespace coarsening
-} // namespace mpi
-} // namespace amgcl
-
-
-#endif
diff --git a/src/solvers/amgcl/mpi/coarsening/pmis.hpp b/src/solvers/amgcl/mpi/coarsening/pmis.hpp
deleted file mode 100644
index 315651e..0000000
--- a/src/solvers/amgcl/mpi/coarsening/pmis.hpp
+++ /dev/null
@@ -1,1122 +0,0 @@
-#ifndef AMGCL_MPI_COARSENING_PMIS_HPP
-#define AMGCL_MPI_COARSENING_PMIS_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/mpi/coarsening/pmis.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Distributed PMIS aggregation.
- */
-
-#include <tuple>
-#include <memory>
-#include <numeric>
-#include <cassert>
-
-#include <amgcl/backend/builtin.hpp>
-#include <amgcl/util.hpp>
-#include <amgcl/mpi/util.hpp>
-#include <amgcl/mpi/distributed_matrix.hpp>
-#include <amgcl/coarsening/tentative_prolongation.hpp>
-
-namespace amgcl {
-namespace mpi {
-namespace coarsening {
-
-template <class Backend>
-struct pmis {
-    typedef typename Backend::value_type value_type;
-    typedef typename math::scalar_of<value_type>::type scalar_type;
-    typedef distributed_matrix<Backend> matrix;
-    typedef comm_pattern<Backend> CommPattern;
-    typedef backend::crs<value_type> build_matrix;
-    typedef backend::builtin<char> bool_backend;
-    typedef backend::crs<char>     bool_matrix;
-
-
-    struct params {
-        /// Near nullspace parameters.
-        amgcl::coarsening::nullspace_params nullspace;
-
-        // Strong connectivity threshold
-        scalar_type eps_strong;
-
-        // Block size for non-scalar problems.
-        unsigned    block_size;
-
-        params() : eps_strong(0.08), block_size(1) { }
-
-#ifndef AMGCL_NO_BOOST
-        params(const boost::property_tree::ptree &p)
-            : AMGCL_PARAMS_IMPORT_CHILD(p, nullspace),
-              AMGCL_PARAMS_IMPORT_VALUE(p, eps_strong),
-              AMGCL_PARAMS_IMPORT_VALUE(p, block_size)
-        {
-            check_params(p, {"nullspace", "eps_strong", "block_size"});
-        }
-
-        void get(boost::property_tree::ptree &p, const std::string &path) const {
-            AMGCL_PARAMS_EXPORT_CHILD(p, path, nullspace);
-            AMGCL_PARAMS_EXPORT_VALUE(p, path, eps_strong);
-            AMGCL_PARAMS_EXPORT_VALUE(p, path, block_size);
-        }
-#endif
-    } &prm;
-
-    std::shared_ptr< distributed_matrix<bool_backend> > conn;
-    std::shared_ptr< matrix > p_tent;
-
-    pmis(const matrix &A, params &prm) : prm(prm) {
-        ptrdiff_t n = A.loc_rows();
-        std::vector<ptrdiff_t> state(n);
-        std::vector<int>       owner(n);
-
-        if (prm.block_size == 1) {
-            conn = conn_strength(A, prm.eps_strong);
-
-            ptrdiff_t naggr = aggregates(*conn, state, owner);
-            p_tent = tentative_prolongation(A.comm(), n, naggr, state, owner);
-        } else {
-            typedef typename math::scalar_of<value_type>::type scalar;
-            typedef backend::builtin<scalar> sbackend;
-
-            ptrdiff_t np = n / prm.block_size;
-
-            assert(np * prm.block_size == n && "Matrix size should be divisible by block_size");
-
-            distributed_matrix<sbackend> A_pw(A.comm(),
-                pointwise_matrix(*A.local(),  prm.block_size),
-                pointwise_matrix(*A.remote(), prm.block_size)
-                );
-
-            auto conn_pw = conn_strength(A_pw, prm.eps_strong);
-
-            std::vector<ptrdiff_t> state_pw(np);
-            std::vector<int>       owner_pw(np);
-
-            ptrdiff_t naggr = aggregates(*conn_pw, state_pw, owner_pw);
-
-            conn = std::make_shared< distributed_matrix<bool_backend> >(
-                    A.comm(),
-                    expand_conn(*A.local(),  *A_pw.local(),  *conn_pw->local(),  prm.block_size),
-                    expand_conn(*A.remote(), *A_pw.remote(), *conn_pw->remote(), prm.block_size)
-                    );
-
-#pragma omp parallel for
-            for(ptrdiff_t ip = 0; ip < np; ++ip) {
-                ptrdiff_t i = ip * prm.block_size;
-                ptrdiff_t s = state_pw[ip];
-                int       o = owner_pw[ip];
-
-                for(unsigned k = 0; k < prm.block_size; ++k) {
-                    state[i + k] = (s < 0) ? s : (s * prm.block_size + k);
-                    owner[i + k] = o;
-                }
-            }
-
-            p_tent = tentative_prolongation(A.comm(), n, naggr * prm.block_size, state, owner);
-        }
-    }
-
-    std::shared_ptr< distributed_matrix<bool_backend> >
-    squared_interface(const distributed_matrix<bool_backend> &A) {
-        const comm_pattern<bool_backend> &C = A.cpat();
-
-        bool_matrix &A_loc = *A.local();
-        bool_matrix &A_rem = *A.remote();
-
-        ptrdiff_t A_rows = A.loc_rows();
-
-        ptrdiff_t A_beg = A.loc_col_shift();
-        ptrdiff_t A_end = A_beg + A_rows;
-
-        auto a_nbr = remote_rows(C, A, false);
-        bool_matrix &A_nbr = *a_nbr;
-
-        // Build mapping from global to local column numbers in the remote part of
-        // the square matrix.
-        std::vector<ptrdiff_t> rem_cols(A_rem.nnz + A_nbr.nnz);
-
-        std::copy(A_nbr.col, A_nbr.col + A_nbr.nnz,
-                std::copy(A_rem.col, A_rem.col + A_rem.nnz, rem_cols.begin()));
-
-        std::sort(rem_cols.begin(), rem_cols.end());
-        rem_cols.erase(std::unique(rem_cols.begin(), rem_cols.end()), rem_cols.end());
-
-        ptrdiff_t n_rem_cols = 0;
-        std::unordered_map<ptrdiff_t, int> rem_idx(2 * rem_cols.size());
-        for(ptrdiff_t c : rem_cols) {
-            if (c >= A_beg && c < A_end) continue;
-            rem_idx[c] = n_rem_cols++;
-        }
-
-        // Build the product.
-        auto s_loc = std::make_shared<bool_matrix>();
-        auto s_rem = std::make_shared<bool_matrix>();
-
-        bool_matrix &S_loc = *s_loc;
-        bool_matrix &S_rem = *s_rem;
-
-        S_loc.set_size(A_rows, A_rows, false);
-        S_rem.set_size(A_rows, 0,      false);
-
-        S_loc.ptr[0] = 0;
-        S_rem.ptr[0] = 0;
-
-        AMGCL_TIC("analyze");
-#pragma omp parallel
-        {
-            std::vector<ptrdiff_t> loc_marker(A_rows,     -1);
-            std::vector<ptrdiff_t> rem_marker(n_rem_cols, -1);
-
-#pragma omp for
-            for(ptrdiff_t ia = 0; ia < A_rows; ++ia) {
-                ptrdiff_t loc_cols = 0;
-                ptrdiff_t rem_cols = 0;
-
-                for(ptrdiff_t ja = A_rem.ptr[ia], ea = A_rem.ptr[ia + 1]; ja < ea; ++ja) {
-                    ptrdiff_t  ca = C.local_index(A_rem.col[ja]);
-
-                    for(ptrdiff_t jb = A_nbr.ptr[ca], eb = A_nbr.ptr[ca+1]; jb < eb; ++jb) {
-                        ptrdiff_t  cb = A_nbr.col[jb];
-
-                        if (cb >= A_beg && cb < A_end) {
-                            cb -= A_beg;
-
-                            if (loc_marker[cb] != ia) {
-                                loc_marker[cb]  = ia;
-                                ++loc_cols;
-                            }
-                        } else {
-                            cb = rem_idx[cb];
-
-                            if (rem_marker[cb] != ia) {
-                                rem_marker[cb]  = ia;
-                                ++rem_cols;
-                            }
-                        }
-                    }
-                }
-
-                for(ptrdiff_t ja = A_loc.ptr[ia], ea = A_loc.ptr[ia + 1]; ja < ea; ++ja) {
-                    ptrdiff_t  ca = A_loc.col[ja];
-
-                    for(ptrdiff_t jb = A_rem.ptr[ca], eb = A_rem.ptr[ca+1]; jb < eb; ++jb) {
-                        ptrdiff_t  cb = rem_idx[A_rem.col[jb]];
-
-                        if (rem_marker[cb] != ia) {
-                            rem_marker[cb]  = ia;
-                            ++rem_cols;
-                        }
-                    }
-
-                }
-
-                if (rem_cols) {
-                    for(ptrdiff_t ja = A_loc.ptr[ia], ea = A_loc.ptr[ia + 1]; ja < ea; ++ja) {
-                        ptrdiff_t  ca = A_loc.col[ja];
-
-                        for(ptrdiff_t jb = A_loc.ptr[ca], eb = A_loc.ptr[ca+1]; jb < eb; ++jb) {
-                            ptrdiff_t  cb = A_loc.col[jb];
-
-                            if (loc_marker[cb] != ia) {
-                                loc_marker[cb]  = ia;
-                                ++loc_cols;
-                            }
-                        }
-
-                    }
-                }
-
-                S_rem.ptr[ia + 1] = rem_cols;
-                S_loc.ptr[ia + 1] = rem_cols ? loc_cols : 0;
-            }
-        }
-        AMGCL_TOC("analyze");
-
-        S_loc.set_nonzeros(S_loc.scan_row_sizes(), false);
-        S_rem.set_nonzeros(S_rem.scan_row_sizes(), false);
-
-        AMGCL_TIC("compute");
-#pragma omp parallel
-        {
-            std::vector<ptrdiff_t> loc_marker(A_rows,     -1);
-            std::vector<ptrdiff_t> rem_marker(n_rem_cols, -1);
-
-#pragma omp for
-            for(ptrdiff_t ia = 0; ia < A_rows; ++ia) {
-                ptrdiff_t loc_beg = S_loc.ptr[ia];
-                ptrdiff_t rem_beg = S_rem.ptr[ia];
-                ptrdiff_t loc_end = loc_beg;
-                ptrdiff_t rem_end = rem_beg;
-
-                if (rem_beg == S_rem.ptr[ia+1]) continue;
-
-                for(ptrdiff_t ja = A_loc.ptr[ia], ea = A_loc.ptr[ia + 1]; ja < ea; ++ja) {
-                    ptrdiff_t  ca = A_loc.col[ja];
-
-                    for(ptrdiff_t jb = A_loc.ptr[ca], eb = A_loc.ptr[ca+1]; jb < eb; ++jb) {
-                        ptrdiff_t  cb = A_loc.col[jb];
-
-                        if (loc_marker[cb] < loc_beg) {
-                            loc_marker[cb] = loc_end;
-                            S_loc.col[loc_end] = cb;
-                            ++loc_end;
-                        }
-                    }
-
-                    for(ptrdiff_t jb = A_rem.ptr[ca], eb = A_rem.ptr[ca+1]; jb < eb; ++jb) {
-                        ptrdiff_t  gb = A_rem.col[jb];
-                        ptrdiff_t  cb = rem_idx[gb];
-
-                        if (rem_marker[cb] < rem_beg) {
-                            rem_marker[cb] = rem_end;
-                            S_rem.col[rem_end] = gb;
-                            ++rem_end;
-                        }
-                    }
-                }
-
-                for(ptrdiff_t ja = A_rem.ptr[ia], ea = A_rem.ptr[ia + 1]; ja < ea; ++ja) {
-                    ptrdiff_t  ca = C.local_index(A_rem.col[ja]);
-
-                    for(ptrdiff_t jb = A_nbr.ptr[ca], eb = A_nbr.ptr[ca+1]; jb < eb; ++jb) {
-                        ptrdiff_t  gb = A_nbr.col[jb];
-
-                        if (gb >= A_beg && gb < A_end) {
-                            ptrdiff_t cb = gb - A_beg;
-
-                            if (loc_marker[cb] < loc_beg) {
-                                loc_marker[cb] = loc_end;
-                                S_loc.col[loc_end] = cb;
-                                ++loc_end;
-                            }
-                        } else {
-                            ptrdiff_t cb = rem_idx[gb];
-
-                            if (rem_marker[cb] < rem_beg) {
-                                rem_marker[cb] = rem_end;
-                                S_rem.col[rem_end] = gb;
-                                ++rem_end;
-                            }
-                        }
-                    }
-                }
-            }
-        }
-        AMGCL_TOC("compute");
-
-        return std::make_shared< distributed_matrix<bool_backend> >(A.comm(), s_loc, s_rem);
-    }
-
-    template <class B>
-    std::shared_ptr< distributed_matrix<bool_backend> >
-    conn_strength(const distributed_matrix<B> &A, scalar_type eps_strong) {
-        typedef typename B::value_type val_type;
-        typedef backend::crs<val_type> B_matrix;
-
-        AMGCL_TIC("conn_strength");
-        ptrdiff_t n = A.loc_rows();
-
-        const B_matrix &A_loc = *A.local();
-        const B_matrix &A_rem = *A.remote();
-        const comm_pattern<B> &C = A.cpat();
-
-        scalar_type eps_squared = eps_strong * eps_strong;
-
-        auto d = backend::diagonal(A_loc);
-        backend::numa_vector<val_type> &D = *d;
-
-        std::vector<val_type> D_loc(C.send.count());
-        std::vector<val_type> D_rem(C.recv.count());
-
-        for(size_t i = 0, nv = C.send.count(); i < nv; ++i)
-            D_loc[i] = D[C.send.col[i]];
-
-        C.exchange(&D_loc[0], &D_rem[0]);
-
-        auto s_loc = std::make_shared<bool_matrix>();
-        auto s_rem = std::make_shared<bool_matrix>();
-
-        bool_matrix &S_loc = *s_loc;
-        bool_matrix &S_rem = *s_rem;
-
-        S_loc.set_size(n, n, true);
-        S_rem.set_size(n, 0, true);
-
-        S_loc.val = new char[A_loc.nnz];
-        S_rem.val = new char[A_rem.nnz];
-
-#pragma omp parallel for
-        for(ptrdiff_t i = 0; i < n; ++i) {
-            val_type eps_dia_i = eps_squared * D[i];
-
-            for(ptrdiff_t j = A_loc.ptr[i], e = A_loc.ptr[i+1]; j < e; ++j) {
-                ptrdiff_t c = A_loc.col[j];
-                val_type  v = A_loc.val[j];
-
-                if ((S_loc.val[j] = (c == i || (eps_dia_i * D[c] < v * v))))
-                    ++S_loc.ptr[i + 1];
-            }
-
-            for(ptrdiff_t j = A_rem.ptr[i], e = A_rem.ptr[i+1]; j < e; ++j) {
-                ptrdiff_t c = C.local_index(A_rem.col[j]);
-                val_type  v = A_rem.val[j];
-
-                if ((S_rem.val[j] = (eps_dia_i * D_rem[c] < v * v)))
-                    ++S_rem.ptr[i + 1];
-            }
-        }
-
-        S_loc.nnz = S_loc.scan_row_sizes();
-        S_rem.nnz = S_rem.scan_row_sizes();
-
-        S_loc.col = new ptrdiff_t[S_loc.nnz];
-        S_rem.col = new ptrdiff_t[S_rem.nnz];
-
-#pragma omp parallel for
-        for(ptrdiff_t i = 0; i < n; ++i) {
-            ptrdiff_t loc_head = S_loc.ptr[i];
-            ptrdiff_t rem_head = S_rem.ptr[i];
-
-            for(ptrdiff_t j = A_loc.ptr[i], e = A_loc.ptr[i+1]; j < e; ++j)
-                if (S_loc.val[j]) S_loc.col[loc_head++] = A_loc.col[j];
-
-            for(ptrdiff_t j = A_rem.ptr[i], e = A_rem.ptr[i+1]; j < e; ++j)
-                if (S_rem.val[j]) S_rem.col[rem_head++] = A_rem.col[j];
-        }
-        AMGCL_TOC("conn_strength");
-
-        return std::make_shared< distributed_matrix<bool_backend> >(
-                A.comm(), s_loc, s_rem);
-    }
-
-    ptrdiff_t aggregates(
-            const distributed_matrix<bool_backend> &A,
-            std::vector<ptrdiff_t> &loc_state,
-            std::vector<int>       &loc_owner
-            )
-    {
-        AMGCL_TIC("PMIS");
-        static const int tag_exc_cnt = 4001;
-        static const int tag_exc_pts = 4002;
-
-        const bool_matrix &A_loc = *A.local();
-        const bool_matrix &A_rem = *A.remote();
-
-        ptrdiff_t n = A_loc.nrows;
-
-        communicator comm = A.comm();
-
-        // 1. Get symbolic square of the connectivity matrix.
-        AMGCL_TIC("symbolic square");
-        auto S = squared_interface(A);
-        const bool_matrix &S_loc = *S->local();
-        const bool_matrix &S_rem = *S->remote();
-        const comm_pattern<bool_backend> &Sp = S->cpat();
-        AMGCL_TOC("symbolic square");
-
-        // 2. Apply PMIS algorithm to the symbolic square.
-        ptrdiff_t n_undone = 0;
-        std::vector<ptrdiff_t> rem_state(Sp.recv.count(), pmis::undone);
-        std::vector<int>       rem_owner(Sp.recv.count(), -1);
-        std::vector<ptrdiff_t> send_state(Sp.send.count());
-        std::vector<int>       send_owner(Sp.send.count());
-
-        // Remove lonely nodes.
-#pragma omp parallel for reduction(+:n_undone)
-        for(ptrdiff_t i = 0; i < n; ++i) {
-            ptrdiff_t wl = A_loc.ptr[i+1] - A_loc.ptr[i];
-            ptrdiff_t wr = S_rem.ptr[i+1] - S_rem.ptr[i];
-
-            if (wl + wr == 1) {
-                loc_state[i] = pmis::deleted;
-                ++n_undone;
-            } else {
-                loc_state[i] = pmis::undone;
-            }
-
-            loc_owner[i] = -1;
-        }
-
-        n_undone = n - n_undone;
-
-        // Exchange state
-        for(ptrdiff_t i = 0, m = Sp.send.count(); i < m; ++i)
-            send_state[i] = loc_state[Sp.send.col[i]];
-        Sp.exchange(&send_state[0], &rem_state[0]);
-
-        std::vector< std::vector<ptrdiff_t> > send_pts(Sp.recv.nbr.size());
-        std::vector<ptrdiff_t> recv_pts;
-
-        std::vector<MPI_Request> send_cnt_req(Sp.recv.nbr.size());
-        std::vector<MPI_Request> send_pts_req(Sp.recv.nbr.size());
-
-        ptrdiff_t naggr = 0;
-
-        std::vector<ptrdiff_t> nbr;
-
-        while(true) {
-            for(size_t i = 0; i < Sp.recv.nbr.size(); ++i)
-                send_pts[i].clear();
-
-            if (n_undone) {
-                for(ptrdiff_t i = 0; i < n; ++i) {
-                    if (loc_state[i] != pmis::undone) continue;
-
-                    if (S_rem.ptr[i+1] > S_rem.ptr[i]) {
-                        // Boundary points
-                        bool selectable = true;
-                        for(ptrdiff_t j = S_rem.ptr[i], e = S_rem.ptr[i+1]; j < e; ++j) {
-                            int d,c;
-                            std::tie(d,c) = Sp.remote_info(S_rem.col[j]);
-
-                            if (rem_state[c] == pmis::undone && Sp.recv.nbr[d] > comm.rank) {
-                                selectable = false;
-                                break;
-                            }
-                        }
-
-                        if (!selectable) continue;
-
-                        ptrdiff_t id = naggr++;
-                        loc_owner[i] = comm.rank;
-                        loc_state[i] = id;
-                        --n_undone;
-
-                        // A gives immediate neighbors
-                        for(ptrdiff_t j = A_loc.ptr[i], e = A_loc.ptr[i+1]; j < e; ++j) {
-                            ptrdiff_t c = A_loc.col[j];
-                            if (c != i) {
-                                if (loc_state[c] == pmis::undone) --n_undone;
-                                loc_owner[c] = comm.rank;
-                                loc_state[c] = id;
-                            }
-                        }
-
-                        for(ptrdiff_t j = A_rem.ptr[i], e = A_rem.ptr[i+1]; j < e; ++j) {
-                            ptrdiff_t c = A_rem.col[j];
-                            int d,k;
-                            std::tie(d,k) = Sp.remote_info(c);
-
-                            rem_state[k] = id;
-
-                            send_pts[d].push_back(c);
-                            send_pts[d].push_back(id);
-                        }
-
-                        // S gives removed neighbors
-                        for(ptrdiff_t j = S_loc.ptr[i], e = S_loc.ptr[i+1]; j < e; ++j) {
-                            ptrdiff_t c = S_loc.col[j];
-                            if (c != i && loc_state[c] == pmis::undone) {
-                                loc_owner[c] = comm.rank;
-                                loc_state[c] = id;
-                                --n_undone;
-                            }
-                        }
-
-                        for(ptrdiff_t j = S_rem.ptr[i], e = S_rem.ptr[i+1]; j < e; ++j) {
-                            ptrdiff_t c = S_rem.col[j];
-                            int d,k;
-                            std::tie(d,k) = Sp.remote_info(c);
-
-                            if (rem_state[k] == pmis::undone) {
-                                rem_state[k] = id;
-                                send_pts[d].push_back(c);
-                                send_pts[d].push_back(id);
-                            }
-                        }
-                    } else {
-                        // Inner points
-                        ptrdiff_t id = naggr++;
-                        loc_owner[i] = comm.rank;
-                        loc_state[i] = id;
-                        --n_undone;
-
-                        nbr.clear();
-
-                        for(ptrdiff_t j = A_loc.ptr[i], e = A_loc.ptr[i+1]; j < e; ++j) {
-                            ptrdiff_t c = A_loc.col[j];
-
-                            if (c != i && loc_state[c] != pmis::deleted) {
-                                if (loc_state[c] == pmis::undone) --n_undone;
-                                loc_owner[c] = comm.rank;
-                                loc_state[c] = id;
-                                nbr.push_back(c);
-                            }
-                        }
-
-                        for(ptrdiff_t k : nbr) {
-                            for(ptrdiff_t j = A_loc.ptr[k], e = A_loc.ptr[k+1]; j < e; ++j) {
-                                ptrdiff_t c = A_loc.col[j];
-                                if (c != k && loc_state[c] == pmis::undone) {
-                                    loc_owner[c] = comm.rank;
-                                    loc_state[c] = id;
-                                    --n_undone;
-                                }
-                            }
-                        }
-                    }
-                }
-            }
-
-            for(size_t i = 0; i < Sp.recv.nbr.size(); ++i) {
-                int npts = send_pts[i].size();
-                MPI_Isend(&npts, 1, MPI_INT, Sp.recv.nbr[i], tag_exc_cnt, comm, &send_cnt_req[i]);
-
-                if (!npts) continue;
-                MPI_Isend(&send_pts[i][0], npts, datatype<ptrdiff_t>(), Sp.recv.nbr[i], tag_exc_pts, comm, &send_pts_req[i]);
-            }
-
-            for(size_t i = 0; i < Sp.send.nbr.size(); ++i) {
-                int npts;
-                MPI_Recv(&npts, 1, MPI_INT, Sp.send.nbr[i], tag_exc_cnt, comm, MPI_STATUS_IGNORE);
-
-                if (!npts) continue;
-                recv_pts.resize(npts);
-                MPI_Recv(&recv_pts[0], npts, datatype<ptrdiff_t>(), Sp.send.nbr[i], tag_exc_pts, comm, MPI_STATUS_IGNORE);
-
-                for(int k = 0; k < npts; k += 2) {
-                    ptrdiff_t c  = recv_pts[k] - Sp.loc_col_shift();
-                    ptrdiff_t id = recv_pts[k+1];
-
-                    if (loc_state[c] == pmis::undone) --n_undone;
-
-                    loc_owner[c] = Sp.send.nbr[i];
-                    loc_state[c] = id;
-                }
-            }
-
-            for(size_t i = 0; i < Sp.recv.nbr.size(); ++i) {
-                int npts = send_pts[i].size();
-                MPI_Wait(&send_cnt_req[i], MPI_STATUS_IGNORE);
-                if (!npts) continue;
-                MPI_Wait(&send_pts_req[i], MPI_STATUS_IGNORE);
-            }
-
-            for(ptrdiff_t i = 0, m = Sp.send.count(); i < m; ++i)
-                send_state[i] = loc_state[Sp.send.col[i]];
-            Sp.exchange(&send_state[0], &rem_state[0]);
-
-            if (0 == comm.reduce(MPI_SUM, n_undone))
-                break;
-        }
-
-        // Some of the aggregates could potentially vanish during expansion
-        // step (*) above. We need to exclude those and renumber the rest.
-        AMGCL_TIC("drop empty aggregates");
-        for(ptrdiff_t i = 0, m = Sp.send.count(); i < m; ++i)
-            send_owner[i] = loc_owner[Sp.send.col[i]];
-        Sp.exchange(&send_owner[0], &rem_owner[0]);
-
-        std::vector<ptrdiff_t> new_id(naggr + 1, 0);
-        for(ptrdiff_t i = 0; i < n; ++i) {
-            if (loc_owner[i] == comm.rank && loc_state[i] >= 0)
-                new_id[loc_state[i] + 1] = 1;
-        }
-
-        for(size_t i = 0; i < Sp.recv.count(); ++i) {
-            if (rem_owner[i] == comm.rank && rem_state[i] >= 0)
-                new_id[rem_state[i] + 1] = 1;
-        }
-
-        std::partial_sum(new_id.begin(), new_id.end(), new_id.begin());
-
-        if (comm.reduce(MPI_SUM, naggr - new_id.back()) > 0) {
-            naggr = new_id.back();
-
-            for(ptrdiff_t i = 0; i < n; ++i) {
-                if (loc_owner[i] == comm.rank && loc_state[i] >= 0) {
-                    loc_state[i] = new_id[loc_state[i]];
-                }
-            }
-
-            for(size_t i = 0; i < Sp.recv.nbr.size(); ++i) {
-                send_pts[i].clear();
-            }
-
-            for (auto p = Sp.remote_begin(); p!= Sp.remote_end(); ++p) {
-                ptrdiff_t c = p->first;
-
-                int d, k;
-                std::tie(d, k) = p->second;
-
-                if (rem_owner[k] == comm.rank && rem_state[k] >= 0) {
-                    send_pts[d].push_back(c);
-                    send_pts[d].push_back(new_id[rem_state[k]]);
-                }
-            }
-
-            for(size_t i = 0; i < Sp.recv.nbr.size(); ++i) {
-                int npts = send_pts[i].size();
-                MPI_Isend(&npts, 1, MPI_INT, Sp.recv.nbr[i], tag_exc_cnt, comm, &send_cnt_req[i]);
-
-                if (!npts) continue;
-                MPI_Isend(&send_pts[i][0], npts, datatype<ptrdiff_t>(), Sp.recv.nbr[i], tag_exc_pts, comm, &send_pts_req[i]);
-            }
-
-            for(size_t i = 0; i < Sp.send.nbr.size(); ++i) {
-                int npts;
-                MPI_Recv(&npts, 1, MPI_INT, Sp.send.nbr[i], tag_exc_cnt, comm, MPI_STATUS_IGNORE);
-
-                if (!npts) continue;
-                recv_pts.resize(npts);
-                MPI_Recv(&recv_pts[0], npts, datatype<ptrdiff_t>(), Sp.send.nbr[i], tag_exc_pts, comm, MPI_STATUS_IGNORE);
-
-                for(int k = 0; k < npts; k += 2) {
-                    ptrdiff_t c  = recv_pts[k] - Sp.loc_col_shift();
-                    ptrdiff_t id = recv_pts[k+1];
-
-                    loc_state[c] = id;
-                }
-            }
-
-            for(size_t i = 0; i < Sp.recv.nbr.size(); ++i) {
-                int npts = send_pts[i].size();
-                MPI_Wait(&send_cnt_req[i], MPI_STATUS_IGNORE);
-                if (!npts) continue;
-                MPI_Wait(&send_pts_req[i], MPI_STATUS_IGNORE);
-            }
-        }
-
-        AMGCL_TOC("drop empty aggregates");
-        AMGCL_TOC("PMIS");
-
-        return naggr;
-    }
-
-    std::shared_ptr<matrix>
-    tentative_prolongation(communicator comm, ptrdiff_t n, ptrdiff_t naggr,
-            std::vector<ptrdiff_t> &state, std::vector<int> &owner)
-    {
-        auto p_loc = std::make_shared<build_matrix>();
-        auto p_rem = std::make_shared<build_matrix>();
-        build_matrix &P_loc = *p_loc;
-        build_matrix &P_rem = *p_rem;
-
-        AMGCL_TIC("tentative prolongation");
-
-        if (int null_cols = prm.nullspace.cols) {
-            ptrdiff_t nba = naggr / prm.block_size;
-
-            std::vector<ptrdiff_t> fdom = comm.exclusive_sum(n);
-            std::vector<ptrdiff_t> cdom = comm.exclusive_sum(naggr);
-
-            std::vector<int> scounts(comm.size, 0);
-            std::vector<int> rcounts(comm.size);
-
-            // Precompute the shape of the prolongation operator.
-            // Each row contains exactly nullspace.cols non-zero entries.
-            // Rows that do not belong to any aggregate are empty.
-            P_loc.set_size(n, null_cols * nba, true);
-            P_rem.set_size(n, 0, true);
-
-            // Also count the number of local DOFs in local aggregates
-            ptrdiff_t loc_dofs = 0;
-
-            for(ptrdiff_t i = 0; i < n; ++i) {
-                if (state[i] == pmis::deleted) continue;
-
-                if (owner[i] == comm.rank) {
-                    P_loc.ptr[i+1] = null_cols;
-                    ++loc_dofs;
-                } else {
-                    P_rem.ptr[i+1] = null_cols;
-                    ++scounts[owner[i]];
-                }
-            }
-
-            // Setup the exchange
-            MPI_Request req;
-            MPI_Ialltoall(
-                    scounts.data(), 1, MPI_INT,
-                    rcounts.data(), 1, MPI_INT,
-                    comm, &req);
-
-            P_loc.set_nonzeros(P_loc.scan_row_sizes());
-            P_rem.set_nonzeros(P_rem.scan_row_sizes());
-
-            MPI_Wait(&req, MPI_STATUS_IGNORE);
-
-            int snbr = 0;
-            int rnbr = 0;
-            for(int i = 0; i < comm.size; ++i) {
-                if (scounts[i]) ++snbr;
-                if (rcounts[i]) ++rnbr;
-            }
-
-            std::vector<int> send_nbr; send_nbr.reserve(snbr);
-            std::vector<int> recv_nbr; recv_nbr.reserve(rnbr);
-            std::vector<int> send_ptr; send_ptr.reserve(snbr + 1); send_ptr.push_back(0);
-            std::vector<int> recv_ptr; recv_ptr.reserve(rnbr + 1); recv_ptr.push_back(0);
-
-            for(int i = 0; i < comm.size; ++i) {
-                if (scounts[i]) {
-                    send_nbr.push_back(i);
-                    send_ptr.push_back(send_ptr.back() + scounts[i]);
-                }
-                if (rcounts[i]) {
-                    recv_nbr.push_back(i);
-                    recv_ptr.push_back(recv_ptr.back() + rcounts[i]);
-                }
-            }
-
-            int send_dofs = send_ptr.back();
-            int recv_dofs = recv_ptr.back();
-
-            std::vector<ptrdiff_t> send_agg(send_dofs);             // IDs of the aggregates we are sending
-            std::vector<ptrdiff_t> send_dof(send_dofs);             // DOFs included in the aggregates
-            std::vector<double>    send_row(send_dofs * null_cols); // Rows of the nullspace matrix corresponding to the DOFs
-
-            std::vector<ptrdiff_t> recv_agg(recv_dofs);             // IDs of the aggregates we are receiving
-            std::vector<ptrdiff_t> recv_dof(recv_dofs);             // DOFs included in the aggregates
-            std::vector<double>    recv_row(recv_dofs * null_cols); // Rows of the nullspace matrix corresponding to the DOFs
-
-            // Prepare the data to send
-            std::vector<ptrdiff_t> send_rank_ptr(comm.size + 1); send_rank_ptr[0] = 0;
-            std::partial_sum(scounts.begin(), scounts.end(), send_rank_ptr.begin() + 1);
-            for(ptrdiff_t i = 0; i < n; ++i) {
-                auto s = state[i];
-                auto o = owner[i];
-
-                if (s == pmis::deleted) continue;
-                if (o == comm.rank) continue;
-
-                auto head = send_rank_ptr[o]++;
-
-                send_agg[head] = s;
-                send_dof[head] = i + fdom[comm.rank];
-                std::copy_n(&prm.nullspace.B[i * null_cols], null_cols, &send_row[head * null_cols]);
-            }
-
-            // Exchange the data
-            std::vector<MPI_Request> send_req(3 * snbr);
-            std::vector<MPI_Request> recv_req(3 * rnbr);
-
-            for(int i = 0; i < rnbr; ++i) {
-                int n = recv_nbr[i];
-                int p = recv_ptr[i];
-                int w = recv_ptr[i + 1] - p;
-
-                MPI_Request *req = &recv_req[3 * i];
-
-                MPI_Irecv(&recv_agg[p], w, datatype<ptrdiff_t>(), n, tag_exc_agg, comm, &req[0]);
-                MPI_Irecv(&recv_dof[p], w, datatype<ptrdiff_t>(), n, tag_exc_dof, comm, &req[1]);
-                MPI_Irecv(&recv_row[null_cols * p], null_cols * w, datatype<double>(), n, tag_exc_row, comm, &req[2]);
-            }
-
-            for(int i = 0; i < snbr; ++i) {
-                int n = send_nbr[i];
-                int p = send_ptr[i];
-                int w = send_ptr[i + 1] - p;
-
-                MPI_Request *req = &send_req[3 * i];
-
-                MPI_Isend(&send_agg[p], w, datatype<ptrdiff_t>(), n, tag_exc_agg, comm, &req[0]);
-                MPI_Isend(&send_dof[p], w, datatype<ptrdiff_t>(), n, tag_exc_dof, comm, &req[1]);
-                MPI_Isend(&send_row[null_cols * p], null_cols * w, datatype<double>(), n, tag_exc_row, comm, &req[2]);
-            }
-
-            AMGCL_TIC("MPI Wait");
-            MPI_Waitall(recv_req.size(), recv_req.data(), MPI_STATUSES_IGNORE);
-            MPI_Waitall(send_req.size(), send_req.data(), MPI_STATUSES_IGNORE);
-            AMGCL_TOC("MPI Wait");
-
-            // Sort the fine-level points by the aggregate number.
-            // The order vector contains tuples of (aggr, dof, src, dst),
-            // where src points to a row in B, and dst points to a row in P
-            std::vector<std::tuple<ptrdiff_t, ptrdiff_t, double*, value_type*>> order;
-            order.reserve(loc_dofs + recv_dofs);
-            for(ptrdiff_t i = 0; i < n; ++i) {
-                auto s = state[i];
-                auto o = owner[i];
-
-                if (s == pmis::deleted) continue;
-                if (o != comm.rank) continue;
-
-                order.emplace_back(s / prm.block_size, i + fdom[comm.rank],
-                        &prm.nullspace.B[i * null_cols], &P_loc.val[P_loc.ptr[i]]);
-            }
-            for(ptrdiff_t i = 0; i < recv_dofs; ++i) {
-                order.emplace_back(recv_agg[i] / prm.block_size, recv_dof[i],
-                        &recv_row[i * null_cols], nullptr);
-            }
-            std::sort(order.begin(), order.end());
-
-            std::vector<ptrdiff_t> aggr_ptr(nba + 1, 0);
-            for(size_t i = 0; i < order.size(); ++i)
-                ++aggr_ptr[std::get<0>(order[i])+1];
-            std::partial_sum(aggr_ptr.begin(), aggr_ptr.end(), aggr_ptr.begin());
-
-            // Compute the tentative prolongation operator and null-space vectors
-            // for the coarser level.
-            std::vector<double> Bnew;
-            Bnew.resize(nba * null_cols * null_cols);
-
-#pragma omp parallel
-            {
-                amgcl::detail::QR<double> qr;
-                std::vector<double> Bpart;
-
-#pragma omp for
-                for(ptrdiff_t i = 0; i < nba; ++i) {
-                    auto aggr_beg = aggr_ptr[i];
-                    auto aggr_end = aggr_ptr[i+1];
-                    auto d = aggr_end - aggr_beg;
-
-                    Bpart.resize(d * null_cols);
-
-                    for(ptrdiff_t j = aggr_beg, r = 0; j < aggr_end; ++j, ++r) {
-                        auto src = std::get<2>(order[j]);
-                        for(int c = 0; c < null_cols; ++c)
-                            Bpart[r + d * c] = src[c];
-                    }
-
-                    qr.factorize(d, null_cols, &Bpart[0], amgcl::detail::col_major);
-
-                    for(ptrdiff_t r = 0, k = i * null_cols * null_cols; r < null_cols; ++r)
-                        for(int c = 0; c < null_cols; ++c, ++k)
-                            Bnew[k] = qr.R(r,c);
-
-                    for(ptrdiff_t j = aggr_beg, r = 0; j < aggr_end; ++j, ++r) {
-                        auto src = std::get<2>(order[j]);
-                        auto dst = std::get<3>(order[j]);
-
-                        if (dst) {
-                            // TODO: this is just a workaround to make non-scalar value
-                            // types compile. Most probably this won't actually work.
-                            for(int c = 0; c < null_cols; ++c)
-                                dst[c] = qr.Q(r,c) * math::identity<value_type>();
-                        } else {
-                            for(int c = 0; c < null_cols; ++c)
-                                src[c] = qr.Q(r,c);
-                        }
-                    }
-                }
-            }
-
-            // Exchange the computed rows of the prolongation operator with the
-            // owners.
-            for(int i = 0; i < snbr; ++i) {
-                int n = send_nbr[i];
-                int p = send_ptr[i];
-                int w = send_ptr[i + 1] - p;
-                MPI_Irecv(&send_row[null_cols * p], null_cols * w, datatype<double>(), n, tag_exc_row, comm, &send_req[i]);
-            }
-
-            for(int i = 0; i < rnbr; ++i) {
-                int n = recv_nbr[i];
-                int p = recv_ptr[i];
-                int w = recv_ptr[i + 1] - p;
-                MPI_Isend(&recv_row[null_cols * p], null_cols * w, datatype<double>(), n, tag_exc_row, comm, &recv_req[i]);
-            }
-
-            // Fill column numbers
-#pragma omp parallel for
-            for(ptrdiff_t i = 0; i < n; ++i) {
-                ptrdiff_t s = state[i];
-                if (s == pmis::deleted) continue;
-
-                int d = owner[i];
-                if (d == comm.rank) {
-                    auto col = &P_loc.col[P_loc.ptr[i]];
-                    for (int j = 0; j < null_cols; ++j) {
-                        col[j] = null_cols * s / prm.block_size + j;
-                    }
-                } else {
-                    auto col = &P_rem.col[P_rem.ptr[i]];
-                    for (int j = 0; j < null_cols; ++j) {
-                        col[j] = null_cols * (s + cdom[d]) / prm.block_size + j;
-                    }
-                }
-            }
-
-            AMGCL_TIC("MPI Wait");
-            MPI_Waitall(snbr, send_req.data(), MPI_STATUSES_IGNORE);
-            MPI_Waitall(rnbr, recv_req.data(), MPI_STATUSES_IGNORE);
-            AMGCL_TOC("MPI Wait");
-
-            // Use the P rows computed by the neighbors
-            for(ptrdiff_t k = 0; k < send_dofs; ++k) {
-                auto i = send_dof[k] - fdom[comm.rank];
-                auto src = &send_row[k * null_cols];
-                auto dst = &P_rem.val[P_rem.ptr[i]];
-
-                for(ptrdiff_t j = 0; j < null_cols; ++j) {
-                    dst[j] = src[j] * math::identity<value_type>();
-                }
-            }
-
-            std::swap(prm.nullspace.B, Bnew);
-        } else {
-            std::vector<ptrdiff_t> dom = comm.exclusive_sum(naggr);
-
-            P_loc.set_size(n, naggr, true);
-            P_rem.set_size(n, 0, true);
-
-#pragma omp parallel for
-            for(ptrdiff_t i = 0; i < n; ++i) {
-                if (state[i] == pmis::deleted) continue;
-
-                if (owner[i] == comm.rank) {
-                    ++P_loc.ptr[i+1];
-                } else {
-                    ++P_rem.ptr[i+1];
-                }
-            }
-
-            P_loc.set_nonzeros(P_loc.scan_row_sizes());
-            P_rem.set_nonzeros(P_rem.scan_row_sizes());
-
-#pragma omp parallel for
-            for(ptrdiff_t i = 0; i < n; ++i) {
-                ptrdiff_t s = state[i];
-                if (s == pmis::deleted) continue;
-
-                int d = owner[i];
-                if (d == comm.rank) {
-                    P_loc.col[P_loc.ptr[i]] = s;
-                    P_loc.val[P_loc.ptr[i]] = math::identity<value_type>();
-                } else {
-                    P_rem.col[P_rem.ptr[i]] = s + dom[d];
-                    P_rem.val[P_rem.ptr[i]] = math::identity<value_type>();
-                }
-            }
-        }
-        AMGCL_TOC("tentative prolongation");
-
-        return std::make_shared<matrix>(comm, p_loc, p_rem);
-    }
-
-    template <class pw_matrix>
-    std::shared_ptr<bool_matrix>
-    expand_conn(const build_matrix &A, const pw_matrix &Ap, const bool_matrix &Cp,
-            unsigned block_size) const
-    {
-        ptrdiff_t np = Cp.nrows;
-        ptrdiff_t n  = np * block_size;
-
-        auto c = std::make_shared<bool_matrix>();
-        bool_matrix &C = *c;
-
-        C.set_size(n, n, true);
-        C.val = new char[A.nnz];
-
-#pragma omp parallel
-        {
-            std::vector<ptrdiff_t> j(block_size);
-            std::vector<ptrdiff_t> e(block_size);
-
-#pragma omp for
-            for(ptrdiff_t ip = 0; ip < np; ++ip) {
-                ptrdiff_t ia = ip * block_size;
-
-                for(unsigned k = 0; k < block_size; ++k) {
-                    j[k] = A.ptr[ia + k];
-                    e[k] = A.ptr[ia + k + 1];
-                }
-
-                for(ptrdiff_t jp = Ap.ptr[ip], ep = Ap.ptr[ip+1]; jp < ep; ++jp) {
-                    ptrdiff_t cp = Ap.col[jp];
-                    bool      sp = Cp.val[jp];
-
-                    ptrdiff_t col_end = (cp + 1) * block_size;
-
-                    for(unsigned k = 0; k < block_size; ++k) {
-                        ptrdiff_t beg = j[k];
-                        ptrdiff_t end = e[k];
-
-                        while(beg < end && A.col[beg] < col_end) {
-                            C.val[beg++] = sp;
-
-                            if (sp) ++C.ptr[ia + k + 1];
-                        }
-
-                        j[k] = beg;
-                    }
-                }
-            }
-        }
-
-        C.nnz = C.scan_row_sizes();
-        C.col = new ptrdiff_t[C.nnz];
-
-#pragma omp parallel
-        {
-            std::vector<ptrdiff_t> j(block_size);
-            std::vector<ptrdiff_t> e(block_size);
-            std::vector<ptrdiff_t> h(block_size);
-
-#pragma omp for
-            for(ptrdiff_t ip = 0; ip < np; ++ip) {
-                ptrdiff_t ia = ip * block_size;
-
-                for(unsigned k = 0; k < block_size; ++k) {
-                    j[k] = A.ptr[ia + k];
-                    e[k] = A.ptr[ia + k + 1];
-                    h[k] = C.ptr[ia + k];
-                }
-
-                for(ptrdiff_t jp = Ap.ptr[ip], ep = Ap.ptr[ip+1]; jp < ep; ++jp) {
-                    ptrdiff_t cp = Ap.col[jp];
-                    bool      sp = Cp.val[jp];
-
-                    ptrdiff_t col_end = (cp + 1) * block_size;
-
-                    for(unsigned k = 0; k < block_size; ++k) {
-                        ptrdiff_t beg = j[k];
-                        ptrdiff_t end = e[k];
-                        ptrdiff_t hed = h[k];
-
-                        while(beg < end && A.col[beg] < col_end) {
-                            if (sp) C.col[hed++] = A.col[beg];
-                            ++beg;
-                        }
-
-                        j[k] = beg;
-                        h[k] = hed;
-                    }
-                }
-            }
-        }
-
-        return c;
-    }
-
-    private:
-        static const int undone = -2;
-        static const int deleted = -1;
-
-        static const int tag_exc_agg = 4011;
-        static const int tag_exc_dof = 4012;
-        static const int tag_exc_row = 4013;
-};
-
-} // namespace coarsening
-} // namespace mpi
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/mpi/coarsening/runtime.hpp b/src/solvers/amgcl/mpi/coarsening/runtime.hpp
deleted file mode 100644
index a01182b..0000000
--- a/src/solvers/amgcl/mpi/coarsening/runtime.hpp
+++ /dev/null
@@ -1,194 +0,0 @@
-#ifndef AMGCL_MPI_COARSENING_RUNTIME_HPP
-#define AMGCL_MPI_COARSENING_RUNTIME_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/mpi/coarsening/aggregation.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Runtime wrapper for distributed coarsening schemes.
- */
-
-#ifdef AMGCL_NO_BOOST
-#  error Runtime interface relies on Boost.PropertyTree!
-#endif
-
-#include <boost/property_tree/ptree.hpp>
-
-#include <amgcl/util.hpp>
-#include <amgcl/mpi/util.hpp>
-#include <amgcl/mpi/distributed_matrix.hpp>
-#include <amgcl/mpi/coarsening/aggregation.hpp>
-#include <amgcl/mpi/coarsening/smoothed_aggregation.hpp>
-
-namespace amgcl {
-namespace runtime {
-namespace mpi {
-namespace coarsening {
-
-enum type {
-    aggregation,
-    smoothed_aggregation
-};
-
-inline std::ostream& operator<<(std::ostream &os, type s)
-{
-    switch (s) {
-        case aggregation:
-            return os << "aggregation";
-        case smoothed_aggregation:
-            return os << "smoothed_aggregation";
-        default:
-            return os << "???";
-    }
-}
-
-inline std::istream& operator>>(std::istream &in, type &s)
-{
-    std::string val;
-    in >> val;
-
-    if (val == "aggregation")
-        s = aggregation;
-    else if (val == "smoothed_aggregation")
-        s = smoothed_aggregation;
-    else
-        throw std::invalid_argument("Invalid coarsening value. Valid choices are: "
-                "aggregation, smoothed_aggregation.");
-
-    return in;
-}
-
-template <class Backend>
-struct wrapper {
-    typedef amgcl::mpi::distributed_matrix<Backend> matrix;
-    typedef boost::property_tree::ptree params;
-
-    type c;
-    void *handle;
-
-    wrapper(params prm = params())
-        : c(prm.get("type", smoothed_aggregation)), handle(0)
-    {
-        if (!prm.erase("type")) AMGCL_PARAM_MISSING("type");
-
-        switch (c) {
-            case aggregation:
-                {
-                    typedef amgcl::mpi::coarsening::aggregation<Backend> C;
-                    handle = static_cast<void*>(new C(prm));
-                }
-                break;
-            case smoothed_aggregation:
-                {
-                    typedef amgcl::mpi::coarsening::smoothed_aggregation<Backend> C;
-                    handle = static_cast<void*>(new C(prm));
-                }
-                break;
-            default:
-                throw std::invalid_argument("Unsupported coarsening type");
-        }
-    }
-
-    ~wrapper() {
-        switch(c) {
-            case aggregation:
-                {
-                    typedef amgcl::mpi::coarsening::aggregation<Backend> C;
-                    delete static_cast<C*>(handle);
-                }
-                break;
-            case smoothed_aggregation:
-                {
-                    typedef amgcl::mpi::coarsening::smoothed_aggregation<Backend> C;
-                    delete static_cast<C*>(handle);
-                }
-                break;
-            default:
-                break;
-        }
-    }
-
-    std::tuple< std::shared_ptr<matrix>, std::shared_ptr<matrix> >
-    transfer_operators(const matrix &A) {
-        switch (c) {
-            case aggregation:
-                {
-                    typedef amgcl::mpi::coarsening::aggregation<Backend> C;
-                    return static_cast<C*>(handle)->transfer_operators(A);
-                }
-            case smoothed_aggregation:
-                {
-                    typedef amgcl::mpi::coarsening::smoothed_aggregation<Backend> C;
-                    return static_cast<C*>(handle)->transfer_operators(A);
-                }
-            default:
-                throw std::invalid_argument("Unsupported partition type");
-        }
-    }
-
-    std::shared_ptr<matrix>
-    coarse_operator(const matrix &A, const matrix &P, const matrix &R) const {
-        switch (c) {
-            case aggregation:
-                {
-                    typedef amgcl::mpi::coarsening::aggregation<Backend> C;
-                    return static_cast<C*>(handle)->coarse_operator(A, P, R);
-                }
-            case smoothed_aggregation:
-                {
-                    typedef amgcl::mpi::coarsening::smoothed_aggregation<Backend> C;
-                    return static_cast<C*>(handle)->coarse_operator(A, P, R);
-                }
-            default:
-                throw std::invalid_argument("Unsupported partition type");
-        }
-    }
-};
-
-template <class Backend>
-unsigned block_size(const wrapper<Backend> &w) {
-    switch (w.c) {
-        case aggregation:
-            {
-                typedef amgcl::mpi::coarsening::aggregation<Backend> C;
-                return block_size(*static_cast<const C*>(w.handle));
-            }
-        case smoothed_aggregation:
-            {
-                typedef amgcl::mpi::coarsening::smoothed_aggregation<Backend> C;
-                return block_size(*static_cast<const C*>(w.handle));
-            }
-        default:
-            throw std::invalid_argument("Unsupported coarsening type");
-    }
-}
-
-} // namespace coarsening
-} // namespace mpi
-} // namespace runtime
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/mpi/coarsening/smoothed_aggregation.hpp b/src/solvers/amgcl/mpi/coarsening/smoothed_aggregation.hpp
deleted file mode 100644
index 9d27451..0000000
--- a/src/solvers/amgcl/mpi/coarsening/smoothed_aggregation.hpp
+++ /dev/null
@@ -1,213 +0,0 @@
-#ifndef AMGCL_MPI_COARSENING_SMOOTHED_AGGREGATION_HPP
-#define AMGCL_MPI_COARSENING_SMOOTHED_AGGREGATION_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/mpi/coarsening/smoothed_aggregation.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Distributed smoothed aggregation coarsening scheme.
- */
-
-#include <tuple>
-#include <memory>
-
-#include <amgcl/backend/builtin.hpp>
-#include <amgcl/util.hpp>
-#include <amgcl/coarsening/detail/galerkin.hpp>
-#include <amgcl/mpi/util.hpp>
-#include <amgcl/mpi/distributed_matrix.hpp>
-#include <amgcl/mpi/coarsening/pmis.hpp>
-
-namespace amgcl {
-namespace mpi {
-namespace coarsening {
-
-template <class Backend>
-struct smoothed_aggregation {
-    typedef typename Backend::value_type value_type;
-    typedef typename math::scalar_of<value_type>::type scalar_type;
-    typedef backend::crs<value_type> build_matrix;
-
-    struct params {
-        // aggregation params
-        typedef typename pmis<Backend>::params aggr_params;
-        aggr_params aggr;
-
-        /// Relaxation factor.
-        scalar_type relax;
-
-        // Estimate the matrix spectral radius.
-        // This usually improves convergence rate and results in faster solves,
-        // but costs some time during setup.
-        bool estimate_spectral_radius;
-
-        // Number of power iterations to apply for the spectral radius
-        // estimation. Use Gershgorin disk theorem when power_iters = 0.
-        int power_iters;
-
-        params()
-            : relax(1.0f), estimate_spectral_radius(false), power_iters(0)
-        { }
-
-#ifndef AMGCL_NO_BOOST
-        params(const boost::property_tree::ptree &p)
-            : AMGCL_PARAMS_IMPORT_CHILD(p, aggr),
-              AMGCL_PARAMS_IMPORT_VALUE(p, relax),
-              AMGCL_PARAMS_IMPORT_VALUE(p, estimate_spectral_radius),
-              AMGCL_PARAMS_IMPORT_VALUE(p, power_iters)
-        {
-            check_params(p, {"aggr", "relax", "estimate_spectral_radius", "power_iters"});
-        }
-
-        void get(boost::property_tree::ptree &p, const std::string &path) const {
-            AMGCL_PARAMS_EXPORT_CHILD(p, path, aggr);
-            AMGCL_PARAMS_EXPORT_VALUE(p, path, relax);
-            AMGCL_PARAMS_EXPORT_VALUE(p, path, estimate_spectral_radius);
-            AMGCL_PARAMS_EXPORT_VALUE(p, path, power_iters);
-        }
-#endif
-    } prm;
-
-    smoothed_aggregation(const params &prm = params()) : prm(prm) {}
-
-    std::tuple<
-        std::shared_ptr< distributed_matrix<Backend> >,
-        std::shared_ptr< distributed_matrix<Backend> >
-        >
-    transfer_operators(const distributed_matrix<Backend> &A) {
-        typedef distributed_matrix<Backend> DM;
-        typedef backend::crs<char> bool_matrix;
-
-        pmis<Backend> aggr(A, prm.aggr);
-        prm.aggr.eps_strong *= 0.5;
-
-        communicator comm = A.comm();
-        const build_matrix &A_loc = *A.local();
-        const build_matrix &A_rem = *A.remote();
-
-        bool_matrix &S_loc = *aggr.conn->local();
-        bool_matrix &S_rem = *aggr.conn->remote();
-
-        AMGCL_TIC("filtered matrix");
-        ptrdiff_t n = A.loc_rows();
-
-        scalar_type omega = prm.relax;
-        if (prm.estimate_spectral_radius) {
-            omega *= static_cast<scalar_type>(4.0/3) / backend::spectral_radius<true>(A, prm.power_iters);
-        } else {
-            omega *= static_cast<scalar_type>(2.0/3);
-        }
-
-        auto af_loc = std::make_shared<build_matrix>();
-        auto af_rem = std::make_shared<build_matrix>();
-
-        build_matrix &Af_loc = *af_loc;
-        build_matrix &Af_rem = *af_rem;
-
-        backend::numa_vector<value_type> Af_loc_val(S_loc.nnz, false);
-        backend::numa_vector<value_type> Af_rem_val(S_rem.nnz, false);
-
-        Af_loc.own_data = false;
-        Af_loc.nrows = S_loc.nrows;
-        Af_loc.ncols = S_loc.ncols;
-        Af_loc.nnz   = S_loc.nnz;
-        Af_loc.ptr   = S_loc.ptr;
-        Af_loc.col   = S_loc.col;
-        Af_loc.val   = Af_loc_val.data();
-
-        Af_rem.own_data = false;
-        Af_rem.nrows = S_rem.nrows;
-        Af_rem.ncols = S_rem.ncols;
-        Af_rem.nnz   = S_rem.nnz;
-        Af_rem.ptr   = S_rem.ptr;
-        Af_rem.col   = S_rem.col;
-        Af_rem.val   = Af_rem_val.data();
-
-        backend::numa_vector<value_type> Df(n, false);
-
-#pragma omp parallel for
-        for(ptrdiff_t i = 0; i < n; ++i) {
-            ptrdiff_t loc_head = Af_loc.ptr[i];
-            ptrdiff_t rem_head = Af_rem.ptr[i];
-
-            value_type dia_f = math::zero<value_type>();
-
-            for(ptrdiff_t j = A_loc.ptr[i], e = A_loc.ptr[i+1]; j < e; ++j)
-                if (A_loc.col[j] == i || !S_loc.val[j]) dia_f += A_loc.val[j];
-
-            for(ptrdiff_t j = A_rem.ptr[i], e = A_rem.ptr[i+1]; j < e; ++j)
-                if (!S_rem.val[j]) dia_f += A_rem.val[j];
-
-            dia_f = -omega * math::inverse(dia_f);
-
-            for(ptrdiff_t j = A_loc.ptr[i], e = A_loc.ptr[i+1]; j < e; ++j) {
-                if (A_loc.col[j] == i) {
-                    Af_loc.val[loc_head++] = (1 - omega) * math::identity<value_type>();
-                } else if(S_loc.val[j]) {
-                    Af_loc.val[loc_head++] = dia_f * A_loc.val[j];
-                }
-            }
-
-            for(ptrdiff_t j = A_rem.ptr[i], e = A_rem.ptr[i+1]; j < e; ++j) {
-                if (S_rem.val[j]) {
-                    Af_rem.val[rem_head++] = dia_f * A_rem.val[j];
-                }
-            }
-        }
-
-        auto Af = std::make_shared<DM>(comm, af_loc, af_rem);
-        AMGCL_TOC("filtered matrix");
-
-        // 5. Smooth tentative prolongation with the filtered matrix.
-        AMGCL_TIC("smoothing");
-        auto P = product(*Af, *aggr.p_tent);
-        AMGCL_TOC("smoothing");
-
-        return std::make_tuple(P, transpose(*P));
-    }
-
-    std::shared_ptr< distributed_matrix<Backend> >
-    coarse_operator(
-            const distributed_matrix<Backend> &A,
-            const distributed_matrix<Backend> &P,
-            const distributed_matrix<Backend> &R
-            ) const
-    {
-        return amgcl::coarsening::detail::galerkin(A, P, R);
-    }
-
-};
-
-template <class Backend>
-unsigned block_size(const smoothed_aggregation<Backend> &c) {
-    return c.prm.aggr.block_size;
-}
-
-} // namespace coarsening
-} // namespace mpi
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/mpi/cpr.hpp b/src/solvers/amgcl/mpi/cpr.hpp
deleted file mode 100644
index 5d22670..0000000
--- a/src/solvers/amgcl/mpi/cpr.hpp
+++ /dev/null
@@ -1,472 +0,0 @@
-#ifndef AMGCL_MPI_CPR_HPP
-#define AMGCL_MPI_CPR_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/mpi/cpr.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Distributed CPR preconditioner.
- */
-
-#include <cassert>
-#include <amgcl/backend/builtin.hpp>
-#include <amgcl/util.hpp>
-#include <amgcl/mpi/inner_product.hpp>
-#include <amgcl/mpi/distributed_matrix.hpp>
-
-namespace amgcl {
-namespace mpi {
-
-template <class PPrecond, class SPrecond>
-class cpr {
-    static_assert(
-            std::is_same<
-                typename PPrecond::backend_type,
-                typename SPrecond::backend_type
-                >::value,
-            "Backends for pressure and flow preconditioners should coinside!"
-            );
-
-    public:
-        typedef typename PPrecond::backend_type backend_type;
-
-        typedef typename backend_type::value_type value_type;
-        typedef typename math::scalar_of<value_type>::type scalar_type;
-        typedef typename backend_type::matrix     bmatrix;
-        typedef typename backend_type::vector     vector;
-        typedef typename backend_type::params     backend_params;
-
-        typedef distributed_matrix<backend_type>  matrix;
-        typedef typename backend::builtin<value_type>::matrix build_matrix;
-
-        struct params {
-            typedef typename PPrecond::params pprecond_params;
-            typedef typename SPrecond::params sprecond_params;
-
-            pprecond_params pprecond;
-            sprecond_params sprecond;
-
-            int block_size;
-
-            params() : block_size(2) {}
-
-#ifndef AMGCL_NO_BOOST
-            params(const boost::property_tree::ptree &p)
-                : AMGCL_PARAMS_IMPORT_CHILD(p, pprecond),
-                  AMGCL_PARAMS_IMPORT_CHILD(p, sprecond),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, block_size)
-            {
-                check_params(p, {"pprecond", "sprecond", "block_size", "active_rows"});
-            }
-
-            void get(boost::property_tree::ptree &p, const std::string &path = "") const
-            {
-                AMGCL_PARAMS_EXPORT_CHILD(p, path, pprecond);
-                AMGCL_PARAMS_EXPORT_CHILD(p, path, sprecond);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, block_size);
-            }
-#endif
-        } prm;
-
-        template <class Matrix>
-        cpr(
-                communicator comm,
-                const Matrix &K,
-                const params &prm = params(),
-                const backend_params &bprm = backend_params()
-           ) : prm(prm), comm(comm), n(backend::rows(K))
-        {
-            init(std::make_shared<matrix>(comm, K, backend::rows(K)), bprm);
-        }
-
-        cpr(
-                communicator comm,
-                std::shared_ptr<matrix> K,
-                const params &prm = params(),
-                const backend_params &bprm = backend_params()
-           ) : prm(prm), comm(comm), n(K->loc_rows())
-        {
-            init(K, bprm);
-        }
-
-        template <class Vec1, class Vec2>
-        void apply(const Vec1 &rhs, Vec2 &&x) const {
-            const auto one = math::identity<scalar_type>();
-            const auto zero = math::zero<scalar_type>();
-
-            S->apply(rhs, x);
-            backend::residual(rhs, S->system_matrix(), x, *rs);
-
-            backend::spmv(one, *Fpp, *rs, zero, *rp);
-            P->apply(*rp, *xp);
-
-            backend::spmv(one, *Scatter, *xp, one, x);
-        }
-
-        std::shared_ptr<matrix> system_matrix_ptr() const {
-            return S->system_matrix_ptr();
-        }
-
-        const matrix& system_matrix() const {
-            return S->system_matrix();
-        }
-
-    private:
-        communicator comm;
-        size_t n, np;
-
-        std::shared_ptr<PPrecond> P;
-        std::shared_ptr<SPrecond> S;
-
-        std::shared_ptr<bmatrix> Fpp, Scatter;
-        std::shared_ptr<vector> rp, xp, rs;
-
-        void init(std::shared_ptr<matrix> K, const backend_params &bprm) {
-            typedef typename backend::row_iterator<build_matrix>::type row_iterator;
-            const int B = prm.block_size;
-
-            auto _K_loc = K->local();
-            auto _K_rem = K->remote();
-
-            auto &K_loc = *_K_loc;
-            auto &K_rem = *_K_rem;
-
-            np = n / B;
-
-            auto fpp = std::make_shared<build_matrix>();
-            fpp->set_size(np, n);
-            fpp->set_nonzeros(n);
-            fpp->ptr[0] = 0;
-
-            auto App_loc = std::make_shared<build_matrix>();
-            auto App_rem = std::make_shared<build_matrix>();
-
-            App_loc->set_size(np, np, true);
-            App_rem->set_size(np, 0,  true);
-
-            // Get the pressure matrix nonzero pattern,
-            // extract and invert block diagonals.
-#pragma omp parallel
-            {
-                std::vector<row_iterator> k; k.reserve(B);
-                multi_array<value_type, 2> v(B, B);
-
-#pragma omp for
-                for(ptrdiff_t ip = 0; ip < static_cast<ptrdiff_t>(np); ++ip) {
-                    ptrdiff_t ik = ip * B;
-                    bool      done = true;
-                    ptrdiff_t cur_col = 0;
-
-                    // Local part
-                    k.clear();
-                    for(int i = 0; i < B; ++i) {
-                        k.push_back(backend::row_begin(K_loc, ik + i));
-
-                        if (k.back()) {
-                            ptrdiff_t col = k.back().col() / B;
-                            if (done) {
-                                cur_col = col;
-                                done = false;
-                            } else {
-                                cur_col = std::min(cur_col, col);
-                            }
-                        }
-
-                        fpp->col[ik + i] = ik + i;
-                    }
-                    fpp->ptr[ip+1] = ik + B;
-
-                    while (!done) {
-                        ++App_loc->ptr[ip+1];
-
-                        ptrdiff_t end = (cur_col + 1) * B;
-
-                        if (cur_col == ip) {
-                            // This is diagonal block.
-                            // Capture its (transposed) value,
-                            // invert it and put the relevant row into fpp.
-                            for(int i = 0; i < B; ++i)
-                                for(int j = 0; j < B; ++j) v(i,j) = 0;
-
-                            for(int i = 0; i < B; ++i)
-                                for(; k[i] && k[i].col() < end; ++k[i])
-                                    v(k[i].col() % B, i) = k[i].value();
-
-                            invert(v, &fpp->val[ik]);
-                        } else {
-                            // This is off-diagonal block.
-                            // Just skip it.
-                            for(int i = 0; i < B; ++i)
-                                while(k[i] && k[i].col() < end) ++k[i];
-                        }
-
-                        // Get next column number.
-                        done = true;
-                        for(int i = 0; i < B; ++i) {
-                            if (k[i]) {
-                                ptrdiff_t col = k[i].col() / B;
-                                if (done) {
-                                    cur_col = col;
-                                    done = false;
-                                } else {
-                                    cur_col = std::min(cur_col, col);
-                                }
-                            }
-                        }
-                    }
-
-                    // Remote part
-                    k.clear();
-                    for(int i = 0; i < B; ++i) {
-                        k.push_back(backend::row_begin(K_rem, ik + i));
-
-                        if (k.back()) {
-                            ptrdiff_t col = k.back().col() / B;
-                            if (done) {
-                                cur_col = col;
-                                done = false;
-                            } else {
-                                cur_col = std::min(cur_col, col);
-                            }
-                        }
-                    }
-
-                    while (!done) {
-                        ++App_rem->ptr[ip+1];
-
-                        ptrdiff_t end = (cur_col + 1) * B;
-
-                        for(int i = 0; i < B; ++i)
-                            while(k[i] && k[i].col() < end) ++k[i];
-
-                        // Get next column number.
-                        done = true;
-                        for(int i = 0; i < B; ++i) {
-                            if (k[i]) {
-                                ptrdiff_t col = k[i].col() / B;
-                                if (done) {
-                                    cur_col = col;
-                                    done = false;
-                                } else {
-                                    cur_col = std::min(cur_col, col);
-                                }
-                            }
-                        }
-                    }
-                }
-            }
-
-            App_loc->set_nonzeros(App_loc->scan_row_sizes());
-            App_rem->set_nonzeros(App_rem->scan_row_sizes());
-
-            auto scatter = std::make_shared<build_matrix>();
-            scatter->set_size(n, np);
-            scatter->set_nonzeros(np);
-            scatter->ptr[0] = 0;
-
-#pragma omp parallel
-            {
-                std::vector<row_iterator> k; k.reserve(B);
-
-#pragma omp for
-                for(ptrdiff_t ip = 0; ip < static_cast<ptrdiff_t>(np); ++ip) {
-                    ptrdiff_t ik = ip * B;
-                    bool      done = true;
-                    ptrdiff_t cur_col;
-
-                    value_type *d = &fpp->val[ik];
-
-                    // Local part
-                    ptrdiff_t head = App_loc->ptr[ip];
-                    k.clear();
-                    for(int i = 0; i < B; ++i) {
-                        k.push_back(backend::row_begin(K_loc, ik + i));
-
-                        if (k.back()) {
-                            ptrdiff_t col = k.back().col() / B;
-                            if (done) {
-                                cur_col = col;
-                                done = false;
-                            } else {
-                                cur_col = std::min(cur_col, col);
-                            }
-                        }
-                    }
-
-                    while (!done) {
-                        ptrdiff_t  end = (cur_col + 1) * B;
-                        value_type app = 0;
-
-                        for(int i = 0; i < B; ++i) {
-                            for(; k[i] && k[i].col() < end; ++k[i]) {
-                                if (k[i].col() % B == 0) {
-                                    app += d[i] * k[i].value();
-                                }
-                            }
-                        }
-
-                        App_loc->col[head] = cur_col;
-                        App_loc->val[head] = app;
-                        ++head;
-
-                        // Get next column number.
-                        done = true;
-                        for(int i = 0; i < B; ++i) {
-                            if (k[i]) {
-                                ptrdiff_t col = k[i].col() / B;
-                                if (done) {
-                                    cur_col = col;
-                                    done = false;
-                                } else {
-                                    cur_col = std::min(cur_col, col);
-                                }
-                            }
-                        }
-                    }
-
-                    // Remote part
-                    head = App_rem->ptr[ip];
-                    k.clear();
-                    for(int i = 0; i < B; ++i) {
-                        k.push_back(backend::row_begin(K_rem, ik + i));
-
-                        if (k.back()) {
-                            ptrdiff_t col = k.back().col() / B;
-                            if (done) {
-                                cur_col = col;
-                                done = false;
-                            } else {
-                                cur_col = std::min(cur_col, col);
-                            }
-                        }
-                    }
-
-                    while (!done) {
-                        ptrdiff_t  end = (cur_col + 1) * B;
-                        value_type app = 0;
-
-                        for(int i = 0; i < B; ++i) {
-                            for(; k[i] && k[i].col() < end; ++k[i]) {
-                                if (k[i].col() % B == 0) {
-                                    app += d[i] * k[i].value();
-                                }
-                            }
-                        }
-
-                        App_rem->col[head] = cur_col;
-                        App_rem->val[head] = app;
-                        ++head;
-
-                        // Get next column number.
-                        done = true;
-                        for(int i = 0; i < B; ++i) {
-                            if (k[i]) {
-                                ptrdiff_t col = k[i].col() / B;
-                                if (done) {
-                                    cur_col = col;
-                                    done = false;
-                                } else {
-                                    cur_col = std::min(cur_col, col);
-                                }
-                            }
-                        }
-                    }
-
-                    scatter->col[ip] = ip;
-                    scatter->val[ip] = math::identity<value_type>();
-
-                    ptrdiff_t nnz = ip;
-                    for(int i = 0; i < B; ++i) {
-                        if (i == 0) ++nnz;
-                        scatter->ptr[ik + i + 1] = nnz;
-                    }
-                }
-            }
-
-            auto App = std::make_shared<matrix>(comm, App_loc, App_rem);
-
-            P = std::make_shared<PPrecond>(comm, App, prm.pprecond, bprm);
-            S = std::make_shared<SPrecond>(comm, K,   prm.sprecond, bprm);
-
-            Fpp     = backend_type::copy_matrix(fpp, bprm);
-            Scatter = backend_type::copy_matrix(scatter, bprm);
-
-            rp = backend_type::create_vector(np, bprm);
-            xp = backend_type::create_vector(np, bprm);
-            rs = backend_type::create_vector(n, bprm);
-        }
-
-        // Inverts dense matrix A;
-        // Returns the first column of the inverted matrix.
-        void invert(multi_array<value_type, 2> &A, value_type *y)
-        {
-            const int B = prm.block_size;
-
-            // Perform LU-factorization of A in-place
-            for(int k = 0; k < B; ++k) {
-                value_type d = A(k,k);
-                assert(!math::is_zero(d));
-                for(int i = k+1; i < B; ++i) {
-                    A(i,k) /= d;
-                    for(int j = k+1; j < B; ++j)
-                        A(i,j) -= A(i,k) * A(k,j);
-                }
-            }
-
-            // Invert unit vector in-place.
-            // Lower triangular solve:
-            for(int i = 0; i < B; ++i) {
-                value_type b = static_cast<value_type>(i == 0);
-                for(int j = 0; j < i; ++j)
-                    b -= A(i,j) * y[j];
-                y[i] = b;
-            }
-
-            // Upper triangular solve:
-            for(int i = B; i --> 0; ) {
-                for(int j = i+1; j < B; ++j)
-                    y[i] -= A(i,j) * y[j];
-                y[i] /= A(i,i);
-            }
-        }
-
-    template <class P, class S>
-    friend std::ostream& operator<<(std::ostream &os, const cpr<P, S> &cpr);
-};
-
-template <class P, class S>
-std::ostream& operator<<(std::ostream &os, const cpr<P, S> &cpr) {
-    os << "CPR (two-stage preconditioner)\n"
-          "### Pressure preconditioner:\n"
-       << *cpr.P << "\n"
-          "### Global preconditioner:\n"
-       << *cpr.S << std::endl;
-    return os;
-}
-
-} // namespace mpi
-} // namespace amgcl
-#endif
diff --git a/src/solvers/amgcl/mpi/direct_solver/eigen_splu.hpp b/src/solvers/amgcl/mpi/direct_solver/eigen_splu.hpp
deleted file mode 100644
index 430d822..0000000
--- a/src/solvers/amgcl/mpi/direct_solver/eigen_splu.hpp
+++ /dev/null
@@ -1,105 +0,0 @@
-#ifndef AMGCL_MPI_DIRECT_SOLVER_EIGEN_SPLU_HPP
-#define AMGCL_MPI_DIRECT_SOLVER_EIGEN_SPLU_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
-\file   amgcl/mpi/direct_solver/eigen_splu.hpp
-\author Denis Demidov <dennis.demidov@gmail.com>
-\brief  MPI wrapper for Eigen::SparseLU solver.
-
-This is a wrapper around Eigen SparseLU solver that provides a
-distributed direct solver interface but always works sequentially.
-*/
-
-#include <mpi.h>
-
-#include <memory>
-
-#include <Eigen/SparseLU>
-#include <amgcl/backend/builtin.hpp>
-#include <amgcl/adapter/crs_tuple.hpp>
-#include <amgcl/solver/eigen.hpp>
-#include <amgcl/mpi/util.hpp>
-#include <amgcl/mpi/direct_solver/solver_base.hpp>
-
-namespace amgcl {
-namespace mpi {
-namespace direct {
-
-/// Provides distributed direct solver interface for Skyline LU solver.
-template <typename value_type>
-class eigen_splu : public solver_base< value_type, eigen_splu<value_type> > {
-    public:
-        typedef
-            amgcl::solver::EigenSolver<
-                Eigen::SparseLU<
-                    Eigen::SparseMatrix<value_type, Eigen::ColMajor, int>
-                    >
-                >
-            Solver;
-        typedef typename Solver::params params;
-        typedef backend::crs<value_type> build_matrix;
-
-        /// Constructor.
-        template <class Matrix>
-        eigen_splu(communicator comm, const Matrix &A,
-                const params &prm = params()) : prm(prm)
-        {
-            static_cast<Base*>(this)->init(comm, A);
-        }
-
-        static size_t coarse_enough() {
-            return Base::coarse_enough();
-        }
-
-        int comm_size(int /*n*/) const {
-            return 1;
-        }
-
-        void init(communicator, const build_matrix &A) {
-            S = std::make_shared<Solver>(A, prm);
-        }
-
-        /// Solves the problem for the given right-hand side.
-        /**
-         * \param rhs The right-hand side.
-         * \param x   The solution.
-         */
-        template <class Vec1, class Vec2>
-        void solve(const Vec1 &rhs, Vec2 &x) const {
-            (*S)(rhs, x);
-        }
-    private:
-        typedef solver_base< value_type, eigen_splu<value_type> > Base;
-        params prm;
-        std::shared_ptr<Solver> S;
-};
-
-} // namespace direct
-} // namespace mpi
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/mpi/direct_solver/pastix.hpp b/src/solvers/amgcl/mpi/direct_solver/pastix.hpp
deleted file mode 100644
index aaf488a..0000000
--- a/src/solvers/amgcl/mpi/direct_solver/pastix.hpp
+++ /dev/null
@@ -1,244 +0,0 @@
-#ifndef AMGCL_MPI_DIRECT_SOLVER_PASTIX_HPP
-#define AMGCL_MPI_DIRECT_SOLVER_PASTIX_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
-\file   amgcl/mpi/direct_solver/pastix.hpp
-\author Denis Demidov <dennis.demidov@gmail.com>
-\brief  Wrapper for PaStiX distributed sparse solver.
-
-See http://pastix.gforge.inria.fr
-*/
-
-#ifdef _OPENMP
-#  include <omp.h>
-#endif
-
-#include <type_traits>
-
-#include <amgcl/util.hpp>
-#include <amgcl/backend/builtin.hpp>
-#include <amgcl/mpi/util.hpp>
-#include <amgcl/mpi/direct_solver/solver_base.hpp>
-
-extern "C" {
-#include <pastix.h>
-}
-
-namespace amgcl {
-namespace mpi {
-namespace direct {
-
-/// Provides distributed direct solver interface for pastix solver.
-/**
- * \sa http://pastix.gforge.inria.fr, \cite Henon2002
- */
-template <typename value_type, bool Distrib=false>
-class pastix : public solver_base< value_type, pastix<value_type, Distrib> > {
-    public:
-        static_assert(
-                 std::is_same<value_type, float >::value ||
-                 std::is_same<value_type, double>::value,
-                 "Unsupported value type for pastix solver"
-                );
-
-        typedef backend::crs<value_type> build_matrix;
-
-        struct params {
-            int max_rows_per_process;
-
-            params()
-                : max_rows_per_process(50000)
-            {}
-
-#ifndef AMGCL_NO_BOOST
-            params(const boost::property_tree::ptree &p)
-                : AMGCL_PARAMS_IMPORT_VALUE(p, max_rows_per_process)
-            {
-                check_params(p, {"max_rows_per_process"});
-            }
-
-            void get(boost::property_tree::ptree &p, const std::string &path) const {
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, max_rows_per_process);
-            }
-#endif
-        };
-
-        /// Constructor.
-        template <class Matrix>
-        pastix(communicator comm, const Matrix &A,
-                const params &prm = params()) : prm(prm), pastix_data(0)
-        {
-            static_cast<Base*>(this)->init(comm, A);
-        }
-
-        static size_t coarse_enough() {
-            return 10000;
-        }
-
-        int comm_size(int n) const {
-            return Distrib ? (n + prm.max_rows_per_process - 1) / prm.max_rows_per_process : 1;
-        }
-
-        void init(communicator C, const build_matrix &A) {
-            comm = C;
-            nrows = A.nrows;
-            ptr.assign(A.ptr, A.ptr + A.nrows + 1);
-            col.assign(A.col, A.col + A.nnz);
-            val.assign(A.val, A.val + A.nnz);
-
-            row.resize(nrows);
-            perm.resize(nrows);
-
-            if (!Distrib) inv_perm.resize(nrows);
-
-            std::vector<int> domain = comm.exclusive_sum(nrows);
-
-            // PaStiX needs 1-based matrices:
-            for(pastix_int_t &p : ptr) ++p;
-            for(pastix_int_t &c : col) ++c;
-
-            for(int i = 0, j = domain[comm.rank]; i < nrows; ++i)
-                row[i] = ++j;
-
-            // Initialize parameters with default values:
-            iparm[IPARM_MODIFY_PARAMETER] = API_NO;
-            call_pastix(API_TASK_INIT, API_TASK_INIT);
-
-            // Factorize the matrix.
-#ifdef NDEBUG
-            iparm[IPARM_VERBOSE        ] = API_VERBOSE_NOT;
-#else
-            iparm[IPARM_VERBOSE        ] = API_VERBOSE_YES;
-#endif
-            iparm[IPARM_RHS_MAKING     ] = API_RHS_B;
-            iparm[IPARM_SYM            ] = API_SYM_NO;
-            iparm[IPARM_FACTORIZATION  ] = API_FACT_LU;
-            iparm[IPARM_TRANSPOSE_SOLVE] = API_YES;
-#ifdef _OPENMP
-            iparm[IPARM_THREAD_NBR]      = omp_get_max_threads();
-#endif
-            call_pastix(API_TASK_ORDERING, API_TASK_NUMFACT);
-        }
-
-        /// Cleans up internal PaStiX data.
-        ~pastix() {
-            if(pastix_data) call_pastix(API_TASK_CLEAN, API_TASK_CLEAN);
-        }
-
-        /// Solves the problem for the given right-hand side.
-        /**
-         * \param rhs The right-hand side.
-         * \param x   The solution.
-         */
-        template <class Vec1, class Vec2>
-        void solve(const Vec1 &rhs, Vec2 &x) const {
-            for(int i = 0; i < nrows; ++i) x[i] = rhs[i];
-            call_pastix(API_TASK_SOLVE, API_TASK_SOLVE, &x[0]);
-        }
-    private:
-        typedef solver_base< value_type, pastix<value_type, Distrib> > Base;
-        params prm;
-        amgcl::mpi::communicator comm;
-
-        int nrows;
-
-        // Pastix internal data.
-        mutable pastix_data_t *pastix_data;
-
-        // Pastix parameters
-        mutable pastix_int_t   iparm[IPARM_SIZE];
-        mutable double         dparm[DPARM_SIZE];
-
-        std::vector<pastix_int_t> ptr;
-        std::vector<pastix_int_t> col;
-        std::vector<value_type>   val;
-
-        // Local to global mapping
-        std::vector<pastix_int_t> row;
-
-        // Permutation array
-        std::vector<pastix_int_t> perm;
-        std::vector<pastix_int_t> inv_perm;
-
-        void call_pastix(int beg, int end, value_type *x = NULL) const {
-            iparm[IPARM_START_TASK] = beg;
-            iparm[IPARM_END_TASK  ] = end;
-
-            call_pastix(x);
-        }
-
-        void call_pastix(double *x) const {
-            if (Distrib) {
-                d_dpastix(&pastix_data, comm, nrows,
-                        const_cast<pastix_int_t*>(&ptr[0]),
-                        const_cast<pastix_int_t*>(&col[0]),
-                        const_cast<double*      >(&val[0]),
-                        const_cast<pastix_int_t*>(&row[0]),
-                        const_cast<pastix_int_t*>(&perm[0]),
-                        NULL, x, 1, iparm, dparm
-                        );
-            } else {
-                d_pastix(&pastix_data, comm, nrows,
-                        const_cast<pastix_int_t*>(&ptr[0]),
-                        const_cast<pastix_int_t*>(&col[0]),
-                        const_cast<double*      >(&val[0]),
-                        const_cast<pastix_int_t*>(&perm[0]),
-                        const_cast<pastix_int_t*>(&inv_perm[0]),
-                        x, 1, iparm, dparm
-                        );
-            }
-        }
-
-        void call_pastix(float *x) const {
-            if (Distrib) {
-                s_dpastix(&pastix_data, comm, nrows,
-                        const_cast<pastix_int_t*>(&ptr[0]),
-                        const_cast<pastix_int_t*>(&col[0]),
-                        const_cast<float*       >(&val[0]),
-                        const_cast<pastix_int_t*>(&row[0]),
-                        const_cast<pastix_int_t*>(&perm[0]),
-                        NULL, x, 1, iparm, dparm
-                        );
-            } else {
-                s_pastix(&pastix_data, comm, nrows,
-                        const_cast<pastix_int_t*>(&ptr[0]),
-                        const_cast<pastix_int_t*>(&col[0]),
-                        const_cast<float*       >(&val[0]),
-                        const_cast<pastix_int_t*>(&perm[0]),
-                        const_cast<pastix_int_t*>(&inv_perm[0]),
-                        x, 1, iparm, dparm
-                        );
-            }
-        }
-};
-
-} // namespace direct
-} // namespace mpi
-} // namespace amgcl
-
-
-#endif
diff --git a/src/solvers/amgcl/mpi/direct_solver/runtime.hpp b/src/solvers/amgcl/mpi/direct_solver/runtime.hpp
deleted file mode 100644
index 6c85eac..0000000
--- a/src/solvers/amgcl/mpi/direct_solver/runtime.hpp
+++ /dev/null
@@ -1,299 +0,0 @@
-#ifndef AMGCL_MPI_DIRECT_SOLVER_RUNTIME_HPP
-#define AMGCL_MPI_DIRECT_SOLVER_RUNTIME_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/mpi/direct_solver/runtime.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Runtime wrapper for distributed direct solvers.
- */
-
-#ifdef AMGCL_NO_BOOST
-#  error Runtime interface relies on Boost.PropertyTree!
-#endif
-
-#include <boost/property_tree/ptree.hpp>
-
-#include <amgcl/util.hpp>
-#include <amgcl/mpi/direct_solver/skyline_lu.hpp>
-#ifdef AMGCL_HAVE_EIGEN
-#  include <amgcl/mpi/direct_solver/eigen_splu.hpp>
-#endif
-#ifdef AMGCL_HAVE_PASTIX
-#  include <amgcl/mpi/direct_solver/pastix.hpp>
-#endif
-
-namespace amgcl {
-namespace runtime {
-namespace mpi {
-namespace direct {
-
-enum type {
-    skyline_lu
-#ifdef AMGCL_HAVE_EIGEN
-  , eigen_splu
-#endif
-#ifdef AMGCL_HAVE_PASTIX
-  , dpastix
-  , spastix
-#endif
-};
-
-inline std::ostream& operator<<(std::ostream &os, type s)
-{
-    switch (s) {
-        case skyline_lu:
-            return os << "skyline_lu";
-#ifdef AMGCL_HAVE_EIGEN
-        case eigen_splu:
-            return os << "eigen_splu";
-#endif
-#ifdef AMGCL_HAVE_PASTIX
-        case dpastix:
-            return os << "dpastix";
-        case spastix:
-            return os << "spastix";
-#endif
-        default:
-            return os << "???";
-    }
-}
-
-inline std::istream& operator>>(std::istream &in, type &s)
-{
-    std::string val;
-    in >> val;
-
-    if (val == "skyline_lu")
-        s = skyline_lu;
-#ifdef AMGCL_HAVE_EIGEN
-    else if (val == "eigen_splu")
-        s = eigen_splu;
-#endif
-#ifdef AMGCL_HAVE_PASTIX
-    else if (val == "dpastix")
-        s = dpastix;
-    else if (val == "spastix")
-        s = spastix;
-#endif
-    else
-        throw std::invalid_argument("Invalid direct solver value. Valid choices are: "
-                "skyline_lu"
-#ifdef AMGCL_HAVE_EIGEN
-                ", eigen_splu"
-#endif
-#ifdef AMGCL_HAVE_PASTIX
-                ", dpastix"
-                ", spastix"
-#endif
-                ".");
-
-    return in;
-}
-
-template <class value_type>
-class solver {
-    public:
-        typedef boost::property_tree::ptree params;
-
-        template <class Matrix>
-        solver(amgcl::mpi::communicator comm, const Matrix &A, params prm = params())
-            : s(prm.get("type", skyline_lu))
-        {
-            if (!prm.erase("type")) AMGCL_PARAM_MISSING("type");
-
-            switch (s) {
-                case skyline_lu:
-                    {
-                        typedef amgcl::mpi::direct::skyline_lu<value_type> S;
-                        handle = static_cast<void*>(new S(comm, A, prm));
-                    }
-                    break;
-#ifdef AMGCL_HAVE_EIGEN
-                case eigen_splu:
-                    {
-                        typedef amgcl::mpi::direct::eigen_splu<value_type> S;
-                        do_construct<S, value_type>(comm, A, prm);
-                    }
-                    break;
-#endif
-#ifdef AMGCL_HAVE_PASTIX
-                case dpastix:
-                    {
-                        typedef amgcl::mpi::direct::pastix<value_type,true> S;
-                        do_construct<S, value_type>(comm, A, prm);
-                    }
-                    break;
-                case spastix:
-                    {
-                        typedef amgcl::mpi::direct::pastix<value_type,false> S;
-                        do_construct<S, value_type>(comm, A, prm);
-                    }
-                    break;
-#endif
-                default:
-                    throw std::invalid_argument("Unsupported direct solver type");
-            }
-        }
-
-        static size_t coarse_enough() {
-            return 3000 / math::static_rows<value_type>::value;
-        }
-
-        template <class Vec1, class Vec2>
-        void operator()(const Vec1 &rhs, Vec2 &x) const {
-            switch (s) {
-                case skyline_lu:
-                    {
-                        typedef amgcl::mpi::direct::skyline_lu<value_type> S;
-                        static_cast<const S*>(handle)->operator()(rhs, x);
-                    }
-                    break;
-#ifdef AMGCL_HAVE_EIGEN
-                case eigen_splu:
-                    {
-                        typedef amgcl::mpi::direct::eigen_splu<value_type> S;
-                        do_solve<S, value_type>(rhs, x);
-                    }
-                    break;
-#endif
-#ifdef AMGCL_HAVE_PASTIX
-                case dpastix:
-                    {
-                        typedef amgcl::mpi::direct::pastix<value_type, true> S;
-                        do_solve<S, value_type>(rhs, x);
-                    }
-                    break;
-                case spastix:
-                    {
-                        typedef amgcl::mpi::direct::pastix<value_type, false> S;
-                        do_solve<S, value_type>(rhs, x);
-                    }
-                    break;
-#endif
-                default:
-                    throw std::invalid_argument("Unsupported direct solver type");
-            }
-        }
-
-        ~solver() {
-            switch (s) {
-                case skyline_lu:
-                    {
-                        typedef amgcl::mpi::direct::skyline_lu<value_type> S;
-                        delete static_cast<S*>(handle);
-                    }
-                    break;
-#ifdef AMGCL_HAVE_EIGEN
-                case eigen_splu:
-                    {
-                        typedef amgcl::mpi::direct::eigen_splu<value_type> S;
-                        do_destruct<S, value_type>();
-                    }
-                    break;
-#endif
-#ifdef AMGCL_HAVE_PASTIX
-                case dpastix:
-                    {
-                        typedef amgcl::mpi::direct::pastix<value_type, true> S;
-                        do_destruct<S, value_type>();
-                    }
-                    break;
-                case spastix:
-                    {
-                        typedef amgcl::mpi::direct::pastix<value_type, false> S;
-                        do_destruct<S, value_type>();
-                    }
-                    break;
-#endif
-                default:
-                    break;
-            }
-        }
-    private:
-        direct::type s;
-        void *handle;
-
-        template <class S, class V, class Matrix>
-        typename std::enable_if<
-            std::is_same<V, float>::value || std::is_same<V, double>::value,
-            void
-        >::type
-        do_construct(amgcl::mpi::communicator comm, const Matrix &A, const params &prm) {
-            handle = static_cast<void*>(new S(comm, A, prm));
-        }
-
-        template <class S, class V, class Matrix>
-        typename std::enable_if<
-            !std::is_same<V, float>::value && !std::is_same<V, double>::value,
-            void
-        >::type
-        do_construct(amgcl::mpi::communicator, const Matrix&, const params&) {
-            throw std::logic_error("The direct solver does not support the value type");
-        }
-
-        template <class S, class V, class Vec1, class Vec2>
-        typename std::enable_if<
-            std::is_same<V, float>::value || std::is_same<V, double>::value,
-            void
-        >::type
-        do_solve(const Vec1 &rhs, Vec2 &x) const {
-            static_cast<const S*>(handle)->operator()(rhs, x);
-        }
-
-        template <class S, class V, class Vec1, class Vec2>
-        typename std::enable_if<
-            !std::is_same<V, float>::value && !std::is_same<V, double>::value,
-            void
-        >::type
-        do_solve(const Vec1&, Vec2&) const {
-            throw std::logic_error("The direct solver does not support the value type");
-        }
-
-        template <class S, class V>
-        typename std::enable_if<
-            std::is_same<V, float>::value || std::is_same<V, double>::value,
-            void
-        >::type
-        do_destruct() {
-            delete static_cast<S*>(handle);
-        }
-
-        template <class S, class V>
-        typename std::enable_if<
-            !std::is_same<V, float>::value && !std::is_same<V, double>::value,
-            void
-        >::type
-        do_destruct() {
-        }
-};
-
-} // namespace direct
-} // namespace mpi
-} // namespace runtime
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/mpi/direct_solver/skyline_lu.hpp b/src/solvers/amgcl/mpi/direct_solver/skyline_lu.hpp
deleted file mode 100644
index 5bfe0e6..0000000
--- a/src/solvers/amgcl/mpi/direct_solver/skyline_lu.hpp
+++ /dev/null
@@ -1,99 +0,0 @@
-#ifndef AMGCL_MPI_DIRECT_SOLVER_SKYLINE_LU_HPP
-#define AMGCL_MPI_DIRECT_SOLVER_SKYLINE_LU_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
-\file   amgcl/mpi/direct_solver/skyline_lu.hpp
-\author Denis Demidov <dennis.demidov@gmail.com>
-\brief  MPI wrapper for Skyline LU factorization solver.
-
-This is a wrapper around Skyline LU factorization solver that provides a
-distributed direct solver interface but always works sequentially.
-*/
-
-#include <mpi.h>
-
-#include <memory>
-
-#include <amgcl/backend/builtin.hpp>
-#include <amgcl/adapter/crs_tuple.hpp>
-#include <amgcl/solver/skyline_lu.hpp>
-#include <amgcl/mpi/util.hpp>
-#include <amgcl/mpi/direct_solver/solver_base.hpp>
-
-namespace amgcl {
-namespace mpi {
-namespace direct {
-
-/// Provides distributed direct solver interface for Skyline LU solver.
-template <typename value_type>
-class skyline_lu : public solver_base< value_type, skyline_lu<value_type> > {
-    public:
-        typedef amgcl::solver::skyline_lu<value_type> Solver;
-        typedef typename Solver::params params;
-        typedef backend::crs<value_type> build_matrix;
-
-        /// Constructor.
-        template <class Matrix>
-        skyline_lu(communicator comm, const Matrix &A,
-                const params &prm = params()
-                ) : prm(prm)
-        {
-            static_cast<Base*>(this)->init(comm, A);
-        }
-
-        static size_t coarse_enough() {
-            return Solver::coarse_enough();
-        }
-
-        int comm_size(int /*n*/) const {
-            return 1;
-        }
-
-        void init(communicator, const build_matrix &A) {
-            S = std::make_shared<Solver>(A, prm);
-        }
-
-        /// Solves the problem for the given right-hand side.
-        /**
-         * \param rhs The right-hand side.
-         * \param x   The solution.
-         */
-        template <class Vec1, class Vec2>
-        void solve(const Vec1 &rhs, Vec2 &x) const {
-            (*S)(rhs, x);
-        }
-    private:
-        typedef solver_base< value_type, skyline_lu<value_type> > Base;
-        params prm;
-        std::shared_ptr<Solver> S;
-};
-
-} // namespace direct
-} // namespace mpi
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/mpi/direct_solver/solver_base.hpp b/src/solvers/amgcl/mpi/direct_solver/solver_base.hpp
deleted file mode 100644
index 3a6330c..0000000
--- a/src/solvers/amgcl/mpi/direct_solver/solver_base.hpp
+++ /dev/null
@@ -1,272 +0,0 @@
-#ifndef AMGCL_MPI_DIRECT_SOLVER_SOLVER_BASE_HPP
-#define AMGCL_MPI_DIRECT_SOLVER_SOLVER_BASE_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
-\file   amgcl/mpi/direct_solver/solver_base.hpp
-\author Denis Demidov <dennis.demidov@gmail.com>
-\brief  Basic functionality for distributed direct solvers.
-*/
-
-#include <amgcl/mpi/util.hpp>
-#include <amgcl/mpi/distributed_matrix.hpp>
-
-namespace amgcl {
-namespace mpi {
-namespace direct {
-
-template <class value_type, class Solver>
-class solver_base {
-    public:
-        typedef typename math::scalar_of<value_type>::type scalar_type;
-        typedef typename math::rhs_of<value_type>::type    rhs_type;
-        typedef backend::crs<value_type> build_matrix;
-
-        solver_base() {}
-
-        void init(communicator comm, const build_matrix &Astrip) {
-            this->comm = comm;
-            n = Astrip.nrows;
-
-            std::vector<int> domain = comm.exclusive_sum(n);
-            std::vector<int> active; active.reserve(comm.size);
-
-            // Find out how many ranks are active (own non-zero matrix rows):
-            int active_rank = 0;
-            for(int i = 0; i < comm.size; ++i) {
-                if (domain[i+1] - domain[i] > 0) {
-                    if (comm.rank == i) active_rank = active.size();
-                    active.push_back(i);
-                }
-            }
-
-            // Consolidate the matrix on a fewer processes.
-            int nmasters = std::min<int>(active.size(), solver().comm_size(domain.back()));
-            int slaves_per_master = (active.size() + nmasters - 1) / nmasters;
-            int group_beg = (active_rank / slaves_per_master) * slaves_per_master;
-
-            group_master = active[group_beg];
-
-            // Communicator for masters (used to solve the coarse problem):
-            MPI_Comm_split(comm,
-                    comm.rank == group_master ? 0 : MPI_UNDEFINED,
-                    comm.rank, &masters_comm
-                    );
-
-            if (!n) return; // I am not active
-
-            // Shift from row pointers to row widths:
-            std::vector<ptrdiff_t> widths(n);
-            for(ptrdiff_t i = 0; i < n; ++i)
-                widths[i] = Astrip.ptr[i+1] - Astrip.ptr[i];
-
-            if (comm.rank == group_master) {
-                int group_end = std::min<int>(group_beg + slaves_per_master, active.size());
-                group_beg += 1;
-                int group_size = group_end - group_beg;
-
-                std::vector<MPI_Request> cnt_req(group_size);
-                std::vector<MPI_Request> col_req(group_size);
-                std::vector<MPI_Request> val_req(group_size);
-
-                solve_req.resize(group_size);
-                slaves.reserve(group_size);
-                counts.reserve(group_size);
-
-                // Count rows in local chunk of the consolidated matrix,
-                // see who is reporting to us.
-                int nloc = n;
-                for(int j = group_beg; j < group_end; ++j) {
-                    int i = active[j];
-
-                    int m = domain[i+1] - domain[i];
-                    nloc += m;
-                    counts.push_back(m);
-                    slaves.push_back(i);
-                }
-
-                // Get matrix chunks from my slaves.
-                build_matrix A;
-                A.set_size(nloc, domain.back(), false);
-                A.ptr[0] = 0;
-
-                cons_f.resize(A.nrows);
-                cons_x.resize(A.nrows);
-
-                int shift = n+1;
-                std::copy(widths.begin(), widths.end(), &A.ptr[1]);
-
-                for(int j = 0; j < group_size; ++j) {
-                    int i = slaves[j];
-
-                    MPI_Irecv(&A.ptr[shift], counts[j], datatype<ptrdiff_t>(),
-                            i, cnt_tag, comm, &cnt_req[j]);
-
-                    shift += counts[j];
-                }
-
-                MPI_Waitall(cnt_req.size(), &cnt_req[0], MPI_STATUSES_IGNORE);
-
-                A.set_nonzeros(A.scan_row_sizes());
-
-                std::copy(Astrip.col, Astrip.col + Astrip.nnz, A.col);
-                std::copy(Astrip.val, Astrip.val + Astrip.nnz, A.val);
-
-                shift = Astrip.nnz;
-                for(int j = 0, d0 = domain[comm.rank]; j < group_size; ++j) {
-                    int i = slaves[j];
-
-                    int nnz = A.ptr[domain[i+1] - d0] - A.ptr[domain[i] - d0];
-
-                    MPI_Irecv(A.col + shift, nnz, datatype<ptrdiff_t>(),
-                            i, col_tag, comm, &col_req[j]);
-
-                    MPI_Irecv(A.val + shift, nnz, datatype<value_type>(),
-                            i, val_tag, comm, &val_req[j]);
-
-                    shift += nnz;
-                }
-
-                MPI_Waitall(col_req.size(), &col_req[0], MPI_STATUSES_IGNORE);
-                MPI_Waitall(val_req.size(), &val_req[0], MPI_STATUSES_IGNORE);
-
-                solver().init(masters_comm, A);
-            } else {
-                MPI_Send(widths.data(), n, datatype<ptrdiff_t>(),
-                        group_master, cnt_tag, comm);
-                MPI_Send(Astrip.col, Astrip.nnz, datatype<ptrdiff_t>(),
-                        group_master, col_tag, comm);
-                MPI_Send(Astrip.val, Astrip.nnz, datatype<value_type>(),
-                        group_master, val_tag, comm);
-            }
-
-            host_v.resize(n);
-        }
-
-        template <class B>
-        void init(communicator comm, const distributed_matrix<B> &A) {
-            const build_matrix &A_loc = *A.local();
-            const build_matrix &A_rem = *A.remote();
-
-            build_matrix a;
-
-            a.set_size(A.loc_rows(), A.glob_cols(), false);
-            a.set_nonzeros(A_loc.nnz + A_rem.nnz);
-            a.ptr[0] = 0;
-
-            for(size_t i = 0, head = 0; i < A_loc.nrows; ++i) {
-                ptrdiff_t shift = A.loc_col_shift();
-
-                for(ptrdiff_t j = A_loc.ptr[i], e = A_loc.ptr[i+1]; j < e; ++j) {
-                    a.col[head] = A_loc.col[j] + shift;
-                    a.val[head] = A_loc.val[j];
-                    ++head;
-                }
-
-                for(ptrdiff_t j = A_rem.ptr[i], e = A_rem.ptr[i+1]; j < e; ++j) {
-                    a.col[head] = A_rem.col[j];
-                    a.val[head] = A_rem.val[j];
-                    ++head;
-                }
-
-                a.ptr[i+1] = head;
-            }
-
-            init(comm, a);
-        }
-
-        virtual ~solver_base() {
-            if (masters_comm != MPI_COMM_NULL) MPI_Comm_free(&masters_comm);
-        }
-
-        Solver& solver() {
-            return *static_cast<Solver*>(this);
-        }
-
-        const Solver& solver() const {
-            return *static_cast<const Solver*>(this);
-        }
-
-        template <class VecF, class VecX>
-        void operator()(const VecF &f, VecX &x) const {
-            static const MPI_Datatype T = datatype<rhs_type>();
-
-            if (!n) return;
-
-            backend::copy(f, host_v);
-
-            if (comm.rank == group_master) {
-                std::copy(host_v.begin(), host_v.end(), cons_f.begin());
-
-                int shift = n, j = 0;
-                for(int i : slaves) {
-                    MPI_Irecv(&cons_f[shift], counts[j], T, i, rhs_tag, comm, &solve_req[j]);
-                    shift += counts[j++];
-                }
-
-                MPI_Waitall(solve_req.size(), &solve_req[0], MPI_STATUSES_IGNORE);
-
-                solver().solve(cons_f, cons_x);
-
-                std::copy(cons_x.begin(), cons_x.begin() + n, host_v.begin());
-                shift = n;
-                j = 0;
-
-                for(int i : slaves) {
-                    MPI_Isend(&cons_x[shift], counts[j], T, i, sol_tag, comm, &solve_req[j]);
-                    shift += counts[j++];
-                }
-
-                MPI_Waitall(solve_req.size(), &solve_req[0], MPI_STATUSES_IGNORE);
-            } else {
-                MPI_Send(&host_v[0], n, T, group_master, rhs_tag, comm);
-                MPI_Recv(&host_v[0], n, T, group_master, sol_tag, comm, MPI_STATUS_IGNORE);
-            }
-
-            backend::copy(host_v, x);
-        }
-    private:
-        static const int cnt_tag = 5001;
-        static const int col_tag = 5002;
-        static const int val_tag = 5003;
-        static const int rhs_tag = 5004;
-        static const int sol_tag = 5005;
-
-        communicator comm;
-        int          n;
-        int          group_master;
-        MPI_Comm     masters_comm;
-        std::vector<int> slaves;
-        std::vector<int> counts;
-        mutable std::vector<rhs_type> cons_f, cons_x, host_v;
-        mutable std::vector<MPI_Request> solve_req;
-};
-
-} // namespace direct
-} // namespace mpi
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/mpi/distributed_matrix.hpp b/src/solvers/amgcl/mpi/distributed_matrix.hpp
deleted file mode 100644
index e3bf131..0000000
--- a/src/solvers/amgcl/mpi/distributed_matrix.hpp
+++ /dev/null
@@ -1,1314 +0,0 @@
-#ifndef AMGCL_MPI_DISTRIBUTED_MATRIX_HPP
-#define AMGCL_MPI_DISTRIBUTED_MATRIX_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-#include <vector>
-#include <algorithm>
-
-#include <memory>
-#include <unordered_map>
-#include <random>
-
-#include <mpi.h>
-
-#include <amgcl/backend/builtin.hpp>
-#include <amgcl/util.hpp>
-#include <amgcl/mpi/util.hpp>
-
-/**
- * \file   amgcl/mpi/distributed_matrix.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Distributed matrix implementation.
- */
-
-namespace amgcl {
-namespace mpi {
-
-template <class Backend>
-class comm_pattern {
-    public:
-        typedef typename Backend::value_type value_type;
-        typedef typename math::rhs_of<value_type>::type rhs_type;
-        typedef typename math::scalar_of<value_type>::type scalar_type;
-        typedef typename Backend::matrix matrix;
-        typedef typename Backend::vector vector;
-        typedef typename Backend::params backend_params;
-
-        struct {
-            std::vector<ptrdiff_t> nbr;
-            std::vector<ptrdiff_t> ptr;
-            std::vector<ptrdiff_t> col;
-
-            size_t count() const {
-                return col.size();
-            }
-
-            mutable std::vector<rhs_type>    val;
-            mutable std::vector<MPI_Request> req;
-        } send;
-
-        struct {
-            std::vector<ptrdiff_t> nbr;
-            std::vector<ptrdiff_t> ptr;
-
-            size_t count() const {
-                return val.size();
-            }
-
-            mutable std::vector<rhs_type>    val;
-            mutable std::vector<MPI_Request> req;
-        } recv;
-
-        std::shared_ptr<vector> x_rem;
-
-        comm_pattern(
-                communicator comm,
-                ptrdiff_t n_loc_cols,
-                size_t n_rem_cols, const ptrdiff_t *p_rem_cols
-                ) : comm(comm), loc_cols(n_loc_cols)
-        {
-            AMGCL_TIC("communication pattern");
-            // Get domain boundaries
-            std::vector<ptrdiff_t> domain = comm.exclusive_sum(n_loc_cols);
-            loc_beg = domain[comm.rank];
-
-            // Renumber remote columns,
-            // find out how many remote values we need from each process.
-            std::vector<ptrdiff_t> rem_cols(p_rem_cols, p_rem_cols + n_rem_cols);
-
-            std::sort(rem_cols.begin(), rem_cols.end());
-            rem_cols.erase(std::unique(rem_cols.begin(), rem_cols.end()), rem_cols.end());
-
-            ptrdiff_t ncols = rem_cols.size();
-            ptrdiff_t rnbr = 0, snbr = 0, send_size = 0;
-
-            {
-                std::vector<int> rcounts(comm.size, 0);
-                std::vector<int> scounts(comm.size);
-
-                // Build index for column renumbering;
-                // count how many domains send us data and how much.
-                idx.reserve(2 * ncols);
-                for(int i = 0, d = 0, last = -1; i < ncols; ++i) {
-                    while(rem_cols[i] >= domain[d + 1]) ++d;
-
-                    ++rcounts[d];
-
-                    if (last < d) {
-                        last = d;
-                        ++rnbr;
-                    }
-
-                    idx.insert(idx.end(), std::make_pair(
-                                rem_cols[i], std::make_tuple(rnbr-1,i)));
-                }
-
-                recv.val.resize(ncols);
-                recv.req.resize(rnbr);
-
-                recv.nbr.reserve(rnbr);
-                recv.ptr.reserve(rnbr + 1); recv.ptr.push_back(0);
-
-                for(int d = 0; d < comm.size; ++d) {
-                    if (rcounts[d]) {
-                        recv.nbr.push_back(d);
-                        recv.ptr.push_back(recv.ptr.back() + rcounts[d]);
-                    }
-                }
-
-                MPI_Alltoall(rcounts.data(), 1, MPI_INT, scounts.data(), 1, MPI_INT, comm);
-
-                for(ptrdiff_t d = 0; d < comm.size; ++d) {
-                    if (scounts[d]) {
-                        ++snbr;
-                        send_size += scounts[d];
-                    }
-                }
-
-                send.col.resize(send_size);
-                send.val.resize(send_size);
-                send.req.resize(snbr);
-
-                send.nbr.reserve(snbr);
-                send.ptr.reserve(snbr + 1); send.ptr.push_back(0);
-
-                for(ptrdiff_t d = 0; d < comm.size; ++d) {
-                    if (scounts[d]) {
-                        send.nbr.push_back(d);
-                        send.ptr.push_back(send.ptr.back() + scounts[d]);
-                    }
-                }
-            }
-
-            // What columns do you need from me?
-            for(size_t i = 0; i < send.nbr.size(); ++i)
-                MPI_Irecv(&send.col[send.ptr[i]], send.ptr[i+1] - send.ptr[i],
-                        datatype<ptrdiff_t>(), send.nbr[i], tag_exc_cols, comm, &send.req[i]);
-
-            // Here is what I need from you:
-            for(size_t i = 0; i < recv.nbr.size(); ++i)
-                MPI_Isend(&rem_cols[recv.ptr[i]], recv.ptr[i+1] - recv.ptr[i],
-                        datatype<ptrdiff_t>(), recv.nbr[i], tag_exc_cols, comm, &recv.req[i]);
-
-            AMGCL_TIC("MPI Wait");
-            MPI_Waitall(recv.req.size(), recv.req.data(), MPI_STATUSES_IGNORE);
-            MPI_Waitall(send.req.size(), send.req.data(), MPI_STATUSES_IGNORE);
-            AMGCL_TOC("MPI Wait");
-
-            // Shift columns to send to local numbering:
-            for(ptrdiff_t &c : send.col) c -= loc_beg;
-
-            AMGCL_TOC("communication pattern");
-        }
-
-        template <class OtherBackend>
-        comm_pattern(const comm_pattern<OtherBackend> &C) :
-            comm(C.comm),
-            idx(C.idx),
-            loc_beg(C.loc_beg),
-            loc_cols(C.loc_cols)
-        {
-            send.nbr = C.send.nbr;
-            send.ptr = C.send.ptr;
-            send.col = C.send.col;
-            send.val.resize(C.send.val.size());
-            send.req.resize(C.send.req.size());
-
-            recv.nbr = C.recv.nbr;
-            recv.ptr = C.recv.ptr;
-            recv.val.resize(C.recv.val.size());
-            recv.req.resize(C.recv.req.size());
-        }
-
-        void move_to_backend(const backend_params &bprm = backend_params()) {
-            if (!x_rem) {
-                x_rem  = Backend::create_vector(recv.count(), bprm);
-            }
-
-            if (!gather) {
-                gather = std::make_shared<Gather>(loc_cols, send.col, bprm);
-            }
-        }
-
-        int domain(ptrdiff_t col) const {
-            return std::get<0>(idx.at(col));
-        }
-
-        int local_index(ptrdiff_t col) const {
-            return std::get<1>(idx.at(col));
-        }
-
-        std::tuple<int, int> remote_info(ptrdiff_t col) const {
-            return idx.at(col);
-        }
-
-        std::unordered_map<ptrdiff_t, std::tuple<int, int> >::const_iterator
-        remote_begin() const {
-            return idx.cbegin();
-        }
-
-        std::unordered_map<ptrdiff_t, std::tuple<int, int> >::const_iterator
-        remote_end() const {
-            return idx.cend();
-        }
-
-        size_t renumber(size_t n, ptrdiff_t *col) const {
-            for(size_t i = 0; i < n; ++i)
-                col[i] = std::get<1>(idx.at(col[i]));
-            return recv.count();
-        }
-
-        bool needs_remote() const {
-            return !recv.val.empty();
-        }
-
-        template <class Vector>
-        void start_exchange(const Vector &x) const {
-            // Start receiving ghost values from our neighbours.
-            for(size_t i = 0; i < recv.nbr.size(); ++i)
-                MPI_Irecv(&recv.val[recv.ptr[i]], recv.ptr[i+1] - recv.ptr[i],
-                        datatype<rhs_type>(), recv.nbr[i], tag_exc_vals, comm, &recv.req[i]);
-
-            // Start sending our data to neighbours.
-            if (!send.val.empty()) {
-                (*gather)(x, send.val);
-
-                for(size_t i = 0; i < send.nbr.size(); ++i)
-                    MPI_Isend(&send.val[send.ptr[i]], send.ptr[i+1] - send.ptr[i],
-                            datatype<rhs_type>(), send.nbr[i], tag_exc_vals, comm, &send.req[i]);
-            }
-        }
-
-        void finish_exchange() const {
-            AMGCL_TIC("MPI Wait");
-            MPI_Waitall(recv.req.size(), recv.req.data(), MPI_STATUSES_IGNORE);
-            MPI_Waitall(send.req.size(), send.req.data(), MPI_STATUSES_IGNORE);
-            AMGCL_TOC("MPI Wait");
-
-            if (!recv.val.empty())
-                backend::copy(recv.val, *x_rem);
-        }
-
-        template <typename T>
-        void exchange(const T *send_val, T *recv_val) const {
-            for(size_t i = 0; i < recv.nbr.size(); ++i)
-                MPI_Irecv(&recv_val[recv.ptr[i]], recv.ptr[i+1] - recv.ptr[i],
-                        datatype<T>(), recv.nbr[i], tag_exc_vals, comm, &recv.req[i]);
-
-            for(size_t i = 0; i < send.nbr.size(); ++i)
-                MPI_Isend(const_cast<T*>(&send_val[send.ptr[i]]), send.ptr[i+1] - send.ptr[i],
-                        datatype<T>(), send.nbr[i], tag_exc_vals, comm, &send.req[i]);
-
-            AMGCL_TIC("MPI Wait");
-            MPI_Waitall(recv.req.size(), recv.req.data(), MPI_STATUSES_IGNORE);
-            MPI_Waitall(send.req.size(), send.req.data(), MPI_STATUSES_IGNORE);
-            AMGCL_TOC("MPI Wait");
-        }
-
-        communicator mpi_comm() const {
-            return comm;
-        }
-
-        ptrdiff_t loc_col_shift() const {
-            return loc_beg;
-        }
-
-    private:
-        typedef typename Backend::gather Gather;
-
-        static const int tag_set_comm = 1001;
-        static const int tag_exc_cols = 1002;
-        static const int tag_exc_vals = 1003;
-
-        communicator comm;
-
-        std::unordered_map<ptrdiff_t, std::tuple<int, int> > idx;
-        std::shared_ptr<Gather> gather;
-        ptrdiff_t loc_beg, loc_cols;
-
-        template <class B>
-        friend class comm_pattern;
-};
-
-template <class Backend>
-class distributed_matrix {
-    public:
-        typedef typename Backend::value_type value_type;
-        typedef typename math::rhs_of<value_type>::type rhs_type;
-        typedef typename math::scalar_of<value_type>::type scalar_type;
-        typedef typename Backend::params backend_params;
-        typedef typename Backend::matrix matrix;
-        typedef comm_pattern<Backend> CommPattern;
-        typedef backend::crs<value_type> build_matrix;
-
-        distributed_matrix(
-                communicator comm,
-                std::shared_ptr<build_matrix> a_loc,
-                std::shared_ptr<build_matrix> a_rem,
-                std::shared_ptr<CommPattern>  c = std::shared_ptr<CommPattern>()
-                )
-            : a_loc(a_loc), a_rem(a_rem)
-        {
-            if (c) {
-                C = c;
-            } else {
-                C = std::make_shared<CommPattern>(comm, a_loc->ncols, a_rem->nnz, a_rem->col);
-            }
-
-            a_rem->ncols = C->recv.count();
-
-            n_loc_rows     = a_loc->nrows;
-            n_loc_cols     = a_loc->ncols;
-            n_loc_nonzeros = a_loc->nnz + a_rem->nnz;
-
-            n_glob_rows     = comm.reduce(MPI_SUM, n_loc_rows);
-            n_glob_cols     = comm.reduce(MPI_SUM, n_loc_cols);
-            n_glob_nonzeros = comm.reduce(MPI_SUM, n_loc_nonzeros);
-        }
-
-        // Copy the distributed_matrix from another backend
-        template <class OtherBackend>
-        distributed_matrix(const distributed_matrix<OtherBackend> &A)
-            : a_loc(std::make_shared<build_matrix>(*A.local())),
-              a_rem(std::make_shared<build_matrix>(*A.remote()))
-        {
-            C = std::make_shared<CommPattern>(A.cpat());
-
-            this->a_rem->ncols = C->recv.count();
-
-            n_loc_rows      = A.loc_rows();
-            n_loc_cols      = A.loc_cols();
-            n_loc_nonzeros  = A.loc_nonzeros();
-            n_glob_rows     = A.glob_rows();
-            n_glob_cols     = A.glob_cols();
-            n_glob_nonzeros = A.glob_nonzeros();
-        }
-
-        template <class Matrix>
-        distributed_matrix(
-                communicator comm,
-                const Matrix &A,
-                ptrdiff_t _n_loc_cols = -1)
-            : n_loc_rows(backend::rows(A)),
-              n_loc_cols(_n_loc_cols < 0 ? n_loc_rows : _n_loc_cols),
-              n_loc_nonzeros(backend::nonzeros(A))
-        {
-            // Get sizes of each domain in comm.
-            std::vector<ptrdiff_t> domain = comm.exclusive_sum(n_loc_cols);
-            ptrdiff_t loc_beg = domain[comm.rank];
-            ptrdiff_t loc_end = domain[comm.rank + 1];
-
-            n_glob_cols     = domain.back();
-            n_glob_rows     = comm.reduce(MPI_SUM, n_loc_rows);
-            n_glob_nonzeros = comm.reduce(MPI_SUM, n_loc_nonzeros);
-
-            // Split the matrix into local and remote parts.
-            a_loc = std::make_shared<build_matrix>();
-            a_rem = std::make_shared<build_matrix>();
-
-            build_matrix &A_loc = *a_loc;
-            build_matrix &A_rem = *a_rem;
-
-            A_loc.set_size(n_loc_rows, n_loc_cols, true);
-            A_rem.set_size(n_loc_rows, 0, true);
-
-#pragma omp parallel for
-            for(ptrdiff_t i = 0; i < n_loc_rows; ++i) {
-                for(auto a = backend::row_begin(A, i); a; ++a) {
-                    ptrdiff_t c = a.col();
-
-                    if (loc_beg <= c && c < loc_end)
-                        ++A_loc.ptr[i + 1];
-                    else
-                        ++A_rem.ptr[i + 1];
-                }
-            }
-
-            A_loc.set_nonzeros(A_loc.scan_row_sizes());
-            A_rem.set_nonzeros(A_rem.scan_row_sizes());
-
-#pragma omp parallel for
-            for(ptrdiff_t i = 0; i < n_loc_rows; ++i) {
-                ptrdiff_t loc_head = A_loc.ptr[i];
-                ptrdiff_t rem_head = A_rem.ptr[i];
-
-                for(auto a = backend::row_begin(A, i); a; ++a) {
-                    ptrdiff_t  c = a.col();
-                    value_type v = a.value();
-
-                    if (loc_beg <= c && c < loc_end) {
-                        A_loc.col[loc_head] = c - loc_beg;
-                        A_loc.val[loc_head] = v;
-                        ++loc_head;
-                    } else {
-                        A_rem.col[rem_head] = c;
-                        A_rem.val[rem_head] = v;
-                        ++rem_head;
-                    }
-                }
-            }
-
-            C = std::make_shared<CommPattern>(comm, n_loc_cols, a_rem->nnz, a_rem->col);
-            a_rem->ncols = C->recv.count();
-        }
-
-        communicator comm() const {
-            return C->mpi_comm();
-        }
-
-        std::shared_ptr<build_matrix> local() const {
-            return a_loc;
-        }
-
-        std::shared_ptr<build_matrix> remote() const {
-            return a_rem;
-        }
-
-        std::shared_ptr<matrix> local_backend() const {
-            return A_loc;
-        }
-
-        std::shared_ptr<matrix> remote_backend() const {
-            return A_rem;
-        }
-
-        ptrdiff_t loc_rows() const {
-            return n_loc_rows;
-        }
-
-        ptrdiff_t loc_cols() const {
-            return n_loc_cols;
-        }
-
-        ptrdiff_t loc_col_shift() const {
-            return C->loc_col_shift();
-        }
-
-        ptrdiff_t loc_nonzeros() const {
-            return n_loc_nonzeros;
-        }
-
-        ptrdiff_t glob_rows() const {
-            return n_glob_rows;
-        }
-
-        ptrdiff_t glob_cols() const {
-            return n_glob_cols;
-        }
-
-        ptrdiff_t glob_nonzeros() const {
-            return n_glob_nonzeros;
-        }
-
-        const comm_pattern<Backend>& cpat() const {
-            return *C;
-        }
-
-        void set_local(std::shared_ptr<matrix> a) {
-            A_loc = a;
-        }
-
-        void move_to_backend(const backend_params &bprm = backend_params(), bool keep_src = false) {
-            AMGCL_TIC("move to backend");
-            if (!A_loc) {
-                A_loc = Backend::copy_matrix(a_loc, bprm);
-            }
-
-            if (!A_rem && a_rem && a_rem->nnz > 0) {
-                std::vector<ptrdiff_t> backup;
-                if (keep_src) {
-                    backup.assign(a_rem->col, a_rem->col + a_rem->nnz);
-                }
-
-                C->renumber(a_rem->nnz, a_rem->col);
-                A_rem = Backend::copy_matrix(a_rem, bprm);
-
-                if (keep_src) {
-                    std::copy(backup.begin(), backup.end(), a_rem->col);
-                }
-            }
-
-            C->move_to_backend(bprm);
-
-            if (!keep_src) {
-                a_loc.reset();
-                a_rem.reset();
-            }
-            AMGCL_TOC("move to backend");
-        }
-
-        template <class A, class VecX, class B, class VecY>
-        void mul(A alpha, const VecX &x, B beta, VecY &y) const {
-            const auto one = math::identity<scalar_type>();
-
-            C->start_exchange(x);
-
-            // Compute local part of the product.
-            backend::spmv(alpha, *A_loc, x, beta, y);
-
-            // Compute remote part of the product.
-            C->finish_exchange();
-
-            if (C->needs_remote())
-                backend::spmv(alpha, *A_rem, *C->x_rem, one, y);
-        }
-
-        template <class Vec1, class Vec2, class Vec3>
-        void residual(const Vec1 &f, const Vec2 &x, Vec3 &r) const {
-            const auto one = math::identity<scalar_type>();
-
-            C->start_exchange(x);
-            backend::residual(f, *A_loc, x, r);
-
-            C->finish_exchange();
-
-            if (C->needs_remote())
-                backend::spmv(-one, *A_rem, *C->x_rem, one, r);
-        }
-
-    private:
-        std::shared_ptr<CommPattern>  C;
-        std::shared_ptr<matrix> A_loc, A_rem;
-        std::shared_ptr<build_matrix> a_loc, a_rem;
-
-        ptrdiff_t n_loc_rows, n_glob_rows;
-        ptrdiff_t n_loc_cols, n_glob_cols;
-        ptrdiff_t n_loc_nonzeros, n_glob_nonzeros;
-};
-
-template <class Backend>
-std::shared_ptr< distributed_matrix<Backend> >
-transpose(const distributed_matrix<Backend> &A) {
-    AMGCL_TIC("MPI Transpose");
-    typedef typename Backend::value_type value_type;
-    typedef comm_pattern<Backend>        CommPattern;
-    typedef backend::crs<value_type>     build_matrix;
-
-    static const int tag_cnt = 2001;
-    static const int tag_col = 2002;
-    static const int tag_val = 2003;
-
-    communicator comm = A.comm();
-    const CommPattern &C = A.cpat();
-
-    build_matrix &A_loc = *A.local();
-    build_matrix &A_rem = *A.remote();
-
-    ptrdiff_t nrows = A_loc.ncols;
-    ptrdiff_t ncols = A_loc.nrows;
-
-    std::vector<MPI_Request> recv_cnt_req(C.send.req.size());
-    std::vector<MPI_Request> recv_col_req(C.send.req.size());
-    std::vector<MPI_Request> recv_val_req(C.send.req.size());
-
-    std::vector<MPI_Request> send_cnt_req(C.recv.req.size());
-    std::vector<MPI_Request> send_col_req(C.recv.req.size());
-    std::vector<MPI_Request> send_val_req(C.recv.req.size());
-
-    // Our transposed remote part becomes remote part of someone else,
-    // and the other way around.
-    std::shared_ptr<build_matrix> t_ptr;
-    {
-        std::vector<ptrdiff_t> tmp_col(A_rem.col, A_rem.col + A_rem.nnz);
-        C.renumber(tmp_col.size(), tmp_col.data());
-
-        ptrdiff_t *a_rem_col = tmp_col.data();
-        std::swap(a_rem_col, A_rem.col);
-
-        t_ptr = backend::transpose(A_rem);
-
-        std::swap(a_rem_col, A_rem.col);
-    }
-    build_matrix &t_rem = *t_ptr;
-
-    // Shift to global numbering:
-    std::vector<ptrdiff_t> domain = comm.exclusive_sum(ncols);
-    ptrdiff_t loc_beg = domain[comm.rank];
-    for(size_t i = 0; i < t_rem.nnz; ++i)
-        t_rem.col[i] += loc_beg;
-
-    // Shift from row pointers to row sizes:
-    std::vector<ptrdiff_t> row_size(t_rem.nrows);
-    for(size_t i = 0; i < t_rem.nrows; ++i)
-        row_size[i] = t_rem.ptr[i+1] - t_rem.ptr[i];
-
-    // Sizes of transposed remote blocks:
-    // 1. Exchange rem_ptr
-    std::vector<ptrdiff_t> rem_ptr(C.send.count() + 1); rem_ptr[0] = 0;
-
-    for(size_t i = 0; i < C.send.nbr.size(); ++i) {
-        ptrdiff_t beg = C.send.ptr[i];
-        ptrdiff_t end = C.send.ptr[i + 1];
-
-        MPI_Irecv(&rem_ptr[beg + 1], end - beg, datatype<ptrdiff_t>(),
-                C.send.nbr[i], tag_cnt, comm, &recv_cnt_req[i]);
-    }
-
-    for(size_t i = 0; i < C.recv.nbr.size(); ++i) {
-        ptrdiff_t beg = C.recv.ptr[i];
-        ptrdiff_t end = C.recv.ptr[i + 1];
-
-        MPI_Isend(&row_size[beg], end - beg, datatype<ptrdiff_t>(),
-                C.recv.nbr[i], tag_cnt, comm, &send_cnt_req[i]);
-    }
-
-    AMGCL_TIC("MPI Wait");
-    MPI_Waitall(recv_cnt_req.size(), recv_cnt_req.data(), MPI_STATUSES_IGNORE);
-    AMGCL_TOC("MPI Wait");
-    std::partial_sum(rem_ptr.begin(), rem_ptr.end(), rem_ptr.begin());
-
-    // 2. Start exchange of rem_col, rem_val
-    std::vector<ptrdiff_t>  rem_col(rem_ptr.back());
-    std::vector<value_type> rem_val(rem_ptr.back());
-
-    for(size_t i = 0; i < C.send.nbr.size(); ++i) {
-        ptrdiff_t rbeg = C.send.ptr[i];
-        ptrdiff_t rend = C.send.ptr[i + 1];
-
-        ptrdiff_t cbeg = rem_ptr[rbeg];
-        ptrdiff_t cend = rem_ptr[rend];
-
-        MPI_Irecv(&rem_col[cbeg], cend - cbeg, datatype<ptrdiff_t>(),
-                C.send.nbr[i], tag_col, comm, &recv_col_req[i]);
-
-        MPI_Irecv(&rem_val[cbeg], cend - cbeg, datatype<value_type>(),
-                C.send.nbr[i], tag_val, comm, &recv_val_req[i]);
-    }
-
-    for(size_t i = 0; i < C.recv.nbr.size(); ++i) {
-        ptrdiff_t rbeg = C.recv.ptr[i];
-        ptrdiff_t rend = C.recv.ptr[i + 1];
-
-        ptrdiff_t cbeg = t_rem.ptr[rbeg];
-        ptrdiff_t cend = t_rem.ptr[rend];
-
-        MPI_Isend(&t_rem.col[cbeg], cend - cbeg, datatype<ptrdiff_t>(),
-                C.recv.nbr[i], tag_col, comm, &send_col_req[i]);
-
-        MPI_Isend(&t_rem.val[cbeg], cend - cbeg, datatype<value_type>(),
-                C.recv.nbr[i], tag_val, comm, &send_val_req[i]);
-    }
-
-    // 3. While rem_col and rem_val are in flight,
-    //    start constructing our remote part:
-    auto T_ptr = std::make_shared<build_matrix>();
-    build_matrix &T_rem = *T_ptr;
-    T_rem.set_size(nrows, 0, true);
-
-    for(size_t i = 0; i < C.send.count(); ++i)
-        T_rem.ptr[1 + C.send.col[i]] += rem_ptr[i+1] - rem_ptr[i];
-
-    T_rem.scan_row_sizes();
-    T_rem.set_nonzeros();
-
-    // 4. Finish rem_col and rem_val exchange, and
-    //    finish contruction of our remote part.
-    AMGCL_TIC("MPI Wait");
-    MPI_Waitall(recv_col_req.size(), recv_col_req.data(), MPI_STATUSES_IGNORE);
-    MPI_Waitall(recv_val_req.size(), recv_val_req.data(), MPI_STATUSES_IGNORE);
-    AMGCL_TOC("MPI Wait");
-
-    for(size_t i = 0; i < C.send.count(); ++i) {
-        ptrdiff_t row  = C.send.col[i];
-        ptrdiff_t head = T_rem.ptr[row];
-
-        for(ptrdiff_t j = rem_ptr[i]; j < rem_ptr[i+1]; ++j, ++head) {
-            T_rem.col[head] = rem_col[j];
-            T_rem.val[head] = rem_val[j];
-        }
-
-        T_rem.ptr[row] = head;
-    }
-
-    std::rotate(T_rem.ptr, T_rem.ptr + nrows, T_rem.ptr + nrows + 1);
-    T_rem.ptr[0] = 0;
-
-    AMGCL_TIC("MPI Wait");
-    MPI_Waitall(send_cnt_req.size(), send_cnt_req.data(), MPI_STATUSES_IGNORE);
-    MPI_Waitall(send_col_req.size(), send_col_req.data(), MPI_STATUSES_IGNORE);
-    MPI_Waitall(send_val_req.size(), send_val_req.data(), MPI_STATUSES_IGNORE);
-    AMGCL_TOC("MPI Wait");
-
-    AMGCL_TOC("MPI Transpose");
-
-    return std::make_shared< distributed_matrix<Backend> >(
-            comm, backend::transpose(A_loc), T_ptr);
-}
-
-template <class Backend>
-std::shared_ptr< backend::crs<typename Backend::value_type> >
-remote_rows(
-        const comm_pattern<Backend> &C,
-        const distributed_matrix<Backend> &B,
-        bool need_values = true
-        )
-{
-    typedef typename Backend::value_type value_type;
-    typedef backend::crs<value_type>     build_matrix;
-
-    static const int tag_ptr = 3001;
-    static const int tag_col = 3002;
-    static const int tag_val = 3003;
-
-    AMGCL_TIC("remote_rows");
-    communicator comm = C.mpi_comm();
-
-    build_matrix &B_loc = *B.local();
-    build_matrix &B_rem = *B.remote();
-    ptrdiff_t B_beg = B.loc_col_shift();
-
-    size_t nrecv = C.recv.nbr.size();
-    size_t nsend = C.send.nbr.size();
-
-    // Create blocked matrix to send to each domain
-    // that needs data from us:
-    std::vector<MPI_Request> send_ptr_req(nsend);
-    std::vector<MPI_Request> send_col_req(nsend);
-    std::vector<MPI_Request> send_val_req(nsend);
-
-    std::vector<build_matrix> send_rows(nsend);
-
-    for(size_t k = 0; k < nsend; ++k) {
-        ptrdiff_t beg = C.send.ptr[k];
-        ptrdiff_t end = C.send.ptr[k + 1];
-
-        build_matrix &m = send_rows[k];
-        m.set_size(end - beg, 0, false);
-
-        for(ptrdiff_t i = 0, ii = beg; ii < end; ++i, ++ii) {
-            ptrdiff_t r = C.send.col[ii];
-
-            ptrdiff_t w =
-                (B_loc.ptr[r + 1] - B_loc.ptr[r]) +
-                (B_rem.ptr[r + 1] - B_rem.ptr[r]);
-
-            m.ptr[i] = w;
-            m.nnz += w;
-        }
-
-        MPI_Isend(m.ptr, m.nrows, datatype<ptrdiff_t>(),
-                C.send.nbr[k], tag_ptr, comm, &send_ptr_req[k]);
-
-        m.set_nonzeros(m.nnz, need_values);
-
-        for(ptrdiff_t i = 0, ii = beg, head = 0; ii < end; ++i, ++ii) {
-            ptrdiff_t r = C.send.col[ii];
-
-            // Contribution of the local part:
-            for(ptrdiff_t j = B_loc.ptr[r]; j < B_loc.ptr[r+1]; ++j) {
-                m.col[head] = B_loc.col[j] + B_beg;
-
-                if (need_values) m.val[head] = B_loc.val[j];
-
-                ++head;
-            }
-
-            // Contribution of the remote part:
-            for(ptrdiff_t j = B_rem.ptr[r]; j < B_rem.ptr[r+1]; ++j) {
-                m.col[head] = B_rem.col[j];
-
-                if (need_values) m.val[head] = B_rem.val[j];
-
-                ++head;
-            }
-        }
-
-        MPI_Isend(m.col, m.nnz, datatype<ptrdiff_t>(),
-                C.send.nbr[k], tag_col, comm, &send_col_req[k]);
-        if (need_values)
-            MPI_Isend(m.val, m.nnz, datatype<value_type>(),
-                    C.send.nbr[k], tag_val, comm, &send_val_req[k]);
-    }
-
-    // Receive rows of B in block format from our neighbors:
-    std::vector<MPI_Request> recv_ptr_req(nrecv);
-    std::vector<MPI_Request> recv_col_req(nrecv);
-    std::vector<MPI_Request> recv_val_req(nrecv);
-
-    auto B_nbr = std::make_shared<build_matrix>();
-    B_nbr->set_size(C.recv.count(), 0, false);
-    B_nbr->ptr[0] = 0;
-
-    for(size_t k = 0; k < nrecv; ++k) {
-        ptrdiff_t beg = C.recv.ptr[k];
-        ptrdiff_t end = C.recv.ptr[k + 1];
-
-        MPI_Irecv(&B_nbr->ptr[beg + 1], end - beg, datatype<ptrdiff_t>(),
-                C.recv.nbr[k], tag_ptr, comm, &recv_ptr_req[k]);
-    }
-
-    AMGCL_TIC("MPI Wait");
-    MPI_Waitall(recv_ptr_req.size(), recv_ptr_req.data(), MPI_STATUSES_IGNORE);
-    AMGCL_TOC("MPI Wait");
-
-    B_nbr->set_nonzeros(B_nbr->scan_row_sizes(), need_values);
-
-    for(size_t k = 0; k < nrecv; ++k) {
-        ptrdiff_t rbeg = C.recv.ptr[k];
-        ptrdiff_t rend = C.recv.ptr[k + 1];
-
-        ptrdiff_t cbeg = B_nbr->ptr[rbeg];
-        ptrdiff_t cend = B_nbr->ptr[rend];
-
-        MPI_Irecv(&B_nbr->col[cbeg], cend - cbeg, datatype<ptrdiff_t>(),
-                C.recv.nbr[k], tag_col, comm, &recv_col_req[k]);
-
-        if (need_values)
-            MPI_Irecv(&B_nbr->val[cbeg], cend - cbeg, datatype<value_type>(),
-                    C.recv.nbr[k], tag_val, comm, &recv_val_req[k]);
-    }
-
-    AMGCL_TIC("MPI Wait");
-    MPI_Waitall(send_ptr_req.size(), send_ptr_req.data(), MPI_STATUSES_IGNORE);
-    MPI_Waitall(send_col_req.size(), send_col_req.data(), MPI_STATUSES_IGNORE);
-    MPI_Waitall(recv_col_req.size(), recv_col_req.data(), MPI_STATUSES_IGNORE);
-
-    if (need_values) {
-        MPI_Waitall(send_val_req.size(), send_val_req.data(), MPI_STATUSES_IGNORE);
-        MPI_Waitall(recv_val_req.size(), recv_val_req.data(), MPI_STATUSES_IGNORE);
-    }
-    AMGCL_TOC("MPI Wait");
-
-    AMGCL_TOC("remote_rows");
-    return B_nbr;
-}
-
-template <class Backend>
-std::shared_ptr< distributed_matrix<Backend> >
-product(const distributed_matrix<Backend> &A, const distributed_matrix<Backend> &B) {
-    typedef typename Backend::value_type value_type;
-    typedef backend::crs<value_type>     build_matrix;
-    AMGCL_TIC("product");
-
-    const comm_pattern<Backend> &Acp = A.cpat();
-
-    build_matrix &A_loc = *A.local();
-    build_matrix &A_rem = *A.remote();
-    build_matrix &B_loc = *B.local();
-    build_matrix &B_rem = *B.remote();
-
-    ptrdiff_t A_rows = A.loc_rows();
-    ptrdiff_t B_cols = B.loc_cols();
-
-    ptrdiff_t B_beg = B.loc_col_shift();
-    ptrdiff_t B_end = B_beg + B_cols;
-
-    auto b_nbr = remote_rows(Acp, B);
-    build_matrix &B_nbr = *b_nbr;
-
-    // Build mapping from global to local column numbers in the remote part of
-    // the product matrix.
-    std::vector<ptrdiff_t> rem_cols(B_rem.nnz + B_nbr.nnz);
-
-    std::copy(B_nbr.col, B_nbr.col + B_nbr.nnz,
-            std::copy(B_rem.col, B_rem.col + B_rem.nnz, rem_cols.begin()));
-
-    std::sort(rem_cols.begin(), rem_cols.end());
-    rem_cols.erase(std::unique(rem_cols.begin(), rem_cols.end()), rem_cols.end());
-
-    ptrdiff_t n_rem_cols = 0;
-    std::unordered_map<ptrdiff_t, int> rem_idx(2 * rem_cols.size());
-    for(ptrdiff_t c : rem_cols) {
-        if (c >= B_beg && c < B_end) continue;
-        rem_idx[c] = n_rem_cols++;
-    }
-
-    // Build the product.
-    auto c_loc = std::make_shared<build_matrix>();
-    auto c_rem = std::make_shared<build_matrix>();
-
-    build_matrix &C_loc = *c_loc;
-    build_matrix &C_rem = *c_rem;
-
-    C_loc.set_size(A_rows, B_cols, false);
-    C_rem.set_size(A_rows, 0,      false);
-
-    C_loc.ptr[0] = 0;
-    C_rem.ptr[0] = 0;
-
-    AMGCL_TIC("analyze");
-#pragma omp parallel
-    {
-        std::vector<ptrdiff_t> loc_marker(B_end - B_beg, -1);
-        std::vector<ptrdiff_t> rem_marker(n_rem_cols,    -1);
-
-#pragma omp for
-        for(ptrdiff_t ia = 0; ia < A_rows; ++ia) {
-            ptrdiff_t loc_cols = 0;
-            ptrdiff_t rem_cols = 0;
-
-            for(ptrdiff_t ja = A_loc.ptr[ia], ea = A_loc.ptr[ia + 1]; ja < ea; ++ja) {
-                ptrdiff_t  ca = A_loc.col[ja];
-
-                for(ptrdiff_t jb = B_loc.ptr[ca], eb = B_loc.ptr[ca+1]; jb < eb; ++jb) {
-                    ptrdiff_t  cb = B_loc.col[jb];
-
-                    if (loc_marker[cb] != ia) {
-                        loc_marker[cb]  = ia;
-                        ++loc_cols;
-                    }
-                }
-
-                for(ptrdiff_t jb = B_rem.ptr[ca], eb = B_rem.ptr[ca+1]; jb < eb; ++jb) {
-                    ptrdiff_t  cb = rem_idx[B_rem.col[jb]];
-
-                    if (rem_marker[cb] != ia) {
-                        rem_marker[cb]  = ia;
-                        ++rem_cols;
-                    }
-                }
-            }
-
-            for(ptrdiff_t ja = A_rem.ptr[ia], ea = A_rem.ptr[ia + 1]; ja < ea; ++ja) {
-                ptrdiff_t  ca = Acp.local_index(A_rem.col[ja]);
-
-                for(ptrdiff_t jb = B_nbr.ptr[ca], eb = B_nbr.ptr[ca+1]; jb < eb; ++jb) {
-                    ptrdiff_t  cb = B_nbr.col[jb];
-
-                    if (cb >= B_beg && cb < B_end) {
-                        cb -= B_beg;
-
-                        if (loc_marker[cb] != ia) {
-                            loc_marker[cb]  = ia;
-                            ++loc_cols;
-                        }
-                    } else {
-                        cb = rem_idx[cb];
-
-                        if (rem_marker[cb] != ia) {
-                            rem_marker[cb]  = ia;
-                            ++rem_cols;
-                        }
-                    }
-                }
-            }
-
-            C_loc.ptr[ia + 1] = loc_cols;
-            C_rem.ptr[ia + 1] = rem_cols;
-        }
-    }
-    AMGCL_TOC("analyze");
-
-    C_loc.set_nonzeros(C_loc.scan_row_sizes());
-    C_rem.set_nonzeros(C_rem.scan_row_sizes());
-
-    AMGCL_TIC("compute");
-#pragma omp parallel
-    {
-        std::vector<ptrdiff_t> loc_marker(B_end - B_beg, -1);
-        std::vector<ptrdiff_t> rem_marker(n_rem_cols,    -1);
-
-#pragma omp for
-        for(ptrdiff_t ia = 0; ia < A_rows; ++ia) {
-            ptrdiff_t loc_beg = C_loc.ptr[ia];
-            ptrdiff_t rem_beg = C_rem.ptr[ia];
-            ptrdiff_t loc_end = loc_beg;
-            ptrdiff_t rem_end = rem_beg;
-
-            for(ptrdiff_t ja = A_loc.ptr[ia], ea = A_loc.ptr[ia + 1]; ja < ea; ++ja) {
-                ptrdiff_t  ca = A_loc.col[ja];
-                value_type va = A_loc.val[ja];
-
-                for(ptrdiff_t jb = B_loc.ptr[ca], eb = B_loc.ptr[ca+1]; jb < eb; ++jb) {
-                    ptrdiff_t  cb = B_loc.col[jb];
-                    value_type vb = B_loc.val[jb];
-
-                    if (loc_marker[cb] < loc_beg) {
-                        loc_marker[cb] = loc_end;
-
-                        C_loc.col[loc_end] = cb;
-                        C_loc.val[loc_end] = va * vb;
-
-                        ++loc_end;
-                    } else {
-                        C_loc.val[loc_marker[cb]] += va * vb;
-                    }
-                }
-
-                for(ptrdiff_t jb = B_rem.ptr[ca], eb = B_rem.ptr[ca+1]; jb < eb; ++jb) {
-                    ptrdiff_t  gb = B_rem.col[jb];
-                    ptrdiff_t  cb = rem_idx[gb];
-                    value_type vb = B_rem.val[jb];
-
-                    if (rem_marker[cb] < rem_beg) {
-                        rem_marker[cb] = rem_end;
-
-                        C_rem.col[rem_end] = gb;
-                        C_rem.val[rem_end] = va * vb;
-
-                        ++rem_end;
-                    } else {
-                        C_rem.val[rem_marker[cb]] += va * vb;
-                    }
-                }
-            }
-
-            for(ptrdiff_t ja = A_rem.ptr[ia], ea = A_rem.ptr[ia + 1]; ja < ea; ++ja) {
-                ptrdiff_t  ca = Acp.local_index(A_rem.col[ja]);
-                value_type va = A_rem.val[ja];
-
-                for(ptrdiff_t jb = B_nbr.ptr[ca], eb = B_nbr.ptr[ca+1]; jb < eb; ++jb) {
-                    ptrdiff_t  gb = B_nbr.col[jb];
-                    value_type vb = B_nbr.val[jb];
-
-                    if (gb >= B_beg && gb < B_end) {
-                        ptrdiff_t cb = gb - B_beg;
-
-                        if (loc_marker[cb] < loc_beg) {
-                            loc_marker[cb] = loc_end;
-
-                            C_loc.col[loc_end] = cb;
-                            C_loc.val[loc_end] = va * vb;
-
-                            ++loc_end;
-                        } else {
-                            C_loc.val[loc_marker[cb]] += va * vb;
-                        }
-                    } else {
-                        ptrdiff_t cb = rem_idx[gb];
-
-                        if (rem_marker[cb] < rem_beg) {
-                            rem_marker[cb] = rem_end;
-
-                            C_rem.col[rem_end] = gb;
-                            C_rem.val[rem_end] = va * vb;
-
-                            ++rem_end;
-                        } else {
-                            C_rem.val[rem_marker[cb]] += va * vb;
-                        }
-                    }
-                }
-            }
-        }
-    }
-    AMGCL_TOC("compute");
-    AMGCL_TOC("product");
-
-    return std::make_shared<distributed_matrix<Backend> >(A.comm(), c_loc, c_rem);
-}
-
-template <class Backend, class T>
-void scale(distributed_matrix<Backend> &A, T s) {
-    typedef typename Backend::value_type value_type;
-    typedef backend::crs<value_type> build_matrix;
-
-    build_matrix &A_loc = *A.local();
-    build_matrix &A_rem = *A.remote();
-
-    ptrdiff_t n = A_loc.nrows;
-
-#pragma omp parallel for
-        for(ptrdiff_t i = 0; i < n; ++i) {
-            for(ptrdiff_t j = A_loc.ptr[i], e = A_loc.ptr[i+1]; j < e; ++j)
-                A_loc.val[j] *= s;
-            for(ptrdiff_t j = A_rem.ptr[i], e = A_rem.ptr[i+1]; j < e; ++j)
-                A_rem.val[j] *= s;
-        }
-}
-
-template <class Backend>
-void sort_rows(distributed_matrix<Backend> &A) {
-    backend::sort_rows(*A.local());
-    backend::sort_rows(*A.remote());
-}
-
-} // namespace mpi
-
-namespace backend {
-
-template <class Backend>
-struct rows_impl< mpi::distributed_matrix<Backend> >
-{
-    static size_t get(const mpi::distributed_matrix<Backend> &A) {
-        return A.loc_rows();
-    }
-};
-
-template <class Backend, class Alpha, class Vec1, class Beta,  class Vec2>
-struct spmv_impl<Alpha, mpi::distributed_matrix<Backend>, Vec1, Beta, Vec2>
-{
-    static void apply(
-            Alpha alpha,
-            const mpi::distributed_matrix<Backend> &A,
-            const Vec1 &x, Beta beta, Vec2 &y)
-    {
-        A.mul(alpha, x, beta, y);
-    }
-};
-
-template <class Backend, class Vec1, class Vec2, class Vec3>
-struct residual_impl<mpi::distributed_matrix<Backend>, Vec1, Vec2, Vec3>
-{
-    static void apply(
-            const Vec1 &rhs,
-            const mpi::distributed_matrix<Backend> &A,
-            const Vec2 &x, Vec3 &r)
-    {
-        A.residual(rhs, x, r);
-    }
-};
-
-// Diagonal of the matrix
-template <class Backend>
-std::shared_ptr< numa_vector<typename Backend::value_type> >
-diagonal(const mpi::distributed_matrix<Backend> &A, bool invert = false) {
-    return diagonal(*A.local(), invert);
-}
-
-// Estimate spectral radius of the matrix.
-template <bool scale, class Backend>
-typename math::scalar_of<typename Backend::value_type>::type
-spectral_radius(const mpi::distributed_matrix<Backend> &A, int power_iters = 0)
-{
-    AMGCL_TIC("spectral radius");
-    typedef typename Backend::value_type               value_type;
-    typedef typename math::rhs_of<value_type>::type    rhs_type;
-    typedef typename math::scalar_of<value_type>::type scalar_type;
-    typedef backend::crs<value_type>                   build_matrix;
-
-    mpi::communicator comm = A.comm();
-
-    const build_matrix &A_loc = *A.local();
-    const build_matrix &A_rem = *A.remote();
-    const mpi::comm_pattern<Backend> &C = A.cpat();
-
-    const ptrdiff_t n = A_loc.nrows;
-    scalar_type radius = 0;
-
-    if (power_iters <= 0) {
-#pragma omp parallel
-        {
-            scalar_type emax = 0;
-            value_type  dia = math::identity<value_type>();
-
-#pragma omp for nowait
-            for(ptrdiff_t i = 0; i < n; ++i) {
-                scalar_type s = 0;
-
-                for(ptrdiff_t j = A_loc.ptr[i], e = A_loc.ptr[i+1]; j < e; ++j) {
-                    ptrdiff_t  c = A_loc.col[j];
-                    value_type v = A_loc.val[j];
-
-                    s += math::norm(v);
-
-                    if (scale && c == i) dia = v;
-                }
-
-                for(ptrdiff_t j = A_rem.ptr[i], e = A_rem.ptr[i+1]; j < e; ++j)
-                    s += math::norm(A_rem.val[j]);
-
-                if (scale) s *= math::norm(math::inverse(dia));
-
-                emax = std::max(emax, s);
-            }
-
-#pragma omp critical
-            radius = std::max(radius, emax);
-        }
-    } else {
-        backend::numa_vector<rhs_type>   b0(n, false), b1(n, false);
-        backend::numa_vector<ptrdiff_t>  rem_col(A_rem.nnz, false);
-
-        // Fill the initial vector with random values.
-        // Also extract the inverted matrix diagonal values.
-        scalar_type b0_loc_norm = 0;
-
-#pragma omp parallel
-        {
-#ifdef _OPENMP
-            int tid = omp_get_thread_num();
-            int nt  = omp_get_max_threads();
-#else
-            int tid = 0;
-            int nt  = 1;
-#endif
-            std::mt19937 rng(comm.size * nt + tid);
-            std::uniform_real_distribution<scalar_type> rnd(-1, 1);
-
-            scalar_type t_norm = 0;
-
-#pragma omp for nowait
-            for(ptrdiff_t i = 0; i < n; ++i) {
-                rhs_type v = math::constant<rhs_type>(rnd(rng));
-
-                b0[i] = v;
-                t_norm += math::norm(math::inner_product(v,v));
-
-                for(ptrdiff_t j = A_rem.ptr[i], e = A_rem.ptr[i+1]; j < e; ++j) {
-                    rem_col[j] = C.local_index(A_rem.col[j]);
-                }
-            }
-
-#pragma omp critical
-            b0_loc_norm += t_norm;
-        }
-
-        scalar_type b0_norm = comm.reduce(MPI_SUM, b0_loc_norm);
-
-        // Normalize b0
-        b0_norm = 1 / sqrt(b0_norm);
-#pragma omp parallel for
-        for(ptrdiff_t i = 0; i < n; ++i) {
-            b0[i] = b0_norm * b0[i];
-        }
-
-        std::vector<rhs_type> b0_send(C.send.count());
-        std::vector<rhs_type> b0_recv(C.recv.count());
-
-        for(size_t i = 0, m = C.send.count(); i < m; ++i)
-            b0_send[i] = b0[C.send.col[i]];
-        C.exchange(b0_send.data(), b0_recv.data());
-
-        for(int iter = 0; iter < power_iters;) {
-            // b1 = (D * A) * b0
-            // b1_norm = ||b1||
-            // radius = <b1,b0>
-            scalar_type b1_loc_norm = 0;
-            scalar_type loc_radius = 0;
-
-#pragma omp parallel
-            {
-                scalar_type t_norm = 0;
-                scalar_type t_radi = 0;
-                value_type  dia = math::identity<value_type>();
-
-#pragma omp for nowait
-                for(ptrdiff_t i = 0; i < n; ++i) {
-                    rhs_type s = math::zero<rhs_type>();
-
-                    for(ptrdiff_t j = A_loc.ptr[i], e = A_loc.ptr[i+1]; j < e; ++j) {
-                        ptrdiff_t  c = A_loc.col[j];
-                        value_type v = A_loc.val[j];
-                        if (scale && c == i) dia = v;
-                        s += v * b0[c];
-                    }
-
-                    for(ptrdiff_t j = A_rem.ptr[i], e = A_rem.ptr[i+1]; j < e; ++j)
-                        s += A_rem.val[j] * b0_recv[rem_col[j]];
-
-                    if (scale) s = math::inverse(dia) * s;
-
-                    t_norm += math::norm(math::inner_product(s, s));
-                    t_radi += math::norm(math::inner_product(s, b0[i]));
-
-                    b1[i] = s;
-                }
-
-#pragma omp critical
-                {
-                    b1_loc_norm += t_norm;
-                    loc_radius  += t_radi;
-                }
-            }
-
-            radius = comm.reduce(MPI_SUM, loc_radius);
-
-            if (++iter < power_iters) {
-                scalar_type b1_norm;
-                b1_norm = comm.reduce(MPI_SUM, b1_loc_norm);
-
-                // b0 = b1 / b1_norm
-                b1_norm = 1 / sqrt(b1_norm);
-#pragma omp parallel for
-                for(ptrdiff_t i = 0; i < n; ++i) {
-                    b0[i] = b1_norm * b1[i];
-                }
-
-                for(size_t i = 0, m = C.send.count(); i < m; ++i)
-                    b0_send[i] = b0[C.send.col[i]];
-                C.exchange(b0_send.data(), b0_recv.data());
-            }
-        }
-    }
-    AMGCL_TOC("spectral radius");
-
-    return radius < 0 ? static_cast<scalar_type>(2) : radius;
-}
-} // namespace backend
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/mpi/inner_product.hpp b/src/solvers/amgcl/mpi/inner_product.hpp
deleted file mode 100644
index ee2383d..0000000
--- a/src/solvers/amgcl/mpi/inner_product.hpp
+++ /dev/null
@@ -1,72 +0,0 @@
-#ifndef AMGCL_MPI_INNER_PRODUCT_HPP
-#define AMGCL_MPI_INNER_PRODUCT_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/mpi/inner_product.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Inner product for distributed vectors.
- */
-
-#include <mpi.h>
-
-#include <amgcl/backend/builtin.hpp>
-#include <amgcl/value_type/interface.hpp>
-#include <amgcl/mpi/util.hpp>
-#include <amgcl/util.hpp>
-
-namespace amgcl {
-namespace mpi {
-
-struct inner_product {
-    communicator comm;
-
-    inner_product(communicator comm) : comm(comm) {}
-
-    template <class Vec1, class Vec2>
-    typename math::inner_product_impl<
-        typename backend::value_type<Vec1>::type
-        >::return_type
-    operator()(const Vec1 &x, const Vec2 &y) const {
-        typedef typename backend::value_type<Vec1>::type value_type;
-        typedef typename math::inner_product_impl<value_type>::return_type coef_type;
-
-        AMGCL_TIC("inner product");
-        coef_type sum = comm.reduce(MPI_SUM, backend::inner_product(x, y));
-        AMGCL_TOC("inner product");
-
-        return sum;
-    }
-
-    int rank() const {
-        return comm.rank;
-    }
-};
-
-} // namespace mpi
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/mpi/make_solver.hpp b/src/solvers/amgcl/mpi/make_solver.hpp
deleted file mode 100644
index f41ee10..0000000
--- a/src/solvers/amgcl/mpi/make_solver.hpp
+++ /dev/null
@@ -1,196 +0,0 @@
-#ifndef AMGCL_MPI_MAKE_SOLVER_HPP
-#define AMGCL_MPI_MAKE_SOLVER_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/mpi/block_preconditioner.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Iterative solver wrapper for distributed linear systmes.
- */
-
-#include <iostream>
-
-#include <boost/property_tree/ptree.hpp>
-#include <memory>
-
-#include <mpi.h>
-
-#include <amgcl/util.hpp>
-#include <amgcl/mpi/inner_product.hpp>
-#include <amgcl/mpi/distributed_matrix.hpp>
-
-namespace amgcl {
-namespace mpi {
-
-template <
-    class Precond,
-    class IterativeSolver
-    >
-class make_solver : public amgcl::detail::non_copyable {
-    static_assert(
-            backend::backends_compatible<
-                typename IterativeSolver::backend_type,
-                typename Precond::backend_type
-            >::value,
-            "Backends for preconditioner and iterative solver should be compatible"
-            );
-    public:
-        typedef typename IterativeSolver::backend_type backend_type;
-        typedef amgcl::mpi::distributed_matrix<typename Precond::backend_type> matrix;
-        typedef typename backend_type::value_type value_type;
-        typedef typename backend_type::params backend_params;
-        typedef typename backend::builtin<value_type>::matrix build_matrix;
-        typedef typename math::scalar_of<value_type>::type scalar_type;
-
-        struct params {
-            typename Precond::params precond; ///< Preconditioner parameters.
-            typename IterativeSolver::params  solver;  ///< Iterative solver parameters.
-
-            params() {}
-
-#ifndef AMGCL_NO_BOOST
-            params(const boost::property_tree::ptree &p)
-                : AMGCL_PARAMS_IMPORT_CHILD(p, precond),
-                  AMGCL_PARAMS_IMPORT_CHILD(p, solver)
-            {
-                check_params(p, {"precond", "solver"});
-            }
-
-            void get(boost::property_tree::ptree &p, const std::string &path = "") const
-            {
-                AMGCL_PARAMS_EXPORT_CHILD(p, path, precond);
-                AMGCL_PARAMS_EXPORT_CHILD(p, path, solver);
-            }
-#endif
-        } prm;
-
-        template <class Matrix>
-        make_solver(
-                communicator comm, const Matrix &A,
-                const params &prm = params(),
-                const backend_params &bprm = backend_params()
-                ) :
-            prm(prm), n(backend::rows(A)),
-            P(comm, A, prm.precond, bprm),
-            S(backend::rows(A), prm.solver, bprm, mpi::inner_product(comm))
-        {}
-
-        make_solver(
-                communicator comm, std::shared_ptr<matrix> A,
-                const params &prm = params(),
-                const backend_params &bprm = backend_params()
-                ) :
-            prm(prm), n(A->loc_rows()),
-            P(comm, A, prm.precond, bprm),
-            S(n, prm.solver, bprm, mpi::inner_product(comm))
-        {
-        }
-
-        template <class Backend>
-        make_solver(
-                communicator comm, std::shared_ptr<distributed_matrix<Backend>> A,
-                const params &prm = params(),
-                const backend_params &bprm = backend_params()
-                ) :
-            prm(prm), n(A->loc_rows()),
-            P(comm, std::make_shared<matrix>(*A), prm.precond, bprm),
-            S(n, prm.solver, bprm, mpi::inner_product(comm))
-        {
-            A->move_to_backend(bprm);
-        }
-
-        make_solver(
-                communicator comm, std::shared_ptr<build_matrix> A,
-                const params &prm = params(),
-                const backend_params &bprm = backend_params()
-                ) :
-            prm(prm), n(backend::rows(*A)),
-            P(comm, A, prm.precond, bprm),
-            S(backend::rows(*A), prm.solver, bprm, mpi::inner_product(comm))
-        {}
-
-        template <class Matrix, class Vec1, class Vec2>
-        std::tuple<size_t, scalar_type> operator()(
-                const Matrix &A, const Vec1 &rhs, Vec2 &&x) const
-        {
-            return S(A, P, rhs, x);
-        }
-
-        template <class Vec1, class Vec2>
-        std::tuple<size_t, scalar_type> operator()(const Vec1 &rhs, Vec2 &&x) const {
-            return S(P, rhs, x);
-        }
-
-        template <class Vec1, class Vec2>
-        void apply(const Vec1 &rhs, Vec2 &&x) const {
-            backend::clear(x);
-            (*this)(rhs, x);
-        }
-
-        const Precond& precond() const {
-            return P;
-        }
-
-        Precond& precond() {
-            return P;
-        }
-
-        const IterativeSolver& solver() const {
-            return S;
-        }
-
-        std::shared_ptr<matrix> system_matrix_ptr() const {
-            return P.system_matrix_ptr();
-        }
-
-        const matrix& system_matrix() const {
-            return P.system_matrix();
-        }
-
-#ifndef AMGCL_NO_BOOST
-        void get_params(boost::property_tree::ptree &p) const {
-            prm.get(p);
-        }
-#endif
-
-        size_t size() const {
-            return n;
-        }
-
-        friend std::ostream& operator<<(std::ostream &os, const make_solver &M) {
-            return os << M.S << std::endl << M.P;
-        }
-    private:
-        size_t n;
-
-        Precond P;
-        IterativeSolver  S;
-};
-
-} // namespace mpi
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/mpi/partition/merge.hpp b/src/solvers/amgcl/mpi/partition/merge.hpp
deleted file mode 100644
index b472315..0000000
--- a/src/solvers/amgcl/mpi/partition/merge.hpp
+++ /dev/null
@@ -1,143 +0,0 @@
-#ifndef AMGCL_MPI_REPARTITION_MERGE_HPP
-#define AMGCL_MPI_REPARTITION_MERGE_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/mpi/partition/merge.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Dummy partitioner (merges consecutive domains together).
- */
-
-#include <memory>
-
-#include <amgcl/backend/interface.hpp>
-#include <amgcl/value_type/interface.hpp>
-#include <amgcl/mpi/util.hpp>
-#include <amgcl/mpi/distributed_matrix.hpp>
-#include <amgcl/mpi/partition/util.hpp>
-
-namespace amgcl {
-namespace mpi {
-namespace partition {
-
-template <class Backend>
-struct merge {
-    typedef typename Backend::value_type value_type;
-    typedef distributed_matrix<Backend>  matrix;
-
-    struct params {
-        bool      enable;
-        ptrdiff_t min_per_proc;
-        int       shrink_ratio;
-
-        params() :
-            enable(false), min_per_proc(10000), shrink_ratio(8)
-        {}
-
-#ifndef AMGCL_NO_BOOST
-        params(const boost::property_tree::ptree &p)
-            : AMGCL_PARAMS_IMPORT_VALUE(p, enable),
-              AMGCL_PARAMS_IMPORT_VALUE(p, min_per_proc),
-              AMGCL_PARAMS_IMPORT_VALUE(p, shrink_ratio)
-        {
-            check_params(p, {"enable", "min_per_proc", "shrink_ratio"});
-        }
-
-        void get(
-                boost::property_tree::ptree &p,
-                const std::string &path = ""
-                ) const
-        {
-            AMGCL_PARAMS_EXPORT_VALUE(p, path, enable);
-            AMGCL_PARAMS_EXPORT_VALUE(p, path, min_per_proc);
-            AMGCL_PARAMS_EXPORT_VALUE(p, path, shrink_ratio);
-        }
-#endif
-    } prm;
-
-    merge(const params &prm = params()) : prm(prm) {}
-
-    bool is_needed(const matrix &A) const {
-        if (!prm.enable) return false;
-
-        communicator comm = A.comm();
-        ptrdiff_t n = A.loc_rows();
-        std::vector<ptrdiff_t> row_dom = comm.exclusive_sum(n);
-
-        int non_empty = 0;
-        ptrdiff_t min_n = std::numeric_limits<ptrdiff_t>::max();
-        for(int i = 0; i < comm.size; ++i) {
-            ptrdiff_t m = row_dom[i+1] - row_dom[i];
-            if (m) {
-                min_n = std::min(min_n, m);
-                ++non_empty;
-            }
-        }
-
-        return (non_empty > 1) && (min_n <= prm.min_per_proc);
-    }
-
-    std::shared_ptr<matrix> operator()(const matrix &A, unsigned /*block_size*/ = 1) const {
-        communicator comm = A.comm();
-        ptrdiff_t nrows = A.loc_rows();
-
-        std::vector<ptrdiff_t> row_dom = comm.exclusive_sum(nrows);
-        std::vector<ptrdiff_t> col_dom(comm.size + 1);
-
-        for(int i = 0; i <= comm.size; ++i)
-            col_dom[i] = row_dom[std::min<int>(i * prm.shrink_ratio, comm.size)];
-
-        int old_domains = 0;
-        int new_domains = 0;
-
-        for(int i = 0; i < comm.size; ++i) {
-            if (row_dom[i+1] > row_dom[i]) ++old_domains;
-            if (col_dom[i+1] > col_dom[i]) ++new_domains;
-        }
-
-        if (comm.rank == 0)
-            std::cout << "Partitioning[MERGE] " << old_domains << " -> " << new_domains << std::endl;
-
-        ptrdiff_t row_beg = row_dom[comm.rank];
-        ptrdiff_t col_beg = col_dom[comm.rank];
-        ptrdiff_t col_end = col_dom[comm.rank + 1];
-
-        std::vector<ptrdiff_t> perm(nrows);
-        for(ptrdiff_t i = 0; i < nrows; ++i) {
-            perm[i] = i + row_beg;
-        }
-
-        return graph_perm_matrix<Backend>(comm, col_beg, col_end, perm);
-    }
-
-};
-
-
-} // namespace partition
-} // namespace mpi
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/mpi/partition/parmetis.hpp b/src/solvers/amgcl/mpi/partition/parmetis.hpp
deleted file mode 100644
index 5e002ec..0000000
--- a/src/solvers/amgcl/mpi/partition/parmetis.hpp
+++ /dev/null
@@ -1,214 +0,0 @@
-#ifndef AMGCL_MPI_REPARTITION_PARMETIS_HPP
-#define AMGCL_MPI_REPARTITION_PARMETIS_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/mpi/partition/parmetis.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  ParMETIS partitioner.
- */
-
-#include <memory>
-
-#include <amgcl/backend/interface.hpp>
-#include <amgcl/value_type/interface.hpp>
-#include <amgcl/mpi/util.hpp>
-#include <amgcl/mpi/distributed_matrix.hpp>
-#include <amgcl/mpi/partition/util.hpp>
-
-#include <parmetis.h>
-
-namespace amgcl {
-namespace mpi {
-namespace partition {
-
-template <class Backend>
-struct parmetis {
-    typedef typename Backend::value_type value_type;
-    typedef distributed_matrix<Backend>  matrix;
-
-    struct params {
-        bool      shrink;
-        ptrdiff_t min_per_proc;
-        int       shrink_ratio;
-
-        params() :
-            shrink(false), min_per_proc(10000), shrink_ratio(8)
-        {}
-
-#ifndef AMGCL_NO_BOOST
-        params(const boost::property_tree::ptree &p)
-            : AMGCL_PARAMS_IMPORT_VALUE(p, shrink),
-              AMGCL_PARAMS_IMPORT_VALUE(p, min_per_proc),
-              AMGCL_PARAMS_IMPORT_VALUE(p, shrink_ratio)
-        {
-            check_params(p, {"shrink", "min_per_proc", "shrink_ratio"});
-        }
-
-        void get(
-                boost::property_tree::ptree &p,
-                const std::string &path = ""
-                ) const
-        {
-            AMGCL_PARAMS_EXPORT_VALUE(p, path, shrink);
-            AMGCL_PARAMS_EXPORT_VALUE(p, path, min_per_proc);
-            AMGCL_PARAMS_EXPORT_VALUE(p, path, shrink_ratio);
-        }
-#endif
-    } prm;
-
-    parmetis(const params &prm = params()) : prm(prm) {}
-
-    bool is_needed(const matrix &A) const {
-        if (!prm.shrink) return false;
-
-        communicator comm = A.comm();
-        ptrdiff_t n = A.loc_rows();
-        std::vector<ptrdiff_t> row_dom = comm.exclusive_sum(n);
-
-        int non_empty = 0;
-        ptrdiff_t min_n = std::numeric_limits<ptrdiff_t>::max();
-        for(int i = 0; i < comm.size; ++i) {
-            ptrdiff_t m = row_dom[i+1] - row_dom[i];
-            if (m) {
-                min_n = std::min(min_n, m);
-                ++non_empty;
-            }
-        }
-
-        return (non_empty > 1) && (min_n <= prm.min_per_proc);
-    }
-
-    std::shared_ptr<matrix> operator()(const matrix &A, unsigned block_size = 1) const {
-        communicator comm = A.comm();
-        idx_t n = A.loc_rows();
-        ptrdiff_t row_beg = A.loc_col_shift();
-
-        // Partition the graph.
-        int active = (n > 0);
-        int active_ranks = comm.reduce(MPI_SUM, active);
-        int shrink = prm.shrink ? prm.shrink_ratio : 1;
-
-        idx_t npart = std::max(1, active_ranks / shrink);
-
-        if (comm.rank == 0)
-            std::cout << "Partitioning[ParMETIS] " << active_ranks << " -> " << npart << std::endl;
-
-
-        std::vector<ptrdiff_t> perm(n);
-        ptrdiff_t col_beg, col_end;
-
-        if (npart == 1) {
-            col_beg = (comm.rank == 0) ? 0 : A.glob_rows();
-            col_end = A.glob_rows();
-
-            for(ptrdiff_t i = 0; i < n; ++i) {
-                perm[i] = row_beg + i;
-            }
-        } else {
-            if (block_size == 1) {
-                std::tie(col_beg, col_end) = partition(A, npart, perm);
-            } else {
-                typedef typename math::scalar_of<value_type>::type scalar;
-                typedef backend::builtin<scalar> sbackend;
-                ptrdiff_t np = n / block_size;
-
-                distributed_matrix<sbackend> A_pw(A.comm(),
-                    pointwise_matrix(*A.local(),  block_size),
-                    pointwise_matrix(*A.remote(), block_size)
-                    );
-
-                std::vector<ptrdiff_t> perm_pw(np);
-
-                std::tie(col_beg, col_end) = partition(A_pw, npart, perm_pw);
-
-                col_beg *= block_size;
-                col_end *= block_size;
-
-                for(ptrdiff_t ip = 0; ip < np; ++ip) {
-                    ptrdiff_t i = ip * block_size;
-                    ptrdiff_t j = perm_pw[ip] * block_size;
-
-                    for(unsigned k = 0; k < block_size; ++k)
-                        perm[i + k] = j + k;
-                }
-            }
-        }
-
-        return graph_perm_matrix<Backend>(comm, col_beg, col_end, perm);
-    }
-
-    template <class B>
-    std::tuple<ptrdiff_t, ptrdiff_t>
-    partition(const distributed_matrix<B> &A, idx_t npart, std::vector<ptrdiff_t> &perm) const {
-        communicator comm = A.comm();
-        idx_t n = A.loc_rows();
-        int active = (n > 0);
-
-        std::vector<idx_t> ptr;
-        std::vector<idx_t> col;
-
-        symm_graph(A, ptr, col);
-
-        idx_t wgtflag = 0;
-        idx_t numflag = 0;
-        idx_t options = 0;
-        idx_t edgecut = 0;
-        idx_t ncon    = 1;
-
-        std::vector<real_t> tpwgts(npart, 1.0 / npart);
-        std::vector<real_t> ubvec(ncon, 1.05);
-        std::vector<idx_t>  part(n);
-        if (!n) part.reserve(1); // So that part.data() is not NULL
-
-        MPI_Comm scomm;
-        MPI_Comm_split(comm, active ? 0 : MPI_UNDEFINED, comm.rank, &scomm);
-
-        if (active) {
-            communicator sc(scomm);
-            std::vector<idx_t> vtxdist = sc.exclusive_sum(n);
-
-            sc.check(
-                    METIS_OK == ParMETIS_V3_PartKway( &vtxdist[0], &ptr[0],
-                        &col[0], NULL, NULL, &wgtflag, &numflag, &ncon,
-                        &npart, &tpwgts[0], &ubvec[0], &options, &edgecut,
-                        &part[0], &scomm),
-                    "Error in ParMETIS"
-                    );
-
-            MPI_Comm_free(&scomm);
-        }
-
-        return graph_perm_index(comm, npart, part, perm);
-    }
-};
-
-
-} // namespace partition
-} // namespace mpi
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/mpi/partition/ptscotch.hpp b/src/solvers/amgcl/mpi/partition/ptscotch.hpp
deleted file mode 100644
index b2f47cb..0000000
--- a/src/solvers/amgcl/mpi/partition/ptscotch.hpp
+++ /dev/null
@@ -1,216 +0,0 @@
-#ifndef AMGCL_MPI_REPARTITION_PTSCOTCH_HPP
-#define AMGCL_MPI_REPARTITION_PTSCOTCH_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/mpi/partition/ptscotch.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  PT-SCOTCH partitioner.
- */
-
-#include <memory>
-
-#include <amgcl/backend/interface.hpp>
-#include <amgcl/value_type/interface.hpp>
-#include <amgcl/mpi/util.hpp>
-#include <amgcl/mpi/distributed_matrix.hpp>
-#include <amgcl/mpi/partition/util.hpp>
-
-#include <ptscotch.h>
-
-namespace amgcl {
-namespace mpi {
-namespace partition {
-
-template <class Backend>
-struct ptscotch {
-    typedef typename Backend::value_type value_type;
-    typedef distributed_matrix<Backend>  matrix;
-
-    struct params {
-        bool      shrink;
-        ptrdiff_t min_per_proc;
-        int       shrink_ratio;
-
-        params() :
-            shrink(false), min_per_proc(10000), shrink_ratio(8)
-        {}
-
-#ifndef AMGCL_NO_BOOST
-        params(const boost::property_tree::ptree &p)
-            : AMGCL_PARAMS_IMPORT_VALUE(p, shrink),
-              AMGCL_PARAMS_IMPORT_VALUE(p, min_per_proc),
-              AMGCL_PARAMS_IMPORT_VALUE(p, shrink_ratio)
-        {
-            check_params(p, {"shrink", "min_per_proc", "shrink_ratio"});
-        }
-
-        void get(
-                boost::property_tree::ptree &p,
-                const std::string &path = ""
-                ) const
-        {
-            AMGCL_PARAMS_EXPORT_VALUE(p, path, shrink);
-            AMGCL_PARAMS_EXPORT_VALUE(p, path, min_per_proc);
-            AMGCL_PARAMS_EXPORT_VALUE(p, path, shrink_ratio);
-        }
-#endif
-    } prm;
-
-    ptscotch(const params &prm = params()) : prm(prm) {}
-
-    bool is_needed(const matrix &A) const {
-        if (!prm.shrink) return false;
-
-        communicator comm = A.comm();
-        ptrdiff_t n = A.loc_rows();
-        std::vector<ptrdiff_t> row_dom = comm.exclusive_sum(n);
-
-        int non_empty = 0;
-        ptrdiff_t min_n = std::numeric_limits<ptrdiff_t>::max();
-        for(int i = 0; i < comm.size; ++i) {
-            ptrdiff_t m = row_dom[i+1] - row_dom[i];
-            if (m) {
-                min_n = std::min(min_n, m);
-                ++non_empty;
-            }
-        }
-
-        return (non_empty > 1) && (min_n <= prm.min_per_proc);
-    }
-
-    std::shared_ptr<matrix> operator()(const matrix &A, unsigned block_size = 1) const {
-        communicator comm = A.comm();
-        ptrdiff_t n = A.loc_rows();
-        ptrdiff_t row_beg = A.loc_col_shift();
-
-        // Partition the graph.
-        int active = (n > 0);
-        int active_ranks = comm.reduce(MPI_SUM, active);
-        int shrink = prm.shrink ? prm.shrink_ratio : 1;
-
-        SCOTCH_Num npart = std::max(1, active_ranks / shrink);
-
-        if (comm.rank == 0)
-            std::cout << "Partitioning[PT-Scotch] " << active_ranks << " -> " << npart << std::endl;
-
-        std::vector<ptrdiff_t> perm(n);
-        ptrdiff_t col_beg, col_end;
-
-        if (npart == 1) {
-            col_beg = (comm.rank == 0) ? 0 : A.glob_rows();
-            col_end = A.glob_rows();
-
-            for(ptrdiff_t i = 0; i < n; ++i) {
-                perm[i] = row_beg + i;
-            }
-        } else {
-            if (block_size == 1) {
-                std::tie(col_beg, col_end) = partition(A, npart, perm);
-            } else {
-                typedef typename math::scalar_of<value_type>::type scalar;
-                typedef backend::builtin<scalar> sbackend;
-
-                ptrdiff_t np = n / block_size;
-
-                distributed_matrix<sbackend> A_pw(A.comm(),
-                    pointwise_matrix(*A.local(),  block_size),
-                    pointwise_matrix(*A.remote(), block_size)
-                    );
-
-                std::vector<ptrdiff_t> perm_pw(np);
-
-                std::tie(col_beg, col_end) = partition(A_pw, npart, perm_pw);
-
-                col_beg *= block_size;
-                col_end *= block_size;
-
-                for(ptrdiff_t ip = 0; ip < np; ++ip) {
-                    ptrdiff_t i = ip * block_size;
-                    ptrdiff_t j = perm_pw[ip] * block_size;
-
-                    for(unsigned k = 0; k < block_size; ++k)
-                        perm[i + k] = j + k;
-                }
-            }
-        }
-
-        return graph_perm_matrix<Backend>(comm, col_beg, col_end, perm);
-    }
-
-    static void check(communicator comm, int ierr) {
-        comm.check(ierr == 0, "SCOTCH error");
-    }
-
-    template <class B>
-    std::tuple<ptrdiff_t, ptrdiff_t>
-    partition(const distributed_matrix<B> &A, SCOTCH_Num npart, std::vector<ptrdiff_t> &perm) const {
-        communicator comm = A.comm();
-        ptrdiff_t n = A.loc_rows();
-
-        std::vector<SCOTCH_Num> ptr;
-        std::vector<SCOTCH_Num> col;
-        std::vector<SCOTCH_Num> part(n);
-        if (!n) part.reserve(1); // So that part.data() is not NULL
-
-        symm_graph(A, ptr, col);
-
-        SCOTCH_Dgraph G;
-        check(comm, SCOTCH_dgraphInit(&G, comm));
-        check(comm, SCOTCH_dgraphBuild(&G,
-                    0,          // baseval
-                    n,          // vertlocnbr
-                    n,          // vertlocmax
-                    &ptr[0],    // vertloctab
-                    NULL,       // vendloctab
-                    NULL,       // veloloctab
-                    NULL,       // vlblloctab
-                    ptr.back(), // edgelocnbr
-                    ptr.back(), // edgelocsiz
-                    &col[0],    // edgeloctab
-                    NULL,       // edgegsttab
-                    NULL        // edloloctab
-                    ));
-        check(comm, SCOTCH_dgraphCheck(&G));
-
-        SCOTCH_Strat S;
-        check(comm, SCOTCH_stratInit(&S));
-
-        check(comm, SCOTCH_dgraphPart(&G, npart, &S, &part[0]));
-
-        SCOTCH_stratExit(&S);
-        SCOTCH_dgraphExit(&G);
-
-        return graph_perm_index(comm, npart, part, perm);
-    }
-};
-
-
-} // namespace partition
-} // namespace mpi
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/mpi/partition/runtime.hpp b/src/solvers/amgcl/mpi/partition/runtime.hpp
deleted file mode 100644
index c593b21..0000000
--- a/src/solvers/amgcl/mpi/partition/runtime.hpp
+++ /dev/null
@@ -1,248 +0,0 @@
-#ifndef AMGCL_MPI_REPARTITION_RUNTIME_HPP
-#define AMGCL_MPI_REPARTITION_RUNTIME_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/mpi/partition/runtime.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Runtime wrapper for distributed partitioners.
- */
-
-#include <memory>
-
-#ifdef AMGCL_NO_BOOST
-#  error Runtime interface relies on Boost.PropertyTree!
-#endif
-
-#include <boost/property_tree/ptree.hpp>
-
-#include <amgcl/util.hpp>
-#include <amgcl/mpi/partition/merge.hpp>
-#ifdef AMGCL_HAVE_SCOTCH
-#  include <amgcl/mpi/partition/ptscotch.hpp>
-#endif
-#ifdef AMGCL_HAVE_PARMETIS
-#  include <amgcl/mpi/partition/parmetis.hpp>
-#endif
-
-namespace amgcl {
-namespace runtime {
-namespace mpi {
-namespace partition {
-
-enum type {
-    merge
-#ifdef AMGCL_HAVE_SCOTCH
-  , ptscotch
-#endif
-#ifdef AMGCL_HAVE_PARMETIS
-  , parmetis
-#endif
-};
-
-inline std::ostream& operator<<(std::ostream &os, type s)
-{
-    switch (s) {
-        case merge:
-            return os << "merge";
-#ifdef AMGCL_HAVE_SCOTCH
-        case ptscotch:
-            return os << "ptscotch";
-#endif
-#ifdef AMGCL_HAVE_PARMETIS
-        case parmetis:
-            return os << "parmetis";
-#endif
-        default:
-            return os << "???";
-    }
-}
-
-inline std::istream& operator>>(std::istream &in, type &s)
-{
-    std::string val;
-    in >> val;
-
-    if (val == "merge")
-        s = merge;
-#ifdef AMGCL_HAVE_SCOTCH
-    else if (val == "ptscotch")
-        s = ptscotch;
-#endif
-#ifdef AMGCL_HAVE_PARMETIS
-    else if (val == "parmetis")
-        s = parmetis;
-#endif
-    else
-        throw std::invalid_argument("Invalid partitioner value. Valid choices are: "
-                "merge"
-#ifdef AMGCL_HAVE_SCOTCH
-                ", ptscotch"
-#endif
-#ifdef AMGCL_HAVE_PARMETIS
-                ", parmetis"
-#endif
-                ".");
-
-    return in;
-}
-
-template <class Backend>
-struct wrapper {
-    typedef amgcl::mpi::distributed_matrix<Backend> matrix;
-    typedef boost::property_tree::ptree params;
-
-    type t;
-    void *handle;
-
-    wrapper(params prm = params()) : t(prm.get("type",
-#if defined(AMGCL_HAVE_SCOTCH)
-                ptscotch
-#elif defined(AMGCL_HAVE_PARMETIS)
-                parmetis
-#else
-                merge
-#endif
-                )), handle(0)
-    {
-        if (!prm.erase("type")) AMGCL_PARAM_MISSING("type");
-
-        switch (t) {
-            case merge:
-                {
-                    typedef amgcl::mpi::partition::merge<Backend> R;
-                    handle = static_cast<void*>(new R(prm));
-                }
-                break;
-#ifdef AMGCL_HAVE_SCOTCH
-            case ptscotch:
-                {
-                    typedef amgcl::mpi::partition::ptscotch<Backend> R;
-                    handle = static_cast<void*>(new R(prm));
-                }
-                break;
-#endif
-#ifdef AMGCL_HAVE_PARMETIS
-            case parmetis:
-                {
-                    typedef amgcl::mpi::partition::parmetis<Backend> R;
-                    handle = static_cast<void*>(new R(prm));
-                }
-                break;
-#endif
-            default:
-                throw std::invalid_argument("Unsupported partition type");
-        }
-    }
-
-    ~wrapper() {
-        switch(t) {
-            case merge:
-                {
-                    typedef amgcl::mpi::partition::merge<Backend> R;
-                    delete static_cast<R*>(handle);
-                }
-                break;
-#ifdef AMGCL_HAVE_SCOTCH
-            case ptscotch:
-                {
-                    typedef amgcl::mpi::partition::ptscotch<Backend> R;
-                    delete static_cast<R*>(handle);
-                }
-                break;
-#endif
-#ifdef AMGCL_HAVE_PARMETIS
-            case parmetis:
-                {
-                    typedef amgcl::mpi::partition::parmetis<Backend> R;
-                    delete static_cast<R*>(handle);
-                }
-                break;
-#endif
-            default:
-                break;
-        }
-    }
-
-    bool is_needed(const matrix &A) const {
-        switch (t) {
-            case merge:
-                {
-                    typedef amgcl::mpi::partition::merge<Backend> R;
-                    return static_cast<const R*>(handle)->is_needed(A);
-                }
-#ifdef AMGCL_HAVE_SCOTCH
-            case ptscotch:
-                {
-                    typedef amgcl::mpi::partition::ptscotch<Backend> R;
-                    return static_cast<const R*>(handle)->is_needed(A);
-                }
-#endif
-#ifdef AMGCL_HAVE_PARMETIS
-            case parmetis:
-                {
-                    typedef amgcl::mpi::partition::parmetis<Backend> R;
-                    return static_cast<const R*>(handle)->is_needed(A);
-                }
-#endif
-            default:
-                throw std::invalid_argument("Unsupported partition type");
-        }
-    }
-
-    std::shared_ptr<matrix> operator()(const matrix &A, unsigned block_size = 1) const {
-        switch (t) {
-            case merge:
-                {
-                    typedef amgcl::mpi::partition::merge<Backend> R;
-                    return static_cast<const R*>(handle)->operator()(A, block_size);
-                }
-#ifdef AMGCL_HAVE_SCOTCH
-            case ptscotch:
-                {
-                    typedef amgcl::mpi::partition::ptscotch<Backend> R;
-                    return static_cast<const R*>(handle)->operator()(A, block_size);
-                }
-#endif
-#ifdef AMGCL_HAVE_PARMETIS
-            case parmetis:
-                {
-                    typedef amgcl::mpi::partition::parmetis<Backend> R;
-                    return static_cast<const R*>(handle)->operator()(A, block_size);
-                }
-#endif
-            default:
-                throw std::invalid_argument("Unsupported partition type");
-        }
-    }
-};
-
-} // namespace partition
-} // namespace mpi
-} // namespace runtime
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/mpi/partition/util.hpp b/src/solvers/amgcl/mpi/partition/util.hpp
deleted file mode 100644
index 48ba60c..0000000
--- a/src/solvers/amgcl/mpi/partition/util.hpp
+++ /dev/null
@@ -1,324 +0,0 @@
-#ifndef AMGCL_MPI_REPARTITION_UTIL_HPP
-#define AMGCL_MPI_REPARTITION_UTIL_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/mpi/partition/util.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Repartitioning utils
- */
-
-#include <vector>
-#include <algorithm>
-#include <numeric>
-
-#include <tuple>
-
-#include <amgcl/backend/interface.hpp>
-#include <amgcl/value_type/interface.hpp>
-#include <amgcl/mpi/util.hpp>
-#include <amgcl/mpi/distributed_matrix.hpp>
-
-namespace amgcl {
-namespace mpi {
-namespace partition {
-
-/// Builds the sparsity graph of A merged with that of transpose(A), in CRS form.
-/**
- * \param A   Distributed matrix. Although taken by const reference, the
- *            column/value arrays of its local and remote parts are sorted
- *            in place, row by row.
- * \param ptr Output row pointers; resized to (local rows + 1).
- * \param col Output column indices; resized to the number of graph edges.
- *
- * For every local row the sorted column lists of A and of transpose(A) are
- * merged, so that a column present in both is emitted once. Entries of the
- * local parts whose column equals the row index are dropped, and the kept
- * local columns are shifted by A.loc_col_shift(). Columns of the remote
- * parts are copied as stored.
- * NOTE(review): remote columns are presumably already global indices at
- * this point -- confirm against distributed_matrix.
- */
-template <class Backend, class Ptr, class Col>
-void symm_graph(const distributed_matrix<Backend> &A,
-        std::vector<Ptr> &ptr, std::vector<Col> &col)
-{
-    typedef typename Backend::value_type value_type;
-    typedef backend::crs<value_type> build_matrix;
-
-    AMGCL_TIC("symm graph");
-
-    // Non-const references: the rows of both parts are sorted in place below.
-    build_matrix &A_loc = *A.local();
-    build_matrix &A_rem = *A.remote();
-
-    ptrdiff_t n = A_loc.nrows;
-    ptrdiff_t row_beg = A.loc_col_shift();
-
-    auto T = transpose(A);
-
-    build_matrix &T_loc = *T->local();
-    build_matrix &T_rem = *T->remote();
-
-    // Build symmetric graph
-    // NOTE(review): resize() only value-initializes newly added elements;
-    // ptr[0] is never assigned below, so a non-empty ptr with ptr[0] != 0
-    // on entry would offset the prefix sum. Callers presumably pass an
-    // empty vector -- confirm.
-    ptr.resize(n + 1, 0);
-
-    // Pass 1: sort the rows and count the merged entries of every row.
-#pragma omp parallel for
-    for(ptrdiff_t i = 0; i < n; ++i) {
-        using amgcl::detail::sort_row;
-
-        ptrdiff_t A_loc_beg = A_loc.ptr[i];
-        ptrdiff_t A_loc_end = A_loc.ptr[i+1];
-
-        ptrdiff_t A_rem_beg = A_rem.ptr[i];
-        ptrdiff_t A_rem_end = A_rem.ptr[i+1];
-
-        ptrdiff_t T_loc_beg = T_loc.ptr[i];
-        ptrdiff_t T_loc_end = T_loc.ptr[i+1];
-
-        ptrdiff_t T_rem_beg = T_rem.ptr[i];
-        ptrdiff_t T_rem_end = T_rem.ptr[i+1];
-
-        // The two-pointer merges below (in both passes) require every row
-        // to be sorted by column.
-        sort_row(A_loc.col + A_loc_beg, A_loc.val + A_loc_beg, A_loc_end - A_loc_beg);
-        sort_row(A_rem.col + A_rem_beg, A_rem.val + A_rem_beg, A_rem_end - A_rem_beg);
-
-        sort_row(T_loc.col + T_loc_beg, T_loc.val + T_loc_beg, T_loc_end - T_loc_beg);
-        sort_row(T_rem.col + T_rem_beg, T_rem.val + T_rem_beg, T_rem_end - T_rem_beg);
-
-        Ptr row_width = 0;
-
-        // Merge the local rows of A and T; equal columns advance both
-        // cursors and are counted once.
-        for(ptrdiff_t ja = A_loc_beg, jt = T_loc_beg; ja < A_loc_end || jt < T_loc_end;) {
-            ptrdiff_t c;
-            if (ja == A_loc_end) {
-                c = T_loc.col[jt];
-                ++jt;
-            } else if (jt == T_loc_end) {
-                c = A_loc.col[ja];
-                ++ja;
-            } else {
-                ptrdiff_t ca = A_loc.col[ja];
-                ptrdiff_t ct = T_loc.col[jt];
-                if (ca < ct) {
-                    c = ca;
-                    ++ja;
-                } else if (ca == ct) {
-                    c = ca;
-                    ++ja;
-                    ++jt;
-                } else {
-                    c = ct;
-                    ++jt;
-                }
-            }
-
-            // Entries with column == row (the diagonal) are not counted.
-            if (c != i) ++row_width;
-        }
-
-        // Same merge for the remote rows; every merged entry is counted.
-        for(ptrdiff_t ja = A_rem_beg, jt = T_rem_beg; ja < A_rem_end || jt < T_rem_end;) {
-            if (ja == A_rem_end) {
-                ++jt;
-            } else if (jt == T_rem_end) {
-                ++ja;
-            } else {
-                ptrdiff_t ca = A_rem.col[ja];
-                ptrdiff_t ct = T_rem.col[jt];
-                if (ca < ct) {
-                    ++ja;
-                } else if (ca == ct) {
-                    ++ja;
-                    ++jt;
-                } else {
-                    ++jt;
-                }
-            }
-
-            ++row_width;
-        }
-
-        ptr[i+1] = row_width;
-    }
-
-    // Turn the per-row widths into row offsets.
-    std::partial_sum(ptr.begin(), ptr.end(), ptr.begin());
-
-    col.resize(ptr.back());
-    if (col.empty()) col.reserve(1); // So that col.data() is not NULL
-
-    // Pass 2: repeat the same merges, this time writing the columns.
-#pragma omp parallel for
-    for(ptrdiff_t i = 0; i < n; ++i) {
-        ptrdiff_t A_loc_beg = A_loc.ptr[i];
-        ptrdiff_t A_loc_end = A_loc.ptr[i+1];
-
-        ptrdiff_t A_rem_beg = A_rem.ptr[i];
-        ptrdiff_t A_rem_end = A_rem.ptr[i+1];
-
-        ptrdiff_t T_loc_beg = T_loc.ptr[i];
-        ptrdiff_t T_loc_end = T_loc.ptr[i+1];
-
-        ptrdiff_t T_rem_beg = T_rem.ptr[i];
-        ptrdiff_t T_rem_end = T_rem.ptr[i+1];
-
-        // Write position inside col for the current row.
-        Ptr head = ptr[i];
-
-        for(ptrdiff_t ja = A_loc_beg, jt = T_loc_beg; ja < A_loc_end || jt < T_loc_end;) {
-            ptrdiff_t c;
-            if (ja == A_loc_end) {
-                c = T_loc.col[jt];
-                ++jt;
-            } else if (jt == T_loc_end) {
-                c = A_loc.col[ja];
-                ++ja;
-            } else {
-                ptrdiff_t ca = A_loc.col[ja];
-                ptrdiff_t ct = T_loc.col[jt];
-
-                if (ca < ct) {
-                    c = ca;
-                    ++ja;
-                } else if (ca == ct) {
-                    c = ca;
-                    ++ja;
-                    ++jt;
-                } else {
-                    c = ct;
-                    ++jt;
-                }
-            }
-            // Skip the diagonal; shift the kept local column by row_beg.
-            if (c != i) col[head++] = c + row_beg;
-        }
-
-        // Remote columns are stored without any shift.
-        for(ptrdiff_t ja = A_rem_beg, jt = T_rem_beg; ja < A_rem_end || jt < T_rem_end;) {
-            if (ja == A_rem_end) {
-                col[head] = T_rem.col[jt];
-                ++jt;
-            } else if (jt == T_rem_end) {
-                col[head] = A_rem.col[ja];
-                ++ja;
-            } else {
-                ptrdiff_t ca = A_rem.col[ja];
-                ptrdiff_t ct = T_rem.col[jt];
-
-                if (ca < ct) {
-                    col[head] = ca;
-                    ++ja;
-                } else if (ca == ct) {
-                    col[head] = ca;
-                    ++ja;
-                    ++jt;
-                } else {
-                    col[head] = ct;
-                    ++jt;
-                }
-            }
-            ++head;
-        }
-    }
-
-    AMGCL_TOC("symm graph");
-}
-
-/// Computes the global renumbering induced by a partitioning vector.
-/**
- * \param comm  Communicator used for the two MPI collectives.
- * \param npart Number of partitions; entries of \p part index arrays of
- *              this size.
- * \param part  Partition id of every local row.
- * \param perm  Output, resized to part.size(); perm[i] receives the new
- *              global index of local row i.
- * \return The global partition offsets taken at min(npart, rank) and
- *         min(npart, rank + 1).
- *
- * Rows are numbered partition by partition. Inside one partition the rows
- * of lower ranks come first (exclusive scan of the per-rank counts), and
- * rows of the same rank keep their local order.
- */
-template <class Idx>
-std::tuple<ptrdiff_t, ptrdiff_t> graph_perm_index(
-        communicator comm, int npart, const std::vector<Idx> &part,
-        std::vector<ptrdiff_t> &perm)
-{
-    AMGCL_TIC("perm index");
-
-    const ptrdiff_t nrows = part.size();
-    perm.resize(nrows);
-
-    // How many local rows go to each partition.
-    std::vector<ptrdiff_t> my_count(npart, 0);
-    for(ptrdiff_t i = 0; i < nrows; ++i) ++my_count[part[i]];
-
-    // Rows contributed to each partition by the ranks below this one.
-    // Zero-filled beforehand, so the buffer holds zeros wherever the scan
-    // does not write a result.
-    std::vector<ptrdiff_t> my_shift(npart, 0);
-    MPI_Exscan(&my_count[0], &my_shift[0], npart, datatype<ptrdiff_t>(), MPI_SUM, comm);
-
-    // Total size of each partition over all ranks.
-    std::vector<ptrdiff_t> total_count(npart);
-    MPI_Allreduce(&my_count[0], &total_count[0], npart, datatype<ptrdiff_t>(), MPI_SUM, comm);
-
-    // Global index at which each partition starts.
-    std::vector<ptrdiff_t> part_start(npart + 1);
-    part_start[0] = 0;
-    std::partial_sum(total_count.begin(), total_count.end(), part_start.begin() + 1);
-
-    // next[p] is the global index handed to the next local row of partition p.
-    std::vector<ptrdiff_t> next(npart);
-    for(int p = 0; p < npart; ++p) next[p] = part_start[p] + my_shift[p];
-
-    for(ptrdiff_t i = 0; i < nrows; ++i) perm[i] = next[part[i]]++;
-
-    AMGCL_TOC("perm index");
-
-    const auto lo = std::min(npart, comm.rank);
-    const auto hi = std::min(npart, comm.rank + 1);
-    return std::make_tuple(part_start[lo], part_start[hi]);
-}
-
-/// Assembles the distributed matrix that has a single identity entry per row.
-/**
- * \param comm    Communicator handed to the resulting distributed matrix.
- * \param col_beg First column of the range [col_beg, col_end) that is
- *                stored in the local part.
- * \param col_end One past the last column of that range.
- * \param perm    perm[i] is the column of the only nonzero of row i.
- *
- * A row whose target column lies inside [col_beg, col_end) gets its entry
- * in the local part at column (perm[i] - col_beg); every other row gets it
- * in the remote part at column perm[i].
- */
-template <class Backend, class Idx>
-std::shared_ptr< distributed_matrix<Backend> > graph_perm_matrix(
-        communicator comm, ptrdiff_t col_beg, ptrdiff_t col_end,
-        const std::vector<Idx> &perm)
-{
-    typedef typename Backend::value_type value_type;
-    typedef backend::crs<value_type> build_matrix;
-
-    AMGCL_TIC("perm matrix");
-
-    const ptrdiff_t nrows = perm.size();
-
-    auto loc = std::make_shared<build_matrix>();
-    auto rem = std::make_shared<build_matrix>();
-
-    loc->set_size(nrows, col_end - col_beg, false);
-    rem->set_size(nrows, 0, false);
-
-    loc->ptr[0] = 0;
-    rem->ptr[0] = 0;
-
-    // First pass: record the width (0 or 1) of every row in ptr[row + 1].
-#pragma omp parallel for
-    for(ptrdiff_t row = 0; row < nrows; ++row) {
-        const ptrdiff_t target = perm[row];
-        const bool owned = (col_beg <= target && target < col_end);
-
-        loc->ptr[row+1] = owned ? 1 : 0;
-        rem->ptr[row+1] = owned ? 0 : 1;
-    }
-
-    // NOTE(review): scan_row_sizes() presumably converts the widths into
-    // row offsets and returns the nonzero count -- confirm in backend::crs.
-    loc->set_nonzeros(loc->scan_row_sizes());
-    rem->set_nonzeros(rem->scan_row_sizes());
-
-    // Second pass: write the single entry of every row.
-#pragma omp parallel for
-    for(ptrdiff_t row = 0; row < nrows; ++row) {
-        const ptrdiff_t target = perm[row];
-
-        if (target < col_beg || target >= col_end) {
-            const ptrdiff_t pos = rem->ptr[row];
-            rem->col[pos] = target;
-            rem->val[pos] = math::identity<value_type>();
-        } else {
-            const ptrdiff_t pos = loc->ptr[row];
-            loc->col[pos] = target - col_beg;
-            loc->val[pos] = math::identity<value_type>();
-        }
-    }
-
-    AMGCL_TOC("perm matrix");
-    return std::make_shared< distributed_matrix<Backend> >(comm, loc, rem);
-}
-
-} // namespace partition
-} // namespace mpi
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/mpi/preconditioner.hpp b/src/solvers/amgcl/mpi/preconditioner.hpp
deleted file mode 100644
index 4644167..0000000
--- a/src/solvers/amgcl/mpi/preconditioner.hpp
+++ /dev/null
@@ -1,326 +0,0 @@
-#ifndef AMGCL_MPI_PRECONDITIONER_HPP
-#define AMGCL_MPI_PRECONDITIONER_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/mpi/preconditioner.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Runtime wrapper around mpi preconditioners.
- */
-
-#ifdef AMGCL_NO_BOOST
-#  error Runtime interface relies on Boost.PropertyTree!
-#endif
-
-#include <iostream>
-
-#include <boost/property_tree/ptree.hpp>
-
-#include <amgcl/mpi/amg.hpp>
-#include <amgcl/mpi/coarsening/runtime.hpp>
-#include <amgcl/mpi/relaxation/runtime.hpp>
-#include <amgcl/mpi/direct_solver/runtime.hpp>
-#include <amgcl/mpi/partition/runtime.hpp>
-#include <amgcl/mpi/relaxation/as_preconditioner.hpp>
-#include <amgcl/mpi/distributed_matrix.hpp>
-#include <amgcl/mpi/util.hpp>
-
-namespace amgcl {
-namespace runtime {
-namespace mpi {
-
-/// Kinds of preconditioner that can be selected at runtime.
-namespace precond_class {
-enum type {
-    amg,            ///< AMG
-    relaxation      ///< Single-level relaxation
-};
-
-/// Writes the textual name of \p p, or "???" for a value outside the enum.
-inline std::ostream& operator<<(std::ostream &os, type p) {
-    if (p == amg)        return os << "amg";
-    if (p == relaxation) return os << "relaxation";
-    return os << "???";
-}
-
-/// Reads one whitespace-delimited token and converts it to a preconditioner
-/// kind. Throws std::invalid_argument for any token other than "amg" or
-/// "relaxation"; \p p is left untouched in that case.
-inline std::istream& operator>>(std::istream &in, type &p)
-{
-    std::string name;
-    in >> name;
-
-    if (name == "amg") {
-        p = amg;
-        return in;
-    }
-
-    if (name == "relaxation") {
-        p = relaxation;
-        return in;
-    }
-
-    throw std::invalid_argument("Invalid preconditioner class. "
-            "Valid choices are: amg, relaxation");
-}
-} // namespace precond_class
-
-/// Runtime-configurable wrapper around the distributed preconditioners.
-/**
- * The concrete implementation is chosen from the "class" entry of the
- * parameter tree (amg when the entry is absent) and is kept behind the
- * type-erased pointer `handle`. Every public method casts the pointer back
- * according to `_class` and forwards the call.
- *
- * The object exclusively owns the implementation. It is movable but not
- * copyable: a copy would share `handle` and delete it twice. A moved-from
- * object may only be destroyed or assigned to.
- */
-template <class Backend>
-class preconditioner {
-    public:
-        typedef Backend backend_type;
-        typedef typename backend_type::params backend_params;
-        typedef boost::property_tree::ptree params;
-        typedef typename backend_type::value_type value_type;
-        typedef amgcl::mpi::distributed_matrix<backend_type> matrix;
-
-        /// Wraps \p Astrip into a distributed matrix over \p comm and builds
-        /// the preconditioner selected by prm["class"] for it.
-        template <class Matrix>
-        preconditioner(
-                amgcl::mpi::communicator comm,
-                const Matrix &Astrip,
-                params prm = params(),
-                const backend_params &bprm = backend_params()
-                ) : _class(prm.get("class", precond_class::amg)), handle(0)
-        {
-            init(std::make_shared<matrix>(comm, Astrip, backend::rows(Astrip)), prm, bprm);
-        }
-
-        /// Builds the preconditioner selected by prm["class"] for an existing
-        /// distributed matrix. The communicator argument is ignored;
-        /// A->comm() is used instead.
-        preconditioner(
-                amgcl::mpi::communicator,
-                std::shared_ptr<matrix> A,
-                params prm = params(),
-                const backend_params &bprm = backend_params()
-                ) : _class(prm.get("class", precond_class::amg)), handle(0)
-        {
-            init(A, prm, bprm);
-        }
-
-        // Copying would leave two objects deleting the same handle.
-        preconditioner(const preconditioner&) = delete;
-        preconditioner& operator=(const preconditioner&) = delete;
-
-        /// Takes over the implementation owned by \p other.
-        preconditioner(preconditioner &&other) noexcept
-            : _class(other._class), handle(other.handle)
-        {
-            other.handle = 0;
-        }
-
-        /// Releases the current implementation and takes over the one owned
-        /// by \p other.
-        preconditioner& operator=(preconditioner &&other) noexcept {
-            if (this != &other) {
-                destroy();
-                _class = other._class;
-                handle = other.handle;
-                other.handle = 0;
-            }
-            return *this;
-        }
-
-        ~preconditioner() {
-            destroy();
-        }
-
-        /// Forwards to the rebuild() of the AMG implementation. For any
-        /// other class a message is printed to std::cerr and nothing is
-        /// done.
-        template <class Matrix>
-        void rebuild(
-                const Matrix &A,
-                const backend_params &bprm = backend_params()
-                )
-        {
-            switch (_class) {
-                case precond_class::amg:
-                    as_amg()->rebuild(A, bprm);
-                    break;
-                default:
-                    std::cerr << "rebuild is a noop unless the preconditioner is AMG" << std::endl;
-                    return;
-            }
-        }
-
-        /// Forwards (rhs, x) to the apply() of the selected implementation.
-        /// Throws std::invalid_argument for an unknown class.
-        template <class Vec1, class Vec2>
-        void apply(const Vec1 &rhs, Vec2 &&x) const {
-            switch(_class) {
-                case precond_class::amg:
-                    as_amg()->apply(rhs, x);
-                    break;
-                case precond_class::relaxation:
-                    as_relaxation()->apply(rhs, x);
-                    break;
-                default:
-                    throw std::invalid_argument("Unsupported preconditioner class");
-            }
-        }
-
-        /// Returns the system matrix from the finest level.
-        std::shared_ptr<matrix> system_matrix_ptr() const {
-            switch(_class) {
-                case precond_class::amg:
-                    return as_amg()->system_matrix_ptr();
-                case precond_class::relaxation:
-                    return as_relaxation()->system_matrix_ptr();
-                default:
-                    throw std::invalid_argument("Unsupported preconditioner class");
-            }
-        }
-
-        /// Same as system_matrix_ptr(), but returns a reference.
-        const matrix& system_matrix() const {
-            return *system_matrix_ptr();
-        }
-
-        /// Streams the description printed by the selected implementation.
-        friend std::ostream& operator<<(std::ostream &os, const preconditioner &p) {
-            switch(p._class) {
-                case precond_class::amg:
-                    return os << *p.as_amg();
-                case precond_class::relaxation:
-                    return os << *p.as_relaxation();
-                default:
-                    throw std::invalid_argument("Unsupported preconditioner class");
-            }
-        }
-
-    private:
-        /// Concrete type behind `handle` when _class == precond_class::amg.
-        typedef
-            amgcl::mpi::amg<
-                Backend,
-                amgcl::runtime::mpi::coarsening::wrapper<Backend>,
-                amgcl::runtime::mpi::relaxation::wrapper<Backend>,
-                amgcl::runtime::mpi::direct::solver<value_type>,
-                amgcl::runtime::mpi::partition::wrapper<Backend>
-                >
-            amg_precond;
-
-        /// Concrete type behind `handle` when
-        /// _class == precond_class::relaxation.
-        typedef
-            amgcl::mpi::relaxation::as_preconditioner<
-                amgcl::runtime::mpi::relaxation::wrapper<Backend>
-                >
-            relaxation_precond;
-
-        precond_class::type _class;
-        void *handle;
-
-        // The casts below are valid only for the matching value of _class.
-        amg_precond* as_amg() const {
-            return static_cast<amg_precond*>(handle);
-        }
-
-        relaxation_precond* as_relaxation() const {
-            return static_cast<relaxation_precond*>(handle);
-        }
-
-        /// Deletes the owned implementation (if any) through its real type
-        /// and resets the handle.
-        void destroy() noexcept {
-            switch (_class) {
-                case precond_class::amg:
-                    delete as_amg();
-                    break;
-                case precond_class::relaxation:
-                    delete as_relaxation();
-                    break;
-                default:
-                    break;
-            }
-            handle = 0;
-        }
-
-        /// Allocates the implementation selected by _class.
-        void init(std::shared_ptr<matrix> A, params &prm, const backend_params &bprm) {
-            // "class" is consumed here, so it is not part of the tree handed
-            // to the concrete preconditioner below.
-            if (!prm.erase("class")) AMGCL_PARAM_MISSING("class");
-
-            switch(_class) {
-                case precond_class::amg:
-                    handle = static_cast<void*>(new amg_precond(A->comm(), A, prm, bprm));
-                    break;
-                case precond_class::relaxation:
-                    handle = static_cast<void*>(new relaxation_precond(A->comm(), A, prm, bprm));
-                    break;
-                default:
-                    throw std::invalid_argument("Unsupported preconditioner class");
-            }
-        }
-};
-
-} // namespace mpi
-} // namespace runtime
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/mpi/relaxation/as_preconditioner.hpp b/src/solvers/amgcl/mpi/relaxation/as_preconditioner.hpp
deleted file mode 100644
index 9fa70b8..0000000
--- a/src/solvers/amgcl/mpi/relaxation/as_preconditioner.hpp
+++ /dev/null
@@ -1,105 +0,0 @@
-#ifndef AMGCL_MPI_RELAXATION_AS_PRECONDITIONER_HPP
-#define AMGCL_MPI_RELAXATION_AS_PRECONDITIONER_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/mpi/relaxation/as_preconditioner.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Use a distributed amgcl smoother as a standalone preconditioner.
- */
-
-#include <vector>
-#include <memory>
-#include <amgcl/backend/builtin.hpp>
-#include <amgcl/mpi/util.hpp>
-
-namespace amgcl {
-namespace mpi {
-namespace relaxation {
-
-/// Adapter that exposes a distributed relaxation scheme through the
-/// preconditioner interface (apply / system_matrix).
-/**
- * The adapter keeps a shared pointer to the distributed system matrix and
- * an instance of \p Relaxation constructed for that matrix. apply()
- * forwards to Relaxation::apply(matrix, rhs, x).
- */
-template <class Relaxation>
-struct as_preconditioner {
-    typedef typename Relaxation::params                params;
-    typedef typename Relaxation::backend_type          backend_type;
-    typedef typename backend_type::params              backend_params;
-    typedef typename backend_type::value_type          value_type;
-    typedef typename math::scalar_of<value_type>::type scalar_type;
-    typedef distributed_matrix<backend_type>           matrix;
-    typedef typename backend_type::vector              vector;
-
-    /// Wraps \p A into a distributed matrix over \p comm, builds the
-    /// relaxation for it and moves the matrix to the backend.
-    template <class Matrix>
-    as_preconditioner(
-            communicator comm,
-            const Matrix &A,
-            const params &prm = params(),
-            const backend_params &bprm = backend_params()
-       ) : A(std::make_shared<matrix>(comm, A, backend::rows(A))),
-           // The parameter A shadows the member; the relaxation has to be
-           // built from the distributed matrix created just above, as the
-           // other constructor does. The member A is declared before S, so
-           // it is already initialized at this point.
-           S(*this->A, prm, bprm)
-    {
-        this->A->move_to_backend(bprm);
-    }
-
-    /// Builds the relaxation for an existing distributed matrix and moves
-    /// the matrix to the backend. The communicator argument is ignored.
-    as_preconditioner(
-            communicator,
-            std::shared_ptr<matrix> A,
-            const params &prm = params(),
-            const backend_params &bprm = backend_params()
-       ) : A(A), S(*A, prm, bprm)
-    {
-        this->A->move_to_backend(bprm);
-    }
-
-    /// Forwards to the apply() of the relaxation with the stored matrix.
-    template <class Vec1, class Vec2>
-    void apply(const Vec1 &rhs, Vec2 &&x) const {
-        S.apply(*A, rhs, x);
-    }
-
-    /// Returns the shared pointer to the stored system matrix.
-    std::shared_ptr<matrix> system_matrix_ptr() const {
-        return A;
-    }
-
-    /// Returns the stored system matrix by reference.
-    const matrix& system_matrix() const {
-        return *system_matrix_ptr();
-    }
-
-    private:
-        // Declaration order matters: A has to be initialized before S.
-        std::shared_ptr<matrix> A;
-        Relaxation S;
-
-        /// Prints the global number of rows and nonzeros of the matrix.
-        friend std::ostream& operator<<(std::ostream &os, const as_preconditioner &p) {
-            os << "Relaxation as preconditioner" << std::endl;
-            os << "  unknowns: " << p.system_matrix().glob_rows() << std::endl;
-            os << "  nonzeros: " << p.system_matrix().glob_nonzeros() << std::endl;
-
-            return os;
-        }
-};
-
-} // namespace relaxation
-} // namespace mpi
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/mpi/relaxation/chebyshev.hpp b/src/solvers/amgcl/mpi/relaxation/chebyshev.hpp
deleted file mode 100644
index 92d224f..0000000
--- a/src/solvers/amgcl/mpi/relaxation/chebyshev.hpp
+++ /dev/null
@@ -1,60 +0,0 @@
-#ifndef AMGCL_MPI_RELAXATION_CHEBYSHEV_HPP
-#define AMGCL_MPI_RELAXATION_CHEBYSHEV_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/mpi/relaxation/chebyshev.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Distributed memory Chebyshev relaxation scheme.
- */
-
-#include <amgcl/relaxation/chebyshev.hpp>
-#include <amgcl/mpi/distributed_matrix.hpp>
-
-namespace amgcl {
-namespace mpi {
-namespace relaxation {
-
-/// Chebyshev relaxation usable with a distributed matrix.
-/**
- * Thin adapter over amgcl::relaxation::chebyshev: the distributed matrix
- * itself is handed to the base class constructor.
- */
-template <class Backend>
-struct chebyshev : amgcl::relaxation::chebyshev<Backend> {
-    using Base           = amgcl::relaxation::chebyshev<Backend>;
-    using backend_type   = Backend;
-    using backend_params = typename Backend::params;
-    using params         = typename Base::params;
-
-    chebyshev(
-            const distributed_matrix<Backend> &A,
-            const params &prm = params(),
-            const backend_params &bprm = backend_params())
-        : Base(A, prm, bprm)
-    {
-    }
-};
-
-} // namespace
-} // mpi
-} // amgcl
-
-#endif
diff --git a/src/solvers/amgcl/mpi/relaxation/damped_jacobi.hpp b/src/solvers/amgcl/mpi/relaxation/damped_jacobi.hpp
deleted file mode 100644
index a736edd..0000000
--- a/src/solvers/amgcl/mpi/relaxation/damped_jacobi.hpp
+++ /dev/null
@@ -1,60 +0,0 @@
-#ifndef AMGCL_MPI_RELAXATION_DAMPED_JACOBI_HPP
-#define AMGCL_MPI_RELAXATION_DAMPED_JACOBI_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/mpi/relaxation/damped_jacobi.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Distributed memory damped Jacobi relaxation scheme.
- */
-
-#include <amgcl/relaxation/damped_jacobi.hpp>
-#include <amgcl/mpi/distributed_matrix.hpp>
-
-namespace amgcl {
-namespace mpi {
-namespace relaxation {
-
-/// Damped Jacobi relaxation usable with a distributed matrix.
-/**
- * Thin adapter over amgcl::relaxation::damped_jacobi: only the local part
- * of the distributed matrix (*A.local()) is handed to the base class
- * constructor.
- */
-template <class Backend>
-struct damped_jacobi : amgcl::relaxation::damped_jacobi<Backend> {
-    using Base           = amgcl::relaxation::damped_jacobi<Backend>;
-    using backend_type   = Backend;
-    using backend_params = typename Backend::params;
-    using params         = typename Base::params;
-
-    damped_jacobi(
-            const distributed_matrix<Backend> &A,
-            const params &prm = params(),
-            const backend_params &bprm = backend_params())
-        : Base(*A.local(), prm, bprm)
-    {
-    }
-};
-
-} // namespace
-} // mpi
-} // amgcl
-
-#endif
diff --git a/src/solvers/amgcl/mpi/relaxation/gauss_seidel.hpp b/src/solvers/amgcl/mpi/relaxation/gauss_seidel.hpp
deleted file mode 100644
index 720e135..0000000
--- a/src/solvers/amgcl/mpi/relaxation/gauss_seidel.hpp
+++ /dev/null
@@ -1,79 +0,0 @@
-#ifndef AMGCL_MPI_RELAXATION_GAUSS_SEIDEL_HPP
-#define AMGCL_MPI_RELAXATION_GAUSS_SEIDEL_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/mpi/relaxation/gauss_seidel.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Distributed memory Gauss-Seidel relaxation scheme.
- */
-
-#include <amgcl/relaxation/gauss_seidel.hpp>
-#include <amgcl/mpi/distributed_matrix.hpp>
-
-namespace amgcl {
-namespace mpi {
-namespace relaxation {
-
-template <class Backend>
-struct gauss_seidel : public amgcl::relaxation::gauss_seidel<Backend> {
-    typedef Backend backend_type;
-    typedef amgcl::relaxation::gauss_seidel<Backend> Base;
-    typedef typename Backend::params backend_params;
-    typedef typename Base::params params;
-
-    gauss_seidel(
-            const distributed_matrix<Backend> &A,
-            const params &prm = params(),
-            const backend_params &bprm = backend_params()
-         ) : Base(*A.local(), prm, bprm)
-    {}
-
-    template <class Matrix, class VectorRHS, class VectorX, class VectorTMP>
-    void apply_pre(const Matrix &A, const VectorRHS &rhs, VectorX &x, VectorTMP &t) const
-    {
-        Base::apply_pre(*A.local_backend(), rhs, x, t);
-    }
-
-    /// \copydoc amgcl::relaxation::damped_jacobi::apply_post
-    template <class Matrix, class VectorRHS, class VectorX, class VectorTMP>
-    void apply_post(const Matrix &A, const VectorRHS &rhs, VectorX &x, VectorTMP &t) const
-    {
-        Base::apply_post(*A.local_backend(), rhs, x, t);
-    }
-
-    template <class Matrix, class VectorRHS, class VectorX>
-    void apply(const Matrix &A, const VectorRHS &rhs, VectorX &x) const
-    {
-        Base::apply(*A.local_backend(), rhs, x);
-    }
-};
-
-} // namespace
-} // mpi
-} // amgcl
-
-#endif
diff --git a/src/solvers/amgcl/mpi/relaxation/ilu0.hpp b/src/solvers/amgcl/mpi/relaxation/ilu0.hpp
deleted file mode 100644
index afec5df..0000000
--- a/src/solvers/amgcl/mpi/relaxation/ilu0.hpp
+++ /dev/null
@@ -1,60 +0,0 @@
-#ifndef AMGCL_MPI_RELAXATION_ILU0_HPP
-#define AMGCL_MPI_RELAXATION_ILU0_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/mpi/relaxation/ilu0.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Distributed memory incomplete LU with zero fill-in relaxation scheme.
- */
-
-#include <amgcl/relaxation/ilu0.hpp>
-#include <amgcl/mpi/distributed_matrix.hpp>
-
-namespace amgcl {
-namespace mpi {
-namespace relaxation {
-
-template <class Backend>
-struct ilu0 : public amgcl::relaxation::ilu0<Backend> {
-    typedef Backend backend_type;
-    typedef amgcl::relaxation::ilu0<Backend> Base;
-    typedef typename Backend::params backend_params;
-    typedef typename Base::params params;
-
-    ilu0(
-            const distributed_matrix<Backend> &A,
-            const params &prm = params(),
-            const backend_params &bprm = backend_params()
-         ) : Base(*A.local(), prm, bprm)
-    {}
-};
-
-} // namespace
-} // mpi
-} // amgcl
-
-#endif
diff --git a/src/solvers/amgcl/mpi/relaxation/iluk.hpp b/src/solvers/amgcl/mpi/relaxation/iluk.hpp
deleted file mode 100644
index 8b2fa0c..0000000
--- a/src/solvers/amgcl/mpi/relaxation/iluk.hpp
+++ /dev/null
@@ -1,60 +0,0 @@
-#ifndef AMGCL_MPI_RELAXATION_ILUK_HPP
-#define AMGCL_MPI_RELAXATION_ILUK_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/mpi/relaxation/iluk.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Distributed memory incomplete LU with fill-in level.
- */
-
-#include <amgcl/relaxation/iluk.hpp>
-#include <amgcl/mpi/distributed_matrix.hpp>
-
-namespace amgcl {
-namespace mpi {
-namespace relaxation {
-
-template <class Backend>
-struct iluk : public amgcl::relaxation::iluk<Backend> {
-    typedef Backend backend_type;
-    typedef amgcl::relaxation::iluk<Backend> Base;
-    typedef typename Backend::params backend_params;
-    typedef typename Base::params params;
-
-    iluk(
-            const distributed_matrix<Backend> &A,
-            const params &prm = params(),
-            const backend_params &bprm = backend_params()
-         ) : Base(*A.local(), prm, bprm)
-    {}
-};
-
-} // namespace
-} // mpi
-} // amgcl
-
-#endif
diff --git a/src/solvers/amgcl/mpi/relaxation/ilup.hpp b/src/solvers/amgcl/mpi/relaxation/ilup.hpp
deleted file mode 100644
index b502b4b..0000000
--- a/src/solvers/amgcl/mpi/relaxation/ilup.hpp
+++ /dev/null
@@ -1,60 +0,0 @@
-#ifndef AMGCL_MPI_RELAXATION_ILUP_HPP
-#define AMGCL_MPI_RELAXATION_ILUP_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/mpi/relaxation/ilup.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Distributed memory incomplete LU with fill-in level.
- */
-
-#include <amgcl/relaxation/ilup.hpp>
-#include <amgcl/mpi/distributed_matrix.hpp>
-
-namespace amgcl {
-namespace mpi {
-namespace relaxation {
-
-template <class Backend>
-struct ilup : public amgcl::relaxation::ilup<Backend> {
-    typedef Backend backend_type;
-    typedef amgcl::relaxation::ilup<Backend> Base;
-    typedef typename Backend::params backend_params;
-    typedef typename Base::params params;
-
-    ilup(
-            const distributed_matrix<Backend> &A,
-            const params &prm = params(),
-            const backend_params &bprm = backend_params()
-         ) : Base(*A.local(), prm, bprm)
-    {}
-};
-
-} // namespace
-} // mpi
-} // amgcl
-
-#endif
diff --git a/src/solvers/amgcl/mpi/relaxation/ilut.hpp b/src/solvers/amgcl/mpi/relaxation/ilut.hpp
deleted file mode 100644
index 53124ad..0000000
--- a/src/solvers/amgcl/mpi/relaxation/ilut.hpp
+++ /dev/null
@@ -1,60 +0,0 @@
-#ifndef AMGCL_MPI_RELAXATION_ILUT_HPP
-#define AMGCL_MPI_RELAXATION_ILUT_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/mpi/relaxation/ilut.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Distributed memory incomplete LU with thresholding relaxation scheme.
- */
-
-#include <amgcl/relaxation/ilut.hpp>
-#include <amgcl/mpi/distributed_matrix.hpp>
-
-namespace amgcl {
-namespace mpi {
-namespace relaxation {
-
-template <class Backend>
-struct ilut : public amgcl::relaxation::ilut<Backend> {
-    typedef Backend backend_type;
-    typedef amgcl::relaxation::ilut<Backend> Base;
-    typedef typename Backend::params backend_params;
-    typedef typename Base::params params;
-
-    ilut(
-            const distributed_matrix<Backend> &A,
-            const params &prm = params(),
-            const backend_params &bprm = backend_params()
-         ) : Base(*A.local(), prm, bprm)
-    {}
-};
-
-} // namespace
-} // mpi
-} // amgcl
-
-#endif
diff --git a/src/solvers/amgcl/mpi/relaxation/runtime.hpp b/src/solvers/amgcl/mpi/relaxation/runtime.hpp
deleted file mode 100644
index 896afc2..0000000
--- a/src/solvers/amgcl/mpi/relaxation/runtime.hpp
+++ /dev/null
@@ -1,337 +0,0 @@
-#ifndef AMGCL_MPI_RELAXATION_RUNTIME_HPP
-#define AMGCL_MPI_RELAXATION_RUNTIME_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/mpi/relaxation/runtime.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Distributed memory sparse approximate inverse relaxation scheme.
- */
-
-#include <memory>
-
-#ifdef AMGCL_NO_BOOST
-#  error Runtime interface relies on Boost.PropertyTree!
-#endif
-
-#include <boost/property_tree/ptree.hpp>
-
-#include <amgcl/util.hpp>
-#include <amgcl/backend/interface.hpp>
-#include <amgcl/value_type/interface.hpp>
-#include <amgcl/relaxation/runtime.hpp>
-#include <amgcl/mpi/relaxation/spai0.hpp>
-#include <amgcl/mpi/util.hpp>
-#include <amgcl/mpi/distributed_matrix.hpp>
-
-namespace amgcl {
-namespace runtime {
-namespace mpi {
-namespace relaxation {
-
-template <class Backend>
-struct wrapper {
-    typedef Backend                     backend_type;
-    typedef typename Backend::params    backend_params;
-    typedef boost::property_tree::ptree params;
-
-    runtime::relaxation::type r;
-    void *handle;
-
-    wrapper(const amgcl::mpi::distributed_matrix<Backend> &A,
-            params prm, const backend_params &bprm = backend_params())
-      : r(prm.get("type", runtime::relaxation::spai0)), handle(0)
-    {
-        if (!prm.erase("type")) AMGCL_PARAM_MISSING("type");
-
-        switch(r) {
-
-#define AMGCL_RELAX_DISTR(type) \
-            case runtime::relaxation::type: \
-                handle = static_cast<void*>(new amgcl::mpi::relaxation::type<Backend>(A, prm, bprm)); \
-                break
-
-#define AMGCL_RELAX_LOCAL_DISTR(type) \
-            case runtime::relaxation::type: \
-                handle = call_constructor<amgcl::relaxation::type>(A, prm, bprm); \
-                break;
-
-#define AMGCL_RELAX_LOCAL_LOCAL(type) \
-            case runtime::relaxation::type: \
-                handle = call_constructor<amgcl::relaxation::type>(*A.local(), prm, bprm); \
-                break;
-
-            AMGCL_RELAX_DISTR(spai0);
-            AMGCL_RELAX_LOCAL_DISTR(chebyshev);
-            AMGCL_RELAX_LOCAL_LOCAL(damped_jacobi);
-            AMGCL_RELAX_LOCAL_LOCAL(ilu0);
-            AMGCL_RELAX_LOCAL_LOCAL(iluk);
-            AMGCL_RELAX_LOCAL_LOCAL(ilup);
-            AMGCL_RELAX_LOCAL_LOCAL(ilut);
-            AMGCL_RELAX_LOCAL_LOCAL(spai1);
-            AMGCL_RELAX_LOCAL_LOCAL(gauss_seidel);
-
-#undef AMGCL_RELAX_LOCAL_LOCAL
-#undef AMGCL_RELAX_LOCAL_DISTR
-#undef AMGCL_RELAX_DISTR
-
-            default:
-                throw std::invalid_argument("Unsupported relaxation type");
-        }
-    }
-
-    ~wrapper() {
-        switch(r) {
-#define AMGCL_RELAX_DISTR(type) \
-            case runtime::relaxation::type: \
-                delete static_cast<amgcl::mpi::relaxation::type<Backend>*>(handle); \
-                break
-
-#define AMGCL_RELAX_LOCAL(type) \
-            case runtime::relaxation::type: \
-                delete static_cast<amgcl::relaxation::type<Backend>*>(handle); \
-                break;
-
-            AMGCL_RELAX_DISTR(spai0);
-            AMGCL_RELAX_LOCAL(damped_jacobi);
-            AMGCL_RELAX_LOCAL(ilu0);
-            AMGCL_RELAX_LOCAL(iluk);
-            AMGCL_RELAX_LOCAL(ilup);
-            AMGCL_RELAX_LOCAL(ilut);
-            AMGCL_RELAX_LOCAL(spai1);
-            AMGCL_RELAX_LOCAL(chebyshev);
-            AMGCL_RELAX_LOCAL(gauss_seidel);
-
-#undef AMGCL_RELAX_LOCAL
-#undef AMGCL_RELAX_DISTR
-
-            default:
-                break;
-        }
-    }
-
-    template <class Matrix, class VectorRHS, class VectorX, class VectorTMP>
-    void apply_pre(const Matrix &A, const VectorRHS &rhs, VectorX &x, VectorTMP &tmp) const {
-        switch(r) {
-
-#define AMGCL_RELAX_DISTR(type) \
-            case runtime::relaxation::type: \
-                static_cast<const amgcl::mpi::relaxation::type<Backend>*>(handle)->apply_pre(A, rhs, x, tmp); \
-                break
-
-#define AMGCL_RELAX_LOCAL_DISTR(type) \
-            case runtime::relaxation::type: \
-                call_apply_pre<amgcl::relaxation::type>(A, rhs, x, tmp); \
-                break;
-
-#define AMGCL_RELAX_LOCAL_LOCAL(type) \
-            case runtime::relaxation::type: \
-                call_apply_pre<amgcl::relaxation::type>(*A.local_backend(), rhs, x, tmp); \
-                break;
-
-            AMGCL_RELAX_DISTR(spai0);
-            AMGCL_RELAX_LOCAL_DISTR(damped_jacobi);
-            AMGCL_RELAX_LOCAL_DISTR(ilu0);
-            AMGCL_RELAX_LOCAL_DISTR(iluk);
-            AMGCL_RELAX_LOCAL_DISTR(ilup);
-            AMGCL_RELAX_LOCAL_DISTR(ilut);
-            AMGCL_RELAX_LOCAL_DISTR(spai1);
-            AMGCL_RELAX_LOCAL_DISTR(chebyshev);
-            AMGCL_RELAX_LOCAL_LOCAL(gauss_seidel);
-
-#undef AMGCL_RELAX_LOCAL_LOCAL
-#undef AMGCL_RELAX_LOCAL_DISTR
-#undef AMGCL_RELAX_DISTR
-
-            default:
-                throw std::invalid_argument("Unsupported relaxation type");
-        }
-    }
-
-    template <class Matrix, class VectorRHS, class VectorX, class VectorTMP>
-    void apply_post(const Matrix &A, const VectorRHS &rhs, VectorX &x, VectorTMP &tmp) const {
-        switch(r) {
-
-#define AMGCL_RELAX_DISTR(type) \
-            case runtime::relaxation::type: \
-                static_cast<const amgcl::mpi::relaxation::type<Backend>*>(handle)->apply_post(A, rhs, x, tmp); \
-                break
-
-#define AMGCL_RELAX_LOCAL_DISTR(type) \
-            case runtime::relaxation::type: \
-                call_apply_post<amgcl::relaxation::type>(A, rhs, x, tmp); \
-                break;
-
-#define AMGCL_RELAX_LOCAL_LOCAL(type) \
-            case runtime::relaxation::type: \
-                call_apply_post<amgcl::relaxation::type>(*A.local_backend(), rhs, x, tmp); \
-                break;
-
-            AMGCL_RELAX_DISTR(spai0);
-            AMGCL_RELAX_LOCAL_DISTR(damped_jacobi);
-            AMGCL_RELAX_LOCAL_DISTR(ilu0);
-            AMGCL_RELAX_LOCAL_DISTR(iluk);
-            AMGCL_RELAX_LOCAL_DISTR(ilup);
-            AMGCL_RELAX_LOCAL_DISTR(ilut);
-            AMGCL_RELAX_LOCAL_DISTR(spai1);
-            AMGCL_RELAX_LOCAL_DISTR(chebyshev);
-            AMGCL_RELAX_LOCAL_LOCAL(gauss_seidel);
-
-#undef AMGCL_RELAX_LOCAL_LOCAL
-#undef AMGCL_RELAX_LOCAL_DISTR
-#undef AMGCL_RELAX_DISTR
-
-            default:
-                throw std::invalid_argument("Unsupported relaxation type");
-        }
-    }
-
-    template <class Matrix, class VectorRHS, class VectorX>
-    void apply(const Matrix &A, const VectorRHS &rhs, VectorX &x) const {
-        switch(r) {
-
-#define AMGCL_RELAX_DISTR(type) \
-            case runtime::relaxation::type: \
-                static_cast<const amgcl::mpi::relaxation::type<Backend>*>(handle)->apply(A, rhs, x); \
-                break
-
-#define AMGCL_RELAX_LOCAL_DISTR(type) \
-            case runtime::relaxation::type: \
-                call_apply<amgcl::relaxation::type>(A, rhs, x); \
-                break;
-
-#define AMGCL_RELAX_LOCAL_LOCAL(type) \
-            case runtime::relaxation::type: \
-                call_apply<amgcl::relaxation::type>(*A.local_backend(), rhs, x); \
-                break;
-
-            AMGCL_RELAX_DISTR(spai0);
-            AMGCL_RELAX_LOCAL_DISTR(damped_jacobi);
-            AMGCL_RELAX_LOCAL_LOCAL(gauss_seidel);
-            AMGCL_RELAX_LOCAL_DISTR(ilu0);
-            AMGCL_RELAX_LOCAL_DISTR(iluk);
-            AMGCL_RELAX_LOCAL_DISTR(ilup);
-            AMGCL_RELAX_LOCAL_DISTR(ilut);
-            AMGCL_RELAX_LOCAL_DISTR(spai1);
-            AMGCL_RELAX_LOCAL_DISTR(chebyshev);
-
-#undef AMGCL_RELAX_LOCAL_LOCAL
-#undef AMGCL_RELAX_LOCAL_DISTR
-#undef AMGCL_RELAX_DISTR
-
-            default:
-                throw std::invalid_argument("Unsupported relaxation type");
-        }
-    }
-
-    template <template <class> class Relaxation, class Matrix>
-    typename std::enable_if<
-        backend::relaxation_is_supported<Backend, Relaxation>::value,
-        void*
-    >::type
-    call_constructor(
-            const Matrix &A, const params &prm, const backend_params &bprm)
-    {
-        return static_cast<void*>(new Relaxation<Backend>(A, prm, bprm));
-    }
-
-    template <template <class> class Relaxation, class Matrix>
-    typename std::enable_if<
-        !backend::relaxation_is_supported<Backend, Relaxation>::value,
-        void*
-    >::type
-    call_constructor(const Matrix&, const params&, const backend_params&)
-    {
-        throw std::logic_error("The relaxation is not supported by the backend");
-    }
-
-    template <template <class> class Relaxation, class Matrix, class VectorRHS, class VectorX, class VectorTMP>
-    typename std::enable_if<
-        backend::relaxation_is_supported<Backend, Relaxation>::value,
-        void
-    >::type
-    call_apply_pre(
-            const Matrix &A, const VectorRHS &rhs, VectorX &x, VectorTMP &tmp) const
-    {
-        static_cast<Relaxation<Backend>*>(handle)->apply_pre(A, rhs, x, tmp);
-    }
-
-    template <template <class> class Relaxation, class Matrix, class VectorRHS, class VectorX, class VectorTMP>
-    typename std::enable_if<
-        !backend::relaxation_is_supported<Backend, Relaxation>::value,
-        void
-    >::type
-    call_apply_pre(const Matrix&, const VectorRHS&, VectorX&, VectorTMP&) const {
-        throw std::logic_error("The relaxation is not supported by the backend");
-    }
-
-    template <template <class> class Relaxation, class Matrix, class VectorRHS, class VectorX, class VectorTMP>
-    typename std::enable_if<
-        backend::relaxation_is_supported<Backend, Relaxation>::value,
-        void
-    >::type
-    call_apply_post(
-            const Matrix &A, const VectorRHS &rhs, VectorX &x, VectorTMP &tmp) const
-    {
-        static_cast<Relaxation<Backend>*>(handle)->apply_post(A, rhs, x, tmp);
-    }
-
-    template <template <class> class Relaxation, class Matrix, class VectorRHS, class VectorX, class VectorTMP>
-    typename std::enable_if<
-        !backend::relaxation_is_supported<Backend, Relaxation>::value,
-        void
-    >::type
-    call_apply_post(const Matrix&, const VectorRHS&, VectorX&, VectorTMP&) const {
-        throw std::logic_error("The relaxation is not supported by the backend");
-    }
-
-    template <template <class> class Relaxation, class Matrix, class VectorRHS, class VectorX>
-    typename std::enable_if<
-        backend::relaxation_is_supported<Backend, Relaxation>::value,
-        void
-    >::type
-    call_apply(
-            const Matrix &A, const VectorRHS &rhs, VectorX &x) const
-    {
-        static_cast<Relaxation<Backend>*>(handle)->apply(A, rhs, x);
-    }
-
-    template <template <class> class Relaxation, class Matrix, class VectorRHS, class VectorX>
-    typename std::enable_if<
-        !backend::relaxation_is_supported<Backend, Relaxation>::value,
-        void
-    >::type
-    call_apply(const Matrix&, const VectorRHS&, VectorX&) const {
-        throw std::logic_error("The relaxation is not supported by the backend");
-    }
-};
-
-} // namespace relaxation
-} // namespace mpi
-} // namespace runtime
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/mpi/relaxation/spai0.hpp b/src/solvers/amgcl/mpi/relaxation/spai0.hpp
deleted file mode 100644
index 54ab3f8..0000000
--- a/src/solvers/amgcl/mpi/relaxation/spai0.hpp
+++ /dev/null
@@ -1,127 +0,0 @@
-#ifndef AMGCL_MPI_RELAXATION_SPAI0_HPP
-#define AMGCL_MPI_RELAXATION_SPAI0_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/mpi/relaxation/spai0.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Distributed memory sparse approximate inverse relaxation scheme.
- */
-
-#include <memory>
-#include <amgcl/backend/interface.hpp>
-#include <amgcl/value_type/interface.hpp>
-#include <amgcl/mpi/util.hpp>
-#include <amgcl/mpi/distributed_matrix.hpp>
-
-namespace amgcl {
-namespace mpi {
-namespace relaxation {
-
-template <class Backend>
-struct spai0 {
-    typedef Backend                                    backend_type;
-    typedef typename Backend::value_type               value_type;
-    typedef typename Backend::matrix_diagonal          matrix_diagonal;
-    typedef typename math::scalar_of<value_type>::type scalar_type;
-    typedef amgcl::detail::empty_params                params;
-    typedef typename Backend::params                   backend_params;
-
-    spai0(
-            const distributed_matrix<Backend> &A,
-            const params &, const backend_params &bprm = backend_params()
-         )
-    {
-        typedef backend::crs<value_type> build_matrix;
-
-        const ptrdiff_t n = A.loc_rows();
-        const build_matrix &A_loc = *A.local();
-        const build_matrix &A_rem = *A.remote();
-
-        auto m = std::make_shared< backend::numa_vector<value_type> >(n, false);
-        typedef backend::crs<value_type> build_matrix;
-
-#pragma omp parallel for
-        for(ptrdiff_t i = 0; i < n; ++i) {
-            value_type  num = math::zero<value_type>();
-            scalar_type den = math::zero<scalar_type>();
-
-            for(ptrdiff_t j = A_loc.ptr[i], e = A_loc.ptr[i+1]; j < e; ++j) {
-                value_type v = A_loc.val[j];
-                scalar_type norm_v = math::norm(v);
-                den += norm_v * norm_v;
-                if (A_loc.col[j] == i) num += v;
-            }
-
-            for(ptrdiff_t j = A_rem.ptr[i], e = A_rem.ptr[i+1]; j < e; ++j) {
-                value_type v = A_rem.val[j];
-                scalar_type norm_v = math::norm(v);
-                den += norm_v * norm_v;
-            }
-
-            (*m)[i] = math::inverse(den) * num;
-        }
-
-        M = Backend::copy_vector(m, bprm);
-    }
-
-    /// \copydoc amgcl::relaxation::damped_jacobi::apply_pre
-    template <class Matrix, class VectorRHS, class VectorX, class VectorTMP>
-    void apply_pre(
-            const Matrix &A, const VectorRHS &rhs, VectorX &x, VectorTMP &tmp
-            ) const
-    {
-        static const scalar_type one = math::identity<scalar_type>();
-        backend::residual(rhs, A, x, tmp);
-        backend::vmul(one, *M, tmp, one, x);
-    }
-
-    /// \copydoc amgcl::relaxation::damped_jacobi::apply_post
-    template <class Matrix, class VectorRHS, class VectorX, class VectorTMP>
-    void apply_post(
-            const Matrix &A, const VectorRHS &rhs, VectorX &x, VectorTMP &tmp
-            ) const
-    {
-        static const scalar_type one = math::identity<scalar_type>();
-        backend::residual(rhs, A, x, tmp);
-        backend::vmul(one, *M, tmp, one, x);
-    }
-
-    template <class Matrix, class VectorRHS, class VectorX>
-    void apply( const Matrix&, const VectorRHS &rhs, VectorX &x) const
-    {
-        backend::vmul(math::identity<scalar_type>(), *M, rhs, math::zero<scalar_type>(), x);
-    }
-
-    private:
-        std::shared_ptr<matrix_diagonal> M;
-};
-
-} // namespace relaxation
-} // namespace mpi
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/mpi/relaxation/spai1.hpp b/src/solvers/amgcl/mpi/relaxation/spai1.hpp
deleted file mode 100644
index e9b4ba7..0000000
--- a/src/solvers/amgcl/mpi/relaxation/spai1.hpp
+++ /dev/null
@@ -1,60 +0,0 @@
-#ifndef AMGCL_MPI_RELAXATION_SPAI1_HPP
-#define AMGCL_MPI_RELAXATION_SPAI1_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/mpi/relaxation/spai1.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Distributed memory sparse approximate inverse relaxation scheme.
- */
-
-#include <amgcl/relaxation/spai1.hpp>
-#include <amgcl/mpi/distributed_matrix.hpp>
-
-namespace amgcl {
-namespace mpi {
-namespace relaxation {
-
-template <class Backend>
-struct spai1 : public amgcl::relaxation::spai1<Backend> {
-    typedef Backend backend_type;
-    typedef amgcl::relaxation::spai1<Backend> Base;
-    typedef typename Backend::params backend_params;
-    typedef typename Base::params params;
-
-    spai1(
-            const distributed_matrix<Backend> &A,
-            const params &prm = params(),
-            const backend_params &bprm = backend_params()
-         ) : Base(*A.local(), prm, bprm)
-    {}
-};
-
-} // namespace
-} // mpi
-} // amgcl
-
-#endif
diff --git a/src/solvers/amgcl/mpi/schur_pressure_correction.hpp b/src/solvers/amgcl/mpi/schur_pressure_correction.hpp
deleted file mode 100644
index ffa3bc3..0000000
--- a/src/solvers/amgcl/mpi/schur_pressure_correction.hpp
+++ /dev/null
@@ -1,674 +0,0 @@
-#ifndef AMGCL_MPI_SCHUR_PRESSURE_CORRECTION_HPP
-#define AMGCL_MPI_SCHUR_PRESSURE_CORRECTION_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/mpi/schur_pressure_correction.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Distributed Schur complement pressure correction preconditioner.
- */
-
-#include <vector>
-
-#include <memory>
-
-#include <amgcl/util.hpp>
-#include <amgcl/backend/builtin.hpp>
-#include <amgcl/backend/detail/mixing.hpp>
-#include <amgcl/mpi/inner_product.hpp>
-#include <amgcl/mpi/distributed_matrix.hpp>
-
-namespace amgcl {
-namespace mpi {
-
-template <class USolver, class PSolver>
-class schur_pressure_correction {
-    static_assert(
-            std::is_same<
-                typename USolver::backend_type,
-                typename PSolver::backend_type
-                >::value,
-            "Backends for pressure and flow preconditioners should coincide!"
-            );
-
-    public:
-        typedef
-            typename backend::detail::common_scalar_backend<
-                typename USolver::backend_type,
-                typename PSolver::backend_type
-                >::type
-            backend_type;
-
-        typedef typename backend_type::value_type value_type;
-        typedef typename math::scalar_of<value_type>::type scalar_type;
-        typedef typename backend_type::matrix     bmatrix;
-        typedef typename backend_type::vector     vector;
-        typedef typename backend_type::params     backend_params;
-
-        typedef distributed_matrix<backend_type> matrix;
-
-        typedef typename backend::builtin<value_type>::matrix build_matrix;
-
-        struct params {
-            typedef typename USolver::params usolver_params;
-            typedef typename PSolver::params psolver_params;
-
-            usolver_params usolver;
-            psolver_params psolver;
-
-            std::vector<char> pmask;
-
-            // Variant of block preconditioner to use in apply()
-            // 1: schur pressure correction:
-            //      S p = fp - Kpu Kuu^-1 fu
-            //      Kuu u = fu - Kup p
-            // 2: Block triangular:
-            //      S p = fp
-            //      Kuu u = fu - Kup p
-            int type;
-
-            // Approximate Kuu^-1 with inverted diagonal of Kuu during
-            // construction of matrix-less Schur complement.
-            // When false, USolver is used instead.
-            bool approx_schur;
-
-            // Use 1/sum_j(abs(Kuu_{i,j})) instead of dia(Kuu)^-1
-            // as approximation for the Kuu^-1 (as in SIMPLEC algorithm)
-            bool simplec_dia;
-
-            int verbose;
-
-            params() : type(1), approx_schur(false), simplec_dia(true), verbose(0) {}
-
-#ifndef AMGCL_NO_BOOST
-            params(const boost::property_tree::ptree &p)
-                : AMGCL_PARAMS_IMPORT_CHILD(p, usolver),
-                  AMGCL_PARAMS_IMPORT_CHILD(p, psolver),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, type),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, approx_schur),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, simplec_dia),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, verbose)
-            {
-                size_t n = 0;
-
-                n = p.get("pmask_size", n);
-
-                amgcl::precondition(n > 0,
-                        "Error in schur_complement parameters: "
-                        "pmask_size is not set");
-
-                if (p.count("pmask_pattern")) {
-                    pmask.resize(n, 0);
-
-                    std::string pattern = p.get("pmask_pattern", std::string());
-                    switch (pattern[0]) {
-                        case '%':
-                            {
-                                int start  = std::atoi(pattern.substr(1).c_str());
-                                int stride = std::atoi(pattern.substr(3).c_str());
-                                for(size_t i = start; i < n; i += stride) pmask[i] = 1;
-                            }
-                            break;
-                        case '<':
-                            {
-                                size_t m = std::atoi(pattern.c_str()+1);
-                                for(size_t i = 0; i < std::min(m, n); ++i) pmask[i] = 1;
-                            }
-                            break;
-                        case '>':
-                            {
-                                size_t m = std::atoi(pattern.c_str()+1);
-                                for(size_t i = m; i < n; ++i) pmask[i] = 1;
-                            }
-                            break;
-                        default:
-                            amgcl::precondition(false, "Unknown pattern in pmask_pattern");
-                    }
-                } else if (p.count("pmask")) {
-                    void *pm = 0;
-                    pm = p.get("pmask", pm);
-                    pmask.assign(static_cast<char*>(pm), static_cast<char*>(pm) + n);
-                } else {
-                    amgcl::precondition(false,
-                            "Error in schur_complement parameters: "
-                            "neither pmask_pattern, nor pmask is set"
-                            );
-                }
-
-                check_params(p, {
-                        "usolver", "psolver", "type", "approx_schur",
-                        "simplec_dia", "pmask_size", "verbose"
-                        },
-                        {"pmask", "pmask_pattern"});
-            }
-
-            void get(boost::property_tree::ptree &p, const std::string &path = "") const
-            {
-                AMGCL_PARAMS_EXPORT_CHILD(p, path, usolver);
-                AMGCL_PARAMS_EXPORT_CHILD(p, path, psolver);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, type);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, approx_schur);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, simplec_dia);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, verbose);
-            }
-#endif
-        } prm;
-
-        template <class Matrix>
-        schur_pressure_correction(
-                communicator comm,
-                const Matrix &K,
-                const params &prm = params(),
-                const backend_params &bprm = backend_params()
-                )
-            : prm(prm), comm(comm)
-        {
-            this->K = std::make_shared<matrix>(comm, K, backend::rows(K));
-            init(bprm);
-        }
-
-        schur_pressure_correction(
-                communicator comm,
-                std::shared_ptr<matrix> K,
-                const params &prm = params(),
-                const backend_params &bprm = backend_params()
-                )
-            : prm(prm), comm(comm), K(K)
-        {
-            init(bprm);
-        }
-
-        void init(const backend_params &bprm) {
-            using std::tie;
-            using std::make_tuple;
-            using std::shared_ptr;
-            using std::make_shared;
-
-            auto _K_loc = K->local();
-            auto _K_rem = K->remote();
-
-            build_matrix &K_loc = *_K_loc;
-            build_matrix &K_rem = *_K_rem;
-
-            ptrdiff_t n = K->loc_rows();
-
-            // Count pressure and flow variables.
-            AMGCL_TIC("count pressure/flow vars");
-            std::vector<ptrdiff_t> idx(n);
-            ptrdiff_t np = 0, nu = 0;
-
-            for(ptrdiff_t i = 0; i < n; ++i)
-                idx[i] = (prm.pmask[i] ? np++ : nu++);
-            AMGCL_TOC("count pressure/flow vars");
-
-            AMGCL_TIC("setup communication");
-            // We know what points each of our neighbors needs from us;
-            // and we know if those points are pressure or flow.
-            // We can immediately provide them with our renumbering scheme.
-            std::vector<ptrdiff_t> pdomain = comm.exclusive_sum(np);
-            std::vector<ptrdiff_t> udomain = comm.exclusive_sum(nu);
-            ptrdiff_t p_beg = pdomain[comm.rank];
-            ptrdiff_t u_beg = udomain[comm.rank];
-
-            const CommPattern &C = this->K->cpat();
-            ptrdiff_t nsend = C.send.count(), nrecv = C.recv.count();
-            std::vector<char>      smask(nsend), rmask(nrecv);
-            std::vector<ptrdiff_t> s_idx(nsend), r_idx(nrecv);
-
-            for(ptrdiff_t i = 0; i < nsend; ++i) {
-                ptrdiff_t c = C.send.col[i];
-                smask[i] = prm.pmask[c];
-                s_idx[i] = idx[c] + (smask[i] ? p_beg : u_beg);
-            }
-
-            C.exchange(&smask[0], &rmask[0]);
-            C.exchange(&s_idx[0], &r_idx[0]);
-            AMGCL_TOC("setup communication");
-
-            // Fill the subblocks of the system matrix.
-            // K_rem->col may be used as direct indices into rmask and r_idx.
-            AMGCL_TIC("schur blocks");
-            this->K->move_to_backend(bprm);
-
-            auto Kpp_loc = make_shared<build_matrix>();
-            auto Kpp_rem = make_shared<build_matrix>();
-            auto Kuu_loc = make_shared<build_matrix>();
-            auto Kuu_rem = make_shared<build_matrix>();
-
-            auto Kpu_loc = make_shared<build_matrix>();
-            auto Kpu_rem = make_shared<build_matrix>();
-            auto Kup_loc = make_shared<build_matrix>();
-            auto Kup_rem = make_shared<build_matrix>();
-
-            Kpp_loc->set_size(np, np, true);
-            Kpp_rem->set_size(np, 0, true);
-
-            Kuu_loc->set_size(nu, nu, true);
-            Kuu_rem->set_size(nu, 0, true);
-
-            Kpu_loc->set_size(np, nu, true);
-            Kpu_rem->set_size(np, 0, true);
-
-            Kup_loc->set_size(nu, np, true);
-            Kup_rem->set_size(nu, 0, true);
-
-#pragma omp parallel for
-            for(ptrdiff_t i = 0; i < n; ++i) {
-                ptrdiff_t ci = idx[i];
-                char      pi = prm.pmask[i];
-
-                for(auto a = row_begin(K_loc, i); a; ++a) {
-                    char pj = prm.pmask[a.col()];
-
-                    if (pi) {
-                        if (pj) {
-                            ++Kpp_loc->ptr[ci + 1];
-                        } else {
-                            ++Kpu_loc->ptr[ci + 1];
-                        }
-                    } else {
-                        if (pj) {
-                            ++Kup_loc->ptr[ci + 1];
-                        } else {
-                            ++Kuu_loc->ptr[ci + 1];
-                        }
-                    }
-                }
-
-                for(auto a = row_begin(K_rem, i); a; ++a) {
-                    char pj = rmask[a.col()];
-
-                    if (pi) {
-                        if (pj) {
-                            ++Kpp_rem->ptr[ci + 1];
-                        } else {
-                            ++Kpu_rem->ptr[ci + 1];
-                        }
-                    } else {
-                        if (pj) {
-                            ++Kup_rem->ptr[ci + 1];
-                        } else {
-                            ++Kuu_rem->ptr[ci + 1];
-                        }
-                    }
-                }
-            }
-
-            Kpp_loc->set_nonzeros(Kpp_loc->scan_row_sizes());
-            Kpp_rem->set_nonzeros(Kpp_rem->scan_row_sizes());
-
-            Kuu_loc->set_nonzeros(Kuu_loc->scan_row_sizes());
-            Kuu_rem->set_nonzeros(Kuu_rem->scan_row_sizes());
-
-            Kpu_loc->set_nonzeros(Kpu_loc->scan_row_sizes());
-            Kpu_rem->set_nonzeros(Kpu_rem->scan_row_sizes());
-
-            Kup_loc->set_nonzeros(Kup_loc->scan_row_sizes());
-            Kup_rem->set_nonzeros(Kup_rem->scan_row_sizes());
-
-            // Fill subblocks of the system matrix.
-#pragma omp parallel for
-            for(ptrdiff_t i = 0; i < n; ++i) {
-                ptrdiff_t ci = idx[i];
-                char      pi = prm.pmask[i];
-
-                ptrdiff_t pp_loc_head = 0, pp_rem_head = 0;
-                ptrdiff_t uu_loc_head = 0, uu_rem_head = 0;
-                ptrdiff_t pu_loc_head = 0, pu_rem_head = 0;
-                ptrdiff_t up_loc_head = 0, up_rem_head = 0;
-
-                if(pi) {
-                    pp_loc_head = Kpp_loc->ptr[ci];
-                    pp_rem_head = Kpp_rem->ptr[ci];
-                    pu_loc_head = Kpu_loc->ptr[ci];
-                    pu_rem_head = Kpu_rem->ptr[ci];
-                } else {
-                    uu_loc_head = Kuu_loc->ptr[ci];
-                    uu_rem_head = Kuu_rem->ptr[ci];
-                    up_loc_head = Kup_loc->ptr[ci];
-                    up_rem_head = Kup_rem->ptr[ci];
-                }
-
-                for(auto a = row_begin(K_loc, i); a; ++a) {
-                    ptrdiff_t  j = a.col();
-                    value_type v = a.value();
-                    char      pj = prm.pmask[j];
-                    ptrdiff_t cj = idx[j];
-
-                    if (pi) {
-                        if (pj) {
-                            Kpp_loc->col[pp_loc_head] = cj;
-                            Kpp_loc->val[pp_loc_head] = v;
-                            ++pp_loc_head;
-                        } else {
-                            Kpu_loc->col[pu_loc_head] = cj;
-                            Kpu_loc->val[pu_loc_head] = v;
-                            ++pu_loc_head;
-                        }
-                    } else {
-                        if (pj) {
-                            Kup_loc->col[up_loc_head] = cj;
-                            Kup_loc->val[up_loc_head] = v;
-                            ++up_loc_head;
-                        } else {
-                            Kuu_loc->col[uu_loc_head] = cj;
-                            Kuu_loc->val[uu_loc_head] = v;
-                            ++uu_loc_head;
-                        }
-                    }
-                }
-
-                for(auto a = row_begin(K_rem, i); a; ++a) {
-                    ptrdiff_t  j = a.col();
-                    value_type v = a.value();
-                    char      pj = rmask[j];
-                    ptrdiff_t cj = r_idx[j];
-
-                    if (pi) {
-                        if (pj) {
-                            Kpp_rem->col[pp_rem_head] = cj;
-                            Kpp_rem->val[pp_rem_head] = v;
-                            ++pp_rem_head;
-                        } else {
-                            Kpu_rem->col[pu_rem_head] = cj;
-                            Kpu_rem->val[pu_rem_head] = v;
-                            ++pu_rem_head;
-                        }
-                    } else {
-                        if (pj) {
-                            Kup_rem->col[up_rem_head] = cj;
-                            Kup_rem->val[up_rem_head] = v;
-                            ++up_rem_head;
-                        } else {
-                            Kuu_rem->col[uu_rem_head] = cj;
-                            Kuu_rem->val[uu_rem_head] = v;
-                            ++uu_rem_head;
-                        }
-                    }
-                }
-            }
-
-            auto Kpp = std::make_shared<matrix>(comm, Kpp_loc, Kpp_rem);
-            auto Kuu = std::make_shared<matrix>(comm, Kuu_loc, Kuu_rem);
-
-            Kpu = make_shared<matrix>(comm, Kpu_loc, Kpu_rem);
-            Kup = make_shared<matrix>(comm, Kup_loc, Kup_rem);
-
-            Kpu->move_to_backend(bprm);
-            Kup->move_to_backend(bprm);
-            AMGCL_TOC("schur blocks");
-
-            AMGCL_TIC("usolver")
-            U = make_shared<USolver>(comm, Kuu, prm.usolver, bprm);
-            AMGCL_TOC("usolver")
-            AMGCL_TIC("psolver")
-            P = make_shared<PSolver>(comm, Kpp, prm.psolver, bprm);
-            AMGCL_TOC("psolver")
-
-            AMGCL_TIC("other");
-            rhs_u = backend_type::create_vector(nu, bprm);
-            rhs_p = backend_type::create_vector(np, bprm);
-
-            u = backend_type::create_vector(nu, bprm);
-            p = backend_type::create_vector(np, bprm);
-
-            tmp = backend_type::create_vector(nu, bprm);
-
-            if (prm.approx_schur) {
-                std::shared_ptr<backend::numa_vector<value_type>> Kuu_dia;
-                AMGCL_TIC("Kuu diagonal");
-                if (prm.simplec_dia) {
-                    Kuu_dia = std::make_shared<backend::numa_vector<value_type>>(nu, false);
-#pragma omp parallel
-                    for(ptrdiff_t i = 0; i < nu; ++i) {
-                        value_type s = math::zero<value_type>();
-                        for(ptrdiff_t j = Kuu_loc->ptr[i], e = Kuu_loc->ptr[i+1]; j < e; ++j) {
-                            s += math::norm(Kuu_loc->val[j]);
-                        }
-                        for(ptrdiff_t j = Kuu_rem->ptr[i], e = Kuu_rem->ptr[i+1]; j < e; ++j) {
-                            s += math::norm(Kuu_rem->val[j]);
-                        }
-                        (*Kuu_dia)[i] = math::inverse(s);
-                    }
-                } else {
-                    Kuu_dia = diagonal(*Kuu_loc, /*invert = */true);
-                }
-
-                M = backend_type::copy_vector(Kuu_dia, bprm);
-                AMGCL_TOC("Kuu diagonal");
-            }
-
-            // Scatter/Gather matrices
-            AMGCL_TIC("scatter/gather");
-            auto x2u = std::make_shared<build_matrix>();
-            auto x2p = std::make_shared<build_matrix>();
-            auto u2x = std::make_shared<build_matrix>();
-            auto p2x = std::make_shared<build_matrix>();
-
-            x2u->set_size(nu, n, true);
-            x2p->set_size(np, n, true);
-            u2x->set_size(n, nu, true);
-            p2x->set_size(n, np, true);
-
-            {
-                ptrdiff_t x2u_head = 0, x2u_idx = 0;
-                ptrdiff_t x2p_head = 0, x2p_idx = 0;
-                ptrdiff_t u2x_head = 0, u2x_idx = 0;
-                ptrdiff_t p2x_head = 0, p2x_idx = 0;
-
-                for(ptrdiff_t i = 0; i < n; ++i) {
-                    if (prm.pmask[i]) {
-                        x2p->ptr[++x2p_idx] = ++x2p_head;
-                        ++p2x_head;
-                    } else {
-                        x2u->ptr[++x2u_idx] = ++x2u_head;
-                        ++u2x_head;
-                    }
-
-                    p2x->ptr[++p2x_idx] = p2x_head;
-                    u2x->ptr[++u2x_idx] = u2x_head;
-                }
-            }
-
-            x2u->set_nonzeros();
-            x2p->set_nonzeros();
-            u2x->set_nonzeros();
-            p2x->set_nonzeros();
-
-            {
-                ptrdiff_t x2u_head = 0;
-                ptrdiff_t x2p_head = 0;
-                ptrdiff_t u2x_head = 0;
-                ptrdiff_t p2x_head = 0;
-
-                for(ptrdiff_t i = 0; i < n; ++i) {
-                    ptrdiff_t j = idx[i];
-
-                    if (prm.pmask[i]) {
-                        x2p->col[x2p_head] = i;
-                        x2p->val[x2p_head] = math::identity<value_type>();
-                        ++x2p_head;
-
-                        p2x->col[p2x_head] = j;
-                        p2x->val[p2x_head] = math::identity<value_type>();
-                        ++p2x_head;
-                    } else {
-                        x2u->col[x2u_head] = i;
-                        x2u->val[x2u_head] = math::identity<value_type>();
-                        ++x2u_head;
-
-                        u2x->col[u2x_head] = j;
-                        u2x->val[u2x_head] = math::identity<value_type>();
-                        ++u2x_head;
-                    }
-                }
-            }
-
-            this->x2u = backend_type::copy_matrix(x2u, bprm);
-            this->x2p = backend_type::copy_matrix(x2p, bprm);
-            this->u2x = backend_type::copy_matrix(u2x, bprm);
-            this->p2x = backend_type::copy_matrix(p2x, bprm);
-            AMGCL_TOC("scatter/gather");
-        }
-
-        std::shared_ptr<matrix> system_matrix_ptr() const {
-            return K;
-        }
-
-        const matrix& system_matrix() const {
-            return *K;
-        }
-
-        template <class Vec1, class Vec2>
-        void apply(const Vec1 &rhs, Vec2 &&x) const {
-            const auto one = math::identity<scalar_type>();
-            const auto zero = math::zero<scalar_type>();
-
-            AMGCL_TIC("split variables");
-            backend::spmv(one, *x2u, rhs, zero, *rhs_u);
-            backend::spmv(one, *x2p, rhs, zero, *rhs_p);
-            AMGCL_TOC("split variables");
-
-            if (prm.type == 1) {
-                // Ai u = rhs_u
-                AMGCL_TIC("solve U");
-                backend::clear(*u);
-                report("U1", (*U)(*rhs_u, *u));
-                AMGCL_TOC("solve U");
-
-                // rhs_p -= Kpu u
-                AMGCL_TIC("solve P");
-                backend::spmv(-one, *Kpu, *u, one, *rhs_p);
-
-                // S p = rhs_p
-                backend::clear(*p);
-                report("P", (*P)(*this, *rhs_p, *p));
-                AMGCL_TOC("solve P");
-
-                // rhs_u -= Kup p
-                AMGCL_TIC("Update U");
-                backend::spmv(-one, *Kup, *p, one, *rhs_u);
-
-                // Ai u = rhs_u
-                backend::clear(*u);
-                report("U2", (*U)(*rhs_u, *u));
-                AMGCL_TOC("Update U");
-            } else if (prm.type == 2) {
-                // S p = rhs_p
-                AMGCL_TIC("solve P");
-                backend::clear(*p);
-                report("P", (*P)(*this, *rhs_p, *p));
-                AMGCL_TOC("solve P");
-
-                // Ai u = fu - Kup p
-                AMGCL_TIC("solve U");
-                backend::spmv(-one, *Kup, *p, one, *rhs_u);
-                backend::clear(*u);
-                report("U", (*U)(*rhs_u, *u));
-                AMGCL_TOC("solve U");
-            }
-
-            AMGCL_TIC("merge variables");
-            backend::spmv(one, *u2x, *u, zero, x);
-            backend::spmv(one, *p2x, *p, one, x);
-            AMGCL_TOC("merge variables");
-        }
-
-        template <class Alpha, class Vec1, class Beta, class Vec2>
-        void spmv(Alpha alpha, const Vec1 &x, Beta beta, Vec2 &y) const {
-            const auto one = math::identity<scalar_type>();
-            const auto zero = math::zero<scalar_type>();
-
-            // y = beta y + alpha S x, where S = Kpp - Kpu Kuu^-1 Kup
-            AMGCL_TIC("matrix-free spmv");
-            backend::spmv(alpha, P->system_matrix(), x, beta, y);
-
-            backend::spmv(one, *Kup, x, zero, *tmp);
-
-            if (prm.approx_schur) {
-                backend::vmul(one, *M, *tmp, zero, *u);
-            } else {
-                backend::clear(*u);
-                (*U)(*tmp, *u);
-            }
-            backend::spmv(-alpha, *Kpu, *u, one, y);
-            AMGCL_TOC("matrix-free spmv");
-        }
-    private:
-        typedef comm_pattern<backend_type> CommPattern;
-        communicator comm;
-
-        std::shared_ptr<bmatrix>  x2p, x2u, p2x, u2x;
-        std::shared_ptr<matrix> K, Kpu, Kup;
-        std::shared_ptr<vector>  rhs_u, rhs_p, u, p, tmp;
-        std::shared_ptr<typename backend_type::matrix_diagonal> M;
-
-        std::shared_ptr<USolver> U;
-        std::shared_ptr<PSolver> P;
-
-#ifdef AMGCL_DEBUG
-        template <typename I, typename E>
-        void report(const std::string &name, const std::tuple<I, E> &c) const {
-            if (comm.rank == 0 && prm.report >= 1) {
-                std::cout << name << " (" << std::get<0>(c) << ", " << std::get<1>(c) << ")\n";
-            }
-        }
-#else
-        template <typename I, typename E>
-        void report(const std::string&, const std::tuple<I, E>&) const {
-        }
-#endif
-
-};
-
-} // namespace mpi
-
-namespace backend {
-
-template <class US, class PS, class Alpha, class Beta, class Vec1, class Vec2>
-struct spmv_impl< Alpha, mpi::schur_pressure_correction<US, PS>, Vec1, Beta, Vec2>
-{
-    static void apply(Alpha alpha, const mpi::schur_pressure_correction<US, PS> &A, const Vec1 &x, Beta beta, Vec2 &y)
-    {
-        A.spmv(alpha, x, beta, y);
-    }
-};
-
-template <class US, class PS, class Vec1, class Vec2, class Vec3>
-struct residual_impl< mpi::schur_pressure_correction<US, PS>, Vec1, Vec2, Vec3>
-{
-    static void apply(const Vec1 &rhs, const mpi::schur_pressure_correction<US, PS> &A, const Vec2 &x, Vec3 &r)
-    {
-        backend::copy(rhs, r);
-        A.spmv(-1, x, 1, r);
-    }
-};
-
-} // namespace backend
-} // namespace amgcl
-
-
-#endif
diff --git a/src/solvers/amgcl/mpi/solver/bicgstab.hpp b/src/solvers/amgcl/mpi/solver/bicgstab.hpp
deleted file mode 100644
index 5fed3eb..0000000
--- a/src/solvers/amgcl/mpi/solver/bicgstab.hpp
+++ /dev/null
@@ -1,52 +0,0 @@
-#ifndef AMGCL_MPI_SOLVER_BICGSTAB_HPP
-#define AMGCL_MPI_SOLVER_BICGSTAB_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/mpi/solver/bicgstab.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  MPI wrapper for BiCGStab iterative method.
- */
-
-#include <amgcl/solver/bicgstab.hpp>
-#include <amgcl/mpi/inner_product.hpp>
-
-namespace amgcl {
-namespace mpi {
-namespace solver {
-
-template <class Backend, class InnerProduct = mpi::inner_product>
-class bicgstab : public amgcl::solver::bicgstab<Backend, InnerProduct> {
-    typedef amgcl::solver::bicgstab<Backend, InnerProduct> Base;
-    public:
-        using Base::Base;
-};
-
-} // namespace solver
-} // namespace mpi
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/mpi/solver/bicgstabl.hpp b/src/solvers/amgcl/mpi/solver/bicgstabl.hpp
deleted file mode 100644
index 920afd6..0000000
--- a/src/solvers/amgcl/mpi/solver/bicgstabl.hpp
+++ /dev/null
@@ -1,53 +0,0 @@
-#ifndef AMGCL_MPI_SOLVER_BICGSTABL_HPP
-#define AMGCL_MPI_SOLVER_BICGSTABL_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/mpi/solver/bicgstabl.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  MPI wrapper for BiCGStab(L) iterative method.
- */
-
-#include <amgcl/solver/bicgstabl.hpp>
-#include <amgcl/mpi/inner_product.hpp>
-
-namespace amgcl {
-namespace mpi {
-namespace solver {
-
-template <class Backend, class InnerProduct = mpi::inner_product>
-class bicgstabl : public amgcl::solver::bicgstabl<Backend, InnerProduct> {
-    typedef amgcl::solver::bicgstabl<Backend, InnerProduct> Base;
-    public:
-        using Base::Base;
-};
-
-} // namespace solver
-} // namespace mpi
-} // namespace amgcl
-
-
-#endif
diff --git a/src/solvers/amgcl/mpi/solver/cg.hpp b/src/solvers/amgcl/mpi/solver/cg.hpp
deleted file mode 100644
index d628dc4..0000000
--- a/src/solvers/amgcl/mpi/solver/cg.hpp
+++ /dev/null
@@ -1,53 +0,0 @@
-#ifndef AMGCL_MPI_SOLVER_CG_HPP
-#define AMGCL_MPI_SOLVER_CG_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/mpi/solver/cg.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  MPI wrapper for CG iterative method.
- */
-
-#include <amgcl/solver/cg.hpp>
-#include <amgcl/mpi/inner_product.hpp>
-
-namespace amgcl {
-namespace mpi {
-namespace solver {
-
-template <class Backend, class InnerProduct = mpi::inner_product>
-class cg : public amgcl::solver::cg<Backend, InnerProduct> {
-    typedef amgcl::solver::cg<Backend, InnerProduct> Base;
-    public:
-        using Base::Base;
-};
-
-} // namespace solver
-} // namespace mpi
-} // namespace amgcl
-
-
-#endif
diff --git a/src/solvers/amgcl/mpi/solver/fgmres.hpp b/src/solvers/amgcl/mpi/solver/fgmres.hpp
deleted file mode 100644
index 727997f..0000000
--- a/src/solvers/amgcl/mpi/solver/fgmres.hpp
+++ /dev/null
@@ -1,53 +0,0 @@
-#ifndef AMGCL_MPI_SOLVER_FGMRES_HPP
-#define AMGCL_MPI_SOLVER_FGMRES_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/mpi/solver/fgmres.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  MPI wrapper for FGMRES iterative method.
- */
-
-#include <amgcl/solver/fgmres.hpp>
-#include <amgcl/mpi/inner_product.hpp>
-
-namespace amgcl {
-namespace mpi {
-namespace solver {
-
-template <class Backend, class InnerProduct = mpi::inner_product>
-class fgmres : public amgcl::solver::fgmres<Backend, InnerProduct> {
-    typedef amgcl::solver::fgmres<Backend, InnerProduct> Base;
-    public:
-        using Base::Base;
-};
-
-} // namespace solver
-} // namespace mpi
-} // namespace amgcl
-
-
-#endif
diff --git a/src/solvers/amgcl/mpi/solver/gmres.hpp b/src/solvers/amgcl/mpi/solver/gmres.hpp
deleted file mode 100644
index af51355..0000000
--- a/src/solvers/amgcl/mpi/solver/gmres.hpp
+++ /dev/null
@@ -1,53 +0,0 @@
-#ifndef AMGCL_MPI_SOLVER_GMRES_HPP
-#define AMGCL_MPI_SOLVER_GMRES_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/mpi/solver/gmres.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  MPI wrapper for GMRES iterative method.
- */
-
-#include <amgcl/solver/gmres.hpp>
-#include <amgcl/mpi/inner_product.hpp>
-
-namespace amgcl {
-namespace mpi {
-namespace solver {
-
-template <class Backend, class InnerProduct = mpi::inner_product>
-class gmres : public amgcl::solver::gmres<Backend, InnerProduct> {
-    typedef amgcl::solver::gmres<Backend, InnerProduct> Base;
-    public:
-        using Base::Base;
-};
-
-} // namespace solver
-} // namespace mpi
-} // namespace amgcl
-
-
-#endif
diff --git a/src/solvers/amgcl/mpi/solver/idrs.hpp b/src/solvers/amgcl/mpi/solver/idrs.hpp
deleted file mode 100644
index 2fa329c..0000000
--- a/src/solvers/amgcl/mpi/solver/idrs.hpp
+++ /dev/null
@@ -1,53 +0,0 @@
-#ifndef AMGCL_MPI_SOLVER_IDRS_HPP
-#define AMGCL_MPI_SOLVER_IDRS_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/mpi/solver/idrs.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  MPI wrapper for IDR(s) iterative method.
- */
-
-#include <amgcl/solver/idrs.hpp>
-#include <amgcl/mpi/inner_product.hpp>
-
-namespace amgcl {
-namespace mpi {
-namespace solver {
-
-template <class Backend, class InnerProduct = mpi::inner_product>
-class idrs : public amgcl::solver::idrs<Backend, InnerProduct> {
-    typedef amgcl::solver::idrs<Backend, InnerProduct> Base;
-    public:
-        using Base::Base;
-};
-
-} // namespace solver
-} // namespace mpi
-} // namespace amgcl
-
-
-#endif
diff --git a/src/solvers/amgcl/mpi/solver/lgmres.hpp b/src/solvers/amgcl/mpi/solver/lgmres.hpp
deleted file mode 100644
index ba593ad..0000000
--- a/src/solvers/amgcl/mpi/solver/lgmres.hpp
+++ /dev/null
@@ -1,53 +0,0 @@
-#ifndef AMGCL_MPI_SOLVER_LGMRES_HPP
-#define AMGCL_MPI_SOLVER_LGMRES_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/mpi/solver/lgmres.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  MPI wrapper for LGMRES iterative method.
- */
-
-#include <amgcl/solver/lgmres.hpp>
-#include <amgcl/mpi/inner_product.hpp>
-
-namespace amgcl {
-namespace mpi {
-namespace solver {
-
-template <class Backend, class InnerProduct = mpi::inner_product>
-class lgmres : public amgcl::solver::lgmres<Backend, InnerProduct> {
-    typedef amgcl::solver::lgmres<Backend, InnerProduct> Base;
-    public:
-        using Base::Base;
-};
-
-} // namespace solver
-} // namespace mpi
-} // namespace amgcl
-
-
-#endif
diff --git a/src/solvers/amgcl/mpi/solver/preonly.hpp b/src/solvers/amgcl/mpi/solver/preonly.hpp
deleted file mode 100644
index 22c3f70..0000000
--- a/src/solvers/amgcl/mpi/solver/preonly.hpp
+++ /dev/null
@@ -1,52 +0,0 @@
-#ifndef AMGCL_MPI_SOLVER_PREONLY_HPP
-#define AMGCL_MPI_SOLVER_PREONLY_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/mpi/solver/preonly.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  MPI wrapper for the PreOnly iterative method.
- */
-
-#include <amgcl/solver/preonly.hpp>
-#include <amgcl/mpi/inner_product.hpp>
-
-namespace amgcl {
-namespace mpi {
-namespace solver {
-
-template <class Backend, class InnerProduct = mpi::inner_product>
-class preonly : public amgcl::solver::preonly<Backend, InnerProduct> {
-    typedef amgcl::solver::preonly<Backend, InnerProduct> Base;
-    public:
-        using Base::Base;
-};
-
-} // namespace solver
-} // namespace mpi
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/mpi/solver/richardson.hpp b/src/solvers/amgcl/mpi/solver/richardson.hpp
deleted file mode 100644
index cefa1ab..0000000
--- a/src/solvers/amgcl/mpi/solver/richardson.hpp
+++ /dev/null
@@ -1,53 +0,0 @@
-#ifndef AMGCL_MPI_SOLVER_RICHARDSON_HPP
-#define AMGCL_MPI_SOLVER_RICHARDSON_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/mpi/solver/richardson.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  MPI wrapper for Richardson iteration.
- */
-
-#include <amgcl/solver/richardson.hpp>
-#include <amgcl/mpi/inner_product.hpp>
-
-namespace amgcl {
-namespace mpi {
-namespace solver {
-
-template <class Backend, class InnerProduct = mpi::inner_product>
-class richardson : public amgcl::solver::richardson<Backend, InnerProduct> {
-    typedef amgcl::solver::richardson<Backend, InnerProduct> Base;
-    public:
-        using Base::Base;
-};
-
-} // namespace solver
-} // namespace mpi
-} // namespace amgcl
-
-
-#endif
diff --git a/src/solvers/amgcl/mpi/solver/runtime.hpp b/src/solvers/amgcl/mpi/solver/runtime.hpp
deleted file mode 100644
index dcc124c..0000000
--- a/src/solvers/amgcl/mpi/solver/runtime.hpp
+++ /dev/null
@@ -1,53 +0,0 @@
-#ifndef AMGCL_MPI_SOLVER_RUNTIME_HPP
-#define AMGCL_MPI_SOLVER_RUNTIME_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/mpi/solver/runtime.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Runtime-configurable MPI wrapper around amgcl iterative solvers.
- */
-
-#include <amgcl/solver/runtime.hpp>
-#include <amgcl/mpi/inner_product.hpp>
-
-namespace amgcl {
-namespace runtime { 
-namespace mpi {
-namespace solver {
-
-template <class Backend, class InnerProduct = amgcl::mpi::inner_product>
-struct wrapper : public amgcl::runtime::solver::wrapper<Backend, InnerProduct> {
-    typedef amgcl::runtime::solver::wrapper<Backend, InnerProduct> Base;
-    using Base::Base;
-};
-
-} // namespace solver
-} // namespace mpi
-} // namespace runtime
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/mpi/subdomain_deflation.hpp b/src/solvers/amgcl/mpi/subdomain_deflation.hpp
deleted file mode 100644
index 09ba26a..0000000
--- a/src/solvers/amgcl/mpi/subdomain_deflation.hpp
+++ /dev/null
@@ -1,610 +0,0 @@
-#ifndef AMGCL_MPI_SUBDOMAIN_DEFLATION_HPP
-#define AMGCL_MPI_SUBDOMAIN_DEFLATION_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-Copyright (c) 2014-2015, Riccardo Rossi, CIMNE (International Center for Numerical Methods in Engineering)
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/mpi/subdomain_deflatedion.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Distributed solver based on subdomain deflation.
- */
-
-#include <vector>
-#include <algorithm>
-#include <numeric>
-#include <memory>
-#include <functional>
-
-#include <mpi.h>
-
-#include <amgcl/backend/builtin.hpp>
-#include <amgcl/adapter/crs_tuple.hpp>
-#include <amgcl/mpi/util.hpp>
-#include <amgcl/mpi/direct_solver/skyline_lu.hpp>
-#include <amgcl/mpi/inner_product.hpp>
-#include <amgcl/mpi/distributed_matrix.hpp>
-
-namespace amgcl {
-namespace mpi {
-
-/// Pointwise constant deflation vectors.
-struct constant_deflation {
-    const int block_size;
-    /// Constructor
-    /**
-     * \param block_size Number of degrees of freedom per grid point
-     */
-    constant_deflation(int block_size = 1) : block_size(block_size) {}
-
-    int dim() const {
-        return block_size;
-    }
-
-    int operator()(ptrdiff_t row, int j) const {
-        return row % block_size == j;
-    }
-};
-
-template <class SDD, class Matrix>
-struct sdd_projected_matrix {
-    typedef typename SDD::value_type value_type;
-
-    const SDD    &S;
-    const Matrix &A;
-
-    sdd_projected_matrix(const SDD &S, const Matrix &A) : S(S), A(A) {}
-
-    template <class T, class Vec1, class Vec2>
-    void mul(T alpha, const Vec1 &x, T beta, Vec2 &y) const {
-        AMGCL_TIC("top/spmv");
-        backend::spmv(alpha, A, x, beta, y);
-        AMGCL_TOC("top/spmv");
-
-        S.project(y);
-    }
-
-    template <class Vec1, class Vec2, class Vec3>
-    void residual(const Vec1 &f, const Vec2 &x, Vec3 &r) const {
-        AMGCL_TIC("top/residual");
-        backend::residual(f, A, x, r);
-        AMGCL_TOC("top/residual");
-
-        S.project(r);
-    }
-};
-
-template <class SDD, class Matrix>
-sdd_projected_matrix<SDD, Matrix> make_sdd_projected_matrix(const SDD &S, const Matrix &A) {
-    return sdd_projected_matrix<SDD, Matrix>(S, A);
-}
-
-/// Distributed solver based on subdomain deflation.
-/**
- * \sa \cite Frank2001
- */
-template <
-    class LocalPrecond,
-    class IterativeSolver,
-    class DirectSolver = mpi::direct::skyline_lu<typename LocalPrecond::backend_type::value_type>
-    >
-class subdomain_deflation {
-    public:
-        typedef typename LocalPrecond::backend_type backend_type;
-        typedef typename backend_type::params backend_params;
-
-        struct params {
-            typename LocalPrecond::params local;
-            typename IterativeSolver::params isolver;
-            typename DirectSolver::params dsolver;
-
-            // Number of deflation vectors.
-            unsigned num_def_vec;
-
-            // Value of deflation vector at the given row and column.
-            std::function<double(ptrdiff_t, unsigned)> def_vec;
-
-            params() {}
-
-#ifndef AMGCL_NO_BOOST
-            params(const boost::property_tree::ptree &p)
-                : AMGCL_PARAMS_IMPORT_CHILD(p, local),
-                  AMGCL_PARAMS_IMPORT_CHILD(p, isolver),
-                  AMGCL_PARAMS_IMPORT_CHILD(p, dsolver),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, num_def_vec)
-            {
-                void *ptr = 0;
-                ptr = p.get("def_vec", ptr);
-
-                amgcl::precondition(ptr,
-                        "Error in subdomain_deflation parameters: "
-                        "def_vec is not set");
-
-                def_vec = *static_cast<std::function<double(ptrdiff_t, unsigned)>*>(ptr);
-
-                check_params(p, {"local", "isolver", "dsolver", "num_def_vec", "def_vec"});
-            }
-
-            void get(boost::property_tree::ptree &p, const std::string &path) const {
-                AMGCL_PARAMS_EXPORT_CHILD(p, path, local);
-                AMGCL_PARAMS_EXPORT_CHILD(p, path, isolver);
-                AMGCL_PARAMS_EXPORT_CHILD(p, path, dsolver);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, num_def_vec);
-            }
-#endif
-        };
-
-        typedef typename backend_type::value_type value_type;
-        typedef typename math::scalar_of<value_type>::type scalar_type;
-        typedef typename backend_type::matrix     bmatrix;
-        typedef typename backend_type::vector     vector;
-        typedef distributed_matrix<backend_type>  matrix;
-
-
-        template <class Matrix>
-        subdomain_deflation(
-                communicator comm,
-                const Matrix &Astrip,
-                const params &prm = params(),
-                const backend_params &bprm = backend_params()
-                )
-        : comm(comm),
-          nrows(backend::rows(Astrip)), ndv(prm.num_def_vec),
-          dtype( datatype<value_type>() ), dv_start(comm.size + 1, 0),
-          Z( ndv ), q( backend_type::create_vector(nrows, bprm) ),
-          S(nrows, prm.isolver, bprm, mpi::inner_product(comm))
-        {
-            A = std::make_shared<matrix>(comm, Astrip, nrows);
-            init(prm, bprm);
-        }
-
-        subdomain_deflation(
-                communicator comm,
-                std::shared_ptr<matrix> A,
-                const params &prm = params(),
-                const backend_params &bprm = backend_params()
-                )
-        : comm(comm),
-          nrows(A->loc_rows()), ndv(prm.num_def_vec),
-          dtype( datatype<value_type>() ), A(A), dv_start(comm.size + 1, 0),
-          Z( ndv ), q( backend_type::create_vector(nrows, bprm) ),
-          S(nrows, prm.isolver, bprm, mpi::inner_product(comm))
-        {
-            init(prm, bprm);
-        }
-
-        void init(
-                const params &prm = params(),
-                const backend_params &bprm = backend_params()
-                )
-        {
-            AMGCL_TIC("setup deflation");
-            typedef backend::crs<value_type, ptrdiff_t>                build_matrix;
-
-            // Lets see how many deflation vectors are there.
-            std::vector<ptrdiff_t> dv_size(comm.size);
-            MPI_Allgather(&ndv, 1, datatype<ptrdiff_t>(), &dv_size[0], 1, datatype<ptrdiff_t>(), comm);
-
-            std::partial_sum(dv_size.begin(), dv_size.end(), dv_start.begin() + 1);
-            nz = dv_start.back();
-
-            df.resize(ndv);
-            dx.resize(ndv);
-            dd = backend_type::create_vector(ndv, bprm);
-
-            auto az_loc = std::make_shared<build_matrix>();
-            auto az_rem = std::make_shared<build_matrix>();
-
-            auto a_loc = A->local();
-            auto a_rem = A->remote();
-
-            const comm_pattern<backend_type> &Acp = A->cpat();
-
-            // Fill deflation vectors.
-            AMGCL_TIC("copy deflation vectors");
-            {
-                std::vector<value_type> z(nrows);
-                for(int j = 0; j < ndv; ++j) {
-#pragma omp parallel for
-                    for(ptrdiff_t i = 0; i < nrows; ++i)
-                        z[i] = prm.def_vec(i, j);
-                    Z[j] = backend_type::copy_vector(z, bprm);
-                }
-            }
-            AMGCL_TOC("copy deflation vectors");
-
-            AMGCL_TIC("first pass");
-            az_loc->set_size(nrows, ndv, true);
-            az_loc->set_nonzeros(nrows * dv_size[comm.rank]);
-            az_rem->set_size(nrows, 0, true);
-            // 1. Build local part of AZ matrix.
-            // 2. Count remote nonzeros
-#pragma omp parallel
-            {
-                std::vector<ptrdiff_t> marker(Acp.recv.nbr.size(), -1);
-
-#pragma omp for
-                for(ptrdiff_t i = 0; i < nrows; ++i) {
-                    ptrdiff_t az_loc_head = i * ndv;
-                    az_loc->ptr[i+1] = az_loc_head + ndv;
-
-                    for(ptrdiff_t j = 0; j < ndv; ++j) {
-                        az_loc->col[az_loc_head + j] = j;
-                        az_loc->val[az_loc_head + j] = math::zero<value_type>();
-                    }
-
-                    for(ptrdiff_t j = a_loc->ptr[i], e = a_loc->ptr[i+1]; j < e; ++j) {
-                        ptrdiff_t  c = a_loc->col[j];
-                        value_type v = a_loc->val[j];
-
-                        for(ptrdiff_t j = 0; j < ndv; ++j)
-                            az_loc->val[az_loc_head + j] += v * prm.def_vec(c, j);
-                    }
-
-                    for(ptrdiff_t j = a_rem->ptr[i], e = a_rem->ptr[i+1]; j < e; ++j) {
-                        int d = Acp.domain(a_rem->col[j]);
-
-                        if (marker[d] != i) {
-                            marker[d] = i;
-                            az_rem->ptr[i+1] += dv_size[d];
-                        }
-                    }
-                }
-            }
-            az_rem->set_nonzeros(az_rem->scan_row_sizes());
-            AMGCL_TOC("first pass");
-
-            // Create local preconditioner.
-            AMGCL_TIC("local preconditioner");
-            P = std::make_shared<LocalPrecond>( *a_loc, prm.local, bprm );
-            AMGCL_TOC("local preconditioner");
-
-            A->set_local(P->system_matrix_ptr());
-            A->move_to_backend(bprm);
-
-            AMGCL_TIC("remote(A*Z)");
-            /* Construct remote part of AZ */
-            // Exchange deflation vectors
-            std::vector<ptrdiff_t> zrecv_ptr(Acp.recv.nbr.size() + 1, 0);
-            std::vector<ptrdiff_t> zcol_ptr;
-            zcol_ptr.reserve(Acp.recv.count() + 1);
-            zcol_ptr.push_back(0);
-
-            for(size_t i = 0; i < Acp.recv.nbr.size(); ++i) {
-                ptrdiff_t ncols = Acp.recv.ptr[i + 1] - Acp.recv.ptr[i];
-                ptrdiff_t nvecs = dv_size[Acp.recv.nbr[i]];
-                ptrdiff_t size = nvecs * ncols;
-                zrecv_ptr[i + 1] = zrecv_ptr[i] + size;
-
-                for(ptrdiff_t j = 0; j < ncols; ++j)
-                    zcol_ptr.push_back(zcol_ptr.back() + nvecs);
-            }
-
-            std::vector<value_type> zrecv(zrecv_ptr.back());
-            std::vector<value_type> zsend(Acp.send.count() * ndv);
-
-            for(size_t i = 0; i < Acp.recv.nbr.size(); ++i) {
-                ptrdiff_t begin = zrecv_ptr[i];
-                ptrdiff_t size  = zrecv_ptr[i + 1] - begin;
-
-                MPI_Irecv(&zrecv[begin], size, dtype, Acp.recv.nbr[i],
-                        tag_exc_vals, comm, &Acp.recv.req[i]);
-            }
-
-            for(size_t i = 0, k = 0; i < Acp.send.count(); ++i)
-                for(ptrdiff_t j = 0; j < ndv; ++j, ++k)
-                    zsend[k] = prm.def_vec(Acp.send.col[i], j);
-
-            for(size_t i = 0; i < Acp.send.nbr.size(); ++i)
-                MPI_Isend(
-                        &zsend[ndv * Acp.send.ptr[i]], ndv * (Acp.send.ptr[i+1] - Acp.send.ptr[i]),
-                        dtype, Acp.send.nbr[i], tag_exc_vals, comm, &Acp.send.req[i]);
-
-            MPI_Waitall(Acp.recv.req.size(), &Acp.recv.req[0], MPI_STATUSES_IGNORE);
-            MPI_Waitall(Acp.send.req.size(), &Acp.send.req[0], MPI_STATUSES_IGNORE);
-
-#pragma omp parallel
-            {
-                std::vector<ptrdiff_t> marker(nz, -1);
-
-                // AZ_rem = Arem * Z
-#pragma omp for
-                for(ptrdiff_t i = 0; i < nrows; ++i) {
-                    ptrdiff_t az_rem_head = az_rem->ptr[i];
-                    ptrdiff_t az_rem_tail = az_rem_head;
-
-                    for(auto a = backend::row_begin(*a_rem, i); a; ++a) {
-                        ptrdiff_t  c = a.col();
-                        value_type v = a.value();
-
-                        // Domain the column belongs to
-                        ptrdiff_t d = Acp.recv.nbr[
-                            std::upper_bound(Acp.recv.ptr.begin(), Acp.recv.ptr.end(), c) -
-                                Acp.recv.ptr.begin() - 1];
-
-                        value_type *zval = &zrecv[ zcol_ptr[c] ];
-                        for(ptrdiff_t j = 0, k = dv_start[d]; j < dv_size[d]; ++j, ++k) {
-                            if (marker[k] < az_rem_head) {
-                                marker[k] = az_rem_tail;
-                                az_rem->col[az_rem_tail] = k;
-                                az_rem->val[az_rem_tail] = v * zval[j];
-                                ++az_rem_tail;
-                            } else {
-                                az_rem->val[marker[k]] += v * zval[j];
-                            }
-                        }
-                    }
-                }
-            }
-            AMGCL_TOC("remote(A*Z)");
-
-            /* Build solver for the deflated matrix E. */
-            AMGCL_TIC("assemble E");
-
-            // Count nonzeros in E.
-            std::vector<int> nbrs; // processes we are talking to
-            nbrs.reserve(1 + Acp.send.nbr.size() + Acp.recv.nbr.size());
-            std::set_union(
-                    Acp.send.nbr.begin(), Acp.send.nbr.end(),
-                    Acp.recv.nbr.begin(), Acp.recv.nbr.end(),
-                    std::back_inserter(nbrs));
-            nbrs.push_back(comm.rank);
-
-            build_matrix E;
-            E.set_size(ndv, nz, false);
-
-            {
-                ptrdiff_t nnz = 0;
-                for(int j : nbrs) nnz += dv_size[j];
-                for(int k = 0; k <= ndv; ++k)
-                    E.ptr[k] = k * nnz;
-            }
-            E.set_nonzeros(E.nnz = E.ptr[ndv]);
-
-            // Build local strip of E.
-#ifdef _OPENMP
-            int nthreads = omp_get_max_threads();
-#else
-            int nthreads = 1;
-#endif
-            multi_array<value_type, 3> erow(nthreads, ndv, nz);
-            std::fill_n(erow.data(), erow.size(), 0);
-
-            {
-                ptrdiff_t dv_offset = dv_start[comm.rank];
-#pragma omp parallel
-                {
-#ifdef _OPENMP
-                    const int tid = omp_get_thread_num();
-#else
-                    const int tid = 0;
-#endif
-                    std::vector<value_type> z(ndv);
-
-#pragma omp for
-                    for(ptrdiff_t i = 0; i < nrows; ++i) {
-                        for(ptrdiff_t j = 0; j < ndv; ++j)
-                            z[j] = prm.def_vec(i,j);
-
-                        for(ptrdiff_t k = az_loc->ptr[i], e = az_loc->ptr[i+1]; k < e; ++k) {
-                            ptrdiff_t  c = az_loc->col[k] + dv_offset;
-                            value_type v = az_loc->val[k];
-
-                            for(ptrdiff_t j = 0; j < ndv; ++j)
-                                erow(tid, j, c) += v * z[j];
-                        }
-
-                        for(ptrdiff_t k = az_rem->ptr[i], e = az_rem->ptr[i+1]; k < e; ++k) {
-                            ptrdiff_t  c = az_rem->col[k];
-                            value_type v = az_rem->val[k];
-
-                            for(ptrdiff_t j = 0; j < ndv; ++j)
-                                erow(tid, j, c) += v * z[j];
-                        }
-                    }
-                }
-            }
-
-            for(int i = 0; i < ndv; ++i) {
-                int row_head = E.ptr[i];
-                for(int j : nbrs) {
-                    for(int k = 0; k < dv_size[j]; ++k) {
-                        int c = dv_start[j] + k;
-                        value_type v = math::zero<value_type>();
-                        for(int t = 0; t < nthreads; ++t)
-                            v += erow(t, i, c);
-
-                        E.col[row_head] = c;
-                        E.val[row_head] = v;
-
-                        ++row_head;
-                    }
-                }
-            }
-            AMGCL_TOC("assemble E");
-
-            AMGCL_TIC("factorize E");
-            this->E = std::make_shared<DirectSolver>(comm, E, prm.dsolver);
-            AMGCL_TOC("factorize E");
-
-            AMGCL_TIC("finish(A*Z)");
-            AZ = std::make_shared<matrix>(comm, az_loc, az_rem);
-            AZ->move_to_backend(bprm);
-            AMGCL_TOC("finish(A*Z)");
-            AMGCL_TOC("setup deflation");
-        }
-
-        template <class Vec1, class Vec2>
-        void apply(const Vec1 &rhs, Vec2 &&x) const {
-            size_t iters;
-            double error;
-            backend::clear(x);
-            std::tie(iters, error) = (*this)(rhs, x);
-        }
-
-        std::shared_ptr<matrix> system_matrix_ptr() const {
-            return A;
-        }
-
-        const matrix& system_matrix() const {
-            return *A;
-        }
-
-        template <class Matrix, class Vec1, class Vec2>
-        std::tuple<size_t, value_type> operator()(
-                const Matrix &A, const Vec1 &rhs, Vec2 &&x) const
-        {
-            std::tuple<size_t, value_type> cnv = S(make_sdd_projected_matrix(*this, A), *P, rhs, x);
-            postprocess(rhs, x);
-            return cnv;
-        }
-
-        template <class Vec1, class Vec2>
-        std::tuple<size_t, value_type>
-        operator()(const Vec1 &rhs, Vec2 &&x) const {
-            std::tuple<size_t, value_type> cnv = S(make_sdd_projected_matrix(*this, *A), *P, rhs, x);
-            postprocess(rhs, x);
-            return cnv;
-        }
-
-        size_t size() const {
-            return nrows;
-        }
-
-        template <class Vector>
-        void project(Vector &x) const {
-            const auto one = math::identity<scalar_type>();
-
-            AMGCL_TIC("project");
-
-            AMGCL_TIC("local inner product");
-            for(ptrdiff_t j = 0; j < ndv; ++j)
-                df[j] = backend::inner_product(x, *Z[j]);
-            AMGCL_TOC("local inner product");
-
-            coarse_solve(df, dx);
-
-            AMGCL_TIC("spmv");
-            backend::copy(dx, *dd);
-            backend::spmv(-one, *AZ, *dd, one, x);
-            AMGCL_TOC("spmv");
-
-            AMGCL_TOC("project");
-        }
-    private:
-        static const int tag_exc_vals = 2011;
-        static const int tag_exc_dmat = 3011;
-        static const int tag_exc_dvec = 4011;
-        static const int tag_exc_lnnz = 5011;
-
-        communicator comm;
-        ptrdiff_t nrows, ndv, nz;
-
-        MPI_Datatype dtype;
-
-        std::shared_ptr<matrix> A, AZ;
-        std::shared_ptr<LocalPrecond> P;
-
-        mutable std::vector<value_type> df, dx;
-        std::vector<ptrdiff_t> dv_start;
-
-        std::vector< std::shared_ptr<vector> > Z;
-
-        std::shared_ptr<DirectSolver> E;
-
-        std::shared_ptr<vector> q;
-        std::shared_ptr<vector> dd;
-
-        IterativeSolver S;
-
-        void coarse_solve(std::vector<value_type> &f, std::vector<value_type> &x) const
-        {
-            AMGCL_TIC("coarse solve");
-            (*E)(f, x);
-            AMGCL_TOC("coarse solve");
-        }
-
-        template <class Vec1, class Vec2>
-        void postprocess(const Vec1 &rhs, Vec2 &x) const {
-            const auto one = math::identity<scalar_type>();
-
-            AMGCL_TIC("postprocess");
-
-            // q = rhs - Ax
-            backend::copy(rhs, *q);
-            backend::spmv(-one, *A, x, one, *q);
-
-            // df = transp(Z) * (rhs - Ax)
-            AMGCL_TIC("local inner product");
-            for(ptrdiff_t j = 0; j < ndv; ++j)
-                df[j] = backend::inner_product(*q, *Z[j]);
-            AMGCL_TOC("local inner product");
-
-            // dx = inv(E) * df
-            coarse_solve(df, dx);
-
-            // x += Z * dx
-            backend::lin_comb(ndv, dx, Z, one, x);
-
-            AMGCL_TOC("postprocess");
-        }
-
-};
-
-} // namespace mpi
-
-namespace backend {
-
-template <
-    class SDD, class Matrix,
-    class Alpha, class Beta, class Vec1, class Vec2
-    >
-struct spmv_impl<
-    Alpha, mpi::sdd_projected_matrix<SDD, Matrix>, Vec1, Beta, Vec2
-    >
-{
-    typedef mpi::sdd_projected_matrix<SDD, Matrix> M;
-
-    static void apply(Alpha alpha, const M &A, const Vec1 &x, Beta beta, Vec2 &y)
-    {
-        A.mul(alpha, x, beta, y);
-    }
-};
-
-template <class SDD, class Matrix, class Vec1, class Vec2, class Vec3>
-struct residual_impl<mpi::sdd_projected_matrix<SDD, Matrix>, Vec1, Vec2, Vec3>
-{
-    typedef mpi::sdd_projected_matrix<SDD, Matrix> M;
-
-    static void apply(const Vec1 &rhs, const M &A, const Vec2 &x, Vec3 &r) {
-        A.residual(rhs, x, r);
-    }
-};
-
-} // namespace backend
-
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/mpi/util.hpp b/src/solvers/amgcl/mpi/util.hpp
deleted file mode 100644
index 34e45e9..0000000
--- a/src/solvers/amgcl/mpi/util.hpp
+++ /dev/null
@@ -1,236 +0,0 @@
-#ifndef AMGCL_MPI_UTIL_HPP
-#define AMGCL_MPI_UTIL_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-Copyright (c) 2014, Riccardo Rossi, CIMNE (International Center for Numerical Methods in Engineering)
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/mpi/util.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  MPI utilities.
- */
-
-#include <vector>
-#include <numeric>
-#include <complex>
-
-#include <type_traits>
-#include <amgcl/value_type/interface.hpp>
-
-#include <mpi.h>
-
-namespace amgcl {
-namespace mpi {
-
-/// Converts C type to MPI datatype.
-template <class T, class Enable = void>
-struct datatype_impl {
-    static MPI_Datatype get() {
-        static const MPI_Datatype t = create();
-        return t;
-    }
-
-    static MPI_Datatype create() {
-        typedef typename math::scalar_of<T>::type S;
-        MPI_Datatype t;
-        int n = sizeof(T) / sizeof(S);
-        MPI_Type_contiguous(n, datatype_impl<S>::get(), &t);
-        MPI_Type_commit(&t);
-        return t;
-    }
-};
-
-template <>
-struct datatype_impl<float> {
-    static MPI_Datatype get() { return MPI_FLOAT; }
-};
-
-template <>
-struct datatype_impl<double> {
-    static MPI_Datatype get() { return MPI_DOUBLE; }
-};
-
-template <>
-struct datatype_impl<long double> {
-    static MPI_Datatype get() { return MPI_LONG_DOUBLE; }
-};
-
-template <>
-struct datatype_impl<int> {
-    static MPI_Datatype get() { return MPI_INT; }
-};
-
-template <>
-struct datatype_impl<unsigned> {
-    static MPI_Datatype get() { return MPI_UNSIGNED; }
-};
-
-template <>
-struct datatype_impl<long long> {
-    static MPI_Datatype get() { return MPI_LONG_LONG_INT; }
-};
-
-template <>
-struct datatype_impl<unsigned long long> {
-    static MPI_Datatype get() { return MPI_UNSIGNED_LONG_LONG; }
-};
-
-template <>
-struct datatype_impl< std::complex<double> > {
-    static MPI_Datatype get() { return MPI_CXX_DOUBLE_COMPLEX; }
-};
-
-template <>
-struct datatype_impl< std::complex<float> > {
-    static MPI_Datatype get() { return MPI_CXX_FLOAT_COMPLEX; }
-};
-
-template <typename T>
-struct datatype_impl<T,
-    typename std::enable_if<
-        std::is_same<T, ptrdiff_t>::value &&
-        !std::is_same<ptrdiff_t, long long>::value &&
-        !std::is_same<ptrdiff_t, int>::value
-        >::type
-    > : std::conditional<
-        sizeof(ptrdiff_t) == sizeof(int), datatype_impl<int>, datatype_impl<long long>
-        >::type
-{};
-
-template <typename T>
-struct datatype_impl<T,
-    typename std::enable_if<
-        std::is_same<T, size_t>::value &&
-        !std::is_same<size_t, unsigned long long>::value &&
-        !std::is_same<ptrdiff_t, unsigned int>::value
-        >::type
-    >
-    : std::conditional<
-        sizeof(size_t) == sizeof(unsigned), datatype_impl<unsigned>, datatype_impl<unsigned long long>
-        >::type
-{};
-
-template <>
-struct datatype_impl<char> {
-    static MPI_Datatype get() { return MPI_CHAR; }
-};
-
-template <typename T>
-MPI_Datatype datatype() {
-    return datatype_impl<T>::get();
-}
-
-/// Convenience wrapper around MPI_Init/MPI_Finalize.
-struct init {
-    init(int* argc, char ***argv) {
-        MPI_Init(argc, argv);
-    }
-
-    ~init() {
-        MPI_Finalize();
-    }
-};
-
-/// Convenience wrapper around MPI_Init_threads/MPI_Finalize.
-struct init_thread {
-    init_thread(int* argc, char ***argv) {
-        int _;
-        MPI_Init_thread(argc, argv, MPI_THREAD_MULTIPLE, &_);
-    }
-
-    ~init_thread() {
-        MPI_Finalize();
-    }
-};
-
-/// Convenience wrapper around MPI_Comm.
-struct communicator {
-    MPI_Comm comm;
-    int      rank;
-    int      size;
-
-    communicator() {}
-
-    communicator(MPI_Comm comm) : comm(comm) {
-        MPI_Comm_rank(comm, &rank);
-        MPI_Comm_size(comm, &size);
-    };
-
-    operator MPI_Comm() const {
-        return comm;
-    }
-
-    /// Exclusive sum over mpi communicator
-    template <typename T>
-    std::vector<T> exclusive_sum(T n) const {
-        std::vector<T> v(size + 1); v[0] = 0;
-        MPI_Allgather(&n, 1, datatype<T>(), &v[1], 1, datatype<T>(), comm);
-        std::partial_sum(v.begin(), v.end(), v.begin());
-        return v;
-    }
-
-    template <typename T>
-    T reduce(MPI_Op op, const T &lval) const {
-        const int elems = math::static_rows<T>::value * math::static_cols<T>::value;
-        T gval;
-
-        MPI_Allreduce((void*)&lval, &gval, elems, datatype<T>(), op, comm);
-        return gval;
-    }
-
-    /// Communicator-wise condition checking.
-    /**
-     * Checks conditions at each process in the communicator;
-     *
-     * If the condition is false on any of the participating processes, outputs the
-     * provided message together with the ranks of the offending process.
-     * After that each process in the communicator throws.
-     */
-    template <class Condition, class Message>
-    void check(const Condition &cond, const Message &message) {
-        int lc = static_cast<int>(cond);
-        int gc = reduce(MPI_PROD, lc);
-
-        if (!gc) {
-            std::vector<int> c(size);
-            MPI_Gather(&lc, 1, MPI_INT, &c[0], size, MPI_INT, 0, comm);
-            if (rank == 0) {
-                std::cerr << "Failed assumption: " << message << std::endl;
-                std::cerr << "Offending processes:";
-                for (int i = 0; i < size; ++i)
-                    if (!c[i]) std::cerr << " " << i;
-                std::cerr << std::endl;
-            }
-            MPI_Barrier(comm);
-            throw std::runtime_error(message);
-        }
-    }
-
-};
-
-} // namespace mpi
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/perf_counter/clock.hpp b/src/solvers/amgcl/perf_counter/clock.hpp
deleted file mode 100644
index 02c9bd5..0000000
--- a/src/solvers/amgcl/perf_counter/clock.hpp
+++ /dev/null
@@ -1,72 +0,0 @@
-#ifndef AMGCL_PERF_COUNTER_CLOCK_HPP
-#define AMGCL_PERF_COUNTER_CLOCK_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/perf_counter/clock.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Clock class.
- *
- * A minimal wrapper around either omp_get_wtime() or std::clock().
- */
-
-#ifdef _OPENMP
-#  include <omp.h>
-#else
-#  include <ctime>
-#endif
-
-namespace amgcl {
-
-/// Performance counters for use with amgcl::profiler
-namespace perf_counter {
-
-/// Clock class.
-/**
- * Uses omp_get_wtime() when available, std::clock() otherwise.
- */
-struct clock {
-    typedef double value_type;
-
-    static const char* units() {
-        return "s";
-    }
-
-    /// Current time point.
-    static double current() {
-#ifdef _OPENMP
-        return omp_get_wtime();
-#else
-        return std::clock() / static_cast<double>(CLOCKS_PER_SEC);
-#endif
-    }
-};
-
-} // namespace perf_counter
-} // namespace amgcl
-
-
-#endif
diff --git a/src/solvers/amgcl/perf_counter/cray_energy.hpp b/src/solvers/amgcl/perf_counter/cray_energy.hpp
deleted file mode 100644
index 2278e7c..0000000
--- a/src/solvers/amgcl/perf_counter/cray_energy.hpp
+++ /dev/null
@@ -1,72 +0,0 @@
-#ifndef AMGCL_PERF_COUNTER_CRAY_ENERGY_HPP
-#define AMGCL_PERF_COUNTER_CRAY_ENERGY_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-Copyright (c) 2016 Mohammad Siahatgar <siahatgar@luis.uni-hannover.de>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/perf_counter/cray_energy.hpp
- * \author Mohammad Siahatgar <siahatgar@luis.uni-hannover.de>
- * \brief  Cray energy counter.
- */
-
-#include <fstream>
-#include <amgcl/util.hpp>
-
-namespace amgcl {
-namespace perf_counter {
-
-class cray_energy {
-    public:
-        typedef long long value_type;
-
-        cray_energy() : f(attribute_path()) {
-            precondition(f, std::string("Failed to open ") + attribute_path());
-        }
-
-        static const char* units() {
-            return "J";
-        }
-
-        value_type current() {
-            f.clear();
-            f.seekg(0, std::ios::beg);
-
-            value_type v;
-            f >> v;
-            return v;
-        }
-    private:
-        static const char* attribute_path() {
-            return "/sys/cray/pm_counters/energy";
-        }
-
-        std::ifstream f;
-};
-
-} // namespace perf_counter
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/perf_counter/mpi_aggregator.hpp b/src/solvers/amgcl/perf_counter/mpi_aggregator.hpp
deleted file mode 100644
index 907b434..0000000
--- a/src/solvers/amgcl/perf_counter/mpi_aggregator.hpp
+++ /dev/null
@@ -1,123 +0,0 @@
-#ifndef AMGCL_PERF_COUNTER_MPI_AGGREGATOR_HPP
-#define AMGCL_PERF_COUNTER_MPI_AGGREGATOR_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-Copyright (c) 2016 Mohammad Siahatgar <siahatgar@luis.uni-hannover.de>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/perf_counter/mpi_aggregator.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Aggregate performace counter over MPI.
- */
-
-#include <functional>
-#include <cmath>
-#include <type_traits>
-#include <amgcl/mpi/util.hpp>
-
-namespace amgcl {
-namespace perf_counter {
-
-template <class Counter, bool SingleReaderPerNode = true>
-class mpi_aggregator {
-    public:
-        typedef typename Counter::value_type value_type;
-
-        mpi_aggregator(MPI_Comm comm = MPI_COMM_WORLD)
-            : world(comm), dtype(amgcl::mpi::datatype<value_type>())
-        {
-            if (SingleReaderPerNode) {
-                typedef std::integral_constant<bool, sizeof(size_t) == sizeof(int)>::type _32bit;
-
-                char node_name[MPI_MAX_PROCESSOR_NAME];
-                int node_name_len, node_master;
-
-                MPI_Get_processor_name(node_name, &node_name_len);
-                MPI_Comm_split(world, name_hash(node_name, _32bit()), world.rank, &node_comm);
-                MPI_Allreduce(&world.rank, &node_master, 1, MPI_INT, MPI_MIN, node_comm);
-
-                reader = (world.rank == node_master);
-                MPI_Comm_split(world, reader, world.rank, &reader_comm);
-            }
-        }
-
-        ~mpi_aggregator() {
-            if (SingleReaderPerNode) {
-                MPI_Comm_free(&node_comm);
-                MPI_Comm_free(&reader_comm);
-            }
-        }
-
-        static const char* units() {
-            return Counter::units();
-        }
-
-        value_type current() {
-            value_type gval;
-
-            if (SingleReaderPerNode) {
-                if (reader) {
-                    value_type lval = counter.current();
-                    MPI_Allreduce(&lval, &gval, 1, dtype, MPI_SUM, reader_comm);
-                }
-
-                MPI_Bcast(&gval, 1, dtype, 0, node_comm);
-            } else {
-                value_type lval = counter.current();
-                MPI_Allreduce(&lval, &gval, 1, dtype, MPI_SUM, world);
-            }
-
-            return gval;
-        }
-    private:
-        amgcl::mpi::communicator world;
-        MPI_Datatype dtype;
-
-        bool reader;
-        MPI_Comm node_comm, reader_comm;
-
-        Counter counter;
-
-        int name_hash(const char *name, std::true_type) {
-            return std::hash<std::string>()(name);
-        }
-
-        int name_hash(const char *name, std::false_type) {
-            union {
-                size_t full;
-                struct {
-                    int lo, hi;
-                } part;
-            } h;
-
-            h.full = std::hash<std::string>()(name);
-            return std::abs(h.part.lo ^ h.part.hi);
-        }
-};
-
-} // namespace perf_counter
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/preconditioner/cpr.hpp b/src/solvers/amgcl/preconditioner/cpr.hpp
deleted file mode 100644
index e02a947..0000000
--- a/src/solvers/amgcl/preconditioner/cpr.hpp
+++ /dev/null
@@ -1,561 +0,0 @@
-#ifndef AMGCL_PRECONDITIONER_CPR_HPP
-#define AMGCL_PRECONDITIONER_CPR_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/preconditioner/cpr.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Two stage preconditioner of the Constrained Pressure Residual type.
- */
-
-#include <vector>
-#include <memory>
-#include <cassert>
-
-#include <amgcl/backend/builtin.hpp>
-#include <amgcl/util.hpp>
-
-namespace amgcl {
-namespace preconditioner {
-
-template <class PPrecond, class SPrecond>
-class cpr {
-    static_assert(
-            math::static_rows<typename PPrecond::backend_type::value_type>::value == 1,
-            "Pressure backend should have scalar value type!"
-            );
-
-    static_assert(
-            backend::backends_compatible<
-                typename PPrecond::backend_type,
-                typename SPrecond::backend_type
-                >::value,
-            "Backends for pressure and flow preconditioners should coincide!"
-            );
-
-    public:
-        typedef typename SPrecond::backend_type backend_type;
-        typedef typename PPrecond::backend_type backend_type_p;
-
-        typedef typename backend_type::value_type   value_type;
-        typedef typename backend_type::matrix       matrix;
-        typedef typename backend_type::vector       vector;
-        typedef typename backend_type_p::value_type value_type_p;
-        typedef typename backend_type_p::matrix     matrix_p;
-        typedef typename backend_type_p::vector     vector_p;
-
-        typedef typename backend_type::params       backend_params;
-
-        typedef typename backend::builtin<value_type>::matrix   build_matrix;
-        typedef typename backend::builtin<value_type_p>::matrix build_matrix_p;
-
-        typedef typename math::scalar_of<value_type>::type scalar_type;
-
-        struct params {
-            typedef typename PPrecond::params pprecond_params;
-            typedef typename SPrecond::params sprecond_params;
-
-            pprecond_params pprecond;
-            sprecond_params sprecond;
-
-            int    block_size;
-            size_t active_rows;
-
-            params()
-                : block_size(math::static_rows<value_type>::value == 1 ? 2 : math::static_rows<value_type>::value),
-                  active_rows(0) {}
-
-#ifndef AMGCL_NO_BOOST
-            params(const boost::property_tree::ptree &p)
-                : AMGCL_PARAMS_IMPORT_CHILD(p, pprecond),
-                  AMGCL_PARAMS_IMPORT_CHILD(p, sprecond),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, block_size),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, active_rows)
-            {
-                check_params(p, {"pprecond", "sprecond", "block_size", "active_rows"});
-            }
-
-            void get(boost::property_tree::ptree &p, const std::string &path = "") const
-            {
-                AMGCL_PARAMS_EXPORT_CHILD(p, path, pprecond);
-                AMGCL_PARAMS_EXPORT_CHILD(p, path, sprecond);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, block_size);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, active_rows);
-            }
-#endif
-        } prm;
-
-        template <class Matrix>
-        cpr(
-                const Matrix &K,
-                const params &prm = params(),
-                const backend_params &bprm = backend_params()
-           ) : prm(prm), n(backend::rows(K))
-        {
-            init(std::make_shared<build_matrix>(K), bprm,
-                    std::integral_constant<bool, math::static_rows<value_type>::value == 1>());
-        }
-
-        cpr(
-                std::shared_ptr<build_matrix> K,
-                const params &prm = params(),
-                const backend_params &bprm = backend_params()
-           ) : prm(prm), n(backend::rows(*K))
-        {
-            init(K, bprm,
-                    std::integral_constant<bool, math::static_rows<value_type>::value == 1>());
-        }
-
-        template <class Vec1, class Vec2>
-        void apply(const Vec1 &rhs, Vec2 &&x) const {
-            const auto one = math::identity<scalar_type>();
-            const auto zero = math::zero<scalar_type>();
-
-            AMGCL_TIC("sprecond");
-            S->apply(rhs, x);
-            AMGCL_TOC("sprecond");
-            backend::residual(rhs, S->system_matrix(), x, *rs);
-
-            backend::spmv(one, *Fpp, *rs, zero, *rp);
-            AMGCL_TIC("pprecond");
-            P->apply(*rp, *xp);
-            AMGCL_TOC("pprecond");
-
-            backend::spmv(one, *Scatter, *xp, one, x);
-        }
-
-        std::shared_ptr<matrix> system_matrix_ptr() const {
-            return S->system_matrix_ptr();
-        }
-
-        const matrix& system_matrix() const {
-            return S->system_matrix();
-        }
-
-        template <class Matrix>
-        void partial_update(
-                const Matrix &K,
-                bool update_transfer_ops = true,
-                const backend_params &bprm = backend_params()
-              )
-        {
-            auto K_ptr = std::make_shared<build_matrix>(K);
-            // Update global preconditioner
-            S = std::make_shared<SPrecond>(K_ptr, prm.sprecond, bprm);
-            if(update_transfer_ops){
-              // Update transfer operator Fpp
-              update_transfer(
-                  K_ptr,
-                  bprm,
-                  std::integral_constant<bool, math::static_rows<value_type>::value == 1>()
-                );
-            }
-        }
-
-    private:
-        size_t n, np;
-
-        std::shared_ptr<PPrecond> P;
-        std::shared_ptr<SPrecond> S;
-
-        std::shared_ptr<matrix_p> Fpp, Scatter;
-        std::shared_ptr<vector>   rs;
-        std::shared_ptr<vector_p> rp, xp;
-
-        // Returns pressure transfer operator fpp and (optionally)
-        // partially constructed pressure system matrix App.
-        std::tuple<std::shared_ptr<build_matrix_p>, std::shared_ptr<build_matrix_p>>
-        first_scalar_pass(std::shared_ptr<build_matrix> K, bool get_app = true) {
-            typedef typename backend::row_iterator<build_matrix>::type row_iterator;
-            const int       B = prm.block_size;
-            const ptrdiff_t N = (prm.active_rows ? prm.active_rows : n);
-
-            np = N / B;
-
-            auto fpp = std::make_shared<build_matrix_p>();
-            fpp->set_size(np, N);
-            fpp->set_nonzeros(N);
-            fpp->ptr[0] = 0;
-
-            std::shared_ptr<build_matrix_p> App;
-
-            if (get_app) {
-                App = std::make_shared<build_matrix>();
-                App->set_size(np, np, true);
-            }
-
-            // Get the pressure matrix nonzero pattern,
-            // extract and invert block diagonals.
-#pragma omp parallel
-            {
-                std::vector<row_iterator> k; k.reserve(B);
-                multi_array<scalar_type, 2> v(B, B);
-
-#pragma omp for
-                for(ptrdiff_t ip = 0; ip < static_cast<ptrdiff_t>(np); ++ip) {
-                    ptrdiff_t ik = ip * B;
-                    bool      done = true;
-                    ptrdiff_t cur_col = 0;
-
-                    k.clear();
-                    for(int i = 0; i < B; ++i) {
-                        k.push_back(backend::row_begin(*K, ik + i));
-
-                        if (k.back() && k.back().col() < N) {
-                            ptrdiff_t col = k.back().col() / B;
-                            if (done) {
-                                cur_col = col;
-                                done = false;
-                            } else {
-                                cur_col = std::min(cur_col, col);
-                            }
-                        }
-
-                        fpp->col[ik + i] = ik + i;
-                    }
-                    fpp->ptr[ip+1] = ik + B;
-
-                    while (!done) {
-                        if (get_app) ++App->ptr[ip+1];
-
-                        ptrdiff_t end = (cur_col + 1) * B;
-
-                        if (cur_col == ip) {
-                            // This is diagonal block.
-                            // Capture its (transposed) value,
-                            // invert it and put the relevant row into fpp.
-                            for(int i = 0; i < B; ++i)
-                                for(int j = 0; j < B; ++j) v(i,j) = 0;
-
-                            for(int i = 0; i < B; ++i)
-                                for(; k[i] && k[i].col() < end; ++k[i])
-                                    v(k[i].col() % B, i) = k[i].value();
-
-                            invert(v.data(), &fpp->val[ik]);
-
-                            if (!get_app) break;
-                        } else {
-                            // This is off-diagonal block.
-                            // Just skip it.
-                            for(int i = 0; i < B; ++i)
-                                while(k[i] && k[i].col() < end) ++k[i];
-                        }
-
-                        // Get next column number.
-                        done = true;
-                        for(int i = 0; i < B; ++i) {
-                            if (k[i] && k[i].col() < N) {
-                                ptrdiff_t col = k[i].col() / B;
-                                if (done) {
-                                    cur_col = col;
-                                    done = false;
-                                } else {
-                                    cur_col = std::min(cur_col, col);
-                                }
-                            }
-                        }
-                    }
-                }
-            }
-
-            if (get_app)
-                App->set_nonzeros(App->scan_row_sizes());
-
-            return std::make_tuple(fpp, App);
-        }
-
-        // The system matrix has scalar values
-        void init(std::shared_ptr<build_matrix> K, const backend_params bprm, std::true_type)
-        {
-            typedef typename backend::row_iterator<build_matrix>::type row_iterator;
-            const int       B = prm.block_size;
-            const ptrdiff_t N = (prm.active_rows ? prm.active_rows : n);
-
-            np = N / B;
-
-            std::shared_ptr<build_matrix_p> fpp, App;
-            std::tie(fpp, App) = first_scalar_pass(K);
-
-            auto scatter = std::make_shared<build_matrix_p>();
-            scatter->set_size(n, np);
-            scatter->set_nonzeros(np);
-            scatter->ptr[0] = 0;
-
-#pragma omp parallel
-            {
-                std::vector<row_iterator> k; k.reserve(B);
-
-#pragma omp for
-                for(ptrdiff_t ip = 0; ip < static_cast<ptrdiff_t>(np); ++ip) {
-                    ptrdiff_t ik = ip * B;
-                    ptrdiff_t head = App->ptr[ip];
-                    bool      done = true;
-                    ptrdiff_t cur_col;
-
-                    value_type_p *d = &fpp->val[ik];
-
-                    k.clear();
-                    for(int i = 0; i < B; ++i) {
-                        k.push_back(backend::row_begin(*K, ik + i));
-
-                        if (k.back() && k.back().col() < N) {
-                            ptrdiff_t col = k.back().col() / B;
-                            if (done) {
-                                cur_col = col;
-                                done = false;
-                            } else {
-                                cur_col = std::min(cur_col, col);
-                            }
-                        }
-                    }
-
-                    while (!done) {
-                        ptrdiff_t    end = (cur_col + 1) * B;
-                        value_type_p app = 0;
-
-                        for(int i = 0; i < B; ++i) {
-                            for(; k[i] && k[i].col() < end; ++k[i]) {
-                                if (k[i].col() % B == 0) {
-                                    app += d[i] * k[i].value();
-                                }
-                            }
-                        }
-
-                        App->col[head] = cur_col;
-                        App->val[head] = app;
-                        ++head;
-
-                        // Get next column number.
-                        done = true;
-                        for(int i = 0; i < B; ++i) {
-                            if (k[i] && k[i].col() < N) {
-                                ptrdiff_t col = k[i].col() / B;
-                                if (done) {
-                                    cur_col = col;
-                                    done = false;
-                                } else {
-                                    cur_col = std::min(cur_col, col);
-                                }
-                            }
-                        }
-                    }
-
-                    scatter->col[ip] = ip;
-                    scatter->val[ip] = math::identity<value_type_p>();
-
-                    ptrdiff_t nnz = ip;
-                    for(int i = 0; i < B; ++i) {
-                        if (i == 0) ++nnz;
-                        scatter->ptr[ik + i + 1] = nnz;
-                    }
-                }
-            }
-
-            for(size_t i = N; i < n; ++i)
-                scatter->ptr[i+1] = scatter->ptr[i];
-
-            AMGCL_TIC("pprecond");
-            P = std::make_shared<PPrecond>(App, prm.pprecond, bprm);
-            AMGCL_TOC("pprecond");
-            AMGCL_TIC("sprecond");
-            S = std::make_shared<SPrecond>(K,   prm.sprecond, bprm);
-            AMGCL_TOC("sprecond");
-
-            Fpp     = backend_type_p::copy_matrix(fpp, bprm);
-            Scatter = backend_type_p::copy_matrix(scatter, bprm);
-
-            rp = backend_type_p::create_vector(np, bprm);
-            xp = backend_type_p::create_vector(np, bprm);
-            rs = backend_type::create_vector(n, bprm);
-        }
-
-        void update_transfer(std::shared_ptr<build_matrix> K, const backend_params bprm, std::true_type)
-        {
-            auto fpp = std::get<0>(first_scalar_pass(K, /*get_app*/false));
-            Fpp = backend_type_p::copy_matrix(fpp, bprm);
-        }
-
-        // The system matrix has block values
-        void init(std::shared_ptr<build_matrix> K, const backend_params bprm, std::false_type)
-        {
-            const int       B = math::static_rows<value_type>::value;
-            const ptrdiff_t N = (prm.active_rows ? prm.active_rows : n);
-
-            np = N;
-
-            auto fpp = std::make_shared<build_matrix_p>();
-            fpp->set_size(np, np * B);
-            fpp->set_nonzeros(np * B);
-            fpp->ptr[0] = 0;
-
-            auto scatter = std::make_shared<build_matrix_p>();
-            scatter->set_size(np * B, np);
-            scatter->set_nonzeros(np);
-            scatter->ptr[0] = 0;
-
-            auto App = std::make_shared<build_matrix_p>();
-            App->set_size(np, np, true);
-            App->set_nonzeros(K->nnz);
-            App->ptr[0] = 0;
-
-#pragma omp parallel for
-            for (ptrdiff_t i = 0; i < static_cast<ptrdiff_t>(np); ++i) {
-                ptrdiff_t ik = i * B;
-                for(int k = 0; k < B; ++k, ++ik) {
-                    fpp->col[ik] = ik;
-                    scatter->ptr[ik + 1] = i + 1;
-                }
-
-                fpp->ptr[i + 1] = ik;
-                scatter->col[i] = i;
-                scatter->val[i] = math::identity<value_type_p>();
-
-                ptrdiff_t row_beg = K->ptr[i];
-                ptrdiff_t row_end = K->ptr[i + 1];
-                App->ptr[i+1] = row_end;
-
-                // Extract and invert block diagonals
-                value_type_p *d = &fpp->val[i * B];
-                for(ptrdiff_t j = row_beg; j < row_end; ++j) {
-                    if (K->col[j] == i) {
-                        value_type v = math::adjoint(K->val[j]);
-                        invert(v.data(), d);
-                        break;
-                    }
-                }
-
-                for(ptrdiff_t j = row_beg; j < row_end; ++j) {
-                    value_type_p app = 0;
-                    for(int k = 0; k < B; ++k)
-                        app += d[k] * K->val[j](k,0);
-
-                    App->col[j] = K->col[j];
-                    App->val[j] = app;
-                }
-            }
-
-            AMGCL_TIC("pprecond");
-            P = std::make_shared<PPrecond>(App, prm.pprecond, bprm);
-            AMGCL_TOC("pprecond");
-            AMGCL_TIC("sprecond");
-            S = std::make_shared<SPrecond>(K,   prm.sprecond, bprm);
-            AMGCL_TOC("sprecond");
-
-
-            Fpp     = backend_type_p::copy_matrix(fpp, bprm);
-            Scatter = backend_type_p::copy_matrix(scatter, bprm);
-
-            rp = backend_type_p::create_vector(np, bprm);
-            xp = backend_type_p::create_vector(np, bprm);
-            rs = backend_type::create_vector(n, bprm);
-        }
-
-        void update_transfer(std::shared_ptr<build_matrix> K, const backend_params bprm, std::false_type)
-        {
-            const int       B = math::static_rows<value_type>::value;
-            const ptrdiff_t N = (prm.active_rows ? prm.active_rows : n);
-
-            np = N;
-
-            auto fpp = std::make_shared<build_matrix_p>();
-            fpp->set_size(np, np * B);
-            fpp->set_nonzeros(np * B);
-            fpp->ptr[0] = 0;
-
-#pragma omp parallel for
-            for (ptrdiff_t i = 0; i < static_cast<ptrdiff_t>(np); ++i) {
-                ptrdiff_t ik = i * B;
-                for(int k = 0; k < B; ++k, ++ik) {
-                    fpp->col[ik] = ik;
-                }
-
-                fpp->ptr[i + 1] = ik;
-
-                ptrdiff_t row_beg = K->ptr[i];
-                ptrdiff_t row_end = K->ptr[i + 1];
-
-                // Extract and invert block diagonals
-                value_type_p *d = &fpp->val[i * B];
-                for(ptrdiff_t j = row_beg; j < row_end; ++j) {
-                    if (K->col[j] == i) {
-                        value_type v = math::adjoint(K->val[j]);
-                        invert(v.data(), d);
-                        break;
-                    }
-                }
-            }
-            Fpp = backend_type_p::copy_matrix(fpp, bprm);
-        }
-
-        // Inverts dense matrix A;
-        // Returns the first column of the inverted matrix.
-        void invert(scalar_type *A, value_type_p *y)
-        {
-            const int B = math::static_rows<value_type>::value == 1 ? prm.block_size : math::static_rows<value_type>::value;
-
-            // Perform LU-factorization of A in-place
-            for(int k = 0; k < B; ++k) {
-                scalar_type d = A[k*B+k];
-                assert(!math::is_zero(d));
-                for(int i = k+1; i < B; ++i) {
-                    A[i*B+k] /= d;
-                    for(int j = k+1; j < B; ++j)
-                        A[i*B+j] -= A[i*B+k] * A[k*B+j];
-                }
-            }
-
-            // Invert unit vector in-place.
-            // Lower triangular solve:
-            for(int i = 0; i < B; ++i) {
-                value_type_p b = static_cast<value_type_p>(i == 0);
-                for(int j = 0; j < i; ++j)
-                    b -= A[i*B+j] * y[j];
-                y[i] = b;
-            }
-
-            // Upper triangular solve:
-            for(int i = B; i --> 0; ) {
-                for(int j = i+1; j < B; ++j)
-                    y[i] -= A[i*B+j] * y[j];
-                y[i] /= A[i*B+i];
-            }
-        }
-
-        friend std::ostream& operator<<(std::ostream &os, const cpr &p) {
-            os << "CPR (two-stage preconditioner)\n"
-                  "### Pressure preconditioner:\n"
-               << *p.P << "\n"
-                  "### Global preconditioner:\n"
-               << *p.S << std::endl;
-            return os;
-        }
-};
-
-} // namespace preconditioner
-} // namespace amgcl
-
-
-#endif
diff --git a/src/solvers/amgcl/preconditioner/cpr_drs.hpp b/src/solvers/amgcl/preconditioner/cpr_drs.hpp
deleted file mode 100644
index 1fc483f..0000000
--- a/src/solvers/amgcl/preconditioner/cpr_drs.hpp
+++ /dev/null
@@ -1,625 +0,0 @@
-#ifndef AMGCL_PRECONDITIONER_CPR_DRS_HPP
-#define AMGCL_PRECONDITIONER_CPR_DRS_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/preconditioner/cpr_drs.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  CPR preconditioner with Dynamic Row Sum modification.
- */
-
-#include <vector>
-#include <algorithm>
-
-#include <memory>
-
-#include <amgcl/backend/builtin.hpp>
-#include <amgcl/util.hpp>
-
-namespace amgcl {
-namespace preconditioner {
-
-template <class PPrecond, class SPrecond>
-class cpr_drs {
-    static_assert(
-            math::static_rows<typename PPrecond::backend_type::value_type>::value == 1,
-            "Pressure backend should have scalar value type!"
-            );
-
-    static_assert(
-            backend::backends_compatible<
-                typename PPrecond::backend_type,
-                typename SPrecond::backend_type
-                >::value,
-            "Backends for pressure and flow preconditioners should coincide!"
-            );
-    public:
-        typedef typename SPrecond::backend_type backend_type;
-        typedef typename PPrecond::backend_type backend_type_p;
-
-        typedef typename backend_type::value_type   value_type;
-        typedef typename math::scalar_of<value_type>::type scalar_type;
-        typedef typename backend_type::matrix       matrix;
-        typedef typename backend_type::vector       vector;
-        typedef typename backend_type_p::value_type value_type_p;
-        typedef typename backend_type_p::matrix     matrix_p;
-        typedef typename backend_type_p::vector     vector_p;
-
-        typedef typename backend_type::params       backend_params;
-
-        typedef typename backend::builtin<value_type>::matrix   build_matrix;
-        typedef typename backend::builtin<value_type_p>::matrix build_matrix_p;
-
-        struct params {
-            typedef typename PPrecond::params pprecond_params;
-            typedef typename SPrecond::params sprecond_params;
-
-            pprecond_params pprecond;
-            sprecond_params sprecond;
-
-            int    block_size;
-            size_t active_rows;
-            double eps_dd;
-            double eps_ps;
-
-            std::vector<double> weights;
-
-            params()
-                : block_size(math::static_rows<value_type>::value == 1 ? 2 : math::static_rows<value_type>::value),
-                  active_rows(0), eps_dd(0.2), eps_ps(0.02) {}
-
-#ifndef AMGCL_NO_BOOST
-            params(const boost::property_tree::ptree &p)
-                : AMGCL_PARAMS_IMPORT_CHILD(p, pprecond),
-                  AMGCL_PARAMS_IMPORT_CHILD(p, sprecond),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, block_size),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, active_rows),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, eps_dd),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, eps_ps)
-            {
-                void  *ptr = 0;
-                size_t n   = 0;
-
-                ptr = p.get("weights",      ptr);
-                n   = p.get("weights_size", n);
-
-                if (ptr) {
-                    precondition(n > 0,
-                            "Error in cpr_wdrs parameters: "
-                            "weights is set, but weights_size is not"
-                            );
-
-                    weights.assign(
-                            static_cast<double*>(ptr),
-                            static_cast<double*>(ptr) + n);
-                }
-
-                check_params(p, {"pprecond", "sprecond", "block_size", "active_rows", "eps_dd", "eps_ps", "weights", "weights_size"});
-            }
-
-            void get(boost::property_tree::ptree &p, const std::string &path = "") const
-            {
-                AMGCL_PARAMS_EXPORT_CHILD(p, path, pprecond);
-                AMGCL_PARAMS_EXPORT_CHILD(p, path, sprecond);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, block_size);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, active_rows);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, eps_dd);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, eps_ps);
-            }
-#endif
-        } prm;
-
-        template <class Matrix>
-        cpr_drs(
-                const Matrix &K,
-                const params &prm = params(),
-                const backend_params &bprm = backend_params()
-               ) : prm(prm), n(backend::rows(K))
-        {
-            init(std::make_shared<build_matrix>(K), bprm,
-                    std::integral_constant<bool, math::static_rows<value_type>::value == 1>());
-        }
-
-        cpr_drs(
-                std::shared_ptr<build_matrix> K,
-                const params &prm = params(),
-                const backend_params &bprm = backend_params()
-               ) : prm(prm), n(backend::rows(*K))
-        {
-            init(K, bprm,
-                    std::integral_constant<bool, math::static_rows<value_type>::value == 1>());
-        }
-
-        template <class Vec1, class Vec2>
-        void apply(const Vec1 &rhs, Vec2 &&x) const {
-            const auto one = math::identity<scalar_type>();
-            const auto zero = math::zero<scalar_type>();
-
-            AMGCL_TIC("sprecond");
-            S->apply(rhs, x);
-            AMGCL_TOC("sprecond");
-            backend::residual(rhs, S->system_matrix(), x, *rs);
-
-            backend::spmv(one, *Fpp, *rs, zero, *rp);
-            AMGCL_TIC("pprecond");
-            P->apply(*rp, *xp);
-            AMGCL_TOC("pprecond");
-
-            backend::spmv(one, *Scatter, *xp, one, x);
-        }
-
-        std::shared_ptr<matrix> system_matrix_ptr() const {
-            return S->system_matrix_ptr();
-        }
-
-        const matrix& system_matrix() const {
-            return S->system_matrix();
-        }
-
-        /* Perform a partial update of the CPR preconditioner. This function
-         * leaves the AMG hierarchy intact, but updates the global preconditioner
-         * SPrecond and optionally also the transfer operator Fpp.
-         */
-        template <class Matrix>
-        void partial_update(
-                const Matrix &K,
-                bool update_transfer_ops = true,
-                const backend_params &bprm = backend_params()
-              )
-        {
-            auto K_ptr = std::make_shared<build_matrix>(K);
-            // Update global preconditioner
-            S = std::make_shared<SPrecond>(K_ptr, prm.sprecond, bprm);
-            if(update_transfer_ops){
-              // Update transfer operator Fpp
-              update_transfer(
-                  K_ptr,
-                  bprm,
-                  std::integral_constant<bool, math::static_rows<value_type>::value == 1>()
-                );
-            }
-        }
-
-    private:
-        size_t n, np;
-
-        std::shared_ptr<PPrecond> P;
-        std::shared_ptr<SPrecond> S;
-
-        std::shared_ptr<matrix_p> Fpp, Scatter;
-        std::shared_ptr<vector>   rs;
-        std::shared_ptr<vector_p> rp, xp;
-
-        // Returns pressure transfer operator fpp and (optionally)
-        // partially constructed pressure system matrix App.
-        std::tuple<std::shared_ptr<build_matrix_p>, std::shared_ptr<build_matrix_p>>
-        first_scalar_pass(std::shared_ptr<build_matrix> K, bool get_app = true) {
-            typedef typename backend::row_iterator<build_matrix>::type row_iterator;
-            const int       B = prm.block_size;
-            const ptrdiff_t N = (prm.active_rows ? prm.active_rows : n);
-
-            np = N / B;
-
-            auto fpp = std::make_shared<build_matrix_p>();
-            fpp->set_size(np, n);
-            fpp->set_nonzeros(n);
-            fpp->ptr[0] = 0;
-
-            std::shared_ptr<build_matrix_p> App;
-            if (get_app) {
-                App = std::make_shared<build_matrix_p>();
-                App->set_size(np, np, true);
-            }
-
-#pragma omp parallel
-            {
-                std::vector<value_type> a_dia(B), a_off(B), a_top(B);
-                std::vector<row_iterator> k; k.reserve(B);
-
-#pragma omp for
-                for(ptrdiff_t ip = 0; ip < static_cast<ptrdiff_t>(np); ++ip) {
-                    ptrdiff_t ik = ip * B;
-                    bool      done = true;
-                    ptrdiff_t cur_col = 0;
-
-                    std::fill(a_dia.begin(), a_dia.end(), 0);
-                    std::fill(a_off.begin(), a_off.end(), 0);
-                    std::fill(a_top.begin(), a_top.end(), 0);
-
-                    k.clear();
-                    for(int i = 0; i < B; ++i) {
-                        k.push_back(backend::row_begin(*K, ik + i));
-
-                        if (k.back() && k.back().col() < N) {
-                            ptrdiff_t col = k.back().col() / B;
-                            if (done) {
-                                cur_col = col;
-                                done = false;
-                            } else {
-                                cur_col = std::min(cur_col, col);
-                            }
-                        }
-                    }
-
-                    while (!done) {
-                        if (get_app) ++App->ptr[ip+1];
-
-                        ptrdiff_t end = (cur_col + 1) * B;
-
-                        for(int i = 0; i < B; ++i) {
-                            for(; k[i] && k[i].col() < end; ++k[i]) {
-                                ptrdiff_t  c = k[i].col() % B;
-                                value_type v = k[i].value();
-
-                                if (i == 0) {
-                                    a_top[c] += std::abs(v);
-                                }
-
-                                if (c == 0) {
-                                    if (cur_col == ip) {
-                                        a_dia[i] = v;
-                                    } else {
-                                        a_off[i] += std::abs(v);
-                                    }
-                                }
-                            }
-                        }
-
-                        // Get next column number.
-                        done = true;
-                        for(int i = 0; i < B; ++i) {
-                            if (k[i] && k[i].col() < N) {
-                                ptrdiff_t col = k[i].col() / B;
-                                if (done) {
-                                    cur_col = col;
-                                    done = false;
-                                } else {
-                                    cur_col = std::min(cur_col, col);
-                                }
-                            }
-                        }
-                    }
-
-                    for(int i = 0; i < B; ++i) {
-                        fpp->col[ik+i] = ik+i;
-                        double delta = 1;
-
-                        if (!prm.weights.empty())
-                            delta *= prm.weights[ik+i];
-
-                        if (i > 0) {
-                            if (a_dia[i] < prm.eps_dd * a_off[i])
-                                delta = 0;
-
-                            if (a_top[i] < prm.eps_ps * std::abs(a_dia[0]))
-                                delta = 0;
-                        }
-
-                        fpp->val[ik+i] = delta;
-                    }
-
-                    fpp->ptr[ip+1] = ik + B;
-                }
-            }
-
-            App->set_nonzeros(App->scan_row_sizes());
-
-            return std::make_tuple(fpp, App);
-        }
-
-        void init(std::shared_ptr<build_matrix> K, const backend_params bprm, std::true_type)
-        {
-            typedef typename backend::row_iterator<build_matrix>::type row_iterator;
-            const int       B = prm.block_size;
-            const ptrdiff_t N = (prm.active_rows ? prm.active_rows : n);
-
-            precondition(
-                    prm.weights.empty() || prm.weights.size() == static_cast<size_t>(N),
-                    "CPR: weights size is not equal to number of active rows.");
-
-            np = N / B;
-
-            std::shared_ptr<build_matrix_p> fpp, App;
-            std::tie(fpp, App) = first_scalar_pass(K);
-
-            auto scatter = std::make_shared<build_matrix_p>();
-            scatter->set_size(n, np);
-            scatter->set_nonzeros(np);
-            scatter->ptr[0] = 0;
-
-#pragma omp parallel
-            {
-                std::vector<row_iterator> k; k.reserve(B);
-
-#pragma omp for
-                for(ptrdiff_t ip = 0; ip < static_cast<ptrdiff_t>(np); ++ip) {
-                    ptrdiff_t ik = ip * B;
-                    ptrdiff_t head = App->ptr[ip];
-                    bool      done = true;
-                    ptrdiff_t cur_col = 0;
-
-                    value_type_p *d = &fpp->val[ik];
-
-                    k.clear();
-                    for(int i = 0; i < B; ++i) {
-                        k.push_back(backend::row_begin(*K, ik + i));
-
-                        if (k.back() && k.back().col() < N) {
-                            ptrdiff_t col = k.back().col() / B;
-                            if (done) {
-                                cur_col = col;
-                                done = false;
-                            } else {
-                                cur_col = std::min(cur_col, col);
-                            }
-                        }
-                    }
-
-                    while (!done) {
-                        ptrdiff_t  end = (cur_col + 1) * B;
-                        value_type_p app = 0;
-
-                        for(int i = 0; i < B; ++i) {
-                            for(; k[i] && k[i].col() < end; ++k[i]) {
-                                if (k[i].col() % B == 0) {
-                                    app += d[i] * k[i].value();
-                                }
-                            }
-                        }
-
-                        App->col[head] = cur_col;
-                        App->val[head] = app;
-                        ++head;
-
-                        // Get next column number.
-                        done = true;
-                        for(int i = 0; i < B; ++i) {
-                            if (k[i] && k[i].col() < N) {
-                                ptrdiff_t col = k[i].col() / B;
-                                if (done) {
-                                    cur_col = col;
-                                    done = false;
-                                } else {
-                                    cur_col = std::min(cur_col, col);
-                                }
-                            }
-                        }
-                    }
-
-                    scatter->col[ip] = ip;
-                    scatter->val[ip] = math::identity<value_type>();
-
-                    ptrdiff_t nnz = ip;
-                    for(int i = 0; i < B; ++i) {
-                        if (i == 0) ++nnz;
-                        scatter->ptr[ik + i + 1] = nnz;
-                    }
-                }
-            }
-
-            for(size_t i = N; i < n; ++i)
-                scatter->ptr[i+1] = scatter->ptr[i];
-
-            AMGCL_TIC("pprecond");
-            P = std::make_shared<PPrecond>(App, prm.pprecond, bprm);
-            AMGCL_TOC("pprecond");
-            AMGCL_TIC("sprecond");
-            S = std::make_shared<SPrecond>(K,   prm.sprecond, bprm);
-            AMGCL_TOC("sprecond");
-
-            Fpp     = backend_type_p::copy_matrix(fpp, bprm);
-            Scatter = backend_type_p::copy_matrix(scatter, bprm);
-
-            rp = backend_type_p::create_vector(np, bprm);
-            xp = backend_type_p::create_vector(np, bprm);
-            rs = backend_type::create_vector(n, bprm);
-        }
-
-        void update_transfer(std::shared_ptr<build_matrix> K, const backend_params bprm, std::true_type)
-        {
-            auto fpp = std::get<0>(first_scalar_pass(K, /*get_app*/false));
-            Fpp = backend_type_p::copy_matrix(fpp, bprm);
-        }
-
-        void init(std::shared_ptr<build_matrix> K, const backend_params bprm, std::false_type)
-        {
-            const int       B = math::static_rows<value_type>::value;
-            const ptrdiff_t N = (prm.active_rows ? prm.active_rows : n);
-
-            precondition(
-                    prm.weights.empty() || prm.weights.size() == static_cast<size_t>(N * B),
-                    "CPR: weights size is not equal to number of active rows.");
-
-            np = N;
-
-            auto fpp = std::make_shared<build_matrix_p>();
-            fpp->set_size(np, np * B);
-            fpp->set_nonzeros(np * B);
-            fpp->ptr[0] = 0;
-
-            auto scatter = std::make_shared<build_matrix_p>();
-            scatter->set_size(np * B, np);
-            scatter->set_nonzeros(np);
-            scatter->ptr[0] = 0;
-
-            auto App = std::make_shared<build_matrix_p>();
-            App->set_size(np, np, true);
-            App->set_nonzeros(K->nnz);
-            App->ptr[0] = 0;
-
-#pragma omp parallel for
-            for (ptrdiff_t i = 0; i < static_cast<ptrdiff_t>(np); ++i) {
-                ptrdiff_t ik = i * B;
-                for(int k = 0; k < B; ++k, ++ik) {
-                    fpp->col[ik] = ik;
-                    scatter->ptr[ik + 1] = i + 1;
-                }
-                fpp->ptr[i + 1] = ik;
-                scatter->col[i] = i;
-                scatter->val[i] = math::identity<value_type_p>();
-
-                ptrdiff_t row_beg = K->ptr[i];
-                ptrdiff_t row_end = K->ptr[i + 1];
-                App->ptr[i+1] = row_end;
-
-                value_type_p *d = &fpp->val[i * B];
-                const double *w = prm.weights.empty() ? nullptr : &prm.weights[i * B];
-
-                std::array<value_type_p, B> a_dia{};
-                std::array<value_type_p, B> a_off{};
-                std::array<value_type_p, B> a_top{};
-
-                for(ptrdiff_t j = row_beg; j < row_end; ++j) {
-                    ptrdiff_t  c = K->col[j];
-                    value_type v = K->val[j];
-
-                    for(int k = 0; k < B; ++k) {
-                        a_top[k] += std::abs(v(0,k));
-                        if (c == i) {
-                            a_dia[k] = v(k,0);
-                        } else {
-                            a_off[k] += std::abs(v(k,0));
-                        }
-                    }
-                }
-
-                for(int k = 0; k < B; ++k) {
-                    if (k > 0 &&
-                            (a_dia[k] < prm.eps_dd * a_off[k] ||
-                             a_top[k] < prm.eps_ps * std::abs(a_dia[0])
-                            ))
-                    {
-                        d[k] = 0;
-                    } else {
-                        d[k] = w ? w[k] : 1.0;
-                    }
-                }
-
-                for(ptrdiff_t j = row_beg; j < row_end; ++j) {
-                    App->col[j] = K->col[j];
-
-                    value_type_p app = 0;
-                    for(int k = 0; k < B; ++k)
-                        app += d[k] * K->val[j](k,0);
-
-                    App->val[j] = app;
-                }
-            }
-
-            AMGCL_TIC("pprecond");
-            P = std::make_shared<PPrecond>(App, prm.pprecond, bprm);
-            AMGCL_TOC("pprecond");
-            AMGCL_TIC("sprecond");
-            S = std::make_shared<SPrecond>(K,   prm.sprecond, bprm);
-            AMGCL_TOC("sprecond");
-
-            Fpp     = backend_type_p::copy_matrix(fpp, bprm);
-            Scatter = backend_type_p::copy_matrix(scatter, bprm);
-
-            rp = backend_type_p::create_vector(np, bprm);
-            xp = backend_type_p::create_vector(np, bprm);
-            rs = backend_type::create_vector(n, bprm);
-        }
-
-        void update_transfer(std::shared_ptr<build_matrix> K, const backend_params bprm, std::false_type)
-        {
-            const int       B = math::static_rows<value_type>::value;
-            const ptrdiff_t N = (prm.active_rows ? prm.active_rows : n);
-
-            precondition(
-                    prm.weights.empty() || prm.weights.size() == static_cast<size_t>(N * B),
-                    "CPR: weights size is not equal to number of active rows.");
-
-            np = N;
-
-            auto fpp = std::make_shared<build_matrix_p>();
-            fpp->set_size(np, np * B);
-            fpp->set_nonzeros(np * B);
-            fpp->ptr[0] = 0;
-
-#pragma omp parallel for
-            for (ptrdiff_t i = 0; i < static_cast<ptrdiff_t>(np); ++i) {
-                ptrdiff_t ik = i * B;
-                for(int k = 0; k < B; ++k, ++ik) {
-                    fpp->col[ik] = ik;
-                }
-                fpp->ptr[i + 1] = ik;
-
-                ptrdiff_t row_beg = K->ptr[i];
-                ptrdiff_t row_end = K->ptr[i + 1];
-
-                value_type_p *d = &fpp->val[i * B];
-                const double *w = prm.weights.empty() ? nullptr : &prm.weights[i * B];
-
-                std::array<value_type_p, B> a_dia{};
-                std::array<value_type_p, B> a_off{};
-                std::array<value_type_p, B> a_top{};
-
-                for(ptrdiff_t j = row_beg; j < row_end; ++j) {
-                    ptrdiff_t  c = K->col[j];
-                    value_type v = K->val[j];
-
-                    for(int k = 0; k < B; ++k) {
-                        a_top[k] += std::abs(v(0,k));
-                        if (c == i) {
-                            a_dia[k] = v(k,0);
-                        } else {
-                            a_off[k] += std::abs(v(k,0));
-                        }
-                    }
-                }
-
-                for(int k = 0; k < B; ++k) {
-                    if (k > 0 &&
-                            (a_dia[k] < prm.eps_dd * a_off[k] ||
-                             a_top[k] < prm.eps_ps * std::abs(a_dia[0])
-                            ))
-                    {
-                        d[k] = 0;
-                    } else {
-                        d[k] = w ? w[k] : 1.0;
-                    }
-                }
-            }
-            Fpp     = backend_type_p::copy_matrix(fpp, bprm);
-        }
-
-
-        friend std::ostream& operator<<(std::ostream &os, const cpr_drs &p) {
-            os << "CPR_DRS (two-stage preconditioner)\n"
-                  "### Pressure preconditioner:\n"
-               << *p.P << "\n"
-                  "### Global preconditioner:\n"
-               << *p.S << std::endl;
-            return os;
-        }
-};
-
-} // namespace preconditioner
-} // namespace amgcl
-
-
-#endif
diff --git a/src/solvers/amgcl/preconditioner/dummy.hpp b/src/solvers/amgcl/preconditioner/dummy.hpp
deleted file mode 100644
index d8ded63..0000000
--- a/src/solvers/amgcl/preconditioner/dummy.hpp
+++ /dev/null
@@ -1,105 +0,0 @@
-#ifndef AMGCL_PRECONDITIONER_DUMMY_HPP
-#define AMGCL_PRECONDITIONER_DUMMY_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/preconditioner/dummy.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Dummy preconditioner (identity matrix).
- */
-
-#include <memory>
-#include <amgcl/backend/builtin.hpp>
-#include <amgcl/util.hpp>
-
-namespace amgcl {
-namespace preconditioner {
-
-template <class Backend>
-class dummy {
-    public:
-        typedef Backend backend_type;
-
-        typedef typename Backend::matrix  matrix;
-        typedef typename Backend::vector  vector;
-        typedef typename Backend::value_type value_type;
-        typedef typename Backend::col_type col_type;
-        typedef typename Backend::ptr_type ptr_type;
-        typedef typename backend::builtin<value_type, col_type, ptr_type>::matrix build_matrix;
-
-        typedef amgcl::detail::empty_params params;
-        typedef typename Backend::params backend_params;
-
-        template <class Matrix>
-        dummy(
-                const Matrix &M,
-                const params& = params(),
-                const backend_params &bprm = backend_params()
-                )
-            : A(Backend::copy_matrix(std::make_shared<build_matrix>(M), bprm))
-        {
-        }
-
-        dummy(
-                std::shared_ptr<build_matrix> M,
-                const params& = params(),
-                const backend_params &bprm = backend_params()
-                )
-            : A(Backend::copy_matrix(M, bprm))
-        {
-        }
-
-        template <class Vec1, class Vec2>
-        void apply(const Vec1 &rhs, Vec2 &&x) const {
-            backend::copy(rhs, x);
-        }
-
-        std::shared_ptr<matrix> system_matrix_ptr() const {
-            return A;
-        }
-
-        const matrix& system_matrix() const {
-            return *A;
-        }
-
-        size_t bytes() const {
-            return 0;
-        }
-    private:
-        std::shared_ptr<matrix>   A;
-
-        friend std::ostream& operator<<(std::ostream &os, const dummy &p) {
-            os << "identity matrix as preconditioner" << std::endl;
-            os << "  unknowns: " << backend::rows(p.system_matrix()) << std::endl;
-            os << "  nonzeros: " << backend::nonzeros(p.system_matrix()) << std::endl;
-
-            return os;
-        }
-};
-
-} // namespace preconditioner
-} // namespace amgcl
-#endif
diff --git a/src/solvers/amgcl/preconditioner/runtime.hpp b/src/solvers/amgcl/preconditioner/runtime.hpp
deleted file mode 100644
index ef23d61..0000000
--- a/src/solvers/amgcl/preconditioner/runtime.hpp
+++ /dev/null
@@ -1,423 +0,0 @@
-#ifndef AMGCL_PRECONDITIONER_RUNTIME_HPP
-#define AMGCL_PRECONDITIONER_RUNTIME_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/preconditioner/runtime.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Runtime-configurable wrappers around amgcl classes.
- */
-
-#ifdef AMGCL_NO_BOOST
-#  error Runtime interface relies on Boost.PropertyTree!
-#endif
-
-#include <boost/property_tree/ptree.hpp>
-
-#include <amgcl/util.hpp>
-#include <amgcl/solver/runtime.hpp>
-#include <amgcl/coarsening/runtime.hpp>
-#include <amgcl/relaxation/runtime.hpp>
-#include <amgcl/relaxation/as_preconditioner.hpp>
-#include <amgcl/preconditioner/dummy.hpp>
-#include <amgcl/make_solver.hpp>
-#include <amgcl/amg.hpp>
-
-namespace amgcl {
-namespace runtime {
-
-/// Preconditioner kinds.
-namespace precond_class {
-enum type {
-    amg,            ///< AMG
-    relaxation,     ///< Single-level relaxation
-    dummy,          ///< Identity matrix as preconditioner.
-    nested          ///< Nested solver as preconditioner.
-};
-
-inline std::ostream& operator<<(std::ostream &os, type p) {
-    switch (p) {
-        case amg:
-            return os << "amg";
-        case relaxation:
-            return os << "relaxation";
-        case dummy:
-            return os << "dummy";
-        case nested:
-            return os << "nested";
-        default:
-            return os << "???";
-    }
-}
-
-inline std::istream& operator>>(std::istream &in, type &p)
-{
-    std::string val;
-    in >> val;
-
-    if (val == "amg")
-        p = amg;
-    else if (val == "relaxation")
-        p = relaxation;
-    else if (val == "dummy")
-        p = dummy;
-    else if (val == "nested")
-        p = nested;
-    else
-        throw std::invalid_argument("Invalid preconditioner class. Valid choices are: "
-                "amg, relaxation, dummy, nested");
-
-    return in;
-}
-} // namespace precond_class
-
-template <class Backend>
-class preconditioner {
-    public:
-        typedef Backend backend_type;
-
-        typedef typename Backend::value_type value_type;
-        typedef typename Backend::matrix     matrix;
-        typedef typename Backend::vector     vector;
-        typedef typename Backend::params     backend_params;
-
-        typedef boost::property_tree::ptree params;
-
-        template <class Matrix>
-        preconditioner(
-                const Matrix &A,
-                params prm = params(),
-                const backend_params &bprm = backend_params())
-            : _class(prm.get("class", runtime::precond_class::amg)),
-              handle(0)
-        {
-            if (!prm.erase("class")) AMGCL_PARAM_MISSING("class");
-
-            switch(_class) {
-                case precond_class::amg:
-                    {
-                        typedef
-                            amgcl::amg<Backend, runtime::coarsening::wrapper, runtime::relaxation::wrapper>
-                            Precond;
-
-                        handle = static_cast<void*>(new Precond(A, prm, bprm));
-                    }
-                    break;
-                case precond_class::relaxation:
-                    {
-                        typedef
-                            amgcl::relaxation::as_preconditioner<Backend, runtime::relaxation::wrapper>
-                            Precond;
-
-                        handle = static_cast<void*>(new Precond(A, prm, bprm));
-                    }
-                    break;
-                case precond_class::dummy:
-                    {
-                        typedef
-                            amgcl::preconditioner::dummy<Backend>
-                            Precond;
-
-                        handle = static_cast<void*>(new Precond(A, prm, bprm));
-                    }
-                    break;
-                case precond_class::nested:
-                    {
-                        typedef
-                            make_solver<
-                                preconditioner,
-                                runtime::solver::wrapper<Backend>
-                                >
-                            Precond;
-
-                        handle = static_cast<void*>(new Precond(A, prm, bprm));
-                    }
-                    break;
-                default:
-                    throw std::invalid_argument("Unsupported preconditioner class");
-            }
-        }
-
-        ~preconditioner() {
-            switch (_class) {
-                case precond_class::amg:
-                    {
-                        typedef
-                            amgcl::amg<Backend, runtime::coarsening::wrapper, runtime::relaxation::wrapper>
-                            Precond;
-
-                        delete static_cast<Precond*>(handle);
-                    }
-                    break;
-                case precond_class::relaxation:
-                    {
-                        typedef
-                            amgcl::relaxation::as_preconditioner<Backend, runtime::relaxation::wrapper>
-                            Precond;
-
-                        delete static_cast<Precond*>(handle);
-                    }
-                    break;
-                case precond_class::dummy:
-                    {
-                        typedef
-                            amgcl::preconditioner::dummy<Backend>
-                            Precond;
-
-                        delete static_cast<Precond*>(handle);
-                    }
-                    break;
-                case precond_class::nested:
-                    {
-                        typedef
-                            make_solver<
-                                preconditioner,
-                                runtime::solver::wrapper<Backend>
-                                >
-                            Precond;
-
-                        delete static_cast<Precond*>(handle);
-                    }
-                    break;
-                default:
-                    break;
-            }
-        }
-
-        template <class Matrix>
-        void rebuild(
-                const Matrix &A,
-                const backend_params &bprm = backend_params()
-                )
-        {
-            switch (_class) {
-                case precond_class::amg:
-                    {
-                        typedef
-                            amgcl::amg<Backend, runtime::coarsening::wrapper, runtime::relaxation::wrapper>
-                            Precond;
-
-                        static_cast<Precond*>(handle)->rebuild(A, bprm);
-                    }
-                    break;
-                default:
-                    std::cerr << "rebuild is a noop unless the preconditioner is AMG" << std::endl;
-                    return;
-            }
-        }
-
-        template <class Vec1, class Vec2>
-        void apply(const Vec1 &rhs, Vec2 &x) const {
-            switch(_class) {
-                case precond_class::amg:
-                    {
-                        typedef
-                            amgcl::amg<Backend, runtime::coarsening::wrapper, runtime::relaxation::wrapper>
-                            Precond;
-
-                        static_cast<Precond*>(handle)->apply(rhs, x);
-                    }
-                    break;
-                case precond_class::relaxation:
-                    {
-                        typedef
-                            amgcl::relaxation::as_preconditioner<Backend, runtime::relaxation::wrapper>
-                            Precond;
-
-                        static_cast<Precond*>(handle)->apply(rhs, x);
-                    }
-                    break;
-                case precond_class::dummy:
-                    {
-                        typedef
-                            amgcl::preconditioner::dummy<Backend>
-                            Precond;
-
-                        static_cast<Precond*>(handle)->apply(rhs, x);
-                    }
-                    break;
-                case precond_class::nested:
-                    {
-                        typedef
-                            make_solver<
-                                preconditioner,
-                                runtime::solver::wrapper<Backend>
-                                >
-                            Precond;
-
-                        static_cast<Precond*>(handle)->apply(rhs, x);
-                    }
-                    break;
-                default:
-                    throw std::invalid_argument("Unsupported preconditioner class");
-            }
-        }
-
-        std::shared_ptr<matrix> system_matrix_ptr() const {
-            switch(_class) {
-                case precond_class::amg:
-                    {
-                        typedef
-                            amgcl::amg<Backend, runtime::coarsening::wrapper, runtime::relaxation::wrapper>
-                            Precond;
-
-                        return static_cast<Precond*>(handle)->system_matrix_ptr();
-                    }
-                case precond_class::relaxation:
-                    {
-                        typedef
-                            amgcl::relaxation::as_preconditioner<Backend, runtime::relaxation::wrapper>
-                            Precond;
-
-                        return static_cast<Precond*>(handle)->system_matrix_ptr();
-                    }
-                case precond_class::dummy:
-                    {
-                        typedef
-                            amgcl::preconditioner::dummy<Backend>
-                            Precond;
-
-                        return static_cast<Precond*>(handle)->system_matrix_ptr();
-                    }
-                case precond_class::nested:
-                    {
-                        typedef
-                            make_solver<
-                                preconditioner,
-                                runtime::solver::wrapper<Backend>
-                                >
-                            Precond;
-
-                        return static_cast<Precond*>(handle)->system_matrix_ptr();
-                    }
-                default:
-                    throw std::invalid_argument("Unsupported preconditioner class");
-            }
-        }
-
-        const matrix& system_matrix() const {
-            return *system_matrix_ptr();
-        }
-
-        size_t size() const {
-            return backend::rows( system_matrix() );
-        }
-
-        size_t bytes() const {
-            switch(_class) {
-                case precond_class::amg:
-                    {
-                        typedef
-                            amgcl::amg<Backend, runtime::coarsening::wrapper, runtime::relaxation::wrapper>
-                            Precond;
-
-                        return backend::bytes(*static_cast<Precond*>(handle));
-                    }
-                case precond_class::relaxation:
-                    {
-                        typedef
-                            amgcl::relaxation::as_preconditioner<Backend, runtime::relaxation::wrapper>
-                            Precond;
-
-                        return backend::bytes(*static_cast<Precond*>(handle));
-                    }
-                case precond_class::dummy:
-                    {
-                        typedef
-                            amgcl::preconditioner::dummy<Backend>
-                            Precond;
-
-                        return backend::bytes(*static_cast<Precond*>(handle));
-                    }
-                case precond_class::nested:
-                    {
-                        typedef
-                            make_solver<
-                                preconditioner,
-                                runtime::solver::wrapper<Backend>
-                                >
-                            Precond;
-
-                        return backend::bytes(*static_cast<Precond*>(handle));
-                    }
-                default:
-                    throw std::invalid_argument("Unsupported preconditioner class");
-            }
-        }
-
-        friend std::ostream& operator<<(std::ostream &os, const preconditioner &p)
-        {
-            switch(p._class) {
-                case precond_class::amg:
-                    {
-                        typedef
-                            amgcl::amg<Backend, runtime::coarsening::wrapper, runtime::relaxation::wrapper>
-                            Precond;
-
-                        return os << *static_cast<Precond*>(p.handle);
-                    }
-                case precond_class::relaxation:
-                    {
-                        typedef
-                            amgcl::relaxation::as_preconditioner<Backend, runtime::relaxation::wrapper>
-                            Precond;
-
-                        return os << *static_cast<Precond*>(p.handle);
-                    }
-                case precond_class::dummy:
-                    {
-                        typedef
-                            amgcl::preconditioner::dummy<Backend>
-                            Precond;
-
-                        return os << *static_cast<Precond*>(p.handle);
-                    }
-                case precond_class::nested:
-                    {
-                        typedef
-                            make_solver<
-                                preconditioner,
-                                runtime::solver::wrapper<Backend>
-                                >
-                            Precond;
-
-                        return os << *static_cast<Precond*>(p.handle);
-                    }
-                default:
-                    throw std::invalid_argument("Unsupported preconditioner class");
-            }
-        }
-    private:
-        const runtime::precond_class::type _class;
-
-        void *handle;
-};
-
-} // namespace runtime
-} // namespace amgcl
-
-
-#endif
diff --git a/src/solvers/amgcl/preconditioner/schur_pressure_correction.hpp b/src/solvers/amgcl/preconditioner/schur_pressure_correction.hpp
deleted file mode 100644
index 16b0720..0000000
--- a/src/solvers/amgcl/preconditioner/schur_pressure_correction.hpp
+++ /dev/null
@@ -1,633 +0,0 @@
-#ifndef AMGCL_PRECONDITIONER_SCHUR_PRESSURE_CORRECTION_HPP
-#define AMGCL_PRECONDITIONER_SCHUR_PRESSURE_CORRECTION_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-Copyright (c) 2016, Riccardo Rossi, CIMNE (International Center for Numerical Methods in Engineering)
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/preconditioner/schur_pressure_correction.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Schur-complement pressure correction preconditioning scheme.
- *
- * [1] Elman, Howard, et al. "A taxonomy and comparison of parallel block
- *     multi-level preconditioners for the incompressible Navier–Stokes
- *     equations." Journal of Computational Physics 227.3 (2008): 1790-1808.
- * [2] Gmeiner, Björn, et al. "A quantitative performance analysis for Stokes
- *     solvers at the extreme scale." arXiv preprint arXiv:1511.02134 (2015).
- * [3] Vincent, C., and R. Boyer. "A preconditioned conjugate gradient
- *     Uzawa‐type method for the solution of the Stokes problem by mixed Q1–P0
- *     stabilized finite elements." International journal for numerical methods
- *     in fluids 14.3 (1992): 289-298.
- */
-
-#include <vector>
-
-#include <memory>
-
-#include <amgcl/backend/builtin.hpp>
-#include <amgcl/backend/detail/mixing.hpp>
-#include <amgcl/util.hpp>
-#include <amgcl/io/mm.hpp>
-
-namespace amgcl {
-namespace preconditioner {
-
-/// Schur-complement pressure correction preconditioner
-template <class USolver, class PSolver>
-class schur_pressure_correction {
-    static_assert(
-            backend::backends_compatible<
-                typename USolver::backend_type,
-                typename PSolver::backend_type
-                >::value,
-            "Backends for pressure and flow preconditioners should coincide!"
-            );
-    public:
-        typedef
-            typename backend::detail::common_scalar_backend<
-                typename USolver::backend_type,
-                typename PSolver::backend_type
-                >::type
-            backend_type;
-
-        typedef typename backend_type::value_type value_type;
-        typedef typename math::scalar_of<value_type>::type scalar_type;
-        typedef typename backend_type::matrix     matrix;
-        typedef typename backend_type::vector     vector;
-        typedef typename backend_type::params     backend_params;
-
-        typedef typename backend::builtin<value_type>::matrix build_matrix;
-
-        struct params {
-            typedef typename USolver::params usolver_params;
-            typedef typename PSolver::params psolver_params;
-
-            usolver_params usolver;
-            psolver_params psolver;
-
-            std::vector<char> pmask;
-
-            // Variant of block preconditioner to use in apply()
-            // 1: schur pressure correction:
-            //      S p = fp - Kpu Kuu^-1 fu
-            //      Kuu u = fu - Kup p
-            // 2: Block triangular:
-            //      S p = fp
-            //      Kuu u = fu - Kup p
-            int type;
-
-            // Approximate Kuu^-1 with inverted diagonal of Kuu during
-            // construction of matrix-less Schur complement.
-            // When false, USolver is used instead.
-            bool approx_schur;
-
-            // Adjust preconditioner matrix for the Schur complement system.
-            // That is, use
-            //   Kpp                                 when adjust_p == 0,
-            //   Kpp - dia(Kpu * dia(Kuu)^-1 * Kup)  when adjust_p == 1,
-            //   Kpp - Kpu * dia(Kuu)^-1 * Kup       when adjust_p == 2
-            int adjust_p;
-
-            // Use 1/sum_j(abs(Kuu_{i,j})) instead of dia(Kuu)^-1
-            // as approximation for the Kuu^-1 (as in SIMPLEC algorithm)
-            bool simplec_dia;
-
-            int verbose;
-
-            params() : type(1), approx_schur(false), adjust_p(1), simplec_dia(true), verbose(0) {}
-
-#ifndef AMGCL_NO_BOOST
-            params(const boost::property_tree::ptree &p)
-                : AMGCL_PARAMS_IMPORT_CHILD(p, usolver),
-                  AMGCL_PARAMS_IMPORT_CHILD(p, psolver),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, type),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, approx_schur),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, adjust_p),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, simplec_dia),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, verbose)
-            {
-                size_t n = 0;
-
-                n = p.get("pmask_size", n);
-
-                precondition(n > 0,
-                        "Error in schur_complement parameters: "
-                        "pmask_size is not set");
-
-                if (p.count("pmask_pattern")) {
-                    pmask.resize(n, 0);
-
-                    std::string pattern = p.get("pmask_pattern", std::string());
-                    switch (pattern[0]) {
-                        case '%':
-                            {
-                                int start  = std::atoi(pattern.substr(1).c_str());
-                                int stride = std::atoi(pattern.substr(3).c_str());
-                                for(size_t i = start; i < n; i += stride) pmask[i] = 1;
-                            }
-                            break;
-                        case '<':
-                            {
-                                size_t m = std::atoi(pattern.c_str()+1);
-                                for(size_t i = 0; i < std::min(m, n); ++i) pmask[i] = 1;
-                            }
-                            break;
-                        case '>':
-                            {
-                                size_t m = std::atoi(pattern.c_str()+1);
-                                for(size_t i = m; i < n; ++i) pmask[i] = 1;
-                            }
-                            break;
-                        default:
-                            precondition(false, "Unknown pattern in pmask_pattern");
-                    }
-                } else if (p.count("pmask")) {
-                    void *pm = 0;
-                    pm = p.get("pmask", pm);
-                    pmask.assign(static_cast<char*>(pm), static_cast<char*>(pm) + n);
-                } else {
-                    precondition(false,
-                            "Error in schur_complement parameters: "
-                            "neither pmask_pattern, nor pmask is set"
-                            );
-                }
-
-                check_params(p, {"usolver", "psolver", "type", "approx_schur", "adjust_p", "simplec_dia", "pmask_size", "verbose"},
-                        {"pmask", "pmask_pattern"});
-            }
-
-            void get(boost::property_tree::ptree &p, const std::string &path = "") const
-            {
-                AMGCL_PARAMS_EXPORT_CHILD(p, path, usolver);
-                AMGCL_PARAMS_EXPORT_CHILD(p, path, psolver);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, type);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, approx_schur);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, adjust_p);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, simplec_dia);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, verbose);
-            }
-#endif
-        } prm;
-
-        template <class Matrix>
-        schur_pressure_correction(
-                const Matrix &K,
-                const params &prm = params(),
-                const backend_params &bprm = backend_params()
-                )
-            : prm(prm), n(backend::rows(K)), np(0), nu(0)
-        {
-            init(std::make_shared<build_matrix>(K), bprm);
-        }
-
-        schur_pressure_correction(
-                std::shared_ptr<build_matrix> K,
-                const params &prm = params(),
-                const backend_params &bprm = backend_params()
-                )
-            : prm(prm), n(backend::rows(*K)), np(0), nu(0)
-        {
-            init(K, bprm);
-        }
-
-        template <class Vec1, class Vec2>
-        void apply(const Vec1 &rhs, Vec2 &&x) const {
-            const auto one = math::identity<scalar_type>();
-            const auto zero = math::zero<scalar_type>();
-
-            backend::spmv(one, *x2u, rhs, zero, *rhs_u);
-            backend::spmv(one, *x2p, rhs, zero, *rhs_p);
-
-            if (prm.type == 1) {
-                // Kuu u = rhs_u
-                backend::clear(*u);
-                report("U1", (*U)(*rhs_u, *u));
-
-                // rhs_p -= Kpu u
-                backend::spmv(-one, *Kpu, *u, one, *rhs_p);
-
-                // S p = rhs_p
-                backend::clear(*p);
-                report("P1", (*P)(*this, *rhs_p, *p));
-
-                // rhs_u -= Kup p
-                backend::spmv(-one, *Kup, *p, one, *rhs_u);
-
-                // Kuu u = rhs_u
-                backend::clear(*u);
-                report("U2", (*U)(*rhs_u, *u));
-            } else if (prm.type == 2) {
-                // S p = fp
-                backend::clear(*p);
-                report("P", (*P)(*this, *rhs_p, *p));
-
-                // Kuu u = fu - Kup p
-                backend::spmv(-one, *Kup, *p, one, *rhs_u);
-                backend::clear(*u);
-                report("U", (*U)(*rhs_u, *u));
-            }
-
-            backend::spmv(one, *u2x, *u, zero, x);
-            backend::spmv(one, *p2x, *p, one, x);
-        }
-
-        template <class Alpha, class Vec1, class Beta, class Vec2>
-        void spmv(Alpha alpha, const Vec1 &x, Beta beta, Vec2 &y) const {
-            const auto one = math::identity<scalar_type>();
-            const auto zero = math::zero<scalar_type>();
-
-            // y = beta y + alpha S x, where S = Kpp - Kpu Kuu^-1 Kup
-            if (prm.adjust_p == 1) {
-                backend::spmv( alpha, P->system_matrix(), x, beta, y);
-                backend::vmul( alpha, *Ld, x, one, y);
-            } else if (prm.adjust_p == 2) {
-                backend::spmv( alpha, *Lm, x, beta, y);
-            } else {
-                backend::spmv( alpha, P->system_matrix(), x, beta, y);
-            }
-
-            backend::spmv(one, *Kup, x, zero, *tmp);
-
-            if (prm.approx_schur) {
-                backend::vmul(one, *M, *tmp, zero, *u);
-            } else {
-                backend::clear(*u);
-                (*U)(*tmp, *u);
-            }
-
-            backend::spmv(-alpha, *Kpu, *u, one, y);
-        }
-
-        std::shared_ptr<matrix> system_matrix_ptr() const {
-            return K;
-        }
-
-        const matrix& system_matrix() const {
-            return *K;
-        }
-
-        size_t bytes() const {
-            size_t b = 0;
-
-            b += backend::bytes(*K);
-            b += backend::bytes(*Kup);
-            b += backend::bytes(*Kpu);
-            b += backend::bytes(*x2u);
-            b += backend::bytes(*x2p);
-            b += backend::bytes(*u2x);
-            b += backend::bytes(*p2x);
-            b += backend::bytes(*rhs_u);
-            b += backend::bytes(*rhs_p);
-            b += backend::bytes(*u);
-            b += backend::bytes(*p);
-            b += backend::bytes(*tmp);
-            b += backend::bytes(*U);
-            b += backend::bytes(*P);
-
-            if (M) b += backend::bytes(*M);
-            if (Ld) b += backend::bytes(*Ld);
-            if (Lm) b += backend::bytes(*Lm);
-
-            return b;
-        }
-
-    private:
-        size_t n, np, nu;
-
-        std::shared_ptr<matrix> K, Lm, Kup, Kpu, x2u, x2p, u2x, p2x;
-        std::shared_ptr<vector> rhs_u, rhs_p, u, p, tmp;
-        std::shared_ptr<typename backend_type::matrix_diagonal> M;
-        std::shared_ptr<typename backend_type::matrix_diagonal> Ld;
-
-        std::shared_ptr<USolver> U;
-        std::shared_ptr<PSolver> P;
-
-        void init(const std::shared_ptr<build_matrix> &K, const backend_params &bprm)
-        {
-            this->K = backend_type::copy_matrix(K, bprm);
-
-            // Extract matrix subblocks.
-            auto Kuu = std::make_shared<build_matrix>();
-            auto Kpu = std::make_shared<build_matrix>();
-            auto Kup = std::make_shared<build_matrix>();
-            auto Kpp = std::make_shared<build_matrix>();
-
-            std::vector<ptrdiff_t> idx(n);
-
-            for(size_t i = 0; i < n; ++i)
-                idx[i] = (prm.pmask[i] ? np++ : nu++);
-
-            Kuu->set_size(nu, nu, true);
-            Kup->set_size(nu, np, true);
-            Kpu->set_size(np, nu, true);
-            Kpp->set_size(np, np, true);
-
-#pragma omp parallel for
-            for(ptrdiff_t i = 0; i < static_cast<ptrdiff_t>(n); ++i) {
-                ptrdiff_t ci = idx[i];
-                char      pi = prm.pmask[i];
-                for(auto k = backend::row_begin(*K, i); k; ++k) {
-                    char pj = prm.pmask[k.col()];
-
-                    if (pi) {
-                        if (pj) {
-                            ++Kpp->ptr[ci+1];
-                        } else {
-                            ++Kpu->ptr[ci+1];
-                        }
-                    } else {
-                        if (pj) {
-                            ++Kup->ptr[ci+1];
-                        } else {
-                            ++Kuu->ptr[ci+1];
-                        }
-                    }
-                }
-            }
-
-            Kuu->set_nonzeros(Kuu->scan_row_sizes());
-            Kup->set_nonzeros(Kup->scan_row_sizes());
-            Kpu->set_nonzeros(Kpu->scan_row_sizes());
-            Kpp->set_nonzeros(Kpp->scan_row_sizes());
-
-#pragma omp parallel for
-            for(ptrdiff_t i = 0; i < static_cast<ptrdiff_t>(n); ++i) {
-                ptrdiff_t ci = idx[i];
-                char      pi = prm.pmask[i];
-
-                ptrdiff_t uu_head = 0, up_head = 0, pu_head = 0, pp_head = 0;
-
-                if(pi) {
-                    pu_head = Kpu->ptr[ci];
-                    pp_head = Kpp->ptr[ci];
-                } else {
-                    uu_head = Kuu->ptr[ci];
-                    up_head = Kup->ptr[ci];
-                }
-
-                for(auto k = backend::row_begin(*K, i); k; ++k) {
-                    ptrdiff_t  j = k.col();
-                    value_type v = k.value();
-                    ptrdiff_t cj = idx[j];
-                    char      pj = prm.pmask[j];
-
-                    if (pi) {
-                        if (pj) {
-                            Kpp->col[pp_head] = cj;
-                            Kpp->val[pp_head] = v;
-                            ++pp_head;
-                        } else {
-                            Kpu->col[pu_head] = cj;
-                            Kpu->val[pu_head] = v;
-                            ++pu_head;
-                        }
-                    } else {
-                        if (pj) {
-                            Kup->col[up_head] = cj;
-                            Kup->val[up_head] = v;
-                            ++up_head;
-                        } else {
-                            Kuu->col[uu_head] = cj;
-                            Kuu->val[uu_head] = v;
-                            ++uu_head;
-                        }
-                    }
-                }
-            }
-
-            if (prm.verbose >= 2) {
-                io::mm_write("Kuu.mtx", *Kuu);
-                io::mm_write("Kpp.mtx", *Kpp);
-            }
-
-            std::shared_ptr<backend::numa_vector<value_type>> Kuu_dia;
-
-            if (prm.simplec_dia) {
-                Kuu_dia = std::make_shared<backend::numa_vector<value_type>>(nu);
-#pragma omp parallel for
-                for(ptrdiff_t i = 0; i < static_cast<ptrdiff_t>(nu); ++i) {
-                    value_type s = math::zero<value_type>();
-                    for(ptrdiff_t j = Kuu->ptr[i], e = Kuu->ptr[i+1]; j < e; ++j) {
-                        s += math::norm(Kuu->val[j]);
-                    }
-                    (*Kuu_dia)[i] = math::inverse(s);
-                }
-            } else {
-                Kuu_dia = diagonal(*Kuu, /*invert = */true);
-            }
-
-            if (prm.adjust_p == 1) {
-                // Use (Kpp - dia(Kpu * dia(Kuu)^-1 * Kup))
-                // to setup the P preconditioner.
-                auto L = std::make_shared<backend::numa_vector<value_type>>(np, false);
-
-#pragma omp parallel for
-                for(ptrdiff_t i = 0; i < static_cast<ptrdiff_t>(np); ++i) {
-                    value_type s = math::zero<value_type>();
-                    for(ptrdiff_t j = Kpu->ptr[i], e = Kpu->ptr[i+1]; j < e; ++j) {
-                        ptrdiff_t  k = Kpu->col[j];
-                        value_type v = Kpu->val[j];
-                        for(ptrdiff_t jj = Kup->ptr[k], ee = Kup->ptr[k+1]; jj < ee; ++jj) {
-                            if (Kup->col[jj] == i) {
-                                s += v * (*Kuu_dia)[k] * Kup->val[jj];
-                                break;
-                            }
-                        }
-                    }
-
-                    (*L)[i] = s;
-                    for(ptrdiff_t j = Kpp->ptr[i], e = Kpp->ptr[i+1]; j < e; ++j) {
-                        if (Kpp->col[j] == i) {
-                            Kpp->val[j] -= s;
-                            break;
-                        }
-                    }
-                }
-                Ld = backend_type::copy_vector(L, bprm);
-            } else if (prm.adjust_p == 2) {
-                Lm = backend_type::copy_matrix(Kpp, bprm);
-
-                // Use (Kpp - Kpu * dia(Kuu)^-1 * Kup)
-                // to setup the P preconditioner.
-                backend::numa_vector<value_type> val(Kup->nnz);
-
-#pragma omp parallel for
-                for(ptrdiff_t i = 0; i < static_cast<ptrdiff_t>(nu); ++i) {
-                    value_type d = (*Kuu_dia)[i];
-                    for(ptrdiff_t j = Kup->ptr[i], e = Kup->ptr[i+1]; j < e; ++j) {
-                        val[j] = d * Kup->val[j];
-                    }
-                }
-
-                build_matrix Kup_hat;
-
-                Kup_hat.own_data = false;
-                Kup_hat.nrows    = nu;
-                Kup_hat.ncols    = np;
-                Kup_hat.nnz      = Kup->nnz;
-                Kup_hat.ptr      = Kup->ptr;
-                Kup_hat.col      = Kup->col;
-                Kup_hat.val      = val.data();
-
-                Kpp = backend::sum(
-                        math::identity<value_type>(), *Kpp,
-                       -math::identity<value_type>(), *backend::product(*Kpu, Kup_hat));
-            }
-
-            U = std::make_shared<USolver>(*Kuu, prm.usolver, bprm);
-            P = std::make_shared<PSolver>(*Kpp, prm.psolver, bprm);
-
-            this->Kup = backend_type::copy_matrix(Kup, bprm);
-            this->Kpu = backend_type::copy_matrix(Kpu, bprm);
-
-            rhs_u = backend_type::create_vector(nu, bprm);
-            rhs_p = backend_type::create_vector(np, bprm);
-
-            u = backend_type::create_vector(nu, bprm);
-            p = backend_type::create_vector(np, bprm);
-
-            tmp = backend_type::create_vector(nu, bprm);
-
-            if (prm.approx_schur)
-                M = backend_type::copy_vector(Kuu_dia, bprm);
-
-            // Scatter/Gather matrices
-            auto x2u = std::make_shared<build_matrix>();
-            auto x2p = std::make_shared<build_matrix>();
-            auto u2x = std::make_shared<build_matrix>();
-            auto p2x = std::make_shared<build_matrix>();
-
-            x2u->set_size(nu, n, true);
-            x2p->set_size(np, n, true);
-            u2x->set_size(n, nu, true);
-            p2x->set_size(n, np, true);
-
-            {
-                ptrdiff_t x2u_head = 0, x2u_idx = 0;
-                ptrdiff_t x2p_head = 0, x2p_idx = 0;
-                ptrdiff_t u2x_head = 0, u2x_idx = 0;
-                ptrdiff_t p2x_head = 0, p2x_idx = 0;
-
-                for(size_t i = 0; i < n; ++i) {
-                    if (prm.pmask[i]) {
-                        x2p->ptr[++x2p_idx] = ++x2p_head;
-                        ++p2x_head;
-                    } else {
-                        x2u->ptr[++x2u_idx] = ++x2u_head;
-                        ++u2x_head;
-                    }
-
-                    p2x->ptr[++p2x_idx] = p2x_head;
-                    u2x->ptr[++u2x_idx] = u2x_head;
-                }
-            }
-
-            x2u->set_nonzeros();
-            x2p->set_nonzeros();
-            u2x->set_nonzeros();
-            p2x->set_nonzeros();
-
-            {
-                ptrdiff_t x2u_head = 0;
-                ptrdiff_t x2p_head = 0;
-                ptrdiff_t u2x_head = 0;
-                ptrdiff_t p2x_head = 0;
-
-                for(size_t i = 0; i < n; ++i) {
-                    ptrdiff_t j = idx[i];
-
-                    if (prm.pmask[i]) {
-                        x2p->col[x2p_head] = i;
-                        x2p->val[x2p_head] = math::identity<value_type>();
-                        ++x2p_head;
-
-                        p2x->col[p2x_head] = j;
-                        p2x->val[p2x_head] = math::identity<value_type>();
-                        ++p2x_head;
-                    } else {
-                        x2u->col[x2u_head] = i;
-                        x2u->val[x2u_head] = math::identity<value_type>();
-                        ++x2u_head;
-
-                        u2x->col[u2x_head] = j;
-                        u2x->val[u2x_head] = math::identity<value_type>();
-                        ++u2x_head;
-                    }
-                }
-            }
-
-            this->x2u = backend_type::copy_matrix(x2u, bprm);
-            this->x2p = backend_type::copy_matrix(x2p, bprm);
-            this->u2x = backend_type::copy_matrix(u2x, bprm);
-            this->p2x = backend_type::copy_matrix(p2x, bprm);
-        }
-
-        friend std::ostream& operator<<(std::ostream &os, const schur_pressure_correction &p) {
-            os << "Schur complement (two-stage preconditioner)" << std::endl;
-            os << "  Unknowns: " << p.n << "(" << p.np << ")" << std::endl;
-            os << "  Nonzeros: " << backend::nonzeros(p.system_matrix()) << std::endl;
-            os << "  Memory:  " << human_readable_memory(p.bytes()) << std::endl;
-            os << std::endl;
-            os << "[ U ]\n" << *p.U << std::endl;
-            os << "[ P ]\n" << *p.P << std::endl;
-
-            return os;
-        }
-
-        template <typename I, typename E>
-        void report(const std::string &name, const std::tuple<I, E> &c) const {
-            if (prm.verbose >= 1) {
-                std::cout << name << " (" << std::get<0>(c) << ", " << std::get<1>(c) << ")\n";
-            }
-        }
-};
-
-} // namespace preconditioner
-
-namespace backend {
-
-template <class US, class PS, class Alpha, class Beta, class Vec1, class Vec2>
-struct spmv_impl< Alpha, preconditioner::schur_pressure_correction<US, PS>, Vec1, Beta, Vec2>
-{
-    static void apply(Alpha alpha, const preconditioner::schur_pressure_correction<US, PS> &A, const Vec1 &x, Beta beta, Vec2 &y)
-    {
-        A.spmv(alpha, x, beta, y);
-    }
-};
-
-template <class US, class PS, class Vec1, class Vec2, class Vec3>
-struct residual_impl< preconditioner::schur_pressure_correction<US, PS>, Vec1, Vec2, Vec3>
-{
-    static void apply(const Vec1 &rhs, const preconditioner::schur_pressure_correction<US, PS> &A, const Vec2 &x, Vec3 &r)
-    {
-        backend::copy(rhs, r);
-        A.spmv(-1, x, 1, r);
-    }
-};
-
-} // namespace backend
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/profiler.hpp b/src/solvers/amgcl/profiler.hpp
deleted file mode 100644
index d1410d4..0000000
--- a/src/solvers/amgcl/profiler.hpp
+++ /dev/null
@@ -1,216 +0,0 @@
-#ifndef AMGCL_PROFILER_H
-#define AMGCL_PROFILER_H
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/profiler.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Profiler class.
- */
-
-#include <iostream>
-#include <iomanip>
-#include <map>
-#include <string>
-#include <vector>
-#include <type_traits>
-
-#include <amgcl/perf_counter/clock.hpp>
-#include <amgcl/io/ios_saver.hpp>
-
-namespace amgcl {
-
-/// Profiler class.
-/**
- * \param Counter     Performance counter to use for profiling.
- * \param SHIFT_WIDTH Indentation for output of profiling results.
- *
- * Provides simple to use, hierarchical profile with nicely formatted output.
- */
-template <class Counter = amgcl::perf_counter::clock, unsigned SHIFT_WIDTH = 2>
-class profiler {
-    public:
-        typedef typename Counter::value_type value_type;
-        typedef double delta_type;
-
-        /// Initialization.
-        /**
-         */
-        profiler() : name("Profile") {
-            init();
-        }
-
-        /// Send additional parameters to counter.
-        /**
-         * \param name Profile title to use with output.
-         * \param args Counter arguments.
-         */
-        template <class... Args>
-        profiler(const std::string &name, Args&&... args)
-            : name(name), counter(std::forward<Args>(args)...)
-        {
-            init();
-        }
-
-        /// Starts measurement.
-        /**
-         * \param name interval name.
-         */
-        void tic(const std::string &name) {
-            stack.back()->children[name].begin = counter.current();
-            stack.push_back(&stack.back()->children[name]);
-        }
-
-        /// Stops measurement.
-        /**
-         * Returns delta in the measured value since the corresponding tic().
-         */
-        delta_type toc(const std::string& /*name*/ = "") {
-            profile_unit *top = stack.back();
-            stack.pop_back();
-
-            value_type current = counter.current();
-            delta_type delta   = current - top->begin;
-
-            top->length += delta;
-            root.length = current - root.begin;
-
-            return delta;
-        }
-
-        void reset() {
-            stack.clear();
-            root.length = 0;
-            root.children.clear();
-
-            stack.push_back(&root);
-            root.begin = counter.current();
-        }
-
-        struct scoped_ticker {
-            profiler &prof;
-            scoped_ticker(profiler &prof) : prof(prof) {}
-            ~scoped_ticker() {
-                prof.toc();
-            }
-        };
-
-        scoped_ticker scoped_tic(const std::string &name) {
-            tic(name);
-            return scoped_ticker(*this);
-        }
-    private:
-        struct profile_unit {
-            profile_unit() : length(0) {}
-
-            delta_type children_time() const {
-                delta_type s = delta_type();
-                for(typename std::map<std::string, profile_unit>::const_iterator c = children.begin(); c != children.end(); c++)
-                    s += c->second.length;
-                return s;
-            }
-
-            size_t total_width(const std::string &name, int level) const {
-                size_t w = name.size() + level;
-                for(typename std::map<std::string, profile_unit>::const_iterator c = children.begin(); c != children.end(); c++)
-                    w = std::max(w, c->second.total_width(c->first, level + SHIFT_WIDTH));
-                return w;
-            }
-
-            void print(std::ostream &out, const std::string &name,
-                    int level, delta_type total, size_t width) const
-            {
-                using namespace std;
-
-                out << "[" << setw(level) << "";
-                print_line(out, name, length, 100 * length / total, width - level);
-
-                if (children.size()) {
-                    delta_type val = length - children_time();
-                    double perc = 100.0 * val / total;
-
-                    if (perc > 1e-1) {
-                        out << "[" << setw(level + 1) << "";
-                        print_line(out, "self", val, perc, width - level - 1);
-                    }
-                }
-
-                for(typename std::map<std::string, profile_unit>::const_iterator c = children.begin(); c != children.end(); c++)
-                    c->second.print(out, c->first, level + SHIFT_WIDTH, total, width);
-            }
-
-            void print_line(std::ostream &out, const std::string &name,
-                    delta_type time, double perc, size_t width) const
-            {
-                using namespace std;
-
-                out << name << ":"
-                    << setw(width - name.size()) << ""
-                    << setw(10)
-                    << fixed << setprecision(3) << time << " " << Counter::units()
-                    << "] (" << fixed << setprecision(2) << setw(6) << perc << "%)"
-                    << endl;
-            }
-
-            value_type begin;
-            delta_type length;
-
-            std::map<std::string, profile_unit> children;
-        };
-
-        std::string name;
-        Counter counter;
-        profile_unit root;
-        std::vector<profile_unit*> stack;
-
-        void init() {
-            stack.reserve(128);
-            stack.push_back(&root);
-            root.begin = counter.current();
-        }
-
-        void print(std::ostream &out) {
-            if (stack.back() != &root)
-                out << "Warning! Profile is incomplete." << std::endl;
-            ios_saver ss(out);
-            root.print(out, name, 0, root.length, root.total_width(name, 0));
-        }
-
-        /// Sends formatted profiling data to an output stream.
-        /**
-         * \param out  Output stream.
-         * \param prof Profiler.
-         */
-        friend std::ostream& operator<<(std::ostream &out, profiler &prof) {
-            out << std::endl;
-            prof.print(out);
-            return out << std::endl;
-        }
-};
-
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/relaxation/as_block.hpp b/src/solvers/amgcl/relaxation/as_block.hpp
deleted file mode 100644
index 0b48abd..0000000
--- a/src/solvers/amgcl/relaxation/as_block.hpp
+++ /dev/null
@@ -1,131 +0,0 @@
-#ifndef AMGCL_RELAXATION_AS_BLOCK_HPP
-#define AMGCL_RELAXATION_AS_BLOCK_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/relaxation/as_block.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Block matrix adapter for an amgcl smoother.
- */
-
-#include <vector>
-#include <memory>
-#include <amgcl/util.hpp>
-#include <amgcl/backend/interface.hpp>
-#include <amgcl/backend/interface.hpp>
-#include <amgcl/adapter/block_matrix.hpp>
-
-namespace amgcl {
-namespace relaxation {
-
-/// Converts input matrix to block format before constructing an amgcl smoother.
-template <class BlockBackend, template <class> class Relax>
-struct as_block {
-    typedef typename BlockBackend::value_type BlockType;
-
-    template <class Backend>
-    class type {
-        public:
-            typedef Backend backend_type;
-
-            typedef Relax<BlockBackend>       Base;
-
-            typedef typename Backend::matrix  matrix;
-            typedef typename Backend::vector  vector;
-            typedef typename Base::params     params;
-            typedef typename Backend::params  backend_params;
-
-            typedef typename Backend::value_type value_type;
-            typedef typename Backend::col_type   col_type;
-            typedef typename Backend::ptr_type   ptr_type;
-            typedef typename backend::builtin<value_type, col_type, ptr_type>::matrix build_matrix;
-
-            template <class Matrix>
-            type(
-                    const Matrix &A,
-                    const params &prm = params(),
-                    const backend_params &bprm = backend_params()
-                    )
-            : base(*std::make_shared<typename backend::crs<BlockType, col_type, ptr_type>>(adapter::block_matrix<BlockType>(A)), prm, bprm),
-              nrows(backend::rows(A) / math::static_rows<BlockType>::value)
-            { }
-
-            template <class Matrix, class VectorRHS, class VectorX, class VectorTMP>
-            void apply_pre(
-                    const Matrix &A,
-                    const VectorRHS &rhs,
-                    VectorX &x,
-                    VectorTMP &tmp
-                    ) const
-            {
-                auto F = backend::reinterpret_as_rhs<BlockType>(rhs);
-                auto X = backend::reinterpret_as_rhs<BlockType>(x);
-                auto T = backend::reinterpret_as_rhs<BlockType>(tmp);
-                base.apply_pre(A, F, X, T);
-            }
-
-            template <class Matrix, class VectorRHS, class VectorX, class VectorTMP>
-            void apply_post(
-                    const Matrix &A,
-                    const VectorRHS &rhs,
-                    VectorX &x,
-                    VectorTMP &tmp
-                    ) const
-            {
-                auto F = backend::reinterpret_as_rhs<BlockType>(rhs);
-                auto X = backend::reinterpret_as_rhs<BlockType>(x);
-                auto T = backend::reinterpret_as_rhs<BlockType>(tmp);
-                base.apply_post(A, F, X, T);
-            }
-
-            template <class Matrix, class Vec1, class Vec2>
-            void apply(const Matrix &A, const Vec1 &rhs, Vec2 &&x) const {
-                auto F = backend::reinterpret_as_rhs<BlockType>(rhs);
-                auto X = backend::reinterpret_as_rhs<BlockType>(x);
-                base.apply(A, F, X);
-            }
-
-            const matrix& system_matrix() const {
-                return base.system_matrix();
-            }
-
-            std::shared_ptr<matrix> system_matrix_ptr() const {
-                return base.system_matrix_ptr();
-            }
-
-            size_t bytes() const {
-                return base.bytes();
-            }
-        private:
-            Base base;
-            size_t nrows;
-    };
-};
-
-} // namespace relaxation
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/relaxation/as_preconditioner.hpp b/src/solvers/amgcl/relaxation/as_preconditioner.hpp
deleted file mode 100644
index 7e6a608..0000000
--- a/src/solvers/amgcl/relaxation/as_preconditioner.hpp
+++ /dev/null
@@ -1,125 +0,0 @@
-#ifndef AMGCL_RELAXATION_AS_PRECONDITIONER_HPP
-#define AMGCL_RELAXATION_AS_PRECONDITIONER_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/relaxation/as_preconditioner.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Use an amgcl smoother as a standalone preconditioner.
- */
-
-#include <vector>
-#include <memory>
-#include <amgcl/backend/builtin.hpp>
-
-namespace amgcl {
-namespace relaxation {
-
-/// Allows to use an amgcl smoother as standalone preconditioner.
-template <class Backend, template <class> class Relax>
-class as_preconditioner {
-    public:
-        typedef Backend backend_type;
-
-        typedef Relax<Backend>            smoother;
-
-        typedef typename Backend::matrix  matrix;
-        typedef typename Backend::vector  vector;
-        typedef typename smoother::params params;
-        typedef typename Backend::params  backend_params;
-
-        typedef typename Backend::value_type value_type;
-        typedef typename Backend::col_type col_type;
-        typedef typename Backend::ptr_type ptr_type;
-        typedef typename backend::builtin<value_type, col_type, ptr_type>::matrix build_matrix;
-
-        template <class Matrix>
-        as_preconditioner(
-                const Matrix &M,
-                const params &prm = params(),
-                const backend_params &bprm = backend_params()
-                )
-            : prm(prm)
-        {
-            init(std::make_shared<build_matrix>(M), bprm);
-        }
-
-        as_preconditioner(
-                std::shared_ptr<build_matrix> M,
-                const params &prm = params(),
-                const backend_params &bprm = backend_params()
-                )
-            : prm(prm)
-        {
-            init(M, bprm);
-        }
-
-        template <class Vec1, class Vec2>
-        void apply(const Vec1 &rhs, Vec2 &&x) const {
-            S->apply(*A, rhs, x);
-        }
-
-        const matrix& system_matrix() const {
-            return *A;
-        }
-
-        std::shared_ptr<matrix> system_matrix_ptr() const {
-            return A;
-        }
-
-        size_t bytes() const {
-            size_t b = 0;
-
-            if (A) b += backend::bytes(*A);
-            if (S) b += backend::bytes(*S);
-
-            return b;
-        }
-    private:
-        params prm;
-
-        std::shared_ptr<matrix>   A;
-        std::shared_ptr<smoother> S;
-
-        void init(std::shared_ptr<build_matrix> M, const backend_params &bprm) {
-            A = Backend::copy_matrix(M, bprm);
-            S = std::make_shared<smoother>(*M, prm, bprm);
-        }
-
-        friend std::ostream& operator<<(std::ostream &os, const as_preconditioner &p) {
-            os << "Relaxation as preconditioner" << std::endl;
-            os << "  Unknowns: " << backend::rows(p.system_matrix()) << std::endl;
-            os << "  Nonzeros: " << backend::nonzeros(p.system_matrix()) << std::endl;
-            os << "  Memory:   " << human_readable_memory(p.bytes()) << std::endl;
-
-            return os;
-        }
-};
-
-} // namespace relaxation
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/relaxation/chebyshev.hpp b/src/solvers/amgcl/relaxation/chebyshev.hpp
deleted file mode 100644
index d3f5dd0..0000000
--- a/src/solvers/amgcl/relaxation/chebyshev.hpp
+++ /dev/null
@@ -1,210 +0,0 @@
-#ifndef AMGCL_RELAXATION_CHEBYSHEV_HPP
-#define AMGCL_RELAXATION_CHEBYSHEV_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-Copyright (c) 2019 Peter Gamnitzer, UIBK (University of Innsbruck)
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/relaxation/chebyshev.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Chebyshev polynomial smoother.
- *
- * Implements Algorithm 1 from
- * P. Ghysels, P. Kłosiewicz, and W. Vanroose.
- * "Improving the arithmetic intensity of multigrid with the help of polynomial smoothers".
- * Numer. Linear Algebra Appl. 2012;19:253-267. DOI: 10.1002/nla.1808
- */
-
-#include <vector>
-#include <cmath>
-
-#include <amgcl/detail/inverse.hpp>
-#include <amgcl/util.hpp>
-
-namespace amgcl {
-namespace relaxation {
-
-/// Chebyshev polynomial smoother.
-/**
- * \param Backend Backend for temporary structures allocation.
- * \ingroup relaxation
- */
-template <class Backend>
-class chebyshev {
-    public:
-        typedef typename Backend::value_type value_type;
-        typedef typename Backend::vector     vector;
-
-        typedef typename math::scalar_of<value_type>::type scalar_type;
-
-        /// Relaxation parameters.
-        struct params {
-            /// Chebyshev polynomial degree.
-            unsigned degree;
-
-            /// highest eigen value safety upscaling.
-            // use boosting factor for a more conservative upper bound estimate
-            // See: Adams, Brezina, Hu, Tuminaro,
-            //      PARALLEL MULTIGRID SMOOTHING: POLYNOMIAL VERSUS
-            //      GAUSS-SEIDEL, J. Comp. Phys. 188 (2003) 593-610.
-            //
-            float higher;
-
-            /// Lowest-to-highest eigen value ratio.
-            float lower;
-
-            // Number of power iterations to apply for the spectral radius
-            // estimation. When 0, use Gershgorin disk theorem to estimate
-            // spectral radius.
-            int power_iters;
-
-            // Scale the system matrix
-            bool scale;
-
-            params()
-                : degree(5), higher(1.0f), lower(1.0f / 30), power_iters(0),
-                  scale(false)
-            {}
-
-#ifndef AMGCL_NO_BOOST
-            params(const boost::property_tree::ptree &p)
-                : AMGCL_PARAMS_IMPORT_VALUE(p, degree),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, higher),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, lower),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, power_iters),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, scale)
-            {
-                check_params(p, {"degree", "higher", "lower", "power_iters", "scale"});
-            }
-
-            void get(boost::property_tree::ptree &p, const std::string &path) const {
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, degree);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, higher);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, lower);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, power_iters);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, scale);
-            }
-#endif
-        } prm;
-
-        /// \copydoc amgcl::relaxation::damped_jacobi::damped_jacobi
-        template <class Matrix>
-        chebyshev(
-                const Matrix &A, const params &prm,
-                const typename Backend::params &backend_prm
-            ) : prm(prm),
-                p( Backend::create_vector(rows(A), backend_prm) ),
-                r( Backend::create_vector(rows(A), backend_prm) )
-        {
-            scalar_type hi, lo;
-
-            using backend::spectral_radius;
-
-            if (prm.scale) {
-                M  = Backend::copy_vector( diagonal(A, /*invert*/true), backend_prm );
-                hi = spectral_radius<true>(A, prm.power_iters);
-            } else {
-                hi = spectral_radius<false>(A, prm.power_iters);
-            }
-
-            lo = hi * prm.lower;
-            hi *= prm.higher;
-
-            // Centre of ellipse containing the eigenvalues of A:
-            d = 0.5 * (hi + lo);
-
-            // Semi-major axis of ellipse containing the eigenvalues of A:
-            c = 0.5 * (hi - lo);
-        }
-
-        template <class Matrix, class VectorRHS, class VectorX, class VectorTMP>
-        void apply_pre(
-                const Matrix &A, const VectorRHS &rhs, VectorX &x, VectorTMP&
-                ) const
-        {
-            solve(A, rhs, x);
-        }
-
-        template <class Matrix, class VectorRHS, class VectorX, class VectorTMP>
-        void apply_post(
-                const Matrix &A, const VectorRHS &rhs, VectorX &x, VectorTMP&
-                ) const
-        {
-            solve(A, rhs, x);
-        }
-
-        template <class Matrix, class VectorRHS, class VectorX>
-        void apply(const Matrix &A, const VectorRHS &rhs, VectorX &x) const
-        {
-            backend::clear(x);
-            solve(A, rhs, x);
-        }
-
-        size_t bytes() const {
-            size_t b = backend::bytes(*p) + backend::bytes(*r);
-            if (prm.scale) b += backend::bytes(*M);
-            return b;
-        }
-
-    private:
-        std::shared_ptr<typename Backend::matrix_diagonal> M;
-        mutable std::shared_ptr<vector> p, r;
-
-        scalar_type c, d;
-
-        template <class Matrix, class VectorB, class VectorX>
-        void solve(const Matrix &A, const VectorB &b, VectorX &x) const
-        {
-            static const scalar_type one  = math::identity<scalar_type>();
-            static const scalar_type zero = math::zero<scalar_type>();
-
-            scalar_type alpha = zero, beta = zero;
-
-            for (unsigned k = 0; k < prm.degree; ++k) {
-                backend::residual(b, A, x, *r);
-
-                if (prm.scale) backend::vmul(one, *M, *r, zero, *r);
-
-                if (k == 0) {
-                    alpha = math::inverse(d);
-                    beta  = zero;
-                } else if (k == 1) {
-                    alpha = 2 * d * math::inverse(2 * d * d - c * c);
-                    beta  = alpha * d - one;
-                } else {
-                    alpha = math::inverse(d - 0.25 * alpha * c * c);
-                    beta  = alpha * d - one;
-                }
-
-                backend::axpby(alpha, *r, beta, *p);
-                backend::axpby(one, *p, one, x);
-            }
-        }
-};
-
-} // namespace relaxation
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/relaxation/cusparse_ilu0.hpp b/src/solvers/amgcl/relaxation/cusparse_ilu0.hpp
deleted file mode 100644
index 4a4a479..0000000
--- a/src/solvers/amgcl/relaxation/cusparse_ilu0.hpp
+++ /dev/null
@@ -1,548 +0,0 @@
-#ifndef AMGCL_RELAXATION_CUSPARSE_ILU0_HPP
-#define AMGCL_RELAXATION_CUSPARSE_ILU0_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/relaxation/cusparse_ilu0.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Implementation of ILU0 smoother for CUDA backend.
- */
-
-#include <type_traits>
-
-#include <thrust/device_vector.h>
-#include <cusparse_v2.h>
-
-#include <amgcl/backend/cuda.hpp>
-
-namespace amgcl {
-namespace relaxation {
-
-template <class Backend> struct ilu0;
-
-template <typename real>
-struct ilu0< backend::cuda<real> > {
-    typedef real value_type;
-    typedef backend::cuda<double> Backend;
-
-    struct params {
-        /// Damping factor.
-        float damping;
-
-        params() : damping(1) {}
-
-#ifndef AMGCL_NO_BOOST
-        params(const boost::property_tree::ptree &p)
-            : AMGCL_PARAMS_IMPORT_VALUE(p, damping)
-        {
-            check_params(p, {"damping"});
-        }
-
-        void get(boost::property_tree::ptree &p, const std::string &path) const {
-            AMGCL_PARAMS_EXPORT_VALUE(p, path, damping);
-        }
-#endif
-    } prm;
-
-    /// \copydoc amgcl::relaxation::damped_jacobi::damped_jacobi
-    template <class Matrix>
-    ilu0( const Matrix &A, const params &prm, const typename Backend::params &bprm)
-        : prm(prm), handle(bprm.cusparse_handle),
-          n(backend::rows(A)), nnz(backend::nonzeros(A)),
-          ptr(A.ptr, A.ptr + n+1),
-          col(A.col, A.col + nnz),
-          val(A.val, A.val + nnz),
-          y(n)
-    {
-        // Create matrix descriptors.
-        {
-            cusparseMatDescr_t descr;
-
-            AMGCL_CALL_CUDA( cusparseCreateMatDescr(&descr) );
-            AMGCL_CALL_CUDA( cusparseSetMatIndexBase(descr, CUSPARSE_INDEX_BASE_ZERO) );
-            AMGCL_CALL_CUDA( cusparseSetMatType(descr, CUSPARSE_MATRIX_TYPE_GENERAL) );
-
-            descr_M.reset(descr, backend::detail::cuda_deleter());
-        }
-        {
-            cusparseMatDescr_t descr;
-
-            AMGCL_CALL_CUDA( cusparseCreateMatDescr(&descr) );
-            AMGCL_CALL_CUDA( cusparseSetMatIndexBase(descr, CUSPARSE_INDEX_BASE_ZERO) );
-            AMGCL_CALL_CUDA( cusparseSetMatType(descr, CUSPARSE_MATRIX_TYPE_GENERAL) );
-            AMGCL_CALL_CUDA( cusparseSetMatFillMode(descr, CUSPARSE_FILL_MODE_LOWER) );
-            AMGCL_CALL_CUDA( cusparseSetMatDiagType(descr, CUSPARSE_DIAG_TYPE_UNIT) );
-
-            descr_L.reset(descr, backend::detail::cuda_deleter());
-        }
-        {
-            cusparseMatDescr_t descr;
-
-            AMGCL_CALL_CUDA( cusparseCreateMatDescr(&descr) );
-            AMGCL_CALL_CUDA( cusparseSetMatIndexBase(descr, CUSPARSE_INDEX_BASE_ZERO) );
-            AMGCL_CALL_CUDA( cusparseSetMatType(descr, CUSPARSE_MATRIX_TYPE_GENERAL) );
-            AMGCL_CALL_CUDA( cusparseSetMatFillMode(descr, CUSPARSE_FILL_MODE_UPPER) );
-            AMGCL_CALL_CUDA( cusparseSetMatDiagType(descr, CUSPARSE_DIAG_TYPE_NON_UNIT) );
-
-            descr_U.reset(descr, backend::detail::cuda_deleter());
-        }
-
-        // Create info structures.
-        {
-            csrilu02Info_t info;
-            AMGCL_CALL_CUDA( cusparseCreateCsrilu02Info(&info) );
-            info_M.reset(info, backend::detail::cuda_deleter());
-        }
-        {
-            csrsv2Info_t info;
-            AMGCL_CALL_CUDA( cusparseCreateCsrsv2Info(&info) );
-            info_L.reset(info, backend::detail::cuda_deleter());
-        }
-        {
-            csrsv2Info_t info;
-            AMGCL_CALL_CUDA( cusparseCreateCsrsv2Info(&info) );
-            info_U.reset(info, backend::detail::cuda_deleter());
-        }
-
-        // Allocate scratch buffer.
-        {
-            const cusparseOperation_t trans_L  = CUSPARSE_OPERATION_NON_TRANSPOSE;
-            const cusparseOperation_t trans_U  = CUSPARSE_OPERATION_NON_TRANSPOSE;
-
-            int buf_size_M;
-            int buf_size_L;
-            int buf_size_U;
-
-            AMGCL_CALL_CUDA(
-                    cusparseXcsrilu02_bufferSize(
-                        handle, n, nnz, descr_M.get(),
-                        thrust::raw_pointer_cast(&val[0]),
-                        thrust::raw_pointer_cast(&ptr[0]),
-                        thrust::raw_pointer_cast(&col[0]),
-                        info_M.get(), &buf_size_M
-                        )
-                    );
-            AMGCL_CALL_CUDA(
-                    cusparseXcsrsv2_bufferSize(
-                        handle, trans_L, n, nnz, descr_L.get(),
-                        thrust::raw_pointer_cast(&val[0]),
-                        thrust::raw_pointer_cast(&ptr[0]),
-                        thrust::raw_pointer_cast(&col[0]),
-                        info_L.get(), &buf_size_L
-                        )
-                    );
-            AMGCL_CALL_CUDA(
-                    cusparseXcsrsv2_bufferSize(
-                        handle, trans_U, n, nnz, descr_U.get(),
-                        thrust::raw_pointer_cast(&val[0]),
-                        thrust::raw_pointer_cast(&ptr[0]),
-                        thrust::raw_pointer_cast(&col[0]),
-                        info_U.get(), &buf_size_U
-                        )
-                    );
-
-            buf.resize( std::max(buf_size_M, std::max(buf_size_L, buf_size_U)) );
-        }
-
-        // Analysis and incomplete factorization of the system matrix.
-        int structural_zero;
-        int numerical_zero;
-
-        AMGCL_CALL_CUDA(
-                cusparseXcsrilu02_analysis(handle, n, nnz, descr_M.get(),
-                    thrust::raw_pointer_cast(&val[0]),
-                    thrust::raw_pointer_cast(&ptr[0]),
-                    thrust::raw_pointer_cast(&col[0]),
-                    info_M.get(), policy_M,
-                    thrust::raw_pointer_cast(&buf[0])
-                    )
-                );
-
-        precondition(
-                CUSPARSE_STATUS_ZERO_PIVOT != cusparseXcsrilu02_zeroPivot(handle, info_M.get(), &structural_zero),
-                "Zero pivot in cuSPARSE ILU0"
-                );
-
-        AMGCL_CALL_CUDA(
-                cusparseXcsrsv2_analysis(
-                    handle, trans_L, n, nnz, descr_L.get(),
-                    thrust::raw_pointer_cast(&val[0]),
-                    thrust::raw_pointer_cast(&ptr[0]),
-                    thrust::raw_pointer_cast(&col[0]),
-                    info_L.get(), policy_L,
-                    thrust::raw_pointer_cast(&buf[0])
-                    )
-                );
-
-        AMGCL_CALL_CUDA(
-                cusparseXcsrsv2_analysis(
-                    handle, trans_U, n, nnz, descr_U.get(),
-                    thrust::raw_pointer_cast(&val[0]),
-                    thrust::raw_pointer_cast(&ptr[0]),
-                    thrust::raw_pointer_cast(&col[0]),
-                    info_U.get(), policy_U,
-                    thrust::raw_pointer_cast(&buf[0])
-                    )
-                );
-
-        AMGCL_CALL_CUDA(
-                cusparseXcsrilu02(
-                    handle, n, nnz, descr_M.get(),
-                    thrust::raw_pointer_cast(&val[0]),
-                    thrust::raw_pointer_cast(&ptr[0]),
-                    thrust::raw_pointer_cast(&col[0]),
-                    info_M.get(), policy_M,
-                    thrust::raw_pointer_cast(&buf[0])
-                    )
-                );
-        precondition(
-              CUSPARSE_STATUS_ZERO_PIVOT != cusparseXcsrilu02_zeroPivot(handle, info_M.get(), &numerical_zero),
-              "Zero pivot in cuSPARSE ILU0"
-              );
-    }
-
-    /// \copydoc amgcl::relaxation::damped_jacobi::apply_pre
-    template <class Matrix, class VectorRHS, class VectorX, class VectorTMP>
-    void apply_pre(
-            const Matrix &A, const VectorRHS &rhs, VectorX &x, VectorTMP &tmp
-            ) const
-    {
-        backend::residual(rhs, A, x, tmp);
-        solve(tmp);
-        backend::axpby(prm.damping, tmp, 1, x);
-    }
-
-    /// \copydoc amgcl::relaxation::damped_jacobi::apply_post
-    template <class Matrix, class VectorRHS, class VectorX, class VectorTMP>
-    void apply_post(
-            const Matrix &A, const VectorRHS &rhs, VectorX &x, VectorTMP &tmp
-            ) const
-    {
-        backend::residual(rhs, A, x, tmp);
-        solve(tmp);
-        backend::axpby(prm.damping, tmp, 1, x);
-    }
-
-    template <class Matrix, class VectorRHS, class VectorX>
-    void apply(const Matrix &A, const VectorRHS &rhs, VectorX &x) const
-    {
-        backend::copy(rhs, x);
-        solve(x);
-    }
-
-    size_t bytes() const {
-        // This is incomplete, as cusparse structs are opaque.
-        return
-            backend::bytes(ptr) +
-            backend::bytes(col) +
-            backend::bytes(val) +
-            backend::bytes(y) +
-            backend::bytes(buf);
-    }
-
-    private:
-        static const cusparseSolvePolicy_t policy_M = CUSPARSE_SOLVE_POLICY_NO_LEVEL;
-        static const cusparseSolvePolicy_t policy_L = CUSPARSE_SOLVE_POLICY_USE_LEVEL;
-        static const cusparseSolvePolicy_t policy_U = CUSPARSE_SOLVE_POLICY_USE_LEVEL;
-        static const cusparseOperation_t   trans_L  = CUSPARSE_OPERATION_NON_TRANSPOSE;
-        static const cusparseOperation_t   trans_U  = CUSPARSE_OPERATION_NON_TRANSPOSE;
-
-        cusparseHandle_t handle;
-        int n, nnz;
-
-        std::shared_ptr<std::remove_pointer<cusparseMatDescr_t>::type> descr_M, descr_L, descr_U;
-        std::shared_ptr<std::remove_pointer<csrilu02Info_t>::type> info_M;
-        std::shared_ptr<std::remove_pointer<csrsv2Info_t>::type>  info_L, info_U;
-
-        thrust::device_vector<int> ptr, col;
-        thrust::device_vector<value_type> val;
-        mutable thrust::device_vector<value_type> y;
-        mutable thrust::device_vector<char> buf;
-
-
-        template <class VectorX>
-        void solve(VectorX &x) const {
-            value_type alpha = 1;
-
-            // Solve L * y = x
-            AMGCL_CALL_CUDA(
-                    cusparseXcsrsv2_solve(
-                        handle, trans_L, n, nnz, &alpha, descr_L.get(),
-                        thrust::raw_pointer_cast(&val[0]),
-                        thrust::raw_pointer_cast(&ptr[0]),
-                        thrust::raw_pointer_cast(&col[0]),
-                        info_L.get(),
-                        thrust::raw_pointer_cast(&x[0]),
-                        thrust::raw_pointer_cast(&y[0]),
-                        policy_L,
-                        thrust::raw_pointer_cast(&buf[0])
-                        )
-                    );
-
-            // Solve U * x = y
-            AMGCL_CALL_CUDA(
-                    cusparseXcsrsv2_solve(
-                        handle, trans_U, n, nnz, &alpha, descr_U.get(),
-                        thrust::raw_pointer_cast(&val[0]),
-                        thrust::raw_pointer_cast(&ptr[0]),
-                        thrust::raw_pointer_cast(&col[0]),
-                        info_U.get(),
-                        thrust::raw_pointer_cast(&y[0]),
-                        thrust::raw_pointer_cast(&x[0]),
-                        policy_U,
-                        thrust::raw_pointer_cast(&buf[0])
-                        )
-                    );
-        }
-
-
-        static cusparseStatus_t cusparseXcsrilu02_bufferSize(
-                cusparseHandle_t handle,
-                int m,
-                int nnz,
-                const cusparseMatDescr_t descrA,
-                double *csrSortedValA,
-                const int *csrSortedRowPtrA,
-                const int *csrSortedColIndA,
-                csrilu02Info_t info,
-                int *pBufferSizeInBytes)
-        {
-            return cusparseDcsrilu02_bufferSize(
-                handle, m, nnz, descrA, csrSortedValA, csrSortedRowPtrA,
-                csrSortedColIndA, info, pBufferSizeInBytes);
-        }
-
-        static cusparseStatus_t cusparseXcsrilu02_bufferSize(
-                cusparseHandle_t handle,
-                int m,
-                int nnz,
-                const cusparseMatDescr_t descrA,
-                float *csrSortedValA,
-                const int *csrSortedRowPtrA,
-                const int *csrSortedColIndA,
-                csrilu02Info_t info,
-                int *pBufferSizeInBytes)
-        {
-            return cusparseScsrilu02_bufferSize(
-                handle, m, nnz, descrA, csrSortedValA, csrSortedRowPtrA,
-                csrSortedColIndA, info, pBufferSizeInBytes);
-        }
-
-        static cusparseStatus_t cusparseXcsrsv2_bufferSize(
-                cusparseHandle_t handle,
-                cusparseOperation_t transA,
-                int m,
-                int nnz,
-                const cusparseMatDescr_t descrA,
-                double *csrSortedValA,
-                const int *csrSortedRowPtrA,
-                const int *csrSortedColIndA,
-                csrsv2Info_t info,
-                int *pBufferSizeInBytes
-                )
-        {
-            return cusparseDcsrsv2_bufferSize(
-                handle, transA, m, nnz, descrA, csrSortedValA,
-                csrSortedRowPtrA, csrSortedColIndA, info, pBufferSizeInBytes);
-        }
-
-        static cusparseStatus_t cusparseXcsrsv2_bufferSize(
-                cusparseHandle_t handle,
-                cusparseOperation_t transA,
-                int m,
-                int nnz,
-                const cusparseMatDescr_t descrA,
-                float *csrSortedValA,
-                const int *csrSortedRowPtrA,
-                const int *csrSortedColIndA,
-                csrsv2Info_t info,
-                int *pBufferSizeInBytes
-                )
-        {
-            return cusparseScsrsv2_bufferSize(
-                handle, transA, m, nnz, descrA, csrSortedValA,
-                csrSortedRowPtrA, csrSortedColIndA, info, pBufferSizeInBytes);
-        }
-
-        static cusparseStatus_t cusparseXcsrilu02_analysis(
-                cusparseHandle_t handle,
-                int m,
-                int nnz,
-                const cusparseMatDescr_t descrA,
-                const double *csrSortedValA,
-                const int *csrSortedRowPtrA,
-                const int *csrSortedColIndA,
-                csrilu02Info_t info,
-                cusparseSolvePolicy_t policy,
-                void *pBuffer
-                )
-        {
-            return cusparseDcsrilu02_analysis(
-                handle, m, nnz, descrA, csrSortedValA,
-                csrSortedRowPtrA, csrSortedColIndA, info, policy, pBuffer);
-        }
-
-        static cusparseStatus_t cusparseXcsrilu02_analysis(
-                cusparseHandle_t handle,
-                int m,
-                int nnz,
-                const cusparseMatDescr_t descrA,
-                const float *csrSortedValA,
-                const int *csrSortedRowPtrA,
-                const int *csrSortedColIndA,
-                csrilu02Info_t info,
-                cusparseSolvePolicy_t policy,
-                void *pBuffer
-                )
-        {
-            return cusparseScsrilu02_analysis(
-                handle, m, nnz, descrA, csrSortedValA,
-                csrSortedRowPtrA, csrSortedColIndA, info, policy, pBuffer);
-        }
-
-        static cusparseStatus_t cusparseXcsrsv2_analysis(
-                cusparseHandle_t handle,
-                cusparseOperation_t transA,
-                int m,
-                int nnz,
-                const cusparseMatDescr_t descrA,
-                const double *csrSortedValA,
-                const int *csrSortedRowPtrA,
-                const int *csrSortedColIndA,
-                csrsv2Info_t info,
-                cusparseSolvePolicy_t policy,
-                void *pBuffer
-                )
-        {
-            return cusparseDcsrsv2_analysis(
-                    handle, transA, m, nnz, descrA, csrSortedValA,
-                    csrSortedRowPtrA, csrSortedColIndA, info, policy, pBuffer);
-        }
-
-        static cusparseStatus_t cusparseXcsrsv2_analysis(
-                cusparseHandle_t handle,
-                cusparseOperation_t transA,
-                int m,
-                int nnz,
-                const cusparseMatDescr_t descrA,
-                const float *csrSortedValA,
-                const int *csrSortedRowPtrA,
-                const int *csrSortedColIndA,
-                csrsv2Info_t info,
-                cusparseSolvePolicy_t policy,
-                void *pBuffer
-                )
-        {
-            return cusparseScsrsv2_analysis(
-                    handle, transA, m, nnz, descrA, csrSortedValA,
-                    csrSortedRowPtrA, csrSortedColIndA, info, policy, pBuffer);
-        }
-
-        static cusparseStatus_t cusparseXcsrilu02(cusparseHandle_t handle,
-                int m,
-                int nnz,
-                const cusparseMatDescr_t descrA,
-                double *csrSortedValA_valM,
-                const int *csrSortedRowPtrA,
-                const int *csrSortedColIndA,
-                csrilu02Info_t info,
-                cusparseSolvePolicy_t policy,
-                void *pBuffer
-                )
-        {
-            return cusparseDcsrilu02(handle, m, nnz, descrA,
-                    csrSortedValA_valM, csrSortedRowPtrA, csrSortedColIndA,
-                    info, policy, pBuffer);
-        }
-
-        static cusparseStatus_t cusparseXcsrilu02(cusparseHandle_t handle,
-                int m,
-                int nnz,
-                const cusparseMatDescr_t descrA,
-                float *csrSortedValA_valM,
-                const int *csrSortedRowPtrA,
-                const int *csrSortedColIndA,
-                csrilu02Info_t info,
-                cusparseSolvePolicy_t policy,
-                void *pBuffer
-                )
-        {
-            return cusparseScsrilu02(handle, m, nnz, descrA,
-                    csrSortedValA_valM, csrSortedRowPtrA, csrSortedColIndA,
-                    info, policy, pBuffer);
-        }
-
-        static cusparseStatus_t cusparseXcsrsv2_solve(
-                cusparseHandle_t handle,
-                cusparseOperation_t transA,
-                int m,
-                int nnz,
-                const double *alpha,
-                const cusparseMatDescr_t descrA,
-                const double *csrSortedValA,
-                const int *csrSortedRowPtrA,
-                const int *csrSortedColIndA,
-                csrsv2Info_t info,
-                const double *f,
-                double *x,
-                cusparseSolvePolicy_t policy,
-                void *pBuffer
-                )
-        {
-            return cusparseDcsrsv2_solve(
-                    handle, transA, m,
-                    nnz, alpha, descrA, csrSortedValA, csrSortedRowPtrA,
-                    csrSortedColIndA, info, f, x, policy, pBuffer);
-        }
-
-        static cusparseStatus_t cusparseXcsrsv2_solve(
-                cusparseHandle_t handle,
-                cusparseOperation_t transA,
-                int m,
-                int nnz,
-                const float *alpha,
-                const cusparseMatDescr_t descrA,
-                const float *csrSortedValA,
-                const int *csrSortedRowPtrA,
-                const int *csrSortedColIndA,
-                csrsv2Info_t info,
-                const float *f,
-                float *x,
-                cusparseSolvePolicy_t policy,
-                void *pBuffer
-                )
-        {
-            return cusparseScsrsv2_solve(
-                    handle, transA, m,
-                    nnz, alpha, descrA, csrSortedValA, csrSortedRowPtrA,
-                    csrSortedColIndA, info, f, x, policy, pBuffer);
-        }
-};
-
-} // namespace relaxation
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/relaxation/damped_jacobi.hpp b/src/solvers/amgcl/relaxation/damped_jacobi.hpp
deleted file mode 100644
index ad6dae0..0000000
--- a/src/solvers/amgcl/relaxation/damped_jacobi.hpp
+++ /dev/null
@@ -1,143 +0,0 @@
-#ifndef AMGCL_RELAXATION_DAMPED_JACOBI_HPP
-#define AMGCL_RELAXATION_DAMPED_JACOBI_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/relaxation/damped_jacobi.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Damped Jacobi relaxation scheme.
- */
-
-#include <memory>
-#include <amgcl/backend/interface.hpp>
-#include <amgcl/util.hpp>
-
-namespace amgcl {
-
-/// Smoothers
-namespace relaxation {
-
-/**
- * \defgroup relaxation
- * \brief Relaxation schemes
- */
-
-/// Damped Jacobi relaxation.
-/**
- * \param Backend Backend for temporary structures allocation.
- * \ingroup relaxation
- */
-template <class Backend>
-struct damped_jacobi {
-    typedef typename Backend::value_type               value_type;
-    typedef typename math::scalar_of<value_type>::type scalar_type;
-
-    /// Relaxation parameters.
-    struct params {
-        /// Damping factor.
-        scalar_type damping;
-
-        params(scalar_type damping = 0.72) : damping(damping) {}
-
-#ifndef AMGCL_NO_BOOST
-        params(const boost::property_tree::ptree &p)
-            : AMGCL_PARAMS_IMPORT_VALUE(p, damping)
-        {
-            check_params(p, {"damping"});
-        }
-
-        void get(boost::property_tree::ptree &p, const std::string &path) const {
-            AMGCL_PARAMS_EXPORT_VALUE(p, path, damping);
-        }
-#endif
-    } prm;
-
-    std::shared_ptr<typename Backend::matrix_diagonal> dia;
-
-    /// Constructs smoother for the system matrix.
-    /**
-     * \param A           The system matrix.
-     * \param prm         Relaxation parameters.
-     * \param backend_prm Backend parameters.
-     */
-    template <class Matrix>
-    damped_jacobi(
-            const Matrix &A,
-            const params &prm,
-            const typename Backend::params &backend_prm
-            )
-        : prm(prm), dia( Backend::copy_vector( diagonal(A, true), backend_prm ) )
-    { }
-
-    /// Apply pre-relaxation
-    /**
-     * \param A   System matrix.
-     * \param rhs Right-hand side.
-     * \param x   Solution vector.
-     * \param tmp Scratch vector.
-     * \param prm Relaxation parameters.
-     */
-    template <class Matrix, class VectorRHS, class VectorX, class VectorTMP>
-    void apply_pre(
-            const Matrix &A, const VectorRHS &rhs, VectorX &x, VectorTMP &tmp
-            ) const
-    {
-        backend::residual(rhs, A, x, tmp);
-        backend::vmul(prm.damping, *dia, tmp, math::identity<scalar_type>(), x);
-    }
-
-    /// Apply post-relaxation
-    /**
-     * \param A   System matrix.
-     * \param rhs Right-hand side.
-     * \param x   Solution vector.
-     * \param tmp Scratch vector.
-     * \param prm Relaxation parameters.
-     */
-    template <class Matrix, class VectorRHS, class VectorX, class VectorTMP>
-    void apply_post(
-            const Matrix &A, const VectorRHS &rhs, VectorX &x, VectorTMP &tmp
-            ) const
-    {
-        backend::residual(rhs, A, x, tmp);
-        backend::vmul(prm.damping, *dia, tmp, math::identity<scalar_type>(), x);
-    }
-
-    template <class Matrix, class VectorRHS, class VectorX>
-    void apply(const Matrix&, const VectorRHS &rhs, VectorX &x) const
-    {
-        backend::vmul(math::identity<scalar_type>(), *dia, rhs, math::zero<scalar_type>(), x);
-    }
-
-    size_t bytes() const {
-        return backend::bytes(*dia);
-    }
-};
-
-} // namespace relaxation
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/relaxation/detail/ilu_solve.hpp b/src/solvers/amgcl/relaxation/detail/ilu_solve.hpp
deleted file mode 100644
index a095855..0000000
--- a/src/solvers/amgcl/relaxation/detail/ilu_solve.hpp
+++ /dev/null
@@ -1,471 +0,0 @@
-#ifndef AMGCL_RELAXATION_DETAIL_ILU_SOLVE_HPP
-#define AMGCL_RELAXATION_DETAIL_ILU_SOLVE_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/relaxation/detail/ilu_solve.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Solver for sparse triangular systems obtained as a result of an
- *         incomplete LU factorization.
- */
-
-#include <amgcl/backend/interface.hpp>
-#include <amgcl/backend/builtin.hpp>
-#include <amgcl/backend/builtin_hybrid.hpp>
-#include <amgcl/util.hpp>
-
-namespace amgcl {
-namespace relaxation {
-namespace detail {
-
-template <class Backend>
-class ilu_solve {
-    public:
-        typedef typename Backend::params backend_params;
-        typedef typename Backend::value_type value_type;
-        typedef typename Backend::col_type col_type;
-        typedef typename Backend::ptr_type ptr_type;
-        typedef typename Backend::matrix matrix;
-        typedef typename Backend::vector vector;
-        typedef typename Backend::matrix_diagonal matrix_diagonal;
-        typedef typename backend::builtin<value_type, col_type, ptr_type>::matrix build_matrix;
-        typedef typename math::scalar_of<value_type>::type scalar_type;
-
-        struct params {
-            /// Number of Jacobi iterations.
-            unsigned    iters;
-
-            /// Damping factor.
-            scalar_type damping;
-
-            params() : iters(2), damping(0.72) {}
-
-#ifndef AMGCL_NO_BOOST
-            params(const boost::property_tree::ptree &p)
-                : AMGCL_PARAMS_IMPORT_VALUE(p, iters)
-                , AMGCL_PARAMS_IMPORT_VALUE(p, damping)
-            {
-                check_params(p, {"iters", "damping"});
-            }
-
-            void get(boost::property_tree::ptree &p, const std::string &path) const {
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, iters);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, damping);
-            }
-#endif
-        } prm;
-
-    public:
-        ilu_solve(
-                std::shared_ptr<build_matrix> L,
-                std::shared_ptr<build_matrix> U,
-                std::shared_ptr<backend::numa_vector<value_type> > D,
-                const params &prm = params(),
-                const backend_params &bprm = backend_params()
-                ) :
-            prm(prm),
-            L(Backend::copy_matrix(L, bprm)),
-            U(Backend::copy_matrix(U, bprm)),
-            D(Backend::copy_vector(D, bprm)),
-            t1(Backend::create_vector(backend::rows(*L), bprm)),
-            t2(Backend::create_vector(backend::rows(*L), bprm))
-        {}
-
-        template <class Vector>
-        void solve(Vector &x) {
-            vector *y0 = t1.get();
-            vector *y1 = t2.get();
-
-            backend::axpby(prm.damping, x, 0.0, *y0);
-            for(unsigned i = 0; i < prm.iters; ++i) {
-                backend::residual(x, *L, *y0, *y1);
-                backend::axpby(prm.damping, *y1, (1-prm.damping), *y0);
-            }
-
-            backend::vmul(prm.damping, *D, *y0, 0.0, x);
-            for(unsigned i = 0; i < prm.iters; ++i) {
-                backend::residual(*y0, *U, x, *y1);
-                backend::vmul(prm.damping, *D, *y1, (1-prm.damping), x);
-            }
-        }
-
-        size_t bytes() const {
-            return
-                backend::bytes(*L) +
-                backend::bytes(*U) +
-                backend::bytes(*D) +
-                backend::bytes(*t1) +
-                backend::bytes(*t2);
-        }
-
-    private:
-        std::shared_ptr<matrix> L;
-        std::shared_ptr<matrix> U;
-        std::shared_ptr<matrix_diagonal> D;
-        std::shared_ptr<vector> t1, t2;
-};
-
-template <class value_type, class col_type, class ptr_type>
-class ilu_solve< backend::builtin<value_type, col_type, ptr_type> > {
-    public:
-        typedef backend::builtin<value_type, col_type, ptr_type> Backend;
-        typedef typename Backend::params backend_params;
-        typedef typename Backend::matrix matrix;
-        typedef typename Backend::vector vector;
-        typedef typename Backend::matrix_diagonal matrix_diagonal;
-        typedef typename backend::builtin<value_type, col_type, ptr_type>::matrix build_matrix;
-        typedef typename Backend::rhs_type rhs_type;
-        typedef typename math::scalar_of<value_type>::type scalar_type;
-
-        struct params {
-            /// Use serial version of the algorithm
-            bool serial;
-
-            params() : serial(num_threads() < 4) {}
-
-#ifndef AMGCL_NO_BOOST
-            params(const boost::property_tree::ptree &p)
-                : AMGCL_PARAMS_IMPORT_VALUE(p, serial)
-            {
-                check_params(p, {"serial"});
-            }
-
-            void get(boost::property_tree::ptree &p, const std::string &path) const {
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, serial);
-            }
-#endif
-        } prm;
-
-        ilu_solve(
-                std::shared_ptr<build_matrix> L,
-                std::shared_ptr<build_matrix> U,
-                std::shared_ptr<backend::numa_vector<value_type> > D,
-                const params &prm = params(),
-                const backend_params& = backend_params()
-                ) : prm(prm)
-        {
-            if (prm.serial)
-                serial_init(L, U, D);
-            else
-                parallel_init(L, U, D);
-        }
-
-        template <class Vector>
-        void solve(Vector &x) {
-            if (prm.serial)
-                serial_solve(x);
-            else
-                parallel_solve(x);
-        }
-
-        size_t bytes() const {
-            size_t b = 0;
-
-            if (L) b += backend::bytes(*L);
-            if (U) b += backend::bytes(*U);
-            if (D) b += backend::bytes(*D);
-
-            if (lower) b += lower->bytes();
-            if (upper) b += upper->bytes();
-
-            return b;
-        }
-
-    private:
-        static int num_threads() {
-#ifdef _OPENMP
-            return omp_get_max_threads();
-#else
-            return 1;
-#endif
-        }
-
-        static int thread_id() {
-#ifdef _OPENMP
-            return omp_get_thread_num();
-#else
-            return 0;
-#endif
-        }
-
-        // copies of the input matrices for the fallback (serial)
-        // implementation:
-        std::shared_ptr<matrix>          L;
-        std::shared_ptr<matrix>          U;
-        std::shared_ptr<matrix_diagonal> D;
-
-        void serial_init(
-                std::shared_ptr<build_matrix>    L,
-                std::shared_ptr<build_matrix>    U,
-                std::shared_ptr<matrix_diagonal> D
-                )
-        {
-            this->L = L;
-            this->U = U;
-            this->D = D;
-        }
-
-        template <class Vector>
-        void serial_solve(Vector &x) {
-            const size_t n = backend::rows(*L);
-
-            const matrix          &L = *(this->L);
-            const matrix          &U = *(this->U);
-            const matrix_diagonal &D = *(this->D);
-
-            for(size_t i = 0; i < n; i++) {
-                for(ptrdiff_t j = L.ptr[i], e = L.ptr[i+1]; j < e; ++j)
-                    x[i] -= L.val[j] * x[L.col[j]];
-            }
-
-            for(size_t i = n; i-- > 0;) {
-                for(ptrdiff_t j = U.ptr[i], e = U.ptr[i+1]; j < e; ++j)
-                    x[i] -= U.val[j] * x[U.col[j]];
-                x[i] = D[i] * x[i];
-            }
-        }
-
-        // OpenMP solver for sparse triangular systems.
-        // The solver uses level scheduling approach.
-        // Each level (a set of matrix rows that can be computed independently)
-        // is split into tasks, a task per thread, and the matrix data is
-        // distributed across threads to improve cache and NUMA locality.
-        template <bool lower>
-        struct sptr_solve {
-            // a task is a set of rows that can be computed independently by a
-            // single thread.
-            struct task {
-                ptrdiff_t beg, end; // rows to process
-
-                task(ptrdiff_t beg, ptrdiff_t end) : beg(beg), end(end) {}
-            };
-
-            int nthreads;
-
-            // thread-specific storage:
-            std::vector< std::vector<task>       > tasks;
-            std::vector< std::vector<ptrdiff_t>  > ptr;
-            std::vector< std::vector<ptrdiff_t>  > col;
-            std::vector< std::vector<value_type> > val;
-            std::vector< std::vector<ptrdiff_t>  > ord; // rows ordered by levels
-            std::vector< std::vector<value_type> > D;
-
-            template <class Matrix>
-            sptr_solve(const Matrix &A, const value_type *_D = 0)
-                : nthreads(num_threads()), tasks(nthreads),
-                  ptr(nthreads), col(nthreads), val(nthreads), ord(nthreads)
-            {
-                ptrdiff_t n    = A.nrows;
-                ptrdiff_t nlev = 0;
-
-                std::vector<ptrdiff_t> level(n, 0);
-                std::vector<ptrdiff_t> order(n, 0);
-
-
-                // 1. split rows into levels.
-                ptrdiff_t beg = lower ? 0 : n-1;
-                ptrdiff_t end = lower ? n :  -1;
-                ptrdiff_t inc = lower ? 1 :  -1;
-
-                for(ptrdiff_t i = beg; i != end; i += inc) {
-                    ptrdiff_t l = level[i];
-
-                    for(auto j = A.ptr[i]; j < A.ptr[i+1]; ++j)
-                        l = std::max(l, level[A.col[j]]+1);
-
-                    level[i] = l;
-                    nlev = std::max(nlev, l+1);
-                }
-
-
-                // 2. reorder matrix rows.
-                std::vector<ptrdiff_t> start(nlev+1, 0);
-
-                for(ptrdiff_t i = 0; i < n; ++i)
-                    ++start[level[i]+1];
-
-                std::partial_sum(start.begin(), start.end(), start.begin());
-
-                for(ptrdiff_t i = 0; i < n; ++i)
-                    order[start[level[i]]++] = i;
-
-                std::rotate(start.begin(), start.end() - 1, start.end());
-                start[0] = 0;
-
-
-                // 3. Organize matrix rows into tasks.
-                //    Each level is split into nthreads tasks.
-                std::vector<ptrdiff_t> thread_rows(nthreads, 0);
-                std::vector<ptrdiff_t> thread_cols(nthreads, 0);
-
-#pragma omp parallel
-                {
-                    int tid = thread_id();
-                    tasks[tid].reserve(nlev);
-
-                    for(ptrdiff_t lev = 0; lev < nlev; ++lev) {
-                        // split each level into tasks.
-                        ptrdiff_t lev_size = start[lev+1] - start[lev];
-                        ptrdiff_t chunk_size = (lev_size + nthreads - 1) / nthreads;
-
-                        ptrdiff_t beg = std::min(tid * chunk_size, lev_size);
-                        ptrdiff_t end = std::min(beg + chunk_size, lev_size);
-
-                        beg += start[lev];
-                        end += start[lev];
-
-                        tasks[tid].push_back(task(beg, end));
-
-                        // count rows and nonzeros in the current task
-                        thread_rows[tid] += end - beg;
-                        for(ptrdiff_t i = beg; i < end; ++i) {
-                            ptrdiff_t j = order[i];
-                            thread_cols[tid] += A.ptr[j+1] - A.ptr[j];
-                        }
-                    }
-                }
-
-                // 4. reorganize matrix data for better cache and NUMA locality.
-                if (!lower) D.resize(nthreads);
-
-#pragma omp parallel
-                {
-                    int tid = thread_id();
-
-                    col[tid].reserve(thread_cols[tid]);
-                    val[tid].reserve(thread_cols[tid]);
-                    ord[tid].reserve(thread_rows[tid]);
-                    ptr[tid].reserve(thread_rows[tid] + 1);
-                    ptr[tid].push_back(0);
-
-                    if (!lower) D[tid].reserve(thread_rows[tid]);
-
-                    for(task &t : tasks[tid]) {
-                        ptrdiff_t loc_beg = ptr[tid].size() - 1;
-                        ptrdiff_t loc_end = loc_beg;
-
-                        for(ptrdiff_t r = t.beg; r < t.end; ++r, ++loc_end) {
-                            ptrdiff_t i = order[r];
-                            if (!lower) D[tid].push_back(_D[i]);
-
-                            ord[tid].push_back(i);
-
-                            for(auto j = A.ptr[i]; j < A.ptr[i+1]; ++j) {
-                                col[tid].push_back(A.col[j]);
-                                val[tid].push_back(A.val[j]);
-                            }
-
-                            ptr[tid].push_back(col[tid].size());
-                        }
-
-                        t.beg = loc_beg;
-                        t.end = loc_end;
-                    }
-                }
-            }
-
-            template <class Vector>
-            void solve(Vector &x) const {
-#pragma omp parallel
-                {
-                    int tid = thread_id();
-
-                    for(const task &t : tasks[tid]) {
-                        for(ptrdiff_t r = t.beg; r < t.end; ++r) {
-                            ptrdiff_t i   = ord[tid][r];
-                            ptrdiff_t beg = ptr[tid][r];
-                            ptrdiff_t end = ptr[tid][r+1];
-
-                            rhs_type X = math::zero<rhs_type>();
-                            for(ptrdiff_t j = beg; j < end; ++j)
-                                X += val[tid][j] * x[col[tid][j]];
-
-                            if (lower)
-                                x[i] -= X;
-                            else
-                                x[i] = D[tid][r] * (x[i] - X);
-                        }
-
-                        // each task corresponds to a level, so we need
-                        // to synchronize across threads at this point:
-#pragma omp barrier
-                        ;
-                    }
-                }
-            }
-
-            size_t bytes() const {
-                size_t b = 0;
-
-                for(int i = 0; i < nthreads; ++i) {
-                    b += sizeof(task) * tasks[i].size();
-                    b += backend::bytes(ptr[i]);
-                    b += backend::bytes(col[i]);
-                    b += backend::bytes(val[i]);
-                    b += backend::bytes(ord[i]);
-
-                    if (!lower) b += backend::bytes(D[i]);
-                }
-
-                return b;
-            }
-        };
-
-        std::shared_ptr< sptr_solve<true > > lower;
-        std::shared_ptr< sptr_solve<false> > upper;
-
-        void parallel_init(
-                std::shared_ptr<build_matrix> L,
-                std::shared_ptr<build_matrix> U,
-                std::shared_ptr<backend::numa_vector<value_type> > D
-                )
-        {
-            lower = std::make_shared< sptr_solve<true > >(*L, D->data());
-            upper = std::make_shared< sptr_solve<false> >(*U, D->data());
-        }
-
-        template <class Vector>
-        void parallel_solve(Vector &x) {
-            lower->solve(x);
-            upper->solve(x);
-        }
-};
-
-template <class Block, class Col, class Ptr>
-class ilu_solve< backend::builtin_hybrid<Block, Col, Ptr> >
-    : public ilu_solve< backend::builtin<typename math::scalar_of<Block>::type, Col, Ptr> >
-{
-    typedef ilu_solve< backend::builtin<typename math::scalar_of<Block>::type, Col, Ptr> > Base;
-
-    public:
-        using Base::Base;
-};
-
-} // namespace detail
-} // namespace relaxation
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/relaxation/gauss_seidel.hpp b/src/solvers/amgcl/relaxation/gauss_seidel.hpp
deleted file mode 100644
index 7e8c648..0000000
--- a/src/solvers/amgcl/relaxation/gauss_seidel.hpp
+++ /dev/null
@@ -1,395 +0,0 @@
-#ifndef AMGCL_RELAXATION_GAUSS_SEIDEL_HPP
-#define AMGCL_RELAXATION_GAUSS_SEIDEL_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/relaxation/gauss_seidel.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Gauss-Seidel relaxation scheme.
- */
-
-#include <numeric>
-
-#include <memory>
-
-#include <amgcl/backend/interface.hpp>
-#include <amgcl/util.hpp>
-
-#ifdef _OPENMP
-#  include <omp.h>
-#endif
-
-namespace amgcl {
-namespace relaxation {
-
-/// Gauss-Seidel relaxation.
-/**
- * \note This is a serial relaxation and is only applicable to backends that
- * support matrix row iteration (e.g. amgcl::backend::builtin or
- * amgcl::backend::eigen).
- *
- * \param Backend Backend for temporary structures allocation.
- * \ingroup relaxation
- */
-template <class Backend>
-struct gauss_seidel {
-    /// Relaxation parameters.
-    struct params {
-        /// Use serial version of the algorithm
-        bool serial;
-
-        params() : serial(false) {}
-
-#ifndef AMGCL_NO_BOOST
-        params(const boost::property_tree::ptree &p)
-            : AMGCL_PARAMS_IMPORT_VALUE(p, serial)
-        {
-            check_params(p, {"serial"});
-        }
-
-        void get(boost::property_tree::ptree &p, const std::string &path) const {
-            AMGCL_PARAMS_EXPORT_VALUE(p, path, serial);
-        }
-#endif
-    };
-
-    bool is_serial;
-
-    /// \copydoc amgcl::relaxation::damped_jacobi::damped_jacobi
-    template <class Matrix>
-    gauss_seidel( const Matrix &A, const params &prm, const typename Backend::params&)
-        : is_serial(prm.serial || num_threads() < 4)
-    {
-        if(!is_serial) {
-            forward  = std::make_shared< parallel_sweep<true>  >(A);
-            backward = std::make_shared< parallel_sweep<false> >(A);
-        }
-    }
-
-    /// \copydoc amgcl::relaxation::damped_jacobi::apply_pre
-    template <class Matrix, class VectorRHS, class VectorX, class VectorTMP>
-    void apply_pre(
-            const Matrix &A, const VectorRHS &rhs, VectorX &x, VectorTMP&
-            ) const
-    {
-        if (is_serial)
-            serial_sweep(A, rhs, x, true);
-        else
-            forward->sweep(rhs, x);
-    }
-
-    /// \copydoc amgcl::relaxation::damped_jacobi::apply_post
-    template <class Matrix, class VectorRHS, class VectorX, class VectorTMP>
-    void apply_post(
-            const Matrix &A, const VectorRHS &rhs, VectorX &x, VectorTMP&
-            ) const
-    {
-        if (is_serial)
-            serial_sweep(A, rhs, x, false);
-        else
-            backward->sweep(rhs, x);
-    }
-
-    template <class Matrix, class VectorRHS, class VectorX>
-    void apply(const Matrix &A, const VectorRHS &rhs, VectorX &x) const
-    {
-        backend::clear(x);
-        if (is_serial) {
-            serial_sweep(A, rhs, x, true);
-            serial_sweep(A, rhs, x, false);
-        } else {
-            forward->sweep(rhs, x);
-            backward->sweep(rhs, x);
-        }
-    }
-
-    size_t bytes() const {
-        size_t b = 0;
-        if (forward)  b += forward->bytes();
-        if (backward) b += backward->bytes();
-        return b;
-    }
-
-    private:
-        static int num_threads() {
-#ifdef _OPENMP
-            return omp_get_max_threads();
-#else
-            return 1;
-#endif
-        }
-
-        static int thread_id() {
-#ifdef _OPENMP
-            return omp_get_thread_num();
-#else
-            return 0;
-#endif
-        }
-
-        template <class Matrix, class VectorRHS, class VectorX>
-        static void serial_sweep(
-                const Matrix &A, const VectorRHS &rhs, VectorX &x, bool forward)
-        {
-            typedef typename backend::value_type<Matrix>::type val_type;
-            typedef typename math::rhs_of<val_type>::type rhs_type;
-
-            const ptrdiff_t n = backend::rows(A);
-
-            const ptrdiff_t beg = forward ? 0 : n-1;
-            const ptrdiff_t end = forward ? n : -1;
-            const ptrdiff_t inc = forward ? 1 : -1;
-
-            for(ptrdiff_t i = beg; i != end; i += inc) {
-                val_type D = math::identity<val_type>();
-                rhs_type X;
-                X = rhs[i];
-
-                for (auto a = backend::row_begin(A, i); a; ++a) {
-                    ptrdiff_t c = a.col();
-                    val_type  v = a.value();
-
-                    if (c == i)
-                        D = v;
-                    else
-                        X -= v * x[c];
-                }
-
-                x[i] = math::inverse(D) * X;
-            }
-        }
-
-        template <bool forward>
-        struct parallel_sweep {
-            typedef typename Backend::value_type value_type;
-            typedef typename math::rhs_of<value_type>::type rhs_type;
-
-            struct task {
-                ptrdiff_t beg, end;
-                task(ptrdiff_t beg, ptrdiff_t end) : beg(beg), end(end) {}
-            };
-
-            int nthreads;
-
-            // thread-specific storage:
-            std::vector< std::vector<task>       > tasks;
-            std::vector< std::vector<ptrdiff_t>  > ptr;
-            std::vector< std::vector<ptrdiff_t>  > col;
-            std::vector< std::vector<value_type> > val;
-            std::vector< std::vector<ptrdiff_t>  > ord;
-
-            template <class Matrix>
-            parallel_sweep(const Matrix &A)
-                : nthreads(num_threads()), tasks(nthreads),
-                  ptr(nthreads), col(nthreads), val(nthreads), ord(nthreads)
-            {
-                ptrdiff_t n    = backend::rows(A);
-                ptrdiff_t nlev = 0;
-
-                std::vector<ptrdiff_t> level(n, 0);
-                std::vector<ptrdiff_t> order(n, 0);
-
-                // 1. split rows into levels.
-                ptrdiff_t beg = forward ? 0 : n-1;
-                ptrdiff_t end = forward ? n :  -1;
-                ptrdiff_t inc = forward ? 1 :  -1;
-
-                for(ptrdiff_t i = beg; i != end; i += inc) {
-                    ptrdiff_t l = level[i];
-
-                    for(auto a = row_begin(A, i); a; ++a) {
-                        ptrdiff_t c = a.col();
-
-                        if (forward) {
-                            if (c >= i) continue;
-                        } else {
-                            if (c <= i) continue;
-                        }
-
-                        l = std::max(l, level[c]+1);
-                    }
-
-                    level[i] = l;
-                    nlev = std::max(nlev, l+1);
-                }
-
-
-                // 2. reorder matrix rows.
-                std::vector<ptrdiff_t> start(nlev+1, 0);
-
-                for(ptrdiff_t i = 0; i < n; ++i)
-                    ++start[level[i]+1];
-
-                std::partial_sum(start.begin(), start.end(), start.begin());
-
-                for(ptrdiff_t i = 0; i < n; ++i)
-                    order[start[level[i]]++] = i;
-
-                std::rotate(start.begin(), start.end() - 1, start.end());
-                start[0] = 0;
-
-
-                // 3. Organize matrix rows into tasks.
-                //    Each level is split into nthreads tasks.
-                std::vector<ptrdiff_t> thread_rows(nthreads, 0);
-                std::vector<ptrdiff_t> thread_cols(nthreads, 0);
-
-#pragma omp parallel
-                {
-                    int tid = thread_id();
-                    tasks[tid].reserve(nlev);
-
-                    for(ptrdiff_t lev = 0; lev < nlev; ++lev) {
-                        // split each level into tasks.
-                        ptrdiff_t lev_size = start[lev+1] - start[lev];
-                        ptrdiff_t chunk_size = (lev_size + nthreads - 1) / nthreads;
-
-                        ptrdiff_t beg = std::min(tid * chunk_size, lev_size);
-                        ptrdiff_t end = std::min(beg + chunk_size, lev_size);
-
-                        beg += start[lev];
-                        end += start[lev];
-
-                        tasks[tid].push_back(task(beg, end));
-
-                        // count rows and nonzeros in the current task
-                        thread_rows[tid] += end - beg;
-                        for(ptrdiff_t i = beg; i < end; ++i) {
-                            ptrdiff_t j = order[i];
-                            thread_cols[tid] += row_nonzeros(A, j);
-                        }
-                    }
-                }
-
-                // 4. reorganize matrix data for better cache and NUMA locality.
-#pragma omp parallel
-                {
-                    int tid = thread_id();
-
-                    col[tid].reserve(thread_cols[tid]);
-                    val[tid].reserve(thread_cols[tid]);
-                    ord[tid].reserve(thread_rows[tid]);
-                    ptr[tid].reserve(thread_rows[tid] + 1);
-                    ptr[tid].push_back(0);
-
-                    for(task &t : tasks[tid]) {
-                        ptrdiff_t loc_beg = ptr[tid].size() - 1;
-                        ptrdiff_t loc_end = loc_beg;
-
-                        for(ptrdiff_t r = t.beg; r < t.end; ++r, ++loc_end) {
-                            ptrdiff_t i = order[r];
-
-                            ord[tid].push_back(i);
-
-                            for(auto a = row_begin(A, i); a; ++a) {
-                                col[tid].push_back(a.col());
-                                val[tid].push_back(a.value());
-                            }
-
-                            ptr[tid].push_back(col[tid].size());
-                        }
-
-                        t.beg = loc_beg;
-                        t.end = loc_end;
-                    }
-                }
-            }
-
-            template <class Vector1, class Vector2>
-            void sweep(const Vector1 &rhs, Vector2 &x) const {
-#pragma omp parallel
-                {
-                    int tid = thread_id();
-
-                    for(const task &t : tasks[tid]) {
-                        for(ptrdiff_t r = t.beg; r < t.end; ++r) {
-                            ptrdiff_t i   = ord[tid][r];
-                            ptrdiff_t beg = ptr[tid][r];
-                            ptrdiff_t end = ptr[tid][r+1];
-
-                            value_type D = math::identity<value_type>();
-                            rhs_type X;
-                            X = rhs[i];
-
-                            for(ptrdiff_t j = beg; j < end; ++j) {
-                                ptrdiff_t  c = col[tid][j];
-                                value_type v = val[tid][j];
-
-                                if (c == i)
-                                    D = v;
-                                else
-                                    X -= v * x[c];
-                            }
-
-                            x[i] = math::inverse(D) * X;
-                        }
-
-                        // each task corresponds to a level, so we need
-                        // to synchronize across threads at this point:
-#pragma omp barrier
-                        ;
-                    }
-                }
-            }
-
-            size_t bytes() const {
-                size_t b = 0;
-
-                for(int i = 0; i < nthreads; ++i) {
-                    b += sizeof(task) * tasks[i].size();
-                    b += backend::bytes(ptr[i]);
-                    b += backend::bytes(col[i]);
-                    b += backend::bytes(val[i]);
-                    b += backend::bytes(ord[i]);
-                }
-
-                return b;
-            }
-        };
-
-        std::shared_ptr< parallel_sweep<true>  > forward;
-        std::shared_ptr< parallel_sweep<false> > backward;
-};
-
-} // namespace relaxation
-
-namespace backend {
-
-template <class Backend>
-struct relaxation_is_supported<
-    Backend,
-    relaxation::gauss_seidel,
-    typename std::enable_if<
-        !Backend::provides_row_iterator::value
-        >::type
-    > : std::false_type
-{};
-
-} // namespace backend
-} // namespace amgcl
-
-
-#endif
diff --git a/src/solvers/amgcl/relaxation/ilu0.hpp b/src/solvers/amgcl/relaxation/ilu0.hpp
deleted file mode 100644
index db41b16..0000000
--- a/src/solvers/amgcl/relaxation/ilu0.hpp
+++ /dev/null
@@ -1,250 +0,0 @@
-#ifndef AMGCL_RELAXATION_ILU0_HPP
-#define AMGCL_RELAXATION_ILU0_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/relaxation/ilu0.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Incomplete LU with zero fill-in relaxation scheme.
- */
-
-#include <amgcl/backend/builtin.hpp>
-#include <amgcl/util.hpp>
-#include <amgcl/relaxation/detail/ilu_solve.hpp>
-
-namespace amgcl {
-namespace relaxation {
-
-/// ILU(0) smoother.
-/**
- * \note ILU(0) is a serial algorithm and is only applicable to backends that
- * support matrix row iteration (e.g. amgcl::backend::builtin or
- * amgcl::backend::eigen).
- *
- * \param Backend Backend for temporary structures allocation.
- * \ingroup relaxation
- */
-template <class Backend>
-struct ilu0 {
-    typedef typename Backend::value_type      value_type;
-    typedef typename Backend::col_type        col_type;
-    typedef typename Backend::ptr_type        ptr_type;
-    typedef typename Backend::vector          vector;
-    typedef typename Backend::matrix          matrix;
-    typedef typename Backend::matrix_diagonal matrix_diagonal;
-
-    typedef typename math::scalar_of<value_type>::type scalar_type;
-    typedef detail::ilu_solve<Backend> ilu_solve;
-
-    /// Relaxation parameters.
-    struct params {
-        /// Damping factor.
-        scalar_type damping;
-
-        /// Parameters for sparse triangular system solver
-        typename ilu_solve::params solve;
-
-        params() : damping(1) {}
-
-#ifndef AMGCL_NO_BOOST
-        params(const boost::property_tree::ptree &p)
-            : AMGCL_PARAMS_IMPORT_VALUE(p, damping)
-            , AMGCL_PARAMS_IMPORT_CHILD(p, solve)
-        {
-            check_params(p, {"damping", "solve"}, {"k"});
-        }
-
-        void get(boost::property_tree::ptree &p, const std::string &path) const {
-            AMGCL_PARAMS_EXPORT_VALUE(p, path, damping);
-            AMGCL_PARAMS_EXPORT_CHILD(p, path, solve);
-        }
-#endif
-    } prm;
-
-    /// \copydoc amgcl::relaxation::damped_jacobi::damped_jacobi
-    template <class Matrix>
-    ilu0( const Matrix &A, const params &prm, const typename Backend::params &bprm)
-      : prm(prm)
-    {
-        typedef typename backend::builtin<value_type, col_type, ptr_type>::matrix build_matrix;
-        const size_t n = backend::rows(A);
-
-        size_t Lnz = 0, Unz = 0;
-
-        for(ptrdiff_t i = 0; i < static_cast<ptrdiff_t>(n); ++i) {
-            ptrdiff_t row_beg = A.ptr[i];
-            ptrdiff_t row_end = A.ptr[i + 1];
-
-            for(ptrdiff_t j = row_beg; j < row_end; ++j) {
-                ptrdiff_t c = A.col[j];
-                if (c < i)
-                    ++Lnz;
-                else if (c > i)
-                    ++Unz;
-            }
-        }
-
-        auto L = std::make_shared<build_matrix>();
-        auto U = std::make_shared<build_matrix>();
-
-        L->set_size(n, n); L->set_nonzeros(Lnz); L->ptr[0] = 0;
-        U->set_size(n, n); U->set_nonzeros(Unz); U->ptr[0] = 0;
-
-        size_t Lhead = 0;
-        size_t Uhead = 0;
-
-        auto D = std::make_shared<backend::numa_vector<value_type> >(n, false);
-
-        std::vector<value_type*> work(n, NULL);
-
-        for(ptrdiff_t i = 0; i < static_cast<ptrdiff_t>(n); ++i) {
-            ptrdiff_t row_beg = A.ptr[i];
-            ptrdiff_t row_end = A.ptr[i + 1];
-
-            for(ptrdiff_t j = row_beg; j < row_end; ++j) {
-                ptrdiff_t  c = A.col[j];
-                value_type v = A.val[j];
-
-                if (c < i) {
-                    L->col[Lhead] = c;
-                    L->val[Lhead] = v;
-                    work[c] = L->val + Lhead;
-                    ++Lhead;
-                } else if (c == i) {
-                    (*D)[i] = v;
-                    work[c] = &(*D)[i];
-                } else {
-                    U->col[Uhead] = c;
-                    U->val[Uhead] = v;
-                    work[c] = U->val + Uhead;
-                    ++Uhead;
-                }
-            }
-
-            L->ptr[i+1] = Lhead;
-            U->ptr[i+1] = Uhead;
-
-            for(ptrdiff_t j = row_beg; j < row_end; ++j) {
-                ptrdiff_t c = A.col[j];
-
-                // Exit if diagonal is reached
-                if (c >= i) {
-                    precondition(c == i, "No diagonal value in system matrix");
-                    precondition(!math::is_zero((*D)[i]), "Zero pivot in ILU");
-
-                    (*D)[i] = math::inverse((*D)[i]);
-                    break;
-                }
-
-                // Compute the multiplier for jrow
-                value_type tl = (*work[c]) * (*D)[c];
-                *work[c] = tl;
-
-                // Perform linear combination
-                for(ptrdiff_t k = U->ptr[c]; k < static_cast<ptrdiff_t>(U->ptr[c+1]); ++k) {
-                    value_type *w = work[U->col[k]];
-                    if (w) *w -= tl * U->val[k];
-                }
-            }
-
-            // Get rid of zeros in the factors
-            Lhead = L->ptr[i];
-            Uhead = U->ptr[i];
-
-            for(ptrdiff_t j = Lhead, e = L->ptr[i+1]; j < e; ++j) {
-                auto v = L->val[j];
-                if (!math::is_zero(v)) {
-                    L->col[Lhead] = L->col[j];
-                    L->val[Lhead] = v;
-                    ++Lhead;
-                }
-            }
-
-            for(ptrdiff_t j = Uhead, e = U->ptr[i+1]; j < e; ++j) {
-                auto v = U->val[j];
-                if (!math::is_zero(v)) {
-                    U->col[Uhead] = U->col[j];
-                    U->val[Uhead] = v;
-                    ++Uhead;
-                }
-            }
-            L->ptr[i+1] = Lhead;
-            U->ptr[i+1] = Uhead;
-
-            // Refresh work
-            for(ptrdiff_t j = row_beg; j < row_end; ++j)
-                work[A.col[j]] = NULL;
-        }
-
-        L->nnz = Lhead;
-        U->nnz = Uhead;
-
-        ilu = std::make_shared<ilu_solve>(L, U, D, prm.solve, bprm);
-    }
-
-    /// \copydoc amgcl::relaxation::damped_jacobi::apply_pre
-    template <class Matrix, class VectorRHS, class VectorX, class VectorTMP>
-    void apply_pre(
-            const Matrix &A, const VectorRHS &rhs, VectorX &x, VectorTMP &tmp
-            ) const
-    {
-        backend::residual(rhs, A, x, tmp);
-        ilu->solve(tmp);
-        backend::axpby(prm.damping, tmp, math::identity<scalar_type>(), x);
-    }
-
-    /// \copydoc amgcl::relaxation::damped_jacobi::apply_post
-    template <class Matrix, class VectorRHS, class VectorX, class VectorTMP>
-    void apply_post(
-            const Matrix &A, const VectorRHS &rhs, VectorX &x, VectorTMP &tmp
-            ) const
-    {
-        backend::residual(rhs, A, x, tmp);
-        ilu->solve(tmp);
-        backend::axpby(prm.damping, tmp, math::identity<scalar_type>(), x);
-    }
-
-    /// \copydoc amgcl::relaxation::damped_jacobi::apply_post
-    template <class Matrix, class VectorRHS, class VectorX>
-    void apply(const Matrix&, const VectorRHS &rhs, VectorX &x) const
-    {
-        backend::copy(rhs, x);
-        ilu->solve(x);
-    }
-
-    size_t bytes() const {
-        return ilu->bytes();
-    }
-
-    private:
-        std::shared_ptr<ilu_solve> ilu;
-
-};
-
-} // namespace relaxation
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/relaxation/iluk.hpp b/src/solvers/amgcl/relaxation/iluk.hpp
deleted file mode 100644
index 526b6a4..0000000
--- a/src/solvers/amgcl/relaxation/iluk.hpp
+++ /dev/null
@@ -1,280 +0,0 @@
-#ifndef AMGCL_RELAXATION_ILUK_HPP
-#define AMGCL_RELAXATION_ILUK_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/relaxation/iluk.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Incomplete LU with fill-in level.
- */
-
-#include <vector>
-#include <deque>
-#include <queue>
-#include <cmath>
-
-
-#include <amgcl/backend/builtin.hpp>
-#include <amgcl/util.hpp>
-#include <amgcl/relaxation/detail/ilu_solve.hpp>
-
-namespace amgcl {
-namespace relaxation {
-
-/// ILU(k) smoother.
-template <class Backend>
-struct iluk {
-    typedef typename Backend::value_type      value_type;
-    typedef typename Backend::col_type        col_type;
-    typedef typename Backend::ptr_type        ptr_type;
-    typedef typename Backend::matrix          matrix;
-    typedef typename Backend::matrix_diagonal matrix_diagonal;
-    typedef typename Backend::vector          vector;
-
-    typedef typename math::scalar_of<value_type>::type scalar_type;
-
-    typedef detail::ilu_solve<Backend> ilu_solve;
-
-    /// Relaxation parameters.
-    struct params {
-        /// Level of fill-in.
-        int k;
-
-        /// Damping factor.
-        scalar_type damping;
-
-        /// Parameters for sparse triangular system solver
-        typename ilu_solve::params solve;
-
-        params() : k(1), damping(1) {}
-
-#ifndef AMGCL_NO_BOOST
-        params(const boost::property_tree::ptree &p)
-            : AMGCL_PARAMS_IMPORT_VALUE(p, k)
-            , AMGCL_PARAMS_IMPORT_VALUE(p, damping)
-            , AMGCL_PARAMS_IMPORT_CHILD(p, solve)
-        {
-            check_params(p, {"k", "damping", "solve"});
-        }
-
-        void get(boost::property_tree::ptree &p, const std::string &path) const {
-            AMGCL_PARAMS_EXPORT_VALUE(p, path, k);
-            AMGCL_PARAMS_EXPORT_VALUE(p, path, damping);
-            AMGCL_PARAMS_EXPORT_CHILD(p, path, solve);
-        }
-#endif
-    } prm;
-
-    /// \copydoc amgcl::relaxation::damped_jacobi::damped_jacobi
-    template <class Matrix>
-    iluk( const Matrix &A, const params &prm, const typename Backend::params &bprm)
-      : prm(prm)
-    {
-        typedef typename backend::builtin<value_type, col_type, ptr_type>::matrix build_matrix;
-
-        const size_t n = backend::rows(A);
-
-        size_t Anz = backend::nonzeros(A);
-
-        std::vector<ptrdiff_t>  Lptr; Lptr.reserve(n+1); Lptr.push_back(0);
-        std::vector<ptrdiff_t>  Lcol; Lcol.reserve(Anz / 3);
-        std::vector<value_type> Lval; Lval.reserve(Anz / 3);
-
-        std::vector<ptrdiff_t>  Uptr; Uptr.reserve(n+1); Uptr.push_back(0);
-        std::vector<ptrdiff_t>  Ucol; Ucol.reserve(Anz / 3);
-        std::vector<value_type> Uval; Uval.reserve(Anz / 3);
-
-        std::vector<int> Ulev; Ulev.reserve(Anz / 3);
-
-        auto D = std::make_shared<backend::numa_vector<value_type> >(n, false);
-
-        sparse_vector w(n, prm.k);
-
-        for(ptrdiff_t i = 0; i < static_cast<ptrdiff_t>(n); ++i) {
-            w.reset(i);
-
-            for(auto a = backend::row_begin(A, i); a; ++a) {
-                w.add(a.col(), a.value(), 0);
-            }
-
-            while(!w.q.empty()) {
-                nonzero &a = w.next_nonzero();
-                a.val = a.val * (*D)[a.col];
-
-                for(ptrdiff_t j = Uptr[a.col], e = Uptr[a.col+1]; j < e; ++j) {
-                    int lev = std::max(a.lev, Ulev[j]) + 1;
-                    w.add(Ucol[j], -a.val * Uval[j], lev);
-                }
-            }
-
-            w.sort();
-
-            for(const nonzero &e : w.nz) {
-                if (e.col < i) {
-                    Lcol.push_back(e.col);
-                    Lval.push_back(e.val);
-                } else if (e.col == i) {
-                    (*D)[i] = math::inverse(e.val);
-                } else {
-                    Ucol.push_back(e.col);
-                    Uval.push_back(e.val);
-                    Ulev.push_back(e.lev);
-                }
-            }
-
-            Lptr.push_back(Lcol.size());
-            Uptr.push_back(Ucol.size());
-        }
-
-        ilu = std::make_shared<ilu_solve>(
-                std::make_shared<build_matrix>(n, n, Lptr, Lcol, Lval),
-                std::make_shared<build_matrix>(n, n, Uptr, Ucol, Uval),
-                D, prm.solve, bprm);
-    }
-
-    /// \copydoc amgcl::relaxation::damped_jacobi::apply_pre
-    template <class Matrix, class VectorRHS, class VectorX, class VectorTMP>
-    void apply_pre(
-            const Matrix &A, const VectorRHS &rhs, VectorX &x, VectorTMP &tmp
-            ) const
-    {
-        backend::residual(rhs, A, x, tmp);
-        ilu->solve(tmp);
-        backend::axpby(prm.damping, tmp, math::identity<scalar_type>(), x);
-    }
-
-    /// \copydoc amgcl::relaxation::damped_jacobi::apply_post
-    template <class Matrix, class VectorRHS, class VectorX, class VectorTMP>
-    void apply_post(
-            const Matrix &A, const VectorRHS &rhs, VectorX &x, VectorTMP &tmp
-            ) const
-    {
-        backend::residual(rhs, A, x, tmp);
-        ilu->solve(tmp);
-        backend::axpby(prm.damping, tmp, math::identity<scalar_type>(), x);
-    }
-
-    template <class Matrix, class VectorRHS, class VectorX>
-    void apply(const Matrix&, const VectorRHS &rhs, VectorX &x) const
-    {
-        backend::copy(rhs, x);
-        ilu->solve(x);
-    }
-
-    size_t bytes() const {
-        return ilu->bytes();
-    }
-
-    private:
-        std::shared_ptr<ilu_solve> ilu;
-
-        struct nonzero {
-            ptrdiff_t  col;
-            value_type val;
-            int        lev;
-
-            nonzero() : col(-1) {}
-
-            nonzero(ptrdiff_t col, const value_type &val, int lev)
-                : col(col), val(val), lev(lev) {}
-
-            friend bool operator<(const nonzero &a, const nonzero &b) {
-                return a.col < b.col;
-            }
-        };
-
-        struct sparse_vector {
-            struct comp_indices {
-                const std::deque<nonzero> &nz;
-
-                comp_indices(const std::deque<nonzero> &nz) : nz(nz) {}
-
-                bool operator()(int a, int b) const {
-                    return nz[a].col > nz[b].col;
-                }
-            };
-
-            typedef
-                std::priority_queue<int, std::vector<int>, comp_indices>
-                priority_queue;
-
-            int lfil;
-
-            std::deque<nonzero>    nz;
-            std::vector<ptrdiff_t> idx;
-            priority_queue q;
-
-            ptrdiff_t dia;
-
-            sparse_vector(size_t n, int lfil)
-                : lfil(lfil), idx(n, -1), q(comp_indices(nz)), dia(0)
-            {}
-
-            void add(ptrdiff_t col, const value_type &val, int lev) {
-                if (idx[col] < 0) {
-                    if (lev <= lfil) {
-                        int p = nz.size();
-                        idx[col] = p;
-                        nz.push_back(nonzero(col, val, lev));
-                        if (col < dia) q.push(p);
-                    }
-                } else {
-                    nonzero &a = nz[idx[col]];
-                    a.val += val;
-                    a.lev = std::min(a.lev, lev);
-                }
-            }
-
-            typename std::deque<nonzero>::iterator begin() {
-                return nz.begin();
-            }
-
-            typename std::deque<nonzero>::iterator end() {
-                return nz.end();
-            }
-
-            nonzero& next_nonzero() {
-                int p = q.top();
-                q.pop();
-                return nz[p];
-            }
-
-            void sort() {
-                std::sort(nz.begin(), nz.end());
-            }
-
-            void reset(ptrdiff_t d) {
-                for(const nonzero &e : nz) idx[e.col] = -1;
-                nz.clear();
-                dia = d;
-            }
-        };
-};
-
-} // namespace relaxation
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/relaxation/ilup.hpp b/src/solvers/amgcl/relaxation/ilup.hpp
deleted file mode 100644
index 29ed33f..0000000
--- a/src/solvers/amgcl/relaxation/ilup.hpp
+++ /dev/null
@@ -1,222 +0,0 @@
-#ifndef AMGCL_RELAXATION_ILUP_HPP
-#define AMGCL_RELAXATION_ILUP_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/relaxation/ilup.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Incomplete LU with fill-in level.
- *
- * As opposed to the iluk, the fill-in is determined by taking a symbolic
- * power of the matrix.
- */
-
-#include <vector>
-#include <deque>
-#include <queue>
-#include <cmath>
-
-
-#include <amgcl/backend/builtin.hpp>
-#include <amgcl/util.hpp>
-#include <amgcl/relaxation/ilu0.hpp>
-
-namespace amgcl {
-namespace relaxation {
-namespace detail {
-
-template <class Matrix>
-std::shared_ptr<Matrix> symb_product(const Matrix &A, const Matrix &B) {
-    auto C = std::make_shared<Matrix>();
-
-    C->set_size(A.nrows, B.ncols);
-
-    auto A_ptr = A.ptr;
-    auto A_col = A.col;
-    auto B_ptr = B.ptr;
-    auto B_col = B.col;
-    auto C_ptr = C->ptr;
-    C_ptr[0] = 0;
-
-#pragma omp parallel
-    {
-        std::vector<ptrdiff_t> marker(B.ncols, -1);
-
-#pragma omp for
-        for(ptrdiff_t ia = 0; ia < static_cast<ptrdiff_t>(A.nrows); ++ia) {
-            ptrdiff_t C_cols = 0;
-            for(ptrdiff_t ja = A_ptr[ia], ea = A_ptr[ia+1]; ja < ea; ++ja) {
-                ptrdiff_t ca = A_col[ja];
-
-                for(ptrdiff_t jb = B_ptr[ca], eb = B_ptr[ca+1]; jb < eb; ++jb) {
-                    ptrdiff_t cb = B_col[jb];
-                    if (marker[cb] != ia) {
-                        marker[cb]  = ia;
-                        ++C_cols;
-                    }
-                }
-            }
-            C_ptr[ia + 1] = C_cols;
-        }
-    }
-
-    C->set_nonzeros(C->scan_row_sizes(), /*need_values = */false);
-    auto C_col = C->col;
-
-#pragma omp parallel
-    {
-        std::vector<ptrdiff_t> marker(B.ncols, -1);
-
-#pragma omp for
-        for(ptrdiff_t ia = 0; ia < static_cast<ptrdiff_t>(A.nrows); ++ia) {
-            ptrdiff_t row_beg = C_ptr[ia];
-            ptrdiff_t row_end = row_beg;
-
-            for(ptrdiff_t ja = A_ptr[ia], ea = A_ptr[ia+1]; ja < ea; ++ja) {
-                ptrdiff_t ca = A_col[ja];
-
-                for(ptrdiff_t jb = B_ptr[ca], eb = B_ptr[ca+1]; jb < eb; ++jb) {
-                    ptrdiff_t cb = B_col[jb];
-
-                    if (marker[cb] < row_beg) {
-                        marker[cb] = row_end;
-                        C_col[row_end] = cb;
-                        ++row_end;
-                    }
-                }
-            }
-
-            std::sort(C_col + row_beg, C_col + row_end);
-        }
-    }
-
-    return C;
-}
-
-} // namespace detail
-
-/// ILU(k) smoother.
-template <class Backend>
-struct ilup {
-    typedef typename Backend::value_type      value_type;
-
-    typedef ilu0<Backend> Base;
-
-    /// Relaxation parameters.
-    struct params : Base::params {
-        typedef typename Base::params BasePrm;
-
-        /// Level of fill-in.
-        int k;
-
-        params() : k(1) {}
-
-#ifndef AMGCL_NO_BOOST
-        params(const boost::property_tree::ptree &p)
-            : BasePrm(p), AMGCL_PARAMS_IMPORT_VALUE(p, k)
-        {
-            check_params(p, {"k", "damping", "solve"});
-        }
-
-        void get(boost::property_tree::ptree &p, const std::string &path) const {
-            BasePrm::get(p, path);
-            AMGCL_PARAMS_EXPORT_VALUE(p, path, k);
-        }
-#endif
-    } prm;
-
-    /// \copydoc amgcl::relaxation::damped_jacobi::damped_jacobi
-    template <class Matrix>
-    ilup( const Matrix &A, const params &prm, const typename Backend::params &bprm)
-      : prm(prm)
-    {
-        if (prm.k == 0) {
-            base = std::make_shared<Base>(A, prm, bprm);
-        } else {
-            auto P = detail::symb_product(A, A);
-            for(int k = 1; k < prm.k; ++k) {
-                P = detail::symb_product(*P, A);
-            }
-
-            ptrdiff_t n = backend::rows(A);
-            P->val = new value_type[P->nnz];
-
-#pragma omp parallel for
-            for(ptrdiff_t i = 0; i < n; ++i) {
-                ptrdiff_t p_beg = P->ptr[i];
-                ptrdiff_t p_end = P->ptr[i+1];
-                ptrdiff_t a_beg = A.ptr[i];
-                ptrdiff_t a_end = A.ptr[i+1];
-
-                std::fill(P->val + p_beg, P->val + p_end, math::zero<value_type>());
-
-                for(ptrdiff_t ja = a_beg, ea = a_end, jp = p_beg, ep = p_end; ja < ea; ++ja) {
-                    ptrdiff_t ca = A.col[ja];
-                    while(jp < ep && P->col[jp] < ca) ++jp;
-                    if (P->col[jp] == ca) P->val[jp] = A.val[ja];
-                }
-            }
-
-            base = std::make_shared<Base>(*P, prm, bprm);
-        }
-    }
-
-    /// \copydoc amgcl::relaxation::damped_jacobi::apply_pre
-    template <class Matrix, class VectorRHS, class VectorX, class VectorTMP>
-    void apply_pre(
-            const Matrix &A, const VectorRHS &rhs, VectorX &x, VectorTMP &tmp
-            ) const
-    {
-        base->apply_pre(A, rhs, x, tmp);
-    }
-
-    /// \copydoc amgcl::relaxation::damped_jacobi::apply_post
-    template <class Matrix, class VectorRHS, class VectorX, class VectorTMP>
-    void apply_post(
-            const Matrix &A, const VectorRHS &rhs, VectorX &x, VectorTMP &tmp
-            ) const
-    {
-        base->apply_post(A, rhs, x, tmp);
-    }
-
-    template <class Matrix, class VectorRHS, class VectorX>
-    void apply(const Matrix &A, const VectorRHS &rhs, VectorX &x) const
-    {
-        base->apply(A, rhs, x);
-    }
-
-    size_t bytes() const {
-        return base->bytes();
-    }
-
-    private:
-        std::shared_ptr<Base> base;
-};
-
-} // namespace relaxation
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/relaxation/ilut.hpp b/src/solvers/amgcl/relaxation/ilut.hpp
deleted file mode 100644
index 811c903..0000000
--- a/src/solvers/amgcl/relaxation/ilut.hpp
+++ /dev/null
@@ -1,386 +0,0 @@
-#ifndef AMGCL_RELAXATION_ILUT_HPP
-#define AMGCL_RELAXATION_ILUT_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/relaxation/ilut.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Incomplete LU with thresholding relaxation scheme.
- */
-
-#include <vector>
-#include <queue>
-#include <cmath>
-
-
-#include <amgcl/backend/builtin.hpp>
-#include <amgcl/util.hpp>
-#include <amgcl/relaxation/detail/ilu_solve.hpp>
-
-namespace amgcl {
-namespace relaxation {
-
-/// ILUT(p, tau) smoother.
-/**
- * \note ILUT is a serial algorithm and is only applicable to backends that
- * support matrix row iteration (e.g. amgcl::backend::builtin or
- * amgcl::backend::eigen).
- *
- * \param Backend Backend for temporary structures allocation.
- * \ingroup relaxation
- */
-template <class Backend>
-struct ilut {
-    typedef typename Backend::value_type      value_type;
-    typedef typename Backend::col_type        col_type;
-    typedef typename Backend::ptr_type        ptr_type;
-    typedef typename Backend::matrix          matrix;
-    typedef typename Backend::matrix_diagonal matrix_diagonal;
-    typedef typename Backend::vector          vector;
-
-    typedef typename math::scalar_of<value_type>::type scalar_type;
-
-    typedef detail::ilu_solve<Backend> ilu_solve;
-
-    /// Relaxation parameters.
-    struct params {
-        /// Fill factor.
-        scalar_type p;
-
-        /// Minimum magnitude of non-zero elements relative to the current row norm.
-        scalar_type tau;
-
-        /// Damping factor.
-        scalar_type damping;
-
-        /// Parameters for sparse triangular system solver
-        typename ilu_solve::params solve;
-
-        params() : p(2), tau(1e-2f), damping(1) {}
-
-#ifndef AMGCL_NO_BOOST
-        params(const boost::property_tree::ptree &p)
-            : AMGCL_PARAMS_IMPORT_VALUE(p, p)
-            , AMGCL_PARAMS_IMPORT_VALUE(p, tau)
-            , AMGCL_PARAMS_IMPORT_VALUE(p, damping)
-            , AMGCL_PARAMS_IMPORT_CHILD(p, solve)
-        {
-            check_params(p, {"p", "tau", "damping", "solve"});
-        }
-
-        void get(boost::property_tree::ptree &p, const std::string &path) const {
-            AMGCL_PARAMS_EXPORT_VALUE(p, path, p);
-            AMGCL_PARAMS_EXPORT_VALUE(p, path, tau);
-            AMGCL_PARAMS_EXPORT_VALUE(p, path, damping);
-            AMGCL_PARAMS_EXPORT_CHILD(p, path, solve);
-        }
-#endif
-    } prm;
-
-    /// \copydoc amgcl::relaxation::damped_jacobi::damped_jacobi
-    template <class Matrix>
-    ilut( const Matrix &A, const params &prm, const typename Backend::params &bprm)
-      : prm(prm)
-    {
-        const size_t n = backend::rows(A);
-
-        size_t Lnz = 0, Unz = 0;
-
-        for(ptrdiff_t i = 0; i < static_cast<ptrdiff_t>(n); ++i) {
-            ptrdiff_t row_beg = A.ptr[i];
-            ptrdiff_t row_end = A.ptr[i + 1];
-
-            int lenL = 0, lenU = 0;
-            for(ptrdiff_t j = row_beg; j < row_end; ++j) {
-                ptrdiff_t c = A.col[j];
-                if (c < i)
-                    ++lenL;
-                else if (c > i)
-                    ++lenU;
-            }
-
-            Lnz += static_cast<size_t>(lenL * prm.p);
-            Unz += static_cast<size_t>(lenU * prm.p);
-        }
-
-        auto L = std::make_shared<build_matrix>();
-        auto U = std::make_shared<build_matrix>();
-
-        L->set_size(n, n); L->set_nonzeros(Lnz); L->ptr[0] = 0;
-        U->set_size(n, n); U->set_nonzeros(Unz); U->ptr[0] = 0;
-
-        auto D = std::make_shared<backend::numa_vector<value_type> >(n, false);
-
-        sparse_vector w(n);
-
-        for(ptrdiff_t i = 0, Lhead = 0, Uhead = 0; i < static_cast<ptrdiff_t>(n); ++i) {
-            w.dia = i;
-
-            int lenL = 0;
-            int lenU = 0;
-
-            scalar_type tol = math::zero<scalar_type>();
-
-            for(auto a = backend::row_begin(A, i); a; ++a) {
-                w[a.col()] = a.value();
-                tol += math::norm(a.value());
-
-                if (a.col() < i) ++lenL;
-                if (a.col() > i) ++lenU;
-            }
-            tol *= prm.tau / (lenL + lenU);
-
-            while(!w.q.empty()) {
-                ptrdiff_t k = w.next_nonzero();
-                w[k] = w[k] * (*D)[k];
-                value_type wk = w[k];
-
-                if (math::norm(wk) > tol) {
-                    for(ptrdiff_t j = U->ptr[k]; j < static_cast<ptrdiff_t>(U->ptr[k+1]); ++j)
-                        w[U->col[j]] -= wk * U->val[j];
-                }
-            }
-
-            w.move_to(
-                    static_cast<int>(lenL * prm.p),
-                    static_cast<int>(lenU * prm.p),
-                    tol, Lhead, *L, Uhead, *U, *D
-                    );
-
-            L->ptr[i+1] = Lhead;
-            U->ptr[i+1] = Uhead;
-        }
-
-        L->nnz = L->ptr[n];
-        U->nnz = U->ptr[n];
-
-        ilu = std::make_shared<ilu_solve>(L, U, D, prm.solve, bprm);
-    }
-
-    /// \copydoc amgcl::relaxation::damped_jacobi::apply_pre
-    template <class Matrix, class VectorRHS, class VectorX, class VectorTMP>
-    void apply_pre(
-            const Matrix &A, const VectorRHS &rhs, VectorX &x, VectorTMP &tmp
-            ) const
-    {
-        backend::residual(rhs, A, x, tmp);
-        ilu->solve(tmp);
-        backend::axpby(prm.damping, tmp, math::identity<scalar_type>(), x);
-    }
-
-    /// \copydoc amgcl::relaxation::damped_jacobi::apply_post
-    template <class Matrix, class VectorRHS, class VectorX, class VectorTMP>
-    void apply_post(
-            const Matrix &A, const VectorRHS &rhs, VectorX &x, VectorTMP &tmp
-            ) const
-    {
-        backend::residual(rhs, A, x, tmp);
-        ilu->solve(tmp);
-        backend::axpby(prm.damping, tmp, math::identity<scalar_type>(), x);
-    }
-
-    template <class Matrix, class VectorRHS, class VectorX>
-    void apply(const Matrix&, const VectorRHS &rhs, VectorX &x) const
-    {
-        backend::copy(rhs, x);
-        ilu->solve(x);
-    }
-
-    size_t bytes() const {
-        return ilu->bytes();
-    }
-
-    private:
-        typedef typename backend::builtin<value_type, col_type, ptr_type>::matrix build_matrix;
-        std::shared_ptr<ilu_solve> ilu;
-
-        struct sparse_vector {
-            struct nonzero {
-                ptrdiff_t  col;
-                value_type val;
-
-                nonzero() : col(-1) {}
-
-                nonzero(ptrdiff_t col, const value_type &val = math::zero<value_type>())
-                    : col(col), val(val) {}
-            };
-
-            struct comp_indices {
-                const std::vector<nonzero> &nz;
-
-                comp_indices(const std::vector<nonzero> &nz) : nz(nz) {}
-
-                bool operator()(int a, int b) const {
-                    return nz[a].col > nz[b].col;
-                }
-            };
-
-            typedef
-                std::priority_queue<int, std::vector<int>, comp_indices>
-                priority_queue;
-
-            std::vector<nonzero>   nz;
-            std::vector<ptrdiff_t> idx;
-            priority_queue q;
-
-            ptrdiff_t dia;
-
-            sparse_vector(size_t n) : idx(n, -1), q(comp_indices(nz)), dia(0) {
-                nz.reserve(16);
-            }
-
-            value_type operator[](ptrdiff_t i) const {
-                if (idx[i] >= 0) return nz[idx[i]].val;
-                return math::zero<value_type>();
-            }
-
-            value_type& operator[](ptrdiff_t i) {
-                if (idx[i] == -1) {
-                    int p = nz.size();
-                    idx[i] = p;
-                    nz.push_back(nonzero(i));
-                    if (i < dia) q.push(p);
-                }
-                return nz[idx[i]].val;
-            }
-
-            typename std::vector<nonzero>::iterator begin() {
-                return nz.begin();
-            }
-
-            typename std::vector<nonzero>::iterator end() {
-                return nz.end();
-            }
-
-            ptrdiff_t next_nonzero() {
-                int p = q.top();
-                q.pop();
-                return nz[p].col;
-            }
-
-            struct higher_than {
-                scalar_type tol;
-                ptrdiff_t   dia;
-
-                higher_than(scalar_type tol, ptrdiff_t dia)
-                    : tol(tol), dia(dia) {}
-
-                bool operator()(const nonzero &v) const {
-                    return v.col == dia || math::norm(v.val) > tol;
-                }
-            };
-
-            struct L_first {
-                ptrdiff_t dia;
-
-                L_first(ptrdiff_t dia) : dia(dia) {}
-
-                bool operator()(const nonzero &v) const {
-                    return v.col < dia;
-                }
-            };
-
-            struct by_abs_val {
-                ptrdiff_t dia;
-
-                by_abs_val(ptrdiff_t dia) : dia(dia) {}
-
-                bool operator()(const nonzero &a, const nonzero &b) const {
-                    if (a.col == dia) return true;
-                    if (b.col == dia) return false;
-
-                    return math::norm(a.val) > math::norm(b.val);
-                }
-            };
-
-            struct by_col {
-                bool operator()(const nonzero &a, const nonzero &b) const {
-                    return a.col < b.col;
-                }
-            };
-
-            void move_to(
-                    int lp, int up, scalar_type tol,
-                    ptrdiff_t &Lhead, build_matrix &L,
-                    ptrdiff_t &Uhead, build_matrix &U,
-                    backend::numa_vector<value_type> &D
-                    )
-            {
-                typedef typename std::vector<nonzero>::iterator ptr;
-
-                ptr b = nz.begin();
-                ptr e = nz.end();
-
-                // Move zeros to back:
-                e = std::partition(b, e, higher_than(tol, dia));
-
-                // Split L and U:
-                ptr m = std::partition(b, e, L_first(dia));
-
-                // Get largest p elements in L and U.
-                ptr lend = std::min(b + lp, m);
-                ptr uend = std::min(m + up, e);
-
-                if (lend != m) std::nth_element(b, lend, m, by_abs_val(dia));
-                if (uend != e) std::nth_element(m, uend, e, by_abs_val(dia));
-
-                // Sort entries by column number
-                std::sort(b, lend, by_col());
-                std::sort(m, uend, by_col());
-
-                // copy L to the output matrix.
-                for(ptr a = b; a != lend; ++a) {
-                    L.col[Lhead] = a->col;
-                    L.val[Lhead] = a->val;
-
-                    ++Lhead;
-                }
-
-                // Store inverted diagonal.
-                D[dia] = math::inverse(m->val);
-
-                if (m != uend) {
-                    ++m;
-
-                    // copy U to the output matrix.
-                    for(ptr a = m; a != uend; ++a) {
-                        U.col[Uhead] = a->col;
-                        U.val[Uhead] = a->val;
-
-                        ++Uhead;
-                    }
-                }
-
-                for(const nonzero &e : nz) idx[e.col] = -1;
-                nz.clear();
-            }
-        };
-};
-
-} // namespace relaxation
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/relaxation/runtime.hpp b/src/solvers/amgcl/relaxation/runtime.hpp
deleted file mode 100644
index ff8115a..0000000
--- a/src/solvers/amgcl/relaxation/runtime.hpp
+++ /dev/null
@@ -1,383 +0,0 @@
-#ifndef AMGCL_RELAXATION_RUNTIME_HPP
-#define AMGCL_RELAXATION_RUNTIME_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/relaxation/runtime.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Runtime-configurable smoother as standalone preconditioner.
- */
-
-#include <type_traits>
-
-#ifdef AMGCL_NO_BOOST
-#  error Runtime interface relies on Boost.PropertyTree!
-#endif
-
-#include <boost/property_tree/ptree.hpp>
-
-#include <amgcl/util.hpp>
-#include <amgcl/relaxation/gauss_seidel.hpp>
-#include <amgcl/relaxation/ilu0.hpp>
-#include <amgcl/relaxation/iluk.hpp>
-#include <amgcl/relaxation/ilup.hpp>
-#include <amgcl/relaxation/ilut.hpp>
-#include <amgcl/relaxation/damped_jacobi.hpp>
-#include <amgcl/relaxation/spai0.hpp>
-#include <amgcl/relaxation/spai1.hpp>
-#include <amgcl/relaxation/chebyshev.hpp>
-
-namespace amgcl {
-namespace runtime {
-namespace relaxation {
-
-/// Relaxation schemes.
-enum type {
-    gauss_seidel,               ///< Gauss-Seidel smoothing
-    ilu0,                       ///< Incomplete LU with zero fill-in
-    iluk,                       ///< Level-based incomplete LU
-    ilup,                       ///< Level-based incomplete LU (fill-in is determined from A^p pattern)
-    ilut,                       ///< Incomplete LU with thresholding
-    damped_jacobi,              ///< Damped Jacobi
-    spai0,                      ///< Sparse approximate inverse of 0th order
-    spai1,                      ///< Sparse approximate inverse of 1st order
-    chebyshev                   ///< Chebyshev relaxation
-};
-
-inline std::ostream& operator<<(std::ostream &os, type r)
-{
-    switch (r) {
-        case gauss_seidel:
-            return os << "gauss_seidel";
-        case ilu0:
-            return os << "ilu0";
-        case iluk:
-            return os << "iluk";
-        case ilup:
-            return os << "ilup";
-        case ilut:
-            return os << "ilut";
-        case damped_jacobi:
-            return os << "damped_jacobi";
-        case spai0:
-            return os << "spai0";
-        case spai1:
-            return os << "spai1";
-        case chebyshev:
-            return os << "chebyshev";
-        default:
-            return os << "???";
-    }
-}
-
-inline std::istream& operator>>(std::istream &in, type &r)
-{
-    std::string val;
-    in >> val;
-
-    if (val == "gauss_seidel")
-        r = gauss_seidel;
-    else if (val == "ilu0")
-        r = ilu0;
-    else if (val == "iluk")
-        r = iluk;
-    else if (val == "ilup")
-        r = ilup;
-    else if (val == "ilut")
-        r = ilut;
-    else if (val == "damped_jacobi")
-        r = damped_jacobi;
-    else if (val == "spai0")
-        r = spai0;
-    else if (val == "spai1")
-        r = spai1;
-    else if (val == "chebyshev")
-        r = chebyshev;
-    else
-        throw std::invalid_argument("Invalid relaxation value. Valid choices are:"
-                "gauss_seidel, ilu0, iluk, ilup, ilut, damped_jacobi, spai0, spai1, chebyshev.");
-
-    return in;
-}
-
-template <class Backend>
-struct wrapper {
-    typedef boost::property_tree::ptree params;
-    typedef typename Backend::params    backend_params;
-    type r;
-    void *handle;
-
-    template <class Matrix>
-    wrapper(const Matrix &A, params prm = params(),
-            const backend_params &bprm = backend_params()
-            )
-      : r(prm.get("type", runtime::relaxation::spai0)), handle(0)
-    {
-        if (!prm.erase("type")) AMGCL_PARAM_MISSING("type");
-
-        switch(r) {
-
-#define AMGCL_RUNTIME_RELAXATION(type) \
-            case type: \
-                handle = call_constructor<amgcl::relaxation::type>(A, prm, bprm); \
-                break
-
-            AMGCL_RUNTIME_RELAXATION(gauss_seidel);
-            AMGCL_RUNTIME_RELAXATION(ilu0);
-            AMGCL_RUNTIME_RELAXATION(iluk);
-            AMGCL_RUNTIME_RELAXATION(ilup);
-            AMGCL_RUNTIME_RELAXATION(ilut);
-            AMGCL_RUNTIME_RELAXATION(damped_jacobi);
-            AMGCL_RUNTIME_RELAXATION(spai0);
-            AMGCL_RUNTIME_RELAXATION(spai1);
-            AMGCL_RUNTIME_RELAXATION(chebyshev);
-
-#undef AMGCL_RUNTIME_RELAXATION
-
-            default:
-                throw std::invalid_argument("Unsupported relaxation type");
-        }
-    }
-
-    ~wrapper() {
-        switch(r) {
-
-#define AMGCL_RUNTIME_RELAXATION(type) \
-            case type: \
-                delete static_cast<amgcl::relaxation::type<Backend>*>(handle); \
-                break
-
-            AMGCL_RUNTIME_RELAXATION(gauss_seidel);
-            AMGCL_RUNTIME_RELAXATION(ilu0);
-            AMGCL_RUNTIME_RELAXATION(iluk);
-            AMGCL_RUNTIME_RELAXATION(ilup);
-            AMGCL_RUNTIME_RELAXATION(ilut);
-            AMGCL_RUNTIME_RELAXATION(damped_jacobi);
-            AMGCL_RUNTIME_RELAXATION(spai0);
-            AMGCL_RUNTIME_RELAXATION(spai1);
-            AMGCL_RUNTIME_RELAXATION(chebyshev);
-
-#undef AMGCL_RUNTIME_RELAXATION
-        }
-    }
-
-    template <class Matrix, class VectorRHS, class VectorX, class VectorTMP>
-    void apply_pre(
-            const Matrix &A, const VectorRHS &rhs, VectorX &x, VectorTMP &tmp
-            ) const
-    {
-        switch(r) {
-
-#define AMGCL_RUNTIME_RELAXATION(type) \
-            case type: \
-                call_apply_pre<amgcl::relaxation::type>(A, rhs, x, tmp); \
-                break
-
-            AMGCL_RUNTIME_RELAXATION(gauss_seidel);
-            AMGCL_RUNTIME_RELAXATION(ilu0);
-            AMGCL_RUNTIME_RELAXATION(iluk);
-            AMGCL_RUNTIME_RELAXATION(ilup);
-            AMGCL_RUNTIME_RELAXATION(ilut);
-            AMGCL_RUNTIME_RELAXATION(damped_jacobi);
-            AMGCL_RUNTIME_RELAXATION(spai0);
-            AMGCL_RUNTIME_RELAXATION(spai1);
-            AMGCL_RUNTIME_RELAXATION(chebyshev);
-
-#undef AMGCL_RUNTIME_RELAXATION
-
-            default:
-                throw std::invalid_argument("Unsupported relaxation type");
-        }
-    }
-
-    template <class Matrix, class VectorRHS, class VectorX, class VectorTMP>
-    void apply_post(
-            const Matrix &A, const VectorRHS &rhs, VectorX &x, VectorTMP &tmp
-            ) const
-    {
-        switch(r) {
-
-#define AMGCL_RUNTIME_RELAXATION(type) \
-            case type: \
-                call_apply_post<amgcl::relaxation::type>(A, rhs, x, tmp); \
-                break
-
-            AMGCL_RUNTIME_RELAXATION(gauss_seidel);
-            AMGCL_RUNTIME_RELAXATION(ilu0);
-            AMGCL_RUNTIME_RELAXATION(iluk);
-            AMGCL_RUNTIME_RELAXATION(ilup);
-            AMGCL_RUNTIME_RELAXATION(ilut);
-            AMGCL_RUNTIME_RELAXATION(damped_jacobi);
-            AMGCL_RUNTIME_RELAXATION(spai0);
-            AMGCL_RUNTIME_RELAXATION(spai1);
-            AMGCL_RUNTIME_RELAXATION(chebyshev);
-
-#undef AMGCL_RUNTIME_RELAXATION
-
-            default:
-                throw std::invalid_argument("Unsupported relaxation type");
-        }
-    }
-
-    template <class Matrix, class VectorRHS, class VectorX>
-    void apply( const Matrix &A, const VectorRHS &rhs, VectorX &x) const
-    {
-        switch(r) {
-
-#define AMGCL_RUNTIME_RELAXATION(type) \
-            case type: \
-                call_apply<amgcl::relaxation::type>(A, rhs, x); \
-                break
-
-            AMGCL_RUNTIME_RELAXATION(gauss_seidel);
-            AMGCL_RUNTIME_RELAXATION(ilu0);
-            AMGCL_RUNTIME_RELAXATION(iluk);
-            AMGCL_RUNTIME_RELAXATION(ilup);
-            AMGCL_RUNTIME_RELAXATION(ilut);
-            AMGCL_RUNTIME_RELAXATION(damped_jacobi);
-            AMGCL_RUNTIME_RELAXATION(spai0);
-            AMGCL_RUNTIME_RELAXATION(spai1);
-            AMGCL_RUNTIME_RELAXATION(chebyshev);
-
-#undef AMGCL_RUNTIME_RELAXATION
-
-            default:
-                throw std::invalid_argument("Unsupported relaxation type");
-        }
-    }
-
-    size_t bytes() const {
-        switch(r) {
-
-#define AMGCL_RUNTIME_RELAXATION(type) \
-            case type: \
-                return backend::bytes(*static_cast<amgcl::relaxation::type<Backend>*>(handle))
-
-            AMGCL_RUNTIME_RELAXATION(gauss_seidel);
-            AMGCL_RUNTIME_RELAXATION(ilu0);
-            AMGCL_RUNTIME_RELAXATION(iluk);
-            AMGCL_RUNTIME_RELAXATION(ilup);
-            AMGCL_RUNTIME_RELAXATION(ilut);
-            AMGCL_RUNTIME_RELAXATION(damped_jacobi);
-            AMGCL_RUNTIME_RELAXATION(spai0);
-            AMGCL_RUNTIME_RELAXATION(spai1);
-            AMGCL_RUNTIME_RELAXATION(chebyshev);
-
-#undef AMGCL_RUNTIME_RELAXATION
-
-            default:
-                throw std::invalid_argument("Unsupported relaxation type");
-        }
-    }
-
-    template <template <class> class Relaxation, class Matrix>
-    typename std::enable_if<
-        backend::relaxation_is_supported<Backend, Relaxation>::value,
-        void*
-    >::type
-    call_constructor(
-            const Matrix &A, const params &prm, const backend_params &bprm)
-    {
-        return static_cast<void*>(new Relaxation<Backend>(A, prm, bprm));
-    }
-
-    template <template <class> class Relaxation, class Matrix>
-    typename std::enable_if<
-        !backend::relaxation_is_supported<Backend, Relaxation>::value,
-        void*
-    >::type
-    call_constructor(const Matrix&, const params&, const backend_params&)
-    {
-        throw std::logic_error("The relaxation is not supported by the backend");
-    }
-
-    template <template <class> class Relaxation, class Matrix, class VectorRHS, class VectorX, class VectorTMP>
-    typename std::enable_if<
-        backend::relaxation_is_supported<Backend, Relaxation>::value,
-        void
-    >::type
-    call_apply_pre(
-            const Matrix &A, const VectorRHS &rhs, VectorX &x, VectorTMP &tmp) const
-    {
-        static_cast<Relaxation<Backend>*>(handle)->apply_pre(A, rhs, x, tmp);
-    }
-
-    template <template <class> class Relaxation, class Matrix, class VectorRHS, class VectorX, class VectorTMP>
-    typename std::enable_if<
-        !backend::relaxation_is_supported<Backend, Relaxation>::value,
-        void
-    >::type
-    call_apply_pre(const Matrix&, const VectorRHS&, VectorX&, VectorTMP&) const {
-        throw std::logic_error("The relaxation is not supported by the backend");
-    }
-
-    template <template <class> class Relaxation, class Matrix, class VectorRHS, class VectorX, class VectorTMP>
-    typename std::enable_if<
-        backend::relaxation_is_supported<Backend, Relaxation>::value,
-        void
-    >::type
-    call_apply_post(
-            const Matrix &A, const VectorRHS &rhs, VectorX &x, VectorTMP &tmp) const
-    {
-        static_cast<Relaxation<Backend>*>(handle)->apply_post(A, rhs, x, tmp);
-    }
-
-    template <template <class> class Relaxation, class Matrix, class VectorRHS, class VectorX, class VectorTMP>
-    typename std::enable_if<
-        !backend::relaxation_is_supported<Backend, Relaxation>::value,
-        void
-    >::type
-    call_apply_post(const Matrix&, const VectorRHS&, VectorX&, VectorTMP&) const {
-        throw std::logic_error("The relaxation is not supported by the backend");
-    }
-
-    template <template <class> class Relaxation, class Matrix, class VectorRHS, class VectorX>
-    typename std::enable_if<
-        backend::relaxation_is_supported<Backend, Relaxation>::value,
-        void
-    >::type
-    call_apply(
-            const Matrix &A, const VectorRHS &rhs, VectorX &x) const
-    {
-        static_cast<Relaxation<Backend>*>(handle)->apply(A, rhs, x);
-    }
-
-    template <template <class> class Relaxation, class Matrix, class VectorRHS, class VectorX>
-    typename std::enable_if<
-        !backend::relaxation_is_supported<Backend, Relaxation>::value,
-        void
-    >::type
-    call_apply(const Matrix&, const VectorRHS&, VectorX&) const {
-        throw std::logic_error("The relaxation is not supported by the backend");
-    }
-
-};
-
-} // namespace relaxation
-} // namespace runtime
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/relaxation/spai0.hpp b/src/solvers/amgcl/relaxation/spai0.hpp
deleted file mode 100644
index 3a5fb0d..0000000
--- a/src/solvers/amgcl/relaxation/spai0.hpp
+++ /dev/null
@@ -1,122 +0,0 @@
-#ifndef AMGCL_RELAXATION_SPAI0_HPP
-#define AMGCL_RELAXATION_SPAI0_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/relaxation/spai0.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Sparse approximate inverse relaxation scheme.
- */
-
-#include <memory>
-#include <amgcl/backend/interface.hpp>
-#include <amgcl/util.hpp>
-
-namespace amgcl {
-namespace relaxation {
-
-/// Sparse approximate interface smoother.
-/**
- * The inverse matrix is approximated with diagonal matrix.
- *
- * \tparam Backend Backend for temporary structures allocation.
- * \ingroup relaxation
- * \sa \cite Broker2002
- */
-template <class Backend>
-struct spai0 {
-    typedef typename Backend::value_type      value_type;
-    typedef typename Backend::matrix_diagonal matrix_diagonal;
-
-    typedef typename math::scalar_of<value_type>::type scalar_type;
-    /// Relaxation parameters.
-    typedef amgcl::detail::empty_params params;
-
-    /// \copydoc amgcl::relaxation::damped_jacobi::damped_jacobi
-    template <class Matrix>
-    spai0( const Matrix &A, const params &, const typename Backend::params &backend_prm)
-    {
-        const size_t n = rows(A);
-
-        auto m = std::make_shared< backend::numa_vector<value_type> >(n, false);
-
-#pragma omp parallel for
-        for(ptrdiff_t i = 0; i < static_cast<ptrdiff_t>(n); ++i) {
-            value_type  num = math::zero<value_type>();
-            scalar_type den = math::zero<scalar_type>();
-
-            for(auto a = backend::row_begin(A, i); a; ++a) {
-                value_type v = a.value();
-                scalar_type norm_v = math::norm(v);
-                den += norm_v * norm_v;
-                if (a.col() == i) num += v;
-            }
-
-            (*m)[i] = math::inverse(den) * num;
-        }
-
-        M = Backend::copy_vector(m, backend_prm);
-    }
-
-    /// \copydoc amgcl::relaxation::damped_jacobi::apply_pre
-    template <class Matrix, class VectorRHS, class VectorX, class VectorTMP>
-    void apply_pre(
-            const Matrix &A, const VectorRHS &rhs, VectorX &x, VectorTMP &tmp
-            ) const
-    {
-        static const scalar_type one = math::identity<scalar_type>();
-        backend::residual(rhs, A, x, tmp);
-        backend::vmul(one, *M, tmp, one, x);
-    }
-
-    /// \copydoc amgcl::relaxation::damped_jacobi::apply_post
-    template <class Matrix, class VectorRHS, class VectorX, class VectorTMP>
-    void apply_post(
-            const Matrix &A, const VectorRHS &rhs, VectorX &x, VectorTMP &tmp
-            ) const
-    {
-        static const scalar_type one = math::identity<scalar_type>();
-        backend::residual(rhs, A, x, tmp);
-        backend::vmul(one, *M, tmp, one, x);
-    }
-
-    template <class Matrix, class VectorRHS, class VectorX>
-    void apply( const Matrix&, const VectorRHS &rhs, VectorX &x) const
-    {
-        backend::vmul(math::identity<scalar_type>(), *M, rhs, math::zero<scalar_type>(), x);
-    }
-
-    size_t bytes() const {
-        return backend::bytes(*M);
-    }
-
-    std::shared_ptr<matrix_diagonal> M;
-};
-
-} // namespace relaxation
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/relaxation/spai1.hpp b/src/solvers/amgcl/relaxation/spai1.hpp
deleted file mode 100644
index 9c8e567..0000000
--- a/src/solvers/amgcl/relaxation/spai1.hpp
+++ /dev/null
@@ -1,176 +0,0 @@
-#ifndef AMGCL_RELAXATION_SPAI1_HPP
-#define AMGCL_RELAXATION_SPAI1_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/relaxation/spai1.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Sparse approximate inverse relaxation scheme.
- */
-
-#include <vector>
-
-#include <memory>
-#include <amgcl/backend/interface.hpp>
-#include <amgcl/value_type/interface.hpp>
-#include <amgcl/util.hpp>
-#include <amgcl/detail/qr.hpp>
-
-namespace amgcl {
-namespace relaxation {
-
-/// Sparse approximate interface smoother.
-/**
- * Sparsity pattern of the approximate inverse matrix coincides with that of A.
- *
- * \tparam Backend Backend for temporary structures allocation.
- * \ingroup relaxation
- * \sa \cite Broker2002
- */
-template <class Backend>
-struct spai1 {
-    typedef typename Backend::value_type value_type;
-    typedef typename Backend::vector     vector;
-
-    typedef typename math::scalar_of<value_type>::type scalar_type;
-
-    /// Relaxation parameters.
-    typedef amgcl::detail::empty_params params;
-
-    /// \copydoc amgcl::relaxation::damped_jacobi::damped_jacobi
-    template <class Matrix>
-    spai1( const Matrix &A, const params &, const typename Backend::params &backend_prm)
-    {
-        typedef typename backend::value_type<Matrix>::type value_type;
-
-        const size_t n = backend::rows(A);
-        const size_t m = backend::cols(A);
-
-        auto Ainv = std::make_shared<Matrix>(A);
-
-#pragma omp parallel
-        {
-            std::vector<ptrdiff_t> marker(m, -1);
-            std::vector<ptrdiff_t> I, J;
-            std::vector<value_type> B, ek;
-            amgcl::detail::QR<value_type> qr;
-
-#pragma omp for
-            for(ptrdiff_t i = 0; i < static_cast<ptrdiff_t>(n); ++i) {
-                ptrdiff_t row_beg = A.ptr[i];
-                ptrdiff_t row_end = A.ptr[i + 1];
-
-                I.assign(A.col + row_beg, A.col + row_end);
-
-                J.clear();
-                for(ptrdiff_t j = row_beg; j < row_end; ++j) {
-                    ptrdiff_t c = A.col[j];
-
-                    for(ptrdiff_t jj = A.ptr[c], ee = A.ptr[c + 1]; jj < ee; ++jj) {
-                        ptrdiff_t cc = A.col[jj];
-                        if (marker[cc] < 0) {
-                            marker[cc] = 1;
-                            J.push_back(cc);
-                        }
-                    }
-                }
-                std::sort(J.begin(), J.end());
-                B.assign(I.size() * J.size(), math::zero<value_type>());
-                ek.assign(J.size(), math::zero<value_type>());
-                for(size_t j = 0; j < J.size(); ++j) {
-                    marker[J[j]] = j;
-                    if (J[j] == static_cast<ptrdiff_t>(i)) ek[j] = math::identity<value_type>();
-                }
-
-                for(ptrdiff_t j = row_beg; j < row_end; ++j) {
-                    ptrdiff_t c = A.col[j];
-
-                    for(auto a = row_begin(A, c); a; ++a)
-                        B[marker[a.col()] + J.size() * (j - row_beg)] = a.value();
-                }
-
-                qr.solve(J.size(), I.size(), &B[0], &ek[0], &Ainv->val[row_beg],
-                        amgcl::detail::col_major);
-
-                for(size_t j = 0; j < J.size(); ++j)
-                    marker[J[j]] = -1;
-            }
-        }
-
-        M = Backend::copy_matrix(Ainv, backend_prm);
-    }
-
-    /// \copydoc amgcl::relaxation::damped_jacobi::apply_pre
-    template <class Matrix, class VectorRHS, class VectorX, class VectorTMP>
-    void apply_pre(
-            const Matrix &A, const VectorRHS &rhs, VectorX &x, VectorTMP &tmp
-            ) const
-    {
-        backend::residual(rhs, A, x, tmp);
-        backend::spmv(math::identity<scalar_type>(), *M, tmp, math::identity<scalar_type>(), x);
-    }
-
-    /// \copydoc amgcl::relaxation::damped_jacobi::apply_post
-    template <class Matrix, class VectorRHS, class VectorX, class VectorTMP>
-    void apply_post(
-            const Matrix &A, const VectorRHS &rhs, VectorX &x, VectorTMP &tmp
-            ) const
-    {
-        backend::residual(rhs, A, x, tmp);
-        backend::spmv(math::identity<scalar_type>(), *M, tmp, math::identity<scalar_type>(), x);
-    }
-
-    template <class Matrix, class VectorRHS, class VectorX>
-    void apply(const Matrix&, const VectorRHS &rhs, VectorX &x) const
-    {
-        backend::spmv(math::identity<scalar_type>(), *M, rhs, math::zero<scalar_type>(), x);
-    }
-
-    size_t bytes() const {
-        return backend::bytes(*M);
-    }
-
-    std::shared_ptr<typename Backend::matrix> M;
-};
-
-} // namespace relaxation
-
-namespace backend {
-
-template <class Backend>
-struct relaxation_is_supported<
-    Backend, relaxation::spai1,
-    typename std::enable_if<
-        (amgcl::math::static_rows<typename Backend::value_type>::value > 1)
-        >::type
-    > : std::false_type
-{};
-
-} // namespace backend
-} // namespace amgcl
-
-
-#endif
diff --git a/src/solvers/amgcl/reorder/cuthill_mckee.hpp b/src/solvers/amgcl/reorder/cuthill_mckee.hpp
deleted file mode 100644
index 5811bb4..0000000
--- a/src/solvers/amgcl/reorder/cuthill_mckee.hpp
+++ /dev/null
@@ -1,191 +0,0 @@
-#ifndef AMGCL_REORDER_CUTHILL_MCKEE_HPP
-#define AMGCL_REORDER_CUTHILL_MCKEE_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
-\file   amgcl/reorder/cuthill_mckee.hpp
-\author Denis Demidov <dennis.demidov@gmail.com>
-\brief  (Reverse) Cuthill-McKee matrix reorder algorithm.
-
-The code is adopted from Kratos project http://www.cimne.com/kratos. The
-original code came with the following copyright notice:
-\verbatim
-Kratos Multi-Physics
-
-Copyright (c) 2012, Pooyan Dadvand, Riccardo Rossi, CIMNE (International Center for Numerical Methods in Engineering)
-All rights reserved.
-
-Redistribution and use in source and binary forms, with or without
-modification, are permitted provided that the following conditions are met:
-
-    Redistributions of source code must retain the above copyright notice, this
-    list of conditions and the following disclaimer.
-    Redistributions in binary form must reproduce the above copyright notice,
-    this list of conditions and the following disclaimer in the documentation
-    and/or other materials provided with the distribution.
-    All advertising materials mentioning features or use of this software must
-    display the following acknowledgement:
-    This product includes Kratos Multi-Physics technology.
-    Neither the name of the CIMNE nor the names of its contributors may be used
-    to endorse or promote products derived from this software without specific
-    prior written permission.
-
-THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS ''AS IS'' AND ANY EXPRESS OR
-IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO
-EVENT SHALL THE COPYRIGHT HOLDERS BE LIABLE FOR ANY DIRECT, INDIRECT,
-INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
-LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
-PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED ANDON ANY THEORY OF
-LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT(INCLUDING NEGLIGENCE
-OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THISSOFTWARE, EVEN IF
-ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-\endverbatim
-*/
-
-#include <vector>
-#include <algorithm>
-
-#include <amgcl/backend/interface.hpp>
-#include <amgcl/util.hpp>
-
-namespace amgcl {
-namespace reorder {
-
-template <bool reverse = false>
-struct cuthill_mckee {
-    template <class Matrix, class Vector>
-    static void get(const Matrix &A, Vector &perm) {
-        const ptrdiff_t n = backend::rows(A);
-
-        /* The data structure used to sort and traverse the level sets:
-         *
-         * The current level set is currentLevelSet;
-         * In this level set, there are nodes with degrees from 0 (not really
-         * useful) to maxDegreeInCurrentLevelSet.
-         * firstWithDegree[i] points to a node with degree i, or to -1 if it
-         * does not exist. nextSameDegree[firstWithDegree[i]] points to the
-         * second node with that degree, etc.
-         * While the level set is being traversed, the structure for the next
-         * level set is generated; nMDICLS will be the next
-         * maxDegreeInCurrentLevelSet and nFirstWithDegree will be
-         * firstWithDegree.
-         */
-        ptrdiff_t initialNode = 0; // node to start search
-        ptrdiff_t maxDegree   = 0;
-
-        std::vector<ptrdiff_t> degree(n);
-        std::vector<ptrdiff_t> levelSet(n, 0);
-        std::vector<ptrdiff_t> nextSameDegree(n, -1);
-
-#pragma omp parallel
-        {
-            ptrdiff_t maxd = 0;
-#pragma omp for
-            for(ptrdiff_t i = 0; i < n; ++i) {
-                ptrdiff_t row_width = 0;
-                for(auto a = backend::row_begin(A, i); a; ++a, ++row_width);
-                degree[i] = row_width;
-                maxd = std::max(maxd, degree[i]);
-            }
-#pragma omp critical
-            {
-                maxDegree = std::max(maxDegree, maxd);
-            }
-        }
-
-        std::vector<ptrdiff_t> firstWithDegree(maxDegree + 1, -1);
-        std::vector<ptrdiff_t> nFirstWithDegree(maxDegree + 1);
-
-        // Initialize the first level set, made up by initialNode alone
-        perm[0] = initialNode;
-        ptrdiff_t currentLevelSet = 1;
-        levelSet[initialNode] = currentLevelSet;
-        ptrdiff_t maxDegreeInCurrentLevelSet = degree[initialNode];
-        firstWithDegree[maxDegreeInCurrentLevelSet] = initialNode;
-
-        // Main loop
-        for (ptrdiff_t next = 1; next < n; ) {
-            ptrdiff_t nMDICLS = 0;
-            std::fill(nFirstWithDegree.begin(), nFirstWithDegree.end(), -1);
-            bool empty = true; // used to detect different connected components
-
-            ptrdiff_t firstVal  = reverse ? maxDegreeInCurrentLevelSet : 0;
-            ptrdiff_t finalVal  = reverse ? -1 : maxDegreeInCurrentLevelSet + 1;
-            ptrdiff_t increment = reverse ? -1 : 1;
-
-            for(ptrdiff_t soughtDegree = firstVal; soughtDegree != finalVal; soughtDegree += increment)
-            {
-                ptrdiff_t node = firstWithDegree[soughtDegree];
-                while (node > 0) {
-                    // Visit neighbors
-                    for(auto a = backend::row_begin(A, node); a; ++a) {
-                        ptrdiff_t c = a.col();
-                        if (levelSet[c] == 0) {
-                            levelSet[c] = currentLevelSet + 1;
-                            perm[next] = c;
-                            ++next;
-                            empty = false; // this level set is not empty
-                            nextSameDegree[c] = nFirstWithDegree[degree[c]];
-                            nFirstWithDegree[degree[c]] = c;
-                            nMDICLS = std::max(nMDICLS, degree[c]);
-                        }
-                    }
-                    node = nextSameDegree[node];
-                }
-            }
-
-            ++currentLevelSet;
-            maxDegreeInCurrentLevelSet = nMDICLS;
-            for(ptrdiff_t i = 0; i <= nMDICLS; ++i)
-                firstWithDegree[i] = nFirstWithDegree[i];
-
-            if (empty) {
-                // The graph contains another connected component that we
-                // cannot reach.  Search for a node that has not yet been
-                // included in a level set, and start exploring from it.
-                bool found = false;
-                for(ptrdiff_t i = 0; i < n; ++i) {
-                    if (levelSet[i] == 0) {
-                        perm[next] = i;
-                        ++next;
-                        levelSet[i] = currentLevelSet;
-                        maxDegreeInCurrentLevelSet = degree[i];
-                        firstWithDegree[maxDegreeInCurrentLevelSet] = i;
-                        found = true;
-                        break;
-                    }
-                }
-                precondition(found, "Internal consistency error at skyline_lu");
-            }
-        }
-    }
-};
-
-} // namespace reorder
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/solver/bicgstab.hpp b/src/solvers/amgcl/solver/bicgstab.hpp
deleted file mode 100644
index 48b3ea7..0000000
--- a/src/solvers/amgcl/solver/bicgstab.hpp
+++ /dev/null
@@ -1,304 +0,0 @@
-#ifndef AMGCL_SOLVERS_BICGSTAB_HPP
-#define AMGCL_SOLVERS_BICGSTAB_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/solver/bicgstab.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  BiCGStab iterative method.
- */
-
-#include <tuple>
-#include <iostream>
-
-#include <amgcl/backend/interface.hpp>
-#include <amgcl/solver/detail/default_inner_product.hpp>
-#include <amgcl/solver/precond_side.hpp>
-#include <amgcl/util.hpp>
-
-namespace amgcl {
-namespace solver {
-
-/** BiConjugate Gradient Stabilized (BiCGSTAB) method.
- * \rst
- * The BiConjugate Gradient Stabilized method (Bi-CGSTAB) was developed to
- * solve nonsymmetric linear systems while avoiding the often irregular
- * convergence patterns of the Conjugate Gradient [Barr94]_.
- * \endrst
- */
-template <
-    class Backend,
-    class InnerProduct = detail::default_inner_product
-    >
-class bicgstab {
-    public:
-        typedef Backend backend_type;
-
-        typedef typename Backend::vector     vector;
-        typedef typename Backend::value_type value_type;
-        typedef typename Backend::params     backend_params;
-
-        typedef typename math::scalar_of<value_type>::type scalar_type;
-
-        typedef typename math::inner_product_impl<
-            typename math::rhs_of<value_type>::type
-            >::return_type coef_type;
-
-
-        /// Solver parameters.
-        struct params {
-            /// Preconditioning kind (left/right).
-            preconditioner::side::type pside;
-
-            /// Maximum number of iterations.
-            size_t maxiter;
-
-            /// Target relative residual error.
-            scalar_type tol;
-
-            /// Target absolute residual error.
-            scalar_type abstol;
-
-            /// Always do at least one iteration.
-            bool check_after;
-
-            /// Ignore the trivial solution x=0 when rhs is zero.
-            //** Useful for searching for the null-space vectors of the system */
-            bool ns_search;
-
-            /// Verbose output (show iterations and error)
-            bool verbose;
-
-            params()
-                : pside(preconditioner::side::right), maxiter(100), tol(1e-8),
-                  abstol(std::numeric_limits<scalar_type>::min()),
-                  check_after(false), ns_search(false), verbose(false)
-            {}
-
-#ifndef AMGCL_NO_BOOST
-            params(const boost::property_tree::ptree &p)
-                : AMGCL_PARAMS_IMPORT_VALUE(p, pside),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, maxiter),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, tol),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, abstol),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, check_after),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, ns_search),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, verbose)
-            {
-                check_params(p, {"pside", "maxiter", "tol", "abstol",
-                        "check_after", "ns_search", "verbose"});
-            }
-
-            void get(boost::property_tree::ptree &p, const std::string &path) const {
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, pside);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, maxiter);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, tol);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, abstol);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, check_after);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, ns_search);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, verbose);
-            }
-#endif
-        };
-
-        /// Preallocates necessary data structures for the system of size \p n.
-        bicgstab(
-                size_t n,
-                const params &prm = params(),
-                const backend_params &backend_prm = backend_params(),
-                const InnerProduct &inner_product = InnerProduct()
-                )
-            : prm(prm), n(n),
-              r ( Backend::create_vector(n, backend_prm) ),
-              p ( Backend::create_vector(n, backend_prm) ),
-              v ( Backend::create_vector(n, backend_prm) ),
-              s ( Backend::create_vector(n, backend_prm) ),
-              t ( Backend::create_vector(n, backend_prm) ),
-              rh( Backend::create_vector(n, backend_prm) ),
-              T ( Backend::create_vector(n, backend_prm) ),
-              inner_product(inner_product)
-        { }
-
-        /* Computes the solution for the given system matrix \p A and the
-         * right-hand side \p rhs.  Returns the number of iterations made and
-         * the achieved residual as a ``std::tuple``. The solution vector
-         * \p x provides initial approximation in input and holds the computed
-         * solution on output.
-         *
-         * The system matrix may differ from the matrix used during
-         * initialization. This may be used for the solution of non-stationary
-         * problems with slowly changing coefficients. There is a strong chance
-         * that a preconditioner built for a time step will act as a reasonably
-         * good preconditioner for several subsequent time steps [DeSh12]_.
-         */
-        template <class Matrix, class Precond, class Vec1, class Vec2>
-        std::tuple<size_t, scalar_type> operator()(
-                const Matrix &A, const Precond &P, const Vec1 &rhs, Vec2 &&x) const
-        {
-            namespace side = preconditioner::side;
-
-            static const coef_type one  = math::identity<coef_type>();
-            static const coef_type zero = math::zero<coef_type>();
-
-            ios_saver ss(std::cout);
-
-            scalar_type norm_rhs = norm(rhs);
-            if (norm_rhs < amgcl::detail::eps<scalar_type>(1)) {
-                if (prm.ns_search) {
-                    norm_rhs = math::identity<scalar_type>();
-                } else {
-                    backend::clear(x);
-                    return std::make_tuple(0, norm_rhs);
-                }
-            }
-
-            if (prm.pside == side::left) {
-                backend::residual(rhs, A, x, *rh);
-                P.apply(*rh, *r);
-            } else {
-                backend::residual(rhs, A, x, *r);
-            }
-            backend::copy(*r, *rh);
-
-            scalar_type eps = std::max(norm_rhs * prm.tol, prm.abstol);
-            scalar_type res = prm.check_after ? 2 * eps : norm(*r);
-
-            coef_type rho1  = zero;
-            coef_type rho2  = zero;
-            coef_type alpha = zero;
-            coef_type omega = zero;
-
-            size_t iter = 0;
-            for(bool first = true; res > eps && iter < prm.maxiter; ++iter) {
-
-                rho2 = rho1;
-                rho1 = inner_product(*r, *rh);
-
-                if (first) {
-                    backend::copy(*r, *p);
-                    first = false;
-                } else {
-                    precondition(!math::is_zero(rho2), "Zero rho in BiCGStab");
-                    coef_type beta = (rho1 * alpha) / (rho2 * omega);
-                    backend::axpbypcz(one, *r, -beta * omega, *v, beta, *p);
-                }
-
-                preconditioner::spmv(prm.pside, P, A, *p, *v, *T);
-
-                alpha = rho1 / inner_product(*rh, *v);
-
-                if (prm.pside == side::left) {
-                    backend::axpby(alpha, *p, one, x);
-                } else {
-                    backend::axpby(alpha, *T, one, x);
-                }
-
-                backend::axpbypcz(one, *r, -alpha, *v, zero, *s);
-
-                if ((res = norm(*s)) > eps) {
-                    preconditioner::spmv(prm.pside, P, A, *s, *t, *T);
-
-                    omega = inner_product(*t, *s) / inner_product(*t, *t);
-
-                    precondition(!math::is_zero(omega), "Zero omega in BiCGStab");
-
-                    if (prm.pside == side::left) {
-                        backend::axpby(omega, *s, one, x);
-                    } else {
-                        backend::axpby(omega, *T, one, x);
-                    }
-
-                    backend::axpbypcz(one, *s, -omega, *t, zero, *r);
-
-                    res = norm(*r);
-                }
-
-                if (prm.verbose && iter % 5 == 0)
-                    std::cout << iter << "\t" << std::scientific << res / norm_rhs << std::endl;
-            }
-
-            return std::make_tuple(iter, res / norm_rhs);
-        }
-
-        /* Computes the solution for the given right-hand side \p rhs. The
-         * system matrix is the same that was used for the setup of the
-         * preconditioner \p P.  Returns the number of iterations made and the
-         * achieved residual as a ``std::tuple``. The solution vector \p x
-         * provides initial approximation in input and holds the computed
-         * solution on output.
-         */
-        template <class Precond, class Vec1, class Vec2>
-        std::tuple<size_t, scalar_type> operator()(
-                const Precond &P, const Vec1 &rhs, Vec2 &&x) const
-        {
-            return (*this)(P.system_matrix(), P, rhs, x);
-        }
-
-        size_t bytes() const {
-            return
-                backend::bytes(*r) +
-                backend::bytes(*p) +
-                backend::bytes(*v) +
-                backend::bytes(*s) +
-                backend::bytes(*t) +
-                backend::bytes(*rh) +
-                backend::bytes(*T);
-        }
-
-        friend std::ostream& operator<<(std::ostream &os, const bicgstab &s) {
-            return os
-                << "Type:             BiCGStab"
-                << "\nUnknowns:         " << s.n
-                << "\nMemory footprint: " << human_readable_memory(s.bytes())
-                << std::endl;
-        }
-    public:
-        params prm;
-
-    private:
-        size_t n;
-
-        std::shared_ptr<vector> r;
-        std::shared_ptr<vector> p;
-        std::shared_ptr<vector> v;
-        std::shared_ptr<vector> s;
-        std::shared_ptr<vector> t;
-        std::shared_ptr<vector> rh;
-        std::shared_ptr<vector> T;
-
-        InnerProduct inner_product;
-
-        template <class Vec>
-        scalar_type norm(const Vec &x) const {
-            return sqrt(math::norm(inner_product(x, x)));
-        }
-};
-
-} // namespace solver
-} // namespace amgcl
-
-
-#endif
diff --git a/src/solvers/amgcl/solver/bicgstabl.hpp b/src/solvers/amgcl/solver/bicgstabl.hpp
deleted file mode 100644
index 0a53b14..0000000
--- a/src/solvers/amgcl/solver/bicgstabl.hpp
+++ /dev/null
@@ -1,499 +0,0 @@
-#ifndef AMGCL_SOLVER_BICGSTABL_HPP
-#define AMGCL_SOLVER_BICGSTABL_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
-\file   amgcl/solver/bicgstabl.hpp
-\author Denis Demidov <dennis.demidov@gmail.com>
-\brief  BiCGStab(L) iterative method.
-
-The code is ported from PETSC BCGSL [1] and is based on [2].
-
-[1] http://www.mcs.anl.gov/petsc/petsc-current/docs/manualpages/KSP/KSPBCGSL.html
-[2] Fokkema, Diederik R. Enhanced implementation of BiCGstab (l) for solving
-    linear systems of equations. Universiteit Utrecht. Mathematisch Instituut,
-    1996.
-
-The original code came with the following license:
-
-\verbatim
-Copyright (c) 1991-2014, UChicago Argonne, LLC and the PETSc Development Team
-All rights reserved.
-
-Redistribution and use in source and binary forms, with or without modification,
-are permitted provided that the following conditions are met:
-
-* Redistributions of source code must retain the above copyright notice, this
-  list of conditions and the following disclaimer.
-* Redistributions in binary form must reproduce the above copyright notice, this
-  list of conditions and the following disclaimer in the documentation and/or
-  other materials provided with the distribution.
-
-THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND
-ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
-WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE FOR
-ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
-(INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
-LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON
-ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
-(INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
-SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
- \endverbatim
- */
-
-#include <tuple>
-#include <iostream>
-
-#include <amgcl/backend/interface.hpp>
-#include <amgcl/solver/detail/default_inner_product.hpp>
-#include <amgcl/solver/precond_side.hpp>
-#include <amgcl/detail/qr.hpp>
-#include <amgcl/util.hpp>
-
-namespace amgcl {
-namespace solver {
-
-/** BiCGStab(L) method.
- * \rst
- * Generalization of BiCGStab method [SlDi93]_.
- * \endrst
- */
-template <
-    class Backend,
-    class InnerProduct = detail::default_inner_product
-    >
-class bicgstabl {
-    public:
-        typedef Backend backend_type;
-
-        typedef typename Backend::vector     vector;
-        typedef typename Backend::value_type value_type;
-        typedef typename Backend::params     backend_params;
-
-        typedef typename math::scalar_of<value_type>::type scalar_type;
-
-        typedef typename math::inner_product_impl<
-            typename math::rhs_of<value_type>::type
-            >::return_type coef_type;
-
-
-        /// Solver parameters.
-        struct params {
-            // Order of the method.
-            int L;
-
-            // Threshold used to decide when to refresh computed residuals.
-            scalar_type delta;
-
-            // Use a convex function of the MinRes and OR polynomials
-            // after the BiCG step instead of default MinRes
-            bool convex;
-
-            // Preconditioning kind (left/right).
-            preconditioner::side::type pside;
-
-            // Maximum number of iterations.
-            size_t maxiter;
-
-            // Target relative residual error.
-            scalar_type tol;
-
-            // Target absolute residual error.
-            scalar_type abstol;
-
-            /// Ignore the trivial solution x=0 when rhs is zero.
-            //** Useful for searching for the null-space vectors of the system */
-            bool ns_search;
-
-            /// Verbose output (show iterations and error)
-            bool verbose;
-
-            params()
-                : L(2), delta(0), convex(true),
-                  pside(preconditioner::side::right), maxiter(100), tol(1e-8),
-                  abstol(std::numeric_limits<scalar_type>::min()),
-                  ns_search(false), verbose(false)
-            {
-            }
-
-#ifndef AMGCL_NO_BOOST
-            params(const boost::property_tree::ptree &p)
-                : AMGCL_PARAMS_IMPORT_VALUE(p, L),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, delta),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, convex),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, pside),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, maxiter),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, tol),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, abstol),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, ns_search),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, verbose)
-            {
-                check_params(p, {"L", "delta", "convex", "pside", "maxiter",
-                        "tol", "abstol", "ns_search", "verbose"});
-            }
-
-            void get(boost::property_tree::ptree &p, const std::string &path) const {
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, L);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, delta);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, convex);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, pside);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, maxiter);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, tol);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, abstol);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, ns_search);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, verbose);
-            }
-#endif
-        };
-
-        /// Preallocates necessary data structures for the system of size \p n.
-        bicgstabl(
-                size_t n,
-                const params &prm = params(),
-                const backend_params &backend_prm = backend_params(),
-                const InnerProduct &inner_product = InnerProduct()
-                )
-            : prm(prm), n(n),
-              Rt( Backend::create_vector(n, backend_prm) ),
-              X ( Backend::create_vector(n, backend_prm) ),
-              B ( Backend::create_vector(n, backend_prm) ),
-              T ( Backend::create_vector(n, backend_prm) ),
-              R(prm.L + 1), U(prm.L + 1),
-              MZa(prm.L + 1, prm.L + 1),
-              MZb(prm.L + 1, prm.L + 1),
-              Y0(prm.L + 1), YL(prm.L + 1),
-              inner_product(inner_product)
-        {
-            precondition(prm.L > 0, "L in BiCGStab(L) should be >=1");
-
-            for(int i = 0; i <= prm.L; ++i) {
-                R[i] = Backend::create_vector(n, backend_prm);
-                U[i] = Backend::create_vector(n, backend_prm);
-            }
-        }
-
-        /* Computes the solution for the given system matrix \p A and the
-         * right-hand side \p rhs.  Returns the number of iterations made and
-         * the achieved residual as a ``std::tuple``. The solution vector
-         * \p x provides initial approximation in input and holds the computed
-         * solution on output.
-         *
-         * The system matrix may differ from the matrix used during
-         * initialization. This may be used for the solution of non-stationary
-         * problems with slowly changing coefficients. There is a strong chance
-         * that a preconditioner built for a time step will act as a reasonably
-         * good preconditioner for several subsequent time steps [DeSh12]_.
-         */
-        template <class Matrix, class Precond, class Vec1, class Vec2>
-        std::tuple<size_t, scalar_type> operator()(
-                const Matrix &A, const Precond &P, const Vec1 &rhs, Vec2 &&x) const
-        {
-            namespace side = preconditioner::side;
-
-            static const coef_type one  = math::identity<coef_type>();
-            static const coef_type zero = math::zero<coef_type>();
-
-            const int L = prm.L;
-
-            ios_saver ss(std::cout);
-
-            scalar_type norm_rhs = norm(rhs);
-
-            // Check if there is a trivial solution
-            if (norm_rhs < amgcl::detail::eps<scalar_type>(1)) {
-                if (prm.ns_search) {
-                    norm_rhs = math::identity<scalar_type>();
-                } else {
-                    backend::clear(x);
-                    return std::make_tuple(0, norm_rhs);
-                }
-            }
-
-            if (prm.pside == side::left) {
-                backend::residual(rhs, A, x, *T);
-                P.apply(*T, *B);
-            } else {
-                backend::residual(rhs, A, x, *B);
-            }
-
-            scalar_type zeta0 = norm(*B);
-            scalar_type eps = std::max(prm.tol * norm_rhs, prm.abstol);
-
-            coef_type alpha = zero;
-            coef_type rho0  = one;
-            coef_type omega = one;
-
-            // Go
-            backend::copy(*B, *R[0]);
-            backend::copy(*B, *Rt);
-            backend::clear(*X);
-            backend::clear(*U[0]);
-
-            scalar_type zeta           = zeta0;
-            scalar_type rnmax_computed = zeta0;
-            scalar_type rnmax_true     = zeta0;
-
-            size_t iter = 0;
-            for(; iter < prm.maxiter && zeta >= eps; iter += L) {
-                // BiCG part
-                rho0 = -omega * rho0;
-
-                for(int j = 0; j < L; ++j) {
-                    coef_type rho1 = inner_product(*R[j], *Rt);
-                    precondition(!math::is_zero(rho1),
-                            "BiCGStab(L) breakdown: diverged (zero rho)");
-
-                    coef_type beta = alpha * (rho1 / rho0);
-                    rho0 = rho1;
-
-                    for(int i = 0; i <= j; ++i)
-                        backend::axpby(one, *R[i], -beta, *U[i]);
-
-                    preconditioner::spmv(prm.pside, P, A, *U[j], *U[j+1], *T);
-
-                    coef_type sigma = inner_product(*U[j+1], *Rt);
-                    precondition(!math::is_zero(sigma),
-                            "BiCGStab(L) breakdown: diverged (zero sigma)");
-                    alpha = rho1 / sigma;
-
-                    backend::axpby(alpha, *U[0], one, *X);
-
-                    for(int i = 0; i <= j; ++i)
-                        backend::axpby(-alpha, *U[i+1], one, *R[i]);
-
-                    preconditioner::spmv(prm.pside, P, A, *R[j], *R[j+1], *T);
-
-                    zeta = norm(*R[0]);
-
-                    rnmax_computed = std::max(zeta, rnmax_computed);
-                    rnmax_true     = std::max(zeta, rnmax_true);
-
-                    // Check for early exit
-                    if (zeta < eps) {
-                        iter += j+1;
-                        goto done;
-                    }
-                }
-
-                // Polynomial part
-                for(int i = 0; i <= L; ++i) {
-                    for(int j = 0; j <= i; ++j) {
-                        MZa(i, j) = inner_product(*R[i], *R[j]);
-                    }
-                }
-
-                // Symmetrize MZa
-                for (int i = 0; i <= L; ++i) {
-                    for (int j = i+1; j <= L; ++j) {
-                        MZa(i, j) = MZa(j, i) = math::adjoint(MZa(j, i));
-                    }
-                }
-
-                std::copy(MZa.data(), MZa.data() + MZa.size(), MZb.data());
-
-                if (prm.convex || L == 1) {
-                    Y0[0] = -one;
-
-                    qr.solve(L, L, MZa.stride(0), MZa.stride(1),
-                            &MZa(1, 1), &MZb(0, 1), &Y0[1]);
-                } else {
-                    Y0[0] = -one;
-                    Y0[L] = zero;
-                    qr.solve(L-1, L-1, MZa.stride(0), MZa.stride(1),
-                            &MZa(1, 1), &MZb(0, 1), &Y0[1]);
-
-                    YL[0] = zero;
-                    YL[L] = -one;
-                    qr.solve(L-1, L-1, MZa.stride(0), MZa.stride(1),
-                            &MZa(1, 1), &MZb(L, 1), &YL[1], /*computed=*/true);
-
-                    coef_type dot0 = zero;
-                    coef_type dot1 = zero;
-                    coef_type dotA = zero;
-                    for(int i = 0; i <= L; ++i) {
-                        coef_type s0 = zero;
-                        coef_type sL = zero;
-
-                        for(int j = 0; j <= L; ++j) {
-                            coef_type M = MZb(i, j);
-                            s0 += M * Y0[j];
-                            sL += M * YL[j];
-                        }
-
-                        dot0 += Y0[i] * s0;
-                        dotA += YL[i] * s0;
-                        dot1 += YL[i] * sL;
-                    }
-
-                    scalar_type kappa0 = sqrt(std::abs(std::real(dot0)));
-                    scalar_type kappa1 = sqrt(std::abs(std::real(dot1)));
-                    scalar_type kappaA = std::real(dotA);
-
-                    if (!math::is_zero(kappa0) && !math::is_zero(kappa1)) {
-                        scalar_type ghat;
-                        if (kappaA < 0.7 * kappa0 * kappa1) {
-                            ghat = (kappaA < 0) ? -0.7 * kappa0 / kappa1 : 0.7 * kappa0 / kappa1;
-                        } else {
-                            ghat = kappaA / (kappa1 * kappa1);
-                        }
-
-                        for (int i = 0; i <= L; ++i)
-                            Y0[i] -= ghat * YL[i];
-                    }
-                }
-
-                omega = Y0[L];
-                for(int h = L; h > 0 && math::is_zero(omega); --h)
-                    omega = Y0[h];
-                precondition(!math::is_zero(omega),
-                        "BiCGStab(L) breakdown: diverged (zero omega)");
-
-                backend::lin_comb(L, &Y0[1], &R[0], one, *X);
-
-                for(int i = 1; i <= L; ++i) Y0[i] = -one * Y0[i];
-
-                backend::lin_comb(L, &Y0[1], &U[1], one, *U[0]);
-                backend::lin_comb(L, &Y0[1], &R[1], one, *R[0]);
-
-                for(int i = 1; i <= L; ++i) Y0[i] = -one * Y0[i];
-
-                zeta = norm(*R[0]);
-
-                // Accurate update
-                if (prm.delta > 0) {
-                    rnmax_computed = std::max(zeta, rnmax_computed);
-                    rnmax_true     = std::max(zeta, rnmax_true);
-
-                    bool update_x = zeta < prm.delta * zeta0 && zeta0 <= rnmax_computed;
-
-                    if ((zeta < prm.delta * rnmax_true && zeta <= rnmax_true) || update_x) {
-                        preconditioner::spmv(prm.pside, P, A, *X, *R[0], *T);
-                        backend::axpby(one, *B, -one, *R[0]);
-                        rnmax_true = zeta;
-
-                        if (update_x) {
-                            if (prm.pside == side::left) {
-                                backend::axpby(one, *X, one, x);
-                            } else {
-                                backend::axpby(one, *T, one, x);
-                            }
-                            backend::clear(*X);
-                            backend::copy(*R[0], *B);
-
-                            rnmax_computed = zeta;
-                        }
-                    }
-                }
-                if (prm.verbose && iter % 5 == 0)
-                    std::cout << iter << "\t" << std::scientific << zeta / norm_rhs << std::endl;
-            }
-
-done:
-            if (prm.pside == side::left) {
-                backend::axpby(one, *X, one, x);
-            } else {
-                P.apply(*X, *T);
-                backend::axpby(one, *T, one, x);
-            }
-
-            return std::make_tuple(iter, zeta / norm_rhs);
-        }
-
-        /* Computes the solution for the given right-hand side \p rhs. The
-         * system matrix is the same that was used for the setup of the
-         * preconditioner \p P.  Returns the number of iterations made and the
-         * achieved residual as a ``std::tuple``. The solution vector \p x
-         * provides initial approximation in input and holds the computed
-         * solution on output.
-         */
-        template <class Precond, class Vec1, class Vec2>
-        std::tuple<size_t, scalar_type> operator()(
-                const Precond &P, const Vec1 &rhs, Vec2 &&x) const
-        {
-            return (*this)(P.system_matrix(), P, rhs, x);
-        }
-
-        size_t bytes() const {
-            size_t b = 0;
-
-            b += backend::bytes(*Rt);
-            b += backend::bytes(*X);
-            b += backend::bytes(*B);
-            b += backend::bytes(*T);
-
-            for(const auto &v : R) b += backend::bytes(*v);
-            for(const auto &v : U) b += backend::bytes(*v);
-
-            b += MZa.size() * sizeof(coef_type);
-            b += MZb.size() * sizeof(coef_type);
-
-            b += backend::bytes(Y0);
-            b += backend::bytes(YL);
-
-            b += qr.bytes();
-
-            return b;
-        }
-
-        friend std::ostream& operator<<(std::ostream &os, const bicgstabl &s) {
-            return os
-                << "Type:             BiCGStab(" << s.prm.L << ")"
-                << "\nUnknowns:         " << s.n
-                << "\nMemory footprint: " << human_readable_memory(s.bytes())
-                << std::endl;
-        }
-    public:
-        params prm;
-
-    private:
-        size_t n;
-
-        mutable std::shared_ptr< vector > Rt;
-        mutable std::shared_ptr< vector > X;
-        mutable std::shared_ptr< vector > B;
-        mutable std::shared_ptr< vector > T;
-
-        mutable std::vector< std::shared_ptr< vector > > R;
-        mutable std::vector< std::shared_ptr< vector > > U;
-
-        mutable multi_array<coef_type, 2> MZa, MZb;
-        mutable std::vector<coef_type> Y0, YL;
-        mutable amgcl::detail::QR<coef_type> qr;
-
-        InnerProduct inner_product;
-
-        template <class Vec>
-        scalar_type norm(const Vec &x) const {
-            return sqrt(math::norm(inner_product(x, x)));
-        }
-};
-
-} // namespace solver
-} // namespace amgcl
-
-
-#endif
diff --git a/src/solvers/amgcl/solver/cg.hpp b/src/solvers/amgcl/solver/cg.hpp
deleted file mode 100644
index 90e2c79..0000000
--- a/src/solvers/amgcl/solver/cg.hpp
+++ /dev/null
@@ -1,258 +0,0 @@
-#ifndef AMGCL_SOLVERS_CG_HPP
-#define AMGCL_SOLVERS_CG_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/solver/cg.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Conjugate Gradient method.
- */
-
-#include <tuple>
-#include <iostream>
-
-#include <amgcl/backend/interface.hpp>
-#include <amgcl/solver/detail/default_inner_product.hpp>
-#include <amgcl/util.hpp>
-
-namespace amgcl {
-
-/// Iterative solvers
-namespace solver {
-
-/**
- * \defgroup solvers
- * \brief Iterative solvers
- *
- * AMGCL provides several iterative solvers, but it should be easy to use it as
- * a preconditioner with a user-provided solver.  Each solver in AMGCL is a
- * class template. Its single template parameter specifies the backend to use.
- * This allows to preallocate necessary resources at class construction.
- * Obviously, the solver backend has to coincide with the AMG backend.
- */
-
-
-/** Conjugate Gradients method.
- * \rst
- * An effective method for symmetric positive definite systems [Barr94]_.
- * \endrst
- */
-template <
-    class Backend,
-    class InnerProduct = detail::default_inner_product
-    >
-class cg {
-    public:
-        typedef Backend backend_type;
-
-        typedef typename Backend::vector     vector;
-        typedef typename Backend::value_type value_type;
-        typedef typename Backend::params     backend_params;
-
-        typedef typename math::scalar_of<value_type>::type scalar_type;
-
-        typedef typename math::inner_product_impl<
-            typename math::rhs_of<value_type>::type
-            >::return_type coef_type;
-
-        /// Solver parameters.
-        struct params {
-            /// Maximum number of iterations.
-            size_t maxiter;
-
-            /// Target relative residual error.
-            scalar_type tol;
-
-            /// Target absolute residual error.
-            scalar_type abstol;
-
-            /// Ignore the trivial solution x=0 when rhs is zero.
-            //** Useful for searching for the null-space vectors of the system */
-            bool ns_search;
-
-            /// Verbose output (show iterations and error)
-            bool verbose;
-
-            params()
-                : maxiter(100), tol(1e-8),
-                  abstol(std::numeric_limits<scalar_type>::min()),
-                  ns_search(false), verbose(false)
-            {}
-
-#ifndef AMGCL_NO_BOOST
-            params(const boost::property_tree::ptree &p)
-                : AMGCL_PARAMS_IMPORT_VALUE(p, maxiter),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, tol),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, abstol),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, ns_search),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, verbose)
-            {
-                check_params(p, {"maxiter", "tol", "abstol", "ns_search", "verbose"});
-            }
-
-            void get(boost::property_tree::ptree &p, const std::string &path) const {
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, maxiter);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, tol);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, abstol);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, ns_search);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, verbose);
-            }
-#endif
-        };
-
-        /// Preallocates necessary data structures for the system of size \p n.
-        cg(
-                size_t n,
-                const params &prm = params(),
-                const backend_params &backend_prm = backend_params(),
-                const InnerProduct &inner_product = InnerProduct()
-          ) : prm(prm), n(n),
-              r(Backend::create_vector(n, backend_prm)),
-              s(Backend::create_vector(n, backend_prm)),
-              p(Backend::create_vector(n, backend_prm)),
-              q(Backend::create_vector(n, backend_prm)),
-              inner_product(inner_product)
-        { }
-
-        /* Computes the solution for the given system matrix \p A and the
-         * right-hand side \p rhs.  Returns the number of iterations made and
-         * the achieved residual as a ``std::tuple``. The solution vector
-         * \p x provides initial approximation in input and holds the computed
-         * solution on output.
-         *
-         * The system matrix may differ from the matrix used during
-         * initialization. This may be used for the solution of non-stationary
-         * problems with slowly changing coefficients. There is a strong chance
-         * that a preconditioner built for a time step will act as a reasonably
-         * good preconditioner for several subsequent time steps [DeSh12]_.
-         */
-        template <class Matrix, class Precond, class Vec1, class Vec2>
-        std::tuple<size_t, scalar_type> operator()(
-                const Matrix &A, const Precond &P, const Vec1 &rhs, Vec2 &&x) const
-        {
-            static const coef_type one  = math::identity<coef_type>();
-            static const coef_type zero = math::zero<coef_type>();
-
-            ios_saver ss(std::cout);
-
-            scalar_type norm_rhs = norm(rhs);
-            if (norm_rhs < amgcl::detail::eps<scalar_type>(1)) {
-                if (prm.ns_search) {
-                    norm_rhs = math::identity<scalar_type>();
-                } else {
-                    backend::clear(x);
-                    return std::make_tuple(0, norm_rhs);
-                }
-            }
-
-            scalar_type eps = std::max(prm.tol * norm_rhs, prm.abstol);
-
-            coef_type rho1 = 2 * eps * one;
-            coef_type rho2 = zero;
-
-            backend::residual(rhs, A, x, *r);
-            scalar_type res_norm = norm(*r);
-
-            size_t iter = 0;
-            for(; iter < prm.maxiter && math::norm(res_norm) > eps; ++iter) {
-                P.apply(*r, *s);
-
-                rho2 = rho1;
-                rho1 = inner_product(*r, *s);
-
-                if (iter)
-                    backend::axpby(one, *s, rho1 / rho2, *p);
-                else
-                    backend::copy(*s, *p);
-
-                backend::spmv(one, A, *p, zero, *q);
-
-                coef_type alpha = rho1 / inner_product(*q, *p);
-
-                backend::axpby( alpha, *p, one,  x);
-                backend::axpby(-alpha, *q, one, *r);
-
-                res_norm = norm(*r);
-                if (prm.verbose && iter % 5 == 0)
-                    std::cout << iter << "\t" << std::scientific << res_norm / norm_rhs << std::endl;
-            }
-
-            return std::make_tuple(iter, res_norm / norm_rhs);
-        }
-
-        /* Computes the solution for the given right-hand side \p rhs. The
-         * system matrix is the same that was used for the setup of the
-         * preconditioner \p P.  Returns the number of iterations made and the
-         * achieved residual as a ``std::tuple``. The solution vector \p x
-         * provides initial approximation in input and holds the computed
-         * solution on output.
-         */
-        template <class Precond, class Vec1, class Vec2>
-        std::tuple<size_t, scalar_type> operator()(
-                const Precond &P, const Vec1 &rhs, Vec2 &&x) const
-        {
-            return (*this)(P.system_matrix(), P, rhs, x);
-        }
-
-        size_t bytes() const {
-            return
-                backend::bytes(*r) +
-                backend::bytes(*s) +
-                backend::bytes(*p) +
-                backend::bytes(*q);
-        }
-
-        friend std::ostream& operator<<(std::ostream &os, const cg &s) {
-            return os
-                << "Type:             CG"
-                << "\nUnknowns:         " << s.n
-                << "\nMemory footprint: " << human_readable_memory(s.bytes())
-                << std::endl;
-        }
-    public:
-        params prm;
-
-    private:
-        size_t n;
-
-        std::shared_ptr<vector> r;
-        std::shared_ptr<vector> s;
-        std::shared_ptr<vector> p;
-        std::shared_ptr<vector> q;
-
-        InnerProduct inner_product;
-
-        template <class Vec>
-        scalar_type norm(const Vec &x) const {
-            return sqrt(math::norm(inner_product(x, x)));
-        }
-};
-
-} // namespace solver
-} // namespace amgcl
-
-
-#endif
diff --git a/src/solvers/amgcl/solver/detail/default_inner_product.hpp b/src/solvers/amgcl/solver/detail/default_inner_product.hpp
deleted file mode 100644
index 0792c09..0000000
--- a/src/solvers/amgcl/solver/detail/default_inner_product.hpp
+++ /dev/null
@@ -1,61 +0,0 @@
-#ifndef AMGCL_SOLVER_DETAIL_DEFAULT_INNER_PRODUCT_HPP
-#define AMGCL_SOLVER_DETAIL_DEFAULT_INNER_PRODUCT_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/solver/detail/default_inner_product.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Default inner product getter for iterative solvers.
- *
- * Falls through to backend::inner_product().
- */
-
-#include <amgcl/backend/interface.hpp>
-
-namespace amgcl {
-namespace solver {
-namespace detail {
-
-struct default_inner_product {
-    template <class Vec1, class Vec2>
-    typename math::inner_product_impl<
-        typename backend::value_type<Vec1>::type
-    >::return_type
-    operator()(const Vec1 &x, const Vec2 &y) const {
-        return backend::inner_product(x, y);
-    }
-
-    int rank() const {
-        return 0;
-    }
-};
-
-} // namespace detail
-} // namespace solver
-} // namespace amgcl
-
-
-#endif
diff --git a/src/solvers/amgcl/solver/detail/givens_rotations.hpp b/src/solvers/amgcl/solver/detail/givens_rotations.hpp
deleted file mode 100644
index feb399e..0000000
--- a/src/solvers/amgcl/solver/detail/givens_rotations.hpp
+++ /dev/null
@@ -1,67 +0,0 @@
-#ifndef AMGCL_SOLVER_DETAIL_GIVENS_ROTATIONS_HPP
-#define AMGCL_SOLVER_DETAIL_GIVENS_ROTATIONS_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/solver/detail/givens_rotations.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Givens plane rotations used in GMRES variants.
- */
-
-#include <amgcl/value_type/interface.hpp>
-
-namespace amgcl {
-namespace solver {
-namespace detail {
-
-template <class T>
-inline void generate_plane_rotation(T dx, T dy, T &cs, T &sn) {
-    if (math::is_zero(dy)) {
-        cs = 1;
-        sn = 0;
-    } else if (std::abs(dy) > std::abs(dx)) {
-        T tmp = dx / dy;
-        sn = math::inverse(sqrt(math::identity<T>() + tmp * tmp));
-        cs = tmp * sn;
-    } else {
-        T tmp = dy / dx;
-        cs = math::inverse(sqrt(math::identity<T>() + tmp * tmp));
-        sn = tmp * cs;
-    }
-}
-
-template <class T>
-void apply_plane_rotation(T &dx, T &dy, T cs, T sn) {
-    T tmp = math::adjoint(cs) * dx + math::adjoint(sn) * dy;
-    dy = -sn * dx + cs * dy;
-    dx = tmp;
-}
-
-} // namespace detail
-} // namespace solver
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/solver/eigen.hpp b/src/solvers/amgcl/solver/eigen.hpp
deleted file mode 100644
index f851047..0000000
--- a/src/solvers/amgcl/solver/eigen.hpp
+++ /dev/null
@@ -1,108 +0,0 @@
-#ifndef AMGCL_SOLVER_EIGEN_HPP
-#define AMGCL_SOLVER_EIGEN_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
-\file   amgcl/solver/eigen.hpp
-\author Denis Demidov <dennis.demidov@gmail.com>
-\brief  Wrapper around eigen direct solvers.
-*/
-
-#include <Eigen/Dense>
-#include <Eigen/SparseCore>
-
-#include <type_traits>
-
-#include <amgcl/backend/builtin.hpp>
-#include <amgcl/util.hpp>
-
-namespace amgcl {
-namespace solver {
-
-template < class Solver >
-class EigenSolver {
-    public:
-        typedef typename Solver::MatrixType MatrixType;
-        typedef typename Solver::Scalar     value_type;
-
-        typedef amgcl::detail::empty_params params;
-
-        static size_t coarse_enough() {
-            return 3000 / math::static_rows<value_type>::value;
-        }
-
-        template <class Matrix>
-        EigenSolver(const Matrix &A, const params& = params())
-            : n( backend::rows(A) )
-        {
-            typedef
-                typename std::remove_const<
-                    typename std::remove_pointer<
-                        typename backend::col_data_impl<Matrix>::type
-                        >::type
-                    >::type
-                col_type;
-
-            typedef
-                typename std::remove_const<
-                    typename std::remove_pointer<
-                        typename backend::ptr_data_impl<Matrix>::type
-                        >::type
-                    >::type
-                ptr_type;
-
-            S.compute(
-                    MatrixType(
-                        Eigen::Map<Eigen::SparseMatrix<value_type, Eigen::RowMajor, ptrdiff_t>>(
-                            backend::rows(A), backend::cols(A), backend::nonzeros(A),
-                            const_cast<ptr_type*>(backend::ptr_data(A)),
-                            const_cast<col_type*>(backend::col_data(A)),
-                            const_cast<value_type*>(backend::val_data(A))
-                            )
-                        )
-                    );
-        }
-
-        template <class Vec1, class Vec2>
-        void operator()(const Vec1 &rhs, Vec2 &x) const {
-            Eigen::Map< Eigen::Matrix<value_type, Eigen::Dynamic, 1> >
-                RHS(const_cast<value_type*>(&rhs[0]), n), X(&x[0], n);
-
-            X = S.solve(RHS);
-        }
-
-        friend std::ostream& operator<<(std::ostream &os, const EigenSolver &s) {
-            return os << "eigen: " << s.n << " unknowns";
-        }
-    private:
-        ptrdiff_t n;
-        Solver S;
-};
-
-} // namespace solver
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/solver/fgmres.hpp b/src/solvers/amgcl/solver/fgmres.hpp
deleted file mode 100644
index d9457bb..0000000
--- a/src/solvers/amgcl/solver/fgmres.hpp
+++ /dev/null
@@ -1,302 +0,0 @@
-#ifndef AMGCL_SOLVER_FGMRES_HPP
-#define AMGCL_SOLVER_FGMRES_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   fgmres.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Flexible GMRES method.
- */
-
-#include <vector>
-#include <algorithm>
-#include <cmath>
-#include <tuple>
-#include <iostream>
-
-#include <amgcl/backend/interface.hpp>
-#include <amgcl/solver/detail/default_inner_product.hpp>
-#include <amgcl/solver/detail/givens_rotations.hpp>
-#include <amgcl/util.hpp>
-
-namespace amgcl {
-namespace solver {
-
-/** Flexible GMRES method.
- * \rst
- * Flexible version of the GMRES method [Saad03]_.
- * \endrst
- */
-template <
-    class Backend,
-    class InnerProduct = detail::default_inner_product
-    >
-class fgmres {
-    public:
-        typedef Backend backend_type;
-
-        typedef typename Backend::vector     vector;
-        typedef typename Backend::value_type value_type;
-        typedef typename Backend::params     backend_params;
-
-        typedef typename math::scalar_of<value_type>::type scalar_type;
-        typedef typename math::rhs_of<value_type>::type rhs_type;
-        typedef typename math::inner_product_impl<rhs_type>::return_type coef_type;
-
-        /// Solver parameters.
-        struct params {
-            /// Number of inner GMRES iterations per each outer iteration.
-            unsigned M;
-
-            /// Maximum number of iterations.
-            unsigned maxiter;
-
-            /// Target relative residual error.
-            scalar_type tol;
-
-            /// Target absolute residual error.
-            scalar_type abstol;
-
-            /// Ignore the trivial solution x=0 when rhs is zero.
-            //** Useful for searching for the null-space vectors of the system */
-            bool ns_search;
-
-            /// Verbose output (show iterations and error)
-            bool verbose;
-
-            params()
-                : M(30), maxiter(100), tol(1e-8),
-                  abstol(std::numeric_limits<scalar_type>::min()),
-                  ns_search(false), verbose(false)
-            { }
-
-#ifndef AMGCL_NO_BOOST
-            params(const boost::property_tree::ptree &p)
-                : AMGCL_PARAMS_IMPORT_VALUE(p, M),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, maxiter),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, tol),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, abstol),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, ns_search),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, verbose)
-            {
-                check_params(p, {"M", "maxiter", "tol", "abstol", "ns_search", "verbose"});
-            }
-
-            void get(boost::property_tree::ptree &p, const std::string &path) const {
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, M);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, maxiter);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, tol);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, abstol);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, ns_search);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, verbose);
-            }
-#endif
-        } prm;
-
-        /// Preallocates necessary data structures for the system of size \p n.
-        fgmres(
-                size_t n,
-                const params &prm = params(),
-                const backend_params &bprm = backend_params(),
-                const InnerProduct &inner_product = InnerProduct()
-             )
-            : prm(prm), n(n),
-              H(prm.M + 1, prm.M),
-              s(prm.M + 1), cs(prm.M + 1), sn(prm.M + 1),
-              r( Backend::create_vector(n, bprm) ),
-              inner_product(inner_product)
-        {
-            v.reserve(prm.M + 1);
-            for(unsigned i = 0; i <= prm.M; ++i)
-                v.push_back(Backend::create_vector(n, bprm));
-
-            z.reserve(prm.M);
-            for(unsigned i = 0; i < prm.M; ++i)
-                z.push_back(Backend::create_vector(n, bprm));
-        }
-
-        /* Computes the solution for the given system matrix \p A and the
-         * right-hand side \p rhs.  Returns the number of iterations made and
-         * the achieved residual as a ``std::tuple``. The solution vector
-         * \p x provides initial approximation in input and holds the computed
-         * solution on output.
-         *
-         * The system matrix may differ from the matrix used during
-         * initialization. This may be used for the solution of non-stationary
-         * problems with slowly changing coefficients. There is a strong chance
-         * that a preconditioner built for a time step will act as a reasonably
-         * good preconditioner for several subsequent time steps [DeSh12]_.
-         */
-        template <class Matrix, class Precond, class Vec1, class Vec2>
-        std::tuple<size_t, scalar_type> operator()(
-                Matrix  const &A,
-                Precond const &P,
-                Vec1    const &rhs,
-                Vec2          &x
-                ) const
-        {
-            ios_saver ss(std::cout);
-
-            scalar_type norm_rhs = norm(rhs);
-            if (norm_rhs < amgcl::detail::eps<scalar_type>(1)) {
-                if (prm.ns_search) {
-                    norm_rhs = math::identity<scalar_type>();
-                } else {
-                    backend::clear(x);
-                    return std::make_tuple(0, norm_rhs);
-                }
-            }
-
-            scalar_type eps = std::max(prm.tol * norm_rhs, prm.abstol);
-            scalar_type norm_r = math::zero<scalar_type>();
-
-            unsigned iter = 0;
-            while(true) {
-                backend::residual(rhs, A, x, *v[0]);
-
-                // -- Check stopping condition
-                if ((norm_r = norm(*v[0])) < eps || iter >= prm.maxiter)
-                    break;
-
-                // -- Inner GMRES iteration
-                std::fill(s.begin(), s.end(), 0);
-                s[0] = norm_r;
-
-                backend::axpby(math::inverse(norm_r), *v[0],
-                        math::zero<scalar_type>(), *v[0]);
-
-                unsigned j = 0;
-                while(true) {
-                    // -- Arnoldi process
-                    //
-                    // Build an orthonormal basis V and matrix H such that
-                    //     A V_{i-1} = V_{i} H
-
-                    vector &v_new = *v[j+1];
-
-                    P.apply(*v[j], *z[j]);
-                    backend::spmv(math::identity<scalar_type>(), A, *z[j],
-                            math::zero<scalar_type>(), v_new);
-
-                    for(unsigned k = 0; k <= j; ++k) {
-                        H(k, j) = inner_product(v_new, *v[k]);
-                        backend::axpby(-H(k, j), *v[k], math::identity<scalar_type>(), v_new);
-                    }
-                    H(j+1, j) = norm(v_new);
-
-                    backend::axpby(math::inverse(H(j+1, j)), v_new, math::zero<scalar_type>(), v_new);
-
-                    for(unsigned k = 0; k < j; ++k)
-                        detail::apply_plane_rotation(H(k, j), H(k+1, j), cs[k], sn[k]);
-
-                    detail::generate_plane_rotation(H(j, j), H(j+1, j), cs[j], sn[j]);
-                    detail::apply_plane_rotation(H(j, j), H(j+1, j), cs[j], sn[j]);
-                    detail::apply_plane_rotation(s[j], s[j+1], cs[j], sn[j]);
-
-                    scalar_type inner_res = std::abs(s[j+1]);
-
-                    if (prm.verbose && iter % 5 == 0)
-                        std::cout << iter << "\t" << std::scientific << inner_res / norm_rhs << std::endl;
-
-                    // Check for termination
-                    ++j, ++iter;
-                    if (iter >= prm.maxiter || j >= prm.M || inner_res <= eps)
-                        break;
-                }
-
-                // -- GMRES terminated: eval solution
-                for (unsigned i = j; i --> 0; ) {
-                    s[i] /= H(i, i);
-                    for (unsigned k = 0; k < i; ++k)
-                        s[k] -= H(k, i) * s[i];
-                }
-
-                backend::lin_comb(j, s, z, math::identity<scalar_type>(), x);
-            }
-
-            return std::make_tuple(iter, norm_r / norm_rhs);
-        }
-
-        /* Computes the solution for the given right-hand side \p rhs. The
-         * system matrix is the same that was used for the setup of the
-         * preconditioner \p P.  Returns the number of iterations made and the
-         * achieved residual as a ``std::tuple``. The solution vector \p x
-         * provides initial approximation in input and holds the computed
-         * solution on output.
-         */
-        template <class Precond, class Vec1, class Vec2>
-        std::tuple<size_t, scalar_type> operator()(
-                Precond const &P,
-                Vec1    const &rhs,
-                Vec2          &x
-                ) const
-        {
-            return (*this)(P.system_matrix(), P, rhs, x);
-        }
-
-        size_t bytes() const {
-            size_t b = 0;
-
-            b += H.size() * sizeof(coef_type);
-            b += backend::bytes(s);
-            b += backend::bytes(cs);
-            b += backend::bytes(sn);
-            b += backend::bytes(*r);
-
-            for(const auto &x : v) b += backend::bytes(*x);
-            for(const auto &x : z) b += backend::bytes(*x);
-
-            return b;
-        }
-
-        friend std::ostream& operator<<(std::ostream &os, const fgmres &s) {
-            return os
-                << "Type:             FGMRES(" << s.prm.M << ")"
-                << "\nUnknowns:         " << s.n
-                << "\nMemory footprint: " << human_readable_memory(s.bytes())
-                << std::endl;
-        }
-    private:
-        size_t n;
-
-        mutable multi_array<coef_type, 2> H;
-        mutable std::vector<coef_type> s, cs, sn;
-        std::shared_ptr<vector> r;
-        std::vector< std::shared_ptr<vector> > v;
-        std::vector< std::shared_ptr<vector> > z;
-
-        InnerProduct inner_product;
-
-        template <class Vec>
-        scalar_type norm(const Vec &x) const {
-            return std::abs(sqrt(inner_product(x, x)));
-        }
-};
-
-} // namespace solver
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/solver/gmres.hpp b/src/solvers/amgcl/solver/gmres.hpp
deleted file mode 100644
index 5ed74f2..0000000
--- a/src/solvers/amgcl/solver/gmres.hpp
+++ /dev/null
@@ -1,322 +0,0 @@
-#ifndef AMGCL_SOLVER_GMRES_HPP
-#define AMGCL_SOLVER_GMRES_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   gmres.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  GMRES method.
- */
-
-#include <vector>
-#include <algorithm>
-#include <cmath>
-#include <tuple>
-#include <iostream>
-
-#include <amgcl/backend/interface.hpp>
-#include <amgcl/solver/detail/default_inner_product.hpp>
-#include <amgcl/solver/detail/givens_rotations.hpp>
-#include <amgcl/solver/precond_side.hpp>
-#include <amgcl/util.hpp>
-
-namespace amgcl {
-namespace solver {
-
-/** Generalized Minimal Residual (GMRES) method.
- * \rst
- * The Generalized Minimal Residual method is an extension of MINRES (which is
- * only applicable to symmetric systems) to unsymmetric systems [Barr94]_.
- * \endrst
- */
-template <
-    class Backend,
-    class InnerProduct = detail::default_inner_product
-    >
-class gmres {
-    public:
-        typedef Backend backend_type;
-
-        typedef typename Backend::vector     vector;
-        typedef typename Backend::value_type value_type;
-        typedef typename Backend::params     backend_params;
-
-        typedef typename math::scalar_of<value_type>::type scalar_type;
-        typedef typename math::rhs_of<value_type>::type rhs_type;
-        typedef typename math::inner_product_impl<rhs_type>::return_type coef_type;
-
-        /// Solver parameters.
-        struct params {
-            /// Number of iterations before restart.
-            unsigned M;
-
-            /// Preconditioning kind (left/right).
-            preconditioner::side::type pside;
-
-            /// Maximum number of iterations.
-            unsigned maxiter;
-
-            /// Target relative residual error.
-            scalar_type tol;
-
-            /// Target absolute residual error.
-            scalar_type abstol;
-
-            /// Ignore the trivial solution x=0 when rhs is zero.
-            //** Useful for searching for the null-space vectors of the system */
-            bool ns_search;
-
-            /// Verbose output (show iterations and error)
-            bool verbose;
-
-            params()
-                : M(30), pside(preconditioner::side::right), maxiter(100), tol(1e-8),
-                  abstol(std::numeric_limits<scalar_type>::min()), ns_search(false),
-                  verbose(false)
-            { }
-
-#ifndef AMGCL_NO_BOOST
-            params(const boost::property_tree::ptree &p)
-                : AMGCL_PARAMS_IMPORT_VALUE(p, M),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, pside),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, maxiter),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, tol),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, abstol),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, ns_search),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, verbose)
-            {
-                check_params(p, {"M", "pside", "maxiter", "tol", "abstol",
-                        "ns_search", "verbose"});
-            }
-
-            void get(boost::property_tree::ptree &p, const std::string &path) const {
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, M);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, pside);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, maxiter);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, tol);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, abstol);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, ns_search);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, verbose);
-            }
-#endif
-        };
-
-        /// Preallocates necessary data structures for the system of size \p n.
-        gmres(
-                size_t n,
-                const params &prm = params(),
-                const backend_params &backend_prm = backend_params(),
-                const InnerProduct &inner_product = InnerProduct()
-             )
-            : prm(prm), n(n),
-              H(prm.M + 1, prm.M),
-              s(prm.M + 1), cs(prm.M + 1), sn(prm.M + 1),
-              r( Backend::create_vector(n, backend_prm) ),
-              inner_product(inner_product)
-        {
-            v.reserve(prm.M + 1);
-            for(unsigned i = 0; i <= prm.M; ++i)
-                v.push_back( Backend::create_vector(n, backend_prm) );
-        }
-
-        /* Computes the solution for the given system matrix \p A and the
-         * right-hand side \p rhs.  Returns the number of iterations made and
-         * the achieved residual as a ``std::tuple``. The solution vector
-         * \p x provides initial approximation in input and holds the computed
-         * solution on output.
-         *
-         * The system matrix may differ from the matrix used during
-         * initialization. This may be used for the solution of non-stationary
-         * problems with slowly changing coefficients. There is a strong chance
-         * that a preconditioner built for a time step will act as a reasonably
-         * good preconditioner for several subsequent time steps [DeSh12]_.
-         */
-        template <class Matrix, class Precond, class Vec1, class Vec2>
-        std::tuple<size_t, scalar_type> operator()(
-                Matrix  const &A,
-                Precond const &P,
-                Vec1    const &rhs,
-                Vec2          &x
-                ) const
-        {
-            namespace side = preconditioner::side;
-
-            static const scalar_type zero = math::zero<scalar_type>();
-            static const scalar_type one  = math::identity<scalar_type>();
-
-            ios_saver ss(std::cout);
-
-            scalar_type norm_rhs = norm(rhs);
-            if (norm_rhs < amgcl::detail::eps<scalar_type>(1)) {
-                if (prm.ns_search) {
-                    norm_rhs = math::identity<scalar_type>();
-                } else {
-                    backend::clear(x);
-                    return std::make_tuple(0, norm_rhs);
-                }
-            }
-
-            scalar_type eps = std::max(prm.tol * norm_rhs, prm.abstol);
-            scalar_type norm_r = zero;
-
-            size_t iter = 0;
-            while(true) {
-                if (prm.pside == side::left) {
-                    backend::residual(rhs, A, x, *v[0]);
-                    P.apply(*v[0], *r);
-                } else {
-                    backend::residual(rhs, A, x, *r);
-                }
-
-                // -- Check stopping condition
-                norm_r = norm(*r);
-                if (norm_r < eps || iter >= prm.maxiter) break;
-
-                // -- Inner GMRES iteration
-                backend::axpby(math::inverse(norm_r), *r, zero, *v[0]);
-
-                std::fill(s.begin(), s.end(), 0);
-                s[0] = norm_r;
-
-                unsigned j = 0;
-                while(true) {
-                    // -- Arnoldi process
-                    //
-                    // Build an orthonormal basis V and matrix H such that
-                    //     A V_{i-1} = V_{i} H
-                    vector &v_new = *v[j+1];
-
-                    preconditioner::spmv(prm.pside, P, A, *v[j], v_new, *r);
-
-                    for(unsigned k = 0; k <= j; ++k) {
-                        H(k, j) = inner_product(v_new, *v[k]);
-                        backend::axpby(-H(k, j), *v[k], one, v_new);
-                    }
-                    H(j+1, j) = norm(v_new);
-
-                    backend::axpby(math::inverse(H(j+1, j)), v_new, zero, v_new);
-
-                    for(unsigned k = 0; k < j; ++k)
-                        detail::apply_plane_rotation(H(k, j), H(k+1, j), cs[k], sn[k]);
-
-                    detail::generate_plane_rotation(H(j, j), H(j+1, j), cs[j], sn[j]);
-                    detail::apply_plane_rotation(H(j, j), H(j+1, j), cs[j], sn[j]);
-                    detail::apply_plane_rotation(s[j], s[j+1], cs[j], sn[j]);
-
-                    scalar_type inner_res = std::abs(s[j+1]);
-
-                    if (prm.verbose && iter % 5 == 0)
-                        std::cout << iter << "\t" << std::scientific << inner_res / norm_rhs << std::endl;
-
-                    // Check for termination
-                    ++j, ++iter;
-                    if (iter >= prm.maxiter || j >= prm.M || inner_res <= eps)
-                        break;
-                }
-
-                // -- GMRES terminated: eval solution
-                for (unsigned i = j; i --> 0; ) {
-                    s[i] /= H(i, i);
-                    for (unsigned k = 0; k < i; ++k)
-                        s[k] -= H(k, i) * s[i];
-                }
-
-                // -- Apply step
-                vector &dx = *r;
-                backend::lin_comb(j, s, v, zero, dx);
-
-                if (prm.pside == side::left) {
-                    backend::axpby(one, dx, one, x);
-                } else {
-                    vector &tmp = *v[0];
-                    P.apply(dx, tmp);
-                    backend::axpby(one, tmp, one, x);
-                }
-            }
-
-            return std::make_tuple(iter, norm_r / norm_rhs);
-        }
-
-        /* Computes the solution for the given right-hand side \p rhs. The
-         * system matrix is the same that was used for the setup of the
-         * preconditioner \p P.  Returns the number of iterations made and the
-         * achieved residual as a ``std::tuple``. The solution vector \p x
-         * provides initial approximation in input and holds the computed
-         * solution on output.
-         */
-        template <class Precond, class Vec1, class Vec2>
-        std::tuple<size_t, scalar_type> operator()(
-                Precond const &P,
-                Vec1    const &rhs,
-                Vec2          &x
-                ) const
-        {
-            return (*this)(P.system_matrix(), P, rhs, x);
-        }
-
-        friend std::ostream& operator<<(std::ostream &os, const gmres &s) {
-            return os
-                << "Type:             GMRES(" << s.prm.M << ")"
-                << "\nUnknowns:         " << s.n
-                << "\nMemory footprint: " << human_readable_memory(s.bytes())
-                << std::endl;
-        }
-    public:
-        params prm;
-
-        size_t bytes() const {
-            size_t b = 0;
-
-            b += H.size() * sizeof(coef_type);
-            b += backend::bytes(s);
-            b += backend::bytes(cs);
-            b += backend::bytes(sn);
-            b += backend::bytes(*r);
-
-            for(const auto &x : v) b += backend::bytes(*x);
-
-            return b;
-        }
-    private:
-        size_t n;
-
-        mutable multi_array<coef_type, 2> H;
-        mutable std::vector<coef_type> s, cs, sn;
-        std::shared_ptr<vector> r;
-        std::vector< std::shared_ptr<vector> > v;
-
-        InnerProduct inner_product;
-
-        template <class Vec>
-        scalar_type norm(const Vec &x) const {
-            return std::abs(sqrt(inner_product(x, x)));
-        }
-};
-
-} // namespace solver
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/solver/idrs.hpp b/src/solvers/amgcl/solver/idrs.hpp
deleted file mode 100644
index 4e33312..0000000
--- a/src/solvers/amgcl/solver/idrs.hpp
+++ /dev/null
@@ -1,493 +0,0 @@
-#ifndef AMGCL_SOLVER_IDRS_HPP
-#define AMGCL_SOLVER_IDRS_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
-\file   idrs.hpp
-\author Denis Demidov <dennis.demidov@gmail.com>
-\brief  IDR(s) method.
-
-The code is ported from Matlab code published at
-http://ta.twi.tudelft.nl/nw/users/gijzen/IDR.html.
-
-This is a very stable and efficient IDR(s) variant (implemented in the MATLAB
-code idrs.m given above) as described in: Martin B. van Gijzen and Peter
-Sonneveld, Algorithm 913: An Elegant IDR(s) Variant that Efficiently Exploits
-Bi-orthogonality Properties. ACM Transactions on Mathematical Software, Vol.
-38, No. 1, pp. 5:1-5:19, 2011 (copyright ACM).
-*/
-
-#include <vector>
-#include <algorithm>
-#include <iostream>
-
-#include <tuple>
-#include <random>
-
-#include <amgcl/backend/interface.hpp>
-#include <amgcl/solver/detail/default_inner_product.hpp>
-#include <amgcl/util.hpp>
-
-#ifdef MPI_VERSION
-#  include <amgcl/mpi/util.hpp>
-#endif
-
-#ifdef _OPENMP
-#  include <omp.h>
-#endif
-
-namespace amgcl {
-namespace solver {
-
-/// IDR(s) method (Induced Dimension Reduction)
-template <
-    class Backend,
-    class InnerProduct = detail::default_inner_product
-    >
-class idrs {
-    public:
-        typedef Backend backend_type;
-
-        typedef typename Backend::vector     vector;
-        typedef typename Backend::value_type value_type;
-        typedef typename Backend::params     backend_params;
-
-        typedef typename math::scalar_of<value_type>::type scalar_type;
-        typedef typename math::rhs_of<value_type>::type rhs_type;
-
-        typedef typename math::inner_product_impl<
-            typename math::rhs_of<value_type>::type
-            >::return_type coef_type;
-
-        /// Solver parameters.
-        struct params {
-            /// Dimension of the shadow space in IDR(s).
-            unsigned s;
-
-            /// Computation of omega.
-            /**
-             * If omega = 0: a standard minimum residual step is performed
-             * If omega > 0: omega is increased if
-             * the cosine of the angle between Ar and r < omega
-             * Default: omega = 0.7;
-             */
-            scalar_type omega;
-
-            /// Specifies if residual smoothing must be applied.
-            bool smoothing;
-
-            /// Residual replacement.
-            /**
-             * Determines the residual replacement strategy.
-             * If true, the recursively computed residual is replaced by the
-             * true residual.
-             * Default: No residual replacement.
-             */
-            bool replacement;
-
-            /// Maximum number of iterations.
-            unsigned maxiter;
-
-            /// Target relative residual error.
-            scalar_type tol;
-
-            /// Target absolute residual error.
-            scalar_type abstol;
-
-            /// Ignore the trivial solution x=0 when rhs is zero.
-            //** Useful for searching for the null-space vectors of the system */
-            bool ns_search;
-
-            /// Verbose output (show iterations and error)
-            bool verbose;
-
-            params()
-                : s(4), omega(0.7), smoothing(false),
-                  replacement(false), maxiter(100), tol(1e-8),
-                  abstol(std::numeric_limits<scalar_type>::min()),
-                  ns_search(false), verbose(false)
-            { }
-
-#ifndef AMGCL_NO_BOOST
-            params(const boost::property_tree::ptree &p)
-                : AMGCL_PARAMS_IMPORT_VALUE(p, s),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, omega),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, smoothing),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, replacement),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, maxiter),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, tol),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, abstol),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, ns_search),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, verbose)
-            {
-                check_params(p, {"s", "omega", "smoothing", "replacement",
-                        "maxiter", "tol", "abstol", "ns_search", "verbose"});
-            }
-
-            void get(boost::property_tree::ptree &p, const std::string &path) const {
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, s);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, omega);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, smoothing);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, replacement);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, maxiter);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, tol);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, abstol);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, ns_search);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, verbose);
-            }
-#endif
-        } prm;
-
-        /// Preallocates necessary data structures for the system of size \p n.
-        idrs(
-                size_t n,
-                const params &prm = params(),
-                const backend_params &bprm = backend_params(),
-                const InnerProduct &inner_product = InnerProduct()
-             )
-            : prm(prm), n(n), inner_product(inner_product),
-              M(prm.s, prm.s),
-              f(prm.s), c(prm.s),
-              r(Backend::create_vector(n, bprm)),
-              v(Backend::create_vector(n, bprm)),
-              t(Backend::create_vector(n, bprm))
-        {
-            static const scalar_type one = math::identity<scalar_type>();
-            static const scalar_type zero = math::zero<scalar_type>();
-
-            if (prm.smoothing) {
-              x_s = Backend::create_vector(n, bprm);
-              r_s = Backend::create_vector(n, bprm);
-            }
-
-            G.reserve(prm.s);
-            U.reserve(prm.s);
-            for(unsigned i = 0; i < prm.s; ++i) {
-                G.push_back(Backend::create_vector(n, bprm));
-                U.push_back(Backend::create_vector(n, bprm));
-            }
-
-            // Initialize P.
-            P.reserve(prm.s);
-            {
-                std::vector<rhs_type> p(n);
-
-                int pid = inner_product.rank();
-
-#pragma omp parallel
-                {
-#ifdef _OPENMP
-                    int tid = omp_get_thread_num();
-                    int nt = omp_get_max_threads();
-#else
-                    int tid = 0;
-                    int nt = 1;
-#endif
-
-                    std::mt19937 rng(pid * nt + tid);
-                    std::uniform_real_distribution<scalar_type> rnd(-1, 1);
-
-                    for(unsigned j = 0; j < prm.s; ++j) {
-#pragma omp for
-                        for(ptrdiff_t i = 0; i < static_cast<ptrdiff_t>(n); ++i)
-                            p[i] = math::constant<rhs_type>(rnd(rng));
-
-#pragma omp single
-                        {
-                            P.push_back(Backend::copy_vector(p, bprm));
-                        }
-                    }
-                }
-
-                for(unsigned j = 0; j < prm.s; ++j) {
-                    for(unsigned k = 0; k < j; ++k) {
-                        coef_type alpha = inner_product(*P[k], *P[j]);
-                        backend::axpby(-alpha, *P[k], one, *P[j]);
-                    }
-                    scalar_type norm_pj = norm(*P[j]);
-                    backend::axpby(math::inverse(norm_pj), *P[j], zero, *P[j]);
-                }
-            }
-        }
-
-        /* Computes the solution for the given system matrix \p A and the
-         * right-hand side \p rhs.  Returns the number of iterations made and
-         * the achieved residual as a ``std::tuple``. The solution vector
-         * \p x provides initial approximation in input and holds the computed
-         * solution on output.
-         *
-         * The system matrix may differ from the matrix used during
-         * initialization. This may be used for the solution of non-stationary
-         * problems with slowly changing coefficients. There is a strong chance
-         * that a preconditioner built for a time step will act as a reasonably
-         * good preconditioner for several subsequent time steps [DeSh12]_.
-         */
-        template <class Matrix, class Precond, class Vec1, class Vec2>
-        std::tuple<size_t, scalar_type> operator()(
-                Matrix  const &A,
-                Precond const &Prec,
-                Vec1    const &rhs,
-                Vec2          &x
-                ) const
-        {
-            static const scalar_type one = math::identity<scalar_type>();
-            static const scalar_type zero = math::zero<scalar_type>();
-
-            ios_saver ss(std::cout);
-
-            scalar_type norm_rhs = norm(rhs);
-            if (norm_rhs < amgcl::detail::eps<scalar_type>(1)) {
-                if (prm.ns_search) {
-                    norm_rhs = math::identity<scalar_type>();
-                } else {
-                    backend::clear(x);
-                    return std::make_tuple(0, norm_rhs);
-                }
-            }
-
-            scalar_type eps = std::max(prm.tol * norm_rhs, prm.abstol);
-
-            // Compute initial residual:
-            backend::residual(rhs, A, x, *r);
-
-            scalar_type res_norm = norm(*r);
-            if (res_norm <= eps) {
-                // Initial guess is a good enough solution.
-                return std::make_tuple(0, res_norm / norm_rhs);
-            }
-
-            if (prm.smoothing) {
-                backend::copy( x, *x_s);
-                backend::copy(*r, *r_s);
-            }
-
-            // Initialization.
-            coef_type om = math::identity<coef_type>();
-
-            for(unsigned i = 0; i < prm.s; ++i) {
-                backend::clear(*G[i]);
-                backend::clear(*U[i]);
-
-                for(unsigned j = 0; j < prm.s; ++j)
-                    M(i, j) = (i == j);
-            }
-
-            // Main iteration loop, build G-spaces:
-            size_t iter = 0;
-            while(iter < prm.maxiter && res_norm > eps) {
-                // New righ-hand size for small system:
-                for(unsigned i = 0; i < prm.s; ++i)
-                    f[i] = inner_product(*r, *P[i]);
-
-                for(unsigned k = 0; k < prm.s; ++k) {
-                    // Compute new v
-                    backend::copy(*r, *v);
-
-                    // Solve small system (Note: M is lower triangular)
-                    // and make v orthogonal to P:
-                    for(unsigned i = k; i < prm.s; ++i) {
-                        c[i] = f[i];
-                        for(unsigned j = k; j < i; ++j)
-                            c[i] -= M(i, j) * c[j];
-                        c[i] = math::inverse(M(i, i)) * c[i];
-
-                        backend::axpby(-c[i], *G[i], one, *v);
-                    }
-
-                    Prec.apply(*v, *t);
-
-                    // Compute new U[k]
-                    backend::axpby(om, *t, c[k], *U[k]);
-                    for(unsigned i = k+1; i < prm.s; ++i)
-                        backend::axpby(c[i], *U[i], one, *U[k]);
-
-                    // Compute new G[k], G[k] is in space G_j
-                    backend::spmv(one, A, *U[k], zero, *G[k]);
-
-                    // Bi-Orthogonalise the new basis vectors:
-                    for(unsigned i = 0; i < k; ++i) {
-                        coef_type alpha = inner_product(*G[k], *P[i]) / M(i, i);
-
-                        backend::axpby(-alpha, *G[i], one, *G[k]);
-                        backend::axpby(-alpha, *U[i], one, *U[k]);
-                    }
-
-                    // New column of M = P'*G  (first k-1 entries are zero)
-                    for(unsigned i = k; i < prm.s; ++i)
-                        M(i, k) = inner_product(*G[k], *P[i]);
-
-                    precondition(!math::is_zero(M(k, k)), "IDR(s) breakdown: zero M[k,k]");
-
-                    // Make r orthogonal to q_i, i = [0..k)
-                    coef_type beta = math::inverse(M(k, k)) * f[k];
-                    backend::axpby(-beta, *G[k], one, *r);
-                    backend::axpby( beta, *U[k], one,  x);
-
-                    res_norm = norm(*r);
-
-                    // Smoothing
-                    if (prm.smoothing) {
-                        backend::axpbypcz(one, *r_s, -one, *r, zero, *t);
-                        coef_type gamma = inner_product(*t, *r_s) / inner_product(*t, *t);
-                        backend::axpby(-gamma, *t, one, *r_s);
-                        backend::axpbypcz(-gamma, *x_s, gamma, x, one, *x_s);
-                        res_norm = norm(*r_s);
-                    }
-
-                    if (prm.verbose && iter % 5 == 0)
-                        std::cout << iter << "\t" << std::scientific << res_norm / norm_rhs << std::endl;
-                    if (res_norm <= eps || ++iter >= prm.maxiter) break;
-
-                    // New f = P'*r (first k  components are zero)
-                    for(unsigned i = k + 1; i < prm.s; ++i)
-                        f[i] -= beta * M(i, k);
-                }
-
-                if (res_norm <= eps || iter >= prm.maxiter) break;
-
-                // Now we have sufficient vectors in G_j to compute residual in G_j+1
-                // Note: r is already perpendicular to P so v = r
-
-                Prec.apply(*r, *v);
-                backend::spmv(one, A, *v, zero, *t);
-
-                // Computation of a new omega
-                om = omega(*t, *r);
-                precondition(!math::is_zero(om), "IDR(s) breakdown: zero omega");
-
-                backend::axpby(-om, *t, one, *r);
-                backend::axpby( om, *v, one,  x);
-
-                if (prm.replacement) {
-                    backend::residual(rhs, A, x, *r);
-                }
-                res_norm = norm(*r);
-
-                // Smoothing.
-                if (prm.smoothing) {
-                    backend::axpbypcz(one, *r_s, -one, *r, zero, *t);
-                    coef_type gamma = inner_product(*t, *r_s) / inner_product(*t, *t);
-                    backend::axpby(-gamma, *t, one, *r_s);
-                    backend::axpbypcz(-gamma, *x_s, gamma, x, one, *x_s);
-                    res_norm = norm(*r_s);
-                }
-
-                ++iter;
-            }
-
-            if (prm.smoothing)
-                backend::copy(*x_s, x);
-
-            return std::make_tuple(iter, res_norm / norm_rhs);
-        }
-
-        /* Computes the solution for the given right-hand side \p rhs. The
-         * system matrix is the same that was used for the setup of the
-         * preconditioner \p P.  Returns the number of iterations made and the
-         * achieved residual as a ``std::tuple``. The solution vector \p x
-         * provides initial approximation in input and holds the computed
-         * solution on output.
-         */
-        template <class Precond, class Vec1, class Vec2>
-        std::tuple<size_t, scalar_type> operator()(
-                Precond const &P,
-                Vec1    const &rhs,
-                Vec2          &x
-                ) const
-        {
-            return (*this)(P.system_matrix(), P, rhs, x);
-        }
-
-        size_t bytes() const {
-            size_t b = 0;
-
-            b += M.size() * sizeof(coef_type);
-
-            b += backend::bytes(f);
-            b += backend::bytes(c);
-
-            b += backend::bytes(*r);
-            b += backend::bytes(*v);
-            b += backend::bytes(*t);
-
-            if (x_s) b += backend::bytes(*x_s);
-            if (r_s) b += backend::bytes(*r_s);
-
-            for(const auto &v : P) b += backend::bytes(*v);
-            for(const auto &v : G) b += backend::bytes(*v);
-            for(const auto &v : U) b += backend::bytes(*v);
-
-            return b;
-        }
-
-        friend std::ostream& operator<<(std::ostream &os, const idrs &s) {
-            return os
-                << "Type:             IDR(" << s.prm.s << ")"
-                << "\nUnknowns:         " << s.n
-                << "\nMemory footprint: " << human_readable_memory(s.bytes())
-                << std::endl;
-        }
-
-    private:
-        size_t n;
-
-        InnerProduct inner_product;
-
-        mutable multi_array<coef_type,2> M;
-        mutable std::vector<coef_type> f, c;
-
-        std::shared_ptr<vector> r, v, t;
-        std::shared_ptr<vector> x_s;
-        std::shared_ptr<vector> r_s;
-
-        std::vector< std::shared_ptr<vector> > P, G, U;
-
-
-        template <class Vec>
-        scalar_type norm(const Vec &x) const {
-            return std::abs(sqrt(inner_product(x, x)));
-        }
-
-        template <class Vector1, class Vector2>
-        coef_type omega(const Vector1 &t, const Vector2 &s) const {
-            scalar_type norm_t = norm(t);
-            scalar_type norm_s = norm(s);
-
-            coef_type   ts  = inner_product(t, s);
-            scalar_type rho = math::norm(ts / (norm_t * norm_s));
-            coef_type   om  = ts / (norm_t * norm_t);
-
-            if (rho < prm.omega)
-                om *= prm.omega/rho;
-
-            return om;
-        }
-};
-
-} // namespace solver
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/solver/lgmres.hpp b/src/solvers/amgcl/solver/lgmres.hpp
deleted file mode 100644
index 3e18ced..0000000
--- a/src/solvers/amgcl/solver/lgmres.hpp
+++ /dev/null
@@ -1,444 +0,0 @@
-#ifndef AMGCL_SOLVER_LGMRES_HPP
-#define AMGCL_SOLVER_LGMRES_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   lgmres.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  LGMRES method.
- *
- * Ported from scipy lgmres. The original code came with the following license:
- * \verbatim
-   Copyright (c) 2001, 2002 Enthought, Inc.
-   All rights reserved.
-
-   Copyright (c) 2003-2016 SciPy Developers.
-   All rights reserved.
-
-   Redistribution and use in source and binary forms, with or without
-   modification, are permitted provided that the following conditions are met:
-
-     a. Redistributions of source code must retain the above copyright notice,
-        this list of conditions and the following disclaimer.
-     b. Redistributions in binary form must reproduce the above copyright
-        notice, this list of conditions and the following disclaimer in the
-        documentation and/or other materials provided with the distribution.
-     c. Neither the name of Enthought nor the names of the SciPy Developers
-        may be used to endorse or promote products derived from this software
-        without specific prior written permission.
-
-
-   THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
-   AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
-   IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
-   ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDERS OR CONTRIBUTORS
-   BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY,
-   OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-   SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
-   INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
-   CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
-   ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF
-   THE POSSIBILITY OF SUCH DAMAGE.
- * \endverbatim
- */
-
-#include <vector>
-#include <algorithm>
-#include <cmath>
-#include <tuple>
-#include <iostream>
-
-#include <amgcl/backend/interface.hpp>
-#include <amgcl/solver/detail/default_inner_product.hpp>
-#include <amgcl/solver/detail/givens_rotations.hpp>
-#include <amgcl/solver/precond_side.hpp>
-#include <amgcl/util.hpp>
-
-namespace amgcl {
-namespace solver {
-
-/** "Loose" GMRES.
- * \rst
- * The LGMRES algorithm [BaJM05]_  is designed to avoid some problems
- * in the convergence in restarted GMRES, and often converges in fewer
- * iterations.
- * \endrst
- */
-template <
-    class Backend,
-    class InnerProduct = detail::default_inner_product
-    >
-class lgmres {
-    public:
-        typedef Backend backend_type;
-
-        typedef typename Backend::vector     vector;
-        typedef typename Backend::value_type value_type;
-        typedef typename Backend::params     backend_params;
-
-        typedef typename math::scalar_of<value_type>::type scalar_type;
-        typedef typename math::rhs_of<value_type>::type rhs_type;
-        typedef typename math::inner_product_impl<rhs_type>::return_type coef_type;
-
-        /// Solver parameters.
-        struct params {
-            /// Number of inner GMRES iterations per each outer iteration.
-            unsigned M;
-
-            /// Number of vectors to carry between inner GMRES iterations.
-            /**
-             * According to [BaJM05], good values are in the range of 1...3.
-             * However, note that if you want to use the additional vectors to
-             * accelerate solving multiple similar problems, larger values may
-             * be beneficial.
-             */
-            unsigned K;
-
-            /// Reset augmented vectors between solves.
-            /** If the solver is used to repeatedly solve similar problems,
-             *  then keeping the augmented vectors between solves may speed up
-             *  subsequent solves.
-             *  This flag, when set, resets the augmented vectors at the
-             *  beginning of each solve.
-             */
-            bool always_reset;
-
-            /// Preconditioning kind (left/right).
-            preconditioner::side::type pside;
-
-            /// Maximum number of iterations.
-            size_t maxiter;
-
-            /// Target relative residual error.
-            scalar_type tol;
-
-            /// Target absolute residual error.
-            scalar_type abstol;
-
-            /// Ignore the trivial solution x=0 when rhs is zero.
-            //** Useful for searching for the null-space vectors of the system */
-            bool ns_search;
-
-            /// Verbose output (show iterations and error)
-            bool verbose;
-
-            params()
-                : M(30), K(3), always_reset(true),
-                  pside(preconditioner::side::right), maxiter(100), tol(1e-8),
-                  abstol(std::numeric_limits<scalar_type>::min()),
-                  ns_search(false), verbose(false)
-            { }
-
-#ifndef AMGCL_NO_BOOST
-            params(const boost::property_tree::ptree &p)
-                : AMGCL_PARAMS_IMPORT_VALUE(p, M),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, K),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, always_reset),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, pside),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, maxiter),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, tol),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, abstol),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, ns_search),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, verbose)
-            {
-                check_params(p, {"pside", "M", "K", "always_reset", "maxiter",
-                        "tol", "abstol", "ns_search", "verbose"});
-            }
-
-            void get(boost::property_tree::ptree &p, const std::string &path) const {
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, M);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, K);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, always_reset);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, pside);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, maxiter);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, tol);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, abstol);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, ns_search);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, verbose);
-            }
-#endif
-        } prm;
-
-        /// Preallocates necessary data structures for the system of size \p n.
-        lgmres(
-                size_t n,
-                const params &prm = params(),
-                const backend_params &bprm = backend_params(),
-                const InnerProduct &inner_product = InnerProduct()
-             )
-            : prm(prm), n(n), M(prm.M + prm.K),
-              H(M + 1, M),
-              H0(M + 1, M),
-              s(M + 1), cs(M + 1), sn(M + 1),
-              r( Backend::create_vector(n, bprm) ),
-              ws(M), outer_v(prm.K),
-              inner_product(inner_product)
-        {
-            outer_v_data.reserve(prm.K);
-            for(unsigned i = 0; i < prm.K; ++i)
-                outer_v_data.push_back(Backend::create_vector(n, bprm));
-
-            vs.reserve(M + 1);
-            for(unsigned i = 0; i <= M; ++i)
-                vs.push_back(Backend::create_vector(n, bprm));
-        }
-
-        /* Computes the solution for the given system matrix \p A and the
-         * right-hand side \p rhs.  Returns the number of iterations made and
-         * the achieved residual as a ``std::tuple``. The solution vector
-         * \p x provides initial approximation in input and holds the computed
-         * solution on output.
-         *
-         * The system matrix may differ from the matrix used during
-         * initialization. This may be used for the solution of non-stationary
-         * problems with slowly changing coefficients. There is a strong chance
-         * that a preconditioner built for a time step will act as a reasonably
-         * good preconditioner for several subsequent time steps [DeSh12]_.
-         */
-        template <class Matrix, class Precond, class Vec1, class Vec2>
-        std::tuple<size_t, scalar_type> operator()(
-                Matrix  const &A,
-                Precond const &P,
-                Vec1    const &rhs,
-                Vec2          &x
-                ) const
-        {
-            namespace side = preconditioner::side;
-
-            static const scalar_type zero = math::zero<scalar_type>();
-            static const scalar_type one  = math::identity<scalar_type>();
-
-            ios_saver ss(std::cout);
-
-            if (prm.always_reset) {
-                outer_v.clear();
-            }
-
-            scalar_type norm_rhs = norm(rhs);
-            if (norm_rhs < amgcl::detail::eps<scalar_type>(1)) {
-                if (prm.ns_search) {
-                    norm_rhs = math::identity<scalar_type>();
-                } else {
-                    backend::clear(x);
-                    return std::make_tuple(0, norm_rhs);
-                }
-            }
-
-            scalar_type norm_r = zero;
-            scalar_type eps    = std::max(prm.tol * norm_rhs, prm.abstol);
-
-            unsigned iter = 0, n_outer = 0;
-            while(true) {
-                if (prm.pside == side::left) {
-                    backend::residual(rhs, A, x, *vs[0]);
-                    P.apply(*vs[0], *r);
-                } else {
-                    backend::residual(rhs, A, x, *r);
-                }
-
-                // -- Check stopping condition
-                norm_r = norm(*r);
-                if (norm_r < eps || iter >= prm.maxiter) break;
-
-                // -- Inner LGMRES iteration
-                backend::axpby(math::inverse(norm_r), *r, zero, *vs[0]);
-
-                std::fill(s.begin(), s.end(), 0);
-                s[0] = norm_r;
-
-                unsigned j = 0;
-                while(true) {
-                    // -- Arnoldi process:
-                    //
-                    // Build an orthonormal basis V and matrices W and H such that
-                    //     A W = V H
-                    // Columns of W, V, and H are stored in `ws`, `vs` and `hs`.
-                    //
-                    // The first column of V is always the residual vector,
-                    // `vs0`; V has *one more column* than the other of the
-                    // three matrices.
-                    //
-                    // The other columns in V are built by feeding in, one by
-                    // one, some vectors `z` and orthonormalizing them against
-                    // the basis so far. The trick here is to feed in first
-                    // some augmentation vectors, before starting to construct
-                    // the Krylov basis on `v0`.
-                    //
-                    // It was shown in [BaJM05] that a good choice (the LGMRES
-                    // choice) for these augmentation vectors are the `dx`
-                    // vectors obtained from a couple of the previous restart
-                    // cycles.
-                    //
-                    // Note especially that while `vs0` is always the first
-                    // column in V, there is no reason why it should also be
-                    // the first column in W. (In fact, below `vs0` comes in W
-                    // only after the augmentation vectors.)
-                    //
-                    // The rest of the algorithm then goes as in GMRES, one
-                    // solves a minimization problem in the smaller subspace
-                    // spanned by W (range) and V (image).
-
-                    vector &v_new = *vs[j+1];
-
-                    std::shared_ptr<vector> z;
-                    if (j >= M - outer_v.size()) {
-                        z = outer_v[j - (M - outer_v.size())];
-                    } else {
-                        z = vs[j];
-                    }
-
-                    ws[j] = z;
-
-                    preconditioner::spmv(prm.pside, P, A, *z, v_new, *r);
-
-                    for(unsigned k = 0; k <= j; ++k) {
-                        H0(k, j) = H(k, j) = inner_product(v_new, *vs[k]);
-                        backend::axpby(-H(k, j), *vs[k], one, v_new);
-                    }
-                    H0(j+1, j) = H(j+1, j) = norm(v_new);
-
-                    backend::axpby(math::inverse(H(j+1, j)), v_new, zero, v_new);
-
-                    for(unsigned k = 0; k < j; ++k)
-                        detail::apply_plane_rotation(H(k, j), H(k+1, j), cs[k], sn[k]);
-
-                    detail::generate_plane_rotation(H(j, j), H(j+1, j), cs[j], sn[j]);
-                    detail::apply_plane_rotation(H(j, j), H(j+1, j), cs[j], sn[j]);
-                    detail::apply_plane_rotation(s[j], s[j+1], cs[j], sn[j]);
-
-                    scalar_type inner_res = std::abs(s[j+1]);
-
-                    if (prm.verbose && iter % 5 == 0)
-                        std::cout << iter << "\t" << std::scientific << inner_res / norm_rhs << std::endl;
-
-                    // Check for termination
-                    ++j, ++iter;
-                    if (iter >= prm.maxiter || j >= M || inner_res <= eps)
-                        break;
-                }
-
-                // -- GMRES terminated: eval solution
-                for (unsigned i = j; i --> 0; ) {
-                    s[i] /= H(i, i);
-                    for (unsigned k = 0; k < i; ++k)
-                        s[k] -= H(k, i) * s[i];
-                }
-
-                vector &dx = *r;
-                backend::lin_comb(j, s, ws, zero, dx);
-
-                // -- Apply step
-                if (prm.pside == side::left) {
-                    backend::axpby(one, dx, one, x);
-                } else {
-                    vector &tmp = *ws[0];
-                    P.apply(dx, tmp);
-                    backend::axpby(one, tmp, one, x);
-                }
-
-                // -- Store LGMRES augmented vectors
-                scalar_type norm_dx = norm(dx);
-
-                if(prm.K > 0 && !math::is_zero(norm_dx)) {
-                    unsigned outer_slot = n_outer % prm.K;
-                    ++n_outer;
-
-                    norm_dx = math::inverse(norm_dx);
-                    backend::axpby(norm_dx, dx, zero, *outer_v_data[outer_slot]);
-                    outer_v.push_back(outer_v_data[outer_slot]);
-                }
-            }
-
-            return std::make_tuple(iter, norm_r / norm_rhs);
-        }
-
-        /* Computes the solution for the given right-hand side \p rhs. The
-         * system matrix is the same that was used for the setup of the
-         * preconditioner \p P.  Returns the number of iterations made and the
-         * achieved residual as a ``std::tuple``. The solution vector \p x
-         * provides initial approximation in input and holds the computed
-         * solution on output.
-         */
-        template <class Precond, class Vec1, class Vec2>
-        std::tuple<size_t, scalar_type> operator()(
-                Precond const &P,
-                Vec1    const &rhs,
-                Vec2          &x
-                ) const
-        {
-            return (*this)(P.system_matrix(), P, rhs, x);
-        }
-
-        size_t bytes() const {
-            size_t b = 0;
-
-            b += H.size() * sizeof(coef_type);
-            b += H0.size() * sizeof(coef_type);
-
-            b += backend::bytes(s);
-            b += backend::bytes(cs);
-            b += backend::bytes(sn);
-
-            b += backend::bytes(*r);
-
-            for(const auto &v : vs) b += backend::bytes(*v);
-
-            for(const auto &v : outer_v_data)  b += backend::bytes(*v);
-
-            return b;
-        }
-
-        friend std::ostream& operator<<(std::ostream &os, const lgmres &s) {
-            return os
-                << "Type:             LGMRES(" << s.prm.M << "," << s.prm.K << ")"
-                << "\nUnknowns:         " << s.n
-                << "\nMemory footprint: " << human_readable_memory(s.bytes())
-                << std::endl;
-        }
-    private:
-        size_t n, M;
-
-        mutable multi_array<coef_type, 2> H, H0;
-        mutable std::vector<coef_type> s, cs, sn;
-        std::shared_ptr<vector> r;
-        mutable std::vector< std::shared_ptr<vector> > vs, ws;
-        mutable std::vector< std::shared_ptr<vector> > outer_v_data;
-        mutable circular_buffer< std::shared_ptr<vector> > outer_v;
-
-
-        InnerProduct inner_product;
-
-
-        template <class Vec>
-        scalar_type norm(const Vec &x) const {
-            return std::abs(sqrt(inner_product(x, x)));
-        }
-};
-
-} // namespace solver
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/solver/precond_side.hpp b/src/solvers/amgcl/solver/precond_side.hpp
deleted file mode 100644
index a158ad0..0000000
--- a/src/solvers/amgcl/solver/precond_side.hpp
+++ /dev/null
@@ -1,100 +0,0 @@
-#ifndef AMGCL_SOLVER_PRECOND_SIDE_HPP
-#define AMGCL_SOLVER_PRECOND_SIDE_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/solver/precond_side.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Definitions and functions supporting left/right preconditioning.
- */
-
-#include <iostream>
-
-#include <amgcl/backend/interface.hpp>
-#include <amgcl/value_type/interface.hpp>
-
-namespace amgcl {
-namespace preconditioner {
-namespace side {
-
-enum type {
-    left,
-    right
-};
-
-inline std::ostream& operator<<(std::ostream &os, type p) {
-    switch (p) {
-        case left:
-            return os << "left";
-        case right:
-            return os << "right";
-        default:
-            return os << "???";
-    }
-}
-
-inline std::istream& operator>>(std::istream &in, type &p) {
-    std::string val;
-    in >> val;
-
-    if (val == "left")
-        p = left;
-    else if (val == "right")
-        p = right;
-    else
-        throw std::invalid_argument("Invalid preconditioning side. "
-                "Valid choices are: left, right.");
-
-    return in;
-}
-
-} // namespace side
-
-// Preconditioned matrix-vector product
-template <class Precond, class Matrix, class VecF, class VecX, class VecT>
-inline void spmv(side::type pside, const Precond &P, const Matrix &A,
-        const VecF &F, VecX &X, VecT &T)
-{
-    typedef typename backend::value_type<Matrix>::type value;
-    typedef typename math::scalar_of<value>::type scalar;
-
-    static const scalar one  = math::identity<scalar>();
-    static const scalar zero = math::zero<scalar>();
-
-    if (pside == side::left) {
-        backend::spmv(one, A, F, zero, T);
-        P.apply(T, X);
-    } else {
-        P.apply(F, T);
-        backend::spmv(one, A, T, zero, X);
-    }
-}
-
-} // namespace preconditioner
-} // namespace amgcl
-
-
-#endif
diff --git a/src/solvers/amgcl/solver/preonly.hpp b/src/solvers/amgcl/solver/preonly.hpp
deleted file mode 100644
index a569271..0000000
--- a/src/solvers/amgcl/solver/preonly.hpp
+++ /dev/null
@@ -1,141 +0,0 @@
-#ifndef AMGCL_SOLVER_PREONLY_HPP
-#define AMGCL_SOLVER_PREONLY_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/solver/preonly.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Only apply preconditioner once
- */
-
-#include <tuple>
-#include <amgcl/backend/interface.hpp>
-#include <amgcl/solver/detail/default_inner_product.hpp>
-#include <amgcl/util.hpp>
-
-namespace amgcl {
-
-/// Iterative solvers
-namespace solver {
-
-/**
- * \defgroup solvers
- * \brief Iterative solvers
- */
-
-/** Richardson iteration */
-template <
-    class Backend,
-    class InnerProduct = detail::default_inner_product
-    >
-class preonly {
-    public:
-        typedef Backend backend_type;
-
-        typedef typename Backend::vector     vector;
-        typedef typename Backend::value_type value_type;
-        typedef typename Backend::params     backend_params;
-
-        typedef typename math::scalar_of<value_type>::type scalar_type;
-
-        typedef typename math::inner_product_impl<
-            typename math::rhs_of<value_type>::type
-            >::return_type coef_type;
-
-        /// Solver parameters.
-        typedef amgcl::detail::empty_params params;
-
-        /// Preallocates necessary data structures for the system of size \p n.
-        preonly(
-                size_t n,
-                const params& = params(),
-                const backend_params& = backend_params(),
-                const InnerProduct &inner_product = InnerProduct()
-          ) : n(n), inner_product(inner_product)
-        { }
-
-        /* Computes the solution for the given system matrix \p A and the
-         * right-hand side \p rhs.  Returns the number of iterations made and
-         * the achieved residual as a ``std::tuple``. The solution vector
-         * \p x provides initial approximation in input and holds the computed
-         * solution on output.
-         *
-         * The system matrix may differ from the matrix used during
-         * initialization. This may be used for the solution of non-stationary
-         * problems with slowly changing coefficients. There is a strong chance
-         * that a preconditioner built for a time step will act as a reasonably
-         * good preconditioner for several subsequent time steps [DeSh12]_.
-         */
-        template <class Matrix, class Precond, class Vec1, class Vec2>
-        std::tuple<size_t, scalar_type> operator()(
-                const Matrix&, const Precond &P, const Vec1 &rhs, Vec2 &&x) const
-        {
-            P.apply(rhs, x);
-            return std::make_tuple(0, 0);
-        }
-
-        /* Computes the solution for the given right-hand side \p rhs. The
-         * system matrix is the same that was used for the setup of the
-         * preconditioner \p P.  Returns the number of iterations made and the
-         * achieved residual as a ``std::tuple``. The solution vector \p x
-         * provides initial approximation in input and holds the computed
-         * solution on output.
-         */
-        template <class Precond, class Vec1, class Vec2>
-        std::tuple<size_t, scalar_type> operator()(
-                const Precond &P, const Vec1 &rhs, Vec2 &&x) const
-        {
-            return (*this)(P.system_matrix(), P, rhs, x);
-        }
-
-        size_t bytes() const {
-            return 0;
-        }
-
-        friend std::ostream& operator<<(std::ostream &os, const preonly &s) {
-            return os
-                << "Type:             PreOnly"
-                << "\nUnknowns:         " << s.n
-                << "\nMemory footprint: " << human_readable_memory(s.bytes())
-                << std::endl;
-        }
-
-    private:
-        size_t n;
-
-        InnerProduct inner_product;
-
-        template <class Vec>
-        scalar_type norm(const Vec &x) const {
-            return sqrt(math::norm(inner_product(x, x)));
-        }
-};
-
-} // namespace solver
-} // namespace amgcl
-
-
-#endif
diff --git a/src/solvers/amgcl/solver/richardson.hpp b/src/solvers/amgcl/solver/richardson.hpp
deleted file mode 100644
index e86fe43..0000000
--- a/src/solvers/amgcl/solver/richardson.hpp
+++ /dev/null
@@ -1,230 +0,0 @@
-#ifndef AMGCL_SOLVER_RICHARDSON_HPP
-#define AMGCL_SOLVER_RICHARDSON_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/solver/richardson.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Richardson iteration
- */
-
-#include <tuple>
-#include <iostream>
-
-#include <amgcl/backend/interface.hpp>
-#include <amgcl/solver/detail/default_inner_product.hpp>
-#include <amgcl/util.hpp>
-
-namespace amgcl {
-
-/// Iterative solvers
-namespace solver {
-
-/**
- * \defgroup solvers
- * \brief Iterative solvers
- */
-
-/** Richardson iteration */
-template <
-    class Backend,
-    class InnerProduct = detail::default_inner_product
-    >
-class richardson {
-    public:
-        typedef Backend backend_type;
-
-        typedef typename Backend::vector     vector;
-        typedef typename Backend::value_type value_type;
-        typedef typename Backend::params     backend_params;
-
-        typedef typename math::scalar_of<value_type>::type scalar_type;
-
-        typedef typename math::inner_product_impl<
-            typename math::rhs_of<value_type>::type
-            >::return_type coef_type;
-
-        /// Solver parameters.
-        struct params {
-            /// Damping factor
-            scalar_type damping;
-
-            /// Maximum number of iterations.
-            size_t maxiter;
-
-            /// Target relative residual error.
-            scalar_type tol;
-
-            /// Target absolute residual error.
-            scalar_type abstol;
-
-            /// Ignore the trivial solution x=0 when rhs is zero.
-            //** Useful for searching for the null-space vectors of the system */
-            bool ns_search;
-
-            /// Verbose output (show iterations and error)
-            bool verbose;
-
-            params()
-                : damping(1.0), maxiter(100), tol(1e-8),
-                  abstol(std::numeric_limits<scalar_type>::min()),
-                  ns_search(false), verbose(false)
-            {}
-
-#ifndef AMGCL_NO_BOOST
-            params(const boost::property_tree::ptree &p)
-                : AMGCL_PARAMS_IMPORT_VALUE(p, damping),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, maxiter),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, tol),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, abstol),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, ns_search),
-                  AMGCL_PARAMS_IMPORT_VALUE(p, verbose)
-            {
-                check_params(p, {"damping", "maxiter", "tol", "abstol",
-                        "ns_search", "verbose"});
-            }
-
-            void get(boost::property_tree::ptree &p, const std::string &path) const {
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, damping);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, maxiter);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, tol);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, abstol);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, ns_search);
-                AMGCL_PARAMS_EXPORT_VALUE(p, path, verbose);
-            }
-#endif
-        };
-
-        /// Preallocates necessary data structures for the system of size \p n.
-        richardson(
-                size_t n,
-                const params &prm = params(),
-                const backend_params &backend_prm = backend_params(),
-                const InnerProduct &inner_product = InnerProduct()
-          ) : prm(prm), n(n),
-              r(Backend::create_vector(n, backend_prm)),
-              s(Backend::create_vector(n, backend_prm)),
-              inner_product(inner_product)
-        { }
-
-        /* Computes the solution for the given system matrix \p A and the
-         * right-hand side \p rhs.  Returns the number of iterations made and
-         * the achieved residual as a ``std::tuple``. The solution vector
-         * \p x provides initial approximation in input and holds the computed
-         * solution on output.
-         *
-         * The system matrix may differ from the matrix used during
-         * initialization. This may be used for the solution of non-stationary
-         * problems with slowly changing coefficients. There is a strong chance
-         * that a preconditioner built for a time step will act as a reasonably
-         * good preconditioner for several subsequent time steps [DeSh12]_.
-         */
-        template <class Matrix, class Precond, class Vec1, class Vec2>
-        std::tuple<size_t, scalar_type> operator()(
-                const Matrix &A, const Precond &P, const Vec1 &rhs, Vec2 &&x) const
-        {
-            static const coef_type one = math::identity<coef_type>();
-
-            ios_saver ss(std::cout);
-
-            scalar_type norm_rhs = norm(rhs);
-            if (norm_rhs < amgcl::detail::eps<scalar_type>(1)) {
-                if (prm.ns_search) {
-                    norm_rhs = math::identity<scalar_type>();
-                } else {
-                    backend::clear(x);
-                    return std::make_tuple(0, norm_rhs);
-                }
-            }
-
-            scalar_type eps = std::max(prm.tol * norm_rhs, prm.abstol);
-
-            backend::residual(rhs, A, x, *r);
-            scalar_type res_norm = norm(*r);
-
-            size_t iter = 0;
-            for(; iter < prm.maxiter && math::norm(res_norm) > eps; ++iter) {
-                P.apply(*r, *s);
-                backend::axpby( prm.damping, *s, one,  x);
-                backend::residual(rhs, A, x, *r);
-                res_norm = norm(*r);
-
-                if (prm.verbose && iter % 5 == 0)
-                    std::cout << iter << "\t" << std::scientific << res_norm / norm_rhs << std::endl;
-            }
-
-            return std::make_tuple(iter, res_norm / norm_rhs);
-        }
-
-        /* Computes the solution for the given right-hand side \p rhs. The
-         * system matrix is the same that was used for the setup of the
-         * preconditioner \p P.  Returns the number of iterations made and the
-         * achieved residual as a ``std::tuple``. The solution vector \p x
-         * provides initial approximation in input and holds the computed
-         * solution on output.
-         */
-        template <class Precond, class Vec1, class Vec2>
-        std::tuple<size_t, scalar_type> operator()(
-                const Precond &P, const Vec1 &rhs, Vec2 &&x) const
-        {
-            return (*this)(P.system_matrix(), P, rhs, x);
-        }
-
-        size_t bytes() const {
-            return
-                backend::bytes(*r) +
-                backend::bytes(*s);
-        }
-
-        friend std::ostream& operator<<(std::ostream &os, const richardson &s) {
-            return os
-                << "Type:             Richardson"
-                << "\nUnknowns:         " << s.n
-                << "\nMemory footprint: " << human_readable_memory(s.bytes())
-                << std::endl;
-        }
-    public:
-        params prm;
-
-    private:
-        size_t n;
-
-        std::shared_ptr<vector> r;
-        std::shared_ptr<vector> s;
-
-        InnerProduct inner_product;
-
-        template <class Vec>
-        scalar_type norm(const Vec &x) const {
-            return sqrt(math::norm(inner_product(x, x)));
-        }
-};
-
-} // namespace solver
-} // namespace amgcl
-
-
-#endif
diff --git a/src/solvers/amgcl/solver/runtime.hpp b/src/solvers/amgcl/solver/runtime.hpp
deleted file mode 100644
index 8b15907..0000000
--- a/src/solvers/amgcl/solver/runtime.hpp
+++ /dev/null
@@ -1,282 +0,0 @@
-#ifndef AMGCL_SOLVER_RUNTIME_HPP
-#define AMGCL_SOLVER_RUNTIME_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/solver/runtime.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Runtime-configurable wrappers around amgcl iterative solvers.
- */
-
-#include <iostream>
-#include <stdexcept>
-#include <type_traits>
-
-#ifdef AMGCL_NO_BOOST
-#  error Runtime interface relies on Boost.PropertyTree!
-#endif
-
-#include <boost/property_tree/ptree.hpp>
-
-#include <amgcl/util.hpp>
-#include <amgcl/solver/cg.hpp>
-#include <amgcl/solver/bicgstab.hpp>
-#include <amgcl/solver/bicgstabl.hpp>
-#include <amgcl/solver/gmres.hpp>
-#include <amgcl/solver/lgmres.hpp>
-#include <amgcl/solver/fgmres.hpp>
-#include <amgcl/solver/idrs.hpp>
-#include <amgcl/solver/richardson.hpp>
-#include <amgcl/solver/preonly.hpp>
-#include <amgcl/solver/detail/default_inner_product.hpp>
-
-namespace amgcl {
-namespace runtime {
-namespace solver {
-
-enum type {
-    cg,         ///< Conjugate gradients method
-    bicgstab,   ///< BiConjugate Gradient Stabilized
-    bicgstabl,  ///< BiCGStab(ell)
-    gmres,      ///< GMRES
-    lgmres,     ///< LGMRES
-    fgmres,     ///< FGMRES
-    idrs,       ///< IDR(s)
-    richardson, ///< Richardson iteration
-    preonly     ///< Only apply preconditioner once
-};
-
-inline std::ostream& operator<<(std::ostream &os, type s)
-{
-    switch (s) {
-        case cg:
-            return os << "cg";
-        case bicgstab:
-            return os << "bicgstab";
-        case bicgstabl:
-            return os << "bicgstabl";
-        case gmres:
-            return os << "gmres";
-        case lgmres:
-            return os << "lgmres";
-        case fgmres:
-            return os << "fgmres";
-        case idrs:
-            return os << "idrs";
-        case richardson:
-            return os << "richardson";
-        case preonly:
-            return os << "preonly";
-        default:
-            return os << "???";
-    }
-}
-
-inline std::istream& operator>>(std::istream &in, type &s)
-{
-    std::string val;
-    in >> val;
-
-    if (val == "cg")
-        s = cg;
-    else if (val == "bicgstab")
-        s = bicgstab;
-    else if (val == "bicgstabl")
-        s = bicgstabl;
-    else if (val == "gmres")
-        s = gmres;
-    else if (val == "lgmres")
-        s = lgmres;
-    else if (val == "fgmres")
-        s = fgmres;
-    else if (val == "idrs")
-        s = idrs;
-    else if (val == "richardson")
-        s = richardson;
-    else if (val == "preonly")
-        s = preonly;
-    else
-        throw std::invalid_argument("Invalid solver value. Valid choices are: "
-                "cg, bicgstab, bicgstabl, gmres, lgmres, fgmres, idrs, richardson, preonly.");
-
-    return in;
-}
-
-template <
-    class Backend,
-    class InnerProduct = amgcl::solver::detail::default_inner_product
-    >
-struct wrapper {
-    typedef boost::property_tree::ptree                params;
-    typedef typename Backend::params                   backend_params;
-    typedef typename Backend::value_type               value_type;
-    typedef typename math::scalar_of<value_type>::type scalar_type;
-    typedef Backend                                    backend_type;
-
-    type s;
-    void *handle;
-
-    wrapper(size_t n, params prm = params(),
-            const backend_params &bprm = backend_params(),
-            const InnerProduct &inner_product = InnerProduct()
-            )
-        : s(prm.get("type", runtime::solver::bicgstab)), handle(0)
-    {
-        if (!prm.erase("type")) AMGCL_PARAM_MISSING("type");
-
-        switch(s) {
-
-#define AMGCL_RUNTIME_SOLVER(type) \
-            case type: \
-                handle = static_cast<void*>(new amgcl::solver::type<Backend, InnerProduct>(n, prm, bprm, inner_product)); \
-                break
-
-            AMGCL_RUNTIME_SOLVER(cg);
-            AMGCL_RUNTIME_SOLVER(bicgstab);
-            AMGCL_RUNTIME_SOLVER(bicgstabl);
-            AMGCL_RUNTIME_SOLVER(gmres);
-            AMGCL_RUNTIME_SOLVER(lgmres);
-            AMGCL_RUNTIME_SOLVER(fgmres);
-            AMGCL_RUNTIME_SOLVER(idrs);
-            AMGCL_RUNTIME_SOLVER(richardson);
-            AMGCL_RUNTIME_SOLVER(preonly);
-
-#undef AMGCL_RUNTIME_SOLVER
-
-            default:
-                throw std::invalid_argument("Unsupported solver type");
-        }
-    }
-
-    ~wrapper() {
-        switch(s) {
-
-#define AMGCL_RUNTIME_SOLVER(type) \
-            case type: \
-                delete static_cast<amgcl::solver::type<Backend, InnerProduct>*>(handle); \
-                break
-
-            AMGCL_RUNTIME_SOLVER(cg);
-            AMGCL_RUNTIME_SOLVER(bicgstab);
-            AMGCL_RUNTIME_SOLVER(bicgstabl);
-            AMGCL_RUNTIME_SOLVER(gmres);
-            AMGCL_RUNTIME_SOLVER(lgmres);
-            AMGCL_RUNTIME_SOLVER(fgmres);
-            AMGCL_RUNTIME_SOLVER(idrs);
-            AMGCL_RUNTIME_SOLVER(richardson);
-            AMGCL_RUNTIME_SOLVER(preonly);
-
-#undef AMGCL_RUNTIME_SOLVER
-        }
-    }
-
-    template <class Matrix, class Precond, class Vec1, class Vec2>
-    std::tuple<size_t, scalar_type> operator()(
-            const Matrix &A, const Precond &P, const Vec1 &rhs, Vec2 &&x) const
-    {
-        switch(s) {
-
-#define AMGCL_RUNTIME_SOLVER(type) \
-            case type: \
-                return static_cast<amgcl::solver::type<Backend, InnerProduct>*>(handle)->operator()(A, P, rhs, x)
-
-            AMGCL_RUNTIME_SOLVER(cg);
-            AMGCL_RUNTIME_SOLVER(bicgstab);
-            AMGCL_RUNTIME_SOLVER(bicgstabl);
-            AMGCL_RUNTIME_SOLVER(gmres);
-            AMGCL_RUNTIME_SOLVER(lgmres);
-            AMGCL_RUNTIME_SOLVER(fgmres);
-            AMGCL_RUNTIME_SOLVER(idrs);
-            AMGCL_RUNTIME_SOLVER(richardson);
-            AMGCL_RUNTIME_SOLVER(preonly);
-
-#undef AMGCL_RUNTIME_SOLVER
-
-            default:
-                throw std::invalid_argument("Unsupported solver type");
-        }
-    }
-
-    template <class Precond, class Vec1, class Vec2>
-    std::tuple<size_t, scalar_type> operator()(
-            const Precond &P, const Vec1 &rhs, Vec2 &&x) const
-    {
-        return (*this)(P.system_matrix(), P, rhs, x);
-    }
-
-    friend std::ostream& operator<<(std::ostream &os, const wrapper &w) {
-        switch(w.s) {
-
-#define AMGCL_RUNTIME_SOLVER(type) \
-            case type: \
-                return os << *static_cast<amgcl::solver::type<Backend, InnerProduct>*>(w.handle)
-
-            AMGCL_RUNTIME_SOLVER(cg);
-            AMGCL_RUNTIME_SOLVER(bicgstab);
-            AMGCL_RUNTIME_SOLVER(bicgstabl);
-            AMGCL_RUNTIME_SOLVER(gmres);
-            AMGCL_RUNTIME_SOLVER(lgmres);
-            AMGCL_RUNTIME_SOLVER(fgmres);
-            AMGCL_RUNTIME_SOLVER(idrs);
-            AMGCL_RUNTIME_SOLVER(richardson);
-            AMGCL_RUNTIME_SOLVER(preonly);
-
-#undef AMGCL_RUNTIME_SOLVER
-
-            default:
-                throw std::invalid_argument("Unsupported solver type");
-        }
-    }
-
-    size_t bytes() const {
-        switch(s) {
-
-#define AMGCL_RUNTIME_SOLVER(type) \
-            case type: \
-                return backend::bytes(*static_cast<amgcl::solver::type<Backend, InnerProduct>*>(handle))
-
-            AMGCL_RUNTIME_SOLVER(cg);
-            AMGCL_RUNTIME_SOLVER(bicgstab);
-            AMGCL_RUNTIME_SOLVER(bicgstabl);
-            AMGCL_RUNTIME_SOLVER(gmres);
-            AMGCL_RUNTIME_SOLVER(lgmres);
-            AMGCL_RUNTIME_SOLVER(fgmres);
-            AMGCL_RUNTIME_SOLVER(idrs);
-            AMGCL_RUNTIME_SOLVER(richardson);
-            AMGCL_RUNTIME_SOLVER(preonly);
-
-#undef AMGCL_RUNTIME_SOLVER
-
-            default:
-                throw std::invalid_argument("Unsupported solver type");
-        }
-    }
-};
-
-} // namespace solver
-} // namespace runtime
-} // namespace amgcl
-#endif
diff --git a/src/solvers/amgcl/solver/skyline_lu.hpp b/src/solvers/amgcl/solver/skyline_lu.hpp
deleted file mode 100644
index 93da6f0..0000000
--- a/src/solvers/amgcl/solver/skyline_lu.hpp
+++ /dev/null
@@ -1,315 +0,0 @@
-#ifndef AMGCL_SOLVER_SKYLINE_LU_HPP
-#define AMGCL_SOLVER_SKYLINE_LU_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
-\file   amgcl/solver/skyline_lu.hpp
-\author Denis Demidov <dennis.demidov@gmail.com>
-\brief  Skyline LU factorization solver.
-
-The code is adopted from Kratos project http://www.cimne.com/kratos. The
-original code came with the following copyright notice:
-\verbatim
-Kratos Multi-Physics
-
-Copyright (c) 2012, Pooyan Dadvand, Riccardo Rossi, CIMNE (International Center for Numerical Methods in Engineering)
-All rights reserved.
-
-Redistribution and use in source and binary forms, with or without
-modification, are permitted provided that the following conditions are met:
-
-    Redistributions of source code must retain the above copyright notice, this
-    list of conditions and the following disclaimer.
-    Redistributions in binary form must reproduce the above copyright notice,
-    this list of conditions and the following disclaimer in the documentation
-    and/or other materials provided with the distribution.
-    All advertising materials mentioning features or use of this software must
-    display the following acknowledgement:
-    This product includes Kratos Multi-Physics technology.
-    Neither the name of the CIMNE nor the names of its contributors may be used
-    to endorse or promote products derived from this software without specific
-    prior written permission.
-
-THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS ''AS IS'' AND ANY EXPRESS OR
-IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO
-EVENT SHALL THE COPYRIGHT HOLDERS BE LIABLE FOR ANY DIRECT, INDIRECT,
-INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
-LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
-PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED ANDON ANY THEORY OF
-LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT(INCLUDING NEGLIGENCE
-OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THISSOFTWARE, EVEN IF
-ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-\endverbatim
-*/
-
-#include <vector>
-#include <algorithm>
-
-#include <amgcl/backend/interface.hpp>
-#include <amgcl/value_type/interface.hpp>
-#include <amgcl/reorder/cuthill_mckee.hpp>
-#include <amgcl/util.hpp>
-
-namespace amgcl {
-namespace solver {
-
-/// Direct solver that uses skyline LU factorization.
-template <
-    typename ValueType,
-    class ordering = reorder::cuthill_mckee<false>
-    >
-class skyline_lu {
-    public:
-        typedef ValueType value_type;
-        typedef typename math::scalar_of<value_type>::type scalar_type;
-        typedef typename math::rhs_of<value_type>::type    rhs_type;
-
-        typedef amgcl::detail::empty_params params;
-
-        static size_t coarse_enough() {
-            return 3000 / math::static_rows<value_type>::value;
-        }
-
-        template <class Matrix>
-        skyline_lu(const Matrix &A, const params& = params())
-            : n( backend::rows(A) ), perm(n), ptr(n + 1, 0), D(n, math::zero<value_type>()), y(n)
-        {
-            // Find the permutation for the ordering.
-            ordering::get(A, perm);
-
-            // Get inverse permutation
-            std::vector<int> invperm(n);
-            for(int i = 0; i < n; ++i) invperm[perm[i]] = i;
-
-            /* Let us find how large the rows of L and the columns of U should
-             * be.  Provisionally, we will store in ptr[i] the minimum required
-             * height of column i over the diagonal, and length of row i below
-             * the diagonal.  The value(i,j) in the reordered matrix will be
-             * the same as the value(perm[i],perm[j]) in the original matrix;
-             * or, the value(i,j) in the original matrix will be the same as
-             * value(invperm[i],invperm[j]) in the reordered matrix.
-             */
-
-            // Traverse the matrix finding nonzero elements
-            for(int i = 0; i < n; ++i) {
-                for(auto a = backend::row_begin(A, i); a; ++a) {
-                    int  j = a.col();
-                    value_type v = a.value();
-
-                    int newi = invperm[i];
-                    int newj = invperm[j];
-
-                    if (!math::is_zero(v)) {
-                        if (newi > newj) {
-                            // row newi needs length at least newi - newj
-                            if (ptr[newi] < newi - newj) ptr[newi]= newi - newj;
-                        } else if (newi < newj) {
-                            // column newj needs height at least newj - newi
-                            if (ptr[newj] < newj - newi) ptr[newj]= newj - newi;
-                        }
-                    }
-                }
-            }
-
-            // Transform ptr so that it doesn't contain the required lengths
-            // and heights, but the indexes to the entries
-            {
-                int last = 0;
-                for(int i = 1; i <= n; ++i) {
-                    int tmp = ptr[i];
-                    ptr[i] = ptr[i-1] + last;
-                    last = tmp;
-                }
-            }
-
-            // Allocate variables for skyline format entries
-            L.resize(ptr.back(), math::zero<value_type>());
-            U.resize(ptr.back(), math::zero<value_type>());
-
-            // And finally traverse again the CSR matrix, copying its entries
-            // into the correct places in the skyline format
-            for(int i = 0; i < n; ++i) {
-                for(auto a = backend::row_begin(A, i); a; ++a) {
-                    int  j = a.col();
-                    value_type v = a.value();
-
-                    int newi = invperm[i];
-                    int newj = invperm[j];
-
-                    if (!math::is_zero(v)) {
-                        if (newi < newj) {
-                            U[ ptr[newj + 1] + newi - newj ] = v;
-                        } else if (newi == newj) {
-                            D[newi] = v;
-                        } else /* newi > newj */ {
-                            L[ ptr[newi + 1] + newj - newi ] = v;
-                        }
-                    }
-                }
-            }
-
-            factorize();
-        }
-
-        template <class Vec1, class Vec2>
-        void operator()(const Vec1 &rhs, Vec2 &x) const {
-            // y = L^-1 * perm[rhs] ;
-            // y = U^-1 * y ;
-            // x = invperm[y];
-
-            for(int i = 0; i < n; ++i) {
-                rhs_type sum;
-                sum = rhs[perm[i]];
-                for(int k = ptr[i], j = i - ptr[i+1] + k; k < ptr[i+1]; ++k, ++j)
-                    sum -= L[k] * y[j];
-
-                y[i] = D[i] * sum;
-            }
-
-            for(int j = n - 1; j >= 0; --j) {
-                for(int k = ptr[j], i = j - ptr[j+1] + k; k < ptr[j+1]; ++k, ++i)
-                    y[i] -= U[k] * y[j];
-
-            }
-
-            for(int i = 0; i < n; ++i) x[perm[i]] = y[i];
-        }
-
-        size_t bytes() const {
-            return
-                backend::bytes(perm) +
-                backend::bytes(ptr) +
-                backend::bytes(L) +
-                backend::bytes(U) +
-                backend::bytes(D);
-        }
-    private:
-        int n;
-        std::vector<int> perm;
-        std::vector<int> ptr;
-        std::vector<value_type> L;
-        std::vector<value_type> U;
-        std::vector<value_type> D;
-
-        mutable std::vector<rhs_type> y;
-
-        /*
-         * Perform and in-place LU factorization of a skyline matrix by Crout's
-         * algorithm. The diagonal of U contains the 1's.
-         * The equivalent MATLAB code for a full matrix would be:
-         * for k=1:n-1
-         *   A(1,k+1)=A(1,k+1)/A(1,1);
-         *   for i=2:k
-         *     sum=A(i,k+1);
-         *       for j=1:i-1
-         *         sum=sum-A(i,j)*A(j,k+1);
-         *       end;
-         *       A(i,k+1)=sum/A(i,i);
-         *   end
-         *   for i=2:k
-         *     sum=A(k+1,i);
-         *     for j=1:i-1
-         *       sum=sum-A(j,i)*A(k+1,j);
-         *     end;
-         *     A(k+1,i)=sum;
-         *   end
-         *   sum=A(k+1,k+1);
-         *   for i=1:k
-         *     sum=sum-A(k+1,i)*A(i,k+1);
-         *   end
-         *   A(k+1,k+1)=sum;
-         * end
-         */
-        void factorize() {
-            precondition(!math::is_zero(D[0]), "Zero diagonal in skyline_lu");
-            D[0] = math::inverse(D[0]);
-
-            for(int k = 0; k < n - 1; ++k) {
-                // check whether A(1,k+1) lies within the skyline structure
-                if (ptr[k + 1] + k + 1 == ptr[k + 2]) {
-                    U[ptr[k+1]] = D[0] * U[ptr[k+1]];
-                }
-
-                // Compute column k+1 of U
-                int indexEntry = ptr[k + 1];
-                int iBeginCol  = k + 1 - ptr[k + 2] + ptr[k + 1];
-                for(int i = iBeginCol; i <= k; ++indexEntry, ++i) {
-                    if (i == 0) continue;
-
-                    value_type sum = U[indexEntry]; // this is element U(i,k+1)
-
-                    // Multiply row i of L and Column k+1 of U
-                    int jBeginRow  = i - ptr[i + 1] + ptr[i];
-                    int jBeginMult = std::max(iBeginCol, jBeginRow);
-
-                    int indexL = ptr[i  ] + jBeginMult - jBeginRow;
-                    int indexU = ptr[k+1] + jBeginMult - iBeginCol;
-                    for(int j = jBeginMult; j < i; ++j, ++indexL, ++indexU)
-                        sum -= L[indexL] * U[indexU];
-
-                    U[indexEntry] = D[i] * sum;
-                }
-
-                // Compute row k+1 of L
-                indexEntry = ptr[k+1];
-                int jBeginRow = k + 1 - ptr[k + 2] + ptr[k + 1];
-                for(int i = iBeginCol; i <= k; ++indexEntry, ++i) {
-                    if (i == 0) continue;
-
-                    value_type sum = L[indexEntry]; // this is the element L(k+1,i)
-
-                    // Multiply row k+1 of L and column i of U
-                    int jBeginCol  = i - ptr[i+1] + ptr[i];
-                    int jBeginMult = std::max(jBeginCol, jBeginRow);
-
-                    int indexL = ptr[k+1] + jBeginMult - jBeginRow;
-                    int indexU = ptr[i  ] + jBeginMult - jBeginCol;
-
-                    for(int j = jBeginMult; j < i; ++j, ++indexL, ++indexU)
-                        sum -= L[indexL] * U[indexU];
-
-                    L[indexEntry] = sum;
-                }
-
-                // Find element in diagonal
-                value_type sum = D[k+1];
-                for(int j = ptr[k+1]; j < ptr[k+2]; ++j)
-                    sum -= L[j] * U[j];
-
-                precondition(!math::is_zero(sum),
-                        "Zero sum in skyline_lu factorization");
-
-                D[k+1] = math::inverse(sum);
-            }
-        }
-};
-
-} // namespace solver
-} // namespace amgcl
-
-
-#endif
diff --git a/src/solvers/amgcl/util.hpp b/src/solvers/amgcl/util.hpp
deleted file mode 100644
index 28c3dab..0000000
--- a/src/solvers/amgcl/util.hpp
+++ /dev/null
@@ -1,425 +0,0 @@
-#ifndef AMGCL_UTIL_HPP
-#define AMGCL_UTIL_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/util.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Various utilities.
- */
-
-#include <iostream>
-#include <iomanip>
-#include <iterator>
-#include <vector>
-#include <array>
-#include <string>
-#include <set>
-#include <complex>
-#include <limits>
-#include <stdexcept>
-#include <cstddef>
-
-// If asked explicitly, or if boost is available, enable
-// using boost::propert_tree::ptree as amgcl parameters:
-#ifndef AMGCL_NO_BOOST
-#  include <boost/property_tree/ptree.hpp>
-#endif
-
-#include <amgcl/io/ios_saver.hpp>
-
-/* Performance measurement macros
- *
- * If AMGCL_PROFILING macro is defined at compilation, then AMGCL_TIC(name) and
- * AMGCL_TOC(name) macros correspond to prof.tic(name) and prof.toc(name).
- * amgcl::prof should be an instance of amgcl::profiler<> defined in a user
- * code similar to:
- * \code
- * namespace amgcl { profiler<> prof; }
- * \endcode
- * If AMGCL_PROFILING is undefined, then AMGCL_TIC and AMGCL_TOC are noop macros.
- */
-#ifdef AMGCL_PROFILING
-#  if !defined(AMGCL_TIC) || !defined(AMGCL_TOC)
-#    include <amgcl/profiler.hpp>
-#    define AMGCL_TIC(name) amgcl::prof.tic(name);
-#    define AMGCL_TOC(name) amgcl::prof.toc(name);
-namespace amgcl { extern profiler<> prof; }
-#  endif
-#else
-#  ifndef AMGCL_TIC
-#    define AMGCL_TIC(name)
-#  endif
-#  ifndef AMGCL_TOC
-#    define AMGCL_TOC(name)
-#  endif
-#endif
-
-#define AMGCL_DEBUG_SHOW(x)                                                    \
-    std::cout << std::setw(20) << #x << ": "                                   \
-              << std::setw(15) << std::setprecision(8) << std::scientific      \
-              << (x) << std::endl
-
-namespace amgcl {
-
-/// Throws \p message if \p condition is not true.
-template <class Condition, class Message>
-void precondition(const Condition &condition, const Message &message) {
-#ifdef _MSC_VER
-#  pragma warning(push)
-#  pragma warning(disable: 4800)
-#endif
-    if (!condition) throw std::runtime_error(message);
-#ifdef _MSC_VER
-#  pragma warning(pop)
-#endif
-}
-
-#ifndef AMGCL_NO_BOOST
-
-#define AMGCL_PARAMS_IMPORT_VALUE(p, name)                                     \
-    name( p.get(#name, params().name) )
-
-#define AMGCL_PARAMS_IMPORT_CHILD(p, name)                                     \
-    name( p.get_child(#name, amgcl::detail::empty_ptree()) )
-
-#define AMGCL_PARAMS_EXPORT_VALUE(p, path, name)                               \
-    p.put(std::string(path) + #name, name)
-
-namespace detail {
-
-template <typename T>
-inline void params_export_child(
-        boost::property_tree::ptree &p,
-        const std::string &path,
-        const char *name, const T &obj)
-{
-    obj.get(p, std::string(path) + name + ".");
-}
-
-template <>
-inline void params_export_child(
-        boost::property_tree::ptree &p,
-        const std::string &path, const char *name,
-        const boost::property_tree::ptree &obj)
-{
-    p.add_child(std::string(path) + name, obj);
-}
-
-} // namespace detail
-
-#define AMGCL_PARAMS_EXPORT_CHILD(p, path, name)                               \
-    amgcl::detail::params_export_child(p, path, #name, name)
-
-// Missing parameter action
-#ifndef AMGCL_PARAM_MISSING
-#  define AMGCL_PARAM_MISSING(name) (void)0
-#endif
-
-// Unknown parameter action
-#ifndef AMGCL_PARAM_UNKNOWN
-#  define AMGCL_PARAM_UNKNOWN(name)                                            \
-      std::cerr << "AMGCL WARNING: unknown parameter " << name << std::endl
-#endif
-
-inline void check_params(
-        const boost::property_tree::ptree &p,
-        const std::set<std::string> &names
-        )
-{
-    for(const auto &n : names) {
-        if (!p.count(n)) {
-            AMGCL_PARAM_MISSING(n);
-        }
-    }
-    for(const auto &v : p) {
-        if (!names.count(v.first)) {
-            AMGCL_PARAM_UNKNOWN(v.first);
-        }
-    }
-}
-
-inline void check_params(
-        const boost::property_tree::ptree &p,
-        const std::set<std::string> &names,
-        const std::set<std::string> &opt_names
-        )
-{
-    for(const auto &n : names) {
-        if (!p.count(n)) {
-            AMGCL_PARAM_MISSING(n);
-        }
-    }
-    for(const auto &n : opt_names) {
-        if (!p.count(n)) {
-            AMGCL_PARAM_MISSING(n);
-        }
-    }
-    for(const auto &v : p) {
-        if (!names.count(v.first) && !opt_names.count(v.first)) {
-            AMGCL_PARAM_UNKNOWN(v.first);
-        }
-    }
-}
-
-// Put parameter in form "key=value" into a boost::property_tree::ptree
-inline void put(boost::property_tree::ptree &p, const std::string &param) {
-    size_t eq_pos = param.find('=');
-    if (eq_pos == std::string::npos)
-        throw std::invalid_argument("param in amgcl::put() should have \"key=value\" format!");
-    p.put(param.substr(0, eq_pos), param.substr(eq_pos + 1));
-}
-
-#endif
-
-namespace detail {
-
-#ifndef AMGCL_NO_BOOST
-inline const boost::property_tree::ptree& empty_ptree() {
-    static const boost::property_tree::ptree p;
-    return p;
-}
-#endif
-
-struct empty_params {
-    empty_params() {}
-
-#ifndef AMGCL_NO_BOOST
-    empty_params(const boost::property_tree::ptree &p) {
-        for(const auto &v : p) {
-            AMGCL_PARAM_UNKNOWN(v.first);
-        }
-    }
-    void get(boost::property_tree::ptree&, const std::string&) const {}
-#endif
-};
-
-} // namespace detail
-
-// Iterator range
-template <class Iterator>
-class iterator_range {
-    public:
-        typedef Iterator iterator;
-        typedef Iterator const_iterator;
-        typedef typename std::iterator_traits<Iterator>::value_type value_type;
-        typedef typename std::iterator_traits<Iterator>::reference reference;
-
-        iterator_range(Iterator b, Iterator e)
-            : b(b), e(e) {}
-
-        ptrdiff_t size() const {
-            return std::distance(b, e);
-        }
-
-        Iterator begin() const {
-            return b;
-        }
-
-        Iterator end() const {
-            return e;
-        }
-
-        reference operator[](size_t i) const {
-            return b[i];
-        }
-    private:
-        Iterator b, e;
-};
-
-template <class Iterator>
-iterator_range<Iterator> make_iterator_range(Iterator b, Iterator e) {
-    return iterator_range<Iterator>(b, e);
-}
-
-// N-dimensional dense matrix
-template <class T, int N>
-class multi_array {
-    static_assert(N > 0, "Wrong number of dimensions");
-
-    public:
-        template <class... I>
-        multi_array(I... n) {
-            static_assert(sizeof...(I) == N, "Wrong number of dimensions");
-            buf.resize(init(n...));
-        }
-
-        size_t size() const {
-            return buf.size();
-        }
-
-        int stride(int i) const {
-            return strides[i];
-        }
-
-        template <class... I>
-        T operator()(I... i) const {
-            static_assert(sizeof...(I) == N, "Wrong number of indices");
-            return buf[index(i...)];
-        }
-
-        template <class... I>
-        T& operator()(I... i) {
-            static_assert(sizeof...(I) == N, "Wrong number of indices");
-            return buf[index(i...)];
-        }
-
-        const T* data() const {
-            return buf.data();
-        }
-
-        T* data() {
-            return buf.data();
-        }
-    private:
-        std::array<int, N> strides;
-        std::vector<T>  buf;
-
-        template <class... I>
-        int index(int i, I... tail) const {
-            return strides[N - sizeof...(I) - 1] * i + index(tail...);
-        }
-
-        int index(int i) const {
-            return strides[N-1] * i;
-        }
-
-        template <class... I>
-        int init(int i, I... tail) {
-            int size = init(tail...);
-            strides[N - sizeof...(I) - 1] = size;
-            return i * size;
-        }
-
-        int init(int i) {
-            strides[N-1] = 1;
-            return i;
-        }
-};
-
-template <class T>
-class circular_buffer {
-    public:
-        circular_buffer(size_t n) : start(0) {
-            buf.reserve(n);
-        }
-
-        size_t size() const {
-            return buf.size();
-        }
-
-        void push_back(const T &v) {
-            if (buf.size() < buf.capacity()) {
-                buf.push_back(v);
-            } else {
-                buf[start] = v;
-                start = (start + 1) % buf.capacity();
-            }
-        }
-
-        const T& operator[](size_t i) const {
-            return buf[(start + i) % buf.capacity()];
-        }
-
-        T& operator[](size_t i) {
-            return buf[(start + i) % buf.capacity()];
-        }
-
-        void clear() {
-            buf.clear();
-            start = 0;
-        }
-
-    private:
-        size_t start;
-        std::vector<T> buf;
-};
-
-
-namespace detail {
-
-template <class T>
-T eps(size_t n) {
-    return 2 * std::numeric_limits<T>::epsilon() * n;
-}
-
-} // namespace detail
-
-template <class T> struct is_complex : std::false_type {};
-template <class T> struct is_complex< std::complex<T> > : std::true_type {};
-
-inline std::string human_readable_memory(size_t bytes) {
-    static const char *suffix[] = {"B", "K", "M", "G", "T"};
-
-    int i = 0;
-    double m = static_cast<double>(bytes);
-    for(; i < 4 && m >= 1024.0; ++i, m /= 1024.0);
-
-    std::ostringstream s;
-    s << std::fixed << std::setprecision(2) << m << " " << suffix[i];
-    return s.str();
-}
-
-namespace detail {
-
-class non_copyable {
-    protected:
-        non_copyable() = default;
-        ~non_copyable() = default;
-
-        non_copyable(non_copyable const &) = delete;
-        void operator=(non_copyable const &x) = delete;
-};
-
-} // namespace detail
-
-namespace error {
-
-struct empty_level {};
-
-} // namespace error
-} // namespace amgcl
-
-namespace std {
-
-// Read pointers from input streams.
-// This allows to exchange pointers through boost::property_tree::ptree.
-template <class T>
-inline istream& operator>>(istream &is, T* &ptr) {
-    amgcl::ios_saver ss(is);
-
-    size_t val;
-    is >> std::hex >> val;
-
-    ptr = reinterpret_cast<T*>(val);
-
-    return is;
-}
-
-} // namespace std
-
-
-#endif
diff --git a/src/solvers/amgcl/value_type/complex.hpp b/src/solvers/amgcl/value_type/complex.hpp
deleted file mode 100644
index 0f9f933..0000000
--- a/src/solvers/amgcl/value_type/complex.hpp
+++ /dev/null
@@ -1,103 +0,0 @@
-#ifndef AMGCL_VALUE_TYPE_COMPLEX_HPP
-#define AMGCL_VALUE_TYPE_COMPLEX_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2015 Christoph Sohrmann
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/value_type/complex.hpp
- * \author Christoph Sohrmann
- * \brief  Enable std::complex<T> as value type.
- */
-
-#include <amgcl/backend/builtin.hpp>
-#include <amgcl/value_type/interface.hpp>
-
-namespace amgcl {
-namespace backend {
-
-/// Enable std::complex as a value-type.
-template <typename T>
-struct is_builtin_vector< std::vector<std::complex<T> > > : std::true_type {};
-
-} // namespace backend
-
-namespace math {
-
-/// Specialization that extracts the scalar type of a complex type.
-template <class T>
-struct scalar_of< std::complex<T> > {
-    typedef T type;
-};
-
-/// Replace scalar type in the complex type.
-template <class T, class S>
-struct replace_scalar<std::complex<T>, S> {
-    typedef std::complex<S> type;
-};
-
-/// Specialization of conjugate transpose for scalar complex arguments.
-template <typename T>
-struct adjoint_impl< std::complex<T> >
-{
-    typedef std::complex<T> return_type;
-
-    static std::complex<T> get(std::complex<T> x) {
-        return std::conj(x);
-    }
-};
-
-/// Default implementation for inner product
-/** \note Used in adjoint() */
-template <typename T>
-struct inner_product_impl< std::complex<T> > {
-    typedef std::complex<T> return_type;
-
-    static return_type get(std::complex<T> x, std::complex<T> y) {
-        return x * std::conj(y);
-    }
-};
-
-/// Specialization of constant element for complex type.
-template <typename T>
-struct constant_impl< std::complex<T> >
-{
-    static std::complex<T> get(T c) {
-        return std::complex<T>(c, c);
-    }
-};
-
-}  // namespace math
-} // namespace amgcl
-
-namespace std {
-
-template <typename V>
-bool operator<(const std::complex<V> &a, const std::complex<V> &b) {
-    return std::abs(a) < std::abs(b);
-}
-
-} // namespace std
-
-#endif /* ENABLE_COMPLEX_HPP */
diff --git a/src/solvers/amgcl/value_type/eigen.hpp b/src/solvers/amgcl/value_type/eigen.hpp
deleted file mode 100644
index 212c777..0000000
--- a/src/solvers/amgcl/value_type/eigen.hpp
+++ /dev/null
@@ -1,184 +0,0 @@
-#ifndef AMGCL_VALUE_TYPE_EIGEN_HPP
-#define AMGCL_VALUE_TYPE_EIGEN_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/value_type/eigen.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Enable statically sized eigen matrices as value types.
- */
-
-#include <Eigen/Dense>
-
-#include <amgcl/backend/builtin.hpp>
-#include <amgcl/value_type/interface.hpp>
-
-namespace amgcl {
-namespace backend {
-
-/// Enable Eigen matrix as a value-type.
-template <typename T, int N, int M>
-struct is_builtin_vector< std::vector<Eigen::Matrix<T, N, M> > > : std::true_type {};
-
-} // namespace backend
-
-namespace math {
-
-/// Scalar type of a non-scalar type.
-template <class T, int N, int M>
-struct scalar_of< Eigen::Matrix<T, N, M> > {
-    typedef typename math::scalar_of<T>::type type;
-};
-
-/// Replace scalar type in the static matrix
-template <class T, int N, int M, class S>
-struct replace_scalar< Eigen::Matrix<T, N, M>, S> {
-    typedef Eigen::Matrix<S, N, M> type;
-};
-
-/// RHS type corresponding to a non-scalar type.
-template <class T, int N>
-struct rhs_of< Eigen::Matrix<T, N, N> > {
-    typedef Eigen::Matrix<T, N, 1> type;
-};
-
-/// Element type of a non-scalar type
-template <class T, int N, int M>
-struct element_of< Eigen::Matrix<T, N, M> > {
-    typedef T type;
-};
-
-/// Whether the value type is a statically sized matrix.
-template <class T, int N, int M>
-struct is_static_matrix< Eigen::Matrix<T, N, M> > : std::true_type {};
-
-/// Number of rows for statically sized matrix types.
-template <class T, int N, int M>
-struct static_rows< Eigen::Matrix<T, N, M> > : std::integral_constant<int, N> {};
-
-/// Number of columns for statically sized matrix types.
-template <class T, int N, int M>
-struct static_cols< Eigen::Matrix<T, N, M> > : std::integral_constant<int, M> {};
-
-/// Specialization of conjugate transpose for eigen matrices.
-template <typename T, int N, int M>
-struct adjoint_impl< Eigen::Matrix<T, N, M> >
-{
-    typedef typename Eigen::Matrix<T, N, M>::AdjointReturnType return_type;
-
-    static return_type get(const Eigen::Matrix<T, N, M> &x) {
-        return x.adjoint();
-    }
-};
-
-/// Inner-product result of two Eigen vectors.
-template <class T, int N>
-struct inner_product_impl< Eigen::Matrix<T, N, 1> >
-{
-    typedef T return_type;
-    static T get(const Eigen::Matrix<T, N, 1> &x, const Eigen::Matrix<T, N, 1> &y) {
-        return x.adjoint() * y;
-    }
-};
-
-/// Inner-product result of two Eigen matrices.
-template <class T, int N, int M>
-struct inner_product_impl< Eigen::Matrix<T, N, M> >
-{
-    typedef Eigen::Matrix<T, M, M> return_type;
-
-    static return_type get(const Eigen::Matrix<T, N, M> &x, const Eigen::Matrix<T, N, M> &y) {
-        return x.adjoint() * y;
-    }
-};
-
-/// Specialization of element norm for eigen matrices.
-template <typename T, int N, int M>
-struct norm_impl< Eigen::Matrix<T, N, M> >
-{
-    static typename math::scalar_of<T>::type get(const Eigen::Matrix<T, N, M> &x) {
-        return x.norm();
-    }
-};
-
-/// Specialization of zero element for eigen matrices.
-template <typename T, int N, int M>
-struct zero_impl< Eigen::Matrix<T, N, M> >
-{
-    static Eigen::Matrix<T, N, M> get() {
-        return Eigen::Matrix<T, N, M>::Zero();
-    }
-};
-
-/// Specialization of zero element for eigen matrices.
-template <typename T, int N, int M>
-struct is_zero_impl< Eigen::Matrix<T, N, M> >
-{
-    static bool get(const Eigen::Matrix<T, N, M> &x) {
-        return x.isZero();
-    }
-};
-
-/// Specialization of identity for eigen matrices.
-template <typename T, int N>
-struct identity_impl< Eigen::Matrix<T, N, N> >
-{
-    static Eigen::Matrix<T, N, N> get() {
-        return Eigen::Matrix<T, N, N>::Identity();
-    }
-};
-
-/// Specialization of constant for eigen matrices.
-template <typename T, int N, int M>
-struct constant_impl< Eigen::Matrix<T, N, M> >
-{
-    static Eigen::Matrix<T, N, M> get(T c) {
-        return Eigen::Matrix<T, N, M>::Constant(c);
-    }
-};
-
-/// Specialization of inversion for eigen matrices.
-template <typename T, int N>
-struct inverse_impl< Eigen::Matrix<T, N, N> >
-{
-    static Eigen::Matrix<T, N, N> get(const Eigen::Matrix<T, N, N> &x) {
-        return x.inverse();
-    }
-};
-
-} // namespace math
-} // namespace amgcl
-
-namespace Eigen {
-
-template <class A, class B>
-bool operator<(const MatrixBase<A> &a, const MatrixBase<B> &b) {
-    return a.trace() < b.trace();
-}
-
-} // namespace Eigen
-
-#endif
diff --git a/src/solvers/amgcl/value_type/interface.hpp b/src/solvers/amgcl/value_type/interface.hpp
deleted file mode 100644
index 7b57e35..0000000
--- a/src/solvers/amgcl/value_type/interface.hpp
+++ /dev/null
@@ -1,205 +0,0 @@
-#ifndef AMGCL_VALUE_TYPE_INTERFACE_HPP
-#define AMGCL_VALUE_TYPE_INTERFACE_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/value_type/interface.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Support for various value types.
- */
-
-#include <type_traits>
-
-namespace amgcl {
-namespace math {
-
-/// Scalar type of a non-scalar type.
-template <class T, class Enable = void>
-struct scalar_of {
-    typedef T type;
-};
-
-/// RHS type corresponding to a non-scalar type.
-template <class T, class Enable = void>
-struct rhs_of {
-    typedef T type;
-};
-
-/// Element type of a non-scalar type
-template <class T, class Enable = void>
-struct element_of {
-    typedef T type;
-};
-
-/// Replace scalar type in the static matrix
-template<class T, class S, class Enable = void>
-struct replace_scalar {
-    typedef S type;
-};
-
-/// Whether the value type is a statically sized matrix.
-template <class T, class Enable = void>
-struct is_static_matrix : std::false_type {};
-
-/// Number of rows for statically sized matrix types.
-template <class T, class Enable = void>
-struct static_rows : std::integral_constant<int, 1> {};
-
-/// Number of columns for statically sized matrix types.
-template <class T, class Enable = void>
-struct static_cols : std::integral_constant<int, 1> {};
-
-
-/// Default implementation for conjugate transpose.
-/** \note Used in adjoint() */
-template <typename ValueType, class Enable = void>
-struct adjoint_impl {
-    typedef ValueType return_type;
-
-    static ValueType get(ValueType x) {
-        return x;
-    }
-};
-
-/// Default implementation for inner product
-/** \note Used in inner_product() */
-template <typename ValueType, class Enable = void>
-struct inner_product_impl {
-    typedef ValueType return_type;
-
-    static return_type get(ValueType x, ValueType y) {
-        return x * y;
-    }
-};
-
-/// Default implementation for element norm.
-/** \note Used in zero() */
-template <typename ValueType, class Enable = void>
-struct norm_impl {
-    static typename scalar_of<ValueType>::type get(ValueType x) {
-        return std::abs(x);
-    }
-};
-
-/// Default implementation for the zero element.
-/** \note Used in zero() */
-template <typename ValueType, class Enable = void>
-struct zero_impl {
-    static ValueType get() {
-        return static_cast<ValueType>(0);
-    }
-};
-
-/// Default implementation for zero check.
-/** \note Used in is_zero() */
-template <typename ValueType, class Enable = void>
-struct is_zero_impl {
-    static bool get(const ValueType &x) {
-        return x == zero_impl<ValueType>::get();
-    }
-};
-
-/// Default implementation for the identity element.
-/** \note Used in identity() */
-template <typename ValueType, class Enable = void>
-struct identity_impl {
-    static ValueType get() {
-        return static_cast<ValueType>(1);
-    }
-};
-
-/// Default implementation for the constant element.
-/** \note Used in constant() */
-template <typename ValueType, class Enable = void>
-struct constant_impl {
-    static ValueType get(typename scalar_of<ValueType>::type c) {
-        return static_cast<ValueType>(c);
-    }
-};
-
-/// Default implementation of inversion operation.
-/** \note Used in inverse() */
-template <typename ValueType, class Enable = void>
-struct inverse_impl {
-    static ValueType get(const ValueType &x) {
-        return identity_impl<ValueType>::get() / x;
-    }
-};
-
-/// Return conjugate transpose of argument.
-template <typename ValueType>
-typename adjoint_impl<ValueType>::return_type
-adjoint(ValueType x) {
-    return adjoint_impl<ValueType>::get(x);
-}
-
-/// Return inner product of two arguments.
-template <typename ValueType>
-typename inner_product_impl<ValueType>::return_type
-inner_product(ValueType x, ValueType y) {
-    return inner_product_impl<ValueType>::get(x, y);
-}
-
-/// Compute norm of an element.
-template <typename ValueType>
-typename scalar_of<ValueType>::type norm(const ValueType &a) {
-    return norm_impl<ValueType>::get(a);
-}
-
-/// Create zero element of type ValueType.
-template <typename ValueType>
-ValueType zero() {
-    return zero_impl<ValueType>::get();
-}
-
-/// Return true if argument is considered zero.
-template <typename ValueType>
-bool is_zero(const ValueType &x) {
-    return is_zero_impl<ValueType>::get(x);
-}
-
-/// Create identity of type ValueType.
-template <typename ValueType>
-ValueType identity() {
-    return identity_impl<ValueType>::get();
-}
-
-/// Create one element of type ValueType.
-template <typename ValueType>
-ValueType constant(typename scalar_of<ValueType>::type c) {
-    return constant_impl<ValueType>::get(c);
-}
-
-/// Return inverse of the argument.
-template <typename ValueType>
-ValueType inverse(const ValueType &x) {
-    return inverse_impl<ValueType>::get(x);
-}
-
-} // namespace math
-} // namespace amgcl
-
-#endif
diff --git a/src/solvers/amgcl/value_type/static_matrix.hpp b/src/solvers/amgcl/value_type/static_matrix.hpp
deleted file mode 100644
index 1a39f01..0000000
--- a/src/solvers/amgcl/value_type/static_matrix.hpp
+++ /dev/null
@@ -1,342 +0,0 @@
-#ifndef AMGCL_VALUE_TYPE_STATIC_MATRIX_HPP
-#define AMGCL_VALUE_TYPE_STATIC_MATRIX_HPP
-
-/*
-The MIT License
-
-Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-*/
-
-/**
- * \file   amgcl/value_type/static_matrix.hpp
- * \author Denis Demidov <dennis.demidov@gmail.com>
- * \brief  Enable statically sized matrices as value types.
- */
-
-#include <array>
-#include <type_traits>
-
-#include <amgcl/backend/builtin.hpp>
-#include <amgcl/value_type/interface.hpp>
-
-namespace amgcl {
-
-template <typename T, int N, int M>
-struct static_matrix {
-    std::array<T, N * M> buf;
-
-    T operator()(int i, int j) const {
-        return buf[i * M + j];
-    }
-
-    T& operator()(int i, int j) {
-        return buf[i * M + j];
-    }
-
-    T operator()(int i) const {
-        return buf[i];
-    }
-
-    T& operator()(int i) {
-        return buf[i];
-    }
-
-    const T* data() const {
-        return buf.data();
-    }
-
-    T* data() {
-        return buf.data();
-    }
-
-    template <typename U>
-    const static_matrix& operator=(const static_matrix<U,N,M> &y) {
-        for(int i = 0; i < N * M; ++i)
-            buf[i] = y.buf[i];
-        return *this;
-    }
-
-    template <typename U>
-    const static_matrix& operator+=(const static_matrix<U,N,M> &y) {
-        for(int i = 0; i < N * M; ++i)
-            buf[i] += y.buf[i];
-        return *this;
-    }
-
-    template <typename U>
-    const static_matrix& operator-=(const static_matrix<U,N,M> &y) {
-        for(int i = 0; i < N * M; ++i)
-            buf[i] -= y.buf[i];
-        return *this;
-    }
-
-    const static_matrix& operator*=(T c) {
-        for(int i = 0; i < N * M; ++i)
-            buf[i] *= c;
-        return *this;
-    }
-
-
-    friend static_matrix operator*(T a, static_matrix x)
-    {
-        return x *= a;
-    }
-
-    friend static_matrix operator-(static_matrix x)
-    {
-        for(int i = 0; i < N * M; ++i)
-            x.buf[i] = -x.buf[i];
-        return x;
-    }
-
-    friend bool operator<(const static_matrix &x, const static_matrix &y)
-    {
-        T xtrace = math::zero<T>();
-        T ytrace = math::zero<T>();
-
-        const int K = N < M ? N : M;
-
-        for(int i = 0; i < K; ++i) {
-            xtrace += x(i,i);
-            ytrace += y(i,i);
-        }
-
-        return xtrace < ytrace;
-    }
-
-    friend std::ostream& operator<<(std::ostream &os, const static_matrix &a) {
-        for(int i = 0; i < N; ++i) {
-            for(int j = 0; j < M; ++j) {
-                os << " " << a(i,j);
-            }
-            os << std::endl;
-        }
-        return os;
-    }
-};
-
-template <typename T, typename U, int N, int M>
-static_matrix<T, N, M> operator+(static_matrix<T, N, M> a, const static_matrix<U, N, M> &b)
-{
-    return a += b;
-}
-
-template <typename T, typename U, int N, int M>
-static_matrix<T, N, M> operator-(static_matrix<T, N, M> a, const static_matrix<U, N, M> &b)
-{
-    return a -= b;
-}
-
-template <typename T, typename U, int N, int K, int M>
-static_matrix<T, N, M> operator*(
-        const static_matrix<T, N, K> &a,
-        const static_matrix<U, K, M> &b
-        )
-{
-    static_matrix<T, N, M> c;
-    for(int i = 0; i < N; ++i) {
-        for(int j = 0; j < M; ++j)
-            c(i,j) = math::zero<T>();
-        for(int k = 0; k < K; ++k) {
-            T aik = a(i,k);
-            for(int j = 0; j < M; ++j)
-                c(i,j) += aik * b(k,j);
-        }
-    }
-    return c;
-}
-
-template <class T> struct is_static_matrix : std::false_type {};
-
-template <class T, int N, int M>
-struct is_static_matrix< static_matrix<T, N, M> > : std::true_type {};
-
-namespace backend {
-
-/// Enable static matrix as a value-type.
-template <typename T, int N, int M>
-struct is_builtin_vector< std::vector<static_matrix<T, N, M> > > : std::true_type {};
-
-} // namespace backend
-
-namespace math {
-
-/// Scalar type of a non-scalar type.
-template <class T, int N, int M>
-struct scalar_of< static_matrix<T, N, M> > {
-    typedef typename scalar_of<T>::type type;
-};
-
-/// Replace scalar type in the static matrix.
-template <class T, int N, int M, class S>
-struct replace_scalar<static_matrix<T, N, M>, S> {
-    typedef static_matrix<S, N, M> type;
-};
-
-/// RHS type corresponding to a non-scalar type.
-template <class T, int N>
-struct rhs_of< static_matrix<T, N, N> > {
-    typedef static_matrix<T, N, 1> type;
-};
-
-/// Element type of a non-scalar type
-template <class T, int N, int M>
-struct element_of< static_matrix<T, N, M> > {
-    typedef T type;
-};
-
-/// Whether the value type is a statically sized matrix.
-template <class T, int N, int M>
-struct is_static_matrix< static_matrix<T, N, M> > : std::true_type {};
-
-/// Number of rows for statically sized matrix types.
-template <class T, int N, int M>
-struct static_rows< static_matrix<T, N, M> > : std::integral_constant<int, N> {};
-
-/// Number of columns for statically sized matrix types.
-template <class T, int N, int M>
-struct static_cols< static_matrix<T, N, M> > : std::integral_constant<int, M> {};
-
-/// Specialization of conjugate transpose for static matrices.
-template <typename T, int N, int M>
-struct adjoint_impl< static_matrix<T, N, M> >
-{
-    typedef static_matrix<T, M, N> return_type;
-
-    static static_matrix<T, M, N> get(const static_matrix<T, N, M> &x) {
-        static_matrix<T, M, N> y;
-        for(int i = 0; i < N; ++i)
-            for(int j = 0; j < M; ++j)
-                y(j,i) = math::adjoint(x(i,j));
-        return y;
-    }
-};
-
-/// Inner-product result of two static vectors.
-template <class T, int N>
-struct inner_product_impl< static_matrix<T, N, 1> >
-{
-    typedef T return_type;
-    static T get(const static_matrix<T, N, 1> &x, const static_matrix<T, N, 1> &y) {
-        T sum = math::zero<T>();
-        for(int i = 0; i < N; ++i)
-            sum += x(i) * math::adjoint(y(i));
-        return sum;
-    }
-};
-
-/// Inner-product result of two static matrices.
-template <class T, int N, int M>
-struct inner_product_impl< static_matrix<T, N, M> >
-{
-    typedef static_matrix<T, M, M> return_type;
-
-    static return_type get(const static_matrix<T, N, M> &x, const static_matrix<T, N, M> &y) {
-        static_matrix<T, M, M> p;
-        for(int i = 0; i < M; ++i) {
-            for(int j = 0; j < M; ++j) {
-                T sum = math::zero<T>();
-                for(int k = 0; k < N; ++k)
-                    sum += x(k,i) * math::adjoint(y(k,j));
-                p(i,j) = sum;
-            }
-        }
-        return p;
-    }
-};
-
-/// Implementation of Frobenius norm for static matrices.
-template <typename T, int N, int M>
-struct norm_impl< static_matrix<T, N, M> >
-{
-    static typename math::scalar_of<T>::type get(const static_matrix<T, N, M> &x) {
-        T s = math::zero<T>();
-        for(int i = 0; i < N * M; ++i)
-            s += x(i) * math::adjoint(x(i));
-        return sqrt(math::norm(s));
-    }
-};
-
-/// Specialization of zero element for static matrices.
-template <typename T, int N, int M>
-struct zero_impl< static_matrix<T, N, M> >
-{
-    static static_matrix<T, N, M> get() {
-        static_matrix<T, N, M> z;
-        for(int i = 0; i < N * M; ++i)
-            z(i) = math::zero<T>();
-        return z;
-    }
-};
-
-/// Specialization of zero element for static matrices.
-template <typename T, int N, int M>
-struct is_zero_impl< static_matrix<T, N, M> >
-{
-    static bool get(const static_matrix<T, N, M> &x) {
-        for(int i = 0; i < N * M; ++i)
-            if (!math::is_zero(x(i))) return false;
-        return true;
-    }
-};
-
-/// Specialization of identity for static matrices.
-template <typename T, int N>
-struct identity_impl< static_matrix<T, N, N> >
-{
-    static static_matrix<T, N, N> get() {
-        static_matrix<T, N, N> I;
-        for(int i = 0; i < N; ++i)
-            for(int j = 0; j < N; ++j)
-                I(i,j) = static_cast<T>(i == j);
-        return I;
-    }
-};
-
-/// Specialization of constant for static matrices.
-template <typename T, int N, int M>
-struct constant_impl< static_matrix<T, N, M> >
-{
-    static static_matrix<T, N, M> get(T c) {
-        static_matrix<T, N, M> C;
-        for(int i = 0; i < N * M; ++i)
-            C(i) = c;
-        return C;
-    }
-};
-
-/// Specialization of inversion for static matrices.
-template <typename T, int N>
-struct inverse_impl< static_matrix<T, N, N> >
-{
-    static static_matrix<T, N, N> get(static_matrix<T, N, N> A) {
-        std::array<T, N * N> buf;
-        std::array<int, N> p;
-        detail::inverse(N, A.data(), buf.data(), p.data());
-        return A;
-    }
-};
-
-
-} // namespace math
-} // namespace amgcl
-
-#endif