d2/d30/parallel__symmetric__successive__over__relaxation_8h_source.html

/*

 * Copyright 2023 MusicScience37 (Kenta Kabashima)

 *

 * Licensed under the Apache License, Version 2.0 (the "License");

 * you may not use this file except in compliance with the License.

 * You may obtain a copy of the License at

 *

 *     http://www.apache.org/licenses/LICENSE-2.0

 *

 * Unless required by applicable law or agreed to in writing, software

 * distributed under the License is distributed on an "AS IS" BASIS,

 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.

 * See the License for the specific language governing permissions and

 * limitations under the License.

 */

#pragma once


#include <algorithm>

#include <cmath>


#include <Eigen/Core>

#include <omp.h>


#include "num_collect/base/concepts/dense_vector_of.h"

#include "num_collect/base/concepts/real_scalar.h"

#include "num_collect/base/concepts/sparse_matrix.h"

#include "num_collect/base/exception.h"

#include "num_collect/base/index_type.h"

#include "num_collect/base/precondition.h"

#include "num_collect/linear/iterative_solver_base.h"

#include "num_collect/logging/log_tag_view.h"

#include "num_collect/logging/logging_macros.h"

#include "num_collect/logging/logging_mixin.h"


namespace num_collect::linear {


// Forward declaration of the solver class template. It is needed because the
// traits specialization in namespace impl below names this class before the
// class itself is defined.
template <base::concepts::sparse_matrix Matrix>

class parallel_symmetric_successive_over_relaxation;


/*!
 * \brief Log tag of parallel_symmetric_successive_over_relaxation.
 *
 * \note This variable is `inline` so that all translation units including
 * this header share a single definition. A plain namespace-scope `constexpr`
 * variable has internal linkage, and using it from inline functions defined
 * in a header would make those functions refer to different objects in
 * different translation units.
 */
inline constexpr auto parallel_symmetric_successive_over_relaxation_tag =
    logging::log_tag_view(
        "num_collect::linear::parallel_symmetric_successive_over_relaxation");


namespace impl {


// Specialization of iterative_solver_traits for
// parallel_symmetric_successive_over_relaxation.
//
// It exposes the matrix type of the solver as `matrix_type`.
// NOTE(review): presumably iterative_solver_base reads this trait to derive
// its own type aliases (matrix_type, scalar_type, ...) - confirm against
// iterative_solver_base.h.
template <base::concepts::sparse_matrix Matrix>


struct iterative_solver_traits<

    parallel_symmetric_successive_over_relaxation<Matrix>> {

    // Type of the coefficient matrix handled by the solver.
    using matrix_type = Matrix;

};


}  // namespace impl


/*!
 * \brief Class to solve linear equations using symmetric successive
 * over-relaxation (SSOR) with OpenMP threads.
 *
 * One iteration consists of a forward sweep over the rows followed by a
 * backward sweep. In the parallel variant the rows are split into contiguous
 * chunks, one chunk per thread. Inside a chunk a sweep uses the values already
 * updated in the same sweep, while values of rows owned by other threads are
 * taken from the result of the previous sweep.
 *
 * \tparam Matrix Type of the coefficient matrix. It must be a row-major
 * sparse matrix with a real scalar type (checked by static_assert).
 */
template <base::concepts::sparse_matrix Matrix>
class parallel_symmetric_successive_over_relaxation
    : public iterative_solver_base<
          parallel_symmetric_successive_over_relaxation<Matrix>>,
      public logging::logging_mixin {
    static_assert(Matrix::IsRowMajor == 1, "Row major matrix is required.");
    static_assert(base::concepts::real_scalar<typename Matrix::Scalar>,
        "Complex matrices are not supported.");

public:
    //! Type of the base class.
    using base_type = iterative_solver_base<
        parallel_symmetric_successive_over_relaxation<Matrix>>;

    using typename base_type::matrix_type;
    using typename base_type::real_scalar_type;
    using typename base_type::scalar_type;
    using typename base_type::storage_index_type;

protected:
    using base_type::coeff;

public:
    //! Type of vectors.
    using vector_type = Eigen::VectorX<scalar_type>;

    /*!
     * \brief Constructor.
     */
    parallel_symmetric_successive_over_relaxation()
        : logging::logging_mixin(
              parallel_symmetric_successive_over_relaxation_tag) {}

    /*!
     * \brief Prepare to solve.
     *
     * Stores the coefficient matrix in the base class, caches the diagonal
     * and its element-wise inverse, allocates the work vector, and decides
     * whether to run in parallel from the number of non-zero elements per
     * available thread.
     *
     * \note This function overwrites the flag set by run_parallel(bool), so
     * call run_parallel(bool) after this function to force a mode.
     *
     * \param[in] coeff Coefficient matrix. All diagonal elements must be
     * non-zero; otherwise the precondition check fails.
     */
    void compute(const matrix_type& coeff) {
        // Minimum number of non-zero elements per thread for which the
        // parallel iteration is selected automatically.
        constexpr index_type min_non_zeros_per_thread = 1000;

        base_type::compute(coeff);
        diag_ = coeff.diagonal();
        inv_diag_ = diag_.cwiseInverse();
        intermidiate_solution_.resize(coeff.cols());
        // A zero diagonal element yields an infinite (non-finite) inverse.
        NUM_COLLECT_PRECONDITION(inv_diag_.array().isFinite().all(),
            "All diagonal elements of the coefficient matrix must not be "
            "zero.");
        run_parallel_ = (coeff.nonZeros() / omp_get_max_threads() >
            min_non_zeros_per_thread);
    }

    /*!
     * \brief Iterate repeatedly until stop criterion is satisfied for a
     * vector.
     *
     * Iterations stop when the square root of the ratio of the squared
     * residual to the squared norm of the right-hand-side vector becomes
     * smaller than the tolerance of the base class, or when the maximum
     * number of iterations is reached.
     *
     * If the right-hand-side vector is exactly zero, the relative residual
     * is undefined (division by zero). In that case the solution is set to
     * the zero vector without iterating, which is the solution for any
     * non-singular coefficient matrix.
     *
     * \tparam Right Type of the right-hand-side vector.
     * \tparam Solution Type of the solution vector.
     * \param[in] right Right-hand-side vector.
     * \param[in,out] solution Solution vector. The value on input is used as
     * the initial guess, and the value is updated in place.
     *
     * An exception is thrown by the precondition checks when the sizes are
     * inconsistent, and algorithm_failure is thrown when the residual becomes
     * non-finite.
     */
    template <base::concepts::dense_vector_of<scalar_type> Right,
        base::concepts::dense_vector_of<scalar_type> Solution>
    void solve_vector_in_place(const Right& right, Solution& solution) const {
        const auto& coeff_ref = coeff();

        NUM_COLLECT_PRECONDITION(coeff_ref.rows() == coeff_ref.cols(),
            "Coefficient matrix must be a square matrix.");
        NUM_COLLECT_PRECONDITION(right.rows() == coeff_ref.cols(),
            "Right-hand-side vector must have the number of elements same as "
            "the size of the coefficient matrix.");
        NUM_COLLECT_PRECONDITION(solution.rows() == coeff_ref.cols(),
            "Solution vector must have the number of elements same as the size "
            "of the coefficient matrix.");

        iterations_ = 0;
        const scalar_type right_norm = right.squaredNorm();
        if (right_norm == static_cast<scalar_type>(0)) {
            // Without this guard residual_ / right_norm would be NaN or
            // infinity, the comparison with the tolerance would never
            // succeed, and the loop would always run max_iterations times.
            solution.setZero();
            residual_ = static_cast<scalar_type>(0);
            residual_rate_ = static_cast<scalar_type>(0);
            return;
        }

        const index_type max_iterations = base_type::max_iterations();
        while (iterations_ < max_iterations) {
            if (run_parallel_) {
                iterate_parallel(coeff_ref, right, solution);
            } else {
                iterate_no_parallel(coeff_ref, right, solution);
            }
            if (!std::isfinite(residual_)) {
                NUM_COLLECT_LOG_AND_THROW(algorithm_failure,
                    "Failure in "
                    "parallel_symmetric_successive_over_relaxation.");
            }
            ++iterations_;
            using std::sqrt;
            // residual_ and right_norm are both squared quantities.
            residual_rate_ = sqrt(residual_ / right_norm);
            if (residual_rate_ < base_type::tolerance()) {
                break;
            }
        }
    }

    /*!
     * \brief Get the number of iterations.
     *
     * \return Number of iterations performed in the last call of
     * solve_vector_in_place.
     */
    [[nodiscard]] auto iterations() const noexcept -> index_type {
        return iterations_;
    }

    /*!
     * \brief Get the rate of the last residual.
     *
     * \return Value compared with the tolerance in the last iteration.
     */
    [[nodiscard]] auto residual_rate() const noexcept -> scalar_type {
        return residual_rate_;
    }

    /*!
     * \brief Set the relaxation coefficient.
     *
     * \param[in] val Relaxation coefficient. It must satisfy 0 < val < 2;
     * otherwise the precondition check fails.
     * \return This object.
     */
    auto relaxation_coeff(const scalar_type& val)
        -> parallel_symmetric_successive_over_relaxation& {
        NUM_COLLECT_PRECONDITION(static_cast<scalar_type>(0) < val &&
                val < static_cast<scalar_type>(2),
            "Relaxation coefficient must be in the range (0, 2).");
        relaxation_coeff_ = val;
        return *this;
    }

    /*!
     * \brief Set whether to run in parallel.
     *
     * \note compute() overwrites this flag.
     *
     * \param[in] val Whether to run in parallel.
     * \return This object.
     */
    auto run_parallel(bool val)
        -> parallel_symmetric_successive_over_relaxation& {
        run_parallel_ = val;
        return *this;
    }

private:
    /*!
     * \brief Iterate once in parallel.
     *
     * Rows are divided into contiguous chunks of equal size (the last chunks
     * may be shorter or empty), and each thread sweeps its own chunk forward
     * and then backward. The sum of squared row residuals of the forward
     * sweep is stored in residual_.
     *
     * \tparam Right Type of the right-hand-side vector.
     * \tparam Solution Type of the solution vector.
     * \param[in] coeff_ref Coefficient matrix.
     * \param[in] right Right-hand-side vector.
     * \param[in,out] solution Solution vector.
     */
    template <base::concepts::dense_vector_of<scalar_type> Right,
        base::concepts::dense_vector_of<scalar_type> Solution>
    void iterate_parallel(const matrix_type& coeff_ref, const Right& right,
        Solution& solution) const {
        const index_type size = coeff_ref.rows();
        const scalar_type prev_sol_coeff =
            static_cast<scalar_type>(1) - relaxation_coeff_;
        residual_ = static_cast<scalar_type>(0);

#pragma omp parallel
        {
            const index_type num_threads = omp_get_num_threads();
            const index_type thread_id = omp_get_thread_num();
            // Ceiling division so that all rows are covered.
            const index_type rows_per_thread =
                (size + num_threads - 1) / num_threads;
            const index_type my_start_row = thread_id * rows_per_thread;
            // When there are more threads than needed, my_last_row can be
            // less than my_start_row, which makes both loops below empty.
            const index_type my_last_row =
                std::min(my_start_row + rows_per_thread, size);

            // Log the partition of rows only in the first iteration.
            if (iterations_ == 0) {
                NUM_COLLECT_LOG_TRACE(this->logger(),
                    "my rows: {} - {} (whole rows: {})", my_start_row,
                    my_last_row, size);
            }

            auto my_residual = static_cast<scalar_type>(0);

            // Forward update: reads solution, writes intermidiate_solution_.
            for (index_type i = my_start_row; i < my_last_row; ++i) {
                my_residual += process_row_forward(coeff_ref, right, solution,
                    i, my_start_row, prev_sol_coeff);
            }

            // The backward update reads intermidiate_solution_ of rows owned
            // by other threads and overwrites solution, so every thread must
            // finish the forward update first.
#pragma omp barrier

            // Backward update: reads intermidiate_solution_, writes solution.
            for (index_type i = my_last_row - 1; i >= my_start_row; --i) {
                process_row_backward(
                    coeff_ref, right, solution, i, my_last_row, prev_sol_coeff);
            }

            // Accumulate the per-thread residual into the shared member.
#pragma omp critical
            residual_ += my_residual;
        }
    }

    /*!
     * \brief Iterate once in single thread.
     *
     * Performs a forward sweep over all rows followed by a backward sweep,
     * and stores the sum of squared row residuals of the forward sweep in
     * residual_.
     *
     * \tparam Right Type of the right-hand-side vector.
     * \tparam Solution Type of the solution vector.
     * \param[in] coeff_ref Coefficient matrix.
     * \param[in] right Right-hand-side vector.
     * \param[in,out] solution Solution vector.
     */
    template <base::concepts::dense_vector_of<scalar_type> Right,
        base::concepts::dense_vector_of<scalar_type> Solution>
    void iterate_no_parallel(const matrix_type& coeff_ref, const Right& right,
        Solution& solution) const {
        const index_type size = coeff_ref.rows();
        const scalar_type prev_sol_coeff =
            static_cast<scalar_type>(1) - relaxation_coeff_;
        residual_ = static_cast<scalar_type>(0);

        // Forward update.
        for (index_type i = 0; i < size; ++i) {
            residual_ += process_row_forward(
                coeff_ref, right, solution, i, 0, prev_sol_coeff);
        }

        // Backward update.
        for (index_type i = size - 1; i >= 0; --i) {
            process_row_backward(
                coeff_ref, right, solution, i, size, prev_sol_coeff);
        }
    }

    /*!
     * \brief Process a row in the forward update.
     *
     * Computes element i of intermidiate_solution_ from the right-hand-side
     * vector and the off-diagonal elements of row i. For columns in
     * [start_row, i) the values already written to intermidiate_solution_ in
     * this sweep are used; for all other off-diagonal columns the values in
     * solution are used.
     *
     * \tparam Right Type of the right-hand-side vector.
     * \tparam Solution Type of the solution vector.
     * \param[in] coeff_ref Coefficient matrix.
     * \param[in] right Right-hand-side vector.
     * \param[in] solution Solution vector (only read here).
     * \param[in] i Index of the row.
     * \param[in] start_row Index of the first row of the chunk containing
     * row i.
     * \param[in] prev_sol_coeff Coefficient of the previous value, i.e.
     * one minus the relaxation coefficient.
     * \return Squared residual of the row, evaluated with the values used
     * in this update.
     */
    template <base::concepts::dense_vector_of<scalar_type> Right,
        base::concepts::dense_vector_of<scalar_type> Solution>
    auto process_row_forward(const matrix_type& coeff_ref, const Right& right,
        Solution& solution, index_type i, index_type start_row,
        const scalar_type& prev_sol_coeff) const -> scalar_type {
        scalar_type numerator = right(i);
        for (typename matrix_type::InnerIterator iter(coeff_ref, i); iter;
            ++iter) {
            if (start_row <= iter.index() && iter.index() < i) {
                // Already updated in this sweep by the same chunk.
                numerator -=
                    iter.value() * intermidiate_solution_(iter.index());
            } else if (iter.index() != i) {
                // Not updated yet in this sweep, or owned by another chunk.
                numerator -= iter.value() * solution(iter.index());
            }
        }
        const scalar_type row_residual = numerator - diag_(i) * solution(i);
        intermidiate_solution_(i) =
            relaxation_coeff_ * numerator * inv_diag_(i) +
            prev_sol_coeff * solution(i);
        return row_residual * row_residual;
    }

    /*!
     * \brief Process a row in the backward update.
     *
     * Computes element i of solution from the right-hand-side vector and the
     * off-diagonal elements of row i. For columns in (i, end_row) the values
     * already written to solution in this sweep are used; for all other
     * off-diagonal columns the values in intermidiate_solution_ are used.
     *
     * \tparam Right Type of the right-hand-side vector.
     * \tparam Solution Type of the solution vector.
     * \param[in] coeff_ref Coefficient matrix.
     * \param[in] right Right-hand-side vector.
     * \param[in,out] solution Solution vector.
     * \param[in] i Index of the row.
     * \param[in] end_row Index of the past-the-end row of the chunk
     * containing row i.
     * \param[in] prev_sol_coeff Coefficient of the previous value, i.e.
     * one minus the relaxation coefficient.
     */
    template <base::concepts::dense_vector_of<scalar_type> Right,
        base::concepts::dense_vector_of<scalar_type> Solution>
    void process_row_backward(const matrix_type& coeff_ref, const Right& right,
        Solution& solution, index_type i, index_type end_row,
        const scalar_type& prev_sol_coeff) const {
        scalar_type numerator = right(i);
        for (typename matrix_type::InnerIterator iter(coeff_ref, i); iter;
            ++iter) {
            if (i < iter.index() && iter.index() < end_row) {
                // Already updated in this sweep by the same chunk.
                numerator -= iter.value() * solution(iter.index());
            } else if (iter.index() != i) {
                // Result of the forward update.
                numerator -=
                    iter.value() * intermidiate_solution_(iter.index());
            }
        }
        solution(i) = relaxation_coeff_ * numerator * inv_diag_(i) +
            prev_sol_coeff * intermidiate_solution_(i);
    }

    //! Whether to run in parallel.
    bool run_parallel_{true};

    //! Number of iterations.
    mutable index_type iterations_{};

    //! Last residual (sum of squared row residuals).
    mutable scalar_type residual_{};

    //! Rate of last residual.
    mutable scalar_type residual_rate_{};

    //! Relaxation coefficient.
    scalar_type relaxation_coeff_{static_cast<scalar_type>(1)};

    //! Diagonal coefficients.
    vector_type diag_{};

    //! Inverse of diagonal coefficients.
    vector_type inv_diag_{};

    //! Intermediate solution vector (result of the forward update).
    mutable vector_type intermidiate_solution_{};
};


}  // namespace num_collect::linear

num_collect::algorithm_failure
Class of exception on failure in algorithm.
Definition exception.h:93

num_collect::linear::iterative_solver_base< parallel_symmetric_successive_over_relaxation< Matrix > >::storage_index_type
StorageIndex storage_index_type
Definition iterative_solver_base.h:75

num_collect::linear::iterative_solver_base< parallel_symmetric_successive_over_relaxation< Matrix > >::coeff
auto coeff() const noexcept -> const matrix_type &
Definition iterative_solver_base.h:243

num_collect::linear::iterative_solver_base< parallel_symmetric_successive_over_relaxation< Matrix > >::matrix_type
MatrixType matrix_type
Definition iterative_solver_base.h:71

num_collect::linear::iterative_solver_base< parallel_symmetric_successive_over_relaxation< Matrix > >::scalar_type
Scalar scalar_type
Definition iterative_solver_base.h:73

num_collect::linear::iterative_solver_base< parallel_symmetric_successive_over_relaxation< Matrix > >::iterative_solver_base
iterative_solver_base()
Definition iterative_solver_base.h:91

num_collect::linear::iterative_solver_base< parallel_symmetric_successive_over_relaxation< Matrix > >::tolerance
auto tolerance() const noexcept -> real_scalar_type
Definition iterative_solver_base.h:130

num_collect::linear::iterative_solver_base< parallel_symmetric_successive_over_relaxation< Matrix > >::real_scalar_type
RealScalar real_scalar_type
Definition iterative_solver_base.h:77

num_collect::linear::iterative_solver_base< parallel_symmetric_successive_over_relaxation< Matrix > >::compute
auto compute(const matrix_type &coeff) -> parallel_symmetric_successive_over_relaxation< Matrix > &
Definition iterative_solver_base.h:101

num_collect::linear::iterative_solver_base< parallel_symmetric_successive_over_relaxation< Matrix > >::max_iterations
auto max_iterations() const noexcept -> index_type
Definition iterative_solver_base.h:152

num_collect::linear::parallel_symmetric_successive_over_relaxation
Class to solve linear equations using symmetric successive over-relaxation with threads [golub2013].
Definition parallel_symmetric_successive_over_relaxation.h:75

num_collect::linear::parallel_symmetric_successive_over_relaxation::iterations
auto iterations() const noexcept -> index_type
Get the number of iterations.
Definition parallel_symmetric_successive_over_relaxation.h:173

num_collect::linear::parallel_symmetric_successive_over_relaxation::base_type
iterative_solver_base< parallel_symmetric_successive_over_relaxation< Matrix > > base_type
Type of the base class.
Definition parallel_symmetric_successive_over_relaxation.h:82

num_collect::linear::parallel_symmetric_successive_over_relaxation::solve_vector_in_place
void solve_vector_in_place(const Right &right, Solution &solution) const
Iterate repeatedly until stop criterion is satisfied for a vector.
Definition parallel_symmetric_successive_over_relaxation.h:131

num_collect::linear::parallel_symmetric_successive_over_relaxation::intermidiate_solution_
vector_type intermidiate_solution_
Intermediate solution vector.
Definition parallel_symmetric_successive_over_relaxation.h:392

num_collect::linear::parallel_symmetric_successive_over_relaxation::relaxation_coeff
auto relaxation_coeff(const scalar_type &val) -> parallel_symmetric_successive_over_relaxation &
Set the relaxation coefficient.
Definition parallel_symmetric_successive_over_relaxation.h:194

num_collect::linear::parallel_symmetric_successive_over_relaxation::coeff
auto coeff() const noexcept -> const matrix_type &
Get the coefficient matrix.
Definition iterative_solver_base.h:243

num_collect::linear::parallel_symmetric_successive_over_relaxation::iterate_no_parallel
void iterate_no_parallel(const matrix_type &coeff_ref, const Right &right, Solution &solution) const
Iterate once in single thread.
Definition parallel_symmetric_successive_over_relaxation.h:284

num_collect::linear::parallel_symmetric_successive_over_relaxation::parallel_symmetric_successive_over_relaxation
parallel_symmetric_successive_over_relaxation()
Constructor.
Definition parallel_symmetric_successive_over_relaxation.h:100

num_collect::linear::parallel_symmetric_successive_over_relaxation::run_parallel
auto run_parallel(bool val) -> parallel_symmetric_successive_over_relaxation &
Set whether to run in parallel.
Definition parallel_symmetric_successive_over_relaxation.h:211

num_collect::linear::parallel_symmetric_successive_over_relaxation::residual_
scalar_type residual_
Last residual.
Definition parallel_symmetric_successive_over_relaxation.h:377

num_collect::linear::parallel_symmetric_successive_over_relaxation::relaxation_coeff_
scalar_type relaxation_coeff_
Relaxation coefficient.
Definition parallel_symmetric_successive_over_relaxation.h:383

num_collect::linear::parallel_symmetric_successive_over_relaxation::vector_type
Eigen::VectorX< scalar_type > vector_type
Type of vectors.
Definition parallel_symmetric_successive_over_relaxation.h:95

num_collect::linear::parallel_symmetric_successive_over_relaxation::residual_rate_
scalar_type residual_rate_
Rate of last residual.
Definition parallel_symmetric_successive_over_relaxation.h:380

num_collect::linear::parallel_symmetric_successive_over_relaxation::run_parallel_
bool run_parallel_
Whether to run in parallel.
Definition parallel_symmetric_successive_over_relaxation.h:371

num_collect::linear::parallel_symmetric_successive_over_relaxation::process_row_forward
auto process_row_forward(const matrix_type &coeff_ref, const Right &right, Solution &solution, index_type i, index_type start_row, const scalar_type &prev_sol_coeff) const -> scalar_type
Process a row in the forward update.
Definition parallel_symmetric_successive_over_relaxation.h:319

num_collect::linear::parallel_symmetric_successive_over_relaxation::diag_
vector_type diag_
Diagonal coefficients.
Definition parallel_symmetric_successive_over_relaxation.h:386

num_collect::linear::parallel_symmetric_successive_over_relaxation::iterations_
index_type iterations_
Number of iterations.
Definition parallel_symmetric_successive_over_relaxation.h:374

num_collect::linear::parallel_symmetric_successive_over_relaxation::inv_diag_
vector_type inv_diag_
Inverse of diagonal coefficients.
Definition parallel_symmetric_successive_over_relaxation.h:389

num_collect::linear::parallel_symmetric_successive_over_relaxation::iterate_parallel
void iterate_parallel(const matrix_type &coeff_ref, const Right &right, Solution &solution) const
Iterate once in parallel.
Definition parallel_symmetric_successive_over_relaxation.h:229

num_collect::linear::parallel_symmetric_successive_over_relaxation::process_row_backward
void process_row_backward(const matrix_type &coeff_ref, const Right &right, Solution &solution, index_type i, index_type end_row, const scalar_type &prev_sol_coeff) const
Process a row in the backward update.
Definition parallel_symmetric_successive_over_relaxation.h:353

num_collect::linear::parallel_symmetric_successive_over_relaxation::residual_rate
auto residual_rate() const noexcept -> scalar_type
Get the rate of the last residual.
Definition parallel_symmetric_successive_over_relaxation.h:184

num_collect::linear::parallel_symmetric_successive_over_relaxation::compute
void compute(const matrix_type &coeff)
Prepare to solve.
Definition parallel_symmetric_successive_over_relaxation.h:109

num_collect::logging::log_tag_view
Class of tags of logs without memory management.
Definition log_tag_view.h:35

num_collect::logging::logging_mixin
Class to incorporate logging in algorithms.
Definition logging_mixin.h:32

num_collect::logging::logging_mixin::logging_mixin
logging_mixin(log_tag_view tag)
Constructor.
Definition logging_mixin.h:39

num_collect::logging::logging_mixin::logger
auto logger() const noexcept -> const num_collect::logging::logger &
Access to the logger.
Definition logging_mixin.h:46

num_collect::base::concepts::real_scalar
Concept of real scalars.
Definition real_scalar.h:55

dense_vector_of.h
Definition of dense_vector_of concept.

exception.h
Definition of exceptions.

index_type.h
Definition of index_type type.

iterative_solver_base.h
Definition of iterative_solver_base class.

log_tag_view.h
Definition of log_tag_view class.

logging_macros.h
Definition of macros for logging.

NUM_COLLECT_LOG_TRACE
#define NUM_COLLECT_LOG_TRACE(LOGGER,...)
Write a trace log.
Definition logging_macros.h:184

NUM_COLLECT_LOG_AND_THROW
#define NUM_COLLECT_LOG_AND_THROW(EXCEPTION_TYPE,...)
Write an error log and throw an exception for an error.
Definition logging_macros.h:333

logging_mixin.h
Definition of logging_mixin class.

num_collect::base::index_type
std::ptrdiff_t index_type
Type of indices in this library.
Definition index_type.h:33

num_collect::linear::impl
Namespace of internal implementations.
Definition algebraic_multigrid_solver.h:55

num_collect::linear
Namespace of solvers of linear equations.
Definition algebraic_multigrid_solver.h:46

num_collect::linear::parallel_symmetric_successive_over_relaxation_tag
constexpr auto parallel_symmetric_successive_over_relaxation_tag
Log tag of parallel_symmetric_successive_over_relaxation.
Definition parallel_symmetric_successive_over_relaxation.h:45

num_collect::logging
Namespace of logging.
Definition formattable_iteration_parameter_value.h:27

precondition.h
Definition of NUM_COLLECT_PRECONDITION macro.

NUM_COLLECT_PRECONDITION
#define NUM_COLLECT_PRECONDITION(CONDITION,...)
Check whether a precondition is satisfied and throw an exception if not.
Definition precondition.h:137

real_scalar.h
Definition of real_scalar concept.

sparse_matrix.h
Definition of sparse_matrix concept.

num_collect::linear::impl::iterative_solver_traits< parallel_symmetric_successive_over_relaxation< Matrix > >::matrix_type
Matrix matrix_type
Type of the matrix.
Definition parallel_symmetric_successive_over_relaxation.h:60

num_collect::linear::impl::iterative_solver_traits
Traits of iterative solvers.
Definition iterative_solver_base.h:43