feat3/amavanka_8hpp_source.html

// FEAT3: Finite Element Analysis Toolbox, Version 3

// Copyright (C) 2010 by Stefan Turek & the FEAT group

// FEAT3 is released under the GNU General Public License version 3,

// see the file 'copyright.txt' in the top level directory for details.


#pragma once


#include <kernel/lafem/null_matrix.hpp>

#include <kernel/lafem/sparse_matrix_bcsr.hpp>

#include <kernel/lafem/sparse_matrix_csr.hpp>

#include <kernel/lafem/saddle_point_matrix.hpp>

#include <kernel/lafem/tuple_matrix.hpp>

#include <kernel/global/matrix.hpp>

#include <kernel/solver/base.hpp>

#include <kernel/solver/amavanka_base.hpp>

#include <kernel/util/stop_watch.hpp>


namespace FEAT

{

  namespace Solver

  {

    template<typename Matrix_, typename Filter_>

    class AmaVanka :

      public Solver::SolverBase<typename Matrix_::VectorTypeL>

    {

    public:

      /// our base-class
      typedef Solver::SolverBase<typename Matrix_::VectorTypeL> BaseClass;

      /// our data type (taken from the system matrix)
      typedef typename Matrix_::DataType DataType;
      /// our index type (taken from the system matrix)
      typedef typename Matrix_::IndexType IndexType;
      /// our vector type (the left-compatible vector type of the system matrix)
      typedef typename Matrix_::VectorTypeL VectorType;

    protected:
      /// the type of our Vanka matrix, as selected by the AmaVankaMatrixHelper for Matrix_
      typedef typename Intern::AmaVankaMatrixHelper<Matrix_>::VankaMatrix VankaMatrixType;

      /// the system matrix; held by reference, so it has to outlive this object
      const Matrix_& _matrix;
      /// the system filter; held by reference, so it has to outlive this object
      const Filter_& _filter;
      /// the Vanka preconditioner matrix (allocated in init_symbolic, assembled in init_numeric)
      VankaMatrixType _vanka;
      /// deduct macro dofs automatically? (true until a graph is pushed via push_macro_dofs)
      bool _auto_macros;
      /// skip singular macros?
      bool _skip_singular;
      /// the macro-dofs graphs (one per matrix block) and their transposes, the dof-macros graphs
      std::vector<Adjacency::Graph> _macro_dofs, _dof_macros;
      /// the macro mask: init_numeric stores 1 for a regular and 0 for a singular macro;
      /// only filled if singular macros are to be skipped
      std::vector<int> _macro_mask;
      /// number of steps performed by a single call of apply
      Index _num_steps;
      /// damping parameter
      DataType _omega;
      /// temporary vectors: correction (_vec_c) and defect (_vec_d) for steps 2, ..., n of apply
      VectorType _vec_c, _vec_d;

      /// stop watch for symbolic factorization
      StopWatch watch_init_symbolic;
      /// stop watch for numeric factorization
      StopWatch watch_init_numeric;
      /// stop watch for apply time
      StopWatch watch_apply;

      /// number of threads for numeric factorization
      /// NOTE(review): this member is not read by any method of this class -- confirm where it is used
      int _num_threads;


    public:

      /**
       * \brief Constructor
       *
       * The new object starts with automatic macro deduction enabled and with the
       * skipping of singular macros disabled.
       *
       * \param[in] matrix
       * The system matrix. Only a reference is stored, so the matrix has to outlive this object.
       *
       * \param[in] filter
       * The system filter. Only a reference is stored, so the filter has to outlive this object.
       *
       * \param[in] omega
       * The damping parameter.
       *
       * \param[in] num_steps
       * The number of steps to be performed by each call of apply().
       */
      explicit AmaVanka(const Matrix_& matrix, const Filter_& filter,
        const DataType omega = DataType(1), const Index num_steps = Index(1)) :
        _matrix(matrix),
        _filter(filter),
        _vanka(),
        _auto_macros(true),
        _skip_singular(false),
        _num_steps(num_steps),
        _omega(omega),
        // give the thread count a defined value; it used to be left indeterminate,
        // which makes any read (including copying the object) undefined behaviour
        _num_threads(1)
      {
      }


      void clear_macro_dofs()

      {

        this->_macro_dofs.clear();

        _auto_macros = true;

      }


      /**
       * \brief Pushes the dofs-at-macro graph of the next block.
       *
       * The graphs have to be pushed in block order, one graph per matrix block. Pushing a graph
       * disables the automatic macro deduction. The dof indices of the stored graph are sorted.
       *
       * Aborts if a graph has already been stored for every block or if the number of macros
       * (domain nodes) differs from that of the previously pushed graph.
       *
       * \param[in] dofs
       * The dofs-at-macro graph of the next block; its contents are moved into this object.
       */
      void push_macro_dofs(Adjacency::Graph&& dofs)
      {
        // make sure that we do not push more graphs than we have blocks
        if(int(_macro_dofs.size()) >= Intern::AmaVankaMatrixHelper<Matrix_>::num_blocks)
          XABORTM("all macro-dofs graphs have already been added");

        // make sure that the number of macros matches our previous graph
        if(!_macro_dofs.empty() && (_macro_dofs.back().get_num_nodes_domain() != dofs.get_num_nodes_domain()))
          XABORTM("macro count mismatch");

        // the graph is acceptable: only now switch off the automatic deduction,
        // so that a rejected graph does not alter the state of this object
        _auto_macros = false;

        // 'dofs' is a plain rvalue reference (not a forwarding reference), so std::move is the right cast
        _macro_dofs.emplace_back(std::move(dofs));

        // sort the dof indices
        _macro_dofs.back().sort_indices();
      }


      /**
       * \brief Sets the number of smoothing steps.
       *
       * \note The temporary vectors required for more than one step are allocated by
       * init_symbolic() based on the step count that is set at that time.
       *
       * \param[in] num_steps
       * The number of steps to be performed by each call of apply(); must be > 0.
       */
      void set_num_steps(Index num_steps)
      {
        XASSERT(num_steps > Index(0));
        _num_steps = num_steps;
      }


      /**
       * \brief Sets the damping parameter omega.
       *
       * \note The damping parameter is consumed when the rows of the Vanka matrix are scaled
       * in init_numeric(), so a new value takes effect with the next numeric initialization.
       *
       * \param[in] omega
       * The new damping parameter; must be > 0.
       */
      void set_omega(DataType omega)
      {
        XASSERT(omega > DataType(0));
        _omega = omega;
      }


      void set_skip_singular(bool skip_sing)

      {

        this->_skip_singular = skip_sing;

      }


      std::size_t bytes() const

      {

        std::size_t s = _vanka.bytes();

        for(const auto& g : _macro_dofs)

          s += sizeof(Index) * std::size_t(g.get_num_nodes_domain() + g.get_num_indices());

        for(const auto& g : _dof_macros)

          s += sizeof(Index) * std::size_t(g.get_num_nodes_domain() + g.get_num_indices());

        s += _vec_c.bytes();

        s += _vec_d.bytes();

        return s;

      }


      std::size_t data_size() const

      {

        return std::size_t(_vanka.template used_elements<LAFEM::Perspective::pod>());

      }


      void reset_timings()

      {

        watch_init_symbolic.reset();

        watch_init_numeric.reset();

        watch_apply.reset();

      }


      double time_init_symbolic() const

      {

        return watch_init_symbolic.elapsed();

      }


      double time_init_numeric() const

      {

        return watch_init_numeric.elapsed();

      }


      double time_apply() const

      {

        return watch_apply.elapsed();

      }


      /// Returns the name of the solver.
      virtual String name() const override
      {
        return String("AmaVanka");
      }


      virtual void init_symbolic() override

      {

        watch_init_symbolic.start();


        BaseClass::init_symbolic();


        // we also need two vectors if we have to perform multiple steps

        if(this->_num_steps > Index(1))

        {

          this->_vec_c = this->_matrix.create_vector_l();

          this->_vec_d = this->_matrix.create_vector_l();

        }


        // automatically deduct macros?

        if(this->_auto_macros)

        {

          // try to deduct macros by pressure matrices in SaddlePointMatrix

          if(!Intern::AmaVankaCore::deduct_macro_dofs(this->_matrix, this->_macro_dofs))

            XABORTM("Cannot auto-deduct macros for this matrix type");

        }


        // make sure we have one macro-dof graph for each matrix block

        XASSERTM(int(_macro_dofs.size()) == Intern::AmaVankaMatrixHelper<Matrix_>::num_blocks,

           "invalid number of macro-dof graphs; did you push all of them?");


        // compute dof-macro graphs by transposing

        this->_dof_macros.resize(this->_macro_dofs.size());

        for(std::size_t i(0); i < this->_macro_dofs.size(); ++i)

        {

          // ensure that we have the same number of macros in all graphs

          XASSERT(this->_macro_dofs.at(i).get_num_nodes_domain() == this->_macro_dofs.front().get_num_nodes_domain());


          // transpose macro-dofs graph

          this->_dof_macros.at(i) = Adjacency::Graph(Adjacency::RenderType::transpose, this->_macro_dofs.at(i));

        }


        // allocate macro skip mask?

        if(this->_skip_singular)

          this->_macro_mask.resize(this->_macro_dofs.front().get_num_nodes_domain(), 0);


        Solver::Intern::AmaVankaCore::alloc(this->_vanka, this->_dof_macros, this->_macro_dofs, Index(0), Index(0));


        watch_init_symbolic.stop();

      }


      /**
       * \brief Releases the symbolic factorization data.
       *
       * Clears the Vanka matrix, the macro mask, the dof-macros graphs and the temporary vectors.
       * The macro-dofs graphs are cleared only if they were deduced automatically; graphs pushed
       * by the caller are kept.
       */
      virtual void done_symbolic() override
      {
        this->_vanka.clear();
        this->_macro_mask.clear();
        this->_dof_macros.clear();
        if(this->_auto_macros)
          this->_macro_dofs.clear();

        // release the temporary vectors unconditionally: the step count may have been reduced
        // via set_num_steps() after init_symbolic() allocated them, in which case a check of
        // the current step count would leave them allocated
        this->_vec_d.clear();
        this->_vec_c.clear();

        BaseClass::done_symbolic();
      }


      virtual void init_numeric() override

      {

        const DataType eps = Math::eps<DataType>();


        watch_init_numeric.start();

        BaseClass::init_numeric();


        this->_vanka.format();


        // get maximum macro size

        const Index num_macros = Index(this->_macro_dofs.front().get_num_nodes_domain());

        const Index stride = Intern::AmaVankaCore::calc_stride(this->_vanka, this->_macro_dofs);


        FEAT_PRAGMA_OMP(parallel)

        {

          // allocate arrays for local matrix

          std::vector<DataType> vec_local(stride*stride, DataType(0)), vec_local_t(stride*stride, DataType(0));

          std::vector<Index> vec_pivot(stride);

          DataType* local = vec_local.data();

          DataType* local_t = vec_local_t.data();

          Index* pivot = vec_pivot.data();


          // loop over all macros

          FEAT_PRAGMA_OMP(for)

          for(Index imacro = 0; imacro < num_macros; ++imacro)

          {

            // gather local matrix

            const std::pair<Index,Index> nrc = Intern::AmaVankaCore::gather(this->_matrix,

              local, stride, imacro, this->_macro_dofs, Index(0), Index(0), Index(0), Index(0));


            // make sure we have gathered a square matrix

            XASSERTM(nrc.first == nrc.second, "local matrix is not square");


            // assume a non-singular matrix

            bool singular = false;


            // do we check for singular macros?

            if(this->_skip_singular)

            {

              // the approach used for checking the regularity of the local matrix is to check whether

              //

              //     || I - A*A^{-1} ||_F^2 < eps

              //

              // we could try to analyse the pivots returned by invert_matrix function instead, but

              // unfortunately this approach sometimes leads to false positives


              // make a backup if checking for singularity

              for(Index i(0); i < nrc.first; ++i)

                for(Index j(0); j < nrc.second; ++j)

                  local_t[i*stride+j] = local[i*stride+j];


              // invert local matrix

              Math::invert_matrix(nrc.first, stride, local, pivot);


              // compute (squared) Frobenius norm of (I - A*A^{-1})

              DataType norm = DataType(0);

              for(Index i(0); i < nrc.first; ++i)

              {

                for(Index j(0); j < nrc.first; ++j)

                {

                  DataType xij = DataType(i == j ? 1 : 0);

                  for(Index k(0); k < nrc.first; ++k)

                    xij -= local_t[i*stride+k] * local[k*stride+j]; // A_ik * (A^{-1})_kj

                  norm += xij * xij;

                }

              }


              // is the matrix block singular?

              // Note: we check for !(norm < eps) instead of (norm >= eps),

              // because the latter one evaluates to false if norm is NaN,

              // which would result in a false negative

              singular = !(norm < eps);


              // set macro regularity mask

              this->_macro_mask[imacro] = (singular ? 0 : 1);

            }

            else // no singularity check

            {

              // invert local matrix

              Math::invert_matrix(nrc.first, stride, local, pivot);

            }


            // scatter local matrix

            if(!singular)

            {

              FEAT_PRAGMA_OMP(critical)

              {

                Intern::AmaVankaCore::scatter_add(this->_vanka, local, stride, imacro, this->_macro_dofs,

                  Index(0), Index(0), Index(0), Index(0));

              }

            }


            // reformat local matrix

            for(Index i(0); i < nrc.first; ++i)

              for(Index j(0); j < nrc.second; ++j)

                local[i*stride+j] = DataType(0);

          } // #pragma omp for

        } // #pragma omp parallel


        // scale rows of Vanka matrix

        Solver::Intern::AmaVankaCore::scale_rows(this->_vanka, this->_omega, this->_dof_macros, this->_macro_mask, Index(0), Index(0));


        watch_init_numeric.stop();

      }


      /**
       * \brief Applies the preconditioner.
       *
       * The first step applies the Vanka matrix to the right-hand side and filters the result.
       * Each further step computes and filters the defect of the current iterate, applies the
       * Vanka matrix to it, filters the resulting correction and adds it onto the iterate.
       * The whole call is timed by the apply stop watch.
       *
       * \param[out] vec_x
       * The vector that receives the result.
       *
       * \param[in] vec_b
       * The right-hand-side vector.
       *
       * \returns Always Status::success.
       */
      virtual Status apply(VectorType& vec_x, const VectorType& vec_b) override
      {
        watch_apply.start();

        // step 1: apply the Vanka matrix to the right-hand side and filter the result
        _vanka.apply(vec_x, vec_b);
        _filter.filter_cor(vec_x);

        // steps 2, ..., n   (if any)
        Index step(1);
        while(step < _num_steps)
        {
          // compute and filter the defect of the current iterate
          _matrix.apply(_vec_d, vec_x, vec_b, -DataType(1));
          _filter.filter_def(_vec_d);

          // turn the defect into a filtered correction
          _vanka.apply(_vec_c, _vec_d);
          _filter.filter_cor(_vec_c);

          // add the correction onto the iterate
          vec_x.axpy(_vec_c);

          ++step;
        }

        watch_apply.stop();

        return Status::success;
      }


      bool compare(const AmaVanka* other) const

      {

        return Intern::AmaVankaMatrixHelper<VankaMatrixType>::compare(this->_vanka, other->_vanka);

      }

    }; // class AmaVanka


    /**
     * \brief Creates a new AmaVanka smoother object.
     *
     * \param[in] matrix
     * The system matrix; forwarded to the AmaVanka constructor.
     *
     * \param[in] filter
     * The system filter; forwarded to the AmaVanka constructor.
     *
     * \param[in] omega
     * The damping parameter.
     *
     * \param[in] num_steps
     * The number of steps to be performed by each call of apply().
     *
     * \returns A shared pointer to the new AmaVanka object.
     */
    template<typename Matrix_, typename Filter_>
    std::shared_ptr<AmaVanka<Matrix_, Filter_>> new_amavanka(const Matrix_& matrix, const Filter_& filter,
      typename Matrix_::DataType omega = typename Matrix_::DataType(1), Index num_steps = Index(1))
    {
      typedef AmaVanka<Matrix_, Filter_> SolverType;
      return std::make_shared<SolverType>(matrix, filter, omega, num_steps);
    }

  } // namespace Solver

} // namespace FEAT

XABORTM
#define XABORTM(msg)
Abort macro definition with custom message.
Definition: assertion.hpp:192

XASSERT
#define XASSERT(expr)
Assertion macro definition.
Definition: assertion.hpp:262

XASSERTM
#define XASSERTM(expr, msg)
Assertion macro definition with custom message.
Definition: assertion.hpp:263

FEAT::Adjacency::Graph
Adjacency Graph implementation.
Definition: graph.hpp:34

FEAT::Solver::AmaVanka
Additive Macro-wise Matrix-based Vanka preconditioner/smoother.
Definition: amavanka.hpp:65

FEAT::Solver::AmaVanka::bytes
std::size_t bytes() const
Returns the total number of bytes currently allocated in this object.
Definition: amavanka.hpp:212

FEAT::Solver::AmaVanka::name
virtual String name() const override
Returns the name of the solver.
Definition: amavanka.hpp:270

FEAT::Solver::AmaVanka::_matrix
const Matrix_ & _matrix
the system matrix
Definition: amavanka.hpp:82

FEAT::Solver::AmaVanka::_macro_mask
std::vector< int > _macro_mask
the macro mask
Definition: amavanka.hpp:94

FEAT::Solver::AmaVanka::DataType
Matrix_::DataType DataType
our data type
Definition: amavanka.hpp:71

FEAT::Solver::AmaVanka::apply
virtual Status apply(VectorType &vec_x, const VectorType &vec_b) override
applies the preconditioner
Definition: amavanka.hpp:444

FEAT::Solver::AmaVanka::time_apply
double time_apply() const
Returns the total accumulated time for the solver application.
Definition: amavanka.hpp:264

FEAT::Solver::AmaVanka::_num_steps
Index _num_steps
number of steps
Definition: amavanka.hpp:96

FEAT::Solver::AmaVanka::set_omega
void set_omega(DataType omega)
Sets the damping parameter omega.
Definition: amavanka.hpp:192

FEAT::Solver::AmaVanka::_vec_c
VectorType _vec_c
temporary vectors
Definition: amavanka.hpp:100

FEAT::Solver::AmaVanka::IndexType
Matrix_::IndexType IndexType
our index type
Definition: amavanka.hpp:73

FEAT::Solver::AmaVanka::_auto_macros
bool _auto_macros
deduct macro dofs automatically?
Definition: amavanka.hpp:88

FEAT::Solver::AmaVanka::_omega
DataType _omega
damping parameter
Definition: amavanka.hpp:98

FEAT::Solver::AmaVanka::_skip_singular
bool _skip_singular
skip singular macros?
Definition: amavanka.hpp:90

FEAT::Solver::AmaVanka::_num_threads
int _num_threads
number of threads for numeric factorization
Definition: amavanka.hpp:110

FEAT::Solver::AmaVanka::init_numeric
virtual void init_numeric() override
Performs numeric factorization.
Definition: amavanka.hpp:338

FEAT::Solver::AmaVanka::reset_timings
void reset_timings()
Resets the internal stop watches for time measurement.
Definition: amavanka.hpp:238

FEAT::Solver::AmaVanka::init_symbolic
virtual void init_symbolic() override
Performs symbolic factorization.
Definition: amavanka.hpp:276

FEAT::Solver::AmaVanka::time_init_symbolic
double time_init_symbolic() const
Returns the total accumulated time for symbolic initialization.
Definition: amavanka.hpp:248

FEAT::Solver::AmaVanka::data_size
std::size_t data_size() const
Returns the total data size used by the AmaVanka smoother.
Definition: amavanka.hpp:230

FEAT::Solver::AmaVanka::set_skip_singular
void set_skip_singular(bool skip_sing)
Sets whether singular macros are to be skipped.
Definition: amavanka.hpp:204

FEAT::Solver::AmaVanka::_filter
const Filter_ & _filter
the system filter
Definition: amavanka.hpp:84

FEAT::Solver::AmaVanka::VectorType
Matrix_::VectorTypeL VectorType
our vector type
Definition: amavanka.hpp:75

FEAT::Solver::AmaVanka::AmaVanka
AmaVanka(const Matrix_ &matrix, const Filter_ &filter, const DataType omega=DataType(1), const Index num_steps=Index(1))
Constructor.
Definition: amavanka.hpp:128

FEAT::Solver::AmaVanka::time_init_numeric
double time_init_numeric() const
Returns the total accumulated time for numeric initialization.
Definition: amavanka.hpp:256

FEAT::Solver::AmaVanka::_vanka
VankaMatrixType _vanka
the Vanka preconditioner matrix
Definition: amavanka.hpp:86

FEAT::Solver::AmaVanka::done_symbolic
virtual void done_symbolic() override
Releases the symbolic factorization data.
Definition: amavanka.hpp:322

FEAT::Solver::AmaVanka::set_num_steps
void set_num_steps(Index num_steps)
Sets the number of smoothing steps.
Definition: amavanka.hpp:180

FEAT::Solver::AmaVanka::BaseClass
Solver::SolverBase< typename Matrix_::VectorTypeL > BaseClass
our base-class
Definition: amavanka.hpp:68

FEAT::Solver::AmaVanka::push_macro_dofs
void push_macro_dofs(Adjacency::Graph &&dofs)
Pushes the dofs-at-macro graph of the next block.
Definition: amavanka.hpp:155

FEAT::Solver::AmaVanka::clear_macro_dofs
void clear_macro_dofs()
Clears the macro dofs graphs.
Definition: amavanka.hpp:143

FEAT::Solver::AmaVanka::VankaMatrixType
Intern::AmaVankaMatrixHelper< Matrix_ >::VankaMatrix VankaMatrixType
the type of our Vanka matrix
Definition: amavanka.hpp:79

FEAT::Solver::AmaVanka::_macro_dofs
std::vector< Adjacency::Graph > _macro_dofs
the DOF-macro graphs
Definition: amavanka.hpp:92

FEAT::Solver::SolverBase
Polymorphic solver interface.
Definition: base.hpp:183

FEAT::Solver::SolverBase< typename Matrix_::VectorTypeL >::init_symbolic
virtual void init_symbolic()
Symbolic initialization method.
Definition: base.hpp:227

FEAT::Solver::SolverBase< typename Matrix_::VectorTypeL >::init_numeric
virtual void init_numeric()
Numeric initialization method.
Definition: base.hpp:237

FEAT::Solver::SolverBase< typename Matrix_::VectorTypeL >::done_symbolic
virtual void done_symbolic()
Symbolic finalization method.
Definition: base.hpp:255

FEAT::StopWatch
Stop-Watch class.
Definition: stop_watch.hpp:21

FEAT::StopWatch::elapsed
double elapsed() const
Returns the total elapsed time in seconds.
Definition: stop_watch.hpp:70

FEAT::StopWatch::start
void start()
Starts the stop-watch.
Definition: stop_watch.hpp:43

FEAT::StopWatch::reset
void reset()
Resets the elapsed time.
Definition: stop_watch.hpp:36

FEAT::StopWatch::stop
void stop()
Stops the stop-watch and increments elapsed time.
Definition: stop_watch.hpp:51

FEAT::String
String class implementation.
Definition: string.hpp:46

FEAT::Adjacency::RenderType::transpose
@ transpose
Render-Transpose mode.

FEAT::Math::invert_matrix
DT_ invert_matrix(const IT_ n, const IT_ stride, DT_ a[], IT_ p[])
Inverts a matrix and returns its determinant.
Definition: math.hpp:1292

FEAT::Solver::new_amavanka
std::shared_ptr< AmaVanka< Matrix_, Filter_ > > new_amavanka(const Matrix_ &matrix, const Filter_ &filter, typename Matrix_::DataType omega=typename Matrix_::DataType(1), Index num_steps=Index(1))
Creates a new AmaVanka smoother object.
Definition: amavanka.hpp:497

FEAT::Solver::Status
Status
Solver status return codes enumeration.
Definition: base.hpp:47

FEAT::Solver::Status::success
@ success
solving successful (convergence criterion fulfilled)

FEAT
FEAT namespace.
Definition: adjactor.hpp:12

FEAT::Index
std::uint64_t Index
Index data type.
Definition: base_header.hpp:122