// feat3/ilu__precond_8hpp_source.html

// FEAT3: Finite Element Analysis Toolbox, Version 3

// Copyright (C) 2010 by Stefan Turek & the FEAT group

// FEAT3 is released under the GNU General Public License version 3,

// see the file 'copyright.txt' in the top level directory for details.


#pragma once


// includes, FEAT

#include <kernel/solver/base.hpp>

#include <kernel/lafem/sparse_matrix_csr.hpp>

#include <kernel/lafem/sparse_matrix_bcsr.hpp>


// includes, system

#include <vector>


namespace FEAT

{

  namespace Solver

  {

    namespace Intern

    {

      // Prototypes of the scalar ILU routines of the CUDA backend. Only the declarations are
      // visible in this header; the definitions live elsewhere.
      // NOTE(review): the parameter names suggest a CSR matrix (csrVal / csrRowPtr / csrColInd),
      // an output vector y, an input vector x and an opaque handle 'vinfo' that is produced by
      // cuda_ilu_init_symbolic() and released by cuda_ilu_done_symbolic() -- confirm against
      // the implementation, including the meaning of the int return value of cuda_ilu_apply().
      int cuda_ilu_apply(double * y, const double * x, double * csrVal, int * csrRowPtr, int * csrColInd, void * vinfo);

      // m and nnz are presumably the row count and the number of stored entries -- TODO confirm.
      void * cuda_ilu_init_symbolic(int m, int nnz, double * csrVal, int * csrRowPtr, int * csrColInd);

      void cuda_ilu_init_numeric(double * csrVal, int * csrRowPtr, int * csrColInd, void * vinfo);

      void cuda_ilu_done_symbolic(void * vinfo);


      // Prototypes of the blocked counterparts of the routines above; the symbolic
      // initialization additionally receives a block size.
      // NOTE(review): semantics are assumed to mirror the scalar routines -- confirm.
      int cuda_ilub_apply(double * y, const double * x, double * csrVal, int * csrRowPtr, int * csrColInd, void * vinfo);

      void * cuda_ilub_init_symbolic(int m, int nnz, double * csrVal, int * csrRowPtr, int * csrColInd, const int blocksize);

      void cuda_ilub_init_numeric(double * csrVal, int * csrRowPtr, int * csrColInd, void * vinfo);

      void cuda_ilub_done_symbolic(void * vinfo);


      /**
       * \brief Symbolic core of the ILU(p) factorization
       *
       * This class stores the sparsity patterns of the strictly lower part L and of the
       * strictly upper part U as two separate CSR structures (row-pointer + column-index
       * arrays). The main diagonal is not stored in the pattern; it is accounted for as
       * one entry per row (see get_nnze()).
       *
       * \tparam IT_
       * The index type used for the row-pointer and column-index arrays.
       */
      template<typename IT_>
      class ILUCoreSymbolic
      {
      protected:
        /// number of rows; zero-initialized so that get_nnze() is well-defined before a structure is set
        IT_ _n = IT_(0);
        /// row-pointer and column-index arrays of the strictly lower part L
        std::vector<IT_> _row_ptr_l, _col_idx_l;
        /// row-pointer and column-index arrays of the strictly upper part U
        std::vector<IT_> _row_ptr_u, _col_idx_u;

      public:
        /// Resets the row count to zero and empties all structure arrays.
        void clear()
        {
          _n = IT_(0);
          _row_ptr_l.clear();
          _col_idx_l.clear();
          _row_ptr_u.clear();
          _col_idx_u.clear();
        }

        /// \returns The number of entries in the pattern of L (0 if no structure is set).
        IT_ get_nnze_l() const
        {
          return _row_ptr_l.empty() ? IT_(0) : _row_ptr_l.back();
        }

        /// \returns The number of entries in the pattern of U (0 if no structure is set).
        IT_ get_nnze_u() const
        {
          return _row_ptr_u.empty() ? IT_(0) : _row_ptr_u.back();
        }

        /// \returns The total number of entries: one diagonal entry per row plus the entries of L and U.
        IT_ get_nnze() const
        {
          return _n + get_nnze_l() + get_nnze_u();
        }

        /// \returns The number of bytes occupied by the elements of the four structure arrays.
        std::size_t bytes_symbolic() const
        {
          return sizeof(IT_) * (_row_ptr_l.size() + _row_ptr_u.size() + _col_idx_l.size() + _col_idx_u.size());
        }

        /**
         * \brief Splits the CSR pattern of a matrix A into the level-0 patterns of L and U.
         *
         * In each row i, all leading entries with a column index below i go to L, the next
         * entry has to be the diagonal entry (column index i) and all remaining entries go to U.
         *
         * \param[in] n
         * The number of rows of A.
         *
         * \param[in] row_ptr_a
         * The row-pointer array of A; entries 0..n are read.
         *
         * \param[in] col_idx_a
         * The column-index array of A.
         *
         * \throws InvalidMatrixStructureException
         * If a row does not contain its diagonal entry at the position right after its
         * leading sub-diagonal entries.
         */
        void set_struct_csr(const IT_ n, const IT_* row_ptr_a, const IT_* col_idx_a)
        {
          // First of all, let's guess the number of non-zeros for L and U:
          // In most of our cases, the sparsity pattern of A is symmetric,
          // so we have a guess of (nz(A)-n)/2 for both L and U:
          const IT_ nzul = (Math::max(row_ptr_a[n], n) - n) / IT_(2);

          // store size and clear containers
          _n = n;
          _row_ptr_l.clear();
          _col_idx_l.clear();
          _row_ptr_u.clear();
          _col_idx_u.clear();

          // reserve our non-zero guess
          _row_ptr_l.reserve(n+1);
          _row_ptr_u.reserve(n+1);
          _col_idx_l.reserve(nzul);
          _col_idx_u.reserve(nzul);

          // initialize row-pointers
          _row_ptr_l.push_back(0);
          _row_ptr_u.push_back(0);

          // loop over all matrix rows
          for(IT_ i(0); i < n; ++i)
          {
            IT_ j = row_ptr_a[i];
            const IT_ jend = row_ptr_a[i+1];

            // leading entries left of the diagonal belong to L
            for(; (j < jend) && (col_idx_a[j] < i); ++j)
            {
              _col_idx_l.push_back(col_idx_a[j]);
            }

            // The next entry must be the diagonal. If j == jend, the row ended before the
            // diagonal was reached; this has to be tested first, because col_idx_a[j] would
            // then be an entry of the next row or lie beyond the end of the array.
            if((j >= jend) || (col_idx_a[j] != i))
              throw InvalidMatrixStructureException();

            // all entries behind the diagonal belong to U
            for(++j; j < jend; ++j)
            {
              _col_idx_u.push_back(col_idx_a[j]);
            }

            _row_ptr_l.push_back(IT_(_col_idx_l.size()));
            _row_ptr_u.push_back(IT_(_col_idx_u.size()));
          }
        }

        /// Sets the level-0 structure from the row-pointer and column-index arrays of a CSR matrix.
        template<typename DT_>
        void set_struct(const LAFEM::SparseMatrixCSR<DT_, IT_>& matrix)
        {
          this->set_struct_csr(IT_(matrix.rows()), matrix.row_ptr(), matrix.col_ind());
        }

        /// Sets the level-0 structure from the row-pointer and column-index arrays of a BCSR matrix.
        template<typename DT_, int m_, int n_>
        void set_struct(const LAFEM::SparseMatrixBCSR<DT_, IT_, m_, n_>& matrix)
        {
          this->set_struct_csr(IT_(matrix.rows()), matrix.row_ptr(), matrix.col_ind());
        }

        /**
         * \brief Extends the current patterns of L and U by fill-in entries up to level p.
         *
         * All currently stored entries are treated as level 0. For an entry L_ij of level lj and
         * an entry U_jk of level lk, the entry (i,k) receives the level lj + lk + 1 and is added
         * to L (k < i) or U (k > i) if that level does not exceed p.
         *
         * \param[in] p
         * The maximum level of fill-in; for p < 1 the patterns are left untouched.
         */
        void factorize_symbolic(const int p)
        {
          if(p < 1)
            return;

          // our new level-p structures for L and U
          std::vector<IT_> new_ptr_l, new_idx_l, new_ptr_u, new_idx_u;

          // our temporary level arrays
          std::vector<int> new_lvl_l, new_lvl_u;

          // every existing entry is kept, so the current sizes are lower bounds for the new ones
          new_ptr_l.reserve(_row_ptr_l.size());
          new_ptr_u.reserve(_row_ptr_u.size());
          new_idx_l.reserve(_col_idx_l.size());
          new_idx_u.reserve(_col_idx_u.size());
          new_lvl_l.reserve(_col_idx_l.size());
          new_lvl_u.reserve(_col_idx_u.size());

          // initialize new row pointers
          new_ptr_l.push_back(IT_(0));
          new_ptr_u.push_back(IT_(0));

          // loop over all rows
          for(IT_ i(0); i < _n; ++i)
          {
            // first off, add all level 0 entries to L and U
            for(IT_ j(_row_ptr_l[i]); j < _row_ptr_l[i+1]; ++j)
            {
              new_idx_l.push_back(_col_idx_l[j]);
              new_lvl_l.push_back(0);
            }
            for(IT_ j(_row_ptr_u[i]); j < _row_ptr_u[i+1]; ++j)
            {
              new_idx_u.push_back(_col_idx_u[j]);
              new_lvl_u.push_back(0);
            }

            // loop over row L_i; the size is re-evaluated in every iteration on purpose,
            // because _insert may append fill-in entries to this very row
            for(IT_ j(new_ptr_l[i]); j < IT_(new_idx_l.size()); ++j)
            {
              // get column index and level of L_ij
              const IT_ cj = new_idx_l[j];
              const int lj = new_lvl_l[j];

              // search start positions for the insertion into row i of L and U
              IT_ olj = j;
              IT_ ouj = new_ptr_u[i];

              // loop over row U_j
              for(IT_ k(new_ptr_u[cj]); k < new_ptr_u[cj+1]; ++k)
              {
                // get column index and level of U_jk
                const IT_ ck = new_idx_u[k];
                const int lk = new_lvl_u[k];

                // compute level of entry L/U_ik
                const int ll = lj + lk + 1;
                if(ll > p)
                  continue;

                // insert into L or U; the diagonal (ck == i) is not part of either pattern
                if(ck < i)
                  olj = _insert(new_idx_l, new_lvl_l, olj, ck, ll);
                else if(ck > i)
                  ouj = _insert(new_idx_u, new_lvl_u, ouj, ck, ll);
              }
            }

            // update row-pointers
            new_ptr_l.push_back(IT_(new_idx_l.size()));
            new_ptr_u.push_back(IT_(new_idx_u.size()));
          }

          // replace old arrays
          _row_ptr_l = std::move(new_ptr_l);
          _col_idx_l = std::move(new_idx_l);
          _row_ptr_u = std::move(new_ptr_u);
          _col_idx_u = std::move(new_idx_u);
        }

      protected:
        /**
         * \brief Inserts a column index into the last (still open) row of a pattern.
         *
         * \param[in,out] idx
         * The column-index vector; the row being built extends to its end.
         *
         * \param[in,out] lvl
         * The level vector running parallel to \p idx.
         *
         * \param[in] i
         * The position in \p idx at which the search starts.
         *
         * \param[in] j
         * The column index to be inserted.
         *
         * \param[in] l
         * The level of the entry to be inserted.
         *
         * \returns
         * The position right behind the found or inserted entry, i.e. the search start
         * position for the next insertion with a larger column index.
         */
        static IT_ _insert(std::vector<IT_>& idx, std::vector<int>& lvl, IT_ i, const IT_ j, const int l)
        {
          // get the current length of the column-index vector
          const IT_ n = IT_(idx.size());

          // loop over the row and try to find our entry
          for(; i < n; ++i)
          {
            if(idx[i] == j)
            {
              // the entry that we want to add already exists in the sparsity pattern,
              // so check whether we need to adapt its level
              if(l < lvl[i])
                lvl[i] = l;

              // return next entry starting position
              return ++i;
            }

            // we have reached a column index beyond the entry we want to add,
            // so stop searching
            if(j < idx[i])
              break;
          }

          // the entry we want to add does not yet exist in the sparsity pattern,
          // so we insert it at position i, shifting all following entries back by one
          idx.insert(idx.begin() + typename std::vector<IT_>::difference_type(i), j);
          lvl.insert(lvl.begin() + std::vector<int>::difference_type(i), l);

          // return next entry starting position
          return ++i;
        }
      }; // class ILUCoreSymbolic


      /**
       * \brief Numeric ILU core for scalar matrices
       *
       * Adds the value arrays for L, U and the main diagonal to the patterns stored in
       * ILUCoreSymbolic and implements the numeric factorization as well as the
       * triangular solves (plain and transposed).
       *
       * \tparam DT_ The data type of the matrix values.
       * \tparam IT_ The index type of the structure arrays.
       */
      template<typename DT_, typename IT_>
      class ILUCoreScalar :
        public ILUCoreSymbolic<IT_>
      {
      protected:
        typedef ILUCoreSymbolic<IT_> BaseClass;

        // values of L and U (parallel to the column-index arrays of the base class)
        // and of the main diagonal (one value per row)
        std::vector<DT_> _data_l, _data_u, _data_d;

      public:
        /// Releases the numeric data as well as the symbolic structure.
        void clear()
        {
          _data_d.clear();
          _data_u.clear();
          _data_l.clear();
          BaseClass::clear();
        }

        /// Sizes the value arrays to match the current symbolic structure.
        void alloc_data()
        {
          _data_l.resize(this->_col_idx_l.size());
          _data_u.resize(this->_col_idx_u.size());
          _data_d.resize(this->_n);
        }

        /// \returns The number of bytes occupied by the elements of the three value arrays.
        std::size_t bytes_numeric() const
        {
          const std::size_t num_values = _data_l.size() + _data_u.size() + _data_d.size();
          return sizeof(DT_) * num_values;
        }

        /// \returns The sum of bytes_numeric() and bytes_symbolic().
        std::size_t bytes() const
        {
          return this->bytes_symbolic() + this->bytes_numeric();
        }

        /**
         * \brief Copies the values of a CSR matrix A into the L/D/U value arrays.
         *
         * Pattern entries of L and U without a matching entry in A are set to zero.
         *
         * \param[in] row_ptr_a The row-pointer array of A.
         * \param[in] col_idx_a The column-index array of A.
         * \param[in] data_a The value array of A.
         */
        void copy_data_csr(const IT_* row_ptr_a, const IT_* col_idx_a, const DT_* data_a)
        {
          const IT_ num_rows = this->_n;
          for(IT_ row(0); row < num_rows; ++row)
          {
            // current read position and end position within row 'row' of A
            IT_ pos_a = row_ptr_a[row];
            const IT_ end_a = row_ptr_a[row+1];

            // lower part: take the value from A if the column matches, zero otherwise
            const IT_ end_l = this->_row_ptr_l[row+1];
            for(IT_ q(this->_row_ptr_l[row]); q < end_l; ++q)
            {
              if(this->_col_idx_l[q] != col_idx_a[pos_a])
                _data_l[q] = DT_(0);
              else
                _data_l[q] = data_a[pos_a++];
            }

            // the read position now refers to the diagonal entry of A
            _data_d[row] = data_a[pos_a++];

            // upper part: same as above, but A's row may already be exhausted
            const IT_ end_u = this->_row_ptr_u[row+1];
            for(IT_ q(this->_row_ptr_u[row]); q < end_u; ++q)
            {
              if((pos_a >= end_a) || (this->_col_idx_u[q] != col_idx_a[pos_a]))
                _data_u[q] = DT_(0);
              else
                _data_u[q] = data_a[pos_a++];
            }
          }
        }

        /// Copies the values of the given CSR matrix by forwarding its arrays to copy_data_csr().
        void copy_data(const LAFEM::SparseMatrixCSR<DT_, IT_>& matrix)
        {
          this->copy_data_csr(matrix.row_ptr(), matrix.col_ind(), matrix.val());
        }

        /**
         * \brief Performs the in-place numeric factorization on the stored pattern.
         *
         * On exit, the diagonal array holds the reciprocals of the pivots, so that the
         * solve functions multiply by the stored diagonal instead of dividing.
         */
        void factorize_numeric_il_du()
        {
          // fetch raw arrays; the index/value arrays of L and U may be empty
          const IT_* const ptr_l = this->_row_ptr_l.data();
          const IT_* const ptr_u = this->_row_ptr_u.data();
          const IT_* const col_l = (!this->_col_idx_l.empty() ? this->_col_idx_l.data() : nullptr);
          const IT_* const col_u = (!this->_col_idx_u.empty() ? this->_col_idx_u.data() : nullptr);
          DT_* const val_l = (!this->_data_l.empty() ? this->_data_l.data() : nullptr);
          DT_* const val_u = (!this->_data_u.empty() ? this->_data_u.data() : nullptr);
          DT_* const val_d = this->_data_d.data();

          const IT_ num_rows = this->_n;
          for(IT_ row(0); row < num_rows; ++row)
          {
            // end positions of row 'row' in L and U
            const IT_ end_l = ptr_l[row+1];
            const IT_ end_u = ptr_u[row+1];

            // eliminate with every entry L_ij of the current row
            for(IT_ jl(ptr_l[row]); jl < end_l; ++jl)
            {
              // pivot row index and the end of that row in U
              const IT_ piv = col_l[jl];
              const IT_ end_piv = ptr_u[piv+1];

              // running positions in row 'row' of L and U
              IT_ scan_l = jl;
              IT_ scan_u = ptr_u[row];

              // scale L_ij by the (already inverted) pivot
              DT_& l_ij = val_l[jl];
              l_ij *= val_d[piv];

              // part of the pivot row left of column 'row': update row 'row' of L
              IT_ ku = ptr_u[piv];
              while((ku < end_piv) && (col_u[ku] < row))
              {
                const IT_ col = col_u[ku];
                while((scan_l < end_l) && (col_l[scan_l] <= col))
                {
                  if(col_l[scan_l] == col)
                    val_l[scan_l] -= l_ij * val_u[ku];
                  ++scan_l;
                }
                ++ku;
              }

              // entry of the pivot row in column 'row': update the diagonal
              if((ku < end_piv) && (col_u[ku] == row))
              {
                val_d[row] -= l_ij * val_u[ku];
                ++ku;
              }

              // remainder of the pivot row: update row 'row' of U
              for(; ku < end_piv; ++ku)
              {
                const IT_ col = col_u[ku];
                while((scan_u < end_u) && (col_u[scan_u] <= col))
                {
                  if(col_u[scan_u] == col)
                    val_u[scan_u] -= l_ij * val_u[ku];
                  ++scan_u;
                }
              }
            }

            // store the reciprocal of the pivot
            val_d[row] = DT_(1) / val_d[row];
          }
        }

        /**
         * \brief Forward substitution with L and an implicit unit diagonal.
         *
         * Computes x_i = b_i - sum_j L_ij * x_j row by row in ascending order.
         *
         * \param[out] x The solution array.
         * \param[in] b The right-hand side array.
         */
        void solve_il(DT_* x, const DT_* b) const
        {
          const IT_* const ptr = this->_row_ptr_l.data();
          const IT_* const col = (!this->_col_idx_l.empty() ? this->_col_idx_l.data() : nullptr);
          const DT_* const val = (!this->_data_l.empty() ? this->_data_l.data() : nullptr);

          const IT_ num_rows = this->_n;
          for(IT_ row(0); row < num_rows; ++row)
          {
            DT_ acc(b[row]);
            const IT_ last = ptr[row+1];
            for(IT_ q(ptr[row]); q < last; ++q)
            {
              acc -= val[q] * x[col[q]];
            }
            x[row] = acc;
          }
        }

        /**
         * \brief Backward substitution with U and the stored diagonal.
         *
         * Computes x_i = d_i * (b_i - sum_j U_ij * x_j) row by row in descending order,
         * where d_i is the stored diagonal value.
         *
         * \param[out] x The solution array.
         * \param[in] b The right-hand side array.
         */
        void solve_du(DT_* x, const DT_* b) const
        {
          const IT_* const ptr = this->_row_ptr_u.data();
          const IT_* const col = (!this->_col_idx_u.empty() ? this->_col_idx_u.data() : nullptr);
          const DT_* const val = (!this->_data_u.empty() ? this->_data_u.data() : nullptr);
          const DT_* const diag = this->_data_d.data();

          IT_ row(this->_n);
          while(row > IT_(0))
          {
            --row;
            DT_ acc(b[row]);
            const IT_ last = ptr[row+1];
            for(IT_ q(ptr[row]); q < last; ++q)
            {
              acc -= val[q] * x[col[q]];
            }
            x[row] = diag[row] * acc;
          }
        }

        /**
         * \brief Transposed counterpart of solve_il().
         *
         * Copies b to x (unless both are the same array) and then processes the rows of L
         * in descending order, subtracting L_ij * x_i from x_j.
         *
         * \param[in,out] x The solution array.
         * \param[in] b The right-hand side array.
         */
        void solve_ilt(DT_* x, const DT_* b) const
        {
          const IT_* const ptr = this->_row_ptr_l.data();
          const IT_* const col = (!this->_col_idx_l.empty() ? this->_col_idx_l.data() : nullptr);
          const DT_* const val = (!this->_data_l.empty() ? this->_data_l.data() : nullptr);

          const IT_ num_rows = this->_n;

          // start from the right-hand side
          if(x != b)
          {
            for(IT_ row(0); row < num_rows; ++row)
            {
              x[row] = b[row];
            }
          }

          IT_ row(num_rows);
          while(row > IT_(0))
          {
            --row;
            const IT_ last = ptr[row+1];
            for(IT_ q(ptr[row]); q < last; ++q)
            {
              // scatter: x_j -= L_ij * x_i
              x[col[q]] -= val[q] * x[row];
            }
          }
        }

        /**
         * \brief Transposed counterpart of solve_du().
         *
         * Copies b to x (unless both are the same array) and then processes the rows of U
         * in ascending order: x_i is scaled by the stored diagonal value and U_ij * x_i is
         * subtracted from x_j.
         *
         * \param[in,out] x The solution array.
         * \param[in] b The right-hand side array.
         */
        void solve_dut(DT_* x, const DT_* b) const
        {
          const IT_* const ptr = this->_row_ptr_u.data();
          const IT_* const col = (!this->_col_idx_u.empty() ? this->_col_idx_u.data() : nullptr);
          const DT_* const val = (!this->_data_u.empty() ? this->_data_u.data() : nullptr);
          const DT_* const diag = this->_data_d.data();

          const IT_ num_rows = this->_n;

          // start from the right-hand side
          if(x != b)
          {
            for(IT_ row(0); row < num_rows; ++row)
            {
              x[row] = b[row];
            }
          }

          for(IT_ row(0); row < num_rows; ++row)
          {
            x[row] *= diag[row];
            const IT_ last = ptr[row+1];
            for(IT_ q(ptr[row]); q < last; ++q)
            {
              // scatter: x_j -= U_ij * x_i
              x[col[q]] -= val[q] * x[row];
            }
          }
        }
      }; // class ILUCoreScalar


      /**
       * \brief Numeric ILU core for matrices with square dim_ x dim_ blocks
       *
       * Block-valued counterpart of the scalar core: every pattern entry of L, U and the
       * diagonal carries a Tiny::Matrix block, and the solves operate on Tiny::Vector blocks.
       *
       * \tparam DT_ The data type of the block entries.
       * \tparam IT_ The index type of the structure arrays.
       * \tparam dim_ The block dimension; must be positive.
       */
      template<typename DT_, typename IT_, int dim_>
      class ILUCoreBlocked :
        public ILUCoreSymbolic<IT_>
      {
      protected:
        typedef ILUCoreSymbolic<IT_> BaseClass;

        static_assert(dim_ > 0, "invalid block dimension");

        typedef Tiny::Matrix<DT_, dim_, dim_> MatBlock;
        typedef Tiny::Vector<DT_, dim_> VecBlock;

        // blocks of L and U (parallel to the column-index arrays of the base class)
        // and of the main diagonal (one block per row)
        std::vector<MatBlock> _data_l, _data_u, _data_d;

      public:
        /// Releases the numeric data as well as the symbolic structure.
        void clear()
        {
          _data_d.clear();
          _data_u.clear();
          _data_l.clear();
          BaseClass::clear();
        }

        /// Sizes the block arrays to match the current symbolic structure.
        void alloc_data()
        {
          _data_l.resize(this->_col_idx_l.size());
          _data_u.resize(this->_col_idx_u.size());
          _data_d.resize(this->_n);
        }

        /// \returns sizeof(DT_) times dim_^2 times the total number of stored blocks.
        std::size_t bytes_numeric() const
        {
          const std::size_t num_blocks = _data_l.size() + _data_u.size() + _data_d.size();
          const std::size_t block_entries = std::size_t(Math::sqr(dim_));
          return sizeof(DT_) * block_entries * num_blocks;
        }

        /// \returns The sum of bytes_numeric() and bytes_symbolic().
        std::size_t bytes() const
        {
          return this->bytes_symbolic() + this->bytes_numeric();
        }

        /**
         * \brief Copies the blocks of a BCSR matrix A into the L/D/U block arrays.
         *
         * Pattern entries of L and U without a matching entry in A are assigned DT_(0).
         *
         * \param[in] row_ptr_a The row-pointer array of A.
         * \param[in] col_idx_a The column-index array of A.
         * \param[in] data_a The block array of A.
         */
        void copy_data_bcsr(const IT_* row_ptr_a, const IT_* col_idx_a, const MatBlock* data_a)
        {
          const IT_ num_rows = this->_n;
          for(IT_ row(0); row < num_rows; ++row)
          {
            // current read position and end position within row 'row' of A
            IT_ pos_a = row_ptr_a[row];
            const IT_ end_a = row_ptr_a[row+1];

            // lower part: take the block from A if the column matches, zero otherwise
            const IT_ end_l = this->_row_ptr_l[row+1];
            for(IT_ q(this->_row_ptr_l[row]); q < end_l; ++q)
            {
              if(this->_col_idx_l[q] != col_idx_a[pos_a])
                _data_l[q] = DT_(0);
              else
                _data_l[q] = data_a[pos_a++];
            }

            // the read position now refers to the diagonal block of A
            _data_d[row] = data_a[pos_a++];

            // upper part: same as above, but A's row may already be exhausted
            const IT_ end_u = this->_row_ptr_u[row+1];
            for(IT_ q(this->_row_ptr_u[row]); q < end_u; ++q)
            {
              if((pos_a >= end_a) || (this->_col_idx_u[q] != col_idx_a[pos_a]))
                _data_u[q] = DT_(0);
              else
                _data_u[q] = data_a[pos_a++];
            }
          }
        }

        /// Copies the blocks of the given BCSR matrix by forwarding its arrays to copy_data_bcsr().
        void copy_data(const LAFEM::SparseMatrixBCSR<DT_, IT_, dim_, dim_>& matrix)
        {
          this->copy_data_bcsr(matrix.row_ptr(), matrix.col_ind(), matrix.val());
        }

        /**
         * \brief Performs the in-place numeric block factorization on the stored pattern.
         *
         * On exit, the diagonal array holds the inverses of the pivot blocks (computed via
         * set_inverse), so that the solve functions multiply by the stored diagonal block.
         */
        void factorize_numeric_il_du()
        {
          // fetch raw arrays; the index/block arrays of L and U may be empty
          const IT_* const ptr_l = this->_row_ptr_l.data();
          const IT_* const ptr_u = this->_row_ptr_u.data();
          const IT_* const col_l = (!this->_col_idx_l.empty() ? this->_col_idx_l.data() : nullptr);
          const IT_* const col_u = (!this->_col_idx_u.empty() ? this->_col_idx_u.data() : nullptr);
          MatBlock* const val_l = (!this->_data_l.empty() ? this->_data_l.data() : nullptr);
          MatBlock* const val_u = (!this->_data_u.empty() ? this->_data_u.data() : nullptr);
          MatBlock* const val_d = this->_data_d.data();

          const IT_ num_rows = this->_n;
          for(IT_ row(0); row < num_rows; ++row)
          {
            // end positions of row 'row' in L and U
            const IT_ end_l = ptr_l[row+1];
            const IT_ end_u = ptr_u[row+1];

            // eliminate with every block L_ij of the current row
            for(IT_ jl(ptr_l[row]); jl < end_l; ++jl)
            {
              // pivot row index and the end of that row in U
              const IT_ piv = col_l[jl];
              const IT_ end_piv = ptr_u[piv+1];

              // running positions in row 'row' of L and U
              IT_ scan_l = jl;
              IT_ scan_u = ptr_u[row];

              // L_ij <- D_jj * L_ij, with D_jj being the stored (already inverted) pivot block;
              // the product is formed from a copy because the target is also an operand
              {
                const MatBlock l_old(val_l[jl]);
                val_l[jl].set_mat_mat_mult(val_d[piv], l_old);
              }

              // part of the pivot row left of column 'row': update row 'row' of L
              IT_ ku = ptr_u[piv];
              while((ku < end_piv) && (col_u[ku] < row))
              {
                const IT_ col = col_u[ku];
                while((scan_l < end_l) && (col_l[scan_l] <= col))
                {
                  // L_ik -= L_ij * U_jk
                  if(col_l[scan_l] == col)
                    val_l[scan_l].add_mat_mat_mult(val_l[jl], val_u[ku], -DT_(1));
                  ++scan_l;
                }
                ++ku;
              }

              // entry of the pivot row in column 'row': D_ii -= L_ij * U_ji
              if((ku < end_piv) && (col_u[ku] == row))
              {
                val_d[row].add_mat_mat_mult(val_l[jl], val_u[ku], -DT_(1));
                ++ku;
              }

              // remainder of the pivot row: update row 'row' of U
              for(; ku < end_piv; ++ku)
              {
                const IT_ col = col_u[ku];
                while((scan_u < end_u) && (col_u[scan_u] <= col))
                {
                  // U_ik -= L_ij * U_jk
                  if(col_u[scan_u] == col)
                    val_u[scan_u].add_mat_mat_mult(val_l[jl], val_u[ku], -DT_(1));
                  ++scan_u;
                }
              }
            }

            // replace the pivot block by its inverse, computed from a copy
            {
              const MatBlock d_old(val_d[row]);
              val_d[row].set_inverse(d_old);
            }
          }
        }

        /**
         * \brief Forward substitution with L and an implicit identity diagonal.
         *
         * Computes x_i = b_i - sum_j L_ij * x_j row by row in ascending order.
         *
         * \param[out] x The solution block array.
         * \param[in] b The right-hand side block array.
         */
        void solve_il(VecBlock* x, const VecBlock* b) const
        {
          const IT_* const ptr = this->_row_ptr_l.data();
          const IT_* const col = (!this->_col_idx_l.empty() ? this->_col_idx_l.data() : nullptr);
          const MatBlock* const val = (!this->_data_l.empty() ? this->_data_l.data() : nullptr);

          const IT_ num_rows = this->_n;
          for(IT_ row(0); row < num_rows; ++row)
          {
            VecBlock acc(b[row]);
            const IT_ last = ptr[row+1];
            for(IT_ q(ptr[row]); q < last; ++q)
            {
              // acc -= L_ij * x_j
              acc.add_mat_vec_mult(val[q], x[col[q]], -DT_(1));
            }
            x[row] = acc;
          }
        }

        /**
         * \brief Backward substitution with U and the stored diagonal blocks.
         *
         * Computes x_i = D_i * (b_i - sum_j U_ij * x_j) row by row in descending order,
         * where D_i is the stored diagonal block.
         *
         * \param[out] x The solution block array.
         * \param[in] b The right-hand side block array.
         */
        void solve_du(VecBlock* x, const VecBlock* b) const
        {
          const IT_* const ptr = this->_row_ptr_u.data();
          const IT_* const col = (!this->_col_idx_u.empty() ? this->_col_idx_u.data() : nullptr);
          const MatBlock* const val = (!this->_data_u.empty() ? this->_data_u.data() : nullptr);
          const MatBlock* const diag = this->_data_d.data();

          IT_ row(this->_n);
          while(row > IT_(0))
          {
            --row;
            VecBlock acc(b[row]);
            const IT_ last = ptr[row+1];
            for(IT_ q(ptr[row]); q < last; ++q)
            {
              // acc -= U_ij * x_j
              acc.add_mat_vec_mult(val[q], x[col[q]], -DT_(1));
            }
            // x_i = D_i * acc
            x[row].set_mat_vec_mult(diag[row], acc);
          }
        }
      }; // class ILUCoreBlocked

    } // namespace Intern


    /**
     * \brief Abstract interface shared by all ILU preconditioner backends
     *
     * \tparam Matrix_
     * The matrix type; it has to provide the nested types DataType and VectorTypeL.
     */
    template<typename Matrix_>
    class ILUPrecondBase
    {
    public:
      /// the data type of the matrix
      using DataType = typename Matrix_::DataType;
      /// the vector type the preconditioner is applied to
      using VectorType = typename Matrix_::VectorTypeL;

      /// Sets the fill-in parameter p.
      virtual void set_fill_in_param(int p) = 0;

      /// Symbolic initialization.
      virtual void init_symbolic() = 0;

      /// Symbolic finalization.
      virtual void done_symbolic() = 0;

      /// Numeric initialization.
      virtual void init_numeric() = 0;

      /// \returns The name of the preconditioner.
      virtual String name() const = 0;

      /// Applies the preconditioner to the defect vector and writes the result to the correction vector.
      virtual Status apply(VectorType& vec_cor, const VectorType& vec_def) = 0;

      /// virtual destructor
      virtual ~ILUPrecondBase() = default;
    }; // ILUPrecondBase class


    // Primary template of the backend-specific ILU preconditioner. It is only declared here;
    // the usable implementations are the partial specializations for particular
    // backend / matrix type combinations.
    template<PreferredBackend backend_, typename Matrix_, typename Filter_>

    class ILUPrecondWithBackend;


    /**
     * \brief ILU(p) preconditioner for scalar CSR matrices on the generic backend
     *
     * The preconditioner keeps references to the system matrix and the filter and owns an
     * Intern::ILUCoreScalar object that holds the factorization.
     *
     * \tparam DT_ The data type of the matrix.
     * \tparam IT_ The index type of the matrix.
     * \tparam Filter_ The filter type; its filter_cor() is applied to the result of apply().
     */
    template<typename DT_, typename IT_, typename Filter_>
    class ILUPrecondWithBackend<PreferredBackend::generic, LAFEM::SparseMatrixCSR<DT_, IT_>, Filter_> :
      public ILUPrecondBase<typename LAFEM::SparseMatrixCSR<DT_, IT_>>
    {
    public:
      typedef LAFEM::SparseMatrixCSR<DT_, IT_> MatrixType;
      typedef DT_ DataType;
      typedef IT_ IndexType;
      typedef Filter_ FilterType;
      typedef typename MatrixType::VectorTypeL VectorType;

    protected:
      /// the system matrix (referenced, not owned)
      const MatrixType& _matrix;
      /// the system filter (referenced, not owned)
      const FilterType& _filter;
      /// the factorization core
      Intern::ILUCoreScalar<DataType, IndexType> _ilu;
      /// the fill-in level handed to the symbolic factorization; values below 1 add no fill-in
      int _p;

    public:
      /**
       * \brief Constructor
       *
       * \param[in] matrix The system matrix.
       * \param[in] filter The system filter.
       * \param[in] p The fill-in level; defaults to 0.
       */
      explicit ILUPrecondWithBackend(const MatrixType& matrix, const FilterType& filter, const int p = 0) :
        _matrix(matrix),
        _filter(filter),
        _p(p)
      {
      }

      /**
       * \brief Constructor reading the fill-in level from a PropertyMap section
       *
       * The level is initialized to -1 and overwritten by the value of the key
       * "fill_in_param" if the query reports one.
       *
       * \param[in] section_name The name of the section; only used for the error message.
       * \param[in] section The section to query; it is dereferenced unconditionally.
       * \param[in] matrix The system matrix.
       * \param[in] filter The system filter.
       *
       * \throws ParseError If the queried value cannot be parsed as an int.
       */
      explicit ILUPrecondWithBackend(const String& section_name, const PropertyMap* section,
        const MatrixType& matrix, const FilterType& filter) :
        _matrix(matrix),
        _filter(filter),
        _p(-1)
      {
        auto fill_in_param_p = section->query("fill_in_param");
        if(fill_in_param_p.second && !fill_in_param_p.first.parse(_p))
          throw ParseError(section_name + ".fill_in_param", fill_in_param_p.first, "a non-negative integer");
      }

      virtual ~ILUPrecondWithBackend()
      {
      }

      /**
       * \brief Sets the fill-in level used by the next init_symbolic() call.
       *
       * \param[in] p The fill-in level; must not be negative.
       */
      virtual void set_fill_in_param(int p) override
      {
        // p == 0 (no fill-in) is a valid level: it is the default of the first constructor
        // and the symbolic factorization keeps the matrix pattern for every p < 1, so only
        // negative values are rejected here.
        XASSERT(p >= 0);
        _p = p;
      }

      /// \returns The name of the preconditioner.
      virtual String name() const override
      {
        return "ILU";
      }

      /// Builds the L/U patterns for the current fill-in level and allocates the value arrays.
      virtual void init_symbolic() override
      {
        if (_matrix.columns() != _matrix.rows())
        {
          XABORTM("Matrix is not square!");
        }

        // set matrix structure
        _ilu.set_struct(_matrix);

        // perform symbolic factorization
        _ilu.factorize_symbolic(_p);

        // allocate data arrays
        _ilu.alloc_data();
      }

      /// Releases the patterns and the value arrays.
      virtual void done_symbolic() override
      {
        _ilu.clear();
      }

      /// Copies the current matrix values into the factorization core and factorizes them.
      virtual void init_numeric() override
      {
        _ilu.copy_data(_matrix);
        _ilu.factorize_numeric_il_du();
      }

      /**
       * \brief Applies the preconditioner.
       *
       * \param[out] out The vector receiving the filtered result of the two triangular solves.
       * \param[in] in The input vector.
       *
       * \returns Status::success
       */
      virtual Status apply(VectorType& out, const VectorType& in) override
      {
        TimeStamp ts_start;

        // get vector data arrays
        DataType* x = out.elements();
        const DataType* b = in.elements();

        // solve: (I+L)*y = b
        _ilu.solve_il(x, b);

        // solve: (D+U)*x = y; performed in-place on the output array
        _ilu.solve_du(x, x);

        // apply filter
        this->_filter.filter_cor(out);

        TimeStamp ts_stop;
        Statistics::add_time_precon(ts_stop.elapsed(ts_start));
        Statistics::add_flops(_ilu.get_nnze() * 2 + out.size());

        return Status::success;
      }
    }; // class ILUPrecondWithBackend<generic, SparseMatrixCSR,...>


    /**
     * \brief ILU(p) preconditioner for square-blocked BCSR matrices on the generic backend
     *
     * The preconditioner keeps references to the system matrix and the filter and owns an
     * Intern::ILUCoreBlocked object that holds the block factorization.
     *
     * \tparam DT_ The data type of the matrix.
     * \tparam IT_ The index type of the matrix.
     * \tparam dim_ The block dimension of the matrix.
     * \tparam Filter_ The filter type; its filter_cor() is applied to the result of apply().
     */
    template<typename DT_, typename IT_, int dim_, typename Filter_>
    class ILUPrecondWithBackend<PreferredBackend::generic, LAFEM::SparseMatrixBCSR<DT_, IT_, dim_, dim_>, Filter_> :
      public ILUPrecondBase<typename LAFEM::SparseMatrixBCSR<DT_, IT_, dim_, dim_>>
    {
    public:
      typedef LAFEM::SparseMatrixBCSR<DT_, IT_, dim_, dim_> MatrixType;
      typedef DT_ DataType;
      typedef IT_ IndexType;
      typedef Filter_ FilterType;
      typedef typename MatrixType::VectorTypeL VectorType;

    protected:
      /// the system matrix (referenced, not owned)
      const MatrixType& _matrix;
      /// the system filter (referenced, not owned)
      const FilterType& _filter;
      /// the block factorization core
      Intern::ILUCoreBlocked<DataType, IndexType, dim_> _ilu;
      /// the fill-in level handed to the symbolic factorization; values below 1 add no fill-in
      int _p;

    public:
      /**
       * \brief Constructor
       *
       * \param[in] matrix The system matrix.
       * \param[in] filter The system filter.
       * \param[in] p The fill-in level; defaults to 0.
       */
      explicit ILUPrecondWithBackend(const MatrixType& matrix, const FilterType& filter, const int p = 0) :
        _matrix(matrix),
        _filter(filter),
        _p(p)
      {
      }

      /**
       * \brief Constructor reading the fill-in level from a PropertyMap section
       *
       * The level is initialized to -1 and overwritten by the value of the key
       * "fill_in_param" if the query reports one.
       *
       * \param[in] section_name The name of the section; only used for the error message.
       * \param[in] section The section to query; it is dereferenced unconditionally.
       * \param[in] matrix The system matrix.
       * \param[in] filter The system filter.
       *
       * \throws ParseError If the queried value cannot be parsed as an int.
       */
      explicit ILUPrecondWithBackend(const String& section_name, const PropertyMap* section,
        const MatrixType& matrix, const FilterType& filter) :
        _matrix(matrix),
        _filter(filter),
        _p(-1)
      {
        auto fill_in_param_p = section->query("fill_in_param");
        if(fill_in_param_p.second && !fill_in_param_p.first.parse(_p))
          throw ParseError(section_name + ".fill_in_param", fill_in_param_p.first, "a non-negative integer");
      }

      virtual ~ILUPrecondWithBackend()
      {
      }

      /**
       * \brief Sets the fill-in level used by the next init_symbolic() call.
       *
       * \param[in] p The fill-in level; must not be negative.
       */
      virtual void set_fill_in_param(int p) override
      {
        // p == 0 (no fill-in) is a valid level: it is the default of the first constructor
        // and the symbolic factorization keeps the matrix pattern for every p < 1, so only
        // negative values are rejected here.
        XASSERT(p >= 0);
        _p = p;
      }

      /// \returns The name of the preconditioner.
      virtual String name() const override
      {
        return "ILU";
      }

      /// Builds the L/U patterns for the current fill-in level and allocates the block arrays.
      virtual void init_symbolic() override
      {
        if (_matrix.columns() != _matrix.rows())
        {
          XABORTM("Matrix is not square!");
        }

        // set matrix structure
        _ilu.set_struct(_matrix);

        // perform symbolic factorization
        _ilu.factorize_symbolic(_p);

        // allocate data arrays
        _ilu.alloc_data();
      }

      /// Releases the patterns and the block arrays.
      virtual void done_symbolic() override
      {
        _ilu.clear();
      }

      /// Copies the current matrix blocks into the factorization core and factorizes them.
      virtual void init_numeric() override
      {
        _ilu.copy_data(_matrix);
        _ilu.factorize_numeric_il_du();
      }

      /**
       * \brief Applies the preconditioner.
       *
       * \param[out] out The vector receiving the filtered result of the two triangular solves.
       * \param[in] in The input vector.
       *
       * \returns Status::success
       */
      virtual Status apply(VectorType& out, const VectorType& in) override
      {
        TimeStamp ts_start;

        // get vector data arrays
        auto* x = out.elements();
        const auto* b = in.elements();

        // solve: (I+L)*y = b
        _ilu.solve_il(x, b);

        // solve: (D+U)*x = y; performed in-place on the output array
        _ilu.solve_du(x, x);

        // apply filter
        this->_filter.filter_cor(out);

        TimeStamp ts_stop;
        Statistics::add_time_precon(ts_stop.elapsed(ts_start));
        Statistics::add_flops(_ilu.get_nnze() * 2 + out.size());

        return Status::success;
      }
    }; // class ILUPrecondWithBackend<generic, SparseMatrixBCSR<...>,...>


#ifdef FEAT_HAVE_CUDA

    /**
     * \brief ILU preconditioner specialization for the CUDA backend and scalar CSR matrices
     *
     * This specialization keeps a private copy of the system matrix and
     * forwards all factorization work to the Intern::cuda_ilu_* functions.
     * Only a fill-in parameter of 0 is accepted.
     *
     * The opaque handle returned by Intern::cuda_ilu_init_symbolic is stored
     * in #cuda_info; it is a null pointer whenever no symbolic factorization
     * is alive, so that done_symbolic() can be called safely at any time.
     *
     * \tparam Filter_
     * The type of the system filter.
     */
    template<typename Filter_>
    class ILUPrecondWithBackend<PreferredBackend::cuda, LAFEM::SparseMatrixCSR<double, unsigned int>, Filter_> :
      public ILUPrecondBase<LAFEM::SparseMatrixCSR<double, unsigned int>>
    {
    public:
      typedef LAFEM::SparseMatrixCSR<double, unsigned int> MatrixType;
      typedef Filter_ FilterType;
      typedef typename MatrixType::VectorTypeL VectorType;
      typedef typename MatrixType::DataType DataType;

    protected:
      /// reference to the system matrix
      const MatrixType& _matrix;
      /// private copy of the system matrix that is handed to the CUDA routines
      MatrixType _lu_matrix;
      /// reference to the system filter
      const FilterType& _filter;
      /// opaque handle of the symbolic factorization; nullptr if there is none
      void * cuda_info;

    public:
      /**
       * \brief Constructor
       *
       * \param[in] matrix
       * The system matrix; only a reference is stored.
       *
       * \param[in] filter
       * The system filter; only a reference is stored.
       *
       * The third, unnamed parameter is ignored; it merely mirrors the
       * signature of the other backends.
       */
      explicit ILUPrecondWithBackend(const MatrixType& matrix, const FilterType& filter, const int = 0) :
        _matrix(matrix),
        _filter(filter),
        cuda_info(nullptr)
      {
      }

      /**
       * \brief Constructor using a PropertyMap
       *
       * \param[in] section_name
       * The name of the config section; used to compose the location string
       * of a potential ParseError.
       *
       * \param[in] section
       * The section that is queried for the optional key \c fill_in_param.
       *
       * \param[in] matrix
       * The system matrix; only a reference is stored.
       *
       * \param[in] filter
       * The system filter; only a reference is stored.
       *
       * \throws ParseError
       * if the key exists but its value cannot be parsed as an integer.
       */
      explicit ILUPrecondWithBackend(const String& section_name, const PropertyMap* section,
        const MatrixType& matrix, const FilterType& filter) :
        _matrix(matrix),
        _filter(filter),
        cuda_info(nullptr)
      {
        // the fill-in parameter is optional, but if given it has to be 0
        auto fill_in_param_p = section->query("fill_in_param");
        if(fill_in_param_p.second)
        {
          // parse in the same way as the generic backend, so that malformed
          // input is reported as a ParseError instead of an exception from std::stoi
          int p(0);
          if(!fill_in_param_p.first.parse(p))
            throw ParseError(section_name + ".fill_in_param", fill_in_param_p.first, "a non-negative integer");

          XASSERTM(p == 0, "For PreferredBackend::cuda, the fill in parameter has to be == 0!");
        }
      }

      /// Virtual destructor; the factorization handle is released by done_symbolic().
      virtual ~ILUPrecondWithBackend()
      {
      }

      /**
       * \brief Sets the fill-in parameter
       *
       * \param[in] p
       * The fill-in parameter; this backend only accepts the value 0.
       */
      virtual void set_fill_in_param(int p) override
      {
        XASSERTM(p == 0, "For PreferredBackend::cuda, the fill in parameter has to be == 0!");
      }

      /// Returns the name of the solver.
      virtual String name() const override
      {
        return "ILU";
      }

      /**
       * \brief Symbolic initialization
       *
       * Aborts if the matrix is not square. Otherwise clones the layout of
       * the system matrix into the private copy and creates the symbolic
       * factorization handle.
       */
      virtual void init_symbolic() override
      {
        if (_matrix.columns() != _matrix.rows())
        {
          XABORTM("Matrix is not square!");
        }

        _lu_matrix.clone(_matrix, LAFEM::CloneMode::Layout);

        // note: sizes are narrowed to int and the unsigned index arrays are
        // reinterpreted as int arrays, as required by the Intern interface
        cuda_info = Intern::cuda_ilu_init_symbolic(
          (int)_lu_matrix.rows(),
          (int)_lu_matrix.used_elements(),
          _lu_matrix.val(),
          (int*)_lu_matrix.row_ptr(),
          (int*)_lu_matrix.col_ind());
      }

      /**
       * \brief Symbolic finalization
       *
       * Releases the factorization handle if there is one. Calling this
       * method without a preceding init_symbolic(), or calling it twice,
       * does nothing.
       */
      virtual void done_symbolic() override
      {
        if(cuda_info != nullptr)
        {
          Intern::cuda_ilu_done_symbolic(cuda_info);
          // forget the handle so that it can never be released twice
          cuda_info = nullptr;
        }
      }

      /**
       * \brief Numeric initialization
       *
       * Copies the current values of the system matrix into the private
       * copy and runs the numeric factorization on it.
       */
      virtual void init_numeric() override
      {
        _lu_matrix.copy(_matrix);

        Intern::cuda_ilu_init_numeric(
          _lu_matrix.val(),
          (int*)_lu_matrix.row_ptr(),
          (int*)_lu_matrix.col_ind(),
          cuda_info);
      }

      /**
       * \brief Applies the preconditioner
       *
       * \param[out] vec_cor
       * The vector that receives the preconditioned result.
       *
       * \param[in] vec_def
       * The vector that is to be preconditioned.
       *
       * \returns Status::success if Intern::cuda_ilu_apply returned 0,
       * otherwise Status::aborted. The filter and the statistics are
       * updated in both cases.
       */
      virtual Status apply(VectorType& vec_cor, const VectorType& vec_def) override
      {
        XASSERTM(_matrix.rows() == vec_cor.size(), "matrix / vector size mismatch!");
        XASSERTM(_matrix.rows() == vec_def.size(), "matrix / vector size mismatch!");

        TimeStamp ts_start;

        int status = Intern::cuda_ilu_apply(
          vec_cor.elements(),
          vec_def.elements(),
          _lu_matrix.val(),
          (int*)_lu_matrix.row_ptr(),
          (int*)_lu_matrix.col_ind(),
          cuda_info);

        this->_filter.filter_cor(vec_cor);

        TimeStamp ts_stop;
        Statistics::add_time_precon(ts_stop.elapsed(ts_start));
        Statistics::add_flops(_matrix.used_elements() * 2 + vec_cor.size());

        return (status == 0) ? Status::success :  Status::aborted;
      }
    }; // class ILUPrecondWithBackend<cuda, SparseMatrixCSR<...>,...>


    /*

    template<typename Filter_>

    class ILUPrecond<LAFEM::SparseMatrixCSR<Mem::CUDA, float, unsigned int>, Filter_> :

      public SolverBase<LAFEM::SparseMatrixCSR<Mem::CUDA, float, unsigned int>::VectorTypeL>

    {

      public:

      typedef LAFEM::SparseMatrixCSR<Mem::CUDA, float, unsigned int> MatrixType;

      typedef typename MatrixType::VectorTypeL VectorType;

      typedef Filter_ FilterType;


      explicit ILUPrecond(const MatrixType&, const FilterType&, const int = 0)

      {

      }


      Status apply(VectorType &, const VectorType &) override

      {

          XABORTM("not implemented yet!");

      }


      String name() const override

      {

          XABORTM("not implemented yet!");

      }

    };


    template<typename Filter_>

    class ILUPrecond<LAFEM::SparseMatrixCSR<Mem::CUDA, float, unsigned long>, Filter_> :

      public SolverBase<LAFEM::SparseMatrixCSR<Mem::CUDA, float, unsigned long>::VectorTypeL>

    {

      public:

      typedef LAFEM::SparseMatrixCSR<Mem::CUDA, float, unsigned long> MatrixType;

      typedef typename MatrixType::VectorTypeL VectorType;

      typedef Filter_ FilterType;


      explicit ILUPrecond(const MatrixType&, const FilterType&, const int = 0)

      {

      }


      Status apply(VectorType &, const VectorType &) override

      {

          XABORTM("not implemented yet!");

      }


      String name() const override

      {

          XABORTM("not implemented yet!");

      }

    };


    template<typename Filter_>

    class ILUPrecond<LAFEM::SparseMatrixCSR<Mem::CUDA, double, unsigned long>, Filter_> :

      public SolverBase<LAFEM::SparseMatrixCSR<Mem::CUDA, double, unsigned long>::VectorTypeL>

    {

      public:

      typedef LAFEM::SparseMatrixCSR<Mem::CUDA, double, unsigned long> MatrixType;

      typedef typename MatrixType::VectorTypeL VectorType;

      typedef Filter_ FilterType;


      explicit ILUPrecond(const MatrixType&, const FilterType&, const int = 0)

      {

      }


      Status apply(VectorType &, const VectorType &) override

      {

          XABORTM("not implemented yet!");

      }


      String name() const override

      {

          XABORTM("not implemented yet!");

      }

    };*/


    /**
     * \brief ILU preconditioner specialization for the CUDA backend and square-blocked BCSR matrices
     *
     * This specialization keeps a private copy of the system matrix and
     * forwards all factorization work to the Intern::cuda_ilub_* functions.
     * Only a fill-in parameter of 0 is accepted.
     *
     * The opaque handle returned by Intern::cuda_ilub_init_symbolic is
     * stored in #cuda_info; it is a null pointer whenever no symbolic
     * factorization is alive, so that done_symbolic() can be called safely
     * at any time.
     *
     * \tparam Filter_
     * The type of the system filter.
     *
     * \tparam blocksize_
     * The height and width of the matrix blocks.
     */
    template<typename Filter_, int blocksize_>
    class ILUPrecondWithBackend<PreferredBackend::cuda, LAFEM::SparseMatrixBCSR<double, unsigned int, blocksize_, blocksize_>, Filter_> :
      public ILUPrecondBase<typename LAFEM::SparseMatrixBCSR<double, unsigned int, blocksize_, blocksize_>>
    {
    public:
      typedef LAFEM::SparseMatrixBCSR<double, unsigned int, blocksize_, blocksize_> MatrixType;
      typedef Filter_ FilterType;
      typedef typename MatrixType::VectorTypeL VectorType;
      typedef typename MatrixType::DataType DataType;

    protected:
      /// reference to the system matrix
      const MatrixType& _matrix;
      /// private copy of the system matrix that is handed to the CUDA routines
      MatrixType _lu_matrix;
      /// reference to the system filter
      const FilterType& _filter;
      /// opaque handle of the symbolic factorization; nullptr if there is none
      void * cuda_info;

    public:
      /**
       * \brief Constructor
       *
       * \param[in] matrix
       * The system matrix; only a reference is stored.
       *
       * \param[in] filter
       * The system filter; only a reference is stored.
       *
       * The third, unnamed parameter is ignored; it merely mirrors the
       * signature of the other backends.
       */
      explicit ILUPrecondWithBackend(const MatrixType& matrix, const FilterType& filter, const int = 0) :
        _matrix(matrix),
        _filter(filter),
        cuda_info(nullptr)
      {
      }

      /**
       * \brief Constructor using a PropertyMap
       *
       * \param[in] section_name
       * The name of the config section; used to compose the location string
       * of a potential ParseError.
       *
       * \param[in] section
       * The section that is queried for the optional key \c fill_in_param.
       *
       * \param[in] matrix
       * The system matrix; only a reference is stored.
       *
       * \param[in] filter
       * The system filter; only a reference is stored.
       *
       * \throws ParseError
       * if the key exists but its value cannot be parsed as an integer.
       */
      explicit ILUPrecondWithBackend(const String& section_name, const PropertyMap* section,
        const MatrixType& matrix, const FilterType& filter) :
        _matrix(matrix),
        _filter(filter),
        cuda_info(nullptr)
      {
        // the fill-in parameter is optional, but if given it has to be 0
        auto fill_in_param_p = section->query("fill_in_param");
        if(fill_in_param_p.second)
        {
          // parse in the same way as the generic backend, so that malformed
          // input is reported as a ParseError instead of an exception from std::stoi
          int p(0);
          if(!fill_in_param_p.first.parse(p))
            throw ParseError(section_name + ".fill_in_param", fill_in_param_p.first, "a non-negative integer");

          XASSERTM(p == 0, "For PreferredBackend::cuda, the fill in parameter has to be == 0!");
        }
      }

      /// Virtual destructor; the factorization handle is released by done_symbolic().
      virtual ~ILUPrecondWithBackend()
      {
      }

      /**
       * \brief Sets the fill-in parameter
       *
       * \param[in] p
       * The fill-in parameter; this backend only accepts the value 0.
       */
      virtual void set_fill_in_param(int p) override
      {
        XASSERTM(p == 0, "For PreferredBackend::cuda, the fill in parameter has to be == 0!");
      }

      /// Returns the name of the solver.
      virtual String name() const override
      {
        return "ILU";
      }

      /**
       * \brief Symbolic initialization
       *
       * Aborts if the matrix is not square. Otherwise clones the layout of
       * the system matrix into the private copy and creates the symbolic
       * factorization handle for the given block size.
       */
      virtual void init_symbolic() override
      {
        if (_matrix.columns() != _matrix.rows())
        {
          XABORTM("Matrix is not square!");
        }

        _lu_matrix.clone(_matrix, LAFEM::CloneMode::Layout);

        // note: sizes are narrowed to int and the unsigned index arrays are
        // reinterpreted as int arrays, as required by the Intern interface
        cuda_info = Intern::cuda_ilub_init_symbolic(
          (int)_lu_matrix.rows(),
          (int)_lu_matrix.used_elements(),
          _lu_matrix.template val<LAFEM::Perspective::pod>(),
          (int*)_lu_matrix.row_ptr(),
          (int*)_lu_matrix.col_ind(),
          blocksize_);
      }

      /**
       * \brief Symbolic finalization
       *
       * Releases the factorization handle if there is one. Calling this
       * method without a preceding init_symbolic(), or calling it twice,
       * does nothing.
       */
      virtual void done_symbolic() override
      {
        if(cuda_info != nullptr)
        {
          Intern::cuda_ilub_done_symbolic(cuda_info);
          // forget the handle so that it can never be released twice
          cuda_info = nullptr;
        }
      }

      /**
       * \brief Numeric initialization
       *
       * Copies the current values of the system matrix into the private
       * copy and runs the numeric factorization on it.
       */
      virtual void init_numeric() override
      {
        _lu_matrix.copy(_matrix);

        Intern::cuda_ilub_init_numeric(
          _lu_matrix.template val<LAFEM::Perspective::pod>(),
          (int*)_lu_matrix.row_ptr(),
          (int*)_lu_matrix.col_ind(),
          cuda_info);
      }

      /**
       * \brief Applies the preconditioner
       *
       * \param[out] vec_cor
       * The vector that receives the preconditioned result.
       *
       * \param[in] vec_def
       * The vector that is to be preconditioned.
       *
       * \returns Status::success if Intern::cuda_ilub_apply returned 0,
       * otherwise Status::aborted. The filter and the statistics are
       * updated in both cases.
       */
      virtual Status apply(VectorType& vec_cor, const VectorType& vec_def) override
      {
        XASSERTM(_matrix.rows() == vec_cor.size(), "matrix / vector size mismatch!");
        XASSERTM(_matrix.rows() == vec_def.size(), "matrix / vector size mismatch!");

        TimeStamp ts_start;

        int status = Intern::cuda_ilub_apply(
          vec_cor.template elements<LAFEM::Perspective::pod>(),
          vec_def.template elements<LAFEM::Perspective::pod>(),
          _lu_matrix.template val<LAFEM::Perspective::pod>(),
          (int*)_lu_matrix.row_ptr(),
          (int*)_lu_matrix.col_ind(),
          cuda_info);

        this->_filter.filter_cor(vec_cor);

        TimeStamp ts_stop;
        Statistics::add_time_precon(ts_stop.elapsed(ts_start));
        Statistics::add_flops(_matrix.used_elements() * 2 + vec_cor.size());

        return (status == 0) ? Status::success :  Status::aborted;
      }
    }; // class ILUPrecondWithBackend<cuda, SparseMatrixBCSR<...>,...>

#endif //FEAT_HAVE_CUDA


    /**
     * \brief Fallback implementation for backend / matrix combinations without a specialization
     *
     * Objects of this class can be constructed, but both constructors
     * ignore all of their arguments and every virtual method aborts with
     * the message "not implemented yet!".
     *
     * \tparam backend_
     * The requested backend.
     *
     * \tparam Matrix_
     * The type of the system matrix.
     *
     * \tparam Filter_
     * The type of the system filter.
     */
    template<PreferredBackend backend_, typename Matrix_, typename Filter_>
    class ILUPrecondWithBackend :
      public ILUPrecondBase<Matrix_>
    {
    public:
      /// Constructor; all arguments are ignored.
      explicit ILUPrecondWithBackend(const Matrix_& /*matrix*/, const Filter_& /*filter*/, const int /*p*/ = 0)
      {
      }

      /// Constructor using a PropertyMap; all arguments are ignored.
      explicit ILUPrecondWithBackend(const String& /*section_name*/, const PropertyMap* /*section*/,
        const Matrix_& /*matrix*/, const Filter_& /*filter*/)
      {
      }

      /// Not available in the fallback; always aborts.
      virtual String name() const override
      {
        XABORTM("not implemented yet!");
      }

      /// Not available in the fallback; always aborts.
      virtual void set_fill_in_param(int /*p*/) override
      {
        XABORTM("not implemented yet!");
      }

      /// Not available in the fallback; always aborts.
      virtual void init_symbolic() override
      {
        XABORTM("not implemented yet!");
      }

      /// Not available in the fallback; always aborts.
      virtual void done_symbolic() override
      {
        XABORTM("not implemented yet!");
      }

      /// Not available in the fallback; always aborts.
      virtual void init_numeric() override
      {
        XABORTM("not implemented yet!");
      }

      /// Not available in the fallback; always aborts.
      virtual Status apply(typename Matrix_::VectorTypeL& /*vec_cor*/, const typename Matrix_::VectorTypeL& /*vec_def*/) override
      {
        XABORTM("not implemented yet!");
      }
    };


    /**
     * \brief ILU preconditioner front-end
     *
     * This class selects a backend-specific implementation at construction
     * time and forwards every solver call to it.
     *
     * \tparam Matrix_
     * The type of the system matrix.
     *
     * \tparam Filter_
     * The type of the system filter.
     */
    template<typename Matrix_, typename Filter_>
    class ILUPrecond : public SolverBase<typename Matrix_::VectorTypeL>
    {
    public:
      typedef Matrix_ MatrixType;
      typedef Filter_ FilterType;
      typedef typename MatrixType::VectorTypeL VectorType;
      typedef typename MatrixType::DataType DataType;

      /// our base class
      typedef SolverBase<VectorType> BaseClass;

    private:
      /// implementation that is chosen for PreferredBackend::cuda
      typedef ILUPrecondWithBackend<PreferredBackend::cuda, Matrix_, Filter_> CudaImplType;
      /// implementation that is chosen for every other backend
      typedef ILUPrecondWithBackend<PreferredBackend::generic, Matrix_, Filter_> GenericImplType;

      /// the backend-specific implementation that does the actual work
      std::shared_ptr<ILUPrecondBase<Matrix_>> _impl;

    public:
      /**
       * \brief Constructor
       *
       * \param[in] backend
       * The desired backend; everything but PreferredBackend::cuda selects
       * the generic implementation.
       *
       * \param[in] matrix
       * The system matrix.
       *
       * \param[in] filter
       * The system filter.
       *
       * \param[in] p
       * The fill-in parameter; it is only forwarded to the generic implementation.
       * NOTE(review): for the cuda backend a non-zero p is dropped without
       * any diagnostic -- confirm that this is intended.
       */
      ILUPrecond(PreferredBackend backend, const MatrixType& matrix, const FilterType& filter, const int p = 0)
      {
        if(backend == PreferredBackend::cuda)
        {
          _impl = std::make_shared<CudaImplType>(matrix, filter);
        }
        else
        {
          // mkl, generic and any other backend share the generic implementation
          _impl = std::make_shared<GenericImplType>(matrix, filter, p);
        }
      }

      /**
       * \brief Constructor using a PropertyMap
       *
       * \param[in] section_name
       * The name of the config section.
       *
       * \param[in] section
       * The config section; it is passed on to the base class as well as
       * to the chosen implementation.
       *
       * \param[in] backend
       * The desired backend; everything but PreferredBackend::cuda selects
       * the generic implementation.
       *
       * \param[in] matrix
       * The system matrix.
       *
       * \param[in] filter
       * The system filter.
       */
      ILUPrecond(const String& section_name, const PropertyMap* section, PreferredBackend backend, const MatrixType& matrix, const FilterType& filter) :
        BaseClass(section_name, section)
      {
        if(backend == PreferredBackend::cuda)
        {
          _impl = std::make_shared<CudaImplType>(section_name, section, matrix, filter);
        }
        else
        {
          // mkl, generic and any other backend share the generic implementation
          _impl = std::make_shared<GenericImplType>(section_name, section, matrix, filter);
        }
      }

      /// Empty virtual destructor.
      virtual ~ILUPrecond()
      {
      }

      /// Returns the name reported by the implementation.
      virtual String name() const override
      {
        return _impl->name();
      }

      /// Forwards the fill-in parameter to the implementation.
      virtual void set_fill_in_param(int p)
      {
        _impl->set_fill_in_param(p);
      }

      /// Forwards the symbolic initialization to the implementation.
      virtual void init_symbolic() override
      {
        _impl->init_symbolic();
      }

      /// Forwards the symbolic finalization to the implementation.
      virtual void done_symbolic() override
      {
        _impl->done_symbolic();
      }

      /// Forwards the numeric initialization to the implementation.
      virtual void init_numeric() override
      {
        _impl->init_numeric();
      }

      /**
       * \brief Applies the preconditioner by means of the implementation
       *
       * \param[out] vec_cor
       * The vector that receives the preconditioned result.
       *
       * \param[in] vec_def
       * The vector that is to be preconditioned.
       *
       * \returns The status returned by the implementation.
       */
      virtual Status apply(VectorType& vec_cor, const VectorType& vec_def) override
      {
        return _impl->apply(vec_cor, vec_def);
      }
    }; // class ILUPrecond


    /**
     * \brief Creates a new ILUPrecond solver object
     *
     * \param[in] backend
     * The desired backend.
     *
     * \param[in] matrix
     * The system matrix.
     *
     * \param[in] filter
     * The system filter.
     *
     * \param[in] p
     * The fill-in parameter; defaults to 0.
     *
     * \returns A shared pointer to a new ILUPrecond object.
     */
    template<typename Matrix_, typename Filter_>
    inline std::shared_ptr<ILUPrecond<Matrix_, Filter_>> new_ilu_precond(PreferredBackend backend,
      const Matrix_& matrix, const Filter_& filter, const int p = 0)
    {
      typedef ILUPrecond<Matrix_, Filter_> PrecondType;
      return std::make_shared<PrecondType>(backend, matrix, filter, p);
    }


    /**
     * \brief Creates a new ILUPrecond solver object using a PropertyMap
     *
     * \param[in] section_name
     * The name of the config section.
     *
     * \param[in] section
     * The config section that is handed to the solver.
     *
     * \param[in] backend
     * The desired backend.
     *
     * \param[in] matrix
     * The system matrix.
     *
     * \param[in] filter
     * The system filter.
     *
     * \returns A shared pointer to a new ILUPrecond object.
     */
    template<typename Matrix_, typename Filter_>
    inline std::shared_ptr<ILUPrecond<Matrix_, Filter_>> new_ilu_precond(
      const String& section_name, const PropertyMap* section, PreferredBackend backend,
      const Matrix_& matrix, const Filter_& filter)
    {
      typedef ILUPrecond<Matrix_, Filter_> PrecondType;
      return std::make_shared<PrecondType>(section_name, section, backend, matrix, filter);
    }

  } // namespace Solver

} // namespace FEAT

XABORTM
#define XABORTM(msg)
Abortion macro definition with custom message.
Definition: assertion.hpp:192

XASSERT
#define XASSERT(expr)
Assertion macro definition.
Definition: assertion.hpp:262

XASSERTM
#define XASSERTM(expr, msg)
Assertion macro definition with custom message.
Definition: assertion.hpp:263

FEAT::LAFEM::Container::size
Index size() const
Returns the containers size.
Definition: container.hpp:1136

FEAT::LAFEM::DenseVector< DT_, IT_ >

FEAT::LAFEM::DenseVector::elements
DT_ * elements()
Get a pointer to the data array.
Definition: dense_vector.hpp:737

FEAT::LAFEM::SparseMatrixBCSR
CSR based blocked sparse matrix.
Definition: sparse_matrix_bcsr.hpp:91

FEAT::LAFEM::SparseMatrixBCSR::VectorTypeL
Intern::BCSRVectorHelper< DT_, IT_, BlockHeight_ >::VectorType VectorTypeL
Compatible L-vector type.
Definition: sparse_matrix_bcsr.hpp:122

FEAT::LAFEM::SparseMatrixBCSR::rows
Index rows() const
Retrieve matrix row count.
Definition: sparse_matrix_bcsr.hpp:988

FEAT::LAFEM::SparseMatrixBCSR::columns
Index columns() const
Retrieve matrix column count.
Definition: sparse_matrix_bcsr.hpp:1003

FEAT::LAFEM::SparseMatrixCSR
CSR based sparse matrix.
Definition: sparse_matrix_csr.hpp:60

FEAT::LAFEM::SparseMatrixCSR::rows
Index rows() const
Retrieve matrix row count.
Definition: sparse_matrix_csr.hpp:1169

FEAT::LAFEM::SparseMatrixCSR::columns
Index columns() const
Retrieve matrix column count.
Definition: sparse_matrix_csr.hpp:1180

FEAT::ParseError
Class for parser related errors.
Definition: exception.hpp:132

FEAT::PropertyMap
A class organizing a tree of key-value pairs.
Definition: property_map.hpp:48

FEAT::PropertyMap::query
std::pair< String, bool > query(String key_path) const
Queries a value by its key path.
Definition: property_map.cpp:125

FEAT::Solver::ILUPrecondBase
Inheritances inside ilu_precond.hpp.
Definition: ilu_precond.hpp:937

FEAT::Solver::ILUPrecond
ILU(0) and ILU(p) preconditioner implementation.
Definition: ilu_precond.hpp:1669

FEAT::Solver::ILUPrecond::ILUPrecond
ILUPrecond(const String &section_name, const PropertyMap *section, PreferredBackend backend, const MatrixType &matrix, const FilterType &filter)
Constructor using a PropertyMap.
Definition: ilu_precond.hpp:1732

FEAT::Solver::ILUPrecond::~ILUPrecond
virtual ~ILUPrecond()
Empty virtual destructor.
Definition: ilu_precond.hpp:1750

FEAT::Solver::ILUPrecond::ILUPrecond
ILUPrecond(PreferredBackend backend, const MatrixType &matrix, const FilterType &filter, const int p=0)
Constructor.
Definition: ilu_precond.hpp:1699

FEAT::Solver::ILUPrecond::BaseClass
SolverBase< VectorType > BaseClass
Our base class.
Definition: ilu_precond.hpp:1680

FEAT::Solver::ILUPrecond::init_numeric
virtual void init_numeric() override
Numeric initialization method.
Definition: ilu_precond.hpp:1792

FEAT::Solver::ILUPrecond::apply
virtual Status apply(VectorType &vec_cor, const VectorType &vec_def) override
apply the preconditioner
Definition: ilu_precond.hpp:1777

FEAT::Solver::ILUPrecond::set_fill_in_param
virtual void set_fill_in_param(int p)
Sets the fill-in parameter.
Definition: ilu_precond.hpp:1766

FEAT::Solver::ILUPrecond::done_symbolic
virtual void done_symbolic() override
Symbolic finalization method.
Definition: ilu_precond.hpp:1787

FEAT::Solver::ILUPrecond::init_symbolic
virtual void init_symbolic() override
Symbolic initialization method.
Definition: ilu_precond.hpp:1782

FEAT::Solver::ILUPrecond::name
virtual String name() const override
Returns the name of the solver.
Definition: ilu_precond.hpp:1755

FEAT::Solver::ILUPrecondWithBackend< PreferredBackend::generic, LAFEM::SparseMatrixBCSR< DT_, IT_, dim_, dim_ >, Filter_ >::ILUPrecondWithBackend
ILUPrecondWithBackend(const MatrixType &matrix, const FilterType &filter, const int p=0)
Constructor.
Definition: ilu_precond.hpp:1136

FEAT::Solver::ILUPrecondWithBackend< PreferredBackend::generic, LAFEM::SparseMatrixBCSR< DT_, IT_, dim_, dim_ >, Filter_ >::name
virtual String name() const override
Returns the name of the solver.
Definition: ilu_precond.hpp:1174

FEAT::Solver::ILUPrecondWithBackend< PreferredBackend::generic, LAFEM::SparseMatrixBCSR< DT_, IT_, dim_, dim_ >, Filter_ >::~ILUPrecondWithBackend
virtual ~ILUPrecondWithBackend()
Empty virtual destructor.
Definition: ilu_precond.hpp:1157

FEAT::Solver::ILUPrecondWithBackend< PreferredBackend::generic, LAFEM::SparseMatrixBCSR< DT_, IT_, dim_, dim_ >, Filter_ >::apply
virtual Status apply(VectorType &out, const VectorType &in) override
apply the preconditioner
Definition: ilu_precond.hpp:1213

FEAT::Solver::ILUPrecondWithBackend< PreferredBackend::generic, LAFEM::SparseMatrixBCSR< DT_, IT_, dim_, dim_ >, Filter_ >::set_fill_in_param
virtual void set_fill_in_param(int p) override
Sets the fill-in parameter.
Definition: ilu_precond.hpp:1167

FEAT::Solver::ILUPrecondWithBackend< PreferredBackend::generic, LAFEM::SparseMatrixCSR< DT_, IT_ >, Filter_ >::apply
virtual Status apply(VectorType &out, const VectorType &in) override
apply the preconditioner
Definition: ilu_precond.hpp:1079

FEAT::Solver::ILUPrecondWithBackend< PreferredBackend::generic, LAFEM::SparseMatrixCSR< DT_, IT_ >, Filter_ >::set_fill_in_param
virtual void set_fill_in_param(int p) override
Sets the fill-in parameter.
Definition: ilu_precond.hpp:1033

FEAT::Solver::ILUPrecondWithBackend< PreferredBackend::generic, LAFEM::SparseMatrixCSR< DT_, IT_ >, Filter_ >::~ILUPrecondWithBackend
virtual ~ILUPrecondWithBackend()
Empty virtual destructor.
Definition: ilu_precond.hpp:1023

FEAT::Solver::ILUPrecondWithBackend< PreferredBackend::generic, LAFEM::SparseMatrixCSR< DT_, IT_ >, Filter_ >::name
virtual String name() const override
Returns the name of the solver.
Definition: ilu_precond.hpp:1040

FEAT::Solver::ILUPrecondWithBackend< PreferredBackend::generic, LAFEM::SparseMatrixCSR< DT_, IT_ >, Filter_ >::ILUPrecondWithBackend
ILUPrecondWithBackend(const MatrixType &matrix, const FilterType &filter, const int p=0)
Constructor.
Definition: ilu_precond.hpp:1002

FEAT::Solver::ILUPrecondWithBackend
ILU(0) and ILU(p) preconditioner internal implementation.
Definition: ilu_precond.hpp:1614

FEAT::Solver::SolverBase
Polymorphic solver interface.
Definition: base.hpp:183

FEAT::Statistics::add_flops
static void add_flops(Index flops)
Add an amount of flops to the global flop counter.
Definition: statistics.hpp:206

FEAT::String
String class implementation.
Definition: string.hpp:46

FEAT::TimeStamp
Time stamp class.
Definition: time_stamp.hpp:54

FEAT::TimeStamp::elapsed
double elapsed(const TimeStamp &before) const
Calculates the time elapsed between two time stamps.
Definition: time_stamp.hpp:100

FEAT::LAFEM::CloneMode::Layout
@ Layout

FEAT::Solver::Status
Status
Solver status return codes enumeration.
Definition: base.hpp:47

FEAT::Solver::Status::success
@ success
solving successful (convergence criterion fulfilled)

FEAT::Solver::Status::aborted
@ aborted
premature abort (solver aborted due to internal errors or preconditioner failure)

FEAT::Solver::new_ilu_precond
std::shared_ptr< ILUPrecond< Matrix_, Filter_ > > new_ilu_precond(PreferredBackend backend, const Matrix_ &matrix, const Filter_ &filter, const int p=0)
Creates a new ILUPrecond solver object.
Definition: ilu_precond.hpp:1817

FEAT
FEAT namespace.
Definition: adjactor.hpp:12

FEAT::PreferredBackend
PreferredBackend
The backend that shall be used in all compute heavy calculations.
Definition: backend.hpp:124

FEAT::PreferredBackend::mkl
@ mkl

FEAT::PreferredBackend::cuda
@ cuda

FEAT::PreferredBackend::generic
@ generic