// Source: feat3/parti__domain__control__base_8hpp_source.html

// FEAT3: Finite Element Analysis Toolbox, Version 3

// Copyright (C) 2010 by Stefan Turek & the FEAT group

// FEAT3 is released under the GNU General Public License version 3,

// see the file 'copyright.txt' in the top level directory for details.


#pragma once


#include <kernel/base_header.hpp>


#include <kernel/util/dist.hpp>

#include <kernel/util/dist_file_io.hpp>

#include <kernel/runtime.hpp>

#include <kernel/util/simple_arg_parser.hpp>

#include <kernel/util/property_map.hpp>

#include <kernel/util/statistics.hpp>

#include <kernel/geometry/mesh_node.hpp>

#include <kernel/geometry/partition_set.hpp>

#include <kernel/geometry/parti_2lvl.hpp>

#include <kernel/geometry/parti_iterative.hpp>

#include <kernel/geometry/parti_parmetis.hpp>

#include <kernel/geometry/parti_zoltan.hpp>


#include <control/domain/domain_control.hpp>


namespace FEAT

{

  namespace Control

  {

    namespace Domain

    {

      template<typename DomainLevel_>

      class PartiDomainControlBase :

        public Control::Domain::DomainControl<DomainLevel_>

      {

      public:

        /// our base class: the plain domain control for the same level type
        using BaseClass = Control::Domain::DomainControl<DomainLevel_>;

        // types re-exported from the base class
        using typename BaseClass::LevelType;
        using typename BaseClass::LayerType;
        using typename BaseClass::MeshType;
        using typename BaseClass::AtlasType;

        /// root mesh node type for the mesh type of the base class
        using MeshNodeType = Geometry::RootMeshNode<MeshType>;
        /// mesh-part type as declared by the level type
        using MeshPartType = typename LevelType::PartType;

        /// scalar type of the element weights returned by _compute_weights()
        using WeightType = Real;


        /**
         * \brief Bookkeeping record for one layer of the partitioning ancestry
         *
         * The domain control stores one object of this class per ancestry layer.
         * All integral and boolean members start out as 0 / false, all class-type
         * members are value-initialized.
         */
        class Ancestor
        {
        public:
          /// index of the layer this ancestor belongs to, or -1 if this process is not part of that layer
          int layer = 0;
          /// index of the parent layer, or -1 if this process is not part of the parent layer
          int layer_p = 0;
          /// total number of processes for this layer
          int num_procs = 0;
          /// total number of partitions per progeny group
          int num_parts = 0;
          /// desired maximum level for this layer
          int desired_level_max = 0;
          /// desired minimum level for this layer
          int desired_level_min = 0;

          /// progeny group of this process
          int progeny_group = 0;
          /// child index of this process within its progeny group
          int progeny_child = 0;
          /// first rank (w.r.t. the main communicator) of the range forming the progeny communicator
          int progeny_first = 0;
          /// number of ranks forming the progeny communicator
          int progeny_count = 0;
          /// the progeny communicator
          Dist::Comm progeny_comm{};

          /// NOTE(review): presumably set once a partitioning has been chosen for this layer -- confirm against the code that sets it
          bool parti_found = false;
          /// partitioner description; printed by get_chosen_parti_info()
          String parti_info{};
          /// level that the partitioning refers to; printed by get_chosen_parti_info() and written by serialize_partitioning()
          int parti_level = 0;
          /// NOTE(review): presumably marks an a-priori partitioning -- confirm against the code that sets it
          bool parti_apriori = false;
          /// the partitioning graph; serialized by serialize_partitioning()
          Adjacency::Graph parti_graph{};

          /// default constructor; all members take their default member initializers
          Ancestor() = default;
        }; // class Ancestor


      protected:

        /// creation flag; all setters/parsers in this class assert that it is still false
        bool _was_created;

        /// the mesh adapt mode, see set_adapt_mode() / get_adapt_mode()
        Geometry::AdaptMode _adapt_mode;


        /// is the "metis"/"parmetis" partitioner type allowed? (see _parse_parti_type())
        bool _allow_parti_metis;

        /// is the "genetic" partitioner type allowed?
        bool _allow_parti_genetic;

        /// is the "naive" partitioner type allowed?
        bool _allow_parti_naive;

        /// is the "zoltan" partitioner type allowed?
        bool _allow_parti_zoltan;


        /// value of the constructor argument of the same name
        bool _support_multi_layered;


        /// desired levels as (level index, process count) pairs, finest level first;
        /// the last entry carries the process count 0
        std::deque<std::pair<int,int>> _desired_levels;


        /// chosen levels as (level index, process count) pairs; not filled by any of the
        /// functions visible here -- NOTE(review): presumably set during creation
        std::deque<std::pair<int,int>> _chosen_levels;


        /// value of the 'parti-rank-elems' option; defaults to 1
        int _required_elems_per_rank;

        /// first value of 'parti-genetic-time' / value of 'parti-genetic-time-init'; defaults to 5
        double _genetic_time_init;

        /// second value of 'parti-genetic-time' / value of 'parti-genetic-time-mutate'; defaults to 5
        double _genetic_time_mutate;


        /// the partitioning ancestry, one entry per layer
        std::deque<Ancestor> _ancestry;


      public:

        /**
         * \brief Constructor
         *
         * Only the naive partitioner is allowed by default; METIS, Zoltan and the
         * (exotic) genetic partitioner have to be enabled explicitly.
         *
         * \param[in] comm_
         * The communicator that is passed on to the base class.
         *
         * \param[in] support_multi_layered
         * Stored in _support_multi_layered.
         */
        explicit PartiDomainControlBase(const Dist::Comm& comm_, bool support_multi_layered) :
          BaseClass(comm_),
          _was_created(false),
          _adapt_mode(Geometry::AdaptMode::chart),
          _allow_parti_metis(false), _allow_parti_genetic(false),
          _allow_parti_naive(true), _allow_parti_zoltan(false),
          _support_multi_layered(support_multi_layered),
          _desired_levels(),
          _chosen_levels(),
          _required_elems_per_rank(1),
          _genetic_time_init(5.0),
          _genetic_time_mutate(5.0),
          _ancestry()
        {
        }


        /// virtual destructor; nothing to release beyond what the members clean up themselves
        virtual ~PartiDomainControlBase() = default;


        /**
         * \brief Parses the partitioner options from a command line argument parser
         *
         * Recognized options:
         * - <c>--parti-type \<types...\></c>: resets all partitioner types and allows only the listed ones
         * - <c>--parti-rank-elems \<count\></c>
         * - <c>--parti-genetic-time \<time-init\> \<time-mutate\></c>
         *
         * \param[in] args
         * The argument parser to query.
         *
         * \returns \c false if an unknown partitioner type was given (an error message is
         * printed via the communicator in that case), otherwise \c true.
         */
        virtual bool parse_args(SimpleArgParser& args)
        {
          XASSERTM(!_was_created, "This function has to be called before domain control creation!");

          // --parti-type <types...>
          const auto parti_types = args.query("parti-type");
          if(parti_types != nullptr)
          {
            // an explicit list replaces the defaults, so forbid everything first
            this->_reset_parti_types();

            for(const auto& type_name : parti_types->second)
            {
              // virtual call, so derived classes may accept additional types
              if(this->_parse_parti_type(type_name))
                continue;

              this->_comm.print("ERROR: unknown partitioner type '" + type_name + "'");
              return false;
            }
          }

          // --parti-rank-elems <count>
          args.parse("parti-rank-elems", _required_elems_per_rank);

          // --parti-genetic-time <time-init> <time-mutate>
          args.parse("parti-genetic-time", _genetic_time_init, _genetic_time_mutate);

          return true;
        }


        virtual bool parse_property_map(const PropertyMap& pmap)

        {

          XASSERTM(!_was_created, "This function has to be called before domain control creation!");

          auto parti_type_p = pmap.query("parti-type");

          if(parti_type_p.second)

          {

            // disallow all strategies by default

            this->_reset_parti_types();


            std::deque<String> allowed_partitioners = parti_type_p.first.split_by_whitespaces();


            for(const auto& t : allowed_partitioners)

            {

              if(!this->_parse_parti_type(t))

              {

                this->_comm.print("ERROR: unknown partitioner type '" + t + "'");

                return false;

              }

            }

          }


          auto parti_rank_elems_p = pmap.query("parti-rank-elems");

          if(parti_rank_elems_p.second)

          {

            if(!parti_rank_elems_p.first.parse(_required_elems_per_rank))

            {

              this->_comm.print("ERROR: Failed to parse 'parti-rank-elems'");

              return false;

            }

          }


          auto genetic_time_init_p = pmap.query("parti-genetic-time-init");

          if(genetic_time_init_p.second)

          {

            if(!genetic_time_init_p.first.parse(_genetic_time_init))

            {

              this->_comm.print("ERROR: Failed to parse 'parti-genetic-time-init'");

              return false;

            }

          }


          auto genetic_time_mutate_p = pmap.query("parti-genetic-time-mutate");

          if(genetic_time_mutate_p.second)

          {

            if(!genetic_time_mutate_p.first.parse(_genetic_time_mutate))

            {

              this->_comm.print("ERROR: Failed to parse 'parti-genetic-time-mutate'");

              return false;

            }

          }


          return true;

        }


        /**
         * \brief Sets the mesh adapt mode
         *
         * Must be called before the domain control is created.
         *
         * \param[in] adapt_mode
         * The adapt mode to store.
         */
        void set_adapt_mode(Geometry::AdaptMode adapt_mode)
        {
          XASSERTM(!_was_created, "This function has to be called before domain control creation!");
          this->_adapt_mode = adapt_mode;
        }


        /// \returns The currently stored mesh adapt mode.
        Geometry::AdaptMode get_adapt_mode() const
        {
          return this->_adapt_mode;
        }


        void set_desired_levels(const String& slvls)

        {

          std::deque<String> sl = slvls.split_by_whitespaces();

          set_desired_levels(sl);

        }


        virtual void set_desired_levels(const std::deque<String>& slvls)

        {

          XASSERTM(!_was_created, "This function has to be called before domain control creation!");


          const int nranks = this->_comm.size();

          std::deque<String> sv;


          for(std::size_t i(0); i < slvls.size(); ++i)

          {

            int ilvl = -1, nprocs = -1;

            sv = slvls.at(i).split_by_string(":");


            if((sv.size() < std::size_t(1)) || (sv.size() > std::size_t(2)))

              throw ParseError("Invalid input format", slvls.at(i), "an int-pair 'level:patches'");


            if(!sv.front().parse(ilvl))

              throw ParseError("Failed to parse level index", slvls.at(i), "an integer");

            if((sv.size() > std::size_t(1)) && !sv.back().parse(nprocs))

              throw ParseError("Failed to parse process count" , slvls.at(i), "an integer");


            // level must be non-negative

            if(ilvl < 0)

              throw ParseError("Invalid negative level index", slvls.at(i), "a non-negative level index");


            // first level index?

            if(i == std::size_t(0))

            {

              // if the process count is given, it must match the communicator size

              if((nprocs >= 0) && (nprocs != this->_comm.size()))

                throw ParseError("Invalid number of processes for global level: '" + slvls.at(i) +

                  "', expected " + stringify(this->_comm.size()) + " but got " + stringify(nprocs));

              _desired_levels.push_back(std::make_pair(ilvl, nranks));

              continue;

            }


            // make sure the level parameter is non-ascending

            if(_desired_levels.back().first < ilvl)

              throw ParseError("Invalid non-descending level index: '" + slvls.at(i) +

                "', expected <= " + stringify(_desired_levels.back().first) + " but got " + stringify(ilvl));


            // ignore process count for last level

            if((i + 1) == slvls.size())

              nprocs = 0;

            // if the number of processes is identical to the previous one, simply ignore this parameter

            else if(_desired_levels.back().second == nprocs)

              continue;

            // the process count must not be ascending

            else if(_desired_levels.back().second < nprocs)

              throw ParseError("Invalid non-descending process count: '" + slvls.at(i) +

                "', expected < " + stringify(_desired_levels.back().second) + " but got " + stringify(nprocs));

            // the previous process count must be a multiple of the new one

            else if(_desired_levels.back().second % nprocs != 0)

              throw ParseError("Invalid indivisible process count: '" + slvls.at(i) +

                "', expected a divisor of " + stringify(_desired_levels.back().second) + " but got " + stringify(nprocs));


            // push the level-proc pair

            _desired_levels.push_back(std::make_pair(ilvl, nprocs));

          }

        }


        /**
         * \brief Sets the desired levels for a single-layered hierarchy
         *
         * \param[in] lvl_max
         * The desired maximum level; must be non-negative.
         *
         * \param[in] lvl_min
         * The desired minimum level. A negative value is interpreted relative to
         * \p lvl_max, i.e. -1 means "equal to lvl_max", -2 means "one level below", etc.
         */
        virtual void set_desired_levels(int lvl_max, int lvl_min = -1)
        {
          XASSERTM(!_was_created, "This function has to be called before domain control creation!");

          // resolve a relative minimum level against the maximum level
          const int level_max = lvl_max;
          int level_min = lvl_min;
          if(level_min < 0)
            level_min = lvl_max + lvl_min + 1;

          XASSERTM(level_max >= 0, "Invalid level-max");
          XASSERTM(level_min >= 0, "Invalid level-min");
          XASSERTM(level_max >= level_min, "Invalid level-min/max combination");

          // finest level on all processes, coarsest level with the placeholder process count 0
          _desired_levels.emplace_back(level_max, this->_comm.size());
          _desired_levels.emplace_back(level_min, 0);
        }


        /**
         * \brief Sets the desired levels for a double-layered hierarchy
         *
         * \param[in] lvl_max
         * The desired maximum level; must be non-negative.
         *
         * \param[in] lvl_med
         * The desired medium level. A negative value is interpreted relative to \p lvl_max
         * (-1 = lvl_max, -2 = lvl_max-1, ...). The resolved value must be strictly less than
         * the maximum level.
         *
         * \param[in] lvl_min
         * The desired minimum level. A negative value is interpreted relative to the
         * resolved medium level (-1 = medium level, -2 = medium level - 1, ...).
         */
        virtual void set_desired_levels(int lvl_max, int lvl_med, int lvl_min)
        {
          XASSERTM(!_was_created, "This function has to be called before domain control creation!");

          // double-layered hierarchy
          const int _desired_level_max = lvl_max;
          const int _desired_level_med = (lvl_med >= 0 ? lvl_med : lvl_max + lvl_med + 1);
          // resolve a relative minimum against the *resolved* medium level; using the raw
          // (possibly negative) lvl_med argument here would always yield a negative level
          // whenever both lvl_med and lvl_min are given in relative form
          const int _desired_level_min = (lvl_min >= 0 ? lvl_min : _desired_level_med + lvl_min + 1);

          XASSERTM(_desired_level_max >= 0, "Invalid level-max");
          XASSERTM(_desired_level_med >= 0, "Invalid level-med");
          XASSERTM(_desired_level_min >= 0, "Invalid level-min");

          // level_max must be strictly greater than level_med
          XASSERTM(_desired_level_max > _desired_level_med, "Invalid level-max/med combination");

          // level_med must be greater or equal level_min
          XASSERTM(_desired_level_med >= _desired_level_min, "Invalid level-med/min combination");

          // finest level on all processes, medium level on a single process,
          // coarsest level with the placeholder process count 0
          _desired_levels.emplace_back(std::make_pair(_desired_level_max, this->_comm.size()));
          _desired_levels.emplace_back(std::make_pair(_desired_level_med, 1));
          _desired_levels.emplace_back(std::make_pair(_desired_level_min, 0));
        }


        int get_desired_level_max() const

        {

          return _desired_levels.front().first;

        }


        int get_desired_level_min() const

        {

          return _desired_levels.back().first;

        }


        /**
         * \brief Formats the desired levels as a string
         *
         * All entries but the last one are written as 'level:procs' followed by two spaces;
         * the last entry is written as its level index only.
         *
         * \returns The formatted string, or an empty string if no desired levels have been set.
         */
        virtual String format_desired_levels() const
        {
          String s;

          // nothing to format; calling back() on an empty deque would be undefined behavior
          if(_desired_levels.empty())
            return s;

          for(std::size_t i(0); (i + 1) < _desired_levels.size(); ++i)
          {
            s += stringify(_desired_levels.at(i).first);
            s += ":";
            s += stringify(_desired_levels.at(i).second);
            s += "  ";
          }
          s += stringify(_desired_levels.back().first);
          return s;
        }


        /**
         * \brief Formats the chosen levels as a string
         *
         * All entries but the last one are written as 'level:procs' followed by two spaces;
         * the last entry is written as its level index only.
         *
         * \returns The formatted string, or an empty string if no levels have been chosen yet.
         */
        virtual String format_chosen_levels() const
        {
          String s;

          // nothing to format; calling back() on an empty deque would be undefined behavior
          if(_chosen_levels.empty())
            return s;

          for(std::size_t i(0); (i + 1) < _chosen_levels.size(); ++i)
          {
            s += stringify(_chosen_levels.at(i).first);
            s += ":";
            s += stringify(_chosen_levels.at(i).second);
            s += "  ";
          }
          s += stringify(_chosen_levels.back().first);
          return s;
        }


        /**
         * \brief Returns a human-readable summary of the partitioning of each ancestry layer
         *
         * The ancestry is traversed back to front; each layer contributes one line of the form
         * '<info> on level <L> for <P> patch(es) on <N> process(es)', lines are separated by
         * newline characters.
         *
         * \returns The summary string; empty if the ancestry is empty.
         */
        virtual String get_chosen_parti_info() const
        {
          String info;
          bool first_line = true;

          for(auto anc = this->_ancestry.rbegin(); anc != this->_ancestry.rend(); ++anc)
          {
            // separate consecutive layers by a line break
            if(!first_line)
              info += "\n";
            first_line = false;

            info += anc->parti_info;
            info += " on level ";
            info += stringify(anc->parti_level);
            info += " for ";
            info += stringify(anc->num_parts);
            if(anc->num_parts > 1)
              info += " patches on ";
            else
              info += " patch on ";
            info += stringify(anc->num_procs);
            if(anc->num_procs > 1)
              info += " processes";
            else
              info += " process";
          }

          return info;
        }


        const std::deque<std::pair<int, int>> get_desired_levels() const

        {

          return this->_desired_levels;

        }


        const std::deque<std::pair<int, int>> get_chosen_levels() const

        {

          return this->_chosen_levels;

        }


        /**
         * \brief Dumps the ancestry of this process into a single-line debug string
         *
         * Each layer is written as
         * 'procs:parts[group+child:first+count.rank](level_max:level_min)' followed by a '*'
         * if this process is part of the layer and a '>' if it is part of the parent layer
         * (blanks otherwise). Layers are separated by ' | '.
         *
         * \returns The dump string; empty if the ancestry is empty.
         */
        String dump_ancestry() const
        {
          String out;
          bool need_separator = false;

          for(const Ancestor& anc : this->_ancestry)
          {
            if(need_separator)
              out += " | ";
            need_separator = true;

            // process and partition counts
            out += stringify(anc.num_procs);
            out += ":";
            out += stringify(anc.num_parts);

            // progeny information
            out += "[";
            out += stringify(anc.progeny_group).pad_front(2);
            out += "+";
            out += stringify(anc.progeny_child);
            out += ":";
            out += stringify(anc.progeny_first).pad_front(2);
            out += "+";
            out += stringify(anc.progeny_count);
            out += ".";
            out += stringify(anc.progeny_comm.rank());
            out += "](";

            // desired level range
            out += stringify(anc.desired_level_max);
            out += ":";
            out += stringify(anc.desired_level_min);
            out += ")";

            // layer / parent layer membership markers
            if(anc.layer >= 0)
              out += "*";
            else
              out += " ";
            if(anc.layer_p >= 0)
              out += ">";
            else
              out += " ";
          }

          return out;
        }


        const std::deque<Ancestor>& get_ancestry() const

        {

          return this->_ancestry;

        }


        std::vector<char> serialize_partitioning() const

        {

          BinaryStream bs;

          typedef std::uint64_t u64;


          // serialization magic number: "F3PaDoCo"

          const std::uint64_t magic = 0x6F436F4461503346;


          XASSERT(this->_num_global_layers >= this->_ancestry.size());


          if(this->_comm.rank() == 0)

          {

            // dump magic

            bs.write((const char*)&magic, 8u);


            // write finest level

            const u64 lev = u64(this->_virt_levels.front()->get_level_index());

            bs.write((const char*)&lev, 8u);


            // serialize ancestry/layers

            const u64 na = u64(this->_ancestry.size());

            bs.write((const char*)&na, 8u);


            // write number of ranks per layer in reverse order

            for(auto it = this->_ancestry.rbegin(); it != this->_ancestry.rend(); ++it)

            {

              // write ranks

              const u64 np = u64(it->num_procs);

              const u64 pl = u64(it->parti_level);

              bs.write((const char*)&np, 8u);

              bs.write((const char*)&pl, 8u);

            }

          }


          // loop over all ancestry graphs

          for(auto it = this->_ancestry.rbegin(); it != this->_ancestry.rend(); ++it)

          {

            if(it == this->_ancestry.rbegin())

            {

              std::vector<char> buf = it->parti_graph.serialize();

              bs.write(buf.data(), std::streamsize(buf.size()));

              continue;

            }


            // get layer index

            if(it->layer_p < 0)

              continue;


            // get parent layer communicator

            const std::size_t ilp = std::size_t(it->layer_p);

            XASSERT(ilp < this->_layers.size());

            const Dist::Comm& comm_p = this->_layers.at(ilp)->comm();


            // serialize graph

            std::vector<char> buf = it->parti_graph.serialize();


            // choose maximum size

            u64 buf_size = buf.size();


            // gather individual buffer sizes on rank 0

            std::vector<u64> all_sizes;

            if(comm_p.rank() == 0)

              all_sizes.resize(std::size_t(comm_p.size()));

            comm_p.gather(&buf_size, 1u, all_sizes.data(), 1u, 0);


            // allreduce maximum size

            comm_p.allreduce(&buf_size, &buf_size, std::size_t(1), Dist::op_max);


            // adjust buffer size

            if(buf_size > u64(buf.size()))

              buf.resize(buf_size);


            // on rank 0, allocate common buffer

            std::vector<char> com_buf;

            if(comm_p.rank() == 0)

              com_buf.resize(std::size_t(buf_size * u64(comm_p.size())));


            // gather all buffers on rank 0

            comm_p.gather(buf.data(), buf_size, com_buf.data(), buf_size, 0);


            // write each individual buffer

            if(comm_p.rank() == 0)

            {

              char* x = com_buf.data();

              for(u64 k(0); k < u64(comm_p.size()); ++k)

                bs.write(&x[k*buf_size], std::streamsize(all_sizes[k]));

            }

          }


          return bs.container();

        }


      protected:

        /// Disallows all partitioner types known to this class.
        virtual void _reset_parti_types()
        {
          _allow_parti_metis = false;
          _allow_parti_genetic = false;
          _allow_parti_naive = false;
          _allow_parti_zoltan = false;
        }


        /**
         * \brief Allows the partitioner type of the given name
         *
         * The comparison is case-insensitive. Known names are "metis"/"parmetis", "genetic",
         * "naive" and "zoltan".
         *
         * \param[in] type
         * The name of the partitioner type to allow.
         *
         * \returns \c true if the name was recognized (and the corresponding flag was set),
         * otherwise \c false.
         */
        virtual bool _parse_parti_type(const String& type)
        {
          // "metis" and "parmetis" are synonyms
          if((type.compare_no_case("metis") == 0) || (type.compare_no_case("parmetis") == 0))
          {
            _allow_parti_metis = true;
            return true;
          }
          if(type.compare_no_case("genetic") == 0)
          {
            _allow_parti_genetic = true;
            return true;
          }
          if(type.compare_no_case("naive") == 0)
          {
            _allow_parti_naive = true;
            return true;
          }
          if(type.compare_no_case("zoltan") == 0)
          {
            _allow_parti_zoltan = true;
            return true;
          }

          // unknown type name
          return false;
        }


        /**
         * \brief Computes the element weights for the partitioner
         *
         * This base implementation ignores both arguments and returns an empty vector.
         *
         * \returns An empty weight vector.
         */
        virtual std::vector<WeightType> _compute_weights(Ancestor& DOXY(ancestor), const MeshNodeType& DOXY(base_mesh_node))
        {
          std::vector<WeightType> no_weights;
          return no_weights;
        }


        virtual void _create_ancestry_single()

        {

          // for more than 2 desired levels, call _create_ancestry_scattered

          XASSERTM(this->_desired_levels.size() <= std::size_t(2), "multi-layered control is desired here");


          // allocate and create ancestry

          this->_ancestry.resize(std::size_t(1));

          Ancestor& ancestor = this->_ancestry.front();


          // set the layer index to 0

          ancestor.layer = 0;


          // set the parent layer index to -1

          ancestor.layer_p = -1;


          // set the total number of processes for this layer

          ancestor.num_procs = this->_comm.size();


          // set the total number of partitions per progeny group

          ancestor.num_parts = this->_comm.size();


          // set desired maximum level

          ancestor.desired_level_max = this->_desired_levels.front().first;


          // set desired minimum level (may be = level_max)

          ancestor.desired_level_min = this->_desired_levels.back().first;


          // set the progeny group

          ancestor.progeny_group = 0;

          ancestor.progeny_child = this->_comm.rank();


          // create the progeny communicator

          ancestor.progeny_count = this->_comm.size();

          ancestor.progeny_first = 0;

          ancestor.progeny_comm = this->_comm.comm_dup();

        }


        // Note: all following member functions are only required for parallel builds,

        // so we enclose them in the following #if-block to reduce compile times.


#if defined(FEAT_HAVE_MPI) || defined(DOXYGEN)


        virtual void _create_multi_layers_scattered()

        {

          // create and push global layer

          this->push_layer(std::make_shared<LayerType>(this->_comm.comm_dup(), 0));


          // loop over all desired layers

          for(std::size_t ilay(1u); (ilay+1u) < this->_desired_levels.size(); ++ilay)

          {

            // get child layer

            std::shared_ptr<LayerType> layer_c = this->_layers.back();


            // get child layer communicator

            const Dist::Comm& comm_c = layer_c->comm();


            // get number of processes in child comm

            const int nprocs_c = comm_c.size();


            // get desired number of processes for parent comm

            const int nprocs_p = this->_desired_levels.at(ilay).second;

            XASSERT(nprocs_p < nprocs_c);

            XASSERT(nprocs_p > 0);

            XASSERT(nprocs_c % nprocs_p == 0); // same number of children for each parent


            // compute number of siblings = children per parent

            const int num_sibs = nprocs_c / nprocs_p;


            // get my rank in child comm

            const int my_rank_c = comm_c.rank();


            // compute my parent's rank in child comm

            const int parent_rank_c = (my_rank_c / num_sibs) * num_sibs;


            // create our sibling communicator and set the parent rank

            layer_c->set_parent(comm_c.comm_create_range_incl(num_sibs, parent_rank_c), 0);


            // next, create the actual parent communicator

            Dist::Comm comm_p = comm_c.comm_create_range_incl(nprocs_p, 0, num_sibs);


            // Are we the parent?

            if(parent_rank_c == my_rank_c)

            {

              // make sure we have a valid communicator

              XASSERT(!comm_p.is_null());


              // push the parent layer

              this->push_layer(std::make_shared<LayerType>(std::move(comm_p), int(ilay)));

            }

            else

            {

              // We are not a parent, so we must have received a null communicator

              XASSERT(comm_p.is_null());


              // Exit the loop, as we are not part of the party anymore...

              break;

            }

          }

        }


        virtual void _create_ancestry_scattered()

        {

          // the layers must have been created already

          XASSERT(!this->_layers.empty());


          // create a deque with the number of processes for each layer

          std::deque<int> num_procs;

          for(auto it = this->_desired_levels.begin(); it != this->_desired_levels.end(); ++it)

          {

            if(it->second > 1)

              num_procs.push_back(it->second);

          }

          // manually add the base-layer

          num_procs.push_back(1);


          // allocate and create ancestry

          this->_ancestry.resize(num_procs.size()-std::size_t(1));


          // set up the ancestry

          const int main_rank = this->_comm.rank();

          const int main_size = this->_comm.size();

          for(std::size_t i(0); i < this->_ancestry.size(); ++i)

          {

            // get our ancestor info

            Ancestor& ancestor = this->_ancestry.at(i);


            // set the layer index (or -1, if this process is not part of that layer)

            ancestor.layer = (i < this->_layers.size() ? int(i) : -1);


            // set the parent layer index (or -1, if this process is not in the parent layer)

            ancestor.layer_p = ((i+1u) < this->_layers.size() ? int(i)+1 : -1);


            // set the total number of processes for this layer

            ancestor.num_procs = num_procs.at(i);


            // set the total number of partitions per progeny group

            ancestor.num_parts = num_procs.at(i) / num_procs.at(i+1u);


            // set desired maximum level

            XASSERT(i < this->_desired_levels.size());

            ancestor.desired_level_max = this->_desired_levels.at(i).first;


            // set desired minimum level

            if((i+1u) < this->_desired_levels.size())

              ancestor.desired_level_min = this->_desired_levels.at(i+1).first;

            else

              ancestor.desired_level_min = ancestor.desired_level_max;


            // set the progeny group

            ancestor.progeny_group = ((main_rank * num_procs.at(i+1u)) / main_size) * ancestor.num_parts;

            ancestor.progeny_child = ((main_rank * num_procs.at(i)) / main_size) % ancestor.num_parts;


            // create the progeny communicator

            ancestor.progeny_count = main_size / num_procs.at(i+1u);

            ancestor.progeny_first = (main_rank / ancestor.progeny_count) * ancestor.progeny_count;

            ancestor.progeny_comm = this->_comm.comm_create_range_incl(ancestor.progeny_count, ancestor.progeny_first);

          }

        }


        virtual void _split_basemesh_halos(

          const Ancestor& ancestor,

          const MeshNodeType& base_mesh_node,

          MeshNodeType& patch_mesh_node,

          std::vector<int>& neighbor_ranks)

        {

          // get the map of the base-mesh halos

          const std::map<int, std::unique_ptr<MeshPartType>>& base_halo_map = base_mesh_node.get_halo_map();


          // if the base mesh has no halos, then we can jump out of here

          if(base_halo_map.empty())

            return;


          // get number of halos

          const std::size_t num_halos = base_halo_map.size();


          // create a halo splitter

          Geometry::PatchHaloSplitter<MeshType> halo_splitter(*base_mesh_node.get_mesh(),

            *base_mesh_node.get_patch(ancestor.progeny_child));


          // add each base-mesh halo to our halo splitter and store the resulting split data size

          std::vector<int> halo_ranks;

          std::vector<std::size_t> halo_sizes;

          for(auto it = base_halo_map.begin(); it != base_halo_map.end(); ++it)

          {

            // store halo rank

            halo_ranks.push_back(it->first);


            // try to split the halo and store the resulting data size

            halo_sizes.push_back(halo_splitter.add_halo(it->first, *it->second));

          }


          // This vector will receive the split halo data from all our potential neighbor processes

          std::vector<Index> halo_recv_data;

          std::vector<std::vector<Index>> halo_send_data;


          /* ******************************************************************************************************* */

          /* ******************************************************************************************************* */

          // PHASE I: collect halo data from our siblings

          /* ******************************************************************************************************* */

          /* ******************************************************************************************************* */

          if(ancestor.layer >= 0)

          {

            XASSERT(this->_layers.size() > std::size_t(ancestor.layer));

            const LayerType& layer = *this->_layers.at(std::size_t(ancestor.layer));

            const Dist::Comm& sibling_comm = *layer.sibling_comm_ptr();

            XASSERT(!sibling_comm.is_null());

            const std::size_t num_sibls = std::size_t(sibling_comm.size());


            // get the rank of this process in various communicators

            const int sibl_rank = sibling_comm.rank();

            const int layer_rank = layer.comm().rank();


            // gather halo infos of all siblings at sibling rank 0

            std::vector<std::size_t> sibl_halo_sizes(sibl_rank == 0 ? num_halos*num_sibls : 0u);

            sibling_comm.gather(halo_sizes.data(), halo_sizes.size(), sibl_halo_sizes.data(), halo_sizes.size(), 0);


            if(sibl_rank > 0)

            {

              std::vector<std::vector<Index>> halo_split_data(num_halos);

              Dist::RequestVector send_reqs(num_halos);


              // serialize all split halos

              for(std::size_t i(0); i < num_halos; ++i)

              {

                // skip empty halos

                if(halo_sizes.at(i) == Index(0))

                  continue;


                // serialize split halo data

                halo_split_data.at(i) = halo_splitter.serialize_split_halo(halo_ranks[i], layer_rank);

                XASSERT(halo_split_data.at(i).size() == halo_sizes.at(i));


                // send split data over to our parent process

                send_reqs[i] = sibling_comm.isend(halo_split_data.at(i).data(), halo_sizes.at(i), 0);

              }


              // wait for all pending sends to finish

              send_reqs.wait_all();

            }

            else // if(sibl_rank == 0)

            {

              halo_send_data.resize(num_halos);


              // compute halo send data sizes

              for(std::size_t i(0); i < num_halos; ++i)

              {

                // determine the number of child processes for this halo

                // as well as the required send buffer size

                Index num_halo_childs = 0u;

                std::size_t buffer_size = 0u, offset = 0u;

                for(std::size_t j(0); j < num_sibls; ++j)

                {

                  // update required buffer size

                  buffer_size += sibl_halo_sizes.at(j*num_halos + i);


                  // this sibling is a child if its split halo is not empty

                  if(sibl_halo_sizes.at(j*num_halos + i) > std::size_t(0))

                    ++num_halo_childs;

                }


                // increase buffer size to store child data offsets

                buffer_size += num_halo_childs + Index(1);


                // allocate send buffer and get a pointer to its data array

                halo_send_data.at(i).resize(buffer_size);

                Index* halo_buffer = halo_send_data.at(i).data();


                // store child count as first entry of buffer

                halo_buffer[0u] = num_halo_childs;


                // initialize offset for first child

                offset = num_halo_childs + Index(1);

                Index coi = 0u; // child offset index


                // collect my own split halo

                if(sibl_halo_sizes.at(i) > Index(0))

                {

                  std::vector<Index> my_data(halo_splitter.serialize_split_halo(halo_ranks[i], layer_rank));

                  std::size_t data_size = sibl_halo_sizes.at(i);

                  halo_buffer[++coi] = Index(offset);

                  for(std::size_t k(0); k < data_size; ++k)

                    halo_buffer[offset+k] = my_data[k];

                  offset += my_data.size();

                }


                Dist::RequestVector sibl_recv_reqs(num_sibls);


                // collect the other siblings

                for(std::size_t j(1); j < num_sibls; ++j)

                {

                  // skip all siblings with empty halos

                  std::size_t data_size = sibl_halo_sizes.at(j*num_halos + i);

                  if(data_size == std::size_t(0))

                    continue;

                  XASSERT(offset+data_size <= buffer_size);


                  // store offset for this child

                  halo_buffer[++coi] = Index(offset);


                  // receive serialized data from this sibling

                  sibl_recv_reqs[j] = sibling_comm.irecv(&halo_buffer[offset], data_size, int(j));

                  offset += data_size;

                }

                XASSERT(offset == buffer_size);


                // wait for all pending receives to finish

                sibl_recv_reqs.wait_all();

              }

            }

          } // if(ancestor.layer >= 0)


          /* ******************************************************************************************************* */

          /* ******************************************************************************************************* */

          // PHASE II: exchange split halos over parent layer communicator

          /* ******************************************************************************************************* */

          /* ******************************************************************************************************* */


          if(ancestor.layer_p >= 0)

          {

            XASSERT(!halo_send_data.empty());


            // get the parent layer communicator

            const Dist::Comm& parent_comm = this->_layers.at(std::size_t(ancestor.layer_p))->comm();


            std::vector<std::size_t> halo_recv_sizes(num_halos), halo_send_sizes(num_halos);

            Dist::RequestVector halo_recv_reqs(num_halos), halo_send_reqs(num_halos);


            // exchange halo send data sizes

            for(std::size_t i(0); i < num_halos; ++i)

            {

              // get halo send size

              halo_send_sizes.at(i) = halo_send_data.at(i).size();


              // post receive requests

              halo_recv_reqs[i] = parent_comm.irecv(&halo_recv_sizes[i], std::size_t(1), halo_ranks[i]);


              // post send requests

              halo_send_reqs[i] = parent_comm.isend(&halo_send_sizes[i], std::size_t(1), halo_ranks[i]);

            }


            // wait for sends and receives to finish

            halo_recv_reqs.wait_all();

            halo_send_reqs.wait_all();


            // compute total receive buffer size

            std::size_t recv_buf_size = num_halos + std::size_t(1);

            for(std::size_t i(0); i < num_halos; ++i)

              recv_buf_size += halo_recv_sizes[i];


            // allocate receive buffer

            halo_recv_data.resize(recv_buf_size);


            // set up receive data pointers

            halo_recv_data[0] = Index(num_halos) + Index(1);

            for(std::size_t i(0); i < num_halos; ++i)

              halo_recv_data[i+1u] = Index(halo_recv_data[i] + halo_recv_sizes[i]);


            // allocate receive buffers and post receives

            for(std::size_t i(0); i < num_halos; ++i)

            {

              // resize buffer and post receive

              halo_recv_reqs[i] = parent_comm.irecv(&halo_recv_data[halo_recv_data[i]], halo_recv_sizes.at(i), halo_ranks[i]);


              // post send of actual halo buffer

              halo_send_reqs[i] = parent_comm.isend(halo_send_data.at(i).data(), halo_send_sizes.at(i), halo_ranks[i]);

            }


            // wait for sends and receives to finish

            halo_recv_reqs.wait_all();

            halo_send_reqs.wait_all();

          } // if(ancestor.layer_p >= 0)


          /* ******************************************************************************************************* */

          /* ******************************************************************************************************* */

          // PHASE III: broadcast halo receive data over progeny comm

          /* ******************************************************************************************************* */

          /* ******************************************************************************************************* */


          {

            // broadcast receive buffer size

            std::size_t recv_data_size = halo_recv_data.size();

            ancestor.progeny_comm.bcast(&recv_data_size, std::size_t(1), 0);


            // allocate buffer

            if(ancestor.progeny_comm.rank() != 0)

            {

              XASSERT(halo_recv_data.empty()); // should be empty until now

              halo_recv_data.resize(recv_data_size);

            }

            else

            {

              XASSERT(!halo_recv_data.empty()); // must not be empty

            }


            // broadcast buffer

            ancestor.progeny_comm.bcast(halo_recv_data.data(), recv_data_size, 0);

          }


          /*{

          String s;

          for(std::size_t i(0); i < num_halos; ++i)

          {

          s += stringify(halo_ranks[i]);

          s += " >";

          for(Index j(halo_recv_data[i]); j < halo_recv_data[i+1]; ++j)

          (s += " ") += stringify(halo_recv_data[j]);

          s += "\n";

          }

          this->_comm.allprint(s);

          }*/


          /* ******************************************************************************************************* */

          /* ******************************************************************************************************* */

          // PHASE IV: intersect received halo splits

          /* ******************************************************************************************************* */

          /* ******************************************************************************************************* */


          for(std::size_t i(0); i < num_halos; ++i)

          {

            // get the offset of the first data entry for this halo

            const Index offset = halo_recv_data.at(i);


            // get the number of child processes for this halo

            const Index num_childs = halo_recv_data.at(offset);


            // loop over all child processes

            for(Index j(0); j < num_childs; ++j)

            {

              // compute the offset of this child's data within the large buffer

              const Index buffer_offset = offset + halo_recv_data.at(offset+j+1u);


              // intersect with our other halo

              if(!halo_splitter.intersect_split_halo(halo_ranks[i], halo_recv_data, buffer_offset))

                continue; // no intersection


              // get the new neighbor's rank

              const int neighbor_rank = int(halo_recv_data.at(buffer_offset));


              // add the new neighbor to our list

              neighbor_ranks.push_back(neighbor_rank);


              // create new mesh-part

              patch_mesh_node.add_halo(neighbor_rank, halo_splitter.make_unique());

            }

          }

        }


        /**
         * \brief Checks for an appropriate partitioning strategy.
         *
         * This implementation never selects an a-priori partitioning. It only determines the
         * refinement level on which the mesh offers enough elements for an a-posteriori
         * partitioner and raises the partitioning level of the ancestor accordingly.
         *
         * \param[in,out] ancestor
         * The ancestor whose \c parti_found flag is reset and whose \c parti_level is raised if necessary.
         *
         * \param[in] mesh_node
         * The mesh node whose element count is the starting point of the level estimate.
         *
         * \param[in] is_base_layer
         * Not used by this implementation.
         *
         * \returns
         * Always \c false, i.e. no a-priori partitioning was chosen.
         */
        virtual bool _check_parti(Ancestor& ancestor, const MeshNodeType& mesh_node, bool DOXY(is_base_layer))
        {
          // every refinement step multiplies the number of elements by this shape-dependent factor
          const Index refine_factor = Index(Geometry::Intern::StandardRefinementTraits<typename BaseClass::ShapeType, BaseClass::ShapeType::dimension>::count);

          // total number of elements that an a-posteriori partitioner requires
          const Index required_elems = Index(ancestor.num_parts) * Index(_required_elems_per_rank);

          // start from the element count of the given mesh and refine "virtually"
          // until the required number of elements is reached
          Index elem_count = mesh_node.get_mesh()->get_num_elements();
          int required_level = 0;
          while(elem_count < required_elems)
          {
            elem_count *= refine_factor;
            ++required_level;
          }

          // no partitioning has been found so far
          ancestor.parti_found = false;

          // the user may have chosen a greater level for partitioning; never go below the required one
          ancestor.parti_level = Math::max(ancestor.parti_level, required_level);

          // no a-priori partitioning; an a-posteriori partitioner has to be tried later
          return false;
        }


        /**
         * \brief Applies an a-posteriori partitioner.
         *
         * \param[in,out] ancestor
         * The ancestor for which a partitioning is to be computed.
         *
         * \param[in] base_mesh_node
         * The mesh node that is to be partitioned.
         *
         * \returns
         * \c true if nothing had to be done or if one of the partitioners succeeded, otherwise \c false.
         */
        virtual bool _apply_parti(Ancestor& ancestor, /*const*/ MeshNodeType& base_mesh_node)
        {
          // obtain the element weights for the partitioners
          const std::vector<WeightType> elem_weights = this->_compute_weights(ancestor, base_mesh_node);

          // an a-priori partitioning without any weights does not require an a-posteriori partitioner
          if(ancestor.parti_apriori && elem_weights.empty())
            return true;

          // give up if the mesh has fewer elements than the number of requested partitions
          const Index elem_count = base_mesh_node.get_mesh()->get_num_elements();
          if(elem_count < Index(ancestor.num_parts))
            return false;

          // try the a-posteriori partitioners one after another; the first one that succeeds wins
          // and the remaining ones are not called anymore
          return this->_apply_parti_metis(ancestor, base_mesh_node, elem_weights)
            || this->_apply_parti_zoltan(ancestor, base_mesh_node, elem_weights)
            || this->_apply_parti_genetic(ancestor, base_mesh_node, elem_weights)
            || this->_apply_parti_naive(ancestor, base_mesh_node, elem_weights);
        }


        /**
         * \brief Applies the Zoltan partitioner onto the base-mesh.
         *
         * \param[in,out] ancestor
         * The ancestor that receives the partitioning graph, the info string and the found-flag on success.
         *
         * \param[in] base_mesh_node
         * The mesh node that is to be partitioned.
         *
         * \param[in] weights
         * The element weights that are passed on to the partitioner.
         *
         * \returns
         * \c true if the partitioner was applied successfully; \c false if Zoltan support is not
         * compiled in, the partitioner is not allowed or its execution failed.
         */
        bool _apply_parti_zoltan(Ancestor& ancestor, const MeshNodeType& base_mesh_node, const std::vector<WeightType>& weights)
        {
#ifndef FEAT_HAVE_ZOLTAN
          // no Zoltan support available: mark all parameters as used and report failure
          (void)ancestor;
          (void)base_mesh_node;
          (void)weights;
          return false;
#else // FEAT_HAVE_ZOLTAN
          // has the user enabled this partitioner at all?
          if(!this->_allow_parti_zoltan)
            return false;

          // the partitioner works on the progeny communicator of this ancestor
          Geometry::PartiZoltan zoltan(ancestor.progeny_comm);

          // fetch the index set from which the partitioner derives the element adjacency
          // NOTE(review): this is the <shape_dim, 0> index set although the variable is named
          // faces-at-element -- confirm that this is the intended adjacency
          constexpr int shape_dim = MeshNodeType::MeshType::ShapeType::dimension;
          const auto& faces_at_elem = base_mesh_node.get_mesh()->template get_index_set<shape_dim, 0>();

          // run the partitioner and bail out if it fails
          if(!zoltan.execute(faces_at_elem, Index(ancestor.num_parts), weights))
            return false;

          // success: store the elements-at-rank graph along with the info string and the found-flag
          ancestor.parti_graph = zoltan.build_elems_at_rank();
          ancestor.parti_info = String("Applied Zoltan partitioner");
          ancestor.parti_found = true;
          return true;
#endif // FEAT_HAVE_ZOLTAN
        }


        /**
         * \brief Applies the METIS partitioner onto the base-mesh.
         *
         * \param[in,out] ancestor
         * The ancestor that receives the partitioning graph, the info string and the found-flag on success.
         *
         * \param[in] base_mesh_node
         * The mesh node that is to be partitioned.
         *
         * \param[in] weights
         * The element weights that are passed on to the partitioner.
         *
         * \returns
         * \c true if the partitioner was applied successfully; \c false if ParMETIS support is not
         * compiled in, the partitioner is not allowed or its execution failed.
         */
        bool _apply_parti_metis(Ancestor& ancestor, const MeshNodeType& base_mesh_node, const std::vector<WeightType>& weights)
        {
#ifndef FEAT_HAVE_PARMETIS
          // no ParMETIS support available: mark all parameters as used and report failure
          (void)ancestor;
          (void)base_mesh_node;
          (void)weights;
          return false;
#else // FEAT_HAVE_PARMETIS
          // has the user enabled this partitioner at all?
          if(!this->_allow_parti_metis)
            return false;

          // the partitioner works on the progeny communicator of this ancestor
          Geometry::PartiParMETIS parmetis(ancestor.progeny_comm);

          // fetch the index set from which the partitioner derives the element adjacency
          // NOTE(review): this is the very same <shape_dim, 0> index set that is fetched as
          // vertices-at-element below -- confirm that this is the intended adjacency
          constexpr int shape_dim = MeshNodeType::MeshType::ShapeType::dimension;
          const auto& faces_at_elem = base_mesh_node.get_mesh()->template get_index_set<shape_dim, 0>();

          // fetch the vertices-at-element index set and the vertex set of the mesh
          const auto& verts_at_elem = base_mesh_node.get_mesh()->template get_index_set<shape_dim, 0>();
          const auto& vertex_set =  base_mesh_node.get_mesh()->get_vertex_set();

          // run the partitioner and bail out if it fails
          if(!parmetis.execute(faces_at_elem, verts_at_elem, vertex_set, ancestor.num_parts, weights))
            return false;

          // success: store the elements-at-rank graph along with the info string and the found-flag
          ancestor.parti_graph = parmetis.build_elems_at_rank();
          ancestor.parti_info = String("Applied ParMETIS partitioner");
          ancestor.parti_found = true;
          return true;
#endif // FEAT_HAVE_PARMETIS
        }


        /**
         * \brief Applies the genetic partitioner onto the base-mesh.
         *
         * \param[in,out] ancestor
         * The ancestor that receives the partitioning graph, the info string and the found-flag.
         *
         * \param[in] base_mesh_node
         * The mesh node that is to be partitioned.
         *
         * \param[in] weights
         * The element weights; this partitioner is skipped unless this vector is empty.
         *
         * \returns
         * \c true if the partitioner was applied; \c false if it is not allowed or if weights were given.
         */
        bool _apply_parti_genetic(Ancestor& ancestor, /*const*/ MeshNodeType& base_mesh_node, const std::vector<WeightType>& weights)
        {
          // this partitioner is only used if it is enabled and no element weights were given
          const bool usable = this->_allow_parti_genetic && weights.empty();
          if(!usable)
            return false;

          // set up the genetic partitioner on the progeny communicator of this ancestor
          Geometry::PartiIterative<MeshType> genetic(
            *base_mesh_node.get_mesh(),
            ancestor.progeny_comm,
            Index(ancestor.num_parts),
            this->_genetic_time_init,
            this->_genetic_time_mutate);

          // store the elements-at-rank graph along with the info string and the found-flag
          ancestor.parti_graph = genetic.build_elems_at_rank();
          ancestor.parti_info = String("Applied genetic partitioner");
          ancestor.parti_found = true;
          return true;
        }


        /**
         * \brief Applies the naive partitioner onto the base-mesh.
         *
         * The elements are distributed in their natural order: partition \c i receives the contiguous
         * element range <c>[ptr[i], ptr[i+1])</c> of the created elements-at-rank graph. Without
         * weights the ranges are (almost) equally sized; with weights the range boundaries are
         * chosen so that the accumulated weight up to partition \c i reaches <c>i/num_parts</c> of
         * the total weight.
         *
         * \param[in,out] ancestor
         * The ancestor that receives the partitioning graph, the info string and the found-flag.
         *
         * \param[in] mesh_node
         * The mesh node that is to be partitioned; it must have at least as many elements as
         * there are partitions.
         *
         * \param[in] weights
         * The element weights; either empty (unweighted partitioning) or exactly one weight per element.
         *
         * \returns
         * \c true if the partitioner was applied; \c false if it is not allowed.
         */
        bool _apply_parti_naive(Ancestor& ancestor, const MeshNodeType& mesh_node, const std::vector<WeightType>& weights)
        {
          // is this even allowed?
          if(!this->_allow_parti_naive)
            return false;

          const Index num_parts = Index(ancestor.num_parts);
          const Index num_elems = mesh_node.get_mesh()->get_num_elements();
          XASSERTM(num_parts <= num_elems, "Base-Mesh does not have enough elements");

          // the weighted branch below reads weights[j] for element indices j < num_elems,
          // so a non-empty weight vector must provide exactly one weight per element
          XASSERTM(weights.empty() || (weights.size() == std::size_t(num_elems)),
            "Number of weights does not match number of elements");

          // create elems-at-rank graph
          ancestor.parti_graph = Adjacency::Graph(num_parts, num_elems, num_elems);
          Index* ptr = ancestor.parti_graph.get_domain_ptr();
          Index* idx = ancestor.parti_graph.get_image_idx();

          // weighted partitioning?
          if(!weights.empty())
          {
            // compute the total weight of all elements
            WeightType weight_sum(0.0);
            for(auto w : weights)
            {
              weight_sum += w;
            }

            ptr[0] = Index(0);
            WeightType weight_count(0.);
            for(Index i(1), last(0); i < num_parts; ++i)
            {
              // add as many elements as we need to achieve the target weight for this partition;
              // 'last' and 'weight_count' carry over from one partition to the next
              WeightType target_weight = weight_sum * WeightType(i) / WeightType(num_parts);
              for(; (weight_count < target_weight) && (last < num_elems); ++last)
                weight_count += weights[last];

              ptr[i] = last;
            }
            ptr[num_parts] = num_elems;
          }
          else
          {
            // unweighted partitioning: split the element range into (almost) equally sized chunks
            ptr[0] = Index(0);
            for(Index i(1); i < num_parts; ++i)
              ptr[i] = (i*num_elems) / num_parts;
            ptr[num_parts] = num_elems;
          }

          // the elements are assigned in their natural order
          for(Index j(0); j < num_elems; ++j)
            idx[j] = j;

          // set info string
          ancestor.parti_info = String("Applied naive partitioner");

          // partitioning found
          ancestor.parti_found = true;

          // okay
          return true;
        }

#endif // defined(FEAT_HAVE_MPI) || defined(DOXYGEN)

      }; // class PartiDomainControlBase<...>

    } // namespace Domain

  } // namespace Control

} // namespace FEAT

XASSERT
#define XASSERT(expr)
Assertion macro definition.
Definition: assertion.hpp:262

XASSERTM
#define XASSERTM(expr, msg)
Assertion macro definition with custom message.
Definition: assertion.hpp:263

base_header.hpp
FEAT Kernel base header.

FEAT::Adjacency::Graph
Adjacency Graph implementation.
Definition: graph.hpp:34

FEAT::Adjacency::Graph::get_domain_ptr
Index * get_domain_ptr()
Returns the domain pointer array.
Definition: graph.hpp:359

FEAT::Adjacency::Graph::get_image_idx
Index * get_image_idx()
Returns the image node index array.
Definition: graph.hpp:374

FEAT::BinaryStream
Binary Stream class.
Definition: binary_stream.hpp:30

FEAT::BinaryStream::container
std::vector< char > & container()
Returns a reference to the internal vector container.
Definition: binary_stream.hpp:236

FEAT::Control::Domain::DomainControl
Domain control base-class template.
Definition: domain_control.hpp:457

FEAT::Control::Domain::DomainLayer
Domain Layer class.
Definition: domain_control.hpp:62

FEAT::Control::Domain::PartiDomainControlBase::Ancestor
Ancestor info class.
Definition: parti_domain_control_base.hpp:67

FEAT::Control::Domain::PartiDomainControlBase::Ancestor::parti_apriori
bool parti_apriori
specifies whether the chosen partitioning is an a-priori partitioning strategy
Definition: parti_domain_control_base.hpp:91

FEAT::Control::Domain::PartiDomainControlBase::Ancestor::desired_level_max
int desired_level_max
the desired minimum and maximum refinement levels for this layer
Definition: parti_domain_control_base.hpp:78

FEAT::Control::Domain::PartiDomainControlBase::Ancestor::parti_level
int parti_level
the refinement level on which the patch is to be partitioned
Definition: parti_domain_control_base.hpp:89

FEAT::Control::Domain::PartiDomainControlBase::Ancestor::parti_info
String parti_info
a string containing some information about the chosen partitioning
Definition: parti_domain_control_base.hpp:87

FEAT::Control::Domain::PartiDomainControlBase::Ancestor::parti_found
bool parti_found
specifies whether a partitioning was found
Definition: parti_domain_control_base.hpp:85

FEAT::Control::Domain::PartiDomainControlBase::Ancestor::num_procs
int num_procs
the number of processes that participate in this layer
Definition: parti_domain_control_base.hpp:74

FEAT::Control::Domain::PartiDomainControlBase::Ancestor::parti_graph
Adjacency::Graph parti_graph
this is the actual elements-at-rank partitioning graph
Definition: parti_domain_control_base.hpp:93

FEAT::Control::Domain::PartiDomainControlBase::Ancestor::layer_p
int layer_p
the index of the parent layer or -1, if this process is not part of the parent layer
Definition: parti_domain_control_base.hpp:72

FEAT::Control::Domain::PartiDomainControlBase::Ancestor::layer
int layer
the index of the layer that this ancestor object belongs to
Definition: parti_domain_control_base.hpp:70

FEAT::Control::Domain::PartiDomainControlBase::Ancestor::num_parts
int num_parts
the number of partitions for each patch of the parent layer
Definition: parti_domain_control_base.hpp:76

FEAT::Control::Domain::PartiDomainControlBase
Base-Class for Hierarchical Domain Control implementations.
Definition: parti_domain_control_base.hpp:43

FEAT::Control::Domain::PartiDomainControlBase::get_chosen_levels
const std::deque< std::pair< int, int > > get_chosen_levels() const
Returns the deque of chosen refinement levels.
Definition: parti_domain_control_base.hpp:563

FEAT::Control::Domain::PartiDomainControlBase::format_desired_levels
virtual String format_desired_levels() const
Returns the desired levels formatted as a parsable string.
Definition: parti_domain_control_base.hpp:480

FEAT::Control::Domain::PartiDomainControlBase::_allow_parti_naive
bool _allow_parti_naive
allow naive partitioner?
Definition: parti_domain_control_base.hpp:121

FEAT::Control::Domain::PartiDomainControlBase::get_desired_level_min
int get_desired_level_min() const
Returns the desired minimum refinement level.
Definition: parti_domain_control_base.hpp:468

FEAT::Control::Domain::PartiDomainControlBase::PartiDomainControlBase
PartiDomainControlBase(const Dist::Comm &comm_, bool support_multi_layered)
Constructor.
Definition: parti_domain_control_base.hpp:154

FEAT::Control::Domain::PartiDomainControlBase::_compute_weights
virtual std::vector< WeightType > _compute_weights(Ancestor &ancestor, const MeshNodeType &base_mesh_node)
Computes the element partitioning weights.
Definition: parti_domain_control_base.hpp:751

FEAT::Control::Domain::PartiDomainControlBase::_reset_parti_types
virtual void _reset_parti_types()
Resets/disables all partitioner types.
Definition: parti_domain_control_base.hpp:713

FEAT::Control::Domain::PartiDomainControlBase::set_adapt_mode
void set_adapt_mode(Geometry::AdaptMode adapt_mode)
Sets the adapt-mode for refinement.
Definition: parti_domain_control_base.hpp:292

FEAT::Control::Domain::PartiDomainControlBase::dump_ancestry
String dump_ancestry() const
Debugging function: Returns a string containing encoded ancestry information.
Definition: parti_domain_control_base.hpp:571

FEAT::Control::Domain::PartiDomainControlBase::set_desired_levels
void set_desired_levels(const String &slvls)
Sets the desired levels for the partitioned hierarchy.
Definition: parti_domain_control_base.hpp:315

FEAT::Control::Domain::PartiDomainControlBase::get_desired_levels
const std::deque< std::pair< int, int > > get_desired_levels() const
Returns the deque of desired refinement levels.
Definition: parti_domain_control_base.hpp:553

FEAT::Control::Domain::PartiDomainControlBase::_desired_levels
std::deque< std::pair< int, int > > _desired_levels
desired level deque
Definition: parti_domain_control_base.hpp:129

FEAT::Control::Domain::PartiDomainControlBase::_required_elems_per_rank
int _required_elems_per_rank
required number of elements per rank for a-posteriori partitioning
Definition: parti_domain_control_base.hpp:135

FEAT::Control::Domain::PartiDomainControlBase::_chosen_levels
std::deque< std::pair< int, int > > _chosen_levels
chosen level deque
Definition: parti_domain_control_base.hpp:132

FEAT::Control::Domain::PartiDomainControlBase::_create_ancestry_scattered
virtual void _create_ancestry_scattered()
Creates the ancestry for a multi-layered domain control in a scattered fashion.
Definition: parti_domain_control_base.hpp:865

FEAT::Control::Domain::PartiDomainControlBase::WeightType
Real WeightType
weight type for partitioner element weights; always Real
Definition: parti_domain_control_base.hpp:61

FEAT::Control::Domain::PartiDomainControlBase::_genetic_time_mutate
double _genetic_time_mutate
time for genetic partitioner mutation
Definition: parti_domain_control_base.hpp:139

FEAT::Control::Domain::PartiDomainControlBase::_ancestry
std::deque< Ancestor > _ancestry
the partition ancestry deque
Definition: parti_domain_control_base.hpp:142

FEAT::Control::Domain::PartiDomainControlBase::_apply_parti_zoltan
bool _apply_parti_zoltan(Ancestor &ancestor, const MeshNodeType &base_mesh_node, const std::vector< WeightType > &weights)
Applies the Zoltan partitioner onto the base-mesh.
Definition: parti_domain_control_base.hpp:1339

FEAT::Control::Domain::PartiDomainControlBase::_apply_parti_naive
bool _apply_parti_naive(Ancestor &ancestor, const MeshNodeType &mesh_node, const std::vector< WeightType > &weights)
Applies the naive partitioner onto the base-mesh.
Definition: parti_domain_control_base.hpp:1486

FEAT::Control::Domain::PartiDomainControlBase::_apply_parti_metis
bool _apply_parti_metis(Ancestor &ancestor, const MeshNodeType &base_mesh_node, const std::vector< WeightType > &weights)
Applies the METIS partitioner onto the base-mesh.
Definition: parti_domain_control_base.hpp:1391

FEAT::Control::Domain::PartiDomainControlBase::parse_args
virtual bool parse_args(SimpleArgParser &args)
Parses the partitioner options from an argument parser.
Definition: parti_domain_control_base.hpp:188

FEAT::Control::Domain::PartiDomainControlBase::_apply_parti_genetic
bool _apply_parti_genetic(Ancestor &ancestor, MeshNodeType &base_mesh_node, const std::vector< WeightType > &weights)
Applies the genetic partitioner onto the base-mesh.
Definition: parti_domain_control_base.hpp:1444

FEAT::Control::Domain::PartiDomainControlBase::MeshNodeType
Geometry::RootMeshNode< MeshType > MeshNodeType
our root mesh node type
Definition: parti_domain_control_base.hpp:56

FEAT::Control::Domain::PartiDomainControlBase::get_ancestry
const std::deque< Ancestor > & get_ancestry() const
Returns a const reference to the ancestry.
Definition: parti_domain_control_base.hpp:606

FEAT::Control::Domain::PartiDomainControlBase::serialize_partitioning
std::vector< char > serialize_partitioning() const
Serializes the partitioning information into a binary buffer.
Definition: parti_domain_control_base.hpp:614

FEAT::Control::Domain::PartiDomainControlBase::_parse_parti_type
virtual bool _parse_parti_type(const String &type)
Parses a partitioner type.
Definition: parti_domain_control_base.hpp:727

FEAT::Control::Domain::PartiDomainControlBase::format_chosen_levels
virtual String format_chosen_levels() const
Returns the chosen levels formatted as a parsable string.
Definition: parti_domain_control_base.hpp:501

FEAT::Control::Domain::PartiDomainControlBase::set_desired_levels
virtual void set_desired_levels(int lvl_max, int lvl_med, int lvl_min)
Sets the desired refinement levels for a double-layered hierarchy.
Definition: parti_domain_control_base.hpp:429

FEAT::Control::Domain::PartiDomainControlBase::MeshPartType
LevelType::PartType MeshPartType
our mesh-part type
Definition: parti_domain_control_base.hpp:58

FEAT::Control::Domain::PartiDomainControlBase::get_adapt_mode
Geometry::AdaptMode get_adapt_mode() const
Gets the adapt-mode for refinement.
Definition: parti_domain_control_base.hpp:304

FEAT::Control::Domain::PartiDomainControlBase::_create_ancestry_single
virtual void _create_ancestry_single()
Creates the ancestry for a single layer (or a single process)
Definition: parti_domain_control_base.hpp:759

FEAT::Control::Domain::PartiDomainControlBase::_adapt_mode
Geometry::AdaptMode _adapt_mode
the adapt mode for refinement
Definition: parti_domain_control_base.hpp:114

FEAT::Control::Domain::PartiDomainControlBase::_allow_parti_metis
bool _allow_parti_metis
allow metis partitioner?
Definition: parti_domain_control_base.hpp:117

FEAT::Control::Domain::PartiDomainControlBase::get_desired_level_max
int get_desired_level_max() const
Returns the desired maximum refinement level.
Definition: parti_domain_control_base.hpp:458

FEAT::Control::Domain::PartiDomainControlBase::~PartiDomainControlBase
virtual ~PartiDomainControlBase()
virtual destructor
Definition: parti_domain_control_base.hpp:172

FEAT::Control::Domain::PartiDomainControlBase::set_desired_levels
virtual void set_desired_levels(const std::deque< String > &slvls)
Sets the desired levels for the partitioned hierarchy.
Definition: parti_domain_control_base.hpp:329

FEAT::Control::Domain::PartiDomainControlBase::_was_created
bool _was_created
specifies whether the domain control was already created
Definition: parti_domain_control_base.hpp:112

FEAT::Control::Domain::PartiDomainControlBase::get_chosen_parti_info
virtual String get_chosen_parti_info() const
Returns an informative string about the chosen partitioning.
Definition: parti_domain_control_base.hpp:527

FEAT::Control::Domain::PartiDomainControlBase::parse_property_map
virtual bool parse_property_map(const PropertyMap &pmap)
Parses the partitioner options from a PropertyMap.
Definition: parti_domain_control_base.hpp:232

FEAT::Control::Domain::PartiDomainControlBase::_genetic_time_init
double _genetic_time_init
time for genetic partitioner initialization
Definition: parti_domain_control_base.hpp:137

FEAT::Control::Domain::PartiDomainControlBase::_check_parti
virtual bool _check_parti(Ancestor &ancestor, const MeshNodeType &mesh_node, bool is_base_layer)
Checks for an appropriate partitioning strategy.
Definition: parti_domain_control_base.hpp:1254

FEAT::Control::Domain::PartiDomainControlBase::_support_multi_layered
bool _support_multi_layered
support multi-layered hierarchy?
Definition: parti_domain_control_base.hpp:126

FEAT::Control::Domain::PartiDomainControlBase::_apply_parti
virtual bool _apply_parti(Ancestor &ancestor, MeshNodeType &base_mesh_node)
Applies an a-posteriori partitioner.
Definition: parti_domain_control_base.hpp:1295

FEAT::Control::Domain::PartiDomainControlBase::BaseClass
Control::Domain::DomainControl< DomainLevel_ > BaseClass
Our base class.
Definition: parti_domain_control_base.hpp:46

FEAT::Control::Domain::PartiDomainControlBase::set_desired_levels
virtual void set_desired_levels(int lvl_max, int lvl_min=-1)
Sets the desired refinement levels for a single-layered hierarchy.
Definition: parti_domain_control_base.hpp:399

FEAT::Control::Domain::PartiDomainControlBase::_create_multi_layers_scattered
virtual void _create_multi_layers_scattered()
Creates the layers for a multi-layered domain control in a scattered fashion.
Definition: parti_domain_control_base.hpp:804

FEAT::Control::Domain::PartiDomainControlBase::_split_basemesh_halos
virtual void _split_basemesh_halos(const Ancestor &ancestor, const MeshNodeType &base_mesh_node, MeshNodeType &patch_mesh_node, std::vector< int > &neighbor_ranks)
Splits the base-mesh halos and computes the inter-patch-mesh halos.
Definition: parti_domain_control_base.hpp:941

FEAT::Control::Domain::PartiDomainControlBase::_allow_parti_genetic
bool _allow_parti_genetic
allow genetic partitioner?
Definition: parti_domain_control_base.hpp:119

FEAT::Control::Domain::PartiDomainControlBase::_allow_parti_zoltan
bool _allow_parti_zoltan
allow Zoltan partitioner?
Definition: parti_domain_control_base.hpp:123

FEAT::Dist::Comm
Communicator class.
Definition: dist.hpp:1349

FEAT::Dist::Comm::bcast
void bcast(void *buffer, std::size_t count, const Datatype &datatype, int root) const
Blocking broadcast.
Definition: dist.cpp:541

FEAT::Dist::Comm::comm_create_range_incl
Comm comm_create_range_incl(int count, int first=0, int stride=1) const
Creates a new sub-communicator from a strided range of ranks.
Definition: dist.cpp:472

FEAT::Dist::Comm::allreduce
void allreduce(const void *sendbuf, void *recvbuf, std::size_t count, const Datatype &datatype, const Operation &op) const
Blocking All-Reduce.
Definition: dist.cpp:655

FEAT::Dist::Comm::size
int size() const
Returns the size of this communicator.
Definition: dist.hpp:1506

FEAT::Dist::Comm::irecv
Request irecv(void *buffer, std::size_t count, const Datatype &datatype, int source, int tag=0) const
Nonblocking Receive.
Definition: dist.cpp:716

FEAT::Dist::Comm::isend
Request isend(const void *buffer, std::size_t count, const Datatype &datatype, int dest, int tag=0) const
Nonblocking Send.
Definition: dist.cpp:704

FEAT::Dist::Comm::comm
MPI_Comm comm
our MPI communicator handle
Definition: dist.hpp:1353

FEAT::Dist::Comm::gather
void gather(const void *sendbuf, std::size_t sendcount, const Datatype &sendtype, void *recvbuf, std::size_t recvcount, const Datatype &recvtype, int root) const
Blocking gather.
Definition: dist.cpp:553

FEAT::Dist::Comm::comm_dup
Comm comm_dup() const
Creates a copy of this communicator.
Definition: dist.cpp:459

FEAT::Dist::Comm::rank
int rank() const
Returns the rank of this process in this communicator.
Definition: dist.hpp:1494

FEAT::Dist::Comm::is_null
bool is_null() const
Checks whether this communicator is a null communicator.
Definition: dist.cpp:454

FEAT::Dist::Comm::print
void print(std::ostream &os, const String &msg, int root=0) const
Prints a message line to an output stream.
Definition: dist.cpp:782

FEAT::Dist::RequestVector
Communication Request vector class.
Definition: dist.hpp:640

FEAT::Dist::RequestVector::wait_all
void wait_all()
Blocks until all active requests are fulfilled.
Definition: dist.cpp:324

FEAT::Geometry::MeshAtlas< MeshType >

FEAT::Geometry::MeshNode::get_mesh
MeshType * get_mesh()
Returns the mesh of this node.
Definition: mesh_node.hpp:225

FEAT::Geometry::PartiIterative
Iterative-Partitioner class template declaration.
Definition: parti_iterative.hpp:450

FEAT::Geometry::PartiParMETIS
ParMETIS mesh/graph partitioner backend.
Definition: parti_parmetis.hpp:26

FEAT::Geometry::PartiParMETIS::execute
bool execute(const IndexSet< nf_ > &faces_at_elem, const IndexSet< nv_ > &verts_at_elem, const VertexSet_ &vertices, const Index num_parts, const std::vector< Real > &weights)
Executes the ParMETIS graph partitioner.
Definition: parti_parmetis.hpp:99

FEAT::Geometry::PartiParMETIS::build_elems_at_rank
Adjacency::Graph build_elems_at_rank() const
Builds and returns the elements-at-rank graph representing the partitioning.
Definition: parti_parmetis.hpp:112

FEAT::Geometry::PartiZoltan
Zoltan hypergraph partitioner backend.
Definition: parti_zoltan.hpp:39

FEAT::Geometry::PartiZoltan::execute
bool execute(const IndexSet< n_ > &faces_at_elem, const Index num_parts, const std::vector< Real > &weights)
Executes the Zoltan partitioner.
Definition: parti_zoltan.hpp:116

FEAT::Geometry::PartiZoltan::build_elems_at_rank
Adjacency::Graph build_elems_at_rank() const
Builds and returns the elements-at-rank graph representing the partitioning.
Definition: parti_zoltan.hpp:145

FEAT::Geometry::PatchHaloSplitter
Base-Mesh Patch Halo splitter.
Definition: patch_halo_splitter.hpp:33

FEAT::Geometry::RootMeshNode
Root mesh node class template.
Definition: mesh_node.hpp:748

FEAT::Geometry::RootMeshNode::get_patch
const MeshPartType * get_patch(int rank) const
Returns a patch meshpart for a given child.
Definition: mesh_node.hpp:962

FEAT::Geometry::RootMeshNode::get_halo_map
const std::map< int, std::unique_ptr< MeshPartType > > & get_halo_map() const
Definition: mesh_node.hpp:896

FEAT::Geometry::RootMeshNode::add_halo
void add_halo(int rank, std::unique_ptr< MeshPartType > halo_part)
Adds a halo mesh part to this mesh node.
Definition: mesh_node.hpp:874

FEAT::ParseError
Class for parser related errors.
Definition: exception.hpp:132

FEAT::PropertyMap
A class organizing a tree of key-value pairs.
Definition: property_map.hpp:48

FEAT::PropertyMap::query
std::pair< String, bool > query(String key_path) const
Queries a value by its key path.
Definition: property_map.cpp:125

FEAT::SimpleArgParser
Simple argument parser implementation.
Definition: simple_arg_parser.hpp:140

FEAT::SimpleArgParser::query
const std::pair< int, std::deque< String > > * query(const String &option) const
Query the parameters of an option.
Definition: simple_arg_parser.hpp:356

FEAT::SimpleArgParser::parse
int parse(const String &option, Prms_ &&... prms) const
Parses the parameters of an option.
Definition: simple_arg_parser.hpp:384

FEAT::String
String class implementation.
Definition: string.hpp:46

FEAT::String::split_by_whitespaces
std::deque< String > split_by_whitespaces() const
Splits the string at whitespace characters.
Definition: string.hpp:518

FEAT::String::compare_no_case
int compare_no_case(const String &other) const
Compares two strings without regard to case.
Definition: string.hpp:679

FEAT::String::pad_front
String pad_front(size_type len, char c=' ') const
Pads the front of the string up to a desired length.
Definition: string.hpp:392

FEAT::Dist::op_max
const Operation op_max(MPI_MAX)
Operation wrapper for MPI_MAX.
Definition: dist.hpp:273

FEAT::Geometry::AdaptMode
AdaptMode
Adapt mode enumeration.
Definition: mesh_node.hpp:53

FEAT::Math::max
T_ max(T_ a, T_ b)
Returns the maximum of two values.
Definition: math.hpp:137

FEAT
FEAT namespace.
Definition: adjactor.hpp:12

FEAT::Real
double Real
Real data type.
Definition: base_header.hpp:128

FEAT::stringify
String stringify(const T_ &item)
Converts an item into a String.
Definition: string.hpp:944

FEAT::Index
std::uint64_t Index
Index data type.
Definition: base_header.hpp:122